diff --git a/act-dp-demo_clean-50-seed0/policy/DP/data/outputs/2026.04.21/19.57.41_robot_stack_blocks_two_stack_blocks_two/logs.json.txt b/act-dp-demo_clean-50-seed0/policy/DP/data/outputs/2026.04.21/19.57.41_robot_stack_blocks_two_stack_blocks_two/logs.json.txt new file mode 100644 index 0000000000000000000000000000000000000000..94e5a4f1f12a0b4f76584e049d9f711dff3b965c --- /dev/null +++ b/act-dp-demo_clean-50-seed0/policy/DP/data/outputs/2026.04.21/19.57.41_robot_stack_blocks_two_stack_blocks_two/logs.json.txt @@ -0,0 +1,71400 @@ +{"train_loss": 1.1882127523422241, "global_step": 0, "epoch": 0, "lr": 2.0000000000000002e-07} +{"train_loss": 1.1561558246612549, "global_step": 1, "epoch": 0, "lr": 4.0000000000000003e-07} +{"train_loss": 1.166137456893921, "global_step": 2, "epoch": 0, "lr": 6.000000000000001e-07} +{"train_loss": 1.1786892414093018, "global_step": 3, "epoch": 0, "lr": 8.000000000000001e-07} +{"train_loss": 1.1634478569030762, "global_step": 4, "epoch": 0, "lr": 1.0000000000000002e-06} +{"train_loss": 1.1371443271636963, "global_step": 5, "epoch": 0, "lr": 1.2000000000000002e-06} +{"train_loss": 1.1213637590408325, "global_step": 6, "epoch": 0, "lr": 1.4000000000000001e-06} +{"train_loss": 1.1273249387741089, "global_step": 7, "epoch": 0, "lr": 1.6000000000000001e-06} +{"train_loss": 1.1009774208068848, "global_step": 8, "epoch": 0, "lr": 1.8e-06} +{"train_loss": 1.070752501487732, "global_step": 9, "epoch": 0, "lr": 2.0000000000000003e-06} +{"train_loss": 1.0558642148971558, "global_step": 10, "epoch": 0, "lr": 2.2e-06} +{"train_loss": 1.083653450012207, "global_step": 11, "epoch": 0, "lr": 2.4000000000000003e-06} +{"train_loss": 1.0528476238250732, "global_step": 12, "epoch": 0, "lr": 2.6e-06} +{"train_loss": 1.0463639497756958, "global_step": 13, "epoch": 0, "lr": 2.8000000000000003e-06} +{"train_loss": 1.0027320384979248, "global_step": 14, "epoch": 0, "lr": 3e-06} +{"train_loss": 1.0634926557540894, "global_step": 15, "epoch": 0, "lr": 3.2000000000000003e-06} +{"train_loss": 1.0436252355575562, "global_step": 16, "epoch": 0, "lr": 3.4000000000000005e-06} +{"train_loss": 1.0283812284469604, "global_step": 17, "epoch": 0, "lr": 3.6e-06} +{"train_loss": 1.0361114740371704, "global_step": 18, "epoch": 0, "lr": 3.8e-06} +{"train_loss": 1.0179588794708252, "global_step": 19, "epoch": 0, "lr": 4.000000000000001e-06} +{"train_loss": 1.0137470960617065, "global_step": 20, "epoch": 0, "lr": 4.2000000000000004e-06} +{"train_loss": 1.01163911819458, "global_step": 21, "epoch": 0, "lr": 4.4e-06} +{"train_loss": 1.0207747220993042, "global_step": 22, "epoch": 0, "lr": 4.6e-06} +{"train_loss": 1.0215615034103394, "global_step": 23, "epoch": 0, "lr": 4.800000000000001e-06} +{"train_loss": 1.0065115690231323, "global_step": 24, "epoch": 0, "lr": 5e-06} +{"train_loss": 1.031944990158081, "global_step": 25, "epoch": 0, "lr": 5.2e-06} +{"train_loss": 1.0120434761047363, "global_step": 26, "epoch": 0, "lr": 5.4e-06} +{"train_loss": 1.008367896080017, "global_step": 27, "epoch": 0, "lr": 5.600000000000001e-06} +{"train_loss": 1.0272914171218872, "global_step": 28, "epoch": 0, "lr": 5.8e-06} +{"train_loss": 1.0197645425796509, "global_step": 29, "epoch": 0, "lr": 6e-06} +{"train_loss": 0.9934115409851074, "global_step": 30, "epoch": 0, "lr": 6.2e-06} +{"train_loss": 1.0228468179702759, "global_step": 31, "epoch": 0, "lr": 6.4000000000000006e-06} +{"train_loss": 1.006948709487915, "global_step": 32, "epoch": 0, "lr": 6.6e-06} +{"train_loss": 0.9970024824142456, "global_step": 33, "epoch": 0, "lr": 6.800000000000001e-06} +{"train_loss": 1.0009119510650635, "global_step": 34, "epoch": 0, "lr": 7.000000000000001e-06} +{"train_loss": 0.9750168919563293, "global_step": 35, "epoch": 0, "lr": 7.2e-06} +{"train_loss": 1.0062965154647827, "global_step": 36, "epoch": 0, "lr": 7.4e-06} +{"train_loss": 1.008097529411316, "global_step": 37, "epoch": 0, "lr": 7.6e-06} +{"train_loss": 1.0116143226623535, "global_step": 38, "epoch": 0, "lr": 7.8e-06} +{"train_loss": 1.0048813819885254, "global_step": 39, "epoch": 0, "lr": 8.000000000000001e-06} +{"train_loss": 0.9899671077728271, "global_step": 40, "epoch": 0, "lr": 8.200000000000001e-06} +{"train_loss": 1.0056407451629639, "global_step": 41, "epoch": 0, "lr": 8.400000000000001e-06} +{"train_loss": 0.9978185892105103, "global_step": 42, "epoch": 0, "lr": 8.599999999999999e-06} +{"train_loss": 1.0007599592208862, "global_step": 43, "epoch": 0, "lr": 8.8e-06} +{"train_loss": 0.9790144562721252, "global_step": 44, "epoch": 0, "lr": 9e-06} +{"train_loss": 0.9884657859802246, "global_step": 45, "epoch": 0, "lr": 9.2e-06} +{"train_loss": 0.9803248047828674, "global_step": 46, "epoch": 0, "lr": 9.4e-06} +{"train_loss": 0.9859092235565186, "global_step": 47, "epoch": 0, "lr": 9.600000000000001e-06} +{"train_loss": 0.99838787317276, "global_step": 48, "epoch": 0, "lr": 9.800000000000001e-06} +{"train_loss": 0.9829576015472412, "global_step": 49, "epoch": 0, "lr": 1e-05} +{"train_loss": 1.016957402229309, "global_step": 50, "epoch": 0, "lr": 1.02e-05} +{"train_loss": 0.9950236082077026, "global_step": 51, "epoch": 0, "lr": 1.04e-05} +{"train_loss": 0.9830098152160645, "global_step": 52, "epoch": 0, "lr": 1.06e-05} +{"train_loss": 0.98921138048172, "global_step": 53, "epoch": 0, "lr": 1.08e-05} +{"train_loss": 0.9964556694030762, "global_step": 54, "epoch": 0, "lr": 1.1000000000000001e-05} +{"train_loss": 0.9858956336975098, "global_step": 55, "epoch": 0, "lr": 1.1200000000000001e-05} +{"train_loss": 0.9918465614318848, "global_step": 56, "epoch": 0, "lr": 1.1400000000000001e-05} +{"train_loss": 0.9854735136032104, "global_step": 57, "epoch": 0, "lr": 1.16e-05} +{"train_loss": 0.9622071981430054, "global_step": 58, "epoch": 0, "lr": 1.18e-05} +{"train_loss": 0.9771512150764465, "global_step": 59, "epoch": 0, "lr": 1.2e-05} +{"train_loss": 0.9947948455810547, "global_step": 60, "epoch": 0, "lr": 1.22e-05} +{"train_loss": 0.9836923480033875, "global_step": 61, "epoch": 0, "lr": 1.24e-05} +{"train_loss": 0.9820349812507629, "global_step": 62, "epoch": 0, "lr": 1.2600000000000001e-05} +{"train_loss": 0.987995445728302, "global_step": 63, "epoch": 0, "lr": 1.2800000000000001e-05} +{"train_loss": 0.9772339463233948, "global_step": 64, "epoch": 0, "lr": 1.3000000000000001e-05} +{"train_loss": 0.9919653534889221, "global_step": 65, "epoch": 0, "lr": 1.32e-05} +{"train_loss": 0.9795792698860168, "global_step": 66, "epoch": 0, "lr": 1.3400000000000002e-05} +{"train_loss": 0.9624568223953247, "global_step": 67, "epoch": 0, "lr": 1.3600000000000002e-05} +{"train_loss": 0.9908638596534729, "global_step": 68, "epoch": 0, "lr": 1.3800000000000002e-05} +{"train_loss": 0.972754955291748, "global_step": 69, "epoch": 0, "lr": 1.4000000000000001e-05} +{"train_loss": 0.9771325588226318, "global_step": 70, "epoch": 0, "lr": 1.42e-05} +{"train_loss": 0.9854332208633423, "global_step": 71, "epoch": 0, "lr": 1.44e-05} +{"train_loss": 0.9936771392822266, "global_step": 72, "epoch": 0, "lr": 1.4599999999999999e-05} +{"train_loss": 0.9601161479949951, "global_step": 73, "epoch": 0, "lr": 1.48e-05} +{"train_loss": 0.9832988977432251, "global_step": 74, "epoch": 0, "lr": 1.5e-05} +{"train_loss": 0.9865148067474365, "global_step": 75, "epoch": 0, "lr": 1.52e-05} +{"train_loss": 0.9668901562690735, "global_step": 76, "epoch": 0, "lr": 1.54e-05} +{"train_loss": 0.9725744128227234, "global_step": 77, "epoch": 0, "lr": 1.56e-05} +{"train_loss": 0.9519546031951904, "global_step": 78, "epoch": 0, "lr": 1.58e-05} +{"train_loss": 0.964923083782196, "global_step": 79, "epoch": 0, "lr": 1.6000000000000003e-05} +{"train_loss": 0.9744236469268799, "global_step": 80, "epoch": 0, "lr": 1.62e-05} +{"train_loss": 0.9515497088432312, "global_step": 81, "epoch": 0, "lr": 1.6400000000000002e-05} +{"train_loss": 0.9499751925468445, "global_step": 82, "epoch": 0, "lr": 1.66e-05} +{"train_loss": 0.9494798183441162, "global_step": 83, "epoch": 0, "lr": 1.6800000000000002e-05} +{"train_loss": 0.9720651507377625, "global_step": 84, "epoch": 0, "lr": 1.7000000000000003e-05} +{"train_loss": 0.961525559425354, "global_step": 85, "epoch": 0, "lr": 1.7199999999999998e-05} +{"train_loss": 0.9681950807571411, "global_step": 86, "epoch": 0, "lr": 1.74e-05} +{"train_loss": 0.950670063495636, "global_step": 87, "epoch": 0, "lr": 1.76e-05} +{"train_loss": 0.9362554550170898, "global_step": 88, "epoch": 0, "lr": 1.78e-05} +{"train_loss": 0.9292432069778442, "global_step": 89, "epoch": 0, "lr": 1.8e-05} +{"train_loss": 0.9353529214859009, "global_step": 90, "epoch": 0, "lr": 1.8200000000000002e-05} +{"train_loss": 0.9320892095565796, "global_step": 91, "epoch": 0, "lr": 1.84e-05} +{"train_loss": 0.9338057041168213, "global_step": 92, "epoch": 0, "lr": 1.86e-05} +{"train_loss": 0.9403222799301147, "global_step": 93, "epoch": 0, "lr": 1.88e-05} +{"train_loss": 0.937178373336792, "global_step": 94, "epoch": 0, "lr": 1.9e-05} +{"train_loss": 0.9102622866630554, "global_step": 95, "epoch": 0, "lr": 1.9200000000000003e-05} +{"train_loss": 0.9041310548782349, "global_step": 96, "epoch": 0, "lr": 1.94e-05} +{"train_loss": 0.8875804543495178, "global_step": 97, "epoch": 0, "lr": 1.9600000000000002e-05} +{"train_loss": 0.8743413686752319, "global_step": 98, "epoch": 0, "lr": 1.9800000000000004e-05} +{"train_loss": 0.892768383026123, "global_step": 99, "epoch": 0, "lr": 2e-05} +{"train_loss": 0.8402594327926636, "global_step": 100, "epoch": 0, "lr": 2.0200000000000003e-05} +{"train_loss": 0.8493513464927673, "global_step": 101, "epoch": 0, "lr": 2.04e-05} +{"train_loss": 0.8711438179016113, "global_step": 102, "epoch": 0, "lr": 2.06e-05} +{"train_loss": 0.8561416864395142, "global_step": 103, "epoch": 0, "lr": 2.08e-05} +{"train_loss": 0.8297682404518127, "global_step": 104, "epoch": 0, "lr": 2.1e-05} +{"train_loss": 0.823895275592804, "global_step": 105, "epoch": 0, "lr": 2.12e-05} +{"train_loss": 0.8202869296073914, "global_step": 106, "epoch": 0, "lr": 2.1400000000000002e-05} +{"train_loss": 0.809857964515686, "global_step": 107, "epoch": 0, "lr": 2.16e-05} +{"train_loss": 0.8216232061386108, "global_step": 108, "epoch": 0, "lr": 2.18e-05} +{"train_loss": 0.7929455041885376, "global_step": 109, "epoch": 0, "lr": 2.2000000000000003e-05} +{"train_loss": 0.7858958840370178, "global_step": 110, "epoch": 0, "lr": 2.22e-05} +{"train_loss": 0.780771791934967, "global_step": 111, "epoch": 0, "lr": 2.2400000000000002e-05} +{"train_loss": 0.7981170415878296, "global_step": 112, "epoch": 0, "lr": 2.26e-05} +{"train_loss": 0.77723228931427, "global_step": 113, "epoch": 0, "lr": 2.2800000000000002e-05} +{"train_loss": 0.7696512341499329, "global_step": 114, "epoch": 0, "lr": 2.3000000000000003e-05} +{"train_loss": 0.7623881101608276, "global_step": 115, "epoch": 0, "lr": 2.32e-05} +{"train_loss": 0.7604321241378784, "global_step": 116, "epoch": 0, "lr": 2.3400000000000003e-05} +{"train_loss": 0.7363092303276062, "global_step": 117, "epoch": 0, "lr": 2.36e-05} +{"train_loss": 0.9690559080668858, "global_step": 118, "epoch": 0, "lr": 2.38e-05, "val_loss": 0.7522960901260376, "train_action_mse_error": 0.802158772945404} +{"train_loss": 0.7100940942764282, "global_step": 119, "epoch": 1, "lr": 2.4e-05} +{"train_loss": 0.7105453014373779, "global_step": 120, "epoch": 1, "lr": 2.4200000000000002e-05} +{"train_loss": 0.7348076105117798, "global_step": 121, "epoch": 1, "lr": 2.44e-05} +{"train_loss": 0.7255027294158936, "global_step": 122, "epoch": 1, "lr": 2.46e-05} +{"train_loss": 0.7123940587043762, "global_step": 123, "epoch": 1, "lr": 2.48e-05} +{"train_loss": 0.7084797620773315, "global_step": 124, "epoch": 1, "lr": 2.5e-05} +{"train_loss": 0.6995433568954468, "global_step": 125, "epoch": 1, "lr": 2.5200000000000003e-05} +{"train_loss": 0.6954721808433533, "global_step": 126, "epoch": 1, "lr": 2.54e-05} +{"train_loss": 0.6702844500541687, "global_step": 127, "epoch": 1, "lr": 2.5600000000000002e-05} +{"train_loss": 0.6770837306976318, "global_step": 128, "epoch": 1, "lr": 2.58e-05} +{"train_loss": 0.6789910197257996, "global_step": 129, "epoch": 1, "lr": 2.6000000000000002e-05} +{"train_loss": 0.6663735508918762, "global_step": 130, "epoch": 1, "lr": 2.6200000000000003e-05} +{"train_loss": 0.6690479516983032, "global_step": 131, "epoch": 1, "lr": 2.64e-05} +{"train_loss": 0.666845977306366, "global_step": 132, "epoch": 1, "lr": 2.6600000000000003e-05} +{"train_loss": 0.6427340507507324, "global_step": 133, "epoch": 1, "lr": 2.6800000000000004e-05} +{"train_loss": 0.6162322163581848, "global_step": 134, "epoch": 1, "lr": 2.7000000000000002e-05} +{"train_loss": 0.6399800777435303, "global_step": 135, "epoch": 1, "lr": 2.7200000000000004e-05} +{"train_loss": 0.5980362296104431, "global_step": 136, "epoch": 1, "lr": 2.7400000000000002e-05} +{"train_loss": 0.6145917177200317, "global_step": 137, "epoch": 1, "lr": 2.7600000000000003e-05} +{"train_loss": 0.6102718114852905, "global_step": 138, "epoch": 1, "lr": 2.7800000000000005e-05} +{"train_loss": 0.6070748567581177, "global_step": 139, "epoch": 1, "lr": 2.8000000000000003e-05} +{"train_loss": 0.5919065475463867, "global_step": 140, "epoch": 1, "lr": 2.8199999999999998e-05} +{"train_loss": 0.6039488911628723, "global_step": 141, "epoch": 1, "lr": 2.84e-05} +{"train_loss": 0.5931177139282227, "global_step": 142, "epoch": 1, "lr": 2.86e-05} +{"train_loss": 0.5452009439468384, "global_step": 143, "epoch": 1, "lr": 2.88e-05} +{"train_loss": 0.5756123661994934, "global_step": 144, "epoch": 1, "lr": 2.9e-05} +{"train_loss": 0.56138014793396, "global_step": 145, "epoch": 1, "lr": 2.9199999999999998e-05} +{"train_loss": 0.5502305030822754, "global_step": 146, "epoch": 1, "lr": 2.94e-05} +{"train_loss": 0.551827609539032, "global_step": 147, "epoch": 1, "lr": 2.96e-05} +{"train_loss": 0.5464308857917786, "global_step": 148, "epoch": 1, "lr": 2.98e-05} +{"train_loss": 0.54409259557724, "global_step": 149, "epoch": 1, "lr": 3e-05} +{"train_loss": 0.5297513008117676, "global_step": 150, "epoch": 1, "lr": 3.02e-05} +{"train_loss": 0.5507014393806458, "global_step": 151, "epoch": 1, "lr": 3.04e-05} +{"train_loss": 0.5269631743431091, "global_step": 152, "epoch": 1, "lr": 3.06e-05} +{"train_loss": 0.5166718363761902, "global_step": 153, "epoch": 1, "lr": 3.08e-05} +{"train_loss": 0.5267069935798645, "global_step": 154, "epoch": 1, "lr": 3.1e-05} +{"train_loss": 0.5084728598594666, "global_step": 155, "epoch": 1, "lr": 3.12e-05} +{"train_loss": 0.5149310827255249, "global_step": 156, "epoch": 1, "lr": 3.1400000000000004e-05} +{"train_loss": 0.5050822496414185, "global_step": 157, "epoch": 1, "lr": 3.16e-05} +{"train_loss": 0.5077612400054932, "global_step": 158, "epoch": 1, "lr": 3.18e-05} +{"train_loss": 0.5080159902572632, "global_step": 159, "epoch": 1, "lr": 3.2000000000000005e-05} +{"train_loss": 0.47209006547927856, "global_step": 160, "epoch": 1, "lr": 3.2200000000000003e-05} +{"train_loss": 0.5002748966217041, "global_step": 161, "epoch": 1, "lr": 3.24e-05} +{"train_loss": 0.47294744849205017, "global_step": 162, "epoch": 1, "lr": 3.26e-05} +{"train_loss": 0.47963860630989075, "global_step": 163, "epoch": 1, "lr": 3.2800000000000004e-05} +{"train_loss": 0.4737727642059326, "global_step": 164, "epoch": 1, "lr": 3.3e-05} +{"train_loss": 0.4452214241027832, "global_step": 165, "epoch": 1, "lr": 3.32e-05} +{"train_loss": 0.46673333644866943, "global_step": 166, "epoch": 1, "lr": 3.3400000000000005e-05} +{"train_loss": 0.4496968984603882, "global_step": 167, "epoch": 1, "lr": 3.3600000000000004e-05} +{"train_loss": 0.43550801277160645, "global_step": 168, "epoch": 1, "lr": 3.38e-05} +{"train_loss": 0.46227362751960754, "global_step": 169, "epoch": 1, "lr": 3.4000000000000007e-05} +{"train_loss": 0.4402351975440979, "global_step": 170, "epoch": 1, "lr": 3.4200000000000005e-05} +{"train_loss": 0.44062739610671997, "global_step": 171, "epoch": 1, "lr": 3.4399999999999996e-05} +{"train_loss": 0.441663920879364, "global_step": 172, "epoch": 1, "lr": 3.46e-05} +{"train_loss": 0.415875643491745, "global_step": 173, "epoch": 1, "lr": 3.48e-05} +{"train_loss": 0.4197201132774353, "global_step": 174, "epoch": 1, "lr": 3.5e-05} +{"train_loss": 0.43881458044052124, "global_step": 175, "epoch": 1, "lr": 3.52e-05} +{"train_loss": 0.4161137640476227, "global_step": 176, "epoch": 1, "lr": 3.54e-05} +{"train_loss": 0.401636004447937, "global_step": 177, "epoch": 1, "lr": 3.56e-05} +{"train_loss": 0.40984049439430237, "global_step": 178, "epoch": 1, "lr": 3.58e-05} +{"train_loss": 0.40822452306747437, "global_step": 179, "epoch": 1, "lr": 3.6e-05} +{"train_loss": 0.4135375916957855, "global_step": 180, "epoch": 1, "lr": 3.62e-05} +{"train_loss": 0.4071763753890991, "global_step": 181, "epoch": 1, "lr": 3.6400000000000004e-05} +{"train_loss": 0.37878116965293884, "global_step": 182, "epoch": 1, "lr": 3.66e-05} +{"train_loss": 0.39663249254226685, "global_step": 183, "epoch": 1, "lr": 3.68e-05} +{"train_loss": 0.3838426172733307, "global_step": 184, "epoch": 1, "lr": 3.7e-05} +{"train_loss": 0.3890102505683899, "global_step": 185, "epoch": 1, "lr": 3.72e-05} +{"train_loss": 0.36775079369544983, "global_step": 186, "epoch": 1, "lr": 3.74e-05} +{"train_loss": 0.36424681544303894, "global_step": 187, "epoch": 1, "lr": 3.76e-05} +{"train_loss": 0.3804420232772827, "global_step": 188, "epoch": 1, "lr": 3.7800000000000004e-05} +{"train_loss": 0.40171730518341064, "global_step": 189, "epoch": 1, "lr": 3.8e-05} +{"train_loss": 0.3647823631763458, "global_step": 190, "epoch": 1, "lr": 3.82e-05} +{"train_loss": 0.3834664523601532, "global_step": 191, "epoch": 1, "lr": 3.8400000000000005e-05} +{"train_loss": 0.37335318326950073, "global_step": 192, "epoch": 1, "lr": 3.86e-05} +{"train_loss": 0.3514520227909088, "global_step": 193, "epoch": 1, "lr": 3.88e-05} +{"train_loss": 0.3894202411174774, "global_step": 194, "epoch": 1, "lr": 3.9000000000000006e-05} +{"train_loss": 0.33931925892829895, "global_step": 195, "epoch": 1, "lr": 3.9200000000000004e-05} +{"train_loss": 0.3847713768482208, "global_step": 196, "epoch": 1, "lr": 3.94e-05} +{"train_loss": 0.33506497740745544, "global_step": 197, "epoch": 1, "lr": 3.960000000000001e-05} +{"train_loss": 0.35627108812332153, "global_step": 198, "epoch": 1, "lr": 3.9800000000000005e-05} +{"train_loss": 0.3373566269874573, "global_step": 199, "epoch": 1, "lr": 4e-05} +{"train_loss": 0.3400680124759674, "global_step": 200, "epoch": 1, "lr": 4.02e-05} +{"train_loss": 0.33941373229026794, "global_step": 201, "epoch": 1, "lr": 4.0400000000000006e-05} +{"train_loss": 0.3513265550136566, "global_step": 202, "epoch": 1, "lr": 4.0600000000000004e-05} +{"train_loss": 0.34658610820770264, "global_step": 203, "epoch": 1, "lr": 4.08e-05} +{"train_loss": 0.3317449986934662, "global_step": 204, "epoch": 1, "lr": 4.1e-05} +{"train_loss": 0.32609307765960693, "global_step": 205, "epoch": 1, "lr": 4.12e-05} +{"train_loss": 0.32155200839042664, "global_step": 206, "epoch": 1, "lr": 4.14e-05} +{"train_loss": 0.31701579689979553, "global_step": 207, "epoch": 1, "lr": 4.16e-05} +{"train_loss": 0.3251591920852661, "global_step": 208, "epoch": 1, "lr": 4.18e-05} +{"train_loss": 0.3135695457458496, "global_step": 209, "epoch": 1, "lr": 4.2e-05} +{"train_loss": 0.30341634154319763, "global_step": 210, "epoch": 1, "lr": 4.22e-05} +{"train_loss": 0.2995077669620514, "global_step": 211, "epoch": 1, "lr": 4.24e-05} +{"train_loss": 0.28728199005126953, "global_step": 212, "epoch": 1, "lr": 4.26e-05} +{"train_loss": 0.3105791509151459, "global_step": 213, "epoch": 1, "lr": 4.2800000000000004e-05} +{"train_loss": 0.2928420305252075, "global_step": 214, "epoch": 1, "lr": 4.3e-05} +{"train_loss": 0.3139539957046509, "global_step": 215, "epoch": 1, "lr": 4.32e-05} +{"train_loss": 0.2829352617263794, "global_step": 216, "epoch": 1, "lr": 4.3400000000000005e-05} +{"train_loss": 0.3004147708415985, "global_step": 217, "epoch": 1, "lr": 4.36e-05} +{"train_loss": 0.30192601680755615, "global_step": 218, "epoch": 1, "lr": 4.38e-05} +{"train_loss": 0.25327667593955994, "global_step": 219, "epoch": 1, "lr": 4.4000000000000006e-05} +{"train_loss": 0.2770618796348572, "global_step": 220, "epoch": 1, "lr": 4.4200000000000004e-05} +{"train_loss": 0.27952975034713745, "global_step": 221, "epoch": 1, "lr": 4.44e-05} +{"train_loss": 0.3138915002346039, "global_step": 222, "epoch": 1, "lr": 4.46e-05} +{"train_loss": 0.2693769335746765, "global_step": 223, "epoch": 1, "lr": 4.4800000000000005e-05} +{"train_loss": 0.2673851251602173, "global_step": 224, "epoch": 1, "lr": 4.5e-05} +{"train_loss": 0.2774020731449127, "global_step": 225, "epoch": 1, "lr": 4.52e-05} +{"train_loss": 0.27165669202804565, "global_step": 226, "epoch": 1, "lr": 4.5400000000000006e-05} +{"train_loss": 0.26036930084228516, "global_step": 227, "epoch": 1, "lr": 4.5600000000000004e-05} +{"train_loss": 0.26913678646087646, "global_step": 228, "epoch": 1, "lr": 4.58e-05} +{"train_loss": 0.25269338488578796, "global_step": 229, "epoch": 1, "lr": 4.600000000000001e-05} +{"train_loss": 0.24359309673309326, "global_step": 230, "epoch": 1, "lr": 4.6200000000000005e-05} +{"train_loss": 0.2836805582046509, "global_step": 231, "epoch": 1, "lr": 4.64e-05} +{"train_loss": 0.2542520761489868, "global_step": 232, "epoch": 1, "lr": 4.660000000000001e-05} +{"train_loss": 0.24863237142562866, "global_step": 233, "epoch": 1, "lr": 4.6800000000000006e-05} +{"train_loss": 0.24498601257801056, "global_step": 234, "epoch": 1, "lr": 4.7e-05} +{"train_loss": 0.25802117586135864, "global_step": 235, "epoch": 1, "lr": 4.72e-05} +{"train_loss": 0.24519598484039307, "global_step": 236, "epoch": 1, "lr": 4.74e-05} +{"train_loss": 0.43985399766629485, "global_step": 237, "epoch": 1, "lr": 4.76e-05, "val_loss": 0.26506876945495605} +{"train_loss": 0.25020161271095276, "global_step": 238, "epoch": 2, "lr": 4.78e-05} +{"train_loss": 0.2588903605937958, "global_step": 239, "epoch": 2, "lr": 4.8e-05} +{"train_loss": 0.2324771136045456, "global_step": 240, "epoch": 2, "lr": 4.82e-05} +{"train_loss": 0.2462558150291443, "global_step": 241, "epoch": 2, "lr": 4.8400000000000004e-05} +{"train_loss": 0.2285836935043335, "global_step": 242, "epoch": 2, "lr": 4.86e-05} +{"train_loss": 0.2627417743206024, "global_step": 243, "epoch": 2, "lr": 4.88e-05} +{"train_loss": 0.2288772165775299, "global_step": 244, "epoch": 2, "lr": 4.9e-05} +{"train_loss": 0.23994311690330505, "global_step": 245, "epoch": 2, "lr": 4.92e-05} +{"train_loss": 0.23224353790283203, "global_step": 246, "epoch": 2, "lr": 4.94e-05} +{"train_loss": 0.2521272301673889, "global_step": 247, "epoch": 2, "lr": 4.96e-05} +{"train_loss": 0.22856444120407104, "global_step": 248, "epoch": 2, "lr": 4.9800000000000004e-05} +{"train_loss": 0.24284426867961884, "global_step": 249, "epoch": 2, "lr": 5e-05} +{"train_loss": 0.21469631791114807, "global_step": 250, "epoch": 2, "lr": 5.02e-05} +{"train_loss": 0.26086845993995667, "global_step": 251, "epoch": 2, "lr": 5.0400000000000005e-05} +{"train_loss": 0.21903304755687714, "global_step": 252, "epoch": 2, "lr": 5.0600000000000003e-05} +{"train_loss": 0.236537903547287, "global_step": 253, "epoch": 2, "lr": 5.08e-05} +{"train_loss": 0.21336433291435242, "global_step": 254, "epoch": 2, "lr": 5.1000000000000006e-05} +{"train_loss": 0.23976078629493713, "global_step": 255, "epoch": 2, "lr": 5.1200000000000004e-05} +{"train_loss": 0.2093345820903778, "global_step": 256, "epoch": 2, "lr": 5.14e-05} +{"train_loss": 0.22410349547863007, "global_step": 257, "epoch": 2, "lr": 5.16e-05} +{"train_loss": 0.21397945284843445, "global_step": 258, "epoch": 2, "lr": 5.1800000000000005e-05} +{"train_loss": 0.20003679394721985, "global_step": 259, "epoch": 2, "lr": 5.2000000000000004e-05} +{"train_loss": 0.20134378969669342, "global_step": 260, "epoch": 2, "lr": 5.22e-05} +{"train_loss": 0.21130062639713287, "global_step": 261, "epoch": 2, "lr": 5.2400000000000007e-05} +{"train_loss": 0.20150218904018402, "global_step": 262, "epoch": 2, "lr": 5.2600000000000005e-05} +{"train_loss": 0.21297316253185272, "global_step": 263, "epoch": 2, "lr": 5.28e-05} +{"train_loss": 0.2330746054649353, "global_step": 264, "epoch": 2, "lr": 5.300000000000001e-05} +{"train_loss": 0.22450169920921326, "global_step": 265, "epoch": 2, "lr": 5.3200000000000006e-05} +{"train_loss": 0.20555514097213745, "global_step": 266, "epoch": 2, "lr": 5.3400000000000004e-05} +{"train_loss": 0.19731508195400238, "global_step": 267, "epoch": 2, "lr": 5.360000000000001e-05} +{"train_loss": 0.21695645153522491, "global_step": 268, "epoch": 2, "lr": 5.380000000000001e-05} +{"train_loss": 0.19985291361808777, "global_step": 269, "epoch": 2, "lr": 5.4000000000000005e-05} +{"train_loss": 0.20409686863422394, "global_step": 270, "epoch": 2, "lr": 5.420000000000001e-05} +{"train_loss": 0.1923757940530777, "global_step": 271, "epoch": 2, "lr": 5.440000000000001e-05} +{"train_loss": 0.19418074190616608, "global_step": 272, "epoch": 2, "lr": 5.4600000000000006e-05} +{"train_loss": 0.1894962042570114, "global_step": 273, "epoch": 2, "lr": 5.4800000000000004e-05} +{"train_loss": 0.19029556214809418, "global_step": 274, "epoch": 2, "lr": 5.500000000000001e-05} +{"train_loss": 0.1814350187778473, "global_step": 275, "epoch": 2, "lr": 5.520000000000001e-05} +{"train_loss": 0.176975816488266, "global_step": 276, "epoch": 2, "lr": 5.5400000000000005e-05} +{"train_loss": 0.1927560418844223, "global_step": 277, "epoch": 2, "lr": 5.560000000000001e-05} +{"train_loss": 0.19330133497714996, "global_step": 278, "epoch": 2, "lr": 5.580000000000001e-05} +{"train_loss": 0.16766957938671112, "global_step": 279, "epoch": 2, "lr": 5.6000000000000006e-05} +{"train_loss": 0.18325196206569672, "global_step": 280, "epoch": 2, "lr": 5.620000000000001e-05} +{"train_loss": 0.18095535039901733, "global_step": 281, "epoch": 2, "lr": 5.6399999999999995e-05} +{"train_loss": 0.1920679658651352, "global_step": 282, "epoch": 2, "lr": 5.66e-05} +{"train_loss": 0.19243599474430084, "global_step": 283, "epoch": 2, "lr": 5.68e-05} +{"train_loss": 0.17174987494945526, "global_step": 284, "epoch": 2, "lr": 5.6999999999999996e-05} +{"train_loss": 0.1762431114912033, "global_step": 285, "epoch": 2, "lr": 5.72e-05} +{"train_loss": 0.17706067860126495, "global_step": 286, "epoch": 2, "lr": 5.74e-05} +{"train_loss": 0.20773129165172577, "global_step": 287, "epoch": 2, "lr": 5.76e-05} +{"train_loss": 0.16983714699745178, "global_step": 288, "epoch": 2, "lr": 5.7799999999999995e-05} +{"train_loss": 0.18101173639297485, "global_step": 289, "epoch": 2, "lr": 5.8e-05} +{"train_loss": 0.17845402657985687, "global_step": 290, "epoch": 2, "lr": 5.82e-05} +{"train_loss": 0.15770310163497925, "global_step": 291, "epoch": 2, "lr": 5.8399999999999997e-05} +{"train_loss": 0.179216206073761, "global_step": 292, "epoch": 2, "lr": 5.86e-05} +{"train_loss": 0.17631344497203827, "global_step": 293, "epoch": 2, "lr": 5.88e-05} +{"train_loss": 0.16635234653949738, "global_step": 294, "epoch": 2, "lr": 5.9e-05} +{"train_loss": 0.1559981405735016, "global_step": 295, "epoch": 2, "lr": 5.92e-05} +{"train_loss": 0.18074554204940796, "global_step": 296, "epoch": 2, "lr": 5.94e-05} +{"train_loss": 0.18144376575946808, "global_step": 297, "epoch": 2, "lr": 5.96e-05} +{"train_loss": 0.16345606744289398, "global_step": 298, "epoch": 2, "lr": 5.9800000000000003e-05} +{"train_loss": 0.15693585574626923, "global_step": 299, "epoch": 2, "lr": 6e-05} +{"train_loss": 0.16103535890579224, "global_step": 300, "epoch": 2, "lr": 6.02e-05} +{"train_loss": 0.16305920481681824, "global_step": 301, "epoch": 2, "lr": 6.04e-05} +{"train_loss": 0.16911496222019196, "global_step": 302, "epoch": 2, "lr": 6.06e-05} +{"train_loss": 0.16229769587516785, "global_step": 303, "epoch": 2, "lr": 6.08e-05} +{"train_loss": 0.16338442265987396, "global_step": 304, "epoch": 2, "lr": 6.1e-05} +{"train_loss": 0.1602482795715332, "global_step": 305, "epoch": 2, "lr": 6.12e-05} +{"train_loss": 0.16597718000411987, "global_step": 306, "epoch": 2, "lr": 6.14e-05} +{"train_loss": 0.16857720911502838, "global_step": 307, "epoch": 2, "lr": 6.16e-05} +{"train_loss": 0.16989319026470184, "global_step": 308, "epoch": 2, "lr": 6.18e-05} +{"train_loss": 0.21535255014896393, "global_step": 309, "epoch": 2, "lr": 6.2e-05} +{"train_loss": 0.16718143224716187, "global_step": 310, "epoch": 2, "lr": 6.220000000000001e-05} +{"train_loss": 0.18658597767353058, "global_step": 311, "epoch": 2, "lr": 6.24e-05} +{"train_loss": 0.15159201622009277, "global_step": 312, "epoch": 2, "lr": 6.26e-05} +{"train_loss": 0.16916437447071075, "global_step": 313, "epoch": 2, "lr": 6.280000000000001e-05} +{"train_loss": 0.17171154916286469, "global_step": 314, "epoch": 2, "lr": 6.3e-05} +{"train_loss": 0.16639557480812073, "global_step": 315, "epoch": 2, "lr": 6.32e-05} +{"train_loss": 0.17819683253765106, "global_step": 316, "epoch": 2, "lr": 6.340000000000001e-05} +{"train_loss": 0.15909582376480103, "global_step": 317, "epoch": 2, "lr": 6.36e-05} +{"train_loss": 0.17972904443740845, "global_step": 318, "epoch": 2, "lr": 6.38e-05} +{"train_loss": 0.15854983031749725, "global_step": 319, "epoch": 2, "lr": 6.400000000000001e-05} +{"train_loss": 0.15874581038951874, "global_step": 320, "epoch": 2, "lr": 6.42e-05} +{"train_loss": 0.1414242684841156, "global_step": 321, "epoch": 2, "lr": 6.440000000000001e-05} +{"train_loss": 0.14350625872612, "global_step": 322, "epoch": 2, "lr": 6.460000000000001e-05} +{"train_loss": 0.14266537129878998, "global_step": 323, "epoch": 2, "lr": 6.48e-05} +{"train_loss": 0.14618441462516785, "global_step": 324, "epoch": 2, "lr": 6.500000000000001e-05} +{"train_loss": 0.15851998329162598, "global_step": 325, "epoch": 2, "lr": 6.52e-05} +{"train_loss": 0.16586343944072723, "global_step": 326, "epoch": 2, "lr": 6.54e-05} +{"train_loss": 0.1606559455394745, "global_step": 327, "epoch": 2, "lr": 6.560000000000001e-05} +{"train_loss": 0.16676980257034302, "global_step": 328, "epoch": 2, "lr": 6.58e-05} +{"train_loss": 0.1514260172843933, "global_step": 329, "epoch": 2, "lr": 6.6e-05} +{"train_loss": 0.14801625907421112, "global_step": 330, "epoch": 2, "lr": 6.620000000000001e-05} +{"train_loss": 0.15450775623321533, "global_step": 331, "epoch": 2, "lr": 6.64e-05} +{"train_loss": 0.14675498008728027, "global_step": 332, "epoch": 2, "lr": 6.66e-05} +{"train_loss": 0.15768985450267792, "global_step": 333, "epoch": 2, "lr": 6.680000000000001e-05} +{"train_loss": 0.1381881833076477, "global_step": 334, "epoch": 2, "lr": 6.7e-05} +{"train_loss": 0.13957548141479492, "global_step": 335, "epoch": 2, "lr": 6.720000000000001e-05} +{"train_loss": 0.15589933097362518, "global_step": 336, "epoch": 2, "lr": 6.740000000000001e-05} +{"train_loss": 0.13779698312282562, "global_step": 337, "epoch": 2, "lr": 6.76e-05} +{"train_loss": 0.1336258500814438, "global_step": 338, "epoch": 2, "lr": 6.780000000000001e-05} +{"train_loss": 0.1605987548828125, "global_step": 339, "epoch": 2, "lr": 6.800000000000001e-05} +{"train_loss": 0.18294812738895416, "global_step": 340, "epoch": 2, "lr": 6.82e-05} +{"train_loss": 0.14928488433361053, "global_step": 341, "epoch": 2, "lr": 6.840000000000001e-05} +{"train_loss": 0.1498057097196579, "global_step": 342, "epoch": 2, "lr": 6.860000000000001e-05} +{"train_loss": 0.13992884755134583, "global_step": 343, "epoch": 2, "lr": 6.879999999999999e-05} +{"train_loss": 0.14639249444007874, "global_step": 344, "epoch": 2, "lr": 6.9e-05} +{"train_loss": 0.16123215854167938, "global_step": 345, "epoch": 2, "lr": 6.92e-05} +{"train_loss": 0.1666526198387146, "global_step": 346, "epoch": 2, "lr": 6.939999999999999e-05} +{"train_loss": 0.1521976739168167, "global_step": 347, "epoch": 2, "lr": 6.96e-05} +{"train_loss": 0.1380234807729721, "global_step": 348, "epoch": 2, "lr": 6.98e-05} +{"train_loss": 0.16313393414020538, "global_step": 349, "epoch": 2, "lr": 7e-05} +{"train_loss": 0.15657813847064972, "global_step": 350, "epoch": 2, "lr": 7.02e-05} +{"train_loss": 0.15466904640197754, "global_step": 351, "epoch": 2, "lr": 7.04e-05} +{"train_loss": 0.1632477045059204, "global_step": 352, "epoch": 2, "lr": 7.06e-05} +{"train_loss": 0.13049593567848206, "global_step": 353, "epoch": 2, "lr": 7.08e-05} +{"train_loss": 0.13737556338310242, "global_step": 354, "epoch": 2, "lr": 7.1e-05} +{"train_loss": 0.14149831235408783, "global_step": 355, "epoch": 2, "lr": 7.12e-05} +{"train_loss": 0.18168591150716573, "global_step": 356, "epoch": 2, "lr": 7.14e-05, "val_loss": 0.1516994684934616} +{"train_loss": 0.14053155481815338, "global_step": 357, "epoch": 3, "lr": 7.16e-05} +{"train_loss": 0.150784432888031, "global_step": 358, "epoch": 3, "lr": 7.18e-05} +{"train_loss": 0.1534222960472107, "global_step": 359, "epoch": 3, "lr": 7.2e-05} +{"train_loss": 0.14042526483535767, "global_step": 360, "epoch": 3, "lr": 7.22e-05} +{"train_loss": 0.15135782957077026, "global_step": 361, "epoch": 3, "lr": 7.24e-05} +{"train_loss": 0.15268707275390625, "global_step": 362, "epoch": 3, "lr": 7.26e-05} +{"train_loss": 0.13308514654636383, "global_step": 363, "epoch": 3, "lr": 7.280000000000001e-05} +{"train_loss": 0.1488284468650818, "global_step": 364, "epoch": 3, "lr": 7.3e-05} +{"train_loss": 0.15160124003887177, "global_step": 365, "epoch": 3, "lr": 7.32e-05} +{"train_loss": 0.17233143746852875, "global_step": 366, "epoch": 3, "lr": 7.340000000000001e-05} +{"train_loss": 0.16250093281269073, "global_step": 367, "epoch": 3, "lr": 7.36e-05} +{"train_loss": 0.13248459994792938, "global_step": 368, "epoch": 3, "lr": 7.38e-05} +{"train_loss": 0.12345558404922485, "global_step": 369, "epoch": 3, "lr": 7.4e-05} +{"train_loss": 0.14148586988449097, "global_step": 370, "epoch": 3, "lr": 7.42e-05} +{"train_loss": 0.12385891377925873, "global_step": 371, "epoch": 3, "lr": 7.44e-05} +{"train_loss": 0.12416811287403107, "global_step": 372, "epoch": 3, "lr": 7.46e-05} +{"train_loss": 0.11685863882303238, "global_step": 373, "epoch": 3, "lr": 7.48e-05} +{"train_loss": 0.16256828606128693, "global_step": 374, "epoch": 3, "lr": 7.500000000000001e-05} +{"train_loss": 0.1292957067489624, "global_step": 375, "epoch": 3, "lr": 7.52e-05} +{"train_loss": 0.15342086553573608, "global_step": 376, "epoch": 3, "lr": 7.54e-05} +{"train_loss": 0.13965754210948944, "global_step": 377, "epoch": 3, "lr": 7.560000000000001e-05} +{"train_loss": 0.13519056141376495, "global_step": 378, "epoch": 3, "lr": 7.58e-05} +{"train_loss": 0.1275634914636612, "global_step": 379, "epoch": 3, "lr": 7.6e-05} +{"train_loss": 0.14124202728271484, "global_step": 380, "epoch": 3, "lr": 7.620000000000001e-05} +{"train_loss": 0.14474695920944214, "global_step": 381, "epoch": 3, "lr": 7.64e-05} +{"train_loss": 0.12577807903289795, "global_step": 382, "epoch": 3, "lr": 7.66e-05} +{"train_loss": 0.13598470389842987, "global_step": 383, "epoch": 3, "lr": 7.680000000000001e-05} +{"train_loss": 0.1507711261510849, "global_step": 384, "epoch": 3, "lr": 7.7e-05} +{"train_loss": 0.13224321603775024, "global_step": 385, "epoch": 3, "lr": 7.72e-05} +{"train_loss": 0.12392650544643402, "global_step": 386, "epoch": 3, "lr": 7.740000000000001e-05} +{"train_loss": 0.12616722285747528, "global_step": 387, "epoch": 3, "lr": 7.76e-05} +{"train_loss": 0.13131019473075867, "global_step": 388, "epoch": 3, "lr": 7.780000000000001e-05} +{"train_loss": 0.1403292715549469, "global_step": 389, "epoch": 3, "lr": 7.800000000000001e-05} +{"train_loss": 0.11869248002767563, "global_step": 390, "epoch": 3, "lr": 7.82e-05} +{"train_loss": 0.13089145720005035, "global_step": 391, "epoch": 3, "lr": 7.840000000000001e-05} +{"train_loss": 0.14653027057647705, "global_step": 392, "epoch": 3, "lr": 7.860000000000001e-05} +{"train_loss": 0.13999588787555695, "global_step": 393, "epoch": 3, "lr": 7.88e-05} +{"train_loss": 0.1517414152622223, "global_step": 394, "epoch": 3, "lr": 7.900000000000001e-05} +{"train_loss": 0.12786339223384857, "global_step": 395, "epoch": 3, "lr": 7.920000000000001e-05} +{"train_loss": 0.11844298988580704, "global_step": 396, "epoch": 3, "lr": 7.94e-05} +{"train_loss": 0.11780766397714615, "global_step": 397, "epoch": 3, "lr": 7.960000000000001e-05} +{"train_loss": 0.1603556126356125, "global_step": 398, "epoch": 3, "lr": 7.98e-05} +{"train_loss": 0.13223285973072052, "global_step": 399, "epoch": 3, "lr": 8e-05} +{"train_loss": 0.14851967990398407, "global_step": 400, "epoch": 3, "lr": 8.020000000000001e-05} +{"train_loss": 0.12220538407564163, "global_step": 401, "epoch": 3, "lr": 8.04e-05} +{"train_loss": 0.1365392953157425, "global_step": 402, "epoch": 3, "lr": 8.060000000000001e-05} +{"train_loss": 0.1434944123029709, "global_step": 403, "epoch": 3, "lr": 8.080000000000001e-05} +{"train_loss": 0.14017748832702637, "global_step": 404, "epoch": 3, "lr": 8.1e-05} +{"train_loss": 0.12143869698047638, "global_step": 405, "epoch": 3, "lr": 8.120000000000001e-05} +{"train_loss": 0.12800201773643494, "global_step": 406, "epoch": 3, "lr": 8.14e-05} +{"train_loss": 0.14347749948501587, "global_step": 407, "epoch": 3, "lr": 8.16e-05} +{"train_loss": 0.1274396777153015, "global_step": 408, "epoch": 3, "lr": 8.18e-05} +{"train_loss": 0.1292102336883545, "global_step": 409, "epoch": 3, "lr": 8.2e-05} +{"train_loss": 0.11637695878744125, "global_step": 410, "epoch": 3, "lr": 8.22e-05} +{"train_loss": 0.13352477550506592, "global_step": 411, "epoch": 3, "lr": 8.24e-05} +{"train_loss": 0.13469810783863068, "global_step": 412, "epoch": 3, "lr": 8.26e-05} +{"train_loss": 0.1393679976463318, "global_step": 413, "epoch": 3, "lr": 8.28e-05} +{"train_loss": 0.14283403754234314, "global_step": 414, "epoch": 3, "lr": 8.3e-05} +{"train_loss": 0.14630945026874542, "global_step": 415, "epoch": 3, "lr": 8.32e-05} +{"train_loss": 0.12799888849258423, "global_step": 416, "epoch": 3, "lr": 8.34e-05} +{"train_loss": 0.13630598783493042, "global_step": 417, "epoch": 3, "lr": 8.36e-05} +{"train_loss": 0.136213481426239, "global_step": 418, "epoch": 3, "lr": 8.38e-05} +{"train_loss": 0.13540737330913544, "global_step": 419, "epoch": 3, "lr": 8.4e-05} +{"train_loss": 0.12339404970407486, "global_step": 420, "epoch": 3, "lr": 8.42e-05} +{"train_loss": 0.13368692994117737, "global_step": 421, "epoch": 3, "lr": 8.44e-05} +{"train_loss": 0.12242767214775085, "global_step": 422, "epoch": 3, "lr": 8.46e-05} +{"train_loss": 0.10685405135154724, "global_step": 423, "epoch": 3, "lr": 8.48e-05} +{"train_loss": 0.1422540545463562, "global_step": 424, "epoch": 3, "lr": 8.5e-05} +{"train_loss": 0.1315847933292389, "global_step": 425, "epoch": 3, "lr": 8.52e-05} +{"train_loss": 0.14093017578125, "global_step": 426, "epoch": 3, "lr": 8.54e-05} +{"train_loss": 0.11728457361459732, "global_step": 427, "epoch": 3, "lr": 8.560000000000001e-05} +{"train_loss": 0.11963768303394318, "global_step": 428, "epoch": 3, "lr": 8.58e-05} +{"train_loss": 0.13704800605773926, "global_step": 429, "epoch": 3, "lr": 8.6e-05} +{"train_loss": 0.12486882507801056, "global_step": 430, "epoch": 3, "lr": 8.620000000000001e-05} +{"train_loss": 0.13422328233718872, "global_step": 431, "epoch": 3, "lr": 8.64e-05} +{"train_loss": 0.10449448972940445, "global_step": 432, "epoch": 3, "lr": 8.66e-05} +{"train_loss": 0.13375161588191986, "global_step": 433, "epoch": 3, "lr": 8.680000000000001e-05} +{"train_loss": 0.1182515025138855, "global_step": 434, "epoch": 3, "lr": 8.7e-05} +{"train_loss": 0.12172766029834747, "global_step": 435, "epoch": 3, "lr": 8.72e-05} +{"train_loss": 0.11964455991983414, "global_step": 436, "epoch": 3, "lr": 8.740000000000001e-05} +{"train_loss": 0.15353183448314667, "global_step": 437, "epoch": 3, "lr": 8.76e-05} +{"train_loss": 0.119454525411129, "global_step": 438, "epoch": 3, "lr": 8.78e-05} +{"train_loss": 0.1300676167011261, "global_step": 439, "epoch": 3, "lr": 8.800000000000001e-05} +{"train_loss": 0.12158691883087158, "global_step": 440, "epoch": 3, "lr": 8.82e-05} +{"train_loss": 0.09966110438108444, "global_step": 441, "epoch": 3, "lr": 8.840000000000001e-05} +{"train_loss": 0.12674199044704437, "global_step": 442, "epoch": 3, "lr": 8.86e-05} +{"train_loss": 0.1351359486579895, "global_step": 443, "epoch": 3, "lr": 8.88e-05} +{"train_loss": 0.10364194214344025, "global_step": 444, "epoch": 3, "lr": 8.900000000000001e-05} +{"train_loss": 0.14276167750358582, "global_step": 445, "epoch": 3, "lr": 8.92e-05} +{"train_loss": 0.1340264081954956, "global_step": 446, "epoch": 3, "lr": 8.94e-05} +{"train_loss": 0.13755472004413605, "global_step": 447, "epoch": 3, "lr": 8.960000000000001e-05} +{"train_loss": 0.13453218340873718, "global_step": 448, "epoch": 3, "lr": 8.98e-05} +{"train_loss": 0.13730691373348236, "global_step": 449, "epoch": 3, "lr": 9e-05} +{"train_loss": 0.12774914503097534, "global_step": 450, "epoch": 3, "lr": 9.020000000000001e-05} +{"train_loss": 0.09983737766742706, "global_step": 451, "epoch": 3, "lr": 9.04e-05} +{"train_loss": 0.12524756789207458, "global_step": 452, "epoch": 3, "lr": 9.06e-05} +{"train_loss": 0.1340307891368866, "global_step": 453, "epoch": 3, "lr": 9.080000000000001e-05} +{"train_loss": 0.11786915361881256, "global_step": 454, "epoch": 3, "lr": 9.1e-05} +{"train_loss": 0.11755063384771347, "global_step": 455, "epoch": 3, "lr": 9.120000000000001e-05} +{"train_loss": 0.12557153403759003, "global_step": 456, "epoch": 3, "lr": 9.140000000000001e-05} +{"train_loss": 0.11844519525766373, "global_step": 457, "epoch": 3, "lr": 9.16e-05} +{"train_loss": 0.10563043504953384, "global_step": 458, "epoch": 3, "lr": 9.180000000000001e-05} +{"train_loss": 0.11312022060155869, "global_step": 459, "epoch": 3, "lr": 9.200000000000001e-05} +{"train_loss": 0.13348619639873505, "global_step": 460, "epoch": 3, "lr": 9.22e-05} +{"train_loss": 0.14642976224422455, "global_step": 461, "epoch": 3, "lr": 9.240000000000001e-05} +{"train_loss": 0.12333590537309647, "global_step": 462, "epoch": 3, "lr": 9.260000000000001e-05} +{"train_loss": 0.12829749286174774, "global_step": 463, "epoch": 3, "lr": 9.28e-05} +{"train_loss": 0.12751540541648865, "global_step": 464, "epoch": 3, "lr": 9.300000000000001e-05} +{"train_loss": 0.12792763113975525, "global_step": 465, "epoch": 3, "lr": 9.320000000000002e-05} +{"train_loss": 0.1204768717288971, "global_step": 466, "epoch": 3, "lr": 9.340000000000001e-05} +{"train_loss": 0.1159939169883728, "global_step": 467, "epoch": 3, "lr": 9.360000000000001e-05} +{"train_loss": 0.12402334064245224, "global_step": 468, "epoch": 3, "lr": 9.38e-05} +{"train_loss": 0.12605474889278412, "global_step": 469, "epoch": 3, "lr": 9.4e-05} +{"train_loss": 0.12592606246471405, "global_step": 470, "epoch": 3, "lr": 9.42e-05} +{"train_loss": 0.12509498000144958, "global_step": 471, "epoch": 3, "lr": 9.44e-05} +{"train_loss": 0.11678960174322128, "global_step": 472, "epoch": 3, "lr": 9.46e-05} +{"train_loss": 0.11226163059473038, "global_step": 473, "epoch": 3, "lr": 9.48e-05} +{"train_loss": 0.12081819772720337, "global_step": 474, "epoch": 3, "lr": 9.5e-05} +{"train_loss": 0.13135296751220688, "global_step": 475, "epoch": 3, "lr": 9.52e-05, "val_loss": 0.14392778277397156} +{"train_loss": 0.12138625979423523, "global_step": 476, "epoch": 4, "lr": 9.54e-05} +{"train_loss": 0.09888642281293869, "global_step": 477, "epoch": 4, "lr": 9.56e-05} +{"train_loss": 0.12118476629257202, "global_step": 478, "epoch": 4, "lr": 9.58e-05} +{"train_loss": 0.12071169167757034, "global_step": 479, "epoch": 4, "lr": 9.6e-05} +{"train_loss": 0.10242989659309387, "global_step": 480, "epoch": 4, "lr": 9.620000000000001e-05} +{"train_loss": 0.11031793057918549, "global_step": 481, "epoch": 4, "lr": 9.64e-05} +{"train_loss": 0.12577694654464722, "global_step": 482, "epoch": 4, "lr": 9.66e-05} +{"train_loss": 0.12358536571264267, "global_step": 483, "epoch": 4, "lr": 9.680000000000001e-05} +{"train_loss": 0.08870110660791397, "global_step": 484, "epoch": 4, "lr": 9.7e-05} +{"train_loss": 0.12100303918123245, "global_step": 485, "epoch": 4, "lr": 9.72e-05} +{"train_loss": 0.10148248076438904, "global_step": 486, "epoch": 4, "lr": 9.74e-05} +{"train_loss": 0.09898301959037781, "global_step": 487, "epoch": 4, "lr": 9.76e-05} +{"train_loss": 0.11519238352775574, "global_step": 488, "epoch": 4, "lr": 9.78e-05} +{"train_loss": 0.0975944921374321, "global_step": 489, "epoch": 4, "lr": 9.8e-05} +{"train_loss": 0.09844187647104263, "global_step": 490, "epoch": 4, "lr": 9.82e-05} +{"train_loss": 0.1067580059170723, "global_step": 491, "epoch": 4, "lr": 9.84e-05} +{"train_loss": 0.10471536964178085, "global_step": 492, "epoch": 4, "lr": 9.86e-05} +{"train_loss": 0.11119586229324341, "global_step": 493, "epoch": 4, "lr": 9.88e-05} +{"train_loss": 0.11487189680337906, "global_step": 494, "epoch": 4, "lr": 9.900000000000001e-05} +{"train_loss": 0.09088850766420364, "global_step": 495, "epoch": 4, "lr": 9.92e-05} +{"train_loss": 0.10219863802194595, "global_step": 496, "epoch": 4, "lr": 9.94e-05} +{"train_loss": 0.11684788018465042, "global_step": 497, "epoch": 4, "lr": 9.960000000000001e-05} +{"train_loss": 0.12433011829853058, "global_step": 498, "epoch": 4, "lr": 9.98e-05} +{"train_loss": 0.1078641265630722, "global_step": 499, "epoch": 4, "lr": 0.0001} +{"train_loss": 0.10001112520694733, "global_step": 500, "epoch": 4, "lr": 9.999999995091518e-05} +{"train_loss": 0.1300722062587738, "global_step": 501, "epoch": 4, "lr": 9.999999980366068e-05} +{"train_loss": 0.10306678712368011, "global_step": 502, "epoch": 4, "lr": 9.999999955823654e-05} +{"train_loss": 0.10237957537174225, "global_step": 503, "epoch": 4, "lr": 9.999999921464274e-05} +{"train_loss": 0.10753781348466873, "global_step": 504, "epoch": 4, "lr": 9.999999877287929e-05} +{"train_loss": 0.1051240786910057, "global_step": 505, "epoch": 4, "lr": 9.999999823294616e-05} +{"train_loss": 0.11234217882156372, "global_step": 506, "epoch": 4, "lr": 9.999999759484339e-05} +{"train_loss": 0.10868202149868011, "global_step": 507, "epoch": 4, "lr": 9.999999685857098e-05} +{"train_loss": 0.10727688670158386, "global_step": 508, "epoch": 4, "lr": 9.99999960241289e-05} +{"train_loss": 0.09837634861469269, "global_step": 509, "epoch": 4, "lr": 9.999999509151716e-05} +{"train_loss": 0.10866411030292511, "global_step": 510, "epoch": 4, "lr": 9.999999406073579e-05} +{"train_loss": 0.12734195590019226, "global_step": 511, "epoch": 4, "lr": 9.999999293178477e-05} +{"train_loss": 0.10200458019971848, "global_step": 512, "epoch": 4, "lr": 9.999999170466411e-05} +{"train_loss": 0.10019566863775253, "global_step": 513, "epoch": 4, "lr": 9.99999903793738e-05} +{"train_loss": 0.1218469887971878, "global_step": 514, "epoch": 4, "lr": 9.999998895591385e-05} +{"train_loss": 0.10977951437234879, "global_step": 515, "epoch": 4, "lr": 9.999998743428427e-05} +{"train_loss": 0.1147487610578537, "global_step": 516, "epoch": 4, "lr": 9.999998581448506e-05} +{"train_loss": 0.11090978980064392, "global_step": 517, "epoch": 4, "lr": 9.999998409651621e-05} +{"train_loss": 0.09952022135257721, "global_step": 518, "epoch": 4, "lr": 9.999998228037773e-05} +{"train_loss": 0.09599240124225616, "global_step": 519, "epoch": 4, "lr": 9.999998036606963e-05} +{"train_loss": 0.09526573866605759, "global_step": 520, "epoch": 4, "lr": 9.999997835359192e-05} +{"train_loss": 0.09430214017629623, "global_step": 521, "epoch": 4, "lr": 9.999997624294457e-05} +{"train_loss": 0.10017483681440353, "global_step": 522, "epoch": 4, "lr": 9.999997403412764e-05} +{"train_loss": 0.09741931408643723, "global_step": 523, "epoch": 4, "lr": 9.999997172714108e-05} +{"train_loss": 0.09563460201025009, "global_step": 524, "epoch": 4, "lr": 9.999996932198492e-05} +{"train_loss": 0.10288666933774948, "global_step": 525, "epoch": 4, "lr": 9.999996681865918e-05} +{"train_loss": 0.09854231774806976, "global_step": 526, "epoch": 4, "lr": 9.999996421716382e-05} +{"train_loss": 0.09941034764051437, "global_step": 527, "epoch": 4, "lr": 9.999996151749888e-05} +{"train_loss": 0.11399150639772415, "global_step": 528, "epoch": 4, "lr": 9.999995871966437e-05} +{"train_loss": 0.09312618523836136, "global_step": 529, "epoch": 4, "lr": 9.999995582366027e-05} +{"train_loss": 0.10731193423271179, "global_step": 530, "epoch": 4, "lr": 9.99999528294866e-05} +{"train_loss": 0.09782609343528748, "global_step": 531, "epoch": 4, "lr": 9.999994973714337e-05} +{"train_loss": 0.1100301742553711, "global_step": 532, "epoch": 4, "lr": 9.999994654663059e-05} +{"train_loss": 0.11141213774681091, "global_step": 533, "epoch": 4, "lr": 9.999994325794823e-05} +{"train_loss": 0.09148990362882614, "global_step": 534, "epoch": 4, "lr": 9.999993987109634e-05} +{"train_loss": 0.09729243069887161, "global_step": 535, "epoch": 4, "lr": 9.999993638607492e-05} +{"train_loss": 0.11956006288528442, "global_step": 536, "epoch": 4, "lr": 9.999993280288396e-05} +{"train_loss": 0.0886547639966011, "global_step": 537, "epoch": 4, "lr": 9.999992912152345e-05} +{"train_loss": 0.10278422385454178, "global_step": 538, "epoch": 4, "lr": 9.999992534199345e-05} +{"train_loss": 0.1043257787823677, "global_step": 539, "epoch": 4, "lr": 9.999992146429392e-05} +{"train_loss": 0.08403509110212326, "global_step": 540, "epoch": 4, "lr": 9.99999174884249e-05} +{"train_loss": 0.10741160064935684, "global_step": 541, "epoch": 4, "lr": 9.999991341438637e-05} +{"train_loss": 0.10138138383626938, "global_step": 542, "epoch": 4, "lr": 9.999990924217836e-05} +{"train_loss": 0.08576754480600357, "global_step": 543, "epoch": 4, "lr": 9.999990497180087e-05} +{"train_loss": 0.08926771581172943, "global_step": 544, "epoch": 4, "lr": 9.999990060325391e-05} +{"train_loss": 0.08407390862703323, "global_step": 545, "epoch": 4, "lr": 9.999989613653748e-05} +{"train_loss": 0.11573916673660278, "global_step": 546, "epoch": 4, "lr": 9.999989157165159e-05} +{"train_loss": 0.09658820182085037, "global_step": 547, "epoch": 4, "lr": 9.999988690859628e-05} +{"train_loss": 0.09344366937875748, "global_step": 548, "epoch": 4, "lr": 9.999988214737151e-05} +{"train_loss": 0.09537786990404129, "global_step": 549, "epoch": 4, "lr": 9.999987728797733e-05} +{"train_loss": 0.08593470603227615, "global_step": 550, "epoch": 4, "lr": 9.999987233041372e-05} +{"train_loss": 0.09553012996912003, "global_step": 551, "epoch": 4, "lr": 9.999986727468069e-05} +{"train_loss": 0.1088055744767189, "global_step": 552, "epoch": 4, "lr": 9.999986212077829e-05} +{"train_loss": 0.1049174964427948, "global_step": 553, "epoch": 4, "lr": 9.999985686870648e-05} +{"train_loss": 0.08544386923313141, "global_step": 554, "epoch": 4, "lr": 9.999985151846532e-05} +{"train_loss": 0.09873655438423157, "global_step": 555, "epoch": 4, "lr": 9.999984607005477e-05} +{"train_loss": 0.09930121153593063, "global_step": 556, "epoch": 4, "lr": 9.999984052347487e-05} +{"train_loss": 0.09149663895368576, "global_step": 557, "epoch": 4, "lr": 9.999983487872562e-05} +{"train_loss": 0.08836468309164047, "global_step": 558, "epoch": 4, "lr": 9.999982913580704e-05} +{"train_loss": 0.07972612977027893, "global_step": 559, "epoch": 4, "lr": 9.999982329471914e-05} +{"train_loss": 0.09463271498680115, "global_step": 560, "epoch": 4, "lr": 9.999981735546193e-05} +{"train_loss": 0.099754199385643, "global_step": 561, "epoch": 4, "lr": 9.999981131803542e-05} +{"train_loss": 0.0871298611164093, "global_step": 562, "epoch": 4, "lr": 9.99998051824396e-05} +{"train_loss": 0.10875009000301361, "global_step": 563, "epoch": 4, "lr": 9.999979894867454e-05} +{"train_loss": 0.09185803681612015, "global_step": 564, "epoch": 4, "lr": 9.99997926167402e-05} +{"train_loss": 0.12082622945308685, "global_step": 565, "epoch": 4, "lr": 9.999978618663661e-05} +{"train_loss": 0.10163474828004837, "global_step": 566, "epoch": 4, "lr": 9.999977965836378e-05} +{"train_loss": 0.09266074746847153, "global_step": 567, "epoch": 4, "lr": 9.999977303192172e-05} +{"train_loss": 0.08805296570062637, "global_step": 568, "epoch": 4, "lr": 9.999976630731046e-05} +{"train_loss": 0.09728880226612091, "global_step": 569, "epoch": 4, "lr": 9.999975948452998e-05} +{"train_loss": 0.10043047368526459, "global_step": 570, "epoch": 4, "lr": 9.999975256358034e-05} +{"train_loss": 0.09570333361625671, "global_step": 571, "epoch": 4, "lr": 9.999974554446151e-05} +{"train_loss": 0.08350393921136856, "global_step": 572, "epoch": 4, "lr": 9.999973842717352e-05} +{"train_loss": 0.09510431438684464, "global_step": 573, "epoch": 4, "lr": 9.99997312117164e-05} +{"train_loss": 0.09613621979951859, "global_step": 574, "epoch": 4, "lr": 9.999972389809014e-05} +{"train_loss": 0.09855569154024124, "global_step": 575, "epoch": 4, "lr": 9.999971648629476e-05} +{"train_loss": 0.09081527590751648, "global_step": 576, "epoch": 4, "lr": 9.999970897633028e-05} +{"train_loss": 0.09666446596384048, "global_step": 577, "epoch": 4, "lr": 9.999970136819672e-05} +{"train_loss": 0.07433484494686127, "global_step": 578, "epoch": 4, "lr": 9.999969366189408e-05} +{"train_loss": 0.08859851211309433, "global_step": 579, "epoch": 4, "lr": 9.999968585742239e-05} +{"train_loss": 0.07819098234176636, "global_step": 580, "epoch": 4, "lr": 9.999967795478164e-05} +{"train_loss": 0.08203017711639404, "global_step": 581, "epoch": 4, "lr": 9.99996699539719e-05} +{"train_loss": 0.07854185998439789, "global_step": 582, "epoch": 4, "lr": 9.999966185499312e-05} +{"train_loss": 0.08877171576023102, "global_step": 583, "epoch": 4, "lr": 9.999965365784536e-05} +{"train_loss": 0.09367621690034866, "global_step": 584, "epoch": 4, "lr": 9.999964536252861e-05} +{"train_loss": 0.1018267497420311, "global_step": 585, "epoch": 4, "lr": 9.99996369690429e-05} +{"train_loss": 0.10182752460241318, "global_step": 586, "epoch": 4, "lr": 9.999962847738826e-05} +{"train_loss": 0.09604479372501373, "global_step": 587, "epoch": 4, "lr": 9.999961988756468e-05} +{"train_loss": 0.07829587906599045, "global_step": 588, "epoch": 4, "lr": 9.999961119957218e-05} +{"train_loss": 0.08167270570993423, "global_step": 589, "epoch": 4, "lr": 9.99996024134108e-05} +{"train_loss": 0.08866038173437119, "global_step": 590, "epoch": 4, "lr": 9.999959352908053e-05} +{"train_loss": 0.07940691709518433, "global_step": 591, "epoch": 4, "lr": 9.99995845465814e-05} +{"train_loss": 0.08656289428472519, "global_step": 592, "epoch": 4, "lr": 9.999957546591344e-05} +{"train_loss": 0.0952315628528595, "global_step": 593, "epoch": 4, "lr": 9.999956628707665e-05} +{"train_loss": 0.10022459805262189, "global_step": 594, "epoch": 4, "lr": 9.999955701007105e-05, "val_loss": 0.10767791420221329} +{"train_loss": 0.08333340287208557, "global_step": 595, "epoch": 5, "lr": 9.999954763489666e-05} +{"train_loss": 0.08371929079294205, "global_step": 596, "epoch": 5, "lr": 9.999953816155349e-05} +{"train_loss": 0.1019381731748581, "global_step": 597, "epoch": 5, "lr": 9.999952859004159e-05} +{"train_loss": 0.08263671398162842, "global_step": 598, "epoch": 5, "lr": 9.999951892036095e-05} +{"train_loss": 0.10416850447654724, "global_step": 599, "epoch": 5, "lr": 9.999950915251159e-05} +{"train_loss": 0.0718836560845375, "global_step": 600, "epoch": 5, "lr": 9.999949928649355e-05} +{"train_loss": 0.07944369316101074, "global_step": 601, "epoch": 5, "lr": 9.999948932230682e-05} +{"train_loss": 0.09552326798439026, "global_step": 602, "epoch": 5, "lr": 9.999947925995143e-05} +{"train_loss": 0.09668483585119247, "global_step": 603, "epoch": 5, "lr": 9.999946909942742e-05} +{"train_loss": 0.1005551740527153, "global_step": 604, "epoch": 5, "lr": 9.999945884073478e-05} +{"train_loss": 0.09146098047494888, "global_step": 605, "epoch": 5, "lr": 9.999944848387356e-05} +{"train_loss": 0.07714840769767761, "global_step": 606, "epoch": 5, "lr": 9.999943802884375e-05} +{"train_loss": 0.08165916055440903, "global_step": 607, "epoch": 5, "lr": 9.999942747564539e-05} +{"train_loss": 0.1016557589173317, "global_step": 608, "epoch": 5, "lr": 9.999941682427852e-05} +{"train_loss": 0.07621274143457413, "global_step": 609, "epoch": 5, "lr": 9.99994060747431e-05} +{"train_loss": 0.09438283741474152, "global_step": 610, "epoch": 5, "lr": 9.999939522703921e-05} +{"train_loss": 0.08211155980825424, "global_step": 611, "epoch": 5, "lr": 9.999938428116683e-05} +{"train_loss": 0.0763850137591362, "global_step": 612, "epoch": 5, "lr": 9.999937323712601e-05} +{"train_loss": 0.0697171613574028, "global_step": 613, "epoch": 5, "lr": 9.999936209491676e-05} +{"train_loss": 0.0854049026966095, "global_step": 614, "epoch": 5, "lr": 9.999935085453911e-05} +{"train_loss": 0.08937006443738937, "global_step": 615, "epoch": 5, "lr": 9.999933951599307e-05} +{"train_loss": 0.09193316847085953, "global_step": 616, "epoch": 5, "lr": 9.999932807927867e-05} +{"train_loss": 0.09701695293188095, "global_step": 617, "epoch": 5, "lr": 9.999931654439594e-05} +{"train_loss": 0.09331529587507248, "global_step": 618, "epoch": 5, "lr": 9.999930491134489e-05} +{"train_loss": 0.07433872669935226, "global_step": 619, "epoch": 5, "lr": 9.999929318012554e-05} +{"train_loss": 0.08246789872646332, "global_step": 620, "epoch": 5, "lr": 9.999928135073793e-05} +{"train_loss": 0.09820987284183502, "global_step": 621, "epoch": 5, "lr": 9.999926942318206e-05} +{"train_loss": 0.07701221853494644, "global_step": 622, "epoch": 5, "lr": 9.999925739745796e-05} +{"train_loss": 0.08598418533802032, "global_step": 623, "epoch": 5, "lr": 9.999924527356567e-05} +{"train_loss": 0.07941789925098419, "global_step": 624, "epoch": 5, "lr": 9.999923305150522e-05} +{"train_loss": 0.08784660696983337, "global_step": 625, "epoch": 5, "lr": 9.999922073127662e-05} +{"train_loss": 0.0889836773276329, "global_step": 626, "epoch": 5, "lr": 9.999920831287986e-05} +{"train_loss": 0.0937219187617302, "global_step": 627, "epoch": 5, "lr": 9.999919579631501e-05} +{"train_loss": 0.08190353214740753, "global_step": 628, "epoch": 5, "lr": 9.999918318158207e-05} +{"train_loss": 0.09093086421489716, "global_step": 629, "epoch": 5, "lr": 9.99991704686811e-05} +{"train_loss": 0.09022404998540878, "global_step": 630, "epoch": 5, "lr": 9.999915765761208e-05} +{"train_loss": 0.08662106841802597, "global_step": 631, "epoch": 5, "lr": 9.999914474837506e-05} +{"train_loss": 0.09006061404943466, "global_step": 632, "epoch": 5, "lr": 9.999913174097006e-05} +{"train_loss": 0.0903100073337555, "global_step": 633, "epoch": 5, "lr": 9.999911863539711e-05} +{"train_loss": 0.09345022588968277, "global_step": 634, "epoch": 5, "lr": 9.999910543165623e-05} +{"train_loss": 0.0792950764298439, "global_step": 635, "epoch": 5, "lr": 9.999909212974745e-05} +{"train_loss": 0.09809236973524094, "global_step": 636, "epoch": 5, "lr": 9.99990787296708e-05} +{"train_loss": 0.09328614175319672, "global_step": 637, "epoch": 5, "lr": 9.99990652314263e-05} +{"train_loss": 0.07444731146097183, "global_step": 638, "epoch": 5, "lr": 9.999905163501398e-05} +{"train_loss": 0.07450294494628906, "global_step": 639, "epoch": 5, "lr": 9.999903794043385e-05} +{"train_loss": 0.08637706190347672, "global_step": 640, "epoch": 5, "lr": 9.999902414768596e-05} +{"train_loss": 0.07246264070272446, "global_step": 641, "epoch": 5, "lr": 9.999901025677032e-05} +{"train_loss": 0.08140533417463303, "global_step": 642, "epoch": 5, "lr": 9.999899626768696e-05} +{"train_loss": 0.08807607740163803, "global_step": 643, "epoch": 5, "lr": 9.999898218043593e-05} +{"train_loss": 0.0836075097322464, "global_step": 644, "epoch": 5, "lr": 9.999896799501722e-05} +{"train_loss": 0.0824812650680542, "global_step": 645, "epoch": 5, "lr": 9.99989537114309e-05} +{"train_loss": 0.07268460839986801, "global_step": 646, "epoch": 5, "lr": 9.999893932967696e-05} +{"train_loss": 0.10556581616401672, "global_step": 647, "epoch": 5, "lr": 9.999892484975545e-05} +{"train_loss": 0.06874729692935944, "global_step": 648, "epoch": 5, "lr": 9.99989102716664e-05} +{"train_loss": 0.08793231844902039, "global_step": 649, "epoch": 5, "lr": 9.999889559540982e-05} +{"train_loss": 0.08153464645147324, "global_step": 650, "epoch": 5, "lr": 9.999888082098576e-05} +{"train_loss": 0.07522215694189072, "global_step": 651, "epoch": 5, "lr": 9.999886594839422e-05} +{"train_loss": 0.07981689274311066, "global_step": 652, "epoch": 5, "lr": 9.999885097763526e-05} +{"train_loss": 0.07946617901325226, "global_step": 653, "epoch": 5, "lr": 9.999883590870891e-05} +{"train_loss": 0.08149869740009308, "global_step": 654, "epoch": 5, "lr": 9.999882074161517e-05} +{"train_loss": 0.0773647204041481, "global_step": 655, "epoch": 5, "lr": 9.99988054763541e-05} +{"train_loss": 0.08387850224971771, "global_step": 656, "epoch": 5, "lr": 9.99987901129257e-05} +{"train_loss": 0.08471863716840744, "global_step": 657, "epoch": 5, "lr": 9.999877465133003e-05} +{"train_loss": 0.06945350766181946, "global_step": 658, "epoch": 5, "lr": 9.999875909156711e-05} +{"train_loss": 0.0826660618185997, "global_step": 659, "epoch": 5, "lr": 9.999874343363696e-05} +{"train_loss": 0.08285294473171234, "global_step": 660, "epoch": 5, "lr": 9.999872767753962e-05} +{"train_loss": 0.09057612717151642, "global_step": 661, "epoch": 5, "lr": 9.999871182327512e-05} +{"train_loss": 0.09557955712080002, "global_step": 662, "epoch": 5, "lr": 9.999869587084349e-05} +{"train_loss": 0.0958888903260231, "global_step": 663, "epoch": 5, "lr": 9.999867982024476e-05} +{"train_loss": 0.09806328266859055, "global_step": 664, "epoch": 5, "lr": 9.999866367147898e-05} +{"train_loss": 0.07886544615030289, "global_step": 665, "epoch": 5, "lr": 9.999864742454614e-05} +{"train_loss": 0.09518852084875107, "global_step": 666, "epoch": 5, "lr": 9.999863107944631e-05} +{"train_loss": 0.08006918430328369, "global_step": 667, "epoch": 5, "lr": 9.999861463617952e-05} +{"train_loss": 0.06123119592666626, "global_step": 668, "epoch": 5, "lr": 9.999859809474578e-05} +{"train_loss": 0.07639435678720474, "global_step": 669, "epoch": 5, "lr": 9.999858145514514e-05} +{"train_loss": 0.09184326976537704, "global_step": 670, "epoch": 5, "lr": 9.999856471737762e-05} +{"train_loss": 0.08484018594026566, "global_step": 671, "epoch": 5, "lr": 9.999854788144327e-05} +{"train_loss": 0.08489017933607101, "global_step": 672, "epoch": 5, "lr": 9.999853094734211e-05} +{"train_loss": 0.08244530856609344, "global_step": 673, "epoch": 5, "lr": 9.999851391507417e-05} +{"train_loss": 0.10983666032552719, "global_step": 674, "epoch": 5, "lr": 9.999849678463948e-05} +{"train_loss": 0.1008448675274849, "global_step": 675, "epoch": 5, "lr": 9.99984795560381e-05} +{"train_loss": 0.07203064858913422, "global_step": 676, "epoch": 5, "lr": 9.999846222927005e-05} +{"train_loss": 0.06432382762432098, "global_step": 677, "epoch": 5, "lr": 9.999844480433535e-05} +{"train_loss": 0.0842532366514206, "global_step": 678, "epoch": 5, "lr": 9.999842728123404e-05} +{"train_loss": 0.07972952723503113, "global_step": 679, "epoch": 5, "lr": 9.999840965996616e-05} +{"train_loss": 0.06753173470497131, "global_step": 680, "epoch": 5, "lr": 9.999839194053176e-05} +{"train_loss": 0.08197684586048126, "global_step": 681, "epoch": 5, "lr": 9.999837412293085e-05} +{"train_loss": 0.08744686096906662, "global_step": 682, "epoch": 5, "lr": 9.999835620716348e-05} +{"train_loss": 0.0825050100684166, "global_step": 683, "epoch": 5, "lr": 9.999833819322967e-05} +{"train_loss": 0.08312217146158218, "global_step": 684, "epoch": 5, "lr": 9.999832008112948e-05} +{"train_loss": 0.08603321015834808, "global_step": 685, "epoch": 5, "lr": 9.999830187086292e-05} +{"train_loss": 0.07294507324695587, "global_step": 686, "epoch": 5, "lr": 9.999828356243002e-05} +{"train_loss": 0.05816567316651344, "global_step": 687, "epoch": 5, "lr": 9.999826515583085e-05} +{"train_loss": 0.08467456698417664, "global_step": 688, "epoch": 5, "lr": 9.999824665106542e-05} +{"train_loss": 0.09871955960988998, "global_step": 689, "epoch": 5, "lr": 9.999822804813378e-05} +{"train_loss": 0.08887019008398056, "global_step": 690, "epoch": 5, "lr": 9.999820934703595e-05} +{"train_loss": 0.08477671444416046, "global_step": 691, "epoch": 5, "lr": 9.999819054777199e-05} +{"train_loss": 0.0925469845533371, "global_step": 692, "epoch": 5, "lr": 9.999817165034192e-05} +{"train_loss": 0.06607725471258163, "global_step": 693, "epoch": 5, "lr": 9.999815265474579e-05} +{"train_loss": 0.08911833167076111, "global_step": 694, "epoch": 5, "lr": 9.999813356098362e-05} +{"train_loss": 0.09006961435079575, "global_step": 695, "epoch": 5, "lr": 9.999811436905545e-05} +{"train_loss": 0.0873715952038765, "global_step": 696, "epoch": 5, "lr": 9.999809507896135e-05} +{"train_loss": 0.08591724932193756, "global_step": 697, "epoch": 5, "lr": 9.999807569070129e-05} +{"train_loss": 0.06844954937696457, "global_step": 698, "epoch": 5, "lr": 9.999805620427538e-05} +{"train_loss": 0.08224784582853317, "global_step": 699, "epoch": 5, "lr": 9.99980366196836e-05} +{"train_loss": 0.07912563532590866, "global_step": 700, "epoch": 5, "lr": 9.999801693692605e-05} +{"train_loss": 0.08530230820178986, "global_step": 701, "epoch": 5, "lr": 9.999799715600273e-05} +{"train_loss": 0.07167301326990128, "global_step": 702, "epoch": 5, "lr": 9.999797727691366e-05} +{"train_loss": 0.07816177606582642, "global_step": 703, "epoch": 5, "lr": 9.999795729965893e-05} +{"train_loss": 0.08895016461610794, "global_step": 704, "epoch": 5, "lr": 9.999793722423855e-05} +{"train_loss": 0.08275025337934494, "global_step": 705, "epoch": 5, "lr": 9.999791705065255e-05} +{"train_loss": 0.07842014729976654, "global_step": 706, "epoch": 5, "lr": 9.999789677890099e-05} +{"train_loss": 0.07025288790464401, "global_step": 707, "epoch": 5, "lr": 9.999787640898389e-05} +{"train_loss": 0.06965624541044235, "global_step": 708, "epoch": 5, "lr": 9.999785594090131e-05} +{"train_loss": 0.08941708505153656, "global_step": 709, "epoch": 5, "lr": 9.999783537465328e-05} +{"train_loss": 0.0663776621222496, "global_step": 710, "epoch": 5, "lr": 9.999781471023984e-05} +{"train_loss": 0.06847947835922241, "global_step": 711, "epoch": 5, "lr": 9.999779394766103e-05} +{"train_loss": 0.07280389219522476, "global_step": 712, "epoch": 5, "lr": 9.99977730869169e-05} +{"train_loss": 0.08380984925046689, "global_step": 713, "epoch": 5, "lr": 9.999775212800748e-05, "val_loss": 0.09592325985431671, "train_action_mse_error": 0.09311316907405853} +{"train_loss": 0.06123559549450874, "global_step": 714, "epoch": 6, "lr": 9.999773107093282e-05} +{"train_loss": 0.06380432844161987, "global_step": 715, "epoch": 6, "lr": 9.999770991569295e-05} +{"train_loss": 0.07188919186592102, "global_step": 716, "epoch": 6, "lr": 9.999768866228792e-05} +{"train_loss": 0.0767282098531723, "global_step": 717, "epoch": 6, "lr": 9.999766731071776e-05} +{"train_loss": 0.08329850435256958, "global_step": 718, "epoch": 6, "lr": 9.999764586098253e-05} +{"train_loss": 0.0738845095038414, "global_step": 719, "epoch": 6, "lr": 9.999762431308227e-05} +{"train_loss": 0.06514452397823334, "global_step": 720, "epoch": 6, "lr": 9.999760266701701e-05} +{"train_loss": 0.07805565744638443, "global_step": 721, "epoch": 6, "lr": 9.999758092278679e-05} +{"train_loss": 0.07780313491821289, "global_step": 722, "epoch": 6, "lr": 9.999755908039168e-05} +{"train_loss": 0.07594841718673706, "global_step": 723, "epoch": 6, "lr": 9.99975371398317e-05} +{"train_loss": 0.09138169139623642, "global_step": 724, "epoch": 6, "lr": 9.999751510110688e-05} +{"train_loss": 0.07129106670618057, "global_step": 725, "epoch": 6, "lr": 9.99974929642173e-05} +{"train_loss": 0.08800076693296432, "global_step": 726, "epoch": 6, "lr": 9.999747072916298e-05} +{"train_loss": 0.08720991015434265, "global_step": 727, "epoch": 6, "lr": 9.999744839594396e-05} +{"train_loss": 0.08714676648378372, "global_step": 728, "epoch": 6, "lr": 9.99974259645603e-05} +{"train_loss": 0.07949887216091156, "global_step": 729, "epoch": 6, "lr": 9.999740343501203e-05} +{"train_loss": 0.08436319231987, "global_step": 730, "epoch": 6, "lr": 9.99973808072992e-05} +{"train_loss": 0.0732613131403923, "global_step": 731, "epoch": 6, "lr": 9.999735808142185e-05} +{"train_loss": 0.0902213305234909, "global_step": 732, "epoch": 6, "lr": 9.999733525738004e-05} +{"train_loss": 0.06498824059963226, "global_step": 733, "epoch": 6, "lr": 9.99973123351738e-05} +{"train_loss": 0.081046462059021, "global_step": 734, "epoch": 6, "lr": 9.999728931480318e-05} +{"train_loss": 0.06545358896255493, "global_step": 735, "epoch": 6, "lr": 9.999726619626822e-05} +{"train_loss": 0.08057444542646408, "global_step": 736, "epoch": 6, "lr": 9.999724297956897e-05} +{"train_loss": 0.07193209230899811, "global_step": 737, "epoch": 6, "lr": 9.999721966470548e-05} +{"train_loss": 0.07720082253217697, "global_step": 738, "epoch": 6, "lr": 9.999719625167779e-05} +{"train_loss": 0.07435022294521332, "global_step": 739, "epoch": 6, "lr": 9.999717274048594e-05} +{"train_loss": 0.06704042106866837, "global_step": 740, "epoch": 6, "lr": 9.999714913112997e-05} +{"train_loss": 0.07265358418226242, "global_step": 741, "epoch": 6, "lr": 9.999712542360996e-05} +{"train_loss": 0.06219964474439621, "global_step": 742, "epoch": 6, "lr": 9.999710161792593e-05} +{"train_loss": 0.07205361127853394, "global_step": 743, "epoch": 6, "lr": 9.999707771407794e-05} +{"train_loss": 0.0671626627445221, "global_step": 744, "epoch": 6, "lr": 9.999705371206602e-05} +{"train_loss": 0.069279745221138, "global_step": 745, "epoch": 6, "lr": 9.999702961189021e-05} +{"train_loss": 0.06578776240348816, "global_step": 746, "epoch": 6, "lr": 9.99970054135506e-05} +{"train_loss": 0.06882361322641373, "global_step": 747, "epoch": 6, "lr": 9.99969811170472e-05} +{"train_loss": 0.07544250786304474, "global_step": 748, "epoch": 6, "lr": 9.999695672238008e-05} +{"train_loss": 0.07517673075199127, "global_step": 749, "epoch": 6, "lr": 9.999693222954926e-05} +{"train_loss": 0.0646846666932106, "global_step": 750, "epoch": 6, "lr": 9.999690763855483e-05} +{"train_loss": 0.06679940223693848, "global_step": 751, "epoch": 6, "lr": 9.999688294939679e-05} +{"train_loss": 0.0894770473241806, "global_step": 752, "epoch": 6, "lr": 9.999685816207521e-05} +{"train_loss": 0.06131419911980629, "global_step": 753, "epoch": 6, "lr": 9.999683327659015e-05} +{"train_loss": 0.06121160462498665, "global_step": 754, "epoch": 6, "lr": 9.999680829294165e-05} +{"train_loss": 0.0786774531006813, "global_step": 755, "epoch": 6, "lr": 9.999678321112975e-05} +{"train_loss": 0.06695454567670822, "global_step": 756, "epoch": 6, "lr": 9.999675803115451e-05} +{"train_loss": 0.07556966692209244, "global_step": 757, "epoch": 6, "lr": 9.9996732753016e-05} +{"train_loss": 0.07386508584022522, "global_step": 758, "epoch": 6, "lr": 9.999670737671422e-05} +{"train_loss": 0.062461622059345245, "global_step": 759, "epoch": 6, "lr": 9.999668190224925e-05} +{"train_loss": 0.06792375445365906, "global_step": 760, "epoch": 6, "lr": 9.999665632962114e-05} +{"train_loss": 0.07170980423688889, "global_step": 761, "epoch": 6, "lr": 9.999663065882994e-05} +{"train_loss": 0.06970884650945663, "global_step": 762, "epoch": 6, "lr": 9.99966048898757e-05} +{"train_loss": 0.0662086009979248, "global_step": 763, "epoch": 6, "lr": 9.999657902275845e-05} +{"train_loss": 0.07493769377470016, "global_step": 764, "epoch": 6, "lr": 9.999655305747828e-05} +{"train_loss": 0.05981176346540451, "global_step": 765, "epoch": 6, "lr": 9.999652699403521e-05} +{"train_loss": 0.07013025134801865, "global_step": 766, "epoch": 6, "lr": 9.999650083242929e-05} +{"train_loss": 0.07243189960718155, "global_step": 767, "epoch": 6, "lr": 9.99964745726606e-05} +{"train_loss": 0.07293212413787842, "global_step": 768, "epoch": 6, "lr": 9.999644821472915e-05} +{"train_loss": 0.06576994061470032, "global_step": 769, "epoch": 6, "lr": 9.999642175863504e-05} +{"train_loss": 0.06981278955936432, "global_step": 770, "epoch": 6, "lr": 9.999639520437829e-05} +{"train_loss": 0.0751032754778862, "global_step": 771, "epoch": 6, "lr": 9.999636855195895e-05} +{"train_loss": 0.06627431511878967, "global_step": 772, "epoch": 6, "lr": 9.999634180137709e-05} +{"train_loss": 0.06628792732954025, "global_step": 773, "epoch": 6, "lr": 9.999631495263275e-05} +{"train_loss": 0.05913280323147774, "global_step": 774, "epoch": 6, "lr": 9.999628800572601e-05} +{"train_loss": 0.06864520907402039, "global_step": 775, "epoch": 6, "lr": 9.999626096065687e-05} +{"train_loss": 0.05941295996308327, "global_step": 776, "epoch": 6, "lr": 9.999623381742542e-05} +{"train_loss": 0.06787695735692978, "global_step": 777, "epoch": 6, "lr": 9.999620657603172e-05} +{"train_loss": 0.06946257501840591, "global_step": 778, "epoch": 6, "lr": 9.99961792364758e-05} +{"train_loss": 0.06558630615472794, "global_step": 779, "epoch": 6, "lr": 9.999615179875772e-05} +{"train_loss": 0.0783933699131012, "global_step": 780, "epoch": 6, "lr": 9.999612426287753e-05} +{"train_loss": 0.067718006670475, "global_step": 781, "epoch": 6, "lr": 9.999609662883531e-05} +{"train_loss": 0.06832484900951385, "global_step": 782, "epoch": 6, "lr": 9.999606889663107e-05} +{"train_loss": 0.062190551310777664, "global_step": 783, "epoch": 6, "lr": 9.999604106626493e-05} +{"train_loss": 0.07610957324504852, "global_step": 784, "epoch": 6, "lr": 9.999601313773687e-05} +{"train_loss": 0.08211284875869751, "global_step": 785, "epoch": 6, "lr": 9.999598511104698e-05} +{"train_loss": 0.06670928746461868, "global_step": 786, "epoch": 6, "lr": 9.999595698619533e-05} +{"train_loss": 0.07564691454172134, "global_step": 787, "epoch": 6, "lr": 9.999592876318196e-05} +{"train_loss": 0.07152041792869568, "global_step": 788, "epoch": 6, "lr": 9.999590044200692e-05} +{"train_loss": 0.07254879921674728, "global_step": 789, "epoch": 6, "lr": 9.999587202267027e-05} +{"train_loss": 0.05901217833161354, "global_step": 790, "epoch": 6, "lr": 9.999584350517206e-05} +{"train_loss": 0.07181142270565033, "global_step": 791, "epoch": 6, "lr": 9.999581488951236e-05} +{"train_loss": 0.07629835605621338, "global_step": 792, "epoch": 6, "lr": 9.999578617569123e-05} +{"train_loss": 0.06382226943969727, "global_step": 793, "epoch": 6, "lr": 9.99957573637087e-05} +{"train_loss": 0.07889429479837418, "global_step": 794, "epoch": 6, "lr": 9.999572845356484e-05} +{"train_loss": 0.07157197594642639, "global_step": 795, "epoch": 6, "lr": 9.999569944525972e-05} +{"train_loss": 0.08873733133077621, "global_step": 796, "epoch": 6, "lr": 9.999567033879338e-05} +{"train_loss": 0.07302388548851013, "global_step": 797, "epoch": 6, "lr": 9.999564113416588e-05} +{"train_loss": 0.06728344410657883, "global_step": 798, "epoch": 6, "lr": 9.999561183137728e-05} +{"train_loss": 0.07905445247888565, "global_step": 799, "epoch": 6, "lr": 9.999558243042764e-05} +{"train_loss": 0.07160060852766037, "global_step": 800, "epoch": 6, "lr": 9.999555293131702e-05} +{"train_loss": 0.06856775283813477, "global_step": 801, "epoch": 6, "lr": 9.999552333404545e-05} +{"train_loss": 0.09902480989694595, "global_step": 802, "epoch": 6, "lr": 9.999549363861304e-05} +{"train_loss": 0.06816524267196655, "global_step": 803, "epoch": 6, "lr": 9.999546384501981e-05} +{"train_loss": 0.07684038579463959, "global_step": 804, "epoch": 6, "lr": 9.999543395326581e-05} +{"train_loss": 0.09484396874904633, "global_step": 805, "epoch": 6, "lr": 9.999540396335114e-05} +{"train_loss": 0.06390725076198578, "global_step": 806, "epoch": 6, "lr": 9.999537387527583e-05} +{"train_loss": 0.08196623623371124, "global_step": 807, "epoch": 6, "lr": 9.999534368903994e-05} +{"train_loss": 0.0807173103094101, "global_step": 808, "epoch": 6, "lr": 9.999531340464354e-05} +{"train_loss": 0.0900232121348381, "global_step": 809, "epoch": 6, "lr": 9.999528302208668e-05} +{"train_loss": 0.05442959442734718, "global_step": 810, "epoch": 6, "lr": 9.999525254136942e-05} +{"train_loss": 0.07893925905227661, "global_step": 811, "epoch": 6, "lr": 9.999522196249182e-05} +{"train_loss": 0.09413398057222366, "global_step": 812, "epoch": 6, "lr": 9.999519128545396e-05} +{"train_loss": 0.06765428185462952, "global_step": 813, "epoch": 6, "lr": 9.999516051025586e-05} +{"train_loss": 0.06543569266796112, "global_step": 814, "epoch": 6, "lr": 9.999512963689762e-05} +{"train_loss": 0.082463838160038, "global_step": 815, "epoch": 6, "lr": 9.999509866537929e-05} +{"train_loss": 0.06938619911670685, "global_step": 816, "epoch": 6, "lr": 9.99950675957009e-05} +{"train_loss": 0.08212997764348984, "global_step": 817, "epoch": 6, "lr": 9.999503642786255e-05} +{"train_loss": 0.06916835904121399, "global_step": 818, "epoch": 6, "lr": 9.999500516186428e-05} +{"train_loss": 0.08104268461465836, "global_step": 819, "epoch": 6, "lr": 9.999497379770617e-05} +{"train_loss": 0.0644562840461731, "global_step": 820, "epoch": 6, "lr": 9.999494233538827e-05} +{"train_loss": 0.07538159191608429, "global_step": 821, "epoch": 6, "lr": 9.999491077491063e-05} +{"train_loss": 0.07104053348302841, "global_step": 822, "epoch": 6, "lr": 9.999487911627334e-05} +{"train_loss": 0.09793625771999359, "global_step": 823, "epoch": 6, "lr": 9.999484735947644e-05} +{"train_loss": 0.07190847396850586, "global_step": 824, "epoch": 6, "lr": 9.999481550451998e-05} +{"train_loss": 0.06304429471492767, "global_step": 825, "epoch": 6, "lr": 9.999478355140408e-05} +{"train_loss": 0.0772833451628685, "global_step": 826, "epoch": 6, "lr": 9.999475150012873e-05} +{"train_loss": 0.06692571938037872, "global_step": 827, "epoch": 6, "lr": 9.999471935069405e-05} +{"train_loss": 0.08251187205314636, "global_step": 828, "epoch": 6, "lr": 9.999468710310006e-05} +{"train_loss": 0.06712504476308823, "global_step": 829, "epoch": 6, "lr": 9.999465475734684e-05} +{"train_loss": 0.07531493157148361, "global_step": 830, "epoch": 6, "lr": 9.999462231343447e-05} +{"train_loss": 0.0911073163151741, "global_step": 831, "epoch": 6, "lr": 9.9994589771363e-05} +{"train_loss": 0.0733126947859756, "global_step": 832, "epoch": 6, "lr": 9.999455713113249e-05, "val_loss": 0.0994868054986} +{"train_loss": 0.06636610627174377, "global_step": 833, "epoch": 7, "lr": 9.999452439274302e-05} +{"train_loss": 0.07621198147535324, "global_step": 834, "epoch": 7, "lr": 9.999449155619463e-05} +{"train_loss": 0.06716684252023697, "global_step": 835, "epoch": 7, "lr": 9.999445862148739e-05} +{"train_loss": 0.07778327912092209, "global_step": 836, "epoch": 7, "lr": 9.999442558862137e-05} +{"train_loss": 0.06881701946258545, "global_step": 837, "epoch": 7, "lr": 9.999439245759666e-05} +{"train_loss": 0.07379816472530365, "global_step": 838, "epoch": 7, "lr": 9.99943592284133e-05} +{"train_loss": 0.06707817316055298, "global_step": 839, "epoch": 7, "lr": 9.999432590107133e-05} +{"train_loss": 0.058975864201784134, "global_step": 840, "epoch": 7, "lr": 9.999429247557087e-05} +{"train_loss": 0.07892701029777527, "global_step": 841, "epoch": 7, "lr": 9.999425895191193e-05} +{"train_loss": 0.061427682638168335, "global_step": 842, "epoch": 7, "lr": 9.999422533009462e-05} +{"train_loss": 0.07448059320449829, "global_step": 843, "epoch": 7, "lr": 9.999419161011898e-05} +{"train_loss": 0.07065232843160629, "global_step": 844, "epoch": 7, "lr": 9.99941577919851e-05} +{"train_loss": 0.07319070398807526, "global_step": 845, "epoch": 7, "lr": 9.999412387569302e-05} +{"train_loss": 0.06864415109157562, "global_step": 846, "epoch": 7, "lr": 9.999408986124283e-05} +{"train_loss": 0.07911872863769531, "global_step": 847, "epoch": 7, "lr": 9.999405574863458e-05} +{"train_loss": 0.06656007468700409, "global_step": 848, "epoch": 7, "lr": 9.999402153786834e-05} +{"train_loss": 0.08286021649837494, "global_step": 849, "epoch": 7, "lr": 9.99939872289442e-05} +{"train_loss": 0.05595461279153824, "global_step": 850, "epoch": 7, "lr": 9.999395282186218e-05} +{"train_loss": 0.08945394307374954, "global_step": 851, "epoch": 7, "lr": 9.999391831662239e-05} +{"train_loss": 0.06535445898771286, "global_step": 852, "epoch": 7, "lr": 9.999388371322487e-05} +{"train_loss": 0.06439374387264252, "global_step": 853, "epoch": 7, "lr": 9.999384901166971e-05} +{"train_loss": 0.08616528660058975, "global_step": 854, "epoch": 7, "lr": 9.999381421195697e-05} +{"train_loss": 0.0625547468662262, "global_step": 855, "epoch": 7, "lr": 9.999377931408671e-05} +{"train_loss": 0.07865289598703384, "global_step": 856, "epoch": 7, "lr": 9.999374431805901e-05} +{"train_loss": 0.050195686519145966, "global_step": 857, "epoch": 7, "lr": 9.999370922387393e-05} +{"train_loss": 0.08466292172670364, "global_step": 858, "epoch": 7, "lr": 9.999367403153155e-05} +{"train_loss": 0.07132234424352646, "global_step": 859, "epoch": 7, "lr": 9.999363874103193e-05} +{"train_loss": 0.05967652052640915, "global_step": 860, "epoch": 7, "lr": 9.999360335237513e-05} +{"train_loss": 0.06896653771400452, "global_step": 861, "epoch": 7, "lr": 9.999356786556124e-05} +{"train_loss": 0.07758303731679916, "global_step": 862, "epoch": 7, "lr": 9.999353228059033e-05} +{"train_loss": 0.06071298569440842, "global_step": 863, "epoch": 7, "lr": 9.999349659746244e-05} +{"train_loss": 0.07009728997945786, "global_step": 864, "epoch": 7, "lr": 9.999346081617769e-05} +{"train_loss": 0.06696176528930664, "global_step": 865, "epoch": 7, "lr": 9.99934249367361e-05} +{"train_loss": 0.06406787782907486, "global_step": 866, "epoch": 7, "lr": 9.999338895913776e-05} +{"train_loss": 0.06986134499311447, "global_step": 867, "epoch": 7, "lr": 9.999335288338274e-05} +{"train_loss": 0.05931619554758072, "global_step": 868, "epoch": 7, "lr": 9.999331670947112e-05} +{"train_loss": 0.05949525535106659, "global_step": 869, "epoch": 7, "lr": 9.999328043740296e-05} +{"train_loss": 0.05601106584072113, "global_step": 870, "epoch": 7, "lr": 9.999324406717834e-05} +{"train_loss": 0.06187962368130684, "global_step": 871, "epoch": 7, "lr": 9.999320759879731e-05} +{"train_loss": 0.06674595177173615, "global_step": 872, "epoch": 7, "lr": 9.999317103225999e-05} +{"train_loss": 0.06533556431531906, "global_step": 873, "epoch": 7, "lr": 9.999313436756639e-05} +{"train_loss": 0.05673433467745781, "global_step": 874, "epoch": 7, "lr": 9.999309760471663e-05} +{"train_loss": 0.04850281402468681, "global_step": 875, "epoch": 7, "lr": 9.999306074371074e-05} +{"train_loss": 0.07048709690570831, "global_step": 876, "epoch": 7, "lr": 9.999302378454884e-05} +{"train_loss": 0.052274372428655624, "global_step": 877, "epoch": 7, "lr": 9.999298672723097e-05} +{"train_loss": 0.055770471692085266, "global_step": 878, "epoch": 7, "lr": 9.99929495717572e-05} +{"train_loss": 0.06606807559728622, "global_step": 879, "epoch": 7, "lr": 9.999291231812765e-05} +{"train_loss": 0.06332707405090332, "global_step": 880, "epoch": 7, "lr": 9.999287496634233e-05} +{"train_loss": 0.07485463470220566, "global_step": 881, "epoch": 7, "lr": 9.999283751640134e-05} +{"train_loss": 0.0648370012640953, "global_step": 882, "epoch": 7, "lr": 9.999279996830475e-05} +{"train_loss": 0.06328950077295303, "global_step": 883, "epoch": 7, "lr": 9.999276232205265e-05} +{"train_loss": 0.07173404097557068, "global_step": 884, "epoch": 7, "lr": 9.99927245776451e-05} +{"train_loss": 0.05967516079545021, "global_step": 885, "epoch": 7, "lr": 9.999268673508217e-05} +{"train_loss": 0.05644255131483078, "global_step": 886, "epoch": 7, "lr": 9.999264879436395e-05} +{"train_loss": 0.0713311955332756, "global_step": 887, "epoch": 7, "lr": 9.99926107554905e-05} +{"train_loss": 0.07039865106344223, "global_step": 888, "epoch": 7, "lr": 9.999257261846191e-05} +{"train_loss": 0.057115186005830765, "global_step": 889, "epoch": 7, "lr": 9.999253438327823e-05} +{"train_loss": 0.08235074579715729, "global_step": 890, "epoch": 7, "lr": 9.999249604993956e-05} +{"train_loss": 0.06025243178009987, "global_step": 891, "epoch": 7, "lr": 9.999245761844596e-05} +{"train_loss": 0.06548936665058136, "global_step": 892, "epoch": 7, "lr": 9.99924190887975e-05} +{"train_loss": 0.0641290545463562, "global_step": 893, "epoch": 7, "lr": 9.999238046099428e-05} +{"train_loss": 0.05645425617694855, "global_step": 894, "epoch": 7, "lr": 9.999234173503636e-05} +{"train_loss": 0.0672619566321373, "global_step": 895, "epoch": 7, "lr": 9.999230291092382e-05} +{"train_loss": 0.05881804600358009, "global_step": 896, "epoch": 7, "lr": 9.999226398865673e-05} +{"train_loss": 0.0576966218650341, "global_step": 897, "epoch": 7, "lr": 9.999222496823518e-05} +{"train_loss": 0.057192910462617874, "global_step": 898, "epoch": 7, "lr": 9.999218584965922e-05} +{"train_loss": 0.06998151540756226, "global_step": 899, "epoch": 7, "lr": 9.999214663292896e-05} +{"train_loss": 0.0714801773428917, "global_step": 900, "epoch": 7, "lr": 9.999210731804445e-05} +{"train_loss": 0.058598846197128296, "global_step": 901, "epoch": 7, "lr": 9.999206790500577e-05} +{"train_loss": 0.06097846478223801, "global_step": 902, "epoch": 7, "lr": 9.999202839381303e-05} +{"train_loss": 0.06919194757938385, "global_step": 903, "epoch": 7, "lr": 9.999198878446626e-05} +{"train_loss": 0.05315614491701126, "global_step": 904, "epoch": 7, "lr": 9.999194907696558e-05} +{"train_loss": 0.08467177301645279, "global_step": 905, "epoch": 7, "lr": 9.999190927131103e-05} +{"train_loss": 0.057172611355781555, "global_step": 906, "epoch": 7, "lr": 9.999186936750272e-05} +{"train_loss": 0.06655515730381012, "global_step": 907, "epoch": 7, "lr": 9.999182936554071e-05} +{"train_loss": 0.060619253665208817, "global_step": 908, "epoch": 7, "lr": 9.99917892654251e-05} +{"train_loss": 0.07098179310560226, "global_step": 909, "epoch": 7, "lr": 9.999174906715593e-05} +{"train_loss": 0.06332752108573914, "global_step": 910, "epoch": 7, "lr": 9.99917087707333e-05} +{"train_loss": 0.0705980509519577, "global_step": 911, "epoch": 7, "lr": 9.999166837615732e-05} +{"train_loss": 0.05587853491306305, "global_step": 912, "epoch": 7, "lr": 9.9991627883428e-05} +{"train_loss": 0.0624457411468029, "global_step": 913, "epoch": 7, "lr": 9.99915872925455e-05} +{"train_loss": 0.056266941130161285, "global_step": 914, "epoch": 7, "lr": 9.999154660350982e-05} +{"train_loss": 0.08363386988639832, "global_step": 915, "epoch": 7, "lr": 9.99915058163211e-05} +{"train_loss": 0.06319871544837952, "global_step": 916, "epoch": 7, "lr": 9.99914649309794e-05} +{"train_loss": 0.06066501885652542, "global_step": 917, "epoch": 7, "lr": 9.99914239474848e-05} +{"train_loss": 0.05441950634121895, "global_step": 918, "epoch": 7, "lr": 9.999138286583738e-05} +{"train_loss": 0.05023985356092453, "global_step": 919, "epoch": 7, "lr": 9.999134168603721e-05} +{"train_loss": 0.05853842943906784, "global_step": 920, "epoch": 7, "lr": 9.999130040808439e-05} +{"train_loss": 0.05685150995850563, "global_step": 921, "epoch": 7, "lr": 9.999125903197898e-05} +{"train_loss": 0.05872054025530815, "global_step": 922, "epoch": 7, "lr": 9.999121755772109e-05} +{"train_loss": 0.0693797767162323, "global_step": 923, "epoch": 7, "lr": 9.99911759853108e-05} +{"train_loss": 0.0700354129076004, "global_step": 924, "epoch": 7, "lr": 9.999113431474815e-05} +{"train_loss": 0.07335640490055084, "global_step": 925, "epoch": 7, "lr": 9.999109254603325e-05} +{"train_loss": 0.05712655931711197, "global_step": 926, "epoch": 7, "lr": 9.999105067916618e-05} +{"train_loss": 0.047858480364084244, "global_step": 927, "epoch": 7, "lr": 9.999100871414704e-05} +{"train_loss": 0.04776475951075554, "global_step": 928, "epoch": 7, "lr": 9.999096665097588e-05} +{"train_loss": 0.06758512556552887, "global_step": 929, "epoch": 7, "lr": 9.999092448965281e-05} +{"train_loss": 0.056729983538389206, "global_step": 930, "epoch": 7, "lr": 9.999088223017788e-05} +{"train_loss": 0.07286331057548523, "global_step": 931, "epoch": 7, "lr": 9.999083987255121e-05} +{"train_loss": 0.055746737867593765, "global_step": 932, "epoch": 7, "lr": 9.999079741677287e-05} +{"train_loss": 0.06540562957525253, "global_step": 933, "epoch": 7, "lr": 9.999075486284292e-05} +{"train_loss": 0.06382681429386139, "global_step": 934, "epoch": 7, "lr": 9.999071221076149e-05} +{"train_loss": 0.06033695861697197, "global_step": 935, "epoch": 7, "lr": 9.999066946052862e-05} +{"train_loss": 0.06632079184055328, "global_step": 936, "epoch": 7, "lr": 9.99906266121444e-05} +{"train_loss": 0.06475852429866791, "global_step": 937, "epoch": 7, "lr": 9.999058366560894e-05} +{"train_loss": 0.06848855316638947, "global_step": 938, "epoch": 7, "lr": 9.99905406209223e-05} +{"train_loss": 0.049736008048057556, "global_step": 939, "epoch": 7, "lr": 9.99904974780846e-05} +{"train_loss": 0.05563788488507271, "global_step": 940, "epoch": 7, "lr": 9.999045423709588e-05} +{"train_loss": 0.05275775119662285, "global_step": 941, "epoch": 7, "lr": 9.999041089795624e-05} +{"train_loss": 0.05684391409158707, "global_step": 942, "epoch": 7, "lr": 9.999036746066577e-05} +{"train_loss": 0.06378220021724701, "global_step": 943, "epoch": 7, "lr": 9.999032392522457e-05} +{"train_loss": 0.059039849787950516, "global_step": 944, "epoch": 7, "lr": 9.99902802916327e-05} +{"train_loss": 0.04618312790989876, "global_step": 945, "epoch": 7, "lr": 9.999023655989026e-05} +{"train_loss": 0.06420592963695526, "global_step": 946, "epoch": 7, "lr": 9.999019272999732e-05} +{"train_loss": 0.05262071266770363, "global_step": 947, "epoch": 7, "lr": 9.999014880195399e-05} +{"train_loss": 0.04485858604311943, "global_step": 948, "epoch": 7, "lr": 9.999010477576033e-05} +{"train_loss": 0.04907489940524101, "global_step": 949, "epoch": 7, "lr": 9.999006065141645e-05} +{"train_loss": 0.061576299369335175, "global_step": 950, "epoch": 7, "lr": 9.999001642892241e-05} +{"train_loss": 0.06423419679538543, "global_step": 951, "epoch": 7, "lr": 9.998997210827834e-05, "val_loss": 0.0736088976264} +{"train_loss": 0.04818742722272873, "global_step": 952, "epoch": 8, "lr": 9.998992768948428e-05} +{"train_loss": 0.06994882225990295, "global_step": 953, "epoch": 8, "lr": 9.998988317254034e-05} +{"train_loss": 0.04818979650735855, "global_step": 954, "epoch": 8, "lr": 9.998983855744662e-05} +{"train_loss": 0.0599747970700264, "global_step": 955, "epoch": 8, "lr": 9.998979384420318e-05} +{"train_loss": 0.05603285878896713, "global_step": 956, "epoch": 8, "lr": 9.998974903281011e-05} +{"train_loss": 0.05848710983991623, "global_step": 957, "epoch": 8, "lr": 9.998970412326753e-05} +{"train_loss": 0.06377891451120377, "global_step": 958, "epoch": 8, "lr": 9.99896591155755e-05} +{"train_loss": 0.05506725236773491, "global_step": 959, "epoch": 8, "lr": 9.99896140097341e-05} +{"train_loss": 0.05036267265677452, "global_step": 960, "epoch": 8, "lr": 9.998956880574345e-05} +{"train_loss": 0.059326738119125366, "global_step": 961, "epoch": 8, "lr": 9.998952350360362e-05} +{"train_loss": 0.05101526901125908, "global_step": 962, "epoch": 8, "lr": 9.998947810331469e-05} +{"train_loss": 0.06860248744487762, "global_step": 963, "epoch": 8, "lr": 9.998943260487677e-05} +{"train_loss": 0.06676679104566574, "global_step": 964, "epoch": 8, "lr": 9.998938700828995e-05} +{"train_loss": 0.049568451941013336, "global_step": 965, "epoch": 8, "lr": 9.998934131355429e-05} +{"train_loss": 0.05632403492927551, "global_step": 966, "epoch": 8, "lr": 9.998929552066991e-05} +{"train_loss": 0.04804094880819321, "global_step": 967, "epoch": 8, "lr": 9.998924962963689e-05} +{"train_loss": 0.05023656785488129, "global_step": 968, "epoch": 8, "lr": 9.998920364045531e-05} +{"train_loss": 0.06216954067349434, "global_step": 969, "epoch": 8, "lr": 9.998915755312528e-05} +{"train_loss": 0.053467683494091034, "global_step": 970, "epoch": 8, "lr": 9.998911136764686e-05} +{"train_loss": 0.05206162855029106, "global_step": 971, "epoch": 8, "lr": 9.998906508402017e-05} +{"train_loss": 0.06460943818092346, "global_step": 972, "epoch": 8, "lr": 9.998901870224531e-05} +{"train_loss": 0.07093333452939987, "global_step": 973, "epoch": 8, "lr": 9.998897222232233e-05} +{"train_loss": 0.05288504809141159, "global_step": 974, "epoch": 8, "lr": 9.998892564425136e-05} +{"train_loss": 0.05624646320939064, "global_step": 975, "epoch": 8, "lr": 9.998887896803246e-05} +{"train_loss": 0.06174591928720474, "global_step": 976, "epoch": 8, "lr": 9.998883219366575e-05} +{"train_loss": 0.05661923438310623, "global_step": 977, "epoch": 8, "lr": 9.998878532115131e-05} +{"train_loss": 0.055534932762384415, "global_step": 978, "epoch": 8, "lr": 9.998873835048921e-05} +{"train_loss": 0.06431189179420471, "global_step": 979, "epoch": 8, "lr": 9.998869128167957e-05} +{"train_loss": 0.04421638697385788, "global_step": 980, "epoch": 8, "lr": 9.998864411472249e-05} +{"train_loss": 0.06720801442861557, "global_step": 981, "epoch": 8, "lr": 9.998859684961803e-05} +{"train_loss": 0.04780973121523857, "global_step": 982, "epoch": 8, "lr": 9.998854948636631e-05} +{"train_loss": 0.05268504098057747, "global_step": 983, "epoch": 8, "lr": 9.99885020249674e-05} +{"train_loss": 0.05016179010272026, "global_step": 984, "epoch": 8, "lr": 9.998845446542142e-05} +{"train_loss": 0.05255300924181938, "global_step": 985, "epoch": 8, "lr": 9.998840680772845e-05} +{"train_loss": 0.05902948975563049, "global_step": 986, "epoch": 8, "lr": 9.99883590518886e-05} +{"train_loss": 0.05516144633293152, "global_step": 987, "epoch": 8, "lr": 9.998831119790191e-05} +{"train_loss": 0.06302471458911896, "global_step": 988, "epoch": 8, "lr": 9.998826324576853e-05} +{"train_loss": 0.06151392310857773, "global_step": 989, "epoch": 8, "lr": 9.998821519548855e-05} +{"train_loss": 0.06336849927902222, "global_step": 990, "epoch": 8, "lr": 9.998816704706203e-05} +{"train_loss": 0.05124702304601669, "global_step": 991, "epoch": 8, "lr": 9.998811880048909e-05} +{"train_loss": 0.05488477274775505, "global_step": 992, "epoch": 8, "lr": 9.998807045576982e-05} +{"train_loss": 0.06382053345441818, "global_step": 993, "epoch": 8, "lr": 9.998802201290431e-05} +{"train_loss": 0.05422718822956085, "global_step": 994, "epoch": 8, "lr": 9.998797347189267e-05} +{"train_loss": 0.052227992564439774, "global_step": 995, "epoch": 8, "lr": 9.998792483273497e-05} +{"train_loss": 0.07023390382528305, "global_step": 996, "epoch": 8, "lr": 9.998787609543134e-05} +{"train_loss": 0.0559525191783905, "global_step": 997, "epoch": 8, "lr": 9.998782725998183e-05} +{"train_loss": 0.057595394551754, "global_step": 998, "epoch": 8, "lr": 9.99877783263866e-05} +{"train_loss": 0.05695336312055588, "global_step": 999, "epoch": 8, "lr": 9.998772929464567e-05} +{"train_loss": 0.05552202835679054, "global_step": 1000, "epoch": 8, "lr": 9.99876801647592e-05} +{"train_loss": 0.056999191641807556, "global_step": 1001, "epoch": 8, "lr": 9.998763093672722e-05} +{"train_loss": 0.05864353105425835, "global_step": 1002, "epoch": 8, "lr": 9.998758161054991e-05} +{"train_loss": 0.05126170068979263, "global_step": 1003, "epoch": 8, "lr": 9.99875321862273e-05} +{"train_loss": 0.07057032734155655, "global_step": 1004, "epoch": 8, "lr": 9.998748266375952e-05} +{"train_loss": 0.051459766924381256, "global_step": 1005, "epoch": 8, "lr": 9.998743304314666e-05} +{"train_loss": 0.048487015068531036, "global_step": 1006, "epoch": 8, "lr": 9.998738332438882e-05} +{"train_loss": 0.05118818208575249, "global_step": 1007, "epoch": 8, "lr": 9.998733350748608e-05} +{"train_loss": 0.05812275782227516, "global_step": 1008, "epoch": 8, "lr": 9.998728359243856e-05} +{"train_loss": 0.04900909587740898, "global_step": 1009, "epoch": 8, "lr": 9.998723357924635e-05} +{"train_loss": 0.05411754176020622, "global_step": 1010, "epoch": 8, "lr": 9.998718346790954e-05} +{"train_loss": 0.05145876854658127, "global_step": 1011, "epoch": 8, "lr": 9.998713325842823e-05} +{"train_loss": 0.0537584163248539, "global_step": 1012, "epoch": 8, "lr": 9.998708295080255e-05} +{"train_loss": 0.08075409382581711, "global_step": 1013, "epoch": 8, "lr": 9.998703254503255e-05} +{"train_loss": 0.05148407444357872, "global_step": 1014, "epoch": 8, "lr": 9.998698204111836e-05} +{"train_loss": 0.06065114587545395, "global_step": 1015, "epoch": 8, "lr": 9.998693143906006e-05} +{"train_loss": 0.052589185535907745, "global_step": 1016, "epoch": 8, "lr": 9.998688073885778e-05} +{"train_loss": 0.05623337998986244, "global_step": 1017, "epoch": 8, "lr": 9.998682994051158e-05} +{"train_loss": 0.05970640853047371, "global_step": 1018, "epoch": 8, "lr": 9.99867790440216e-05} +{"train_loss": 0.052406568080186844, "global_step": 1019, "epoch": 8, "lr": 9.99867280493879e-05} +{"train_loss": 0.05828937888145447, "global_step": 1020, "epoch": 8, "lr": 9.998667695661062e-05} +{"train_loss": 0.048405971378088, "global_step": 1021, "epoch": 8, "lr": 9.998662576568982e-05} +{"train_loss": 0.04998724162578583, "global_step": 1022, "epoch": 8, "lr": 9.998657447662563e-05} +{"train_loss": 0.05665498971939087, "global_step": 1023, "epoch": 8, "lr": 9.998652308941814e-05} +{"train_loss": 0.05069977417588234, "global_step": 1024, "epoch": 8, "lr": 9.998647160406746e-05} +{"train_loss": 0.05601339414715767, "global_step": 1025, "epoch": 8, "lr": 9.998642002057367e-05} +{"train_loss": 0.05061689764261246, "global_step": 1026, "epoch": 8, "lr": 9.998636833893688e-05} +{"train_loss": 0.04123854264616966, "global_step": 1027, "epoch": 8, "lr": 9.998631655915723e-05} +{"train_loss": 0.05153762549161911, "global_step": 1028, "epoch": 8, "lr": 9.998626468123475e-05} +{"train_loss": 0.05914721637964249, "global_step": 1029, "epoch": 8, "lr": 9.998621270516959e-05} +{"train_loss": 0.05185601860284805, "global_step": 1030, "epoch": 8, "lr": 9.998616063096185e-05} +{"train_loss": 0.0587788000702858, "global_step": 1031, "epoch": 8, "lr": 9.998610845861163e-05} +{"train_loss": 0.04688786715269089, "global_step": 1032, "epoch": 8, "lr": 9.9986056188119e-05} +{"train_loss": 0.05487389117479324, "global_step": 1033, "epoch": 8, "lr": 9.99860038194841e-05} +{"train_loss": 0.0442991703748703, "global_step": 1034, "epoch": 8, "lr": 9.998595135270705e-05} +{"train_loss": 0.041080184280872345, "global_step": 1035, "epoch": 8, "lr": 9.998589878778789e-05} +{"train_loss": 0.05142317712306976, "global_step": 1036, "epoch": 8, "lr": 9.998584612472677e-05} +{"train_loss": 0.04369791969656944, "global_step": 1037, "epoch": 8, "lr": 9.998579336352379e-05} +{"train_loss": 0.05152389034628868, "global_step": 1038, "epoch": 8, "lr": 9.998574050417902e-05} +{"train_loss": 0.05114441737532616, "global_step": 1039, "epoch": 8, "lr": 9.99856875466926e-05} +{"train_loss": 0.04873828589916229, "global_step": 1040, "epoch": 8, "lr": 9.998563449106464e-05} +{"train_loss": 0.05064019933342934, "global_step": 1041, "epoch": 8, "lr": 9.998558133729521e-05} +{"train_loss": 0.04180605337023735, "global_step": 1042, "epoch": 8, "lr": 9.998552808538443e-05} +{"train_loss": 0.04232286661863327, "global_step": 1043, "epoch": 8, "lr": 9.998547473533242e-05} +{"train_loss": 0.05864877626299858, "global_step": 1044, "epoch": 8, "lr": 9.998542128713926e-05} +{"train_loss": 0.05664630979299545, "global_step": 1045, "epoch": 8, "lr": 9.998536774080506e-05} +{"train_loss": 0.05216903239488602, "global_step": 1046, "epoch": 8, "lr": 9.998531409632994e-05} +{"train_loss": 0.05155644565820694, "global_step": 1047, "epoch": 8, "lr": 9.9985260353714e-05} +{"train_loss": 0.047849394381046295, "global_step": 1048, "epoch": 8, "lr": 9.998520651295733e-05} +{"train_loss": 0.049743954092264175, "global_step": 1049, "epoch": 8, "lr": 9.998515257406005e-05} +{"train_loss": 0.05948677659034729, "global_step": 1050, "epoch": 8, "lr": 9.998509853702228e-05} +{"train_loss": 0.05378634110093117, "global_step": 1051, "epoch": 8, "lr": 9.998504440184407e-05} +{"train_loss": 0.05931583046913147, "global_step": 1052, "epoch": 8, "lr": 9.998499016852559e-05} +{"train_loss": 0.04948817193508148, "global_step": 1053, "epoch": 8, "lr": 9.998493583706694e-05} +{"train_loss": 0.05224044248461723, "global_step": 1054, "epoch": 8, "lr": 9.998488140746818e-05} +{"train_loss": 0.047266628593206406, "global_step": 1055, "epoch": 8, "lr": 9.998482687972945e-05} +{"train_loss": 0.048131171613931656, "global_step": 1056, "epoch": 8, "lr": 9.998477225385086e-05} +{"train_loss": 0.044389232993125916, "global_step": 1057, "epoch": 8, "lr": 9.99847175298325e-05} +{"train_loss": 0.043190158903598785, "global_step": 1058, "epoch": 8, "lr": 9.99846627076745e-05} +{"train_loss": 0.05078746750950813, "global_step": 1059, "epoch": 8, "lr": 9.998460778737694e-05} +{"train_loss": 0.05672510340809822, "global_step": 1060, "epoch": 8, "lr": 9.998455276893997e-05} +{"train_loss": 0.049385931342840195, "global_step": 1061, "epoch": 8, "lr": 9.998449765236364e-05} +{"train_loss": 0.06183193624019623, "global_step": 1062, "epoch": 8, "lr": 9.99844424376481e-05} +{"train_loss": 0.06030821055173874, "global_step": 1063, "epoch": 8, "lr": 9.998438712479345e-05} +{"train_loss": 0.044946007430553436, "global_step": 1064, "epoch": 8, "lr": 9.998433171379979e-05} +{"train_loss": 0.061940599232912064, "global_step": 1065, "epoch": 8, "lr": 9.998427620466726e-05} +{"train_loss": 0.04654991254210472, "global_step": 1066, "epoch": 8, "lr": 9.998422059739591e-05} +{"train_loss": 0.059761423617601395, "global_step": 1067, "epoch": 8, "lr": 9.99841648919859e-05} +{"train_loss": 0.044098395854234695, "global_step": 1068, "epoch": 8, "lr": 9.998410908843732e-05} +{"train_loss": 0.050038885325193405, "global_step": 1069, "epoch": 8, "lr": 9.998405318675028e-05} +{"train_loss": 0.05450084846185035, "global_step": 1070, "epoch": 8, "lr": 9.998399718692489e-05, "val_loss": 0.07298924028873444} +{"train_loss": 0.050906796008348465, "global_step": 1071, "epoch": 9, "lr": 9.998394108896127e-05} +{"train_loss": 0.052017468959093094, "global_step": 1072, "epoch": 9, "lr": 9.998388489285952e-05} +{"train_loss": 0.059814728796482086, "global_step": 1073, "epoch": 9, "lr": 9.998382859861974e-05} +{"train_loss": 0.05676431581377983, "global_step": 1074, "epoch": 9, "lr": 9.998377220624206e-05} +{"train_loss": 0.04811756685376167, "global_step": 1075, "epoch": 9, "lr": 9.998371571572657e-05} +{"train_loss": 0.057998646050691605, "global_step": 1076, "epoch": 9, "lr": 9.998365912707342e-05} +{"train_loss": 0.058860696852207184, "global_step": 1077, "epoch": 9, "lr": 9.998360244028269e-05} +{"train_loss": 0.05326194688677788, "global_step": 1078, "epoch": 9, "lr": 9.998354565535449e-05} +{"train_loss": 0.06676840037107468, "global_step": 1079, "epoch": 9, "lr": 9.998348877228894e-05} +{"train_loss": 0.046263452619314194, "global_step": 1080, "epoch": 9, "lr": 9.998343179108613e-05} +{"train_loss": 0.05959780141711235, "global_step": 1081, "epoch": 9, "lr": 9.998337471174622e-05} +{"train_loss": 0.05651170387864113, "global_step": 1082, "epoch": 9, "lr": 9.998331753426929e-05} +{"train_loss": 0.06688952445983887, "global_step": 1083, "epoch": 9, "lr": 9.998326025865543e-05} +{"train_loss": 0.054447900503873825, "global_step": 1084, "epoch": 9, "lr": 9.99832028849048e-05} +{"train_loss": 0.05266043171286583, "global_step": 1085, "epoch": 9, "lr": 9.998314541301749e-05} +{"train_loss": 0.06498141586780548, "global_step": 1086, "epoch": 9, "lr": 9.998308784299362e-05} +{"train_loss": 0.06787316501140594, "global_step": 1087, "epoch": 9, "lr": 9.998303017483328e-05} +{"train_loss": 0.07077793776988983, "global_step": 1088, "epoch": 9, "lr": 9.99829724085366e-05} +{"train_loss": 0.047958776354789734, "global_step": 1089, "epoch": 9, "lr": 9.998291454410372e-05} +{"train_loss": 0.059230029582977295, "global_step": 1090, "epoch": 9, "lr": 9.99828565815347e-05} +{"train_loss": 0.05539241433143616, "global_step": 1091, "epoch": 9, "lr": 9.998279852082969e-05} +{"train_loss": 0.05064268037676811, "global_step": 1092, "epoch": 9, "lr": 9.998274036198879e-05} +{"train_loss": 0.04717807471752167, "global_step": 1093, "epoch": 9, "lr": 9.998268210501213e-05} +{"train_loss": 0.0519522987306118, "global_step": 1094, "epoch": 9, "lr": 9.99826237498998e-05} +{"train_loss": 0.04321955144405365, "global_step": 1095, "epoch": 9, "lr": 9.998256529665194e-05} +{"train_loss": 0.04947252199053764, "global_step": 1096, "epoch": 9, "lr": 9.998250674526865e-05} +{"train_loss": 0.0461883619427681, "global_step": 1097, "epoch": 9, "lr": 9.998244809575005e-05} +{"train_loss": 0.0557977668941021, "global_step": 1098, "epoch": 9, "lr": 9.998238934809625e-05} +{"train_loss": 0.0684855580329895, "global_step": 1099, "epoch": 9, "lr": 9.998233050230736e-05} +{"train_loss": 0.050914984196424484, "global_step": 1100, "epoch": 9, "lr": 9.99822715583835e-05} +{"train_loss": 0.04459948465228081, "global_step": 1101, "epoch": 9, "lr": 9.998221251632483e-05} +{"train_loss": 0.04797293245792389, "global_step": 1102, "epoch": 9, "lr": 9.99821533761314e-05} +{"train_loss": 0.04898867756128311, "global_step": 1103, "epoch": 9, "lr": 9.998209413780333e-05} +{"train_loss": 0.05636144056916237, "global_step": 1104, "epoch": 9, "lr": 9.998203480134078e-05} +{"train_loss": 0.06181351840496063, "global_step": 1105, "epoch": 9, "lr": 9.998197536674384e-05} +{"train_loss": 0.05631367117166519, "global_step": 1106, "epoch": 9, "lr": 9.998191583401263e-05} +{"train_loss": 0.04828573763370514, "global_step": 1107, "epoch": 9, "lr": 9.998185620314728e-05} +{"train_loss": 0.05340810492634773, "global_step": 1108, "epoch": 9, "lr": 9.998179647414788e-05} +{"train_loss": 0.05921993404626846, "global_step": 1109, "epoch": 9, "lr": 9.998173664701456e-05} +{"train_loss": 0.056754082441329956, "global_step": 1110, "epoch": 9, "lr": 9.998167672174745e-05} +{"train_loss": 0.0460866279900074, "global_step": 1111, "epoch": 9, "lr": 9.998161669834666e-05} +{"train_loss": 0.05677538365125656, "global_step": 1112, "epoch": 9, "lr": 9.99815565768123e-05} +{"train_loss": 0.05530445650219917, "global_step": 1113, "epoch": 9, "lr": 9.99814963571445e-05} +{"train_loss": 0.05719053000211716, "global_step": 1114, "epoch": 9, "lr": 9.998143603934336e-05} +{"train_loss": 0.04651426896452904, "global_step": 1115, "epoch": 9, "lr": 9.998137562340901e-05} +{"train_loss": 0.049586616456508636, "global_step": 1116, "epoch": 9, "lr": 9.998131510934159e-05} +{"train_loss": 0.05724819749593735, "global_step": 1117, "epoch": 9, "lr": 9.998125449714118e-05} +{"train_loss": 0.0487767718732357, "global_step": 1118, "epoch": 9, "lr": 9.998119378680792e-05} +{"train_loss": 0.051331739872694016, "global_step": 1119, "epoch": 9, "lr": 9.998113297834192e-05} +{"train_loss": 0.05388004332780838, "global_step": 1120, "epoch": 9, "lr": 9.998107207174331e-05} +{"train_loss": 0.05760626494884491, "global_step": 1121, "epoch": 9, "lr": 9.99810110670122e-05} +{"train_loss": 0.04395173490047455, "global_step": 1122, "epoch": 9, "lr": 9.998094996414871e-05} +{"train_loss": 0.06278383731842041, "global_step": 1123, "epoch": 9, "lr": 9.998088876315299e-05} +{"train_loss": 0.04347819462418556, "global_step": 1124, "epoch": 9, "lr": 9.99808274640251e-05} +{"train_loss": 0.053461167961359024, "global_step": 1125, "epoch": 9, "lr": 9.998076606676523e-05} +{"train_loss": 0.05938850715756416, "global_step": 1126, "epoch": 9, "lr": 9.998070457137344e-05} +{"train_loss": 0.05212406814098358, "global_step": 1127, "epoch": 9, "lr": 9.998064297784988e-05} +{"train_loss": 0.04799909517168999, "global_step": 1128, "epoch": 9, "lr": 9.998058128619468e-05} +{"train_loss": 0.050658825784921646, "global_step": 1129, "epoch": 9, "lr": 9.998051949640794e-05} +{"train_loss": 0.052343521267175674, "global_step": 1130, "epoch": 9, "lr": 9.998045760848979e-05} +{"train_loss": 0.04779258742928505, "global_step": 1131, "epoch": 9, "lr": 9.998039562244035e-05} +{"train_loss": 0.04507090523838997, "global_step": 1132, "epoch": 9, "lr": 9.998033353825974e-05} +{"train_loss": 0.044108882546424866, "global_step": 1133, "epoch": 9, "lr": 9.998027135594809e-05} +{"train_loss": 0.05701158195734024, "global_step": 1134, "epoch": 9, "lr": 9.998020907550551e-05} +{"train_loss": 0.0537484809756279, "global_step": 1135, "epoch": 9, "lr": 9.998014669693214e-05} +{"train_loss": 0.05883384123444557, "global_step": 1136, "epoch": 9, "lr": 9.998008422022808e-05} +{"train_loss": 0.03914652764797211, "global_step": 1137, "epoch": 9, "lr": 9.998002164539346e-05} +{"train_loss": 0.05617286264896393, "global_step": 1138, "epoch": 9, "lr": 9.997995897242842e-05} +{"train_loss": 0.04572250321507454, "global_step": 1139, "epoch": 9, "lr": 9.997989620133307e-05} +{"train_loss": 0.05715785175561905, "global_step": 1140, "epoch": 9, "lr": 9.997983333210753e-05} +{"train_loss": 0.060338638722896576, "global_step": 1141, "epoch": 9, "lr": 9.997977036475193e-05} +{"train_loss": 0.03827657923102379, "global_step": 1142, "epoch": 9, "lr": 9.997970729926638e-05} +{"train_loss": 0.04313367232680321, "global_step": 1143, "epoch": 9, "lr": 9.997964413565103e-05} +{"train_loss": 0.0451284684240818, "global_step": 1144, "epoch": 9, "lr": 9.997958087390598e-05} +{"train_loss": 0.05257334187626839, "global_step": 1145, "epoch": 9, "lr": 9.997951751403136e-05} +{"train_loss": 0.05427379533648491, "global_step": 1146, "epoch": 9, "lr": 9.99794540560273e-05} +{"train_loss": 0.040392689406871796, "global_step": 1147, "epoch": 9, "lr": 9.997939049989392e-05} +{"train_loss": 0.05568758398294449, "global_step": 1148, "epoch": 9, "lr": 9.997932684563134e-05} +{"train_loss": 0.05158429592847824, "global_step": 1149, "epoch": 9, "lr": 9.997926309323971e-05} +{"train_loss": 0.03542913869023323, "global_step": 1150, "epoch": 9, "lr": 9.997919924271912e-05} +{"train_loss": 0.036503732204437256, "global_step": 1151, "epoch": 9, "lr": 9.997913529406972e-05} +{"train_loss": 0.053368136286735535, "global_step": 1152, "epoch": 9, "lr": 9.997907124729162e-05} +{"train_loss": 0.0451473668217659, "global_step": 1153, "epoch": 9, "lr": 9.997900710238496e-05} +{"train_loss": 0.044298600405454636, "global_step": 1154, "epoch": 9, "lr": 9.997894285934985e-05} +{"train_loss": 0.04747952148318291, "global_step": 1155, "epoch": 9, "lr": 9.997887851818643e-05} +{"train_loss": 0.03525586426258087, "global_step": 1156, "epoch": 9, "lr": 9.997881407889483e-05} +{"train_loss": 0.04620516672730446, "global_step": 1157, "epoch": 9, "lr": 9.997874954147515e-05} +{"train_loss": 0.04700041189789772, "global_step": 1158, "epoch": 9, "lr": 9.997868490592754e-05} +{"train_loss": 0.04927217215299606, "global_step": 1159, "epoch": 9, "lr": 9.997862017225213e-05} +{"train_loss": 0.051292695105075836, "global_step": 1160, "epoch": 9, "lr": 9.997855534044904e-05} +{"train_loss": 0.04344146326184273, "global_step": 1161, "epoch": 9, "lr": 9.997849041051838e-05} +{"train_loss": 0.04729873314499855, "global_step": 1162, "epoch": 9, "lr": 9.997842538246032e-05} +{"train_loss": 0.04541383311152458, "global_step": 1163, "epoch": 9, "lr": 9.997836025627494e-05} +{"train_loss": 0.046438202261924744, "global_step": 1164, "epoch": 9, "lr": 9.99782950319624e-05} +{"train_loss": 0.049206558614969254, "global_step": 1165, "epoch": 9, "lr": 9.997822970952282e-05} +{"train_loss": 0.045438267290592194, "global_step": 1166, "epoch": 9, "lr": 9.997816428895631e-05} +{"train_loss": 0.042995385825634, "global_step": 1167, "epoch": 9, "lr": 9.997809877026303e-05} +{"train_loss": 0.044925641268491745, "global_step": 1168, "epoch": 9, "lr": 9.997803315344307e-05} +{"train_loss": 0.046324390918016434, "global_step": 1169, "epoch": 9, "lr": 9.99779674384966e-05} +{"train_loss": 0.043153781443834305, "global_step": 1170, "epoch": 9, "lr": 9.997790162542373e-05} +{"train_loss": 0.04177149757742882, "global_step": 1171, "epoch": 9, "lr": 9.997783571422458e-05} +{"train_loss": 0.04354969412088394, "global_step": 1172, "epoch": 9, "lr": 9.99777697048993e-05} +{"train_loss": 0.043046142905950546, "global_step": 1173, "epoch": 9, "lr": 9.9977703597448e-05} +{"train_loss": 0.052064672112464905, "global_step": 1174, "epoch": 9, "lr": 9.997763739187083e-05} +{"train_loss": 0.0542379729449749, "global_step": 1175, "epoch": 9, "lr": 9.99775710881679e-05} +{"train_loss": 0.04618609696626663, "global_step": 1176, "epoch": 9, "lr": 9.997750468633933e-05} +{"train_loss": 0.038023438304662704, "global_step": 1177, "epoch": 9, "lr": 9.99774381863853e-05} +{"train_loss": 0.0442170687019825, "global_step": 1178, "epoch": 9, "lr": 9.99773715883059e-05} +{"train_loss": 0.04687308892607689, "global_step": 1179, "epoch": 9, "lr": 9.997730489210125e-05} +{"train_loss": 0.044926587492227554, "global_step": 1180, "epoch": 9, "lr": 9.997723809777152e-05} +{"train_loss": 0.04657816141843796, "global_step": 1181, "epoch": 9, "lr": 9.997717120531682e-05} +{"train_loss": 0.046645388007164, "global_step": 1182, "epoch": 9, "lr": 9.997710421473729e-05} +{"train_loss": 0.05053723603487015, "global_step": 1183, "epoch": 9, "lr": 9.997703712603304e-05} +{"train_loss": 0.04438033327460289, "global_step": 1184, "epoch": 9, "lr": 9.997696993920422e-05} +{"train_loss": 0.0624910406768322, "global_step": 1185, "epoch": 9, "lr": 9.997690265425097e-05} +{"train_loss": 0.04366930574178696, "global_step": 1186, "epoch": 9, "lr": 9.997683527117341e-05} +{"train_loss": 0.04762963205575943, "global_step": 1187, "epoch": 9, "lr": 9.997676778997168e-05} +{"train_loss": 0.046827927231788635, "global_step": 1188, "epoch": 9, "lr": 9.997670021064587e-05} +{"train_loss": 0.050624361809562236, "global_step": 1189, "epoch": 9, "lr": 9.997663253319618e-05, "val_loss": 0.064478799700737} +{"train_loss": 0.05095212906599045, "global_step": 1190, "epoch": 10, "lr": 9.99765647576227e-05} +{"train_loss": 0.050003692507743835, "global_step": 1191, "epoch": 10, "lr": 9.997649688392559e-05} +{"train_loss": 0.05032726004719734, "global_step": 1192, "epoch": 10, "lr": 9.997642891210495e-05} +{"train_loss": 0.04258207231760025, "global_step": 1193, "epoch": 10, "lr": 9.997636084216093e-05} +{"train_loss": 0.04396768659353256, "global_step": 1194, "epoch": 10, "lr": 9.997629267409368e-05} +{"train_loss": 0.036681756377220154, "global_step": 1195, "epoch": 10, "lr": 9.99762244079033e-05} +{"train_loss": 0.037320174276828766, "global_step": 1196, "epoch": 10, "lr": 9.997615604358995e-05} +{"train_loss": 0.048002805560827255, "global_step": 1197, "epoch": 10, "lr": 9.997608758115375e-05} +{"train_loss": 0.03875618800520897, "global_step": 1198, "epoch": 10, "lr": 9.997601902059485e-05} +{"train_loss": 0.04134228453040123, "global_step": 1199, "epoch": 10, "lr": 9.997595036191338e-05} +{"train_loss": 0.04962621629238129, "global_step": 1200, "epoch": 10, "lr": 9.997588160510946e-05} +{"train_loss": 0.046181801706552505, "global_step": 1201, "epoch": 10, "lr": 9.997581275018325e-05} +{"train_loss": 0.04943232983350754, "global_step": 1202, "epoch": 10, "lr": 9.997574379713486e-05} +{"train_loss": 0.04336806759238243, "global_step": 1203, "epoch": 10, "lr": 9.997567474596444e-05} +{"train_loss": 0.05072846636176109, "global_step": 1204, "epoch": 10, "lr": 9.997560559667211e-05} +{"train_loss": 0.044808365404605865, "global_step": 1205, "epoch": 10, "lr": 9.997553634925805e-05} +{"train_loss": 0.03505841642618179, "global_step": 1206, "epoch": 10, "lr": 9.997546700372233e-05} +{"train_loss": 0.054072845727205276, "global_step": 1207, "epoch": 10, "lr": 9.997539756006513e-05} +{"train_loss": 0.041146330535411835, "global_step": 1208, "epoch": 10, "lr": 9.997532801828658e-05} +{"train_loss": 0.05351065471768379, "global_step": 1209, "epoch": 10, "lr": 9.997525837838682e-05} +{"train_loss": 0.04284569248557091, "global_step": 1210, "epoch": 10, "lr": 9.997518864036597e-05} +{"train_loss": 0.055349186062812805, "global_step": 1211, "epoch": 10, "lr": 9.997511880422417e-05} +{"train_loss": 0.038965582847595215, "global_step": 1212, "epoch": 10, "lr": 9.997504886996156e-05} +{"train_loss": 0.047650296241045, "global_step": 1213, "epoch": 10, "lr": 9.99749788375783e-05} +{"train_loss": 0.04341760650277138, "global_step": 1214, "epoch": 10, "lr": 9.997490870707449e-05} +{"train_loss": 0.039946626871824265, "global_step": 1215, "epoch": 10, "lr": 9.997483847845029e-05} +{"train_loss": 0.04382120445370674, "global_step": 1216, "epoch": 10, "lr": 9.997476815170583e-05} +{"train_loss": 0.04548047482967377, "global_step": 1217, "epoch": 10, "lr": 9.997469772684127e-05} +{"train_loss": 0.0523415133357048, "global_step": 1218, "epoch": 10, "lr": 9.997462720385671e-05} +{"train_loss": 0.04514261707663536, "global_step": 1219, "epoch": 10, "lr": 9.997455658275231e-05} +{"train_loss": 0.049088992178440094, "global_step": 1220, "epoch": 10, "lr": 9.997448586352822e-05} +{"train_loss": 0.04815773665904999, "global_step": 1221, "epoch": 10, "lr": 9.997441504618457e-05} +{"train_loss": 0.04267752543091774, "global_step": 1222, "epoch": 10, "lr": 9.99743441307215e-05} +{"train_loss": 0.044162821024656296, "global_step": 1223, "epoch": 10, "lr": 9.997427311713912e-05} +{"train_loss": 0.04300882667303085, "global_step": 1224, "epoch": 10, "lr": 9.99742020054376e-05} +{"train_loss": 0.04171077907085419, "global_step": 1225, "epoch": 10, "lr": 9.997413079561707e-05} +{"train_loss": 0.05310382321476936, "global_step": 1226, "epoch": 10, "lr": 9.997405948767768e-05} +{"train_loss": 0.0446859747171402, "global_step": 1227, "epoch": 10, "lr": 9.997398808161956e-05} +{"train_loss": 0.04441758617758751, "global_step": 1228, "epoch": 10, "lr": 9.997391657744286e-05} +{"train_loss": 0.04481677711009979, "global_step": 1229, "epoch": 10, "lr": 9.99738449751477e-05} +{"train_loss": 0.03755473718047142, "global_step": 1230, "epoch": 10, "lr": 9.997377327473426e-05} +{"train_loss": 0.050759200006723404, "global_step": 1231, "epoch": 10, "lr": 9.997370147620263e-05} +{"train_loss": 0.046132463961839676, "global_step": 1232, "epoch": 10, "lr": 9.997362957955299e-05} +{"train_loss": 0.04130014404654503, "global_step": 1233, "epoch": 10, "lr": 9.997355758478546e-05} +{"train_loss": 0.04113037884235382, "global_step": 1234, "epoch": 10, "lr": 9.997348549190018e-05} +{"train_loss": 0.05058909207582474, "global_step": 1235, "epoch": 10, "lr": 9.997341330089732e-05} +{"train_loss": 0.0476195365190506, "global_step": 1236, "epoch": 10, "lr": 9.997334101177699e-05} +{"train_loss": 0.054930679500103, "global_step": 1237, "epoch": 10, "lr": 9.997326862453935e-05} +{"train_loss": 0.04892129451036453, "global_step": 1238, "epoch": 10, "lr": 9.997319613918452e-05} +{"train_loss": 0.03847884386777878, "global_step": 1239, "epoch": 10, "lr": 9.997312355571267e-05} +{"train_loss": 0.035852715373039246, "global_step": 1240, "epoch": 10, "lr": 9.997305087412394e-05} +{"train_loss": 0.04821210727095604, "global_step": 1241, "epoch": 10, "lr": 9.997297809441846e-05} +{"train_loss": 0.05597350001335144, "global_step": 1242, "epoch": 10, "lr": 9.997290521659637e-05} +{"train_loss": 0.04271063953638077, "global_step": 1243, "epoch": 10, "lr": 9.997283224065782e-05} +{"train_loss": 0.05163703113794327, "global_step": 1244, "epoch": 10, "lr": 9.997275916660295e-05} +{"train_loss": 0.05105143040418625, "global_step": 1245, "epoch": 10, "lr": 9.99726859944319e-05} +{"train_loss": 0.05644361302256584, "global_step": 1246, "epoch": 10, "lr": 9.997261272414484e-05} +{"train_loss": 0.04501740261912346, "global_step": 1247, "epoch": 10, "lr": 9.997253935574188e-05} +{"train_loss": 0.042344316840171814, "global_step": 1248, "epoch": 10, "lr": 9.997246588922318e-05} +{"train_loss": 0.04770653694868088, "global_step": 1249, "epoch": 10, "lr": 9.997239232458888e-05} +{"train_loss": 0.043152857571840286, "global_step": 1250, "epoch": 10, "lr": 9.997231866183914e-05} +{"train_loss": 0.03841414675116539, "global_step": 1251, "epoch": 10, "lr": 9.997224490097408e-05} +{"train_loss": 0.039708904922008514, "global_step": 1252, "epoch": 10, "lr": 9.997217104199385e-05} +{"train_loss": 0.042321786284446716, "global_step": 1253, "epoch": 10, "lr": 9.99720970848986e-05} +{"train_loss": 0.041015464812517166, "global_step": 1254, "epoch": 10, "lr": 9.997202302968849e-05} +{"train_loss": 0.0379454679787159, "global_step": 1255, "epoch": 10, "lr": 9.997194887636365e-05} +{"train_loss": 0.048189956694841385, "global_step": 1256, "epoch": 10, "lr": 9.997187462492421e-05} +{"train_loss": 0.043747615069150925, "global_step": 1257, "epoch": 10, "lr": 9.997180027537035e-05} +{"train_loss": 0.03678526356816292, "global_step": 1258, "epoch": 10, "lr": 9.99717258277022e-05} +{"train_loss": 0.04588242992758751, "global_step": 1259, "epoch": 10, "lr": 9.99716512819199e-05} +{"train_loss": 0.03888508304953575, "global_step": 1260, "epoch": 10, "lr": 9.99715766380236e-05} +{"train_loss": 0.05387338995933533, "global_step": 1261, "epoch": 10, "lr": 9.997150189601345e-05} +{"train_loss": 0.043093834072351456, "global_step": 1262, "epoch": 10, "lr": 9.997142705588958e-05} +{"train_loss": 0.04100402817130089, "global_step": 1263, "epoch": 10, "lr": 9.997135211765216e-05} +{"train_loss": 0.046826981008052826, "global_step": 1264, "epoch": 10, "lr": 9.997127708130134e-05} +{"train_loss": 0.05217259004712105, "global_step": 1265, "epoch": 10, "lr": 9.997120194683725e-05} +{"train_loss": 0.037241172045469284, "global_step": 1266, "epoch": 10, "lr": 9.997112671426004e-05} +{"train_loss": 0.0343368798494339, "global_step": 1267, "epoch": 10, "lr": 9.997105138356987e-05} +{"train_loss": 0.03462721034884453, "global_step": 1268, "epoch": 10, "lr": 9.997097595476688e-05} +{"train_loss": 0.04456447437405586, "global_step": 1269, "epoch": 10, "lr": 9.99709004278512e-05} +{"train_loss": 0.06034879386425018, "global_step": 1270, "epoch": 10, "lr": 9.9970824802823e-05} +{"train_loss": 0.050405628979206085, "global_step": 1271, "epoch": 10, "lr": 9.997074907968244e-05} +{"train_loss": 0.05168617516756058, "global_step": 1272, "epoch": 10, "lr": 9.997067325842963e-05} +{"train_loss": 0.043684739619493484, "global_step": 1273, "epoch": 10, "lr": 9.997059733906476e-05} +{"train_loss": 0.042943377047777176, "global_step": 1274, "epoch": 10, "lr": 9.997052132158796e-05} +{"train_loss": 0.04548976570367813, "global_step": 1275, "epoch": 10, "lr": 9.997044520599938e-05} +{"train_loss": 0.051088497042655945, "global_step": 1276, "epoch": 10, "lr": 9.997036899229917e-05} +{"train_loss": 0.04226274415850639, "global_step": 1277, "epoch": 10, "lr": 9.997029268048746e-05} +{"train_loss": 0.03838009387254715, "global_step": 1278, "epoch": 10, "lr": 9.997021627056444e-05} +{"train_loss": 0.05242897942662239, "global_step": 1279, "epoch": 10, "lr": 9.997013976253022e-05} +{"train_loss": 0.05166222155094147, "global_step": 1280, "epoch": 10, "lr": 9.9970063156385e-05} +{"train_loss": 0.03964889049530029, "global_step": 1281, "epoch": 10, "lr": 9.996998645212888e-05} +{"train_loss": 0.05114065483212471, "global_step": 1282, "epoch": 10, "lr": 9.996990964976203e-05} +{"train_loss": 0.04199143126606941, "global_step": 1283, "epoch": 10, "lr": 9.99698327492846e-05} +{"train_loss": 0.04896528273820877, "global_step": 1284, "epoch": 10, "lr": 9.996975575069674e-05} +{"train_loss": 0.05814571678638458, "global_step": 1285, "epoch": 10, "lr": 9.99696786539986e-05} +{"train_loss": 0.053778938949108124, "global_step": 1286, "epoch": 10, "lr": 9.996960145919035e-05} +{"train_loss": 0.045306574553251266, "global_step": 1287, "epoch": 10, "lr": 9.99695241662721e-05} +{"train_loss": 0.04779694229364395, "global_step": 1288, "epoch": 10, "lr": 9.996944677524404e-05} +{"train_loss": 0.045404575765132904, "global_step": 1289, "epoch": 10, "lr": 9.996936928610632e-05} +{"train_loss": 0.03846196085214615, "global_step": 1290, "epoch": 10, "lr": 9.996929169885908e-05} +{"train_loss": 0.03594430908560753, "global_step": 1291, "epoch": 10, "lr": 9.996921401350248e-05} +{"train_loss": 0.03268353268504143, "global_step": 1292, "epoch": 10, "lr": 9.996913623003666e-05} +{"train_loss": 0.04909440502524376, "global_step": 1293, "epoch": 10, "lr": 9.996905834846177e-05} +{"train_loss": 0.04263884946703911, "global_step": 1294, "epoch": 10, "lr": 9.996898036877798e-05} +{"train_loss": 0.052860017865896225, "global_step": 1295, "epoch": 10, "lr": 9.996890229098543e-05} +{"train_loss": 0.04111097753047943, "global_step": 1296, "epoch": 10, "lr": 9.996882411508428e-05} +{"train_loss": 0.04996417462825775, "global_step": 1297, "epoch": 10, "lr": 9.996874584107468e-05} +{"train_loss": 0.04055370017886162, "global_step": 1298, "epoch": 10, "lr": 9.996866746895679e-05} +{"train_loss": 0.038580045104026794, "global_step": 1299, "epoch": 10, "lr": 9.996858899873076e-05} +{"train_loss": 0.04332203045487404, "global_step": 1300, "epoch": 10, "lr": 9.996851043039675e-05} +{"train_loss": 0.04485120624303818, "global_step": 1301, "epoch": 10, "lr": 9.99684317639549e-05} +{"train_loss": 0.04495645686984062, "global_step": 1302, "epoch": 10, "lr": 9.996835299940538e-05} +{"train_loss": 0.04450831562280655, "global_step": 1303, "epoch": 10, "lr": 9.996827413674832e-05} +{"train_loss": 0.041231002658605576, "global_step": 1304, "epoch": 10, "lr": 9.996819517598391e-05} +{"train_loss": 0.039558131247758865, "global_step": 1305, "epoch": 10, "lr": 9.996811611711229e-05} +{"train_loss": 0.03740007430315018, "global_step": 1306, "epoch": 10, "lr": 9.996803696013359e-05} +{"train_loss": 0.04892598092556, "global_step": 1307, "epoch": 10, "lr": 9.996795770504801e-05} +{"train_loss": 0.04512454710212074, "global_step": 1308, "epoch": 10, "lr": 9.996787835185569e-05, "val_loss": 0.04849512130022049, "train_action_mse_error": 0.010040667839348316} +{"train_loss": 0.04096312075853348, "global_step": 1309, "epoch": 11, "lr": 9.996779890055675e-05} +{"train_loss": 0.04608335345983505, "global_step": 1310, "epoch": 11, "lr": 9.996771935115139e-05} +{"train_loss": 0.04061859846115112, "global_step": 1311, "epoch": 11, "lr": 9.996763970363975e-05} +{"train_loss": 0.03567659482359886, "global_step": 1312, "epoch": 11, "lr": 9.996755995802198e-05} +{"train_loss": 0.04609527811408043, "global_step": 1313, "epoch": 11, "lr": 9.996748011429827e-05} +{"train_loss": 0.04738686978816986, "global_step": 1314, "epoch": 11, "lr": 9.996740017246873e-05} +{"train_loss": 0.04975533112883568, "global_step": 1315, "epoch": 11, "lr": 9.996732013253353e-05} +{"train_loss": 0.052691616117954254, "global_step": 1316, "epoch": 11, "lr": 9.996723999449284e-05} +{"train_loss": 0.042723800987005234, "global_step": 1317, "epoch": 11, "lr": 9.996715975834682e-05} +{"train_loss": 0.04428683966398239, "global_step": 1318, "epoch": 11, "lr": 9.996707942409562e-05} +{"train_loss": 0.045779433101415634, "global_step": 1319, "epoch": 11, "lr": 9.99669989917394e-05} +{"train_loss": 0.05330168828368187, "global_step": 1320, "epoch": 11, "lr": 9.996691846127833e-05} +{"train_loss": 0.041172027587890625, "global_step": 1321, "epoch": 11, "lr": 9.996683783271252e-05} +{"train_loss": 0.060985155403614044, "global_step": 1322, "epoch": 11, "lr": 9.996675710604219e-05} +{"train_loss": 0.04001374542713165, "global_step": 1323, "epoch": 11, "lr": 9.996667628126746e-05} +{"train_loss": 0.03862576186656952, "global_step": 1324, "epoch": 11, "lr": 9.99665953583885e-05} +{"train_loss": 0.04408026114106178, "global_step": 1325, "epoch": 11, "lr": 9.996651433740545e-05} +{"train_loss": 0.05432146042585373, "global_step": 1326, "epoch": 11, "lr": 9.996643321831852e-05} +{"train_loss": 0.04035614803433418, "global_step": 1327, "epoch": 11, "lr": 9.99663520011278e-05} +{"train_loss": 0.04682471603155136, "global_step": 1328, "epoch": 11, "lr": 9.996627068583351e-05} +{"train_loss": 0.05063197761774063, "global_step": 1329, "epoch": 11, "lr": 9.996618927243579e-05} +{"train_loss": 0.04346192255616188, "global_step": 1330, "epoch": 11, "lr": 9.996610776093478e-05} +{"train_loss": 0.04782122001051903, "global_step": 1331, "epoch": 11, "lr": 9.996602615133066e-05} +{"train_loss": 0.05611664429306984, "global_step": 1332, "epoch": 11, "lr": 9.996594444362359e-05} +{"train_loss": 0.05173246189951897, "global_step": 1333, "epoch": 11, "lr": 9.996586263781373e-05} +{"train_loss": 0.036744698882102966, "global_step": 1334, "epoch": 11, "lr": 9.996578073390124e-05} +{"train_loss": 0.04946206510066986, "global_step": 1335, "epoch": 11, "lr": 9.996569873188626e-05} +{"train_loss": 0.03803415223956108, "global_step": 1336, "epoch": 11, "lr": 9.996561663176897e-05} +{"train_loss": 0.050055403262376785, "global_step": 1337, "epoch": 11, "lr": 9.996553443354955e-05} +{"train_loss": 0.0403502956032753, "global_step": 1338, "epoch": 11, "lr": 9.996545213722813e-05} +{"train_loss": 0.04909614846110344, "global_step": 1339, "epoch": 11, "lr": 9.996536974280488e-05} +{"train_loss": 0.03626863285899162, "global_step": 1340, "epoch": 11, "lr": 9.996528725027995e-05} +{"train_loss": 0.05436353012919426, "global_step": 1341, "epoch": 11, "lr": 9.996520465965355e-05} +{"train_loss": 0.0418027900159359, "global_step": 1342, "epoch": 11, "lr": 9.996512197092577e-05} +{"train_loss": 0.04946984723210335, "global_step": 1343, "epoch": 11, "lr": 9.996503918409685e-05} +{"train_loss": 0.03708682209253311, "global_step": 1344, "epoch": 11, "lr": 9.99649562991669e-05} +{"train_loss": 0.04801986366510391, "global_step": 1345, "epoch": 11, "lr": 9.996487331613609e-05} +{"train_loss": 0.04319334402680397, "global_step": 1346, "epoch": 11, "lr": 9.996479023500458e-05} +{"train_loss": 0.03688197582960129, "global_step": 1347, "epoch": 11, "lr": 9.996470705577257e-05} +{"train_loss": 0.055857449769973755, "global_step": 1348, "epoch": 11, "lr": 9.996462377844016e-05} +{"train_loss": 0.037023384124040604, "global_step": 1349, "epoch": 11, "lr": 9.996454040300757e-05} +{"train_loss": 0.036918189376592636, "global_step": 1350, "epoch": 11, "lr": 9.996445692947495e-05} +{"train_loss": 0.042170450091362, "global_step": 1351, "epoch": 11, "lr": 9.996437335784244e-05} +{"train_loss": 0.042733922600746155, "global_step": 1352, "epoch": 11, "lr": 9.996428968811022e-05} +{"train_loss": 0.04134063050150871, "global_step": 1353, "epoch": 11, "lr": 9.996420592027848e-05} +{"train_loss": 0.05585767701268196, "global_step": 1354, "epoch": 11, "lr": 9.996412205434734e-05} +{"train_loss": 0.0402965322136879, "global_step": 1355, "epoch": 11, "lr": 9.996403809031699e-05} +{"train_loss": 0.04169789329171181, "global_step": 1356, "epoch": 11, "lr": 9.996395402818759e-05} +{"train_loss": 0.04411723092198372, "global_step": 1357, "epoch": 11, "lr": 9.99638698679593e-05} +{"train_loss": 0.04818500950932503, "global_step": 1358, "epoch": 11, "lr": 9.996378560963228e-05} +{"train_loss": 0.04360654205083847, "global_step": 1359, "epoch": 11, "lr": 9.996370125320671e-05} +{"train_loss": 0.041889265179634094, "global_step": 1360, "epoch": 11, "lr": 9.996361679868276e-05} +{"train_loss": 0.039088379591703415, "global_step": 1361, "epoch": 11, "lr": 9.996353224606058e-05} +{"train_loss": 0.034228771924972534, "global_step": 1362, "epoch": 11, "lr": 9.996344759534035e-05} +{"train_loss": 0.044171180576086044, "global_step": 1363, "epoch": 11, "lr": 9.996336284652222e-05} +{"train_loss": 0.036481957882642746, "global_step": 1364, "epoch": 11, "lr": 9.996327799960636e-05} +{"train_loss": 0.050947390496730804, "global_step": 1365, "epoch": 11, "lr": 9.996319305459296e-05} +{"train_loss": 0.04227090999484062, "global_step": 1366, "epoch": 11, "lr": 9.996310801148216e-05} +{"train_loss": 0.034005291759967804, "global_step": 1367, "epoch": 11, "lr": 9.996302287027412e-05} +{"train_loss": 0.03669339418411255, "global_step": 1368, "epoch": 11, "lr": 9.996293763096904e-05} +{"train_loss": 0.045240361243486404, "global_step": 1369, "epoch": 11, "lr": 9.996285229356705e-05} +{"train_loss": 0.03828089311718941, "global_step": 1370, "epoch": 11, "lr": 9.996276685806835e-05} +{"train_loss": 0.03996670991182327, "global_step": 1371, "epoch": 11, "lr": 9.99626813244731e-05} +{"train_loss": 0.0469302199780941, "global_step": 1372, "epoch": 11, "lr": 9.996259569278147e-05} +{"train_loss": 0.04113354906439781, "global_step": 1373, "epoch": 11, "lr": 9.996250996299362e-05} +{"train_loss": 0.03338978439569473, "global_step": 1374, "epoch": 11, "lr": 9.99624241351097e-05} +{"train_loss": 0.03712673857808113, "global_step": 1375, "epoch": 11, "lr": 9.996233820912991e-05} +{"train_loss": 0.03542524203658104, "global_step": 1376, "epoch": 11, "lr": 9.996225218505439e-05} +{"train_loss": 0.03297103941440582, "global_step": 1377, "epoch": 11, "lr": 9.996216606288335e-05} +{"train_loss": 0.04126420617103577, "global_step": 1378, "epoch": 11, "lr": 9.996207984261692e-05} +{"train_loss": 0.044665269553661346, "global_step": 1379, "epoch": 11, "lr": 9.996199352425528e-05} +{"train_loss": 0.04056701809167862, "global_step": 1380, "epoch": 11, "lr": 9.996190710779863e-05} +{"train_loss": 0.03437726944684982, "global_step": 1381, "epoch": 11, "lr": 9.996182059324708e-05} +{"train_loss": 0.047338683158159256, "global_step": 1382, "epoch": 11, "lr": 9.996173398060085e-05} +{"train_loss": 0.038569845259189606, "global_step": 1383, "epoch": 11, "lr": 9.996164726986009e-05} +{"train_loss": 0.028671767562627792, "global_step": 1384, "epoch": 11, "lr": 9.996156046102499e-05} +{"train_loss": 0.036114245653152466, "global_step": 1385, "epoch": 11, "lr": 9.996147355409568e-05} +{"train_loss": 0.03334483504295349, "global_step": 1386, "epoch": 11, "lr": 9.996138654907236e-05} +{"train_loss": 0.05462134629487991, "global_step": 1387, "epoch": 11, "lr": 9.996129944595519e-05} +{"train_loss": 0.042115576565265656, "global_step": 1388, "epoch": 11, "lr": 9.996121224474435e-05} +{"train_loss": 0.03124539740383625, "global_step": 1389, "epoch": 11, "lr": 9.996112494544001e-05} +{"train_loss": 0.04732759669423103, "global_step": 1390, "epoch": 11, "lr": 9.996103754804234e-05} +{"train_loss": 0.04256175458431244, "global_step": 1391, "epoch": 11, "lr": 9.996095005255151e-05} +{"train_loss": 0.03385931998491287, "global_step": 1392, "epoch": 11, "lr": 9.99608624589677e-05} +{"train_loss": 0.034310828894376755, "global_step": 1393, "epoch": 11, "lr": 9.996077476729107e-05} +{"train_loss": 0.041949495673179626, "global_step": 1394, "epoch": 11, "lr": 9.996068697752178e-05} +{"train_loss": 0.038420163094997406, "global_step": 1395, "epoch": 11, "lr": 9.996059908966003e-05} +{"train_loss": 0.043356072157621384, "global_step": 1396, "epoch": 11, "lr": 9.996051110370599e-05} +{"train_loss": 0.03339632973074913, "global_step": 1397, "epoch": 11, "lr": 9.99604230196598e-05} +{"train_loss": 0.036025866866111755, "global_step": 1398, "epoch": 11, "lr": 9.996033483752168e-05} +{"train_loss": 0.03661869466304779, "global_step": 1399, "epoch": 11, "lr": 9.996024655729177e-05} +{"train_loss": 0.05038689821958542, "global_step": 1400, "epoch": 11, "lr": 9.996015817897026e-05} +{"train_loss": 0.04726257175207138, "global_step": 1401, "epoch": 11, "lr": 9.996006970255731e-05} +{"train_loss": 0.045844241976737976, "global_step": 1402, "epoch": 11, "lr": 9.99599811280531e-05} +{"train_loss": 0.04046161472797394, "global_step": 1403, "epoch": 11, "lr": 9.99598924554578e-05} +{"train_loss": 0.04570552334189415, "global_step": 1404, "epoch": 11, "lr": 9.99598036847716e-05} +{"train_loss": 0.04903614893555641, "global_step": 1405, "epoch": 11, "lr": 9.995971481599467e-05} +{"train_loss": 0.044630203396081924, "global_step": 1406, "epoch": 11, "lr": 9.995962584912716e-05} +{"train_loss": 0.03665162995457649, "global_step": 1407, "epoch": 11, "lr": 9.995953678416927e-05} +{"train_loss": 0.03502139449119568, "global_step": 1408, "epoch": 11, "lr": 9.995944762112117e-05} +{"train_loss": 0.049910712987184525, "global_step": 1409, "epoch": 11, "lr": 9.995935835998303e-05} +{"train_loss": 0.035015713423490524, "global_step": 1410, "epoch": 11, "lr": 9.995926900075502e-05} +{"train_loss": 0.04088755324482918, "global_step": 1411, "epoch": 11, "lr": 9.995917954343732e-05} +{"train_loss": 0.03567852824926376, "global_step": 1412, "epoch": 11, "lr": 9.995908998803011e-05} +{"train_loss": 0.032947033643722534, "global_step": 1413, "epoch": 11, "lr": 9.995900033453359e-05} +{"train_loss": 0.043397437781095505, "global_step": 1414, "epoch": 11, "lr": 9.995891058294788e-05} +{"train_loss": 0.04617055878043175, "global_step": 1415, "epoch": 11, "lr": 9.99588207332732e-05} +{"train_loss": 0.03451162204146385, "global_step": 1416, "epoch": 11, "lr": 9.99587307855097e-05} +{"train_loss": 0.04265954717993736, "global_step": 1417, "epoch": 11, "lr": 9.995864073965759e-05} +{"train_loss": 0.04126569256186485, "global_step": 1418, "epoch": 11, "lr": 9.9958550595717e-05} +{"train_loss": 0.03447757661342621, "global_step": 1419, "epoch": 11, "lr": 9.995846035368816e-05} +{"train_loss": 0.037671543657779694, "global_step": 1420, "epoch": 11, "lr": 9.99583700135712e-05} +{"train_loss": 0.04047344997525215, "global_step": 1421, "epoch": 11, "lr": 9.995827957536632e-05} +{"train_loss": 0.04366908222436905, "global_step": 1422, "epoch": 11, "lr": 9.99581890390737e-05} +{"train_loss": 0.04020386189222336, "global_step": 1423, "epoch": 11, "lr": 9.995809840469353e-05} +{"train_loss": 0.036619991064071655, "global_step": 1424, "epoch": 11, "lr": 9.995800767222595e-05} +{"train_loss": 0.03773784637451172, "global_step": 1425, "epoch": 11, "lr": 9.995791684167117e-05} +{"train_loss": 0.04353997856378555, "global_step": 1426, "epoch": 11, "lr": 9.995782591302935e-05} +{"train_loss": 0.042212407769901414, "global_step": 1427, "epoch": 11, "lr": 9.995773488630066e-05, "val_loss": 0.06121334433555603} +{"train_loss": 0.03648809716105461, "global_step": 1428, "epoch": 12, "lr": 9.995764376148533e-05} +{"train_loss": 0.04143906384706497, "global_step": 1429, "epoch": 12, "lr": 9.995755253858348e-05} +{"train_loss": 0.036327242851257324, "global_step": 1430, "epoch": 12, "lr": 9.995746121759533e-05} +{"train_loss": 0.03686882555484772, "global_step": 1431, "epoch": 12, "lr": 9.995736979852102e-05} +{"train_loss": 0.03286154568195343, "global_step": 1432, "epoch": 12, "lr": 9.995727828136077e-05} +{"train_loss": 0.04244426265358925, "global_step": 1433, "epoch": 12, "lr": 9.995718666611473e-05} +{"train_loss": 0.02835523709654808, "global_step": 1434, "epoch": 12, "lr": 9.99570949527831e-05} +{"train_loss": 0.043276526033878326, "global_step": 1435, "epoch": 12, "lr": 9.995700314136605e-05} +{"train_loss": 0.03990478068590164, "global_step": 1436, "epoch": 12, "lr": 9.995691123186374e-05} +{"train_loss": 0.034230977296829224, "global_step": 1437, "epoch": 12, "lr": 9.99568192242764e-05} +{"train_loss": 0.038675978779792786, "global_step": 1438, "epoch": 12, "lr": 9.995672711860418e-05} +{"train_loss": 0.033896371722221375, "global_step": 1439, "epoch": 12, "lr": 9.995663491484725e-05} +{"train_loss": 0.040222544223070145, "global_step": 1440, "epoch": 12, "lr": 9.99565426130058e-05} +{"train_loss": 0.04588829725980759, "global_step": 1441, "epoch": 12, "lr": 9.995645021308004e-05} +{"train_loss": 0.03832753375172615, "global_step": 1442, "epoch": 12, "lr": 9.99563577150701e-05} +{"train_loss": 0.03234715387225151, "global_step": 1443, "epoch": 12, "lr": 9.99562651189762e-05} +{"train_loss": 0.04587860032916069, "global_step": 1444, "epoch": 12, "lr": 9.995617242479851e-05} +{"train_loss": 0.035207830369472504, "global_step": 1445, "epoch": 12, "lr": 9.995607963253722e-05} +{"train_loss": 0.03982260078191757, "global_step": 1446, "epoch": 12, "lr": 9.995598674219251e-05} +{"train_loss": 0.030125394463539124, "global_step": 1447, "epoch": 12, "lr": 9.995589375376453e-05} +{"train_loss": 0.03965785726904869, "global_step": 1448, "epoch": 12, "lr": 9.995580066725351e-05} +{"train_loss": 0.0357193797826767, "global_step": 1449, "epoch": 12, "lr": 9.995570748265962e-05} +{"train_loss": 0.030918123200535774, "global_step": 1450, "epoch": 12, "lr": 9.995561419998302e-05} +{"train_loss": 0.04926175996661186, "global_step": 1451, "epoch": 12, "lr": 9.99555208192239e-05} +{"train_loss": 0.03877931833267212, "global_step": 1452, "epoch": 12, "lr": 9.995542734038247e-05} +{"train_loss": 0.04539437219500542, "global_step": 1453, "epoch": 12, "lr": 9.995533376345889e-05} +{"train_loss": 0.031435590237379074, "global_step": 1454, "epoch": 12, "lr": 9.995524008845335e-05} +{"train_loss": 0.050706423819065094, "global_step": 1455, "epoch": 12, "lr": 9.995514631536602e-05} +{"train_loss": 0.044218260794878006, "global_step": 1456, "epoch": 12, "lr": 9.995505244419711e-05} +{"train_loss": 0.042369384318590164, "global_step": 1457, "epoch": 12, "lr": 9.99549584749468e-05} +{"train_loss": 0.03708077594637871, "global_step": 1458, "epoch": 12, "lr": 9.995486440761526e-05} +{"train_loss": 0.0444595105946064, "global_step": 1459, "epoch": 12, "lr": 9.995477024220267e-05} +{"train_loss": 0.04158870130777359, "global_step": 1460, "epoch": 12, "lr": 9.995467597870923e-05} +{"train_loss": 0.03792485222220421, "global_step": 1461, "epoch": 12, "lr": 9.995458161713512e-05} +{"train_loss": 0.029217878356575966, "global_step": 1462, "epoch": 12, "lr": 9.995448715748052e-05} +{"train_loss": 0.034551240503787994, "global_step": 1463, "epoch": 12, "lr": 9.995439259974564e-05} +{"train_loss": 0.044290587306022644, "global_step": 1464, "epoch": 12, "lr": 9.995429794393063e-05} +{"train_loss": 0.03641475364565849, "global_step": 1465, "epoch": 12, "lr": 9.99542031900357e-05} +{"train_loss": 0.04242394119501114, "global_step": 1466, "epoch": 12, "lr": 9.995410833806104e-05} +{"train_loss": 0.03250996023416519, "global_step": 1467, "epoch": 12, "lr": 9.995401338800681e-05} +{"train_loss": 0.038923222571611404, "global_step": 1468, "epoch": 12, "lr": 9.995391833987322e-05} +{"train_loss": 0.05272085964679718, "global_step": 1469, "epoch": 12, "lr": 9.995382319366045e-05} +{"train_loss": 0.046651020646095276, "global_step": 1470, "epoch": 12, "lr": 9.995372794936865e-05} +{"train_loss": 0.03976721689105034, "global_step": 1471, "epoch": 12, "lr": 9.995363260699809e-05} +{"train_loss": 0.04885779321193695, "global_step": 1472, "epoch": 12, "lr": 9.995353716654888e-05} +{"train_loss": 0.03951254114508629, "global_step": 1473, "epoch": 12, "lr": 9.995344162802125e-05} +{"train_loss": 0.038580067455768585, "global_step": 1474, "epoch": 12, "lr": 9.995334599141536e-05} +{"train_loss": 0.04255862906575203, "global_step": 1475, "epoch": 12, "lr": 9.995325025673143e-05} +{"train_loss": 0.03948419541120529, "global_step": 1476, "epoch": 12, "lr": 9.995315442396962e-05} +{"train_loss": 0.040366221219301224, "global_step": 1477, "epoch": 12, "lr": 9.995305849313012e-05} +{"train_loss": 0.03616682440042496, "global_step": 1478, "epoch": 12, "lr": 9.995296246421315e-05} +{"train_loss": 0.046988122165203094, "global_step": 1479, "epoch": 12, "lr": 9.995286633721885e-05} +{"train_loss": 0.04198537766933441, "global_step": 1480, "epoch": 12, "lr": 9.995277011214745e-05} +{"train_loss": 0.04460829868912697, "global_step": 1481, "epoch": 12, "lr": 9.995267378899912e-05} +{"train_loss": 0.04949428513646126, "global_step": 1482, "epoch": 12, "lr": 9.995257736777404e-05} +{"train_loss": 0.03607671335339546, "global_step": 1483, "epoch": 12, "lr": 9.995248084847243e-05} +{"train_loss": 0.03289244696497917, "global_step": 1484, "epoch": 12, "lr": 9.995238423109446e-05} +{"train_loss": 0.04642830044031143, "global_step": 1485, "epoch": 12, "lr": 9.995228751564029e-05} +{"train_loss": 0.03664528578519821, "global_step": 1486, "epoch": 12, "lr": 9.995219070211017e-05} +{"train_loss": 0.03627005219459534, "global_step": 1487, "epoch": 12, "lr": 9.995209379050425e-05} +{"train_loss": 0.0491064228117466, "global_step": 1488, "epoch": 12, "lr": 9.995199678082272e-05} +{"train_loss": 0.04437791556119919, "global_step": 1489, "epoch": 12, "lr": 9.99518996730658e-05} +{"train_loss": 0.03539574146270752, "global_step": 1490, "epoch": 12, "lr": 9.995180246723366e-05} +{"train_loss": 0.03817863017320633, "global_step": 1491, "epoch": 12, "lr": 9.995170516332649e-05} +{"train_loss": 0.03490942716598511, "global_step": 1492, "epoch": 12, "lr": 9.995160776134447e-05} +{"train_loss": 0.03177936002612114, "global_step": 1493, "epoch": 12, "lr": 9.995151026128782e-05} +{"train_loss": 0.04186439886689186, "global_step": 1494, "epoch": 12, "lr": 9.99514126631567e-05} +{"train_loss": 0.03876233845949173, "global_step": 1495, "epoch": 12, "lr": 9.995131496695134e-05} +{"train_loss": 0.03792322799563408, "global_step": 1496, "epoch": 12, "lr": 9.995121717267189e-05} +{"train_loss": 0.0369335301220417, "global_step": 1497, "epoch": 12, "lr": 9.995111928031858e-05} +{"train_loss": 0.04354134947061539, "global_step": 1498, "epoch": 12, "lr": 9.995102128989155e-05} +{"train_loss": 0.031276922672986984, "global_step": 1499, "epoch": 12, "lr": 9.995092320139106e-05} +{"train_loss": 0.038367051631212234, "global_step": 1500, "epoch": 12, "lr": 9.995082501481725e-05} +{"train_loss": 0.046214405447244644, "global_step": 1501, "epoch": 12, "lr": 9.995072673017034e-05} +{"train_loss": 0.03423623368144035, "global_step": 1502, "epoch": 12, "lr": 9.995062834745053e-05} +{"train_loss": 0.035346619784832, "global_step": 1503, "epoch": 12, "lr": 9.995052986665797e-05} +{"train_loss": 0.04045562446117401, "global_step": 1504, "epoch": 12, "lr": 9.995043128779289e-05} +{"train_loss": 0.035854607820510864, "global_step": 1505, "epoch": 12, "lr": 9.995033261085547e-05} +{"train_loss": 0.04120501130819321, "global_step": 1506, "epoch": 12, "lr": 9.995023383584591e-05} +{"train_loss": 0.041254617273807526, "global_step": 1507, "epoch": 12, "lr": 9.995013496276442e-05} +{"train_loss": 0.04119318351149559, "global_step": 1508, "epoch": 12, "lr": 9.995003599161117e-05} +{"train_loss": 0.03853302448987961, "global_step": 1509, "epoch": 12, "lr": 9.994993692238634e-05} +{"train_loss": 0.033307626843452454, "global_step": 1510, "epoch": 12, "lr": 9.994983775509017e-05} +{"train_loss": 0.04201636463403702, "global_step": 1511, "epoch": 12, "lr": 9.994973848972283e-05} +{"train_loss": 0.03307570144534111, "global_step": 1512, "epoch": 12, "lr": 9.99496391262845e-05} +{"train_loss": 0.04850827530026436, "global_step": 1513, "epoch": 12, "lr": 9.994953966477538e-05} +{"train_loss": 0.04062068462371826, "global_step": 1514, "epoch": 12, "lr": 9.99494401051957e-05} +{"train_loss": 0.041466642171144485, "global_step": 1515, "epoch": 12, "lr": 9.994934044754563e-05} +{"train_loss": 0.03705347329378128, "global_step": 1516, "epoch": 12, "lr": 9.994924069182535e-05} +{"train_loss": 0.03727252408862114, "global_step": 1517, "epoch": 12, "lr": 9.994914083803508e-05} +{"train_loss": 0.04068763926625252, "global_step": 1518, "epoch": 12, "lr": 9.994904088617501e-05} +{"train_loss": 0.038516923785209656, "global_step": 1519, "epoch": 12, "lr": 9.994894083624534e-05} +{"train_loss": 0.0378638431429863, "global_step": 1520, "epoch": 12, "lr": 9.994884068824623e-05} +{"train_loss": 0.043443527072668076, "global_step": 1521, "epoch": 12, "lr": 9.994874044217793e-05} +{"train_loss": 0.03602166846394539, "global_step": 1522, "epoch": 12, "lr": 9.994864009804062e-05} +{"train_loss": 0.03727700933814049, "global_step": 1523, "epoch": 12, "lr": 9.994853965583448e-05} +{"train_loss": 0.03387906402349472, "global_step": 1524, "epoch": 12, "lr": 9.994843911555974e-05} +{"train_loss": 0.04066281020641327, "global_step": 1525, "epoch": 12, "lr": 9.994833847721655e-05} +{"train_loss": 0.03350131958723068, "global_step": 1526, "epoch": 12, "lr": 9.994823774080515e-05} +{"train_loss": 0.03028242662549019, "global_step": 1527, "epoch": 12, "lr": 9.994813690632571e-05} +{"train_loss": 0.035384275019168854, "global_step": 1528, "epoch": 12, "lr": 9.994803597377844e-05} +{"train_loss": 0.037041716277599335, "global_step": 1529, "epoch": 12, "lr": 9.994793494316355e-05} +{"train_loss": 0.043629683554172516, "global_step": 1530, "epoch": 12, "lr": 9.994783381448122e-05} +{"train_loss": 0.040786899626255035, "global_step": 1531, "epoch": 12, "lr": 9.994773258773164e-05} +{"train_loss": 0.04765660688281059, "global_step": 1532, "epoch": 12, "lr": 9.994763126291504e-05} +{"train_loss": 0.030821120366454124, "global_step": 1533, "epoch": 12, "lr": 9.99475298400316e-05} +{"train_loss": 0.04561260715126991, "global_step": 1534, "epoch": 12, "lr": 9.994742831908152e-05} +{"train_loss": 0.031449563801288605, "global_step": 1535, "epoch": 12, "lr": 9.9947326700065e-05} +{"train_loss": 0.03928951174020767, "global_step": 1536, "epoch": 12, "lr": 9.994722498298225e-05} +{"train_loss": 0.053076352924108505, "global_step": 1537, "epoch": 12, "lr": 9.994712316783345e-05} +{"train_loss": 0.04173453897237778, "global_step": 1538, "epoch": 12, "lr": 9.994702125461882e-05} +{"train_loss": 0.05046491324901581, "global_step": 1539, "epoch": 12, "lr": 9.994691924333852e-05} +{"train_loss": 0.03638467192649841, "global_step": 1540, "epoch": 12, "lr": 9.994681713399282e-05} +{"train_loss": 0.0533137246966362, "global_step": 1541, "epoch": 12, "lr": 9.994671492658184e-05} +{"train_loss": 0.03490400314331055, "global_step": 1542, "epoch": 12, "lr": 9.994661262110586e-05} +{"train_loss": 0.044202227145433426, "global_step": 1543, "epoch": 12, "lr": 9.994651021756501e-05} +{"train_loss": 0.03461962938308716, "global_step": 1544, "epoch": 12, "lr": 9.994640771595954e-05} +{"train_loss": 0.05065252259373665, "global_step": 1545, "epoch": 12, "lr": 9.994630511628962e-05} +{"train_loss": 0.03955644993659328, "global_step": 1546, "epoch": 12, "lr": 9.994620241855548e-05, "val_loss": 0.05138614773750305} +{"train_loss": 0.04274456948041916, "global_step": 1547, "epoch": 13, "lr": 9.99460996227573e-05} +{"train_loss": 0.04291261360049248, "global_step": 1548, "epoch": 13, "lr": 9.99459967288953e-05} +{"train_loss": 0.04253503307700157, "global_step": 1549, "epoch": 13, "lr": 9.994589373696966e-05} +{"train_loss": 0.047757588326931, "global_step": 1550, "epoch": 13, "lr": 9.994579064698059e-05} +{"train_loss": 0.038074325770139694, "global_step": 1551, "epoch": 13, "lr": 9.994568745892832e-05} +{"train_loss": 0.034071095287799835, "global_step": 1552, "epoch": 13, "lr": 9.994558417281301e-05} +{"train_loss": 0.03295424208045006, "global_step": 1553, "epoch": 13, "lr": 9.994548078863488e-05} +{"train_loss": 0.0414186492562294, "global_step": 1554, "epoch": 13, "lr": 9.994537730639416e-05} +{"train_loss": 0.05404345691204071, "global_step": 1555, "epoch": 13, "lr": 9.9945273726091e-05} +{"train_loss": 0.04294978454709053, "global_step": 1556, "epoch": 13, "lr": 9.994517004772564e-05} +{"train_loss": 0.041671063750982285, "global_step": 1557, "epoch": 13, "lr": 9.994506627129826e-05} +{"train_loss": 0.032517753541469574, "global_step": 1558, "epoch": 13, "lr": 9.99449623968091e-05} +{"train_loss": 0.03915764391422272, "global_step": 1559, "epoch": 13, "lr": 9.994485842425833e-05} +{"train_loss": 0.033329106867313385, "global_step": 1560, "epoch": 13, "lr": 9.994475435364616e-05} +{"train_loss": 0.0386471264064312, "global_step": 1561, "epoch": 13, "lr": 9.994465018497281e-05} +{"train_loss": 0.03576468676328659, "global_step": 1562, "epoch": 13, "lr": 9.994454591823848e-05} +{"train_loss": 0.036121029406785965, "global_step": 1563, "epoch": 13, "lr": 9.994444155344336e-05} +{"train_loss": 0.035990454256534576, "global_step": 1564, "epoch": 13, "lr": 9.994433709058767e-05} +{"train_loss": 0.022043893113732338, "global_step": 1565, "epoch": 13, "lr": 9.994423252967161e-05} +{"train_loss": 0.038952458649873734, "global_step": 1566, "epoch": 13, "lr": 9.994412787069539e-05} +{"train_loss": 0.044898681342601776, "global_step": 1567, "epoch": 13, "lr": 9.99440231136592e-05} +{"train_loss": 0.03845115378499031, "global_step": 1568, "epoch": 13, "lr": 9.994391825856326e-05} +{"train_loss": 0.04238715395331383, "global_step": 1569, "epoch": 13, "lr": 9.994381330540778e-05} +{"train_loss": 0.039873670786619186, "global_step": 1570, "epoch": 13, "lr": 9.994370825419295e-05} +{"train_loss": 0.0393221378326416, "global_step": 1571, "epoch": 13, "lr": 9.994360310491898e-05} +{"train_loss": 0.0364856943488121, "global_step": 1572, "epoch": 13, "lr": 9.994349785758609e-05} +{"train_loss": 0.032069720327854156, "global_step": 1573, "epoch": 13, "lr": 9.994339251219446e-05} +{"train_loss": 0.04090416431427002, "global_step": 1574, "epoch": 13, "lr": 9.994328706874433e-05} +{"train_loss": 0.04043062776327133, "global_step": 1575, "epoch": 13, "lr": 9.99431815272359e-05} +{"train_loss": 0.03398051857948303, "global_step": 1576, "epoch": 13, "lr": 9.994307588766936e-05} +{"train_loss": 0.033316999673843384, "global_step": 1577, "epoch": 13, "lr": 9.994297015004492e-05} +{"train_loss": 0.032184112817049026, "global_step": 1578, "epoch": 13, "lr": 9.994286431436281e-05} +{"train_loss": 0.03477528318762779, "global_step": 1579, "epoch": 13, "lr": 9.994275838062322e-05} +{"train_loss": 0.029116351157426834, "global_step": 1580, "epoch": 13, "lr": 9.994265234882634e-05} +{"train_loss": 0.03853626176714897, "global_step": 1581, "epoch": 13, "lr": 9.994254621897241e-05} +{"train_loss": 0.03799551725387573, "global_step": 1582, "epoch": 13, "lr": 9.994243999106162e-05} +{"train_loss": 0.04254110902547836, "global_step": 1583, "epoch": 13, "lr": 9.994233366509418e-05} +{"train_loss": 0.03275996446609497, "global_step": 1584, "epoch": 13, "lr": 9.994222724107032e-05} +{"train_loss": 0.03449162095785141, "global_step": 1585, "epoch": 13, "lr": 9.994212071899022e-05} +{"train_loss": 0.028167877346277237, "global_step": 1586, "epoch": 13, "lr": 9.994201409885411e-05} +{"train_loss": 0.0300401970744133, "global_step": 1587, "epoch": 13, "lr": 9.99419073806622e-05} +{"train_loss": 0.03238999471068382, "global_step": 1588, "epoch": 13, "lr": 9.994180056441467e-05} +{"train_loss": 0.03828848525881767, "global_step": 1589, "epoch": 13, "lr": 9.994169365011175e-05} +{"train_loss": 0.042667485773563385, "global_step": 1590, "epoch": 13, "lr": 9.994158663775366e-05} +{"train_loss": 0.04169977456331253, "global_step": 1591, "epoch": 13, "lr": 9.99414795273406e-05} +{"train_loss": 0.033001720905303955, "global_step": 1592, "epoch": 13, "lr": 9.994137231887278e-05} +{"train_loss": 0.041448842734098434, "global_step": 1593, "epoch": 13, "lr": 9.99412650123504e-05} +{"train_loss": 0.04483344033360481, "global_step": 1594, "epoch": 13, "lr": 9.99411576077737e-05} +{"train_loss": 0.031676676124334335, "global_step": 1595, "epoch": 13, "lr": 9.994105010514285e-05} +{"train_loss": 0.036594171077013016, "global_step": 1596, "epoch": 13, "lr": 9.994094250445811e-05} +{"train_loss": 0.04462302103638649, "global_step": 1597, "epoch": 13, "lr": 9.994083480571965e-05} +{"train_loss": 0.033277325332164764, "global_step": 1598, "epoch": 13, "lr": 9.994072700892769e-05} +{"train_loss": 0.03331218659877777, "global_step": 1599, "epoch": 13, "lr": 9.994061911408245e-05} +{"train_loss": 0.03420059382915497, "global_step": 1600, "epoch": 13, "lr": 9.994051112118415e-05} +{"train_loss": 0.03495971858501434, "global_step": 1601, "epoch": 13, "lr": 9.9940403030233e-05} +{"train_loss": 0.027546312659978867, "global_step": 1602, "epoch": 13, "lr": 9.994029484122917e-05} +{"train_loss": 0.029600434005260468, "global_step": 1603, "epoch": 13, "lr": 9.994018655417294e-05} +{"train_loss": 0.03121996857225895, "global_step": 1604, "epoch": 13, "lr": 9.994007816906448e-05} +{"train_loss": 0.0346190519630909, "global_step": 1605, "epoch": 13, "lr": 9.9939969685904e-05} +{"train_loss": 0.036886945366859436, "global_step": 1606, "epoch": 13, "lr": 9.993986110469174e-05} +{"train_loss": 0.024817658588290215, "global_step": 1607, "epoch": 13, "lr": 9.993975242542789e-05} +{"train_loss": 0.040908992290496826, "global_step": 1608, "epoch": 13, "lr": 9.993964364811268e-05} +{"train_loss": 0.038212813436985016, "global_step": 1609, "epoch": 13, "lr": 9.99395347727463e-05} +{"train_loss": 0.0403255894780159, "global_step": 1610, "epoch": 13, "lr": 9.993942579932898e-05} +{"train_loss": 0.03991164267063141, "global_step": 1611, "epoch": 13, "lr": 9.993931672786095e-05} +{"train_loss": 0.027687449008226395, "global_step": 1612, "epoch": 13, "lr": 9.993920755834239e-05} +{"train_loss": 0.035250913351774216, "global_step": 1613, "epoch": 13, "lr": 9.993909829077353e-05} +{"train_loss": 0.03047572448849678, "global_step": 1614, "epoch": 13, "lr": 9.993898892515459e-05} +{"train_loss": 0.03045780025422573, "global_step": 1615, "epoch": 13, "lr": 9.993887946148579e-05} +{"train_loss": 0.03572133928537369, "global_step": 1616, "epoch": 13, "lr": 9.993876989976734e-05} +{"train_loss": 0.03212887793779373, "global_step": 1617, "epoch": 13, "lr": 9.993866023999942e-05} +{"train_loss": 0.035459004342556, "global_step": 1618, "epoch": 13, "lr": 9.99385504821823e-05} +{"train_loss": 0.04127832129597664, "global_step": 1619, "epoch": 13, "lr": 9.993844062631616e-05} +{"train_loss": 0.04118191450834274, "global_step": 1620, "epoch": 13, "lr": 9.993833067240124e-05} +{"train_loss": 0.0428520105779171, "global_step": 1621, "epoch": 13, "lr": 9.993822062043774e-05} +{"train_loss": 0.03764795511960983, "global_step": 1622, "epoch": 13, "lr": 9.993811047042588e-05} +{"train_loss": 0.033757954835891724, "global_step": 1623, "epoch": 13, "lr": 9.993800022236586e-05} +{"train_loss": 0.03550177812576294, "global_step": 1624, "epoch": 13, "lr": 9.993788987625792e-05} +{"train_loss": 0.03809908777475357, "global_step": 1625, "epoch": 13, "lr": 9.993777943210228e-05} +{"train_loss": 0.03490697965025902, "global_step": 1626, "epoch": 13, "lr": 9.993766888989913e-05} +{"train_loss": 0.03513406962156296, "global_step": 1627, "epoch": 13, "lr": 9.99375582496487e-05} +{"train_loss": 0.037373851984739304, "global_step": 1628, "epoch": 13, "lr": 9.993744751135122e-05} +{"train_loss": 0.033870480954647064, "global_step": 1629, "epoch": 13, "lr": 9.993733667500689e-05} +{"train_loss": 0.042708687484264374, "global_step": 1630, "epoch": 13, "lr": 9.993722574061595e-05} +{"train_loss": 0.02815634198486805, "global_step": 1631, "epoch": 13, "lr": 9.993711470817859e-05} +{"train_loss": 0.029069889336824417, "global_step": 1632, "epoch": 13, "lr": 9.993700357769503e-05} +{"train_loss": 0.039347030222415924, "global_step": 1633, "epoch": 13, "lr": 9.993689234916551e-05} +{"train_loss": 0.03589136525988579, "global_step": 1634, "epoch": 13, "lr": 9.993678102259023e-05} +{"train_loss": 0.035343509167432785, "global_step": 1635, "epoch": 13, "lr": 9.993666959796944e-05} +{"train_loss": 0.041333891451358795, "global_step": 1636, "epoch": 13, "lr": 9.993655807530331e-05} +{"train_loss": 0.0316307358443737, "global_step": 1637, "epoch": 13, "lr": 9.993644645459209e-05} +{"train_loss": 0.03703130781650543, "global_step": 1638, "epoch": 13, "lr": 9.993633473583599e-05} +{"train_loss": 0.031139740720391273, "global_step": 1639, "epoch": 13, "lr": 9.993622291903521e-05} +{"train_loss": 0.03347397595643997, "global_step": 1640, "epoch": 13, "lr": 9.993611100419002e-05} +{"train_loss": 0.028070170432329178, "global_step": 1641, "epoch": 13, "lr": 9.993599899130062e-05} +{"train_loss": 0.0387161448597908, "global_step": 1642, "epoch": 13, "lr": 9.993588688036719e-05} +{"train_loss": 0.031206170096993446, "global_step": 1643, "epoch": 13, "lr": 9.993577467139001e-05} +{"train_loss": 0.036064185202121735, "global_step": 1644, "epoch": 13, "lr": 9.993566236436926e-05} +{"train_loss": 0.040502361953258514, "global_step": 1645, "epoch": 13, "lr": 9.993554995930516e-05} +{"train_loss": 0.027657978236675262, "global_step": 1646, "epoch": 13, "lr": 9.993543745619796e-05} +{"train_loss": 0.03839762136340141, "global_step": 1647, "epoch": 13, "lr": 9.993532485504783e-05} +{"train_loss": 0.030774202197790146, "global_step": 1648, "epoch": 13, "lr": 9.993521215585506e-05} +{"train_loss": 0.045302025973796844, "global_step": 1649, "epoch": 13, "lr": 9.993509935861983e-05} +{"train_loss": 0.03760372847318649, "global_step": 1650, "epoch": 13, "lr": 9.993498646334236e-05} +{"train_loss": 0.03403032571077347, "global_step": 1651, "epoch": 13, "lr": 9.993487347002288e-05} +{"train_loss": 0.03630804270505905, "global_step": 1652, "epoch": 13, "lr": 9.993476037866161e-05} +{"train_loss": 0.03117300011217594, "global_step": 1653, "epoch": 13, "lr": 9.993464718925878e-05} +{"train_loss": 0.04544099420309067, "global_step": 1654, "epoch": 13, "lr": 9.99345339018146e-05} +{"train_loss": 0.038934506475925446, "global_step": 1655, "epoch": 13, "lr": 9.993442051632931e-05} +{"train_loss": 0.031047144904732704, "global_step": 1656, "epoch": 13, "lr": 9.99343070328031e-05} +{"train_loss": 0.041510533541440964, "global_step": 1657, "epoch": 13, "lr": 9.993419345123623e-05} +{"train_loss": 0.03426332399249077, "global_step": 1658, "epoch": 13, "lr": 9.993407977162889e-05} +{"train_loss": 0.03100288286805153, "global_step": 1659, "epoch": 13, "lr": 9.993396599398133e-05} +{"train_loss": 0.03299815580248833, "global_step": 1660, "epoch": 13, "lr": 9.993385211829375e-05} +{"train_loss": 0.036265742033720016, "global_step": 1661, "epoch": 13, "lr": 9.993373814456639e-05} +{"train_loss": 0.04599892348051071, "global_step": 1662, "epoch": 13, "lr": 9.993362407279947e-05} +{"train_loss": 0.04655643180012703, "global_step": 1663, "epoch": 13, "lr": 9.993350990299322e-05} +{"train_loss": 0.036863796412944794, "global_step": 1664, "epoch": 13, "lr": 9.993339563514786e-05} +{"train_loss": 0.03644246562626682, "global_step": 1665, "epoch": 13, "lr": 9.99332812692636e-05, "val_loss": 0.045812517404556274} +{"train_loss": 0.04217119514942169, "global_step": 1666, "epoch": 14, "lr": 9.993316680534068e-05} +{"train_loss": 0.034511614590883255, "global_step": 1667, "epoch": 14, "lr": 9.993305224337933e-05} +{"train_loss": 0.03734787926077843, "global_step": 1668, "epoch": 14, "lr": 9.993293758337975e-05} +{"train_loss": 0.04557838663458824, "global_step": 1669, "epoch": 14, "lr": 9.993282282534221e-05} +{"train_loss": 0.030671536922454834, "global_step": 1670, "epoch": 14, "lr": 9.993270796926687e-05} +{"train_loss": 0.0324784591794014, "global_step": 1671, "epoch": 14, "lr": 9.993259301515404e-05} +{"train_loss": 0.038669899106025696, "global_step": 1672, "epoch": 14, "lr": 9.993247796300387e-05} +{"train_loss": 0.03366297483444214, "global_step": 1673, "epoch": 14, "lr": 9.99323628128166e-05} +{"train_loss": 0.034513574093580246, "global_step": 1674, "epoch": 14, "lr": 9.99322475645925e-05} +{"train_loss": 0.0331711545586586, "global_step": 1675, "epoch": 14, "lr": 9.993213221833175e-05} +{"train_loss": 0.03013686090707779, "global_step": 1676, "epoch": 14, "lr": 9.993201677403459e-05} +{"train_loss": 0.03326549753546715, "global_step": 1677, "epoch": 14, "lr": 9.993190123170125e-05} +{"train_loss": 0.03145737946033478, "global_step": 1678, "epoch": 14, "lr": 9.993178559133197e-05} +{"train_loss": 0.02562372013926506, "global_step": 1679, "epoch": 14, "lr": 9.993166985292694e-05} +{"train_loss": 0.031994469463825226, "global_step": 1680, "epoch": 14, "lr": 9.993155401648643e-05} +{"train_loss": 0.029354991391301155, "global_step": 1681, "epoch": 14, "lr": 9.993143808201064e-05} +{"train_loss": 0.03207208588719368, "global_step": 1682, "epoch": 14, "lr": 9.993132204949981e-05} +{"train_loss": 0.029112040996551514, "global_step": 1683, "epoch": 14, "lr": 9.993120591895416e-05} +{"train_loss": 0.029283517971634865, "global_step": 1684, "epoch": 14, "lr": 9.993108969037392e-05} +{"train_loss": 0.03597663715481758, "global_step": 1685, "epoch": 14, "lr": 9.993097336375933e-05} +{"train_loss": 0.031912632286548615, "global_step": 1686, "epoch": 14, "lr": 9.99308569391106e-05} +{"train_loss": 0.027075113728642464, "global_step": 1687, "epoch": 14, "lr": 9.993074041642796e-05} +{"train_loss": 0.03991103172302246, "global_step": 1688, "epoch": 14, "lr": 9.993062379571166e-05} +{"train_loss": 0.0349070243537426, "global_step": 1689, "epoch": 14, "lr": 9.993050707696191e-05} +{"train_loss": 0.03703415393829346, "global_step": 1690, "epoch": 14, "lr": 9.993039026017894e-05} +{"train_loss": 0.03588526323437691, "global_step": 1691, "epoch": 14, "lr": 9.993027334536297e-05} +{"train_loss": 0.03379062935709953, "global_step": 1692, "epoch": 14, "lr": 9.993015633251426e-05} +{"train_loss": 0.036464232951402664, "global_step": 1693, "epoch": 14, "lr": 9.993003922163304e-05} +{"train_loss": 0.02651381306350231, "global_step": 1694, "epoch": 14, "lr": 9.99299220127195e-05} +{"train_loss": 0.03161921352148056, "global_step": 1695, "epoch": 14, "lr": 9.992980470577388e-05} +{"train_loss": 0.0298214890062809, "global_step": 1696, "epoch": 14, "lr": 9.992968730079643e-05} +{"train_loss": 0.04164135456085205, "global_step": 1697, "epoch": 14, "lr": 9.992956979778739e-05} +{"train_loss": 0.028016330674290657, "global_step": 1698, "epoch": 14, "lr": 9.992945219674696e-05} +{"train_loss": 0.035338956862688065, "global_step": 1699, "epoch": 14, "lr": 9.992933449767539e-05} +{"train_loss": 0.029752060770988464, "global_step": 1700, "epoch": 14, "lr": 9.992921670057292e-05} +{"train_loss": 0.03413130342960358, "global_step": 1701, "epoch": 14, "lr": 9.992909880543975e-05} +{"train_loss": 0.03568175062537193, "global_step": 1702, "epoch": 14, "lr": 9.992898081227612e-05} +{"train_loss": 0.031575970351696014, "global_step": 1703, "epoch": 14, "lr": 9.992886272108229e-05} +{"train_loss": 0.033414267003536224, "global_step": 1704, "epoch": 14, "lr": 9.992874453185846e-05} +{"train_loss": 0.023194607347249985, "global_step": 1705, "epoch": 14, "lr": 9.992862624460488e-05} +{"train_loss": 0.027881795540452003, "global_step": 1706, "epoch": 14, "lr": 9.992850785932176e-05} +{"train_loss": 0.034572649747133255, "global_step": 1707, "epoch": 14, "lr": 9.992838937600936e-05} +{"train_loss": 0.025821484625339508, "global_step": 1708, "epoch": 14, "lr": 9.992827079466791e-05} +{"train_loss": 0.029246846213936806, "global_step": 1709, "epoch": 14, "lr": 9.992815211529762e-05} +{"train_loss": 0.02529696188867092, "global_step": 1710, "epoch": 14, "lr": 9.992803333789875e-05} +{"train_loss": 0.034651979804039, "global_step": 1711, "epoch": 14, "lr": 9.992791446247152e-05} +{"train_loss": 0.03293200954794884, "global_step": 1712, "epoch": 14, "lr": 9.992779548901616e-05} +{"train_loss": 0.04082895442843437, "global_step": 1713, "epoch": 14, "lr": 9.992767641753291e-05} +{"train_loss": 0.032007645815610886, "global_step": 1714, "epoch": 14, "lr": 9.9927557248022e-05} +{"train_loss": 0.02393564209342003, "global_step": 1715, "epoch": 14, "lr": 9.992743798048365e-05} +{"train_loss": 0.04496493563055992, "global_step": 1716, "epoch": 14, "lr": 9.992731861491813e-05} +{"train_loss": 0.03228103742003441, "global_step": 1717, "epoch": 14, "lr": 9.992719915132565e-05} +{"train_loss": 0.027283573523163795, "global_step": 1718, "epoch": 14, "lr": 9.992707958970644e-05} +{"train_loss": 0.039498068392276764, "global_step": 1719, "epoch": 14, "lr": 9.992695993006077e-05} +{"train_loss": 0.03196753188967705, "global_step": 1720, "epoch": 14, "lr": 9.992684017238882e-05} +{"train_loss": 0.023894306272268295, "global_step": 1721, "epoch": 14, "lr": 9.992672031669086e-05} +{"train_loss": 0.03707566484808922, "global_step": 1722, "epoch": 14, "lr": 9.992660036296711e-05} +{"train_loss": 0.03133593499660492, "global_step": 1723, "epoch": 14, "lr": 9.992648031121783e-05} +{"train_loss": 0.038915686309337616, "global_step": 1724, "epoch": 14, "lr": 9.992636016144324e-05} +{"train_loss": 0.03748741373419762, "global_step": 1725, "epoch": 14, "lr": 9.992623991364356e-05} +{"train_loss": 0.04144283011555672, "global_step": 1726, "epoch": 14, "lr": 9.992611956781904e-05} +{"train_loss": 0.03157753124833107, "global_step": 1727, "epoch": 14, "lr": 9.992599912396994e-05} +{"train_loss": 0.03599470853805542, "global_step": 1728, "epoch": 14, "lr": 9.992587858209646e-05} +{"train_loss": 0.034084949642419815, "global_step": 1729, "epoch": 14, "lr": 9.992575794219885e-05} +{"train_loss": 0.03390633687376976, "global_step": 1730, "epoch": 14, "lr": 9.992563720427734e-05} +{"train_loss": 0.03138008341193199, "global_step": 1731, "epoch": 14, "lr": 9.992551636833221e-05} +{"train_loss": 0.028019938617944717, "global_step": 1732, "epoch": 14, "lr": 9.992539543436363e-05} +{"train_loss": 0.032986536622047424, "global_step": 1733, "epoch": 14, "lr": 9.992527440237187e-05} +{"train_loss": 0.032595809549093246, "global_step": 1734, "epoch": 14, "lr": 9.992515327235718e-05} +{"train_loss": 0.04337194189429283, "global_step": 1735, "epoch": 14, "lr": 9.992503204431978e-05} +{"train_loss": 0.038282670080661774, "global_step": 1736, "epoch": 14, "lr": 9.992491071825991e-05} +{"train_loss": 0.036670148372650146, "global_step": 1737, "epoch": 14, "lr": 9.992478929417783e-05} +{"train_loss": 0.03836308419704437, "global_step": 1738, "epoch": 14, "lr": 9.992466777207375e-05} +{"train_loss": 0.03620312362909317, "global_step": 1739, "epoch": 14, "lr": 9.99245461519479e-05} +{"train_loss": 0.03725939616560936, "global_step": 1740, "epoch": 14, "lr": 9.992442443380057e-05} +{"train_loss": 0.0395168662071228, "global_step": 1741, "epoch": 14, "lr": 9.992430261763194e-05} +{"train_loss": 0.033303700387477875, "global_step": 1742, "epoch": 14, "lr": 9.992418070344228e-05} +{"train_loss": 0.026718681678175926, "global_step": 1743, "epoch": 14, "lr": 9.992405869123182e-05} +{"train_loss": 0.025000127032399178, "global_step": 1744, "epoch": 14, "lr": 9.992393658100084e-05} +{"train_loss": 0.036675214767456055, "global_step": 1745, "epoch": 14, "lr": 9.99238143727495e-05} +{"train_loss": 0.029045676812529564, "global_step": 1746, "epoch": 14, "lr": 9.99236920664781e-05} +{"train_loss": 0.03438083082437515, "global_step": 1747, "epoch": 14, "lr": 9.992356966218687e-05} +{"train_loss": 0.035943321883678436, "global_step": 1748, "epoch": 14, "lr": 9.992344715987603e-05} +{"train_loss": 0.035720791667699814, "global_step": 1749, "epoch": 14, "lr": 9.992332455954585e-05} +{"train_loss": 0.030047306790947914, "global_step": 1750, "epoch": 14, "lr": 9.992320186119655e-05} +{"train_loss": 0.03202098235487938, "global_step": 1751, "epoch": 14, "lr": 9.992307906482839e-05} +{"train_loss": 0.03876939043402672, "global_step": 1752, "epoch": 14, "lr": 9.992295617044158e-05} +{"train_loss": 0.027787484228610992, "global_step": 1753, "epoch": 14, "lr": 9.99228331780364e-05} +{"train_loss": 0.04190598800778389, "global_step": 1754, "epoch": 14, "lr": 9.992271008761304e-05} +{"train_loss": 0.03459431976079941, "global_step": 1755, "epoch": 14, "lr": 9.992258689917178e-05} +{"train_loss": 0.03304927796125412, "global_step": 1756, "epoch": 14, "lr": 9.992246361271287e-05} +{"train_loss": 0.033363502472639084, "global_step": 1757, "epoch": 14, "lr": 9.992234022823652e-05} +{"train_loss": 0.03413645550608635, "global_step": 1758, "epoch": 14, "lr": 9.9922216745743e-05} +{"train_loss": 0.02747879922389984, "global_step": 1759, "epoch": 14, "lr": 9.992209316523254e-05} +{"train_loss": 0.03290066868066788, "global_step": 1760, "epoch": 14, "lr": 9.992196948670537e-05} +{"train_loss": 0.032141830772161484, "global_step": 1761, "epoch": 14, "lr": 9.992184571016177e-05} +{"train_loss": 0.031658053398132324, "global_step": 1762, "epoch": 14, "lr": 9.992172183560193e-05} +{"train_loss": 0.029764261096715927, "global_step": 1763, "epoch": 14, "lr": 9.992159786302616e-05} +{"train_loss": 0.030321693047881126, "global_step": 1764, "epoch": 14, "lr": 9.992147379243463e-05} +{"train_loss": 0.03764437511563301, "global_step": 1765, "epoch": 14, "lr": 9.992134962382763e-05} +{"train_loss": 0.026529507711529732, "global_step": 1766, "epoch": 14, "lr": 9.992122535720541e-05} +{"train_loss": 0.037727683782577515, "global_step": 1767, "epoch": 14, "lr": 9.992110099256817e-05} +{"train_loss": 0.02642766572535038, "global_step": 1768, "epoch": 14, "lr": 9.99209765299162e-05} +{"train_loss": 0.03599083423614502, "global_step": 1769, "epoch": 14, "lr": 9.992085196924971e-05} +{"train_loss": 0.03185497969388962, "global_step": 1770, "epoch": 14, "lr": 9.992072731056898e-05} +{"train_loss": 0.028219228610396385, "global_step": 1771, "epoch": 14, "lr": 9.992060255387423e-05} +{"train_loss": 0.030421914532780647, "global_step": 1772, "epoch": 14, "lr": 9.99204776991657e-05} +{"train_loss": 0.03487233445048332, "global_step": 1773, "epoch": 14, "lr": 9.992035274644366e-05} +{"train_loss": 0.036521509289741516, "global_step": 1774, "epoch": 14, "lr": 9.992022769570834e-05} +{"train_loss": 0.03672399744391441, "global_step": 1775, "epoch": 14, "lr": 9.992010254695997e-05} +{"train_loss": 0.02847953699529171, "global_step": 1776, "epoch": 14, "lr": 9.991997730019882e-05} +{"train_loss": 0.03206805884838104, "global_step": 1777, "epoch": 14, "lr": 9.991985195542513e-05} +{"train_loss": 0.025365639477968216, "global_step": 1778, "epoch": 14, "lr": 9.991972651263914e-05} +{"train_loss": 0.03631097823381424, "global_step": 1779, "epoch": 14, "lr": 9.99196009718411e-05} +{"train_loss": 0.03185654804110527, "global_step": 1780, "epoch": 14, "lr": 9.991947533303127e-05} +{"train_loss": 0.03356533870100975, "global_step": 1781, "epoch": 14, "lr": 9.991934959620987e-05} +{"train_loss": 0.032170962542295456, "global_step": 1782, "epoch": 14, "lr": 9.991922376137717e-05} +{"train_loss": 0.03771638870239258, "global_step": 1783, "epoch": 14, "lr": 9.991909782853339e-05} +{"train_loss": 0.033223228716925415, "global_step": 1784, "epoch": 14, "lr": 9.99189717976788e-05, "val_loss": 0.04745185375213623} +{"train_loss": 0.0342182032763958, "global_step": 1785, "epoch": 15, "lr": 9.991884566881365e-05} +{"train_loss": 0.030141431838274002, "global_step": 1786, "epoch": 15, "lr": 9.991871944193818e-05} +{"train_loss": 0.029617756605148315, "global_step": 1787, "epoch": 15, "lr": 9.991859311705262e-05} +{"train_loss": 0.03441544994711876, "global_step": 1788, "epoch": 15, "lr": 9.991846669415725e-05} +{"train_loss": 0.02944611757993698, "global_step": 1789, "epoch": 15, "lr": 9.99183401732523e-05} +{"train_loss": 0.029037300497293472, "global_step": 1790, "epoch": 15, "lr": 9.991821355433803e-05} +{"train_loss": 0.0313679501414299, "global_step": 1791, "epoch": 15, "lr": 9.991808683741469e-05} +{"train_loss": 0.03642527759075165, "global_step": 1792, "epoch": 15, "lr": 9.99179600224825e-05} +{"train_loss": 0.041627392172813416, "global_step": 1793, "epoch": 15, "lr": 9.991783310954172e-05} +{"train_loss": 0.034439630806446075, "global_step": 1794, "epoch": 15, "lr": 9.991770609859264e-05} +{"train_loss": 0.03237418830394745, "global_step": 1795, "epoch": 15, "lr": 9.991757898963545e-05} +{"train_loss": 0.035047903656959534, "global_step": 1796, "epoch": 15, "lr": 9.991745178267042e-05} +{"train_loss": 0.026725763455033302, "global_step": 1797, "epoch": 15, "lr": 9.991732447769784e-05} +{"train_loss": 0.030626481398940086, "global_step": 1798, "epoch": 15, "lr": 9.99171970747179e-05} +{"train_loss": 0.02939138002693653, "global_step": 1799, "epoch": 15, "lr": 9.991706957373088e-05} +{"train_loss": 0.027077987790107727, "global_step": 1800, "epoch": 15, "lr": 9.991694197473703e-05} +{"train_loss": 0.027609581127762794, "global_step": 1801, "epoch": 15, "lr": 9.99168142777366e-05} +{"train_loss": 0.03357607126235962, "global_step": 1802, "epoch": 15, "lr": 9.991668648272984e-05} +{"train_loss": 0.029878970235586166, "global_step": 1803, "epoch": 15, "lr": 9.991655858971699e-05} +{"train_loss": 0.03426152095198631, "global_step": 1804, "epoch": 15, "lr": 9.991643059869831e-05} +{"train_loss": 0.035355180501937866, "global_step": 1805, "epoch": 15, "lr": 9.991630250967406e-05} +{"train_loss": 0.031018676236271858, "global_step": 1806, "epoch": 15, "lr": 9.991617432264448e-05} +{"train_loss": 0.04242273420095444, "global_step": 1807, "epoch": 15, "lr": 9.991604603760982e-05} +{"train_loss": 0.030559923499822617, "global_step": 1808, "epoch": 15, "lr": 9.991591765457034e-05} +{"train_loss": 0.032561417669057846, "global_step": 1809, "epoch": 15, "lr": 9.991578917352629e-05} +{"train_loss": 0.026735488325357437, "global_step": 1810, "epoch": 15, "lr": 9.991566059447792e-05} +{"train_loss": 0.023706454783678055, "global_step": 1811, "epoch": 15, "lr": 9.991553191742548e-05} +{"train_loss": 0.029071439057588577, "global_step": 1812, "epoch": 15, "lr": 9.991540314236923e-05} +{"train_loss": 0.03360164910554886, "global_step": 1813, "epoch": 15, "lr": 9.991527426930941e-05} +{"train_loss": 0.03579642251133919, "global_step": 1814, "epoch": 15, "lr": 9.991514529824628e-05} +{"train_loss": 0.03289247676730156, "global_step": 1815, "epoch": 15, "lr": 9.991501622918012e-05} +{"train_loss": 0.035255398601293564, "global_step": 1816, "epoch": 15, "lr": 9.991488706211112e-05} +{"train_loss": 0.03435814008116722, "global_step": 1817, "epoch": 15, "lr": 9.99147577970396e-05} +{"train_loss": 0.029459606856107712, "global_step": 1818, "epoch": 15, "lr": 9.991462843396577e-05} +{"train_loss": 0.03712709620594978, "global_step": 1819, "epoch": 15, "lr": 9.991449897288991e-05} +{"train_loss": 0.029676370322704315, "global_step": 1820, "epoch": 15, "lr": 9.991436941381228e-05} +{"train_loss": 0.04279986768960953, "global_step": 1821, "epoch": 15, "lr": 9.991423975673308e-05} +{"train_loss": 0.02284705825150013, "global_step": 1822, "epoch": 15, "lr": 9.991411000165262e-05} +{"train_loss": 0.02897481620311737, "global_step": 1823, "epoch": 15, "lr": 9.991398014857116e-05} +{"train_loss": 0.03713972494006157, "global_step": 1824, "epoch": 15, "lr": 9.99138501974889e-05} +{"train_loss": 0.03610164672136307, "global_step": 1825, "epoch": 15, "lr": 9.991372014840615e-05} +{"train_loss": 0.036657657474279404, "global_step": 1826, "epoch": 15, "lr": 9.991359000132312e-05} +{"train_loss": 0.038416892290115356, "global_step": 1827, "epoch": 15, "lr": 9.991345975624011e-05} +{"train_loss": 0.02666407637298107, "global_step": 1828, "epoch": 15, "lr": 9.991332941315735e-05} +{"train_loss": 0.0351986289024353, "global_step": 1829, "epoch": 15, "lr": 9.99131989720751e-05} +{"train_loss": 0.02316337451338768, "global_step": 1830, "epoch": 15, "lr": 9.99130684329936e-05} +{"train_loss": 0.02916521206498146, "global_step": 1831, "epoch": 15, "lr": 9.991293779591312e-05} +{"train_loss": 0.031145386397838593, "global_step": 1832, "epoch": 15, "lr": 9.991280706083395e-05} +{"train_loss": 0.03701447322964668, "global_step": 1833, "epoch": 15, "lr": 9.99126762277563e-05} +{"train_loss": 0.03221665322780609, "global_step": 1834, "epoch": 15, "lr": 9.991254529668044e-05} +{"train_loss": 0.035510238260030746, "global_step": 1835, "epoch": 15, "lr": 9.991241426760663e-05} +{"train_loss": 0.0400509312748909, "global_step": 1836, "epoch": 15, "lr": 9.991228314053514e-05} +{"train_loss": 0.026737535372376442, "global_step": 1837, "epoch": 15, "lr": 9.991215191546618e-05} +{"train_loss": 0.02661963179707527, "global_step": 1838, "epoch": 15, "lr": 9.991202059240007e-05} +{"train_loss": 0.03178577870130539, "global_step": 1839, "epoch": 15, "lr": 9.991188917133705e-05} +{"train_loss": 0.024136407300829887, "global_step": 1840, "epoch": 15, "lr": 9.991175765227736e-05} +{"train_loss": 0.027865508571267128, "global_step": 1841, "epoch": 15, "lr": 9.991162603522125e-05} +{"train_loss": 0.04118027910590172, "global_step": 1842, "epoch": 15, "lr": 9.9911494320169e-05} +{"train_loss": 0.03800925612449646, "global_step": 1843, "epoch": 15, "lr": 9.991136250712088e-05} +{"train_loss": 0.02858162857592106, "global_step": 1844, "epoch": 15, "lr": 9.99112305960771e-05} +{"train_loss": 0.03948647901415825, "global_step": 1845, "epoch": 15, "lr": 9.991109858703797e-05} +{"train_loss": 0.022864578291773796, "global_step": 1846, "epoch": 15, "lr": 9.991096648000373e-05} +{"train_loss": 0.029067670926451683, "global_step": 1847, "epoch": 15, "lr": 9.991083427497465e-05} +{"train_loss": 0.03722628578543663, "global_step": 1848, "epoch": 15, "lr": 9.991070197195096e-05} +{"train_loss": 0.0248599611222744, "global_step": 1849, "epoch": 15, "lr": 9.991056957093295e-05} +{"train_loss": 0.033719971776008606, "global_step": 1850, "epoch": 15, "lr": 9.991043707192088e-05} +{"train_loss": 0.03020985797047615, "global_step": 1851, "epoch": 15, "lr": 9.991030447491499e-05} +{"train_loss": 0.028037216514348984, "global_step": 1852, "epoch": 15, "lr": 9.991017177991553e-05} +{"train_loss": 0.03490554913878441, "global_step": 1853, "epoch": 15, "lr": 9.991003898692279e-05} +{"train_loss": 0.032418303191661835, "global_step": 1854, "epoch": 15, "lr": 9.990990609593702e-05} +{"train_loss": 0.024204064160585403, "global_step": 1855, "epoch": 15, "lr": 9.99097731069585e-05} +{"train_loss": 0.02680855430662632, "global_step": 1856, "epoch": 15, "lr": 9.990964001998746e-05} +{"train_loss": 0.028727490454912186, "global_step": 1857, "epoch": 15, "lr": 9.990950683502417e-05} +{"train_loss": 0.021222619339823723, "global_step": 1858, "epoch": 15, "lr": 9.99093735520689e-05} +{"train_loss": 0.032015468925237656, "global_step": 1859, "epoch": 15, "lr": 9.99092401711219e-05} +{"train_loss": 0.03262729570269585, "global_step": 1860, "epoch": 15, "lr": 9.990910669218346e-05} +{"train_loss": 0.021145960316061974, "global_step": 1861, "epoch": 15, "lr": 9.990897311525379e-05} +{"train_loss": 0.02964523620903492, "global_step": 1862, "epoch": 15, "lr": 9.99088394403332e-05} +{"train_loss": 0.030360601842403412, "global_step": 1863, "epoch": 15, "lr": 9.990870566742194e-05} +{"train_loss": 0.030735522508621216, "global_step": 1864, "epoch": 15, "lr": 9.990857179652025e-05} +{"train_loss": 0.025226078927516937, "global_step": 1865, "epoch": 15, "lr": 9.990843782762843e-05} +{"train_loss": 0.028154021129012108, "global_step": 1866, "epoch": 15, "lr": 9.990830376074672e-05} +{"train_loss": 0.02190288156270981, "global_step": 1867, "epoch": 15, "lr": 9.99081695958754e-05} +{"train_loss": 0.034048691391944885, "global_step": 1868, "epoch": 15, "lr": 9.990803533301469e-05} +{"train_loss": 0.027477048337459564, "global_step": 1869, "epoch": 15, "lr": 9.990790097216491e-05} +{"train_loss": 0.037840913981199265, "global_step": 1870, "epoch": 15, "lr": 9.990776651332627e-05} +{"train_loss": 0.01993262767791748, "global_step": 1871, "epoch": 15, "lr": 9.99076319564991e-05} +{"train_loss": 0.03518246114253998, "global_step": 1872, "epoch": 15, "lr": 9.99074973016836e-05} +{"train_loss": 0.020455295220017433, "global_step": 1873, "epoch": 15, "lr": 9.990736254888007e-05} +{"train_loss": 0.02259904518723488, "global_step": 1874, "epoch": 15, "lr": 9.990722769808875e-05} +{"train_loss": 0.026222940534353256, "global_step": 1875, "epoch": 15, "lr": 9.990709274930995e-05} +{"train_loss": 0.03197148069739342, "global_step": 1876, "epoch": 15, "lr": 9.990695770254388e-05} +{"train_loss": 0.02735820598900318, "global_step": 1877, "epoch": 15, "lr": 9.990682255779084e-05} +{"train_loss": 0.029108744114637375, "global_step": 1878, "epoch": 15, "lr": 9.99066873150511e-05} +{"train_loss": 0.037269871681928635, "global_step": 1879, "epoch": 15, "lr": 9.990655197432489e-05} +{"train_loss": 0.03542608022689819, "global_step": 1880, "epoch": 15, "lr": 9.99064165356125e-05} +{"train_loss": 0.033640675246715546, "global_step": 1881, "epoch": 15, "lr": 9.99062809989142e-05} +{"train_loss": 0.03285818547010422, "global_step": 1882, "epoch": 15, "lr": 9.990614536423024e-05} +{"train_loss": 0.02297576330602169, "global_step": 1883, "epoch": 15, "lr": 9.990600963156092e-05} +{"train_loss": 0.03406243026256561, "global_step": 1884, "epoch": 15, "lr": 9.990587380090645e-05} +{"train_loss": 0.022802332416176796, "global_step": 1885, "epoch": 15, "lr": 9.990573787226714e-05} +{"train_loss": 0.027116741985082626, "global_step": 1886, "epoch": 15, "lr": 9.990560184564325e-05} +{"train_loss": 0.04049333557486534, "global_step": 1887, "epoch": 15, "lr": 9.990546572103505e-05} +{"train_loss": 0.024750996381044388, "global_step": 1888, "epoch": 15, "lr": 9.990532949844279e-05} +{"train_loss": 0.03509454429149628, "global_step": 1889, "epoch": 15, "lr": 9.990519317786673e-05} +{"train_loss": 0.019398493692278862, "global_step": 1890, "epoch": 15, "lr": 9.990505675930717e-05} +{"train_loss": 0.034971173852682114, "global_step": 1891, "epoch": 15, "lr": 9.990492024276437e-05} +{"train_loss": 0.02792491391301155, "global_step": 1892, "epoch": 15, "lr": 9.990478362823859e-05} +{"train_loss": 0.021570775657892227, "global_step": 1893, "epoch": 15, "lr": 9.990464691573009e-05} +{"train_loss": 0.02693593129515648, "global_step": 1894, "epoch": 15, "lr": 9.990451010523913e-05} +{"train_loss": 0.0442073792219162, "global_step": 1895, "epoch": 15, "lr": 9.990437319676602e-05} +{"train_loss": 0.02959330752491951, "global_step": 1896, "epoch": 15, "lr": 9.990423619031101e-05} +{"train_loss": 0.03488597273826599, "global_step": 1897, "epoch": 15, "lr": 9.990409908587435e-05} +{"train_loss": 0.04266095906496048, "global_step": 1898, "epoch": 15, "lr": 9.990396188345633e-05} +{"train_loss": 0.02840231917798519, "global_step": 1899, "epoch": 15, "lr": 9.99038245830572e-05} +{"train_loss": 0.026219071820378304, "global_step": 1900, "epoch": 15, "lr": 9.990368718467727e-05} +{"train_loss": 0.03666810318827629, "global_step": 1901, "epoch": 15, "lr": 9.990354968831675e-05} +{"train_loss": 0.02913793921470642, "global_step": 1902, "epoch": 15, "lr": 9.990341209397595e-05} +{"train_loss": 0.031048920209042163, "global_step": 1903, "epoch": 15, "lr": 9.990327440165515e-05, "val_loss": 0.048115842044353485, "train_action_mse_error": 0.0049999370239675045} +{"train_loss": 0.02772550657391548, "global_step": 1904, "epoch": 16, "lr": 9.990313661135459e-05} +{"train_loss": 0.03491199389100075, "global_step": 1905, "epoch": 16, "lr": 9.990299872307454e-05} +{"train_loss": 0.022884901612997055, "global_step": 1906, "epoch": 16, "lr": 9.99028607368153e-05} +{"train_loss": 0.03752188757061958, "global_step": 1907, "epoch": 16, "lr": 9.990272265257712e-05} +{"train_loss": 0.034558605402708054, "global_step": 1908, "epoch": 16, "lr": 9.990258447036027e-05} +{"train_loss": 0.029155826196074486, "global_step": 1909, "epoch": 16, "lr": 9.990244619016504e-05} +{"train_loss": 0.029063215479254723, "global_step": 1910, "epoch": 16, "lr": 9.990230781199168e-05} +{"train_loss": 0.03257809206843376, "global_step": 1911, "epoch": 16, "lr": 9.990216933584047e-05} +{"train_loss": 0.02884533628821373, "global_step": 1912, "epoch": 16, "lr": 9.990203076171168e-05} +{"train_loss": 0.035960644483566284, "global_step": 1913, "epoch": 16, "lr": 9.990189208960557e-05} +{"train_loss": 0.03298190236091614, "global_step": 1914, "epoch": 16, "lr": 9.990175331952245e-05} +{"train_loss": 0.04183993488550186, "global_step": 1915, "epoch": 16, "lr": 9.990161445146256e-05} +{"train_loss": 0.03521856665611267, "global_step": 1916, "epoch": 16, "lr": 9.990147548542618e-05} +{"train_loss": 0.025219332426786423, "global_step": 1917, "epoch": 16, "lr": 9.990133642141359e-05} +{"train_loss": 0.029538389295339584, "global_step": 1918, "epoch": 16, "lr": 9.990119725942504e-05} +{"train_loss": 0.030227743089199066, "global_step": 1919, "epoch": 16, "lr": 9.990105799946083e-05} +{"train_loss": 0.03242809325456619, "global_step": 1920, "epoch": 16, "lr": 9.990091864152124e-05} +{"train_loss": 0.03334849327802658, "global_step": 1921, "epoch": 16, "lr": 9.99007791856065e-05} +{"train_loss": 0.02193486876785755, "global_step": 1922, "epoch": 16, "lr": 9.990063963171693e-05} +{"train_loss": 0.04086679220199585, "global_step": 1923, "epoch": 16, "lr": 9.990049997985278e-05} +{"train_loss": 0.03814788535237312, "global_step": 1924, "epoch": 16, "lr": 9.990036023001432e-05} +{"train_loss": 0.02922331914305687, "global_step": 1925, "epoch": 16, "lr": 9.990022038220186e-05} +{"train_loss": 0.033473074436187744, "global_step": 1926, "epoch": 16, "lr": 9.990008043641563e-05} +{"train_loss": 0.03115193173289299, "global_step": 1927, "epoch": 16, "lr": 9.989994039265592e-05} +{"train_loss": 0.033750712871551514, "global_step": 1928, "epoch": 16, "lr": 9.989980025092301e-05} +{"train_loss": 0.03038494475185871, "global_step": 1929, "epoch": 16, "lr": 9.989966001121717e-05} +{"train_loss": 0.03297364339232445, "global_step": 1930, "epoch": 16, "lr": 9.989951967353869e-05} +{"train_loss": 0.030898768454790115, "global_step": 1931, "epoch": 16, "lr": 9.989937923788782e-05} +{"train_loss": 0.031216436997056007, "global_step": 1932, "epoch": 16, "lr": 9.989923870426486e-05} +{"train_loss": 0.03779807314276695, "global_step": 1933, "epoch": 16, "lr": 9.989909807267009e-05} +{"train_loss": 0.027719654142856598, "global_step": 1934, "epoch": 16, "lr": 9.989895734310376e-05} +{"train_loss": 0.02941235527396202, "global_step": 1935, "epoch": 16, "lr": 9.989881651556614e-05} +{"train_loss": 0.03129645809531212, "global_step": 1936, "epoch": 16, "lr": 9.989867559005753e-05} +{"train_loss": 0.03452732786536217, "global_step": 1937, "epoch": 16, "lr": 9.98985345665782e-05} +{"train_loss": 0.04927713796496391, "global_step": 1938, "epoch": 16, "lr": 9.989839344512846e-05} +{"train_loss": 0.02757183648645878, "global_step": 1939, "epoch": 16, "lr": 9.989825222570852e-05} +{"train_loss": 0.04769786819815636, "global_step": 1940, "epoch": 16, "lr": 9.989811090831871e-05} +{"train_loss": 0.030881091952323914, "global_step": 1941, "epoch": 16, "lr": 9.989796949295928e-05} +{"train_loss": 0.03936050087213516, "global_step": 1942, "epoch": 16, "lr": 9.989782797963053e-05} +{"train_loss": 0.03236167132854462, "global_step": 1943, "epoch": 16, "lr": 9.989768636833272e-05} +{"train_loss": 0.02542927674949169, "global_step": 1944, "epoch": 16, "lr": 9.989754465906614e-05} +{"train_loss": 0.02616116590797901, "global_step": 1945, "epoch": 16, "lr": 9.989740285183105e-05} +{"train_loss": 0.03217028081417084, "global_step": 1946, "epoch": 16, "lr": 9.989726094662775e-05} +{"train_loss": 0.02663000114262104, "global_step": 1947, "epoch": 16, "lr": 9.98971189434565e-05} +{"train_loss": 0.021819716319441795, "global_step": 1948, "epoch": 16, "lr": 9.989697684231759e-05} +{"train_loss": 0.023389825597405434, "global_step": 1949, "epoch": 16, "lr": 9.98968346432113e-05} +{"train_loss": 0.041757963597774506, "global_step": 1950, "epoch": 16, "lr": 9.989669234613789e-05} +{"train_loss": 0.031069369986653328, "global_step": 1951, "epoch": 16, "lr": 9.989654995109768e-05} +{"train_loss": 0.022483520209789276, "global_step": 1952, "epoch": 16, "lr": 9.989640745809092e-05} +{"train_loss": 0.02631685696542263, "global_step": 1953, "epoch": 16, "lr": 9.989626486711788e-05} +{"train_loss": 0.03317035362124443, "global_step": 1954, "epoch": 16, "lr": 9.989612217817886e-05} +{"train_loss": 0.02465062588453293, "global_step": 1955, "epoch": 16, "lr": 9.989597939127414e-05} +{"train_loss": 0.03203582391142845, "global_step": 1956, "epoch": 16, "lr": 9.9895836506404e-05} +{"train_loss": 0.032795410603284836, "global_step": 1957, "epoch": 16, "lr": 9.989569352356871e-05} +{"train_loss": 0.04084305092692375, "global_step": 1958, "epoch": 16, "lr": 9.989555044276855e-05} +{"train_loss": 0.03547335043549538, "global_step": 1959, "epoch": 16, "lr": 9.989540726400382e-05} +{"train_loss": 0.030380280688405037, "global_step": 1960, "epoch": 16, "lr": 9.989526398727478e-05} +{"train_loss": 0.03095807135105133, "global_step": 1961, "epoch": 16, "lr": 9.989512061258171e-05} +{"train_loss": 0.032018303871154785, "global_step": 1962, "epoch": 16, "lr": 9.989497713992491e-05} +{"train_loss": 0.03217284381389618, "global_step": 1963, "epoch": 16, "lr": 9.989483356930466e-05} +{"train_loss": 0.026623869314789772, "global_step": 1964, "epoch": 16, "lr": 9.989468990072123e-05} +{"train_loss": 0.04189620167016983, "global_step": 1965, "epoch": 16, "lr": 9.98945461341749e-05} +{"train_loss": 0.022047899663448334, "global_step": 1966, "epoch": 16, "lr": 9.989440226966597e-05} +{"train_loss": 0.03598364070057869, "global_step": 1967, "epoch": 16, "lr": 9.98942583071947e-05} +{"train_loss": 0.02717364951968193, "global_step": 1968, "epoch": 16, "lr": 9.98941142467614e-05} +{"train_loss": 0.026509005576372147, "global_step": 1969, "epoch": 16, "lr": 9.989397008836631e-05} +{"train_loss": 0.029979586601257324, "global_step": 1970, "epoch": 16, "lr": 9.989382583200976e-05} +{"train_loss": 0.030696865171194077, "global_step": 1971, "epoch": 16, "lr": 9.989368147769203e-05} +{"train_loss": 0.02652958780527115, "global_step": 1972, "epoch": 16, "lr": 9.989353702541336e-05} +{"train_loss": 0.02588287740945816, "global_step": 1973, "epoch": 16, "lr": 9.989339247517406e-05} +{"train_loss": 0.02916172333061695, "global_step": 1974, "epoch": 16, "lr": 9.989324782697444e-05} +{"train_loss": 0.03421800956130028, "global_step": 1975, "epoch": 16, "lr": 9.989310308081473e-05} +{"train_loss": 0.033529579639434814, "global_step": 1976, "epoch": 16, "lr": 9.989295823669526e-05} +{"train_loss": 0.03734458237886429, "global_step": 1977, "epoch": 16, "lr": 9.989281329461629e-05} +{"train_loss": 0.03289911150932312, "global_step": 1978, "epoch": 16, "lr": 9.989266825457811e-05} +{"train_loss": 0.029750186949968338, "global_step": 1979, "epoch": 16, "lr": 9.9892523116581e-05} +{"train_loss": 0.02660660818219185, "global_step": 1980, "epoch": 16, "lr": 9.989237788062527e-05} +{"train_loss": 0.026259107515215874, "global_step": 1981, "epoch": 16, "lr": 9.989223254671116e-05} +{"train_loss": 0.024653960019350052, "global_step": 1982, "epoch": 16, "lr": 9.989208711483901e-05} +{"train_loss": 0.028991851955652237, "global_step": 1983, "epoch": 16, "lr": 9.989194158500906e-05} +{"train_loss": 0.03517003357410431, "global_step": 1984, "epoch": 16, "lr": 9.989179595722162e-05} +{"train_loss": 0.024466287344694138, "global_step": 1985, "epoch": 16, "lr": 9.989165023147696e-05} +{"train_loss": 0.023982850834727287, "global_step": 1986, "epoch": 16, "lr": 9.989150440777538e-05} +{"train_loss": 0.02473597601056099, "global_step": 1987, "epoch": 16, "lr": 9.989135848611717e-05} +{"train_loss": 0.02733151614665985, "global_step": 1988, "epoch": 16, "lr": 9.98912124665026e-05} +{"train_loss": 0.029079386964440346, "global_step": 1989, "epoch": 16, "lr": 9.989106634893195e-05} +{"train_loss": 0.03102429211139679, "global_step": 1990, "epoch": 16, "lr": 9.989092013340554e-05} +{"train_loss": 0.0266348198056221, "global_step": 1991, "epoch": 16, "lr": 9.989077381992363e-05} +{"train_loss": 0.03310270980000496, "global_step": 1992, "epoch": 16, "lr": 9.989062740848653e-05} +{"train_loss": 0.03313317522406578, "global_step": 1993, "epoch": 16, "lr": 9.989048089909449e-05} +{"train_loss": 0.022961433976888657, "global_step": 1994, "epoch": 16, "lr": 9.989033429174783e-05} +{"train_loss": 0.026878492906689644, "global_step": 1995, "epoch": 16, "lr": 9.989018758644683e-05} +{"train_loss": 0.02453765459358692, "global_step": 1996, "epoch": 16, "lr": 9.989004078319179e-05} +{"train_loss": 0.03661229461431503, "global_step": 1997, "epoch": 16, "lr": 9.988989388198298e-05} +{"train_loss": 0.029502922669053078, "global_step": 1998, "epoch": 16, "lr": 9.988974688282068e-05} +{"train_loss": 0.025746142491698265, "global_step": 1999, "epoch": 16, "lr": 9.98895997857052e-05} +{"train_loss": 0.029514016583561897, "global_step": 2000, "epoch": 16, "lr": 9.988945259063681e-05} +{"train_loss": 0.03313840553164482, "global_step": 2001, "epoch": 16, "lr": 9.988930529761582e-05} +{"train_loss": 0.025133801624178886, "global_step": 2002, "epoch": 16, "lr": 9.98891579066425e-05} +{"train_loss": 0.02625325694680214, "global_step": 2003, "epoch": 16, "lr": 9.988901041771716e-05} +{"train_loss": 0.03132624551653862, "global_step": 2004, "epoch": 16, "lr": 9.988886283084008e-05} +{"train_loss": 0.02915661223232746, "global_step": 2005, "epoch": 16, "lr": 9.988871514601155e-05} +{"train_loss": 0.02651544101536274, "global_step": 2006, "epoch": 16, "lr": 9.988856736323184e-05} +{"train_loss": 0.040664687752723694, "global_step": 2007, "epoch": 16, "lr": 9.988841948250127e-05} +{"train_loss": 0.029619142413139343, "global_step": 2008, "epoch": 16, "lr": 9.988827150382012e-05} +{"train_loss": 0.029039835557341576, "global_step": 2009, "epoch": 16, "lr": 9.988812342718868e-05} +{"train_loss": 0.025933165103197098, "global_step": 2010, "epoch": 16, "lr": 9.988797525260723e-05} +{"train_loss": 0.01989905908703804, "global_step": 2011, "epoch": 16, "lr": 9.988782698007605e-05} +{"train_loss": 0.02589782327413559, "global_step": 2012, "epoch": 16, "lr": 9.988767860959549e-05} +{"train_loss": 0.037782423198223114, "global_step": 2013, "epoch": 16, "lr": 9.988753014116579e-05} +{"train_loss": 0.02420451119542122, "global_step": 2014, "epoch": 16, "lr": 9.988738157478726e-05} +{"train_loss": 0.026790300384163857, "global_step": 2015, "epoch": 16, "lr": 9.988723291046017e-05} +{"train_loss": 0.030148886144161224, "global_step": 2016, "epoch": 16, "lr": 9.988708414818483e-05} +{"train_loss": 0.027662059292197227, "global_step": 2017, "epoch": 16, "lr": 9.988693528796154e-05} +{"train_loss": 0.0355529822409153, "global_step": 2018, "epoch": 16, "lr": 9.988678632979059e-05} +{"train_loss": 0.028659554198384285, "global_step": 2019, "epoch": 16, "lr": 9.988663727367224e-05} +{"train_loss": 0.02664363570511341, "global_step": 2020, "epoch": 16, "lr": 9.988648811960681e-05} +{"train_loss": 0.0356057807803154, "global_step": 2021, "epoch": 16, "lr": 9.988633886759461e-05} +{"train_loss": 0.030645291907947604, "global_step": 2022, "epoch": 16, "lr": 9.98861895176359e-05, "val_loss": 0.02563321962952614} +{"train_loss": 0.0301128551363945, "global_step": 2023, "epoch": 17, "lr": 9.988604006973099e-05} +{"train_loss": 0.02723754569888115, "global_step": 2024, "epoch": 17, "lr": 9.988589052388018e-05} +{"train_loss": 0.03090781904757023, "global_step": 2025, "epoch": 17, "lr": 9.988574088008373e-05} +{"train_loss": 0.02837345562875271, "global_step": 2026, "epoch": 17, "lr": 9.988559113834197e-05} +{"train_loss": 0.02678503468632698, "global_step": 2027, "epoch": 17, "lr": 9.988544129865518e-05} +{"train_loss": 0.027354693040251732, "global_step": 2028, "epoch": 17, "lr": 9.988529136102367e-05} +{"train_loss": 0.030779987573623657, "global_step": 2029, "epoch": 17, "lr": 9.98851413254477e-05} +{"train_loss": 0.025098389014601707, "global_step": 2030, "epoch": 17, "lr": 9.988499119192759e-05} +{"train_loss": 0.033920783549547195, "global_step": 2031, "epoch": 17, "lr": 9.988484096046363e-05} +{"train_loss": 0.03481532260775566, "global_step": 2032, "epoch": 17, "lr": 9.988469063105612e-05} +{"train_loss": 0.03670332953333855, "global_step": 2033, "epoch": 17, "lr": 9.988454020370534e-05} +{"train_loss": 0.04267485812306404, "global_step": 2034, "epoch": 17, "lr": 9.98843896784116e-05} +{"train_loss": 0.027043314650654793, "global_step": 2035, "epoch": 17, "lr": 9.988423905517519e-05} +{"train_loss": 0.02431456185877323, "global_step": 2036, "epoch": 17, "lr": 9.98840883339964e-05} +{"train_loss": 0.031800176948308945, "global_step": 2037, "epoch": 17, "lr": 9.988393751487555e-05} +{"train_loss": 0.03715314343571663, "global_step": 2038, "epoch": 17, "lr": 9.98837865978129e-05} +{"train_loss": 0.027247533202171326, "global_step": 2039, "epoch": 17, "lr": 9.988363558280876e-05} +{"train_loss": 0.040489278733730316, "global_step": 2040, "epoch": 17, "lr": 9.988348446986344e-05} +{"train_loss": 0.02809055708348751, "global_step": 2041, "epoch": 17, "lr": 9.988333325897722e-05} +{"train_loss": 0.03216855973005295, "global_step": 2042, "epoch": 17, "lr": 9.988318195015043e-05} +{"train_loss": 0.02904639206826687, "global_step": 2043, "epoch": 17, "lr": 9.988303054338331e-05} +{"train_loss": 0.0231922697275877, "global_step": 2044, "epoch": 17, "lr": 9.988287903867622e-05} +{"train_loss": 0.034580931067466736, "global_step": 2045, "epoch": 17, "lr": 9.98827274360294e-05} +{"train_loss": 0.028337404131889343, "global_step": 2046, "epoch": 17, "lr": 9.988257573544317e-05} +{"train_loss": 0.02466469071805477, "global_step": 2047, "epoch": 17, "lr": 9.988242393691784e-05} +{"train_loss": 0.031011655926704407, "global_step": 2048, "epoch": 17, "lr": 9.988227204045371e-05} +{"train_loss": 0.036418456584215164, "global_step": 2049, "epoch": 17, "lr": 9.988212004605107e-05} +{"train_loss": 0.032674390822649, "global_step": 2050, "epoch": 17, "lr": 9.988196795371021e-05} +{"train_loss": 0.02675444446504116, "global_step": 2051, "epoch": 17, "lr": 9.988181576343143e-05} +{"train_loss": 0.026563461869955063, "global_step": 2052, "epoch": 17, "lr": 9.988166347521504e-05} +{"train_loss": 0.023334922268986702, "global_step": 2053, "epoch": 17, "lr": 9.988151108906132e-05} +{"train_loss": 0.04058593139052391, "global_step": 2054, "epoch": 17, "lr": 9.98813586049706e-05} +{"train_loss": 0.02790152281522751, "global_step": 2055, "epoch": 17, "lr": 9.988120602294315e-05} +{"train_loss": 0.027902277186512947, "global_step": 2056, "epoch": 17, "lr": 9.988105334297929e-05} +{"train_loss": 0.03033669851720333, "global_step": 2057, "epoch": 17, "lr": 9.988090056507931e-05} +{"train_loss": 0.03502003103494644, "global_step": 2058, "epoch": 17, "lr": 9.98807476892435e-05} +{"train_loss": 0.027872692793607712, "global_step": 2059, "epoch": 17, "lr": 9.988059471547218e-05} +{"train_loss": 0.03570578992366791, "global_step": 2060, "epoch": 17, "lr": 9.988044164376564e-05} +{"train_loss": 0.03768419474363327, "global_step": 2061, "epoch": 17, "lr": 9.988028847412417e-05} +{"train_loss": 0.03601710870862007, "global_step": 2062, "epoch": 17, "lr": 9.988013520654809e-05} +{"train_loss": 0.03247326239943504, "global_step": 2063, "epoch": 17, "lr": 9.987998184103771e-05} +{"train_loss": 0.029480960220098495, "global_step": 2064, "epoch": 17, "lr": 9.987982837759328e-05} +{"train_loss": 0.023265235126018524, "global_step": 2065, "epoch": 17, "lr": 9.987967481621517e-05} +{"train_loss": 0.028262421488761902, "global_step": 2066, "epoch": 17, "lr": 9.987952115690363e-05} +{"train_loss": 0.024829579517245293, "global_step": 2067, "epoch": 17, "lr": 9.987936739965898e-05} +{"train_loss": 0.03312256187200546, "global_step": 2068, "epoch": 17, "lr": 9.987921354448153e-05} +{"train_loss": 0.03823599964380264, "global_step": 2069, "epoch": 17, "lr": 9.987905959137156e-05} +{"train_loss": 0.02318268083035946, "global_step": 2070, "epoch": 17, "lr": 9.987890554032939e-05} +{"train_loss": 0.0238628052175045, "global_step": 2071, "epoch": 17, "lr": 9.987875139135531e-05} +{"train_loss": 0.02850937284529209, "global_step": 2072, "epoch": 17, "lr": 9.987859714444965e-05} +{"train_loss": 0.025409039109945297, "global_step": 2073, "epoch": 17, "lr": 9.987844279961269e-05} +{"train_loss": 0.03213135898113251, "global_step": 2074, "epoch": 17, "lr": 9.987828835684472e-05} +{"train_loss": 0.029610993340611458, "global_step": 2075, "epoch": 17, "lr": 9.987813381614608e-05} +{"train_loss": 0.03060334175825119, "global_step": 2076, "epoch": 17, "lr": 9.987797917751703e-05} +{"train_loss": 0.031794141978025436, "global_step": 2077, "epoch": 17, "lr": 9.987782444095792e-05} +{"train_loss": 0.031228281557559967, "global_step": 2078, "epoch": 17, "lr": 9.9877669606469e-05} +{"train_loss": 0.0303509458899498, "global_step": 2079, "epoch": 17, "lr": 9.987751467405063e-05} +{"train_loss": 0.03768283128738403, "global_step": 2080, "epoch": 17, "lr": 9.987735964370309e-05} +{"train_loss": 0.02326149493455887, "global_step": 2081, "epoch": 17, "lr": 9.987720451542667e-05} +{"train_loss": 0.02046186849474907, "global_step": 2082, "epoch": 17, "lr": 9.987704928922169e-05} +{"train_loss": 0.03142810985445976, "global_step": 2083, "epoch": 17, "lr": 9.987689396508846e-05} +{"train_loss": 0.021825967356562614, "global_step": 2084, "epoch": 17, "lr": 9.987673854302728e-05} +{"train_loss": 0.03983726724982262, "global_step": 2085, "epoch": 17, "lr": 9.987658302303843e-05} +{"train_loss": 0.02052309736609459, "global_step": 2086, "epoch": 17, "lr": 9.987642740512226e-05} +{"train_loss": 0.029429620131850243, "global_step": 2087, "epoch": 17, "lr": 9.987627168927904e-05} +{"train_loss": 0.030406061559915543, "global_step": 2088, "epoch": 17, "lr": 9.987611587550909e-05} +{"train_loss": 0.028841974213719368, "global_step": 2089, "epoch": 17, "lr": 9.987595996381272e-05} +{"train_loss": 0.026005936786532402, "global_step": 2090, "epoch": 17, "lr": 9.987580395419022e-05} +{"train_loss": 0.02993915043771267, "global_step": 2091, "epoch": 17, "lr": 9.987564784664193e-05} +{"train_loss": 0.02543051354587078, "global_step": 2092, "epoch": 17, "lr": 9.987549164116811e-05} +{"train_loss": 0.02850426733493805, "global_step": 2093, "epoch": 17, "lr": 9.987533533776911e-05} +{"train_loss": 0.03212115913629532, "global_step": 2094, "epoch": 17, "lr": 9.987517893644521e-05} +{"train_loss": 0.0287468358874321, "global_step": 2095, "epoch": 17, "lr": 9.987502243719673e-05} +{"train_loss": 0.02839883789420128, "global_step": 2096, "epoch": 17, "lr": 9.987486584002397e-05} +{"train_loss": 0.032254237681627274, "global_step": 2097, "epoch": 17, "lr": 9.987470914492723e-05} +{"train_loss": 0.03445667773485184, "global_step": 2098, "epoch": 17, "lr": 9.987455235190683e-05} +{"train_loss": 0.028914228081703186, "global_step": 2099, "epoch": 17, "lr": 9.987439546096308e-05} +{"train_loss": 0.029018351808190346, "global_step": 2100, "epoch": 17, "lr": 9.987423847209628e-05} +{"train_loss": 0.02455691248178482, "global_step": 2101, "epoch": 17, "lr": 9.987408138530674e-05} +{"train_loss": 0.03343185409903526, "global_step": 2102, "epoch": 17, "lr": 9.987392420059475e-05} +{"train_loss": 0.024841826409101486, "global_step": 2103, "epoch": 17, "lr": 9.987376691796068e-05} +{"train_loss": 0.03350038453936577, "global_step": 2104, "epoch": 17, "lr": 9.987360953740477e-05} +{"train_loss": 0.028303237631917, "global_step": 2105, "epoch": 17, "lr": 9.987345205892736e-05} +{"train_loss": 0.02236936427652836, "global_step": 2106, "epoch": 17, "lr": 9.987329448252876e-05} +{"train_loss": 0.02944512665271759, "global_step": 2107, "epoch": 17, "lr": 9.987313680820926e-05} +{"train_loss": 0.03768303245306015, "global_step": 2108, "epoch": 17, "lr": 9.98729790359692e-05} +{"train_loss": 0.03090541437268257, "global_step": 2109, "epoch": 17, "lr": 9.987282116580888e-05} +{"train_loss": 0.027698349207639694, "global_step": 2110, "epoch": 17, "lr": 9.98726631977286e-05} +{"train_loss": 0.026508400216698647, "global_step": 2111, "epoch": 17, "lr": 9.987250513172865e-05} +{"train_loss": 0.02352898009121418, "global_step": 2112, "epoch": 17, "lr": 9.987234696780938e-05} +{"train_loss": 0.04271595925092697, "global_step": 2113, "epoch": 17, "lr": 9.987218870597108e-05} +{"train_loss": 0.02928733080625534, "global_step": 2114, "epoch": 17, "lr": 9.987203034621408e-05} +{"train_loss": 0.032304659485816956, "global_step": 2115, "epoch": 17, "lr": 9.987187188853866e-05} +{"train_loss": 0.026014043018221855, "global_step": 2116, "epoch": 17, "lr": 9.987171333294516e-05} +{"train_loss": 0.026428325101733208, "global_step": 2117, "epoch": 17, "lr": 9.987155467943387e-05} +{"train_loss": 0.031108375638723373, "global_step": 2118, "epoch": 17, "lr": 9.987139592800512e-05} +{"train_loss": 0.03596027195453644, "global_step": 2119, "epoch": 17, "lr": 9.98712370786592e-05} +{"train_loss": 0.030764900147914886, "global_step": 2120, "epoch": 17, "lr": 9.987107813139645e-05} +{"train_loss": 0.03106514737010002, "global_step": 2121, "epoch": 17, "lr": 9.987091908621716e-05} +{"train_loss": 0.026243453845381737, "global_step": 2122, "epoch": 17, "lr": 9.987075994312163e-05} +{"train_loss": 0.02891617640852928, "global_step": 2123, "epoch": 17, "lr": 9.987060070211021e-05} +{"train_loss": 0.03471985459327698, "global_step": 2124, "epoch": 17, "lr": 9.987044136318317e-05} +{"train_loss": 0.041822925209999084, "global_step": 2125, "epoch": 17, "lr": 9.987028192634088e-05} +{"train_loss": 0.0318605862557888, "global_step": 2126, "epoch": 17, "lr": 9.98701223915836e-05} +{"train_loss": 0.02805081196129322, "global_step": 2127, "epoch": 17, "lr": 9.986996275891167e-05} +{"train_loss": 0.030804648995399475, "global_step": 2128, "epoch": 17, "lr": 9.98698030283254e-05} +{"train_loss": 0.03206714242696762, "global_step": 2129, "epoch": 17, "lr": 9.986964319982508e-05} +{"train_loss": 0.029457557946443558, "global_step": 2130, "epoch": 17, "lr": 9.986948327341105e-05} +{"train_loss": 0.0361563116312027, "global_step": 2131, "epoch": 17, "lr": 9.986932324908363e-05} +{"train_loss": 0.02215595357120037, "global_step": 2132, "epoch": 17, "lr": 9.986916312684312e-05} +{"train_loss": 0.02358303591609001, "global_step": 2133, "epoch": 17, "lr": 9.986900290668982e-05} +{"train_loss": 0.02706785500049591, "global_step": 2134, "epoch": 17, "lr": 9.986884258862408e-05} +{"train_loss": 0.030769111588597298, "global_step": 2135, "epoch": 17, "lr": 9.986868217264617e-05} +{"train_loss": 0.023003675043582916, "global_step": 2136, "epoch": 17, "lr": 9.986852165875646e-05} +{"train_loss": 0.04043151065707207, "global_step": 2137, "epoch": 17, "lr": 9.986836104695523e-05} +{"train_loss": 0.03063397854566574, "global_step": 2138, "epoch": 17, "lr": 9.986820033724278e-05} +{"train_loss": 0.029954485595226288, "global_step": 2139, "epoch": 17, "lr": 9.986803952961946e-05} +{"train_loss": 0.02381640113890171, "global_step": 2140, "epoch": 17, "lr": 9.986787862408558e-05} +{"train_loss": 0.03003475013650766, "global_step": 2141, "epoch": 17, "lr": 9.986771762064143e-05, "val_loss": 0.04523021727800369} +{"train_loss": 0.0330611988902092, "global_step": 2142, "epoch": 18, "lr": 9.986755651928736e-05} +{"train_loss": 0.03265178203582764, "global_step": 2143, "epoch": 18, "lr": 9.986739532002365e-05} +{"train_loss": 0.029938004910945892, "global_step": 2144, "epoch": 18, "lr": 9.986723402285066e-05} +{"train_loss": 0.03176579996943474, "global_step": 2145, "epoch": 18, "lr": 9.986707262776867e-05} +{"train_loss": 0.022738376632332802, "global_step": 2146, "epoch": 18, "lr": 9.986691113477801e-05} +{"train_loss": 0.030757328495383263, "global_step": 2147, "epoch": 18, "lr": 9.9866749543879e-05} +{"train_loss": 0.027367431670427322, "global_step": 2148, "epoch": 18, "lr": 9.986658785507196e-05} +{"train_loss": 0.02270442061126232, "global_step": 2149, "epoch": 18, "lr": 9.98664260683572e-05} +{"train_loss": 0.030746689066290855, "global_step": 2150, "epoch": 18, "lr": 9.986626418373504e-05} +{"train_loss": 0.037013523280620575, "global_step": 2151, "epoch": 18, "lr": 9.986610220120579e-05} +{"train_loss": 0.028052257373929024, "global_step": 2152, "epoch": 18, "lr": 9.986594012076977e-05} +{"train_loss": 0.03603889420628548, "global_step": 2153, "epoch": 18, "lr": 9.986577794242733e-05} +{"train_loss": 0.02472197636961937, "global_step": 2154, "epoch": 18, "lr": 9.986561566617874e-05} +{"train_loss": 0.028418423607945442, "global_step": 2155, "epoch": 18, "lr": 9.986545329202435e-05} +{"train_loss": 0.03756019473075867, "global_step": 2156, "epoch": 18, "lr": 9.986529081996447e-05} +{"train_loss": 0.019215475767850876, "global_step": 2157, "epoch": 18, "lr": 9.986512824999941e-05} +{"train_loss": 0.030864091590046883, "global_step": 2158, "epoch": 18, "lr": 9.986496558212952e-05} +{"train_loss": 0.028984714299440384, "global_step": 2159, "epoch": 18, "lr": 9.986480281635508e-05} +{"train_loss": 0.022841621190309525, "global_step": 2160, "epoch": 18, "lr": 9.986463995267643e-05} +{"train_loss": 0.026777280494570732, "global_step": 2161, "epoch": 18, "lr": 9.986447699109389e-05} +{"train_loss": 0.02731279470026493, "global_step": 2162, "epoch": 18, "lr": 9.986431393160776e-05} +{"train_loss": 0.04205697029829025, "global_step": 2163, "epoch": 18, "lr": 9.98641507742184e-05} +{"train_loss": 0.02671002969145775, "global_step": 2164, "epoch": 18, "lr": 9.986398751892609e-05} +{"train_loss": 0.03177180513739586, "global_step": 2165, "epoch": 18, "lr": 9.986382416573117e-05} +{"train_loss": 0.030287757515907288, "global_step": 2166, "epoch": 18, "lr": 9.986366071463398e-05} +{"train_loss": 0.022170135751366615, "global_step": 2167, "epoch": 18, "lr": 9.98634971656348e-05} +{"train_loss": 0.03425164520740509, "global_step": 2168, "epoch": 18, "lr": 9.986333351873395e-05} +{"train_loss": 0.01855265349149704, "global_step": 2169, "epoch": 18, "lr": 9.986316977393181e-05} +{"train_loss": 0.026653273031115532, "global_step": 2170, "epoch": 18, "lr": 9.986300593122864e-05} +{"train_loss": 0.02537975087761879, "global_step": 2171, "epoch": 18, "lr": 9.98628419906248e-05} +{"train_loss": 0.03257888928055763, "global_step": 2172, "epoch": 18, "lr": 9.986267795212059e-05} +{"train_loss": 0.02762049064040184, "global_step": 2173, "epoch": 18, "lr": 9.986251381571635e-05} +{"train_loss": 0.03294331580400467, "global_step": 2174, "epoch": 18, "lr": 9.986234958141236e-05} +{"train_loss": 0.02659527398645878, "global_step": 2175, "epoch": 18, "lr": 9.986218524920901e-05} +{"train_loss": 0.030030662193894386, "global_step": 2176, "epoch": 18, "lr": 9.986202081910656e-05} +{"train_loss": 0.030418936163187027, "global_step": 2177, "epoch": 18, "lr": 9.986185629110538e-05} +{"train_loss": 0.026395924389362335, "global_step": 2178, "epoch": 18, "lr": 9.986169166520575e-05} +{"train_loss": 0.03192874416708946, "global_step": 2179, "epoch": 18, "lr": 9.986152694140803e-05} +{"train_loss": 0.028846999630331993, "global_step": 2180, "epoch": 18, "lr": 9.986136211971252e-05} +{"train_loss": 0.029491715133190155, "global_step": 2181, "epoch": 18, "lr": 9.986119720011955e-05} +{"train_loss": 0.020497765392065048, "global_step": 2182, "epoch": 18, "lr": 9.986103218262947e-05} +{"train_loss": 0.026210125535726547, "global_step": 2183, "epoch": 18, "lr": 9.986086706724256e-05} +{"train_loss": 0.032027918845415115, "global_step": 2184, "epoch": 18, "lr": 9.986070185395917e-05} +{"train_loss": 0.030215967446565628, "global_step": 2185, "epoch": 18, "lr": 9.98605365427796e-05} +{"train_loss": 0.027404334396123886, "global_step": 2186, "epoch": 18, "lr": 9.986037113370422e-05} +{"train_loss": 0.02137400023639202, "global_step": 2187, "epoch": 18, "lr": 9.986020562673333e-05} +{"train_loss": 0.029765283688902855, "global_step": 2188, "epoch": 18, "lr": 9.986004002186723e-05} +{"train_loss": 0.029116429388523102, "global_step": 2189, "epoch": 18, "lr": 9.985987431910628e-05} +{"train_loss": 0.03095041960477829, "global_step": 2190, "epoch": 18, "lr": 9.985970851845079e-05} +{"train_loss": 0.017717432230710983, "global_step": 2191, "epoch": 18, "lr": 9.985954261990109e-05} +{"train_loss": 0.030006788671016693, "global_step": 2192, "epoch": 18, "lr": 9.985937662345751e-05} +{"train_loss": 0.028002599254250526, "global_step": 2193, "epoch": 18, "lr": 9.985921052912038e-05} +{"train_loss": 0.024089494720101357, "global_step": 2194, "epoch": 18, "lr": 9.985904433689e-05} +{"train_loss": 0.027407025918364525, "global_step": 2195, "epoch": 18, "lr": 9.98588780467667e-05} +{"train_loss": 0.0316077284514904, "global_step": 2196, "epoch": 18, "lr": 9.985871165875084e-05} +{"train_loss": 0.025751270353794098, "global_step": 2197, "epoch": 18, "lr": 9.985854517284272e-05} +{"train_loss": 0.03167658671736717, "global_step": 2198, "epoch": 18, "lr": 9.985837858904268e-05} +{"train_loss": 0.03299468010663986, "global_step": 2199, "epoch": 18, "lr": 9.985821190735105e-05} +{"train_loss": 0.033074844628572464, "global_step": 2200, "epoch": 18, "lr": 9.985804512776813e-05} +{"train_loss": 0.0270039401948452, "global_step": 2201, "epoch": 18, "lr": 9.985787825029427e-05} +{"train_loss": 0.022812852635979652, "global_step": 2202, "epoch": 18, "lr": 9.985771127492979e-05} +{"train_loss": 0.03409411013126373, "global_step": 2203, "epoch": 18, "lr": 9.985754420167502e-05} +{"train_loss": 0.024409674108028412, "global_step": 2204, "epoch": 18, "lr": 9.985737703053028e-05} +{"train_loss": 0.03969651460647583, "global_step": 2205, "epoch": 18, "lr": 9.985720976149592e-05} +{"train_loss": 0.0392676517367363, "global_step": 2206, "epoch": 18, "lr": 9.985704239457226e-05} +{"train_loss": 0.02319520153105259, "global_step": 2207, "epoch": 18, "lr": 9.985687492975961e-05} +{"train_loss": 0.025334564968943596, "global_step": 2208, "epoch": 18, "lr": 9.985670736705832e-05} +{"train_loss": 0.03124532289803028, "global_step": 2209, "epoch": 18, "lr": 9.985653970646871e-05} +{"train_loss": 0.021346617490053177, "global_step": 2210, "epoch": 18, "lr": 9.985637194799111e-05} +{"train_loss": 0.03050915338099003, "global_step": 2211, "epoch": 18, "lr": 9.985620409162586e-05} +{"train_loss": 0.024655010551214218, "global_step": 2212, "epoch": 18, "lr": 9.985603613737326e-05} +{"train_loss": 0.02912159264087677, "global_step": 2213, "epoch": 18, "lr": 9.985586808523367e-05} +{"train_loss": 0.02494625188410282, "global_step": 2214, "epoch": 18, "lr": 9.985569993520741e-05} +{"train_loss": 0.02707255817949772, "global_step": 2215, "epoch": 18, "lr": 9.98555316872948e-05} +{"train_loss": 0.018650153651833534, "global_step": 2216, "epoch": 18, "lr": 9.985536334149618e-05} +{"train_loss": 0.02262018993496895, "global_step": 2217, "epoch": 18, "lr": 9.98551948978119e-05} +{"train_loss": 0.0321296826004982, "global_step": 2218, "epoch": 18, "lr": 9.985502635624226e-05} +{"train_loss": 0.021774224936962128, "global_step": 2219, "epoch": 18, "lr": 9.98548577167876e-05} +{"train_loss": 0.0315001979470253, "global_step": 2220, "epoch": 18, "lr": 9.985468897944826e-05} +{"train_loss": 0.03043672814965248, "global_step": 2221, "epoch": 18, "lr": 9.985452014422456e-05} +{"train_loss": 0.02412932738661766, "global_step": 2222, "epoch": 18, "lr": 9.985435121111684e-05} +{"train_loss": 0.02258414588868618, "global_step": 2223, "epoch": 18, "lr": 9.98541821801254e-05} +{"train_loss": 0.02648949809372425, "global_step": 2224, "epoch": 18, "lr": 9.985401305125064e-05} +{"train_loss": 0.0322713740170002, "global_step": 2225, "epoch": 18, "lr": 9.985384382449283e-05} +{"train_loss": 0.021493759006261826, "global_step": 2226, "epoch": 18, "lr": 9.985367449985233e-05} +{"train_loss": 0.024984514340758324, "global_step": 2227, "epoch": 18, "lr": 9.985350507732947e-05} +{"train_loss": 0.027247950434684753, "global_step": 2228, "epoch": 18, "lr": 9.985333555692457e-05} +{"train_loss": 0.02917676791548729, "global_step": 2229, "epoch": 18, "lr": 9.985316593863796e-05} +{"train_loss": 0.0335630439221859, "global_step": 2230, "epoch": 18, "lr": 9.985299622247e-05} +{"train_loss": 0.03583480790257454, "global_step": 2231, "epoch": 18, "lr": 9.985282640842102e-05} +{"train_loss": 0.022186698392033577, "global_step": 2232, "epoch": 18, "lr": 9.985265649649132e-05} +{"train_loss": 0.019238371402025223, "global_step": 2233, "epoch": 18, "lr": 9.985248648668127e-05} +{"train_loss": 0.024195829406380653, "global_step": 2234, "epoch": 18, "lr": 9.985231637899117e-05} +{"train_loss": 0.030093589797616005, "global_step": 2235, "epoch": 18, "lr": 9.98521461734214e-05} +{"train_loss": 0.0348338857293129, "global_step": 2236, "epoch": 18, "lr": 9.985197586997224e-05} +{"train_loss": 0.03152371197938919, "global_step": 2237, "epoch": 18, "lr": 9.985180546864406e-05} +{"train_loss": 0.024201830849051476, "global_step": 2238, "epoch": 18, "lr": 9.98516349694372e-05} +{"train_loss": 0.0349903330206871, "global_step": 2239, "epoch": 18, "lr": 9.985146437235195e-05} +{"train_loss": 0.026589877903461456, "global_step": 2240, "epoch": 18, "lr": 9.98512936773887e-05} +{"train_loss": 0.02150542289018631, "global_step": 2241, "epoch": 18, "lr": 9.985112288454777e-05} +{"train_loss": 0.024759341031312943, "global_step": 2242, "epoch": 18, "lr": 9.985095199382946e-05} +{"train_loss": 0.03493940457701683, "global_step": 2243, "epoch": 18, "lr": 9.985078100523415e-05} +{"train_loss": 0.03064211830496788, "global_step": 2244, "epoch": 18, "lr": 9.985060991876214e-05} +{"train_loss": 0.02462192438542843, "global_step": 2245, "epoch": 18, "lr": 9.98504387344138e-05} +{"train_loss": 0.02859504520893097, "global_step": 2246, "epoch": 18, "lr": 9.985026745218944e-05} +{"train_loss": 0.0284742321819067, "global_step": 2247, "epoch": 18, "lr": 9.98500960720894e-05} +{"train_loss": 0.0301298089325428, "global_step": 2248, "epoch": 18, "lr": 9.984992459411404e-05} +{"train_loss": 0.02682751975953579, "global_step": 2249, "epoch": 18, "lr": 9.984975301826367e-05} +{"train_loss": 0.025509869679808617, "global_step": 2250, "epoch": 18, "lr": 9.984958134453863e-05} +{"train_loss": 0.025463230907917023, "global_step": 2251, "epoch": 18, "lr": 9.984940957293927e-05} +{"train_loss": 0.020657939836382866, "global_step": 2252, "epoch": 18, "lr": 9.98492377034659e-05} +{"train_loss": 0.020534325391054153, "global_step": 2253, "epoch": 18, "lr": 9.98490657361189e-05} +{"train_loss": 0.02208571881055832, "global_step": 2254, "epoch": 18, "lr": 9.984889367089858e-05} +{"train_loss": 0.04469900578260422, "global_step": 2255, "epoch": 18, "lr": 9.98487215078053e-05} +{"train_loss": 0.03821953386068344, "global_step": 2256, "epoch": 18, "lr": 9.984854924683934e-05} +{"train_loss": 0.031753480434417725, "global_step": 2257, "epoch": 18, "lr": 9.984837688800111e-05} +{"train_loss": 0.022626925259828568, "global_step": 2258, "epoch": 18, "lr": 9.98482044312909e-05} +{"train_loss": 0.02604217268526554, "global_step": 2259, "epoch": 18, "lr": 9.984803187670909e-05} +{"train_loss": 0.028241358994811522, "global_step": 2260, "epoch": 18, "lr": 9.984785922425596e-05, "val_loss": 0.03870818018913269} +{"train_loss": 0.020780231803655624, "global_step": 2261, "epoch": 19, "lr": 9.984768647393192e-05} +{"train_loss": 0.03538227826356888, "global_step": 2262, "epoch": 19, "lr": 9.984751362573726e-05} +{"train_loss": 0.021559542044997215, "global_step": 2263, "epoch": 19, "lr": 9.984734067967233e-05} +{"train_loss": 0.028919365257024765, "global_step": 2264, "epoch": 19, "lr": 9.984716763573747e-05} +{"train_loss": 0.028894731774926186, "global_step": 2265, "epoch": 19, "lr": 9.984699449393302e-05} +{"train_loss": 0.02440929040312767, "global_step": 2266, "epoch": 19, "lr": 9.984682125425933e-05} +{"train_loss": 0.027314217761158943, "global_step": 2267, "epoch": 19, "lr": 9.984664791671672e-05} +{"train_loss": 0.027196591719985008, "global_step": 2268, "epoch": 19, "lr": 9.984647448130556e-05} +{"train_loss": 0.024779552593827248, "global_step": 2269, "epoch": 19, "lr": 9.984630094802616e-05} +{"train_loss": 0.02380053512752056, "global_step": 2270, "epoch": 19, "lr": 9.984612731687887e-05} +{"train_loss": 0.03439341112971306, "global_step": 2271, "epoch": 19, "lr": 9.984595358786404e-05} +{"train_loss": 0.024000534787774086, "global_step": 2272, "epoch": 19, "lr": 9.984577976098201e-05} +{"train_loss": 0.030746201053261757, "global_step": 2273, "epoch": 19, "lr": 9.98456058362331e-05} +{"train_loss": 0.024603823199868202, "global_step": 2274, "epoch": 19, "lr": 9.984543181361769e-05} +{"train_loss": 0.022770175710320473, "global_step": 2275, "epoch": 19, "lr": 9.984525769313608e-05} +{"train_loss": 0.02505352348089218, "global_step": 2276, "epoch": 19, "lr": 9.984508347478865e-05} +{"train_loss": 0.031250208616256714, "global_step": 2277, "epoch": 19, "lr": 9.984490915857572e-05} +{"train_loss": 0.02936381846666336, "global_step": 2278, "epoch": 19, "lr": 9.984473474449763e-05} +{"train_loss": 0.02618955448269844, "global_step": 2279, "epoch": 19, "lr": 9.984456023255473e-05} +{"train_loss": 0.028582684695720673, "global_step": 2280, "epoch": 19, "lr": 9.984438562274736e-05} +{"train_loss": 0.02509496919810772, "global_step": 2281, "epoch": 19, "lr": 9.984421091507585e-05} +{"train_loss": 0.03539628908038139, "global_step": 2282, "epoch": 19, "lr": 9.984403610954058e-05} +{"train_loss": 0.03461071103811264, "global_step": 2283, "epoch": 19, "lr": 9.984386120614187e-05} +{"train_loss": 0.02756831794977188, "global_step": 2284, "epoch": 19, "lr": 9.984368620488005e-05} +{"train_loss": 0.02978118695318699, "global_step": 2285, "epoch": 19, "lr": 9.984351110575548e-05} +{"train_loss": 0.023031970486044884, "global_step": 2286, "epoch": 19, "lr": 9.98433359087685e-05} +{"train_loss": 0.029282942414283752, "global_step": 2287, "epoch": 19, "lr": 9.984316061391946e-05} +{"train_loss": 0.02741633728146553, "global_step": 2288, "epoch": 19, "lr": 9.984298522120869e-05} +{"train_loss": 0.03326607868075371, "global_step": 2289, "epoch": 19, "lr": 9.984280973063656e-05} +{"train_loss": 0.02604062296450138, "global_step": 2290, "epoch": 19, "lr": 9.984263414220339e-05} +{"train_loss": 0.03464650362730026, "global_step": 2291, "epoch": 19, "lr": 9.984245845590953e-05} +{"train_loss": 0.023518389090895653, "global_step": 2292, "epoch": 19, "lr": 9.984228267175533e-05} +{"train_loss": 0.030176904052495956, "global_step": 2293, "epoch": 19, "lr": 9.984210678974112e-05} +{"train_loss": 0.02873811684548855, "global_step": 2294, "epoch": 19, "lr": 9.984193080986728e-05} +{"train_loss": 0.033263109624385834, "global_step": 2295, "epoch": 19, "lr": 9.984175473213412e-05} +{"train_loss": 0.028752774000167847, "global_step": 2296, "epoch": 19, "lr": 9.984157855654201e-05} +{"train_loss": 0.031311072409152985, "global_step": 2297, "epoch": 19, "lr": 9.984140228309127e-05} +{"train_loss": 0.02357892319560051, "global_step": 2298, "epoch": 19, "lr": 9.984122591178228e-05} +{"train_loss": 0.027664020657539368, "global_step": 2299, "epoch": 19, "lr": 9.984104944261535e-05} +{"train_loss": 0.02122240886092186, "global_step": 2300, "epoch": 19, "lr": 9.984087287559085e-05} +{"train_loss": 0.03341853618621826, "global_step": 2301, "epoch": 19, "lr": 9.984069621070913e-05} +{"train_loss": 0.02706814743578434, "global_step": 2302, "epoch": 19, "lr": 9.984051944797052e-05} +{"train_loss": 0.02744462713599205, "global_step": 2303, "epoch": 19, "lr": 9.984034258737539e-05} +{"train_loss": 0.01876792125403881, "global_step": 2304, "epoch": 19, "lr": 9.984016562892405e-05} +{"train_loss": 0.023810485377907753, "global_step": 2305, "epoch": 19, "lr": 9.983998857261688e-05} +{"train_loss": 0.020085716620087624, "global_step": 2306, "epoch": 19, "lr": 9.98398114184542e-05} +{"train_loss": 0.01862754300236702, "global_step": 2307, "epoch": 19, "lr": 9.98396341664364e-05} +{"train_loss": 0.02266055904328823, "global_step": 2308, "epoch": 19, "lr": 9.983945681656379e-05} +{"train_loss": 0.02563035674393177, "global_step": 2309, "epoch": 19, "lr": 9.983927936883673e-05} +{"train_loss": 0.028928633779287338, "global_step": 2310, "epoch": 19, "lr": 9.983910182325556e-05} +{"train_loss": 0.03270644322037697, "global_step": 2311, "epoch": 19, "lr": 9.983892417982066e-05} +{"train_loss": 0.020528163760900497, "global_step": 2312, "epoch": 19, "lr": 9.983874643853235e-05} +{"train_loss": 0.02887422777712345, "global_step": 2313, "epoch": 19, "lr": 9.983856859939098e-05} +{"train_loss": 0.02425968274474144, "global_step": 2314, "epoch": 19, "lr": 9.983839066239691e-05} +{"train_loss": 0.030808791518211365, "global_step": 2315, "epoch": 19, "lr": 9.983821262755047e-05} +{"train_loss": 0.026530100032687187, "global_step": 2316, "epoch": 19, "lr": 9.983803449485205e-05} +{"train_loss": 0.02850157581269741, "global_step": 2317, "epoch": 19, "lr": 9.983785626430195e-05} +{"train_loss": 0.03057265654206276, "global_step": 2318, "epoch": 19, "lr": 9.983767793590056e-05} +{"train_loss": 0.027662815526127815, "global_step": 2319, "epoch": 19, "lr": 9.98374995096482e-05} +{"train_loss": 0.031726837158203125, "global_step": 2320, "epoch": 19, "lr": 9.983732098554523e-05} +{"train_loss": 0.031815122812986374, "global_step": 2321, "epoch": 19, "lr": 9.983714236359202e-05} +{"train_loss": 0.036281999200582504, "global_step": 2322, "epoch": 19, "lr": 9.983696364378892e-05} +{"train_loss": 0.026972005143761635, "global_step": 2323, "epoch": 19, "lr": 9.983678482613623e-05} +{"train_loss": 0.025723544880747795, "global_step": 2324, "epoch": 19, "lr": 9.983660591063437e-05} +{"train_loss": 0.02371140383183956, "global_step": 2325, "epoch": 19, "lr": 9.983642689728363e-05} +{"train_loss": 0.02849412150681019, "global_step": 2326, "epoch": 19, "lr": 9.98362477860844e-05} +{"train_loss": 0.026658309623599052, "global_step": 2327, "epoch": 19, "lr": 9.983606857703702e-05} +{"train_loss": 0.027661854401230812, "global_step": 2328, "epoch": 19, "lr": 9.983588927014185e-05} +{"train_loss": 0.028504716232419014, "global_step": 2329, "epoch": 19, "lr": 9.983570986539925e-05} +{"train_loss": 0.0247615035623312, "global_step": 2330, "epoch": 19, "lr": 9.983553036280953e-05} +{"train_loss": 0.027057895436882973, "global_step": 2331, "epoch": 19, "lr": 9.98353507623731e-05} +{"train_loss": 0.02954516001045704, "global_step": 2332, "epoch": 19, "lr": 9.983517106409024e-05} +{"train_loss": 0.026331838220357895, "global_step": 2333, "epoch": 19, "lr": 9.983499126796138e-05} +{"train_loss": 0.02391635999083519, "global_step": 2334, "epoch": 19, "lr": 9.983481137398683e-05} +{"train_loss": 0.020787296816706657, "global_step": 2335, "epoch": 19, "lr": 9.983463138216696e-05} +{"train_loss": 0.025350796058773994, "global_step": 2336, "epoch": 19, "lr": 9.983445129250211e-05} +{"train_loss": 0.02859935350716114, "global_step": 2337, "epoch": 19, "lr": 9.983427110499263e-05} +{"train_loss": 0.03059827722609043, "global_step": 2338, "epoch": 19, "lr": 9.983409081963888e-05} +{"train_loss": 0.028624624013900757, "global_step": 2339, "epoch": 19, "lr": 9.983391043644123e-05} +{"train_loss": 0.03472526744008064, "global_step": 2340, "epoch": 19, "lr": 9.983372995540002e-05} +{"train_loss": 0.035848669707775116, "global_step": 2341, "epoch": 19, "lr": 9.983354937651558e-05} +{"train_loss": 0.02236933819949627, "global_step": 2342, "epoch": 19, "lr": 9.983336869978832e-05} +{"train_loss": 0.02900294028222561, "global_step": 2343, "epoch": 19, "lr": 9.983318792521856e-05} +{"train_loss": 0.02665312960743904, "global_step": 2344, "epoch": 19, "lr": 9.983300705280665e-05} +{"train_loss": 0.030703537166118622, "global_step": 2345, "epoch": 19, "lr": 9.983282608255296e-05} +{"train_loss": 0.02917597070336342, "global_step": 2346, "epoch": 19, "lr": 9.983264501445784e-05} +{"train_loss": 0.0251157246530056, "global_step": 2347, "epoch": 19, "lr": 9.983246384852165e-05} +{"train_loss": 0.03362539783120155, "global_step": 2348, "epoch": 19, "lr": 9.983228258474472e-05} +{"train_loss": 0.027322541922330856, "global_step": 2349, "epoch": 19, "lr": 9.983210122312744e-05} +{"train_loss": 0.021733561530709267, "global_step": 2350, "epoch": 19, "lr": 9.983191976367016e-05} +{"train_loss": 0.03405958414077759, "global_step": 2351, "epoch": 19, "lr": 9.983173820637324e-05} +{"train_loss": 0.031241973862051964, "global_step": 2352, "epoch": 19, "lr": 9.983155655123701e-05} +{"train_loss": 0.031387217342853546, "global_step": 2353, "epoch": 19, "lr": 9.983137479826183e-05} +{"train_loss": 0.027892300859093666, "global_step": 2354, "epoch": 19, "lr": 9.98311929474481e-05} +{"train_loss": 0.031028732657432556, "global_step": 2355, "epoch": 19, "lr": 9.983101099879611e-05} +{"train_loss": 0.01911894418299198, "global_step": 2356, "epoch": 19, "lr": 9.983082895230628e-05} +{"train_loss": 0.027445584535598755, "global_step": 2357, "epoch": 19, "lr": 9.983064680797893e-05} +{"train_loss": 0.025093821808695793, "global_step": 2358, "epoch": 19, "lr": 9.983046456581445e-05} +{"train_loss": 0.029410073533654213, "global_step": 2359, "epoch": 19, "lr": 9.983028222581314e-05} +{"train_loss": 0.031186815351247787, "global_step": 2360, "epoch": 19, "lr": 9.983009978797542e-05} +{"train_loss": 0.02142444998025894, "global_step": 2361, "epoch": 19, "lr": 9.98299172523016e-05} +{"train_loss": 0.031189199537038803, "global_step": 2362, "epoch": 19, "lr": 9.982973461879208e-05} +{"train_loss": 0.022363223135471344, "global_step": 2363, "epoch": 19, "lr": 9.982955188744721e-05} +{"train_loss": 0.03600301221013069, "global_step": 2364, "epoch": 19, "lr": 9.982936905826731e-05} +{"train_loss": 0.02448933757841587, "global_step": 2365, "epoch": 19, "lr": 9.982918613125278e-05} +{"train_loss": 0.025586236268281937, "global_step": 2366, "epoch": 19, "lr": 9.982900310640398e-05} +{"train_loss": 0.02069034054875374, "global_step": 2367, "epoch": 19, "lr": 9.982881998372124e-05} +{"train_loss": 0.02474972791969776, "global_step": 2368, "epoch": 19, "lr": 9.982863676320493e-05} +{"train_loss": 0.02249174565076828, "global_step": 2369, "epoch": 19, "lr": 9.982845344485543e-05} +{"train_loss": 0.028775323182344437, "global_step": 2370, "epoch": 19, "lr": 9.982827002867308e-05} +{"train_loss": 0.02248447760939598, "global_step": 2371, "epoch": 19, "lr": 9.982808651465825e-05} +{"train_loss": 0.027889147400856018, "global_step": 2372, "epoch": 19, "lr": 9.982790290281128e-05} +{"train_loss": 0.03659164905548096, "global_step": 2373, "epoch": 19, "lr": 9.982771919313256e-05} +{"train_loss": 0.02065598964691162, "global_step": 2374, "epoch": 19, "lr": 9.982753538562244e-05} +{"train_loss": 0.029051275923848152, "global_step": 2375, "epoch": 19, "lr": 9.982735148028126e-05} +{"train_loss": 0.021968858316540718, "global_step": 2376, "epoch": 19, "lr": 9.98271674771094e-05} +{"train_loss": 0.025922829285264015, "global_step": 2377, "epoch": 19, "lr": 9.982698337610723e-05} +{"train_loss": 0.02950940653681755, "global_step": 2378, "epoch": 19, "lr": 9.982679917727511e-05} +{"train_loss": 0.027529772167571454, "global_step": 2379, "epoch": 19, "lr": 9.982661488061337e-05, "val_loss": 0.03699544817209244} +{"train_loss": 0.027207711711525917, "global_step": 2380, "epoch": 20, "lr": 9.982643048612242e-05} +{"train_loss": 0.029016107320785522, "global_step": 2381, "epoch": 20, "lr": 9.982624599380259e-05} +{"train_loss": 0.027227872982621193, "global_step": 2382, "epoch": 20, "lr": 9.982606140365423e-05} +{"train_loss": 0.026054522022604942, "global_step": 2383, "epoch": 20, "lr": 9.982587671567773e-05} +{"train_loss": 0.022938592359423637, "global_step": 2384, "epoch": 20, "lr": 9.982569192987345e-05} +{"train_loss": 0.024935539811849594, "global_step": 2385, "epoch": 20, "lr": 9.982550704624176e-05} +{"train_loss": 0.025777537375688553, "global_step": 2386, "epoch": 20, "lr": 9.982532206478299e-05} +{"train_loss": 0.024935970082879066, "global_step": 2387, "epoch": 20, "lr": 9.982513698549753e-05} +{"train_loss": 0.01545907836407423, "global_step": 2388, "epoch": 20, "lr": 9.982495180838574e-05} +{"train_loss": 0.022059792652726173, "global_step": 2389, "epoch": 20, "lr": 9.982476653344797e-05} +{"train_loss": 0.025530854240059853, "global_step": 2390, "epoch": 20, "lr": 9.982458116068461e-05} +{"train_loss": 0.023780399933457375, "global_step": 2391, "epoch": 20, "lr": 9.982439569009599e-05} +{"train_loss": 0.024360347539186478, "global_step": 2392, "epoch": 20, "lr": 9.98242101216825e-05} +{"train_loss": 0.026255566626787186, "global_step": 2393, "epoch": 20, "lr": 9.98240244554445e-05} +{"train_loss": 0.022362330928444862, "global_step": 2394, "epoch": 20, "lr": 9.982383869138236e-05} +{"train_loss": 0.02101680263876915, "global_step": 2395, "epoch": 20, "lr": 9.982365282949642e-05} +{"train_loss": 0.03157241269946098, "global_step": 2396, "epoch": 20, "lr": 9.982346686978705e-05} +{"train_loss": 0.02260536514222622, "global_step": 2397, "epoch": 20, "lr": 9.982328081225464e-05} +{"train_loss": 0.020633546635508537, "global_step": 2398, "epoch": 20, "lr": 9.982309465689954e-05} +{"train_loss": 0.02535218745470047, "global_step": 2399, "epoch": 20, "lr": 9.982290840372212e-05} +{"train_loss": 0.026182018220424652, "global_step": 2400, "epoch": 20, "lr": 9.982272205272274e-05} +{"train_loss": 0.02213263139128685, "global_step": 2401, "epoch": 20, "lr": 9.982253560390177e-05} +{"train_loss": 0.03065672144293785, "global_step": 2402, "epoch": 20, "lr": 9.982234905725959e-05} +{"train_loss": 0.021581418812274933, "global_step": 2403, "epoch": 20, "lr": 9.982216241279652e-05} +{"train_loss": 0.022203143686056137, "global_step": 2404, "epoch": 20, "lr": 9.982197567051297e-05} +{"train_loss": 0.034495461732149124, "global_step": 2405, "epoch": 20, "lr": 9.98217888304093e-05} +{"train_loss": 0.018479853868484497, "global_step": 2406, "epoch": 20, "lr": 9.982160189248584e-05} +{"train_loss": 0.026400262489914894, "global_step": 2407, "epoch": 20, "lr": 9.982141485674301e-05} +{"train_loss": 0.025649894028902054, "global_step": 2408, "epoch": 20, "lr": 9.982122772318116e-05} +{"train_loss": 0.021515270695090294, "global_step": 2409, "epoch": 20, "lr": 9.982104049180065e-05} +{"train_loss": 0.03580205887556076, "global_step": 2410, "epoch": 20, "lr": 9.982085316260183e-05} +{"train_loss": 0.02322854846715927, "global_step": 2411, "epoch": 20, "lr": 9.982066573558511e-05} +{"train_loss": 0.02516799047589302, "global_step": 2412, "epoch": 20, "lr": 9.982047821075083e-05} +{"train_loss": 0.022614462301135063, "global_step": 2413, "epoch": 20, "lr": 9.982029058809936e-05} +{"train_loss": 0.02759810909628868, "global_step": 2414, "epoch": 20, "lr": 9.982010286763108e-05} +{"train_loss": 0.02355317957699299, "global_step": 2415, "epoch": 20, "lr": 9.981991504934634e-05} +{"train_loss": 0.02561270073056221, "global_step": 2416, "epoch": 20, "lr": 9.981972713324552e-05} +{"train_loss": 0.02208399586379528, "global_step": 2417, "epoch": 20, "lr": 9.9819539119329e-05} +{"train_loss": 0.02307109907269478, "global_step": 2418, "epoch": 20, "lr": 9.981935100759712e-05} +{"train_loss": 0.02791246399283409, "global_step": 2419, "epoch": 20, "lr": 9.981916279805028e-05} +{"train_loss": 0.0357184074819088, "global_step": 2420, "epoch": 20, "lr": 9.981897449068884e-05} +{"train_loss": 0.03802933171391487, "global_step": 2421, "epoch": 20, "lr": 9.981878608551316e-05} +{"train_loss": 0.018135488033294678, "global_step": 2422, "epoch": 20, "lr": 9.981859758252361e-05} +{"train_loss": 0.021890873089432716, "global_step": 2423, "epoch": 20, "lr": 9.981840898172057e-05} +{"train_loss": 0.022693030536174774, "global_step": 2424, "epoch": 20, "lr": 9.98182202831044e-05} +{"train_loss": 0.028811834752559662, "global_step": 2425, "epoch": 20, "lr": 9.981803148667548e-05} +{"train_loss": 0.032353419810533524, "global_step": 2426, "epoch": 20, "lr": 9.981784259243419e-05} +{"train_loss": 0.020251154899597168, "global_step": 2427, "epoch": 20, "lr": 9.981765360038087e-05} +{"train_loss": 0.023163098841905594, "global_step": 2428, "epoch": 20, "lr": 9.981746451051592e-05} +{"train_loss": 0.02745642513036728, "global_step": 2429, "epoch": 20, "lr": 9.98172753228397e-05} +{"train_loss": 0.030144188553094864, "global_step": 2430, "epoch": 20, "lr": 9.981708603735259e-05} +{"train_loss": 0.03035004995763302, "global_step": 2431, "epoch": 20, "lr": 9.981689665405494e-05} +{"train_loss": 0.025576097890734673, "global_step": 2432, "epoch": 20, "lr": 9.981670717294713e-05} +{"train_loss": 0.026770971715450287, "global_step": 2433, "epoch": 20, "lr": 9.981651759402955e-05} +{"train_loss": 0.02751031704246998, "global_step": 2434, "epoch": 20, "lr": 9.981632791730256e-05} +{"train_loss": 0.02305024489760399, "global_step": 2435, "epoch": 20, "lr": 9.981613814276653e-05} +{"train_loss": 0.022083615884184837, "global_step": 2436, "epoch": 20, "lr": 9.981594827042183e-05} +{"train_loss": 0.03086574748158455, "global_step": 2437, "epoch": 20, "lr": 9.981575830026884e-05} +{"train_loss": 0.04081990197300911, "global_step": 2438, "epoch": 20, "lr": 9.981556823230793e-05} +{"train_loss": 0.02678034082055092, "global_step": 2439, "epoch": 20, "lr": 9.981537806653949e-05} +{"train_loss": 0.02991200052201748, "global_step": 2440, "epoch": 20, "lr": 9.981518780296386e-05} +{"train_loss": 0.03030821681022644, "global_step": 2441, "epoch": 20, "lr": 9.981499744158143e-05} +{"train_loss": 0.023485787212848663, "global_step": 2442, "epoch": 20, "lr": 9.981480698239259e-05} +{"train_loss": 0.019041771069169044, "global_step": 2443, "epoch": 20, "lr": 9.981461642539768e-05} +{"train_loss": 0.03140134736895561, "global_step": 2444, "epoch": 20, "lr": 9.98144257705971e-05} +{"train_loss": 0.02224954403936863, "global_step": 2445, "epoch": 20, "lr": 9.981423501799121e-05} +{"train_loss": 0.02925281785428524, "global_step": 2446, "epoch": 20, "lr": 9.98140441675804e-05} +{"train_loss": 0.033122528344392776, "global_step": 2447, "epoch": 20, "lr": 9.981385321936503e-05} +{"train_loss": 0.03274425119161606, "global_step": 2448, "epoch": 20, "lr": 9.98136621733455e-05} +{"train_loss": 0.02803715318441391, "global_step": 2449, "epoch": 20, "lr": 9.981347102952214e-05} +{"train_loss": 0.025795700028538704, "global_step": 2450, "epoch": 20, "lr": 9.981327978789537e-05} +{"train_loss": 0.02143501490354538, "global_step": 2451, "epoch": 20, "lr": 9.981308844846553e-05} +{"train_loss": 0.020166153088212013, "global_step": 2452, "epoch": 20, "lr": 9.981289701123303e-05} +{"train_loss": 0.03801201283931732, "global_step": 2453, "epoch": 20, "lr": 9.981270547619822e-05} +{"train_loss": 0.02691549062728882, "global_step": 2454, "epoch": 20, "lr": 9.981251384336148e-05} +{"train_loss": 0.0243703480809927, "global_step": 2455, "epoch": 20, "lr": 9.98123221127232e-05} +{"train_loss": 0.033154238015413284, "global_step": 2456, "epoch": 20, "lr": 9.981213028428374e-05} +{"train_loss": 0.03489451855421066, "global_step": 2457, "epoch": 20, "lr": 9.98119383580435e-05} +{"train_loss": 0.024405701085925102, "global_step": 2458, "epoch": 20, "lr": 9.981174633400282e-05} +{"train_loss": 0.02403280697762966, "global_step": 2459, "epoch": 20, "lr": 9.981155421216211e-05} +{"train_loss": 0.0341973640024662, "global_step": 2460, "epoch": 20, "lr": 9.981136199252173e-05} +{"train_loss": 0.020626435056328773, "global_step": 2461, "epoch": 20, "lr": 9.981116967508206e-05} +{"train_loss": 0.02565210685133934, "global_step": 2462, "epoch": 20, "lr": 9.981097725984348e-05} +{"train_loss": 0.023854944854974747, "global_step": 2463, "epoch": 20, "lr": 9.981078474680638e-05} +{"train_loss": 0.02530471794307232, "global_step": 2464, "epoch": 20, "lr": 9.981059213597111e-05} +{"train_loss": 0.033614255487918854, "global_step": 2465, "epoch": 20, "lr": 9.981039942733807e-05} +{"train_loss": 0.024821938946843147, "global_step": 2466, "epoch": 20, "lr": 9.981020662090763e-05} +{"train_loss": 0.029774297028779984, "global_step": 2467, "epoch": 20, "lr": 9.981001371668017e-05} +{"train_loss": 0.027244415134191513, "global_step": 2468, "epoch": 20, "lr": 9.980982071465607e-05} +{"train_loss": 0.018242914229631424, "global_step": 2469, "epoch": 20, "lr": 9.980962761483572e-05} +{"train_loss": 0.03208852559328079, "global_step": 2470, "epoch": 20, "lr": 9.980943441721947e-05} +{"train_loss": 0.02357226237654686, "global_step": 2471, "epoch": 20, "lr": 9.980924112180773e-05} +{"train_loss": 0.028133805841207504, "global_step": 2472, "epoch": 20, "lr": 9.980904772860086e-05} +{"train_loss": 0.03710304945707321, "global_step": 2473, "epoch": 20, "lr": 9.980885423759925e-05} +{"train_loss": 0.035597506910562515, "global_step": 2474, "epoch": 20, "lr": 9.980866064880327e-05} +{"train_loss": 0.026611046865582466, "global_step": 2475, "epoch": 20, "lr": 9.980846696221331e-05} +{"train_loss": 0.02558853104710579, "global_step": 2476, "epoch": 20, "lr": 9.980827317782975e-05} +{"train_loss": 0.023090068250894547, "global_step": 2477, "epoch": 20, "lr": 9.980807929565296e-05} +{"train_loss": 0.03231554478406906, "global_step": 2478, "epoch": 20, "lr": 9.980788531568333e-05} +{"train_loss": 0.025262488052248955, "global_step": 2479, "epoch": 20, "lr": 9.980769123792125e-05} +{"train_loss": 0.02033519744873047, "global_step": 2480, "epoch": 20, "lr": 9.980749706236706e-05} +{"train_loss": 0.02921956032514572, "global_step": 2481, "epoch": 20, "lr": 9.98073027890212e-05} +{"train_loss": 0.025955699384212494, "global_step": 2482, "epoch": 20, "lr": 9.9807108417884e-05} +{"train_loss": 0.026824569329619408, "global_step": 2483, "epoch": 20, "lr": 9.980691394895588e-05} +{"train_loss": 0.02540302462875843, "global_step": 2484, "epoch": 20, "lr": 9.98067193822372e-05} +{"train_loss": 0.02239580638706684, "global_step": 2485, "epoch": 20, "lr": 9.980652471772835e-05} +{"train_loss": 0.025107646360993385, "global_step": 2486, "epoch": 20, "lr": 9.98063299554297e-05} +{"train_loss": 0.03281892463564873, "global_step": 2487, "epoch": 20, "lr": 9.980613509534165e-05} +{"train_loss": 0.02513340301811695, "global_step": 2488, "epoch": 20, "lr": 9.980594013746458e-05} +{"train_loss": 0.025673262774944305, "global_step": 2489, "epoch": 20, "lr": 9.980574508179885e-05} +{"train_loss": 0.018977118656039238, "global_step": 2490, "epoch": 20, "lr": 9.980554992834487e-05} +{"train_loss": 0.01977740228176117, "global_step": 2491, "epoch": 20, "lr": 9.980535467710302e-05} +{"train_loss": 0.032650552690029144, "global_step": 2492, "epoch": 20, "lr": 9.980515932807368e-05} +{"train_loss": 0.027080919593572617, "global_step": 2493, "epoch": 20, "lr": 9.980496388125722e-05} +{"train_loss": 0.022078072652220726, "global_step": 2494, "epoch": 20, "lr": 9.980476833665405e-05} +{"train_loss": 0.01809876598417759, "global_step": 2495, "epoch": 20, "lr": 9.980457269426451e-05} +{"train_loss": 0.025213779881596565, "global_step": 2496, "epoch": 20, "lr": 9.980437695408905e-05} +{"train_loss": 0.027698300778865814, "global_step": 2497, "epoch": 20, "lr": 9.980418111612798e-05} +{"train_loss": 0.026297309983740833, "global_step": 2498, "epoch": 20, "lr": 9.980398518038174e-05, "val_loss": 0.04618685320019722, "train_action_mse_error": 0.0031484223436564207} +{"train_loss": 0.019272714853286743, "global_step": 2499, "epoch": 21, "lr": 9.98037891468507e-05} +{"train_loss": 0.029536830261349678, "global_step": 2500, "epoch": 21, "lr": 9.980359301553522e-05} +{"train_loss": 0.042742226272821426, "global_step": 2501, "epoch": 21, "lr": 9.98033967864357e-05} +{"train_loss": 0.025416290387511253, "global_step": 2502, "epoch": 21, "lr": 9.980320045955257e-05} +{"train_loss": 0.03128116577863693, "global_step": 2503, "epoch": 21, "lr": 9.980300403488616e-05} +{"train_loss": 0.02778507210314274, "global_step": 2504, "epoch": 21, "lr": 9.980280751243687e-05} +{"train_loss": 0.029848670586943626, "global_step": 2505, "epoch": 21, "lr": 9.980261089220509e-05} +{"train_loss": 0.02231913059949875, "global_step": 2506, "epoch": 21, "lr": 9.980241417419118e-05} +{"train_loss": 0.026072869077324867, "global_step": 2507, "epoch": 21, "lr": 9.980221735839558e-05} +{"train_loss": 0.01850634068250656, "global_step": 2508, "epoch": 21, "lr": 9.980202044481864e-05} +{"train_loss": 0.026180412620306015, "global_step": 2509, "epoch": 21, "lr": 9.980182343346076e-05} +{"train_loss": 0.0218949131667614, "global_step": 2510, "epoch": 21, "lr": 9.980162632432231e-05} +{"train_loss": 0.02929537557065487, "global_step": 2511, "epoch": 21, "lr": 9.98014291174037e-05} +{"train_loss": 0.02485710009932518, "global_step": 2512, "epoch": 21, "lr": 9.980123181270528e-05} +{"train_loss": 0.024697866290807724, "global_step": 2513, "epoch": 21, "lr": 9.980103441022746e-05} +{"train_loss": 0.025086183100938797, "global_step": 2514, "epoch": 21, "lr": 9.980083690997065e-05} +{"train_loss": 0.021993981674313545, "global_step": 2515, "epoch": 21, "lr": 9.980063931193522e-05} +{"train_loss": 0.019652288407087326, "global_step": 2516, "epoch": 21, "lr": 9.980044161612155e-05} +{"train_loss": 0.02389853075146675, "global_step": 2517, "epoch": 21, "lr": 9.980024382253001e-05} +{"train_loss": 0.016581138595938683, "global_step": 2518, "epoch": 21, "lr": 9.980004593116104e-05} +{"train_loss": 0.02467622607946396, "global_step": 2519, "epoch": 21, "lr": 9.9799847942015e-05} +{"train_loss": 0.027101751416921616, "global_step": 2520, "epoch": 21, "lr": 9.979964985509228e-05} +{"train_loss": 0.02792358584702015, "global_step": 2521, "epoch": 21, "lr": 9.979945167039324e-05} +{"train_loss": 0.025692826136946678, "global_step": 2522, "epoch": 21, "lr": 9.979925338791832e-05} +{"train_loss": 0.018531877547502518, "global_step": 2523, "epoch": 21, "lr": 9.979905500766788e-05} +{"train_loss": 0.02611291967332363, "global_step": 2524, "epoch": 21, "lr": 9.979885652964232e-05} +{"train_loss": 0.028409462422132492, "global_step": 2525, "epoch": 21, "lr": 9.979865795384203e-05} +{"train_loss": 0.02518637292087078, "global_step": 2526, "epoch": 21, "lr": 9.979845928026739e-05} +{"train_loss": 0.020283972844481468, "global_step": 2527, "epoch": 21, "lr": 9.979826050891878e-05} +{"train_loss": 0.034269679337739944, "global_step": 2528, "epoch": 21, "lr": 9.979806163979663e-05} +{"train_loss": 0.019188307225704193, "global_step": 2529, "epoch": 21, "lr": 9.979786267290129e-05} +{"train_loss": 0.028832649812102318, "global_step": 2530, "epoch": 21, "lr": 9.979766360823318e-05} +{"train_loss": 0.025729943066835403, "global_step": 2531, "epoch": 21, "lr": 9.979746444579265e-05} +{"train_loss": 0.028718682006001472, "global_step": 2532, "epoch": 21, "lr": 9.979726518558015e-05} +{"train_loss": 0.02216026559472084, "global_step": 2533, "epoch": 21, "lr": 9.979706582759603e-05} +{"train_loss": 0.026112280786037445, "global_step": 2534, "epoch": 21, "lr": 9.979686637184069e-05} +{"train_loss": 0.018187502399086952, "global_step": 2535, "epoch": 21, "lr": 9.979666681831452e-05} +{"train_loss": 0.02547612227499485, "global_step": 2536, "epoch": 21, "lr": 9.979646716701791e-05} +{"train_loss": 0.029460372403264046, "global_step": 2537, "epoch": 21, "lr": 9.979626741795127e-05} +{"train_loss": 0.02810569666326046, "global_step": 2538, "epoch": 21, "lr": 9.979606757111497e-05} +{"train_loss": 0.02143843285739422, "global_step": 2539, "epoch": 21, "lr": 9.97958676265094e-05} +{"train_loss": 0.023779716342687607, "global_step": 2540, "epoch": 21, "lr": 9.979566758413499e-05} +{"train_loss": 0.02427697740495205, "global_step": 2541, "epoch": 21, "lr": 9.97954674439921e-05} +{"train_loss": 0.019725732505321503, "global_step": 2542, "epoch": 21, "lr": 9.979526720608112e-05} +{"train_loss": 0.021683860570192337, "global_step": 2543, "epoch": 21, "lr": 9.979506687040246e-05} +{"train_loss": 0.019855493679642677, "global_step": 2544, "epoch": 21, "lr": 9.97948664369565e-05} +{"train_loss": 0.024620475247502327, "global_step": 2545, "epoch": 21, "lr": 9.979466590574365e-05} +{"train_loss": 0.03167156130075455, "global_step": 2546, "epoch": 21, "lr": 9.979446527676429e-05} +{"train_loss": 0.022255903109908104, "global_step": 2547, "epoch": 21, "lr": 9.97942645500188e-05} +{"train_loss": 0.022960854694247246, "global_step": 2548, "epoch": 21, "lr": 9.979406372550762e-05} +{"train_loss": 0.017672447487711906, "global_step": 2549, "epoch": 21, "lr": 9.979386280323108e-05} +{"train_loss": 0.020750325173139572, "global_step": 2550, "epoch": 21, "lr": 9.979366178318963e-05} +{"train_loss": 0.019966846331954002, "global_step": 2551, "epoch": 21, "lr": 9.979346066538364e-05} +{"train_loss": 0.02526881918311119, "global_step": 2552, "epoch": 21, "lr": 9.979325944981352e-05} +{"train_loss": 0.02971957065165043, "global_step": 2553, "epoch": 21, "lr": 9.979305813647965e-05} +{"train_loss": 0.020413246005773544, "global_step": 2554, "epoch": 21, "lr": 9.979285672538243e-05} +{"train_loss": 0.028977755457162857, "global_step": 2555, "epoch": 21, "lr": 9.979265521652226e-05} +{"train_loss": 0.026675792410969734, "global_step": 2556, "epoch": 21, "lr": 9.979245360989952e-05} +{"train_loss": 0.021466661244630814, "global_step": 2557, "epoch": 21, "lr": 9.979225190551462e-05} +{"train_loss": 0.028382983058691025, "global_step": 2558, "epoch": 21, "lr": 9.979205010336796e-05} +{"train_loss": 0.0293741337954998, "global_step": 2559, "epoch": 21, "lr": 9.979184820345992e-05} +{"train_loss": 0.021128501743078232, "global_step": 2560, "epoch": 21, "lr": 9.979164620579091e-05} +{"train_loss": 0.02716563083231449, "global_step": 2561, "epoch": 21, "lr": 9.979144411036133e-05} +{"train_loss": 0.02197260782122612, "global_step": 2562, "epoch": 21, "lr": 9.979124191717155e-05} +{"train_loss": 0.02637128345668316, "global_step": 2563, "epoch": 21, "lr": 9.9791039626222e-05} +{"train_loss": 0.01730220764875412, "global_step": 2564, "epoch": 21, "lr": 9.979083723751306e-05} +{"train_loss": 0.0193440243601799, "global_step": 2565, "epoch": 21, "lr": 9.979063475104513e-05} +{"train_loss": 0.02485843189060688, "global_step": 2566, "epoch": 21, "lr": 9.97904321668186e-05} +{"train_loss": 0.019414570182561874, "global_step": 2567, "epoch": 21, "lr": 9.979022948483389e-05} +{"train_loss": 0.02348778210580349, "global_step": 2568, "epoch": 21, "lr": 9.979002670509138e-05} +{"train_loss": 0.030227266252040863, "global_step": 2569, "epoch": 21, "lr": 9.978982382759146e-05} +{"train_loss": 0.02313913032412529, "global_step": 2570, "epoch": 21, "lr": 9.978962085233455e-05} +{"train_loss": 0.025007130578160286, "global_step": 2571, "epoch": 21, "lr": 9.978941777932104e-05} +{"train_loss": 0.019542673602700233, "global_step": 2572, "epoch": 21, "lr": 9.978921460855132e-05} +{"train_loss": 0.027414971962571144, "global_step": 2573, "epoch": 21, "lr": 9.97890113400258e-05} +{"train_loss": 0.03194209933280945, "global_step": 2574, "epoch": 21, "lr": 9.978880797374488e-05} +{"train_loss": 0.024258853867650032, "global_step": 2575, "epoch": 21, "lr": 9.978860450970896e-05} +{"train_loss": 0.02509147673845291, "global_step": 2576, "epoch": 21, "lr": 9.978840094791842e-05} +{"train_loss": 0.021855928003787994, "global_step": 2577, "epoch": 21, "lr": 9.978819728837368e-05} +{"train_loss": 0.02190515585243702, "global_step": 2578, "epoch": 21, "lr": 9.978799353107513e-05} +{"train_loss": 0.024347476661205292, "global_step": 2579, "epoch": 21, "lr": 9.978778967602318e-05} +{"train_loss": 0.023509027436375618, "global_step": 2580, "epoch": 21, "lr": 9.978758572321823e-05} +{"train_loss": 0.024125760421156883, "global_step": 2581, "epoch": 21, "lr": 9.978738167266067e-05} +{"train_loss": 0.023428000509738922, "global_step": 2582, "epoch": 21, "lr": 9.978717752435089e-05} +{"train_loss": 0.02734246477484703, "global_step": 2583, "epoch": 21, "lr": 9.978697327828933e-05} +{"train_loss": 0.017875490710139275, "global_step": 2584, "epoch": 21, "lr": 9.978676893447634e-05} +{"train_loss": 0.019041001796722412, "global_step": 2585, "epoch": 21, "lr": 9.978656449291237e-05} +{"train_loss": 0.023921703919768333, "global_step": 2586, "epoch": 21, "lr": 9.978635995359778e-05} +{"train_loss": 0.0327124148607254, "global_step": 2587, "epoch": 21, "lr": 9.978615531653301e-05} +{"train_loss": 0.028670333325862885, "global_step": 2588, "epoch": 21, "lr": 9.978595058171844e-05} +{"train_loss": 0.01939208246767521, "global_step": 2589, "epoch": 21, "lr": 9.978574574915447e-05} +{"train_loss": 0.02066006511449814, "global_step": 2590, "epoch": 21, "lr": 9.97855408188415e-05} +{"train_loss": 0.02412552386522293, "global_step": 2591, "epoch": 21, "lr": 9.978533579077996e-05} +{"train_loss": 0.018984757363796234, "global_step": 2592, "epoch": 21, "lr": 9.978513066497021e-05} +{"train_loss": 0.020436516031622887, "global_step": 2593, "epoch": 21, "lr": 9.978492544141268e-05} +{"train_loss": 0.024888908490538597, "global_step": 2594, "epoch": 21, "lr": 9.978472012010778e-05} +{"train_loss": 0.023742953315377235, "global_step": 2595, "epoch": 21, "lr": 9.978451470105588e-05} +{"train_loss": 0.028238948434591293, "global_step": 2596, "epoch": 21, "lr": 9.978430918425741e-05} +{"train_loss": 0.023721031844615936, "global_step": 2597, "epoch": 21, "lr": 9.978410356971279e-05} +{"train_loss": 0.028912343084812164, "global_step": 2598, "epoch": 21, "lr": 9.978389785742238e-05} +{"train_loss": 0.020822640508413315, "global_step": 2599, "epoch": 21, "lr": 9.97836920473866e-05} +{"train_loss": 0.023057717829942703, "global_step": 2600, "epoch": 21, "lr": 9.978348613960588e-05} +{"train_loss": 0.024045787751674652, "global_step": 2601, "epoch": 21, "lr": 9.97832801340806e-05} +{"train_loss": 0.027103256434202194, "global_step": 2602, "epoch": 21, "lr": 9.978307403081115e-05} +{"train_loss": 0.02376490645110607, "global_step": 2603, "epoch": 21, "lr": 9.978286782979796e-05} +{"train_loss": 0.01496137399226427, "global_step": 2604, "epoch": 21, "lr": 9.978266153104143e-05} +{"train_loss": 0.02493349276483059, "global_step": 2605, "epoch": 21, "lr": 9.978245513454197e-05} +{"train_loss": 0.033165913075208664, "global_step": 2606, "epoch": 21, "lr": 9.978224864029997e-05} +{"train_loss": 0.022631186991930008, "global_step": 2607, "epoch": 21, "lr": 9.978204204831585e-05} +{"train_loss": 0.025503115728497505, "global_step": 2608, "epoch": 21, "lr": 9.978183535859e-05} +{"train_loss": 0.02187800593674183, "global_step": 2609, "epoch": 21, "lr": 9.978162857112283e-05} +{"train_loss": 0.027018118649721146, "global_step": 2610, "epoch": 21, "lr": 9.978142168591477e-05} +{"train_loss": 0.02436145395040512, "global_step": 2611, "epoch": 21, "lr": 9.978121470296619e-05} +{"train_loss": 0.024772265926003456, "global_step": 2612, "epoch": 21, "lr": 9.978100762227752e-05} +{"train_loss": 0.028657935559749603, "global_step": 2613, "epoch": 21, "lr": 9.978080044384917e-05} +{"train_loss": 0.02019904926419258, "global_step": 2614, "epoch": 21, "lr": 9.978059316768151e-05} +{"train_loss": 0.030271101742982864, "global_step": 2615, "epoch": 21, "lr": 9.9780385793775e-05} +{"train_loss": 0.03478335216641426, "global_step": 2616, "epoch": 21, "lr": 9.978017832213001e-05} +{"train_loss": 0.024634268220921022, "global_step": 2617, "epoch": 21, "lr": 9.977997075274695e-05, "val_loss": 0.036151111125946045} +{"train_loss": 0.024273941293358803, "global_step": 2618, "epoch": 22, "lr": 9.977976308562624e-05} +{"train_loss": 0.030042096972465515, "global_step": 2619, "epoch": 22, "lr": 9.977955532076829e-05} +{"train_loss": 0.022370880469679832, "global_step": 2620, "epoch": 22, "lr": 9.97793474581735e-05} +{"train_loss": 0.023581914603710175, "global_step": 2621, "epoch": 22, "lr": 9.977913949784228e-05} +{"train_loss": 0.03055165335536003, "global_step": 2622, "epoch": 22, "lr": 9.977893143977503e-05} +{"train_loss": 0.02842009998857975, "global_step": 2623, "epoch": 22, "lr": 9.977872328397218e-05} +{"train_loss": 0.026375209912657738, "global_step": 2624, "epoch": 22, "lr": 9.977851503043412e-05} +{"train_loss": 0.033515430986881256, "global_step": 2625, "epoch": 22, "lr": 9.977830667916127e-05} +{"train_loss": 0.025814823806285858, "global_step": 2626, "epoch": 22, "lr": 9.977809823015401e-05} +{"train_loss": 0.023178301751613617, "global_step": 2627, "epoch": 22, "lr": 9.977788968341277e-05} +{"train_loss": 0.024310734122991562, "global_step": 2628, "epoch": 22, "lr": 9.977768103893799e-05} +{"train_loss": 0.02075931243598461, "global_step": 2629, "epoch": 22, "lr": 9.977747229673004e-05} +{"train_loss": 0.022954070940613747, "global_step": 2630, "epoch": 22, "lr": 9.977726345678933e-05} +{"train_loss": 0.029045620933175087, "global_step": 2631, "epoch": 22, "lr": 9.97770545191163e-05} +{"train_loss": 0.016951512545347214, "global_step": 2632, "epoch": 22, "lr": 9.977684548371134e-05} +{"train_loss": 0.03233123570680618, "global_step": 2633, "epoch": 22, "lr": 9.977663635057484e-05} +{"train_loss": 0.025560779497027397, "global_step": 2634, "epoch": 22, "lr": 9.977642711970725e-05} +{"train_loss": 0.017294390127062798, "global_step": 2635, "epoch": 22, "lr": 9.977621779110895e-05} +{"train_loss": 0.03231040760874748, "global_step": 2636, "epoch": 22, "lr": 9.977600836478039e-05} +{"train_loss": 0.02720855176448822, "global_step": 2637, "epoch": 22, "lr": 9.977579884072192e-05} +{"train_loss": 0.023844178766012192, "global_step": 2638, "epoch": 22, "lr": 9.977558921893402e-05} +{"train_loss": 0.02505239099264145, "global_step": 2639, "epoch": 22, "lr": 9.977537949941704e-05} +{"train_loss": 0.022874346002936363, "global_step": 2640, "epoch": 22, "lr": 9.977516968217144e-05} +{"train_loss": 0.0209023617208004, "global_step": 2641, "epoch": 22, "lr": 9.977495976719761e-05} +{"train_loss": 0.024048855528235435, "global_step": 2642, "epoch": 22, "lr": 9.977474975449595e-05} +{"train_loss": 0.023655511438846588, "global_step": 2643, "epoch": 22, "lr": 9.97745396440669e-05} +{"train_loss": 0.02370232529938221, "global_step": 2644, "epoch": 22, "lr": 9.977432943591085e-05} +{"train_loss": 0.024341536685824394, "global_step": 2645, "epoch": 22, "lr": 9.977411913002823e-05} +{"train_loss": 0.032733142375946045, "global_step": 2646, "epoch": 22, "lr": 9.977390872641945e-05} +{"train_loss": 0.026824261993169785, "global_step": 2647, "epoch": 22, "lr": 9.977369822508491e-05} +{"train_loss": 0.027228806167840958, "global_step": 2648, "epoch": 22, "lr": 9.977348762602503e-05} +{"train_loss": 0.02728886902332306, "global_step": 2649, "epoch": 22, "lr": 9.977327692924021e-05} +{"train_loss": 0.021305713802576065, "global_step": 2650, "epoch": 22, "lr": 9.977306613473089e-05} +{"train_loss": 0.03136356920003891, "global_step": 2651, "epoch": 22, "lr": 9.977285524249749e-05} +{"train_loss": 0.0262424536049366, "global_step": 2652, "epoch": 22, "lr": 9.977264425254039e-05} +{"train_loss": 0.025541391223669052, "global_step": 2653, "epoch": 22, "lr": 9.977243316486003e-05} +{"train_loss": 0.024561885744333267, "global_step": 2654, "epoch": 22, "lr": 9.97722219794568e-05} +{"train_loss": 0.027503633871674538, "global_step": 2655, "epoch": 22, "lr": 9.977201069633113e-05} +{"train_loss": 0.024206524714827538, "global_step": 2656, "epoch": 22, "lr": 9.977179931548343e-05} +{"train_loss": 0.02003392018377781, "global_step": 2657, "epoch": 22, "lr": 9.977158783691415e-05} +{"train_loss": 0.020931672304868698, "global_step": 2658, "epoch": 22, "lr": 9.977137626062365e-05} +{"train_loss": 0.018933411687612534, "global_step": 2659, "epoch": 22, "lr": 9.977116458661238e-05} +{"train_loss": 0.021700778976082802, "global_step": 2660, "epoch": 22, "lr": 9.977095281488073e-05} +{"train_loss": 0.028743766248226166, "global_step": 2661, "epoch": 22, "lr": 9.977074094542916e-05} +{"train_loss": 0.030548982322216034, "global_step": 2662, "epoch": 22, "lr": 9.977052897825802e-05} +{"train_loss": 0.024374378845095634, "global_step": 2663, "epoch": 22, "lr": 9.977031691336778e-05} +{"train_loss": 0.017224792391061783, "global_step": 2664, "epoch": 22, "lr": 9.977010475075885e-05} +{"train_loss": 0.021207813173532486, "global_step": 2665, "epoch": 22, "lr": 9.976989249043163e-05} +{"train_loss": 0.025601854547858238, "global_step": 2666, "epoch": 22, "lr": 9.976968013238654e-05} +{"train_loss": 0.031395312398672104, "global_step": 2667, "epoch": 22, "lr": 9.9769467676624e-05} +{"train_loss": 0.02200462482869625, "global_step": 2668, "epoch": 22, "lr": 9.976925512314444e-05} +{"train_loss": 0.026964491233229637, "global_step": 2669, "epoch": 22, "lr": 9.976904247194825e-05} +{"train_loss": 0.020008623600006104, "global_step": 2670, "epoch": 22, "lr": 9.976882972303587e-05} +{"train_loss": 0.025458967313170433, "global_step": 2671, "epoch": 22, "lr": 9.97686168764077e-05} +{"train_loss": 0.020319152623414993, "global_step": 2672, "epoch": 22, "lr": 9.976840393206419e-05} +{"train_loss": 0.0219566710293293, "global_step": 2673, "epoch": 22, "lr": 9.97681908900057e-05} +{"train_loss": 0.02340134046971798, "global_step": 2674, "epoch": 22, "lr": 9.976797775023272e-05} +{"train_loss": 0.026265980675816536, "global_step": 2675, "epoch": 22, "lr": 9.976776451274561e-05} +{"train_loss": 0.023925555869936943, "global_step": 2676, "epoch": 22, "lr": 9.976755117754482e-05} +{"train_loss": 0.02217515930533409, "global_step": 2677, "epoch": 22, "lr": 9.976733774463076e-05} +{"train_loss": 0.02292829006910324, "global_step": 2678, "epoch": 22, "lr": 9.976712421400385e-05} +{"train_loss": 0.02281462773680687, "global_step": 2679, "epoch": 22, "lr": 9.97669105856645e-05} +{"train_loss": 0.020564254373311996, "global_step": 2680, "epoch": 22, "lr": 9.976669685961314e-05} +{"train_loss": 0.023649847134947777, "global_step": 2681, "epoch": 22, "lr": 9.976648303585019e-05} +{"train_loss": 0.020232809707522392, "global_step": 2682, "epoch": 22, "lr": 9.976626911437608e-05} +{"train_loss": 0.02596001885831356, "global_step": 2683, "epoch": 22, "lr": 9.976605509519119e-05} +{"train_loss": 0.023841721937060356, "global_step": 2684, "epoch": 22, "lr": 9.9765840978296e-05} +{"train_loss": 0.025419047102332115, "global_step": 2685, "epoch": 22, "lr": 9.976562676369088e-05} +{"train_loss": 0.022166658192873, "global_step": 2686, "epoch": 22, "lr": 9.976541245137627e-05} +{"train_loss": 0.02171001397073269, "global_step": 2687, "epoch": 22, "lr": 9.976519804135258e-05} +{"train_loss": 0.01774236559867859, "global_step": 2688, "epoch": 22, "lr": 9.976498353362024e-05} +{"train_loss": 0.029041510075330734, "global_step": 2689, "epoch": 22, "lr": 9.97647689281797e-05} +{"train_loss": 0.016913220286369324, "global_step": 2690, "epoch": 22, "lr": 9.976455422503132e-05} +{"train_loss": 0.021961642429232597, "global_step": 2691, "epoch": 22, "lr": 9.976433942417558e-05} +{"train_loss": 0.02684335969388485, "global_step": 2692, "epoch": 22, "lr": 9.976412452561286e-05} +{"train_loss": 0.0277915820479393, "global_step": 2693, "epoch": 22, "lr": 9.97639095293436e-05} +{"train_loss": 0.02205500192940235, "global_step": 2694, "epoch": 22, "lr": 9.976369443536822e-05} +{"train_loss": 0.02475263550877571, "global_step": 2695, "epoch": 22, "lr": 9.976347924368715e-05} +{"train_loss": 0.023926593363285065, "global_step": 2696, "epoch": 22, "lr": 9.97632639543008e-05} +{"train_loss": 0.01945723406970501, "global_step": 2697, "epoch": 22, "lr": 9.97630485672096e-05} +{"train_loss": 0.018342066556215286, "global_step": 2698, "epoch": 22, "lr": 9.976283308241396e-05} +{"train_loss": 0.025120293721556664, "global_step": 2699, "epoch": 22, "lr": 9.976261749991432e-05} +{"train_loss": 0.022580407559871674, "global_step": 2700, "epoch": 22, "lr": 9.97624018197111e-05} +{"train_loss": 0.019568348303437233, "global_step": 2701, "epoch": 22, "lr": 9.976218604180472e-05} +{"train_loss": 0.022067932412028313, "global_step": 2702, "epoch": 22, "lr": 9.976197016619561e-05} +{"train_loss": 0.02467220276594162, "global_step": 2703, "epoch": 22, "lr": 9.976175419288418e-05} +{"train_loss": 0.017045358195900917, "global_step": 2704, "epoch": 22, "lr": 9.976153812187086e-05} +{"train_loss": 0.020884206518530846, "global_step": 2705, "epoch": 22, "lr": 9.976132195315608e-05} +{"train_loss": 0.023976590484380722, "global_step": 2706, "epoch": 22, "lr": 9.976110568674025e-05} +{"train_loss": 0.019378211349248886, "global_step": 2707, "epoch": 22, "lr": 9.976088932262382e-05} +{"train_loss": 0.026841189712285995, "global_step": 2708, "epoch": 22, "lr": 9.976067286080719e-05} +{"train_loss": 0.01888285018503666, "global_step": 2709, "epoch": 22, "lr": 9.97604563012908e-05} +{"train_loss": 0.028229106217622757, "global_step": 2710, "epoch": 22, "lr": 9.976023964407507e-05} +{"train_loss": 0.02592729777097702, "global_step": 2711, "epoch": 22, "lr": 9.976002288916042e-05} +{"train_loss": 0.02056192234158516, "global_step": 2712, "epoch": 22, "lr": 9.975980603654729e-05} +{"train_loss": 0.027729295194149017, "global_step": 2713, "epoch": 22, "lr": 9.97595890862361e-05} +{"train_loss": 0.018319496884942055, "global_step": 2714, "epoch": 22, "lr": 9.975937203822726e-05} +{"train_loss": 0.029104771092534065, "global_step": 2715, "epoch": 22, "lr": 9.975915489252122e-05} +{"train_loss": 0.019543731585144997, "global_step": 2716, "epoch": 22, "lr": 9.975893764911839e-05} +{"train_loss": 0.020490586757659912, "global_step": 2717, "epoch": 22, "lr": 9.975872030801921e-05} +{"train_loss": 0.025116415694355965, "global_step": 2718, "epoch": 22, "lr": 9.975850286922407e-05} +{"train_loss": 0.022604236379265785, "global_step": 2719, "epoch": 22, "lr": 9.975828533273346e-05} +{"train_loss": 0.02125321887433529, "global_step": 2720, "epoch": 22, "lr": 9.975806769854777e-05} +{"train_loss": 0.019881537184119225, "global_step": 2721, "epoch": 22, "lr": 9.97578499666674e-05} +{"train_loss": 0.018511995673179626, "global_step": 2722, "epoch": 22, "lr": 9.975763213709283e-05} +{"train_loss": 0.029313186183571815, "global_step": 2723, "epoch": 22, "lr": 9.975741420982447e-05} +{"train_loss": 0.02128278836607933, "global_step": 2724, "epoch": 22, "lr": 9.975719618486272e-05} +{"train_loss": 0.03057747334241867, "global_step": 2725, "epoch": 22, "lr": 9.975697806220804e-05} +{"train_loss": 0.01960100047290325, "global_step": 2726, "epoch": 22, "lr": 9.975675984186087e-05} +{"train_loss": 0.02187890000641346, "global_step": 2727, "epoch": 22, "lr": 9.97565415238216e-05} +{"train_loss": 0.03219141066074371, "global_step": 2728, "epoch": 22, "lr": 9.975632310809068e-05} +{"train_loss": 0.021588202565908432, "global_step": 2729, "epoch": 22, "lr": 9.975610459466854e-05} +{"train_loss": 0.022166572511196136, "global_step": 2730, "epoch": 22, "lr": 9.975588598355559e-05} +{"train_loss": 0.02261148765683174, "global_step": 2731, "epoch": 22, "lr": 9.975566727475228e-05} +{"train_loss": 0.024145323783159256, "global_step": 2732, "epoch": 22, "lr": 9.975544846825904e-05} +{"train_loss": 0.02120649628341198, "global_step": 2733, "epoch": 22, "lr": 9.975522956407628e-05} +{"train_loss": 0.028002487495541573, "global_step": 2734, "epoch": 22, "lr": 9.975501056220445e-05} +{"train_loss": 0.019007623195648193, "global_step": 2735, "epoch": 22, "lr": 9.975479146264397e-05} +{"train_loss": 0.024023297751525872, "global_step": 2736, "epoch": 22, "lr": 9.975457226539529e-05, "val_loss": 0.030115865170955658} +{"train_loss": 0.027654921635985374, "global_step": 2737, "epoch": 23, "lr": 9.97543529704588e-05} +{"train_loss": 0.02253168448805809, "global_step": 2738, "epoch": 23, "lr": 9.975413357783496e-05} +{"train_loss": 0.026611244305968285, "global_step": 2739, "epoch": 23, "lr": 9.97539140875242e-05} +{"train_loss": 0.019111912697553635, "global_step": 2740, "epoch": 23, "lr": 9.975369449952694e-05} +{"train_loss": 0.030201122164726257, "global_step": 2741, "epoch": 23, "lr": 9.97534748138436e-05} +{"train_loss": 0.019551128149032593, "global_step": 2742, "epoch": 23, "lr": 9.975325503047466e-05} +{"train_loss": 0.026288233697414398, "global_step": 2743, "epoch": 23, "lr": 9.975303514942049e-05} +{"train_loss": 0.028505871072411537, "global_step": 2744, "epoch": 23, "lr": 9.975281517068158e-05} +{"train_loss": 0.019930049777030945, "global_step": 2745, "epoch": 23, "lr": 9.975259509425831e-05} +{"train_loss": 0.021019186824560165, "global_step": 2746, "epoch": 23, "lr": 9.975237492015115e-05} +{"train_loss": 0.02341311424970627, "global_step": 2747, "epoch": 23, "lr": 9.97521546483605e-05} +{"train_loss": 0.024985890835523605, "global_step": 2748, "epoch": 23, "lr": 9.975193427888681e-05} +{"train_loss": 0.02797301858663559, "global_step": 2749, "epoch": 23, "lr": 9.975171381173052e-05} +{"train_loss": 0.016109665855765343, "global_step": 2750, "epoch": 23, "lr": 9.975149324689206e-05} +{"train_loss": 0.02981743775308132, "global_step": 2751, "epoch": 23, "lr": 9.975127258437186e-05} +{"train_loss": 0.019095655530691147, "global_step": 2752, "epoch": 23, "lr": 9.975105182417035e-05} +{"train_loss": 0.030046049505472183, "global_step": 2753, "epoch": 23, "lr": 9.975083096628795e-05} +{"train_loss": 0.027417080476880074, "global_step": 2754, "epoch": 23, "lr": 9.975061001072512e-05} +{"train_loss": 0.019816439598798752, "global_step": 2755, "epoch": 23, "lr": 9.975038895748228e-05} +{"train_loss": 0.023394308984279633, "global_step": 2756, "epoch": 23, "lr": 9.975016780655987e-05} +{"train_loss": 0.028305761516094208, "global_step": 2757, "epoch": 23, "lr": 9.974994655795831e-05} +{"train_loss": 0.02399052120745182, "global_step": 2758, "epoch": 23, "lr": 9.974972521167806e-05} +{"train_loss": 0.02115318365395069, "global_step": 2759, "epoch": 23, "lr": 9.974950376771953e-05} +{"train_loss": 0.030196944251656532, "global_step": 2760, "epoch": 23, "lr": 9.974928222608317e-05} +{"train_loss": 0.02544424496591091, "global_step": 2761, "epoch": 23, "lr": 9.97490605867694e-05} +{"train_loss": 0.03467061370611191, "global_step": 2762, "epoch": 23, "lr": 9.974883884977868e-05} +{"train_loss": 0.02806727960705757, "global_step": 2763, "epoch": 23, "lr": 9.974861701511142e-05} +{"train_loss": 0.024345649406313896, "global_step": 2764, "epoch": 23, "lr": 9.974839508276805e-05} +{"train_loss": 0.027289237827062607, "global_step": 2765, "epoch": 23, "lr": 9.974817305274903e-05} +{"train_loss": 0.019577061757445335, "global_step": 2766, "epoch": 23, "lr": 9.97479509250548e-05} +{"train_loss": 0.026495518162846565, "global_step": 2767, "epoch": 23, "lr": 9.974772869968579e-05} +{"train_loss": 0.02706843800842762, "global_step": 2768, "epoch": 23, "lr": 9.97475063766424e-05} +{"train_loss": 0.031246403232216835, "global_step": 2769, "epoch": 23, "lr": 9.974728395592512e-05} +{"train_loss": 0.020138777792453766, "global_step": 2770, "epoch": 23, "lr": 9.974706143753436e-05} +{"train_loss": 0.023490319028496742, "global_step": 2771, "epoch": 23, "lr": 9.974683882147055e-05} +{"train_loss": 0.01710294932126999, "global_step": 2772, "epoch": 23, "lr": 9.974661610773414e-05} +{"train_loss": 0.023181933909654617, "global_step": 2773, "epoch": 23, "lr": 9.974639329632556e-05} +{"train_loss": 0.02085079997777939, "global_step": 2774, "epoch": 23, "lr": 9.974617038724526e-05} +{"train_loss": 0.03414672240614891, "global_step": 2775, "epoch": 23, "lr": 9.974594738049368e-05} +{"train_loss": 0.023557187989354134, "global_step": 2776, "epoch": 23, "lr": 9.974572427607122e-05} +{"train_loss": 0.029553908854722977, "global_step": 2777, "epoch": 23, "lr": 9.974550107397836e-05} +{"train_loss": 0.020776014775037766, "global_step": 2778, "epoch": 23, "lr": 9.974527777421552e-05} +{"train_loss": 0.026809995993971825, "global_step": 2779, "epoch": 23, "lr": 9.974505437678315e-05} +{"train_loss": 0.016906142234802246, "global_step": 2780, "epoch": 23, "lr": 9.974483088168167e-05} +{"train_loss": 0.0246413741260767, "global_step": 2781, "epoch": 23, "lr": 9.974460728891153e-05} +{"train_loss": 0.018481796607375145, "global_step": 2782, "epoch": 23, "lr": 9.974438359847316e-05} +{"train_loss": 0.02191491238772869, "global_step": 2783, "epoch": 23, "lr": 9.974415981036702e-05} +{"train_loss": 0.01834128238260746, "global_step": 2784, "epoch": 23, "lr": 9.974393592459352e-05} +{"train_loss": 0.025118477642536163, "global_step": 2785, "epoch": 23, "lr": 9.974371194115314e-05} +{"train_loss": 0.01996624283492565, "global_step": 2786, "epoch": 23, "lr": 9.974348786004628e-05} +{"train_loss": 0.021790649741888046, "global_step": 2787, "epoch": 23, "lr": 9.97432636812734e-05} +{"train_loss": 0.021884378045797348, "global_step": 2788, "epoch": 23, "lr": 9.974303940483494e-05} +{"train_loss": 0.018758496269583702, "global_step": 2789, "epoch": 23, "lr": 9.974281503073134e-05} +{"train_loss": 0.016938429325819016, "global_step": 2790, "epoch": 23, "lr": 9.974259055896303e-05} +{"train_loss": 0.023698855191469193, "global_step": 2791, "epoch": 23, "lr": 9.974236598953045e-05} +{"train_loss": 0.023620370775461197, "global_step": 2792, "epoch": 23, "lr": 9.974214132243406e-05} +{"train_loss": 0.02727600559592247, "global_step": 2793, "epoch": 23, "lr": 9.974191655767429e-05} +{"train_loss": 0.020894603803753853, "global_step": 2794, "epoch": 23, "lr": 9.974169169525156e-05} +{"train_loss": 0.02446327544748783, "global_step": 2795, "epoch": 23, "lr": 9.974146673516635e-05} +{"train_loss": 0.03277885913848877, "global_step": 2796, "epoch": 23, "lr": 9.974124167741909e-05} +{"train_loss": 0.023537002503871918, "global_step": 2797, "epoch": 23, "lr": 9.97410165220102e-05} +{"train_loss": 0.02213040553033352, "global_step": 2798, "epoch": 23, "lr": 9.974079126894016e-05} +{"train_loss": 0.01825043559074402, "global_step": 2799, "epoch": 23, "lr": 9.974056591820937e-05} +{"train_loss": 0.02263140305876732, "global_step": 2800, "epoch": 23, "lr": 9.97403404698183e-05} +{"train_loss": 0.02306128665804863, "global_step": 2801, "epoch": 23, "lr": 9.97401149237674e-05} +{"train_loss": 0.017715314403176308, "global_step": 2802, "epoch": 23, "lr": 9.973988928005709e-05} +{"train_loss": 0.019595760852098465, "global_step": 2803, "epoch": 23, "lr": 9.97396635386878e-05} +{"train_loss": 0.02423795498907566, "global_step": 2804, "epoch": 23, "lr": 9.973943769966e-05} +{"train_loss": 0.025189979001879692, "global_step": 2805, "epoch": 23, "lr": 9.973921176297416e-05} +{"train_loss": 0.02130107395350933, "global_step": 2806, "epoch": 23, "lr": 9.973898572863068e-05} +{"train_loss": 0.024854889139533043, "global_step": 2807, "epoch": 23, "lr": 9.973875959663e-05} +{"train_loss": 0.02803681790828705, "global_step": 2808, "epoch": 23, "lr": 9.973853336697258e-05} +{"train_loss": 0.015435673296451569, "global_step": 2809, "epoch": 23, "lr": 9.973830703965886e-05} +{"train_loss": 0.021632565185427666, "global_step": 2810, "epoch": 23, "lr": 9.97380806146893e-05} +{"train_loss": 0.019939448684453964, "global_step": 2811, "epoch": 23, "lr": 9.973785409206434e-05} +{"train_loss": 0.02393146976828575, "global_step": 2812, "epoch": 23, "lr": 9.97376274717844e-05} +{"train_loss": 0.031002823263406754, "global_step": 2813, "epoch": 23, "lr": 9.973740075384994e-05} +{"train_loss": 0.028696589171886444, "global_step": 2814, "epoch": 23, "lr": 9.973717393826142e-05} +{"train_loss": 0.024691380560398102, "global_step": 2815, "epoch": 23, "lr": 9.973694702501927e-05} +{"train_loss": 0.025768378749489784, "global_step": 2816, "epoch": 23, "lr": 9.973672001412393e-05} +{"train_loss": 0.028975294902920723, "global_step": 2817, "epoch": 23, "lr": 9.973649290557586e-05} +{"train_loss": 0.020234355702996254, "global_step": 2818, "epoch": 23, "lr": 9.973626569937551e-05} +{"train_loss": 0.023130467161536217, "global_step": 2819, "epoch": 23, "lr": 9.97360383955233e-05} +{"train_loss": 0.02878079190850258, "global_step": 2820, "epoch": 23, "lr": 9.97358109940197e-05} +{"train_loss": 0.03267548605799675, "global_step": 2821, "epoch": 23, "lr": 9.973558349486514e-05} +{"train_loss": 0.02407534047961235, "global_step": 2822, "epoch": 23, "lr": 9.973535589806008e-05} +{"train_loss": 0.015712013468146324, "global_step": 2823, "epoch": 23, "lr": 9.973512820360497e-05} +{"train_loss": 0.022602444514632225, "global_step": 2824, "epoch": 23, "lr": 9.973490041150025e-05} +{"train_loss": 0.02645210735499859, "global_step": 2825, "epoch": 23, "lr": 9.973467252174636e-05} +{"train_loss": 0.028298817574977875, "global_step": 2826, "epoch": 23, "lr": 9.973444453434375e-05} +{"train_loss": 0.016549814492464066, "global_step": 2827, "epoch": 23, "lr": 9.973421644929286e-05} +{"train_loss": 0.024960137903690338, "global_step": 2828, "epoch": 23, "lr": 9.973398826659417e-05} +{"train_loss": 0.03030458278954029, "global_step": 2829, "epoch": 23, "lr": 9.97337599862481e-05} +{"train_loss": 0.0231980811804533, "global_step": 2830, "epoch": 23, "lr": 9.97335316082551e-05} +{"train_loss": 0.019775032997131348, "global_step": 2831, "epoch": 23, "lr": 9.973330313261564e-05} +{"train_loss": 0.020659906789660454, "global_step": 2832, "epoch": 23, "lr": 9.973307455933015e-05} +{"train_loss": 0.0173348318785429, "global_step": 2833, "epoch": 23, "lr": 9.973284588839907e-05} +{"train_loss": 0.02454737015068531, "global_step": 2834, "epoch": 23, "lr": 9.973261711982285e-05} +{"train_loss": 0.02828630432486534, "global_step": 2835, "epoch": 23, "lr": 9.973238825360197e-05} +{"train_loss": 0.01850546896457672, "global_step": 2836, "epoch": 23, "lr": 9.973215928973685e-05} +{"train_loss": 0.013968291692435741, "global_step": 2837, "epoch": 23, "lr": 9.973193022822795e-05} +{"train_loss": 0.024481050670146942, "global_step": 2838, "epoch": 23, "lr": 9.973170106907573e-05} +{"train_loss": 0.018956882879137993, "global_step": 2839, "epoch": 23, "lr": 9.973147181228062e-05} +{"train_loss": 0.019441014155745506, "global_step": 2840, "epoch": 23, "lr": 9.973124245784307e-05} +{"train_loss": 0.021115722134709358, "global_step": 2841, "epoch": 23, "lr": 9.973101300576354e-05} +{"train_loss": 0.017300976440310478, "global_step": 2842, "epoch": 23, "lr": 9.973078345604248e-05} +{"train_loss": 0.021575873717665672, "global_step": 2843, "epoch": 23, "lr": 9.973055380868035e-05} +{"train_loss": 0.020438626408576965, "global_step": 2844, "epoch": 23, "lr": 9.973032406367758e-05} +{"train_loss": 0.019562669098377228, "global_step": 2845, "epoch": 23, "lr": 9.973009422103463e-05} +{"train_loss": 0.027649518102407455, "global_step": 2846, "epoch": 23, "lr": 9.972986428075197e-05} +{"train_loss": 0.021178092807531357, "global_step": 2847, "epoch": 23, "lr": 9.972963424283002e-05} +{"train_loss": 0.01968437060713768, "global_step": 2848, "epoch": 23, "lr": 9.972940410726925e-05} +{"train_loss": 0.02102356217801571, "global_step": 2849, "epoch": 23, "lr": 9.97291738740701e-05} +{"train_loss": 0.022122198715806007, "global_step": 2850, "epoch": 23, "lr": 9.972894354323304e-05} +{"train_loss": 0.018446266651153564, "global_step": 2851, "epoch": 23, "lr": 9.972871311475849e-05} +{"train_loss": 0.0246936846524477, "global_step": 2852, "epoch": 23, "lr": 9.972848258864696e-05} +{"train_loss": 0.010989378206431866, "global_step": 2853, "epoch": 23, "lr": 9.972825196489883e-05} +{"train_loss": 0.020899923518300056, "global_step": 2854, "epoch": 23, "lr": 9.972802124351462e-05} +{"train_loss": 0.023268800009699428, "global_step": 2855, "epoch": 23, "lr": 9.972779042449474e-05, "val_loss": 0.040374040603637695} +{"train_loss": 0.024244744330644608, "global_step": 2856, "epoch": 24, "lr": 9.972755950783967e-05} +{"train_loss": 0.023178081959486008, "global_step": 2857, "epoch": 24, "lr": 9.972732849354981e-05} +{"train_loss": 0.014942463487386703, "global_step": 2858, "epoch": 24, "lr": 9.97270973816257e-05} +{"train_loss": 0.02238745242357254, "global_step": 2859, "epoch": 24, "lr": 9.972686617206772e-05} +{"train_loss": 0.022017337381839752, "global_step": 2860, "epoch": 24, "lr": 9.972663486487637e-05} +{"train_loss": 0.026443470269441605, "global_step": 2861, "epoch": 24, "lr": 9.972640346005207e-05} +{"train_loss": 0.02649347297847271, "global_step": 2862, "epoch": 24, "lr": 9.97261719575953e-05} +{"train_loss": 0.025237668305635452, "global_step": 2863, "epoch": 24, "lr": 9.972594035750649e-05} +{"train_loss": 0.021099798381328583, "global_step": 2864, "epoch": 24, "lr": 9.972570865978612e-05} +{"train_loss": 0.02282332256436348, "global_step": 2865, "epoch": 24, "lr": 9.972547686443463e-05} +{"train_loss": 0.021247562021017075, "global_step": 2866, "epoch": 24, "lr": 9.972524497145246e-05} +{"train_loss": 0.02313491329550743, "global_step": 2867, "epoch": 24, "lr": 9.972501298084012e-05} +{"train_loss": 0.027546074241399765, "global_step": 2868, "epoch": 24, "lr": 9.9724780892598e-05} +{"train_loss": 0.019948864355683327, "global_step": 2869, "epoch": 24, "lr": 9.972454870672659e-05} +{"train_loss": 0.017950376495718956, "global_step": 2870, "epoch": 24, "lr": 9.972431642322635e-05} +{"train_loss": 0.022618908435106277, "global_step": 2871, "epoch": 24, "lr": 9.972408404209773e-05} +{"train_loss": 0.030270393937826157, "global_step": 2872, "epoch": 24, "lr": 9.972385156334117e-05} +{"train_loss": 0.01941746100783348, "global_step": 2873, "epoch": 24, "lr": 9.972361898695714e-05} +{"train_loss": 0.02756669372320175, "global_step": 2874, "epoch": 24, "lr": 9.97233863129461e-05} +{"train_loss": 0.0272801723331213, "global_step": 2875, "epoch": 24, "lr": 9.972315354130853e-05} +{"train_loss": 0.022587738931179047, "global_step": 2876, "epoch": 24, "lr": 9.972292067204483e-05} +{"train_loss": 0.02217962220311165, "global_step": 2877, "epoch": 24, "lr": 9.97226877051555e-05} +{"train_loss": 0.026447664946317673, "global_step": 2878, "epoch": 24, "lr": 9.972245464064096e-05} +{"train_loss": 0.025347761809825897, "global_step": 2879, "epoch": 24, "lr": 9.972222147850172e-05} +{"train_loss": 0.019125377759337425, "global_step": 2880, "epoch": 24, "lr": 9.97219882187382e-05} +{"train_loss": 0.027718499302864075, "global_step": 2881, "epoch": 24, "lr": 9.972175486135087e-05} +{"train_loss": 0.02915176935493946, "global_step": 2882, "epoch": 24, "lr": 9.972152140634019e-05} +{"train_loss": 0.026647670194506645, "global_step": 2883, "epoch": 24, "lr": 9.97212878537066e-05} +{"train_loss": 0.01962871477007866, "global_step": 2884, "epoch": 24, "lr": 9.972105420345058e-05} +{"train_loss": 0.028268225491046906, "global_step": 2885, "epoch": 24, "lr": 9.972082045557258e-05} +{"train_loss": 0.02238747663795948, "global_step": 2886, "epoch": 24, "lr": 9.972058661007306e-05} +{"train_loss": 0.02389342710375786, "global_step": 2887, "epoch": 24, "lr": 9.97203526669525e-05} +{"train_loss": 0.017475668340921402, "global_step": 2888, "epoch": 24, "lr": 9.972011862621133e-05} +{"train_loss": 0.026574332267045975, "global_step": 2889, "epoch": 24, "lr": 9.971988448785001e-05} +{"train_loss": 0.02228330448269844, "global_step": 2890, "epoch": 24, "lr": 9.9719650251869e-05} +{"train_loss": 0.021185098215937614, "global_step": 2891, "epoch": 24, "lr": 9.971941591826879e-05} +{"train_loss": 0.01871931366622448, "global_step": 2892, "epoch": 24, "lr": 9.97191814870498e-05} +{"train_loss": 0.026722397655248642, "global_step": 2893, "epoch": 24, "lr": 9.971894695821254e-05} +{"train_loss": 0.02230670675635338, "global_step": 2894, "epoch": 24, "lr": 9.97187123317574e-05} +{"train_loss": 0.028339117765426636, "global_step": 2895, "epoch": 24, "lr": 9.97184776076849e-05} +{"train_loss": 0.022511709481477737, "global_step": 2896, "epoch": 24, "lr": 9.971824278599549e-05} +{"train_loss": 0.02417326718568802, "global_step": 2897, "epoch": 24, "lr": 9.97180078666896e-05} +{"train_loss": 0.019014030694961548, "global_step": 2898, "epoch": 24, "lr": 9.971777284976774e-05} +{"train_loss": 0.019589973613619804, "global_step": 2899, "epoch": 24, "lr": 9.971753773523032e-05} +{"train_loss": 0.026914402842521667, "global_step": 2900, "epoch": 24, "lr": 9.971730252307783e-05} +{"train_loss": 0.02125665359199047, "global_step": 2901, "epoch": 24, "lr": 9.971706721331073e-05} +{"train_loss": 0.022929765284061432, "global_step": 2902, "epoch": 24, "lr": 9.971683180592948e-05} +{"train_loss": 0.022607190534472466, "global_step": 2903, "epoch": 24, "lr": 9.971659630093455e-05} +{"train_loss": 0.022319253534078598, "global_step": 2904, "epoch": 24, "lr": 9.97163606983264e-05} +{"train_loss": 0.02525176666676998, "global_step": 2905, "epoch": 24, "lr": 9.971612499810546e-05} +{"train_loss": 0.02576564997434616, "global_step": 2906, "epoch": 24, "lr": 9.971588920027224e-05} +{"train_loss": 0.024783233180642128, "global_step": 2907, "epoch": 24, "lr": 9.971565330482718e-05} +{"train_loss": 0.020607290789484978, "global_step": 2908, "epoch": 24, "lr": 9.971541731177074e-05} +{"train_loss": 0.025014305487275124, "global_step": 2909, "epoch": 24, "lr": 9.97151812211034e-05} +{"train_loss": 0.02805822715163231, "global_step": 2910, "epoch": 24, "lr": 9.971494503282561e-05} +{"train_loss": 0.02369854971766472, "global_step": 2911, "epoch": 24, "lr": 9.971470874693784e-05} +{"train_loss": 0.02549559436738491, "global_step": 2912, "epoch": 24, "lr": 9.971447236344053e-05} +{"train_loss": 0.018293388187885284, "global_step": 2913, "epoch": 24, "lr": 9.97142358823342e-05} +{"train_loss": 0.018265683203935623, "global_step": 2914, "epoch": 24, "lr": 9.971399930361925e-05} +{"train_loss": 0.023833347484469414, "global_step": 2915, "epoch": 24, "lr": 9.971376262729618e-05} +{"train_loss": 0.027210840955376625, "global_step": 2916, "epoch": 24, "lr": 9.971352585336545e-05} +{"train_loss": 0.015138903632760048, "global_step": 2917, "epoch": 24, "lr": 9.971328898182752e-05} +{"train_loss": 0.025643642991781235, "global_step": 2918, "epoch": 24, "lr": 9.971305201268286e-05} +{"train_loss": 0.018671125173568726, "global_step": 2919, "epoch": 24, "lr": 9.971281494593194e-05} +{"train_loss": 0.02571120113134384, "global_step": 2920, "epoch": 24, "lr": 9.971257778157521e-05} +{"train_loss": 0.025350773707032204, "global_step": 2921, "epoch": 24, "lr": 9.971234051961315e-05} +{"train_loss": 0.023930378258228302, "global_step": 2922, "epoch": 24, "lr": 9.971210316004622e-05} +{"train_loss": 0.01882779225707054, "global_step": 2923, "epoch": 24, "lr": 9.97118657028749e-05} +{"train_loss": 0.030553283169865608, "global_step": 2924, "epoch": 24, "lr": 9.971162814809962e-05} +{"train_loss": 0.01570451259613037, "global_step": 2925, "epoch": 24, "lr": 9.971139049572086e-05} +{"train_loss": 0.023586425930261612, "global_step": 2926, "epoch": 24, "lr": 9.971115274573912e-05} +{"train_loss": 0.022875947877764702, "global_step": 2927, "epoch": 24, "lr": 9.971091489815485e-05} +{"train_loss": 0.028808999806642532, "global_step": 2928, "epoch": 24, "lr": 9.971067695296849e-05} +{"train_loss": 0.021597424522042274, "global_step": 2929, "epoch": 24, "lr": 9.971043891018053e-05} +{"train_loss": 0.02867533266544342, "global_step": 2930, "epoch": 24, "lr": 9.971020076979142e-05} +{"train_loss": 0.019515186548233032, "global_step": 2931, "epoch": 24, "lr": 9.970996253180168e-05} +{"train_loss": 0.02283543162047863, "global_step": 2932, "epoch": 24, "lr": 9.970972419621171e-05} +{"train_loss": 0.018390748649835587, "global_step": 2933, "epoch": 24, "lr": 9.970948576302201e-05} +{"train_loss": 0.022026045247912407, "global_step": 2934, "epoch": 24, "lr": 9.970924723223305e-05} +{"train_loss": 0.024540191516280174, "global_step": 2935, "epoch": 24, "lr": 9.970900860384529e-05} +{"train_loss": 0.024807875975966454, "global_step": 2936, "epoch": 24, "lr": 9.970876987785919e-05} +{"train_loss": 0.02312857285141945, "global_step": 2937, "epoch": 24, "lr": 9.970853105427526e-05} +{"train_loss": 0.021427743136882782, "global_step": 2938, "epoch": 24, "lr": 9.970829213309392e-05} +{"train_loss": 0.015801265835762024, "global_step": 2939, "epoch": 24, "lr": 9.970805311431567e-05} +{"train_loss": 0.023682842031121254, "global_step": 2940, "epoch": 24, "lr": 9.970781399794096e-05} +{"train_loss": 0.02000124379992485, "global_step": 2941, "epoch": 24, "lr": 9.970757478397028e-05} +{"train_loss": 0.0188693068921566, "global_step": 2942, "epoch": 24, "lr": 9.970733547240407e-05} +{"train_loss": 0.015275858342647552, "global_step": 2943, "epoch": 24, "lr": 9.970709606324282e-05} +{"train_loss": 0.02510298602283001, "global_step": 2944, "epoch": 24, "lr": 9.970685655648702e-05} +{"train_loss": 0.021003438159823418, "global_step": 2945, "epoch": 24, "lr": 9.97066169521371e-05} +{"train_loss": 0.02217884175479412, "global_step": 2946, "epoch": 24, "lr": 9.970637725019354e-05} +{"train_loss": 0.021410448476672173, "global_step": 2947, "epoch": 24, "lr": 9.970613745065682e-05} +{"train_loss": 0.018543828278779984, "global_step": 2948, "epoch": 24, "lr": 9.970589755352741e-05} +{"train_loss": 0.016846608370542526, "global_step": 2949, "epoch": 24, "lr": 9.970565755880578e-05} +{"train_loss": 0.021210407838225365, "global_step": 2950, "epoch": 24, "lr": 9.970541746649243e-05} +{"train_loss": 0.019573461264371872, "global_step": 2951, "epoch": 24, "lr": 9.970517727658777e-05} +{"train_loss": 0.022798117250204086, "global_step": 2952, "epoch": 24, "lr": 9.970493698909232e-05} +{"train_loss": 0.017223265022039413, "global_step": 2953, "epoch": 24, "lr": 9.970469660400653e-05} +{"train_loss": 0.021181780844926834, "global_step": 2954, "epoch": 24, "lr": 9.970445612133088e-05} +{"train_loss": 0.02083861082792282, "global_step": 2955, "epoch": 24, "lr": 9.970421554106584e-05} +{"train_loss": 0.018999947234988213, "global_step": 2956, "epoch": 24, "lr": 9.970397486321187e-05} +{"train_loss": 0.01580902747809887, "global_step": 2957, "epoch": 24, "lr": 9.970373408776948e-05} +{"train_loss": 0.025307662785053253, "global_step": 2958, "epoch": 24, "lr": 9.97034932147391e-05} +{"train_loss": 0.015082095749676228, "global_step": 2959, "epoch": 24, "lr": 9.970325224412125e-05} +{"train_loss": 0.021434633061289787, "global_step": 2960, "epoch": 24, "lr": 9.970301117591634e-05} +{"train_loss": 0.018838027492165565, "global_step": 2961, "epoch": 24, "lr": 9.970277001012489e-05} +{"train_loss": 0.024081043899059296, "global_step": 2962, "epoch": 24, "lr": 9.970252874674737e-05} +{"train_loss": 0.02115345187485218, "global_step": 2963, "epoch": 24, "lr": 9.970228738578423e-05} +{"train_loss": 0.015951724722981453, "global_step": 2964, "epoch": 24, "lr": 9.970204592723597e-05} +{"train_loss": 0.01651838608086109, "global_step": 2965, "epoch": 24, "lr": 9.970180437110305e-05} +{"train_loss": 0.01406935602426529, "global_step": 2966, "epoch": 24, "lr": 9.970156271738594e-05} +{"train_loss": 0.023221438750624657, "global_step": 2967, "epoch": 24, "lr": 9.970132096608513e-05} +{"train_loss": 0.024845076724886894, "global_step": 2968, "epoch": 24, "lr": 9.970107911720109e-05} +{"train_loss": 0.013438533060252666, "global_step": 2969, "epoch": 24, "lr": 9.970083717073428e-05} +{"train_loss": 0.01537081878632307, "global_step": 2970, "epoch": 24, "lr": 9.970059512668518e-05} +{"train_loss": 0.02173457108438015, "global_step": 2971, "epoch": 24, "lr": 9.970035298505428e-05} +{"train_loss": 0.02349495142698288, "global_step": 2972, "epoch": 24, "lr": 9.970011074584205e-05} +{"train_loss": 0.01801401376724243, "global_step": 2973, "epoch": 24, "lr": 9.969986840904896e-05} +{"train_loss": 0.02219660466677752, "global_step": 2974, "epoch": 24, "lr": 9.969962597467548e-05, "val_loss": 0.03171706199645996} +{"train_loss": 0.02371376007795334, "global_step": 2975, "epoch": 25, "lr": 9.969938344272211e-05} +{"train_loss": 0.022220535203814507, "global_step": 2976, "epoch": 25, "lr": 9.96991408131893e-05} +{"train_loss": 0.023460499942302704, "global_step": 2977, "epoch": 25, "lr": 9.969889808607753e-05} +{"train_loss": 0.02651936374604702, "global_step": 2978, "epoch": 25, "lr": 9.969865526138728e-05} +{"train_loss": 0.020251765847206116, "global_step": 2979, "epoch": 25, "lr": 9.969841233911905e-05} +{"train_loss": 0.02550504542887211, "global_step": 2980, "epoch": 25, "lr": 9.969816931927329e-05} +{"train_loss": 0.020231014117598534, "global_step": 2981, "epoch": 25, "lr": 9.969792620185048e-05} +{"train_loss": 0.01737252250313759, "global_step": 2982, "epoch": 25, "lr": 9.969768298685112e-05} +{"train_loss": 0.02420843206346035, "global_step": 2983, "epoch": 25, "lr": 9.969743967427564e-05} +{"train_loss": 0.024725625291466713, "global_step": 2984, "epoch": 25, "lr": 9.969719626412456e-05} +{"train_loss": 0.01256995927542448, "global_step": 2985, "epoch": 25, "lr": 9.969695275639834e-05} +{"train_loss": 0.023034941405057907, "global_step": 2986, "epoch": 25, "lr": 9.969670915109747e-05} +{"train_loss": 0.020506083965301514, "global_step": 2987, "epoch": 25, "lr": 9.969646544822242e-05} +{"train_loss": 0.019998449832201004, "global_step": 2988, "epoch": 25, "lr": 9.969622164777366e-05} +{"train_loss": 0.017480242997407913, "global_step": 2989, "epoch": 25, "lr": 9.969597774975167e-05} +{"train_loss": 0.020834265276789665, "global_step": 2990, "epoch": 25, "lr": 9.969573375415696e-05} +{"train_loss": 0.023513469845056534, "global_step": 2991, "epoch": 25, "lr": 9.969548966098998e-05} +{"train_loss": 0.01810559630393982, "global_step": 2992, "epoch": 25, "lr": 9.969524547025122e-05} +{"train_loss": 0.022123130038380623, "global_step": 2993, "epoch": 25, "lr": 9.969500118194114e-05} +{"train_loss": 0.021610353142023087, "global_step": 2994, "epoch": 25, "lr": 9.969475679606024e-05} +{"train_loss": 0.020604560151696205, "global_step": 2995, "epoch": 25, "lr": 9.9694512312609e-05} +{"train_loss": 0.019222719594836235, "global_step": 2996, "epoch": 25, "lr": 9.969426773158789e-05} +{"train_loss": 0.022471852600574493, "global_step": 2997, "epoch": 25, "lr": 9.969402305299739e-05} +{"train_loss": 0.019111331552267075, "global_step": 2998, "epoch": 25, "lr": 9.969377827683799e-05} +{"train_loss": 0.019204962998628616, "global_step": 2999, "epoch": 25, "lr": 9.969353340311016e-05} +{"train_loss": 0.018278663977980614, "global_step": 3000, "epoch": 25, "lr": 9.969328843181438e-05} +{"train_loss": 0.014366604387760162, "global_step": 3001, "epoch": 25, "lr": 9.969304336295115e-05} +{"train_loss": 0.02257118932902813, "global_step": 3002, "epoch": 25, "lr": 9.969279819652094e-05} +{"train_loss": 0.0151672987267375, "global_step": 3003, "epoch": 25, "lr": 9.969255293252422e-05} +{"train_loss": 0.023218395188450813, "global_step": 3004, "epoch": 25, "lr": 9.969230757096149e-05} +{"train_loss": 0.02305786684155464, "global_step": 3005, "epoch": 25, "lr": 9.969206211183322e-05} +{"train_loss": 0.01896524429321289, "global_step": 3006, "epoch": 25, "lr": 9.969181655513989e-05} +{"train_loss": 0.017182959243655205, "global_step": 3007, "epoch": 25, "lr": 9.9691570900882e-05} +{"train_loss": 0.021641859784722328, "global_step": 3008, "epoch": 25, "lr": 9.969132514906001e-05} +{"train_loss": 0.01970786787569523, "global_step": 3009, "epoch": 25, "lr": 9.96910792996744e-05} +{"train_loss": 0.022281114012002945, "global_step": 3010, "epoch": 25, "lr": 9.969083335272568e-05} +{"train_loss": 0.014802011661231518, "global_step": 3011, "epoch": 25, "lr": 9.969058730821433e-05} +{"train_loss": 0.028987806290388107, "global_step": 3012, "epoch": 25, "lr": 9.96903411661408e-05} +{"train_loss": 0.017657676711678505, "global_step": 3013, "epoch": 25, "lr": 9.96900949265056e-05} +{"train_loss": 0.019656475633382797, "global_step": 3014, "epoch": 25, "lr": 9.96898485893092e-05} +{"train_loss": 0.01860777474939823, "global_step": 3015, "epoch": 25, "lr": 9.968960215455209e-05} +{"train_loss": 0.02271299809217453, "global_step": 3016, "epoch": 25, "lr": 9.968935562223476e-05} +{"train_loss": 0.021531080827116966, "global_step": 3017, "epoch": 25, "lr": 9.968910899235769e-05} +{"train_loss": 0.015330691821873188, "global_step": 3018, "epoch": 25, "lr": 9.968886226492137e-05} +{"train_loss": 0.02096690982580185, "global_step": 3019, "epoch": 25, "lr": 9.968861543992627e-05} +{"train_loss": 0.022504134103655815, "global_step": 3020, "epoch": 25, "lr": 9.968836851737289e-05} +{"train_loss": 0.019064946100115776, "global_step": 3021, "epoch": 25, "lr": 9.968812149726169e-05} +{"train_loss": 0.02875414490699768, "global_step": 3022, "epoch": 25, "lr": 9.968787437959318e-05} +{"train_loss": 0.01718677580356598, "global_step": 3023, "epoch": 25, "lr": 9.968762716436784e-05} +{"train_loss": 0.01807233691215515, "global_step": 3024, "epoch": 25, "lr": 9.968737985158615e-05} +{"train_loss": 0.02211536280810833, "global_step": 3025, "epoch": 25, "lr": 9.96871324412486e-05} +{"train_loss": 0.022427741438150406, "global_step": 3026, "epoch": 25, "lr": 9.968688493335567e-05} +{"train_loss": 0.02091694064438343, "global_step": 3027, "epoch": 25, "lr": 9.968663732790785e-05} +{"train_loss": 0.030571946874260902, "global_step": 3028, "epoch": 25, "lr": 9.968638962490563e-05} +{"train_loss": 0.019774723798036575, "global_step": 3029, "epoch": 25, "lr": 9.968614182434949e-05} +{"train_loss": 0.018384797498583794, "global_step": 3030, "epoch": 25, "lr": 9.968589392623992e-05} +{"train_loss": 0.031136583536863327, "global_step": 3031, "epoch": 25, "lr": 9.96856459305774e-05} +{"train_loss": 0.016191083937883377, "global_step": 3032, "epoch": 25, "lr": 9.968539783736242e-05} +{"train_loss": 0.021497854962944984, "global_step": 3033, "epoch": 25, "lr": 9.968514964659548e-05} +{"train_loss": 0.027004221454262733, "global_step": 3034, "epoch": 25, "lr": 9.968490135827706e-05} +{"train_loss": 0.021688062697649002, "global_step": 3035, "epoch": 25, "lr": 9.968465297240763e-05} +{"train_loss": 0.015695495530962944, "global_step": 3036, "epoch": 25, "lr": 9.96844044889877e-05} +{"train_loss": 0.02776372991502285, "global_step": 3037, "epoch": 25, "lr": 9.968415590801774e-05} +{"train_loss": 0.025115476921200752, "global_step": 3038, "epoch": 25, "lr": 9.968390722949826e-05} +{"train_loss": 0.025652030482888222, "global_step": 3039, "epoch": 25, "lr": 9.968365845342973e-05} +{"train_loss": 0.026793962344527245, "global_step": 3040, "epoch": 25, "lr": 9.968340957981265e-05} +{"train_loss": 0.016183000057935715, "global_step": 3041, "epoch": 25, "lr": 9.96831606086475e-05} +{"train_loss": 0.019431162625551224, "global_step": 3042, "epoch": 25, "lr": 9.968291153993477e-05} +{"train_loss": 0.019216639921069145, "global_step": 3043, "epoch": 25, "lr": 9.968266237367496e-05} +{"train_loss": 0.019294224679470062, "global_step": 3044, "epoch": 25, "lr": 9.968241310986855e-05} +{"train_loss": 0.025966010987758636, "global_step": 3045, "epoch": 25, "lr": 9.9682163748516e-05} +{"train_loss": 0.023234186694025993, "global_step": 3046, "epoch": 25, "lr": 9.968191428961786e-05} +{"train_loss": 0.016171762719750404, "global_step": 3047, "epoch": 25, "lr": 9.968166473317459e-05} +{"train_loss": 0.02479473128914833, "global_step": 3048, "epoch": 25, "lr": 9.968141507918666e-05} +{"train_loss": 0.020554816350340843, "global_step": 3049, "epoch": 25, "lr": 9.968116532765458e-05} +{"train_loss": 0.02006162703037262, "global_step": 3050, "epoch": 25, "lr": 9.968091547857886e-05} +{"train_loss": 0.023726124316453934, "global_step": 3051, "epoch": 25, "lr": 9.968066553195995e-05} +{"train_loss": 0.021696696057915688, "global_step": 3052, "epoch": 25, "lr": 9.968041548779839e-05} +{"train_loss": 0.019372856244444847, "global_step": 3053, "epoch": 25, "lr": 9.968016534609461e-05} +{"train_loss": 0.025987813249230385, "global_step": 3054, "epoch": 25, "lr": 9.967991510684915e-05} +{"train_loss": 0.02136886678636074, "global_step": 3055, "epoch": 25, "lr": 9.967966477006248e-05} +{"train_loss": 0.022814834490418434, "global_step": 3056, "epoch": 25, "lr": 9.967941433573509e-05} +{"train_loss": 0.01899341680109501, "global_step": 3057, "epoch": 25, "lr": 9.967916380386748e-05} +{"train_loss": 0.020979780703783035, "global_step": 3058, "epoch": 25, "lr": 9.967891317446014e-05} +{"train_loss": 0.025505220517516136, "global_step": 3059, "epoch": 25, "lr": 9.967866244751355e-05} +{"train_loss": 0.018092256039381027, "global_step": 3060, "epoch": 25, "lr": 9.967841162302824e-05} +{"train_loss": 0.0180867537856102, "global_step": 3061, "epoch": 25, "lr": 9.967816070100466e-05} +{"train_loss": 0.026573602110147476, "global_step": 3062, "epoch": 25, "lr": 9.967790968144333e-05} +{"train_loss": 0.0187064241617918, "global_step": 3063, "epoch": 25, "lr": 9.967765856434473e-05} +{"train_loss": 0.01905277743935585, "global_step": 3064, "epoch": 25, "lr": 9.967740734970934e-05} +{"train_loss": 0.017695218324661255, "global_step": 3065, "epoch": 25, "lr": 9.967715603753767e-05} +{"train_loss": 0.028260130435228348, "global_step": 3066, "epoch": 25, "lr": 9.967690462783022e-05} +{"train_loss": 0.019128121435642242, "global_step": 3067, "epoch": 25, "lr": 9.967665312058746e-05} +{"train_loss": 0.022693486884236336, "global_step": 3068, "epoch": 25, "lr": 9.967640151580992e-05} +{"train_loss": 0.024496713653206825, "global_step": 3069, "epoch": 25, "lr": 9.967614981349806e-05} +{"train_loss": 0.01742701046168804, "global_step": 3070, "epoch": 25, "lr": 9.96758980136524e-05} +{"train_loss": 0.028472110629081726, "global_step": 3071, "epoch": 25, "lr": 9.96756461162734e-05} +{"train_loss": 0.026147974655032158, "global_step": 3072, "epoch": 25, "lr": 9.96753941213616e-05} +{"train_loss": 0.019334256649017334, "global_step": 3073, "epoch": 25, "lr": 9.967514202891746e-05} +{"train_loss": 0.026438208296895027, "global_step": 3074, "epoch": 25, "lr": 9.967488983894147e-05} +{"train_loss": 0.02375328168272972, "global_step": 3075, "epoch": 25, "lr": 9.967463755143415e-05} +{"train_loss": 0.012110401876270771, "global_step": 3076, "epoch": 25, "lr": 9.9674385166396e-05} +{"train_loss": 0.025926340371370316, "global_step": 3077, "epoch": 25, "lr": 9.967413268382749e-05} +{"train_loss": 0.020972777158021927, "global_step": 3078, "epoch": 25, "lr": 9.967388010372913e-05} +{"train_loss": 0.018287293612957, "global_step": 3079, "epoch": 25, "lr": 9.967362742610141e-05} +{"train_loss": 0.020582079887390137, "global_step": 3080, "epoch": 25, "lr": 9.967337465094484e-05} +{"train_loss": 0.025693608447909355, "global_step": 3081, "epoch": 25, "lr": 9.967312177825989e-05} +{"train_loss": 0.0283050574362278, "global_step": 3082, "epoch": 25, "lr": 9.967286880804709e-05} +{"train_loss": 0.02441529370844364, "global_step": 3083, "epoch": 25, "lr": 9.96726157403069e-05} +{"train_loss": 0.019795669242739677, "global_step": 3084, "epoch": 25, "lr": 9.967236257503985e-05} +{"train_loss": 0.020361129194498062, "global_step": 3085, "epoch": 25, "lr": 9.967210931224642e-05} +{"train_loss": 0.025785548612475395, "global_step": 3086, "epoch": 25, "lr": 9.96718559519271e-05} +{"train_loss": 0.015756843611598015, "global_step": 3087, "epoch": 25, "lr": 9.96716024940824e-05} +{"train_loss": 0.024575430899858475, "global_step": 3088, "epoch": 25, "lr": 9.967134893871283e-05} +{"train_loss": 0.01983514428138733, "global_step": 3089, "epoch": 25, "lr": 9.967109528581886e-05} +{"train_loss": 0.01527370885014534, "global_step": 3090, "epoch": 25, "lr": 9.9670841535401e-05} +{"train_loss": 0.022106792777776718, "global_step": 3091, "epoch": 25, "lr": 9.967058768745976e-05} +{"train_loss": 0.025847407057881355, "global_step": 3092, "epoch": 25, "lr": 9.967033374199561e-05} +{"train_loss": 0.02140984170044921, "global_step": 3093, "epoch": 25, "lr": 9.967007969900908e-05, "val_loss": 0.02426368184387684, "train_action_mse_error": 0.001850793487392366} +{"train_loss": 0.030355164781212807, "global_step": 3094, "epoch": 26, "lr": 9.966982555850067e-05} +{"train_loss": 0.020515747368335724, "global_step": 3095, "epoch": 26, "lr": 9.966957132047083e-05} +{"train_loss": 0.0246360432356596, "global_step": 3096, "epoch": 26, "lr": 9.966931698492011e-05} +{"train_loss": 0.020778382197022438, "global_step": 3097, "epoch": 26, "lr": 9.9669062551849e-05} +{"train_loss": 0.018251905217766762, "global_step": 3098, "epoch": 26, "lr": 9.966880802125797e-05} +{"train_loss": 0.02145984396338463, "global_step": 3099, "epoch": 26, "lr": 9.966855339314756e-05} +{"train_loss": 0.02854277938604355, "global_step": 3100, "epoch": 26, "lr": 9.966829866751826e-05} +{"train_loss": 0.021996142342686653, "global_step": 3101, "epoch": 26, "lr": 9.966804384437054e-05} +{"train_loss": 0.0249306783080101, "global_step": 3102, "epoch": 26, "lr": 9.966778892370494e-05} +{"train_loss": 0.024437667801976204, "global_step": 3103, "epoch": 26, "lr": 9.966753390552193e-05} +{"train_loss": 0.02119695395231247, "global_step": 3104, "epoch": 26, "lr": 9.966727878982203e-05} +{"train_loss": 0.016625937074422836, "global_step": 3105, "epoch": 26, "lr": 9.966702357660572e-05} +{"train_loss": 0.03231735900044441, "global_step": 3106, "epoch": 26, "lr": 9.966676826587353e-05} +{"train_loss": 0.020735014230012894, "global_step": 3107, "epoch": 26, "lr": 9.966651285762593e-05} +{"train_loss": 0.01765846088528633, "global_step": 3108, "epoch": 26, "lr": 9.966625735186346e-05} +{"train_loss": 0.021281488239765167, "global_step": 3109, "epoch": 26, "lr": 9.96660017485866e-05} +{"train_loss": 0.021967096254229546, "global_step": 3110, "epoch": 26, "lr": 9.966574604779584e-05} +{"train_loss": 0.022720124572515488, "global_step": 3111, "epoch": 26, "lr": 9.96654902494917e-05} +{"train_loss": 0.0180037971585989, "global_step": 3112, "epoch": 26, "lr": 9.966523435367468e-05} +{"train_loss": 0.022054234519600868, "global_step": 3113, "epoch": 26, "lr": 9.966497836034525e-05} +{"train_loss": 0.01862461306154728, "global_step": 3114, "epoch": 26, "lr": 9.966472226950396e-05} +{"train_loss": 0.019139017909765244, "global_step": 3115, "epoch": 26, "lr": 9.96644660811513e-05} +{"train_loss": 0.018592199310660362, "global_step": 3116, "epoch": 26, "lr": 9.966420979528776e-05} +{"train_loss": 0.022939452901482582, "global_step": 3117, "epoch": 26, "lr": 9.966395341191385e-05} +{"train_loss": 0.02144666202366352, "global_step": 3118, "epoch": 26, "lr": 9.966369693103008e-05} +{"train_loss": 0.024304743856191635, "global_step": 3119, "epoch": 26, "lr": 9.966344035263695e-05} +{"train_loss": 0.02325059287250042, "global_step": 3120, "epoch": 26, "lr": 9.966318367673495e-05} +{"train_loss": 0.02164601907134056, "global_step": 3121, "epoch": 26, "lr": 9.96629269033246e-05} +{"train_loss": 0.0193331241607666, "global_step": 3122, "epoch": 26, "lr": 9.966267003240638e-05} +{"train_loss": 0.022486742585897446, "global_step": 3123, "epoch": 26, "lr": 9.966241306398084e-05} +{"train_loss": 0.01990155689418316, "global_step": 3124, "epoch": 26, "lr": 9.966215599804845e-05} +{"train_loss": 0.018865935504436493, "global_step": 3125, "epoch": 26, "lr": 9.966189883460972e-05} +{"train_loss": 0.024935923516750336, "global_step": 3126, "epoch": 26, "lr": 9.966164157366516e-05} +{"train_loss": 0.015218928456306458, "global_step": 3127, "epoch": 26, "lr": 9.966138421521527e-05} +{"train_loss": 0.022373026236891747, "global_step": 3128, "epoch": 26, "lr": 9.966112675926055e-05} +{"train_loss": 0.023641737177968025, "global_step": 3129, "epoch": 26, "lr": 9.966086920580151e-05} +{"train_loss": 0.02824654057621956, "global_step": 3130, "epoch": 26, "lr": 9.966061155483868e-05} +{"train_loss": 0.017706293612718582, "global_step": 3131, "epoch": 26, "lr": 9.966035380637254e-05} +{"train_loss": 0.025372376665472984, "global_step": 3132, "epoch": 26, "lr": 9.966009596040358e-05} +{"train_loss": 0.02456849440932274, "global_step": 3133, "epoch": 26, "lr": 9.965983801693235e-05} +{"train_loss": 0.01732482574880123, "global_step": 3134, "epoch": 26, "lr": 9.965957997595931e-05} +{"train_loss": 0.022504236549139023, "global_step": 3135, "epoch": 26, "lr": 9.965932183748501e-05} +{"train_loss": 0.024728622287511826, "global_step": 3136, "epoch": 26, "lr": 9.965906360150993e-05} +{"train_loss": 0.023454837501049042, "global_step": 3137, "epoch": 26, "lr": 9.965880526803459e-05} +{"train_loss": 0.026431184262037277, "global_step": 3138, "epoch": 26, "lr": 9.965854683705948e-05} +{"train_loss": 0.019699353724718094, "global_step": 3139, "epoch": 26, "lr": 9.965828830858512e-05} +{"train_loss": 0.021351806819438934, "global_step": 3140, "epoch": 26, "lr": 9.965802968261201e-05} +{"train_loss": 0.02236381731927395, "global_step": 3141, "epoch": 26, "lr": 9.965777095914068e-05} +{"train_loss": 0.027896881103515625, "global_step": 3142, "epoch": 26, "lr": 9.965751213817163e-05} +{"train_loss": 0.020947031676769257, "global_step": 3143, "epoch": 26, "lr": 9.965725321970533e-05} +{"train_loss": 0.01826498843729496, "global_step": 3144, "epoch": 26, "lr": 9.965699420374235e-05} +{"train_loss": 0.02406436577439308, "global_step": 3145, "epoch": 26, "lr": 9.965673509028315e-05} +{"train_loss": 0.021870935335755348, "global_step": 3146, "epoch": 26, "lr": 9.965647587932826e-05} +{"train_loss": 0.02345854602754116, "global_step": 3147, "epoch": 26, "lr": 9.965621657087818e-05} +{"train_loss": 0.030123205855488777, "global_step": 3148, "epoch": 26, "lr": 9.965595716493342e-05} +{"train_loss": 0.020507102832198143, "global_step": 3149, "epoch": 26, "lr": 9.96556976614945e-05} +{"train_loss": 0.016881175339221954, "global_step": 3150, "epoch": 26, "lr": 9.965543806056193e-05} +{"train_loss": 0.019033437594771385, "global_step": 3151, "epoch": 26, "lr": 9.96551783621362e-05} +{"train_loss": 0.02608725056052208, "global_step": 3152, "epoch": 26, "lr": 9.965491856621783e-05} +{"train_loss": 0.016324013471603394, "global_step": 3153, "epoch": 26, "lr": 9.965465867280734e-05} +{"train_loss": 0.024038486182689667, "global_step": 3154, "epoch": 26, "lr": 9.965439868190523e-05} +{"train_loss": 0.029923219233751297, "global_step": 3155, "epoch": 26, "lr": 9.965413859351201e-05} +{"train_loss": 0.0154794380068779, "global_step": 3156, "epoch": 26, "lr": 9.965387840762821e-05} +{"train_loss": 0.03006332367658615, "global_step": 3157, "epoch": 26, "lr": 9.965361812425431e-05} +{"train_loss": 0.016738224774599075, "global_step": 3158, "epoch": 26, "lr": 9.965335774339084e-05} +{"train_loss": 0.026625748723745346, "global_step": 3159, "epoch": 26, "lr": 9.96530972650383e-05} +{"train_loss": 0.0214109905064106, "global_step": 3160, "epoch": 26, "lr": 9.96528366891972e-05} +{"train_loss": 0.021285424008965492, "global_step": 3161, "epoch": 26, "lr": 9.965257601586809e-05} +{"train_loss": 0.020186718553304672, "global_step": 3162, "epoch": 26, "lr": 9.965231524505143e-05} +{"train_loss": 0.0154875498265028, "global_step": 3163, "epoch": 26, "lr": 9.965205437674775e-05} +{"train_loss": 0.028731027618050575, "global_step": 3164, "epoch": 26, "lr": 9.965179341095758e-05} +{"train_loss": 0.018647681921720505, "global_step": 3165, "epoch": 26, "lr": 9.965153234768141e-05} +{"train_loss": 0.01871846243739128, "global_step": 3166, "epoch": 26, "lr": 9.965127118691975e-05} +{"train_loss": 0.02775660715997219, "global_step": 3167, "epoch": 26, "lr": 9.965100992867313e-05} +{"train_loss": 0.018986379727721214, "global_step": 3168, "epoch": 26, "lr": 9.965074857294207e-05} +{"train_loss": 0.020741868764162064, "global_step": 3169, "epoch": 26, "lr": 9.965048711972707e-05} +{"train_loss": 0.015231207944452763, "global_step": 3170, "epoch": 26, "lr": 9.965022556902863e-05} +{"train_loss": 0.020000427961349487, "global_step": 3171, "epoch": 26, "lr": 9.964996392084728e-05} +{"train_loss": 0.020723361521959305, "global_step": 3172, "epoch": 26, "lr": 9.964970217518352e-05} +{"train_loss": 0.020029984414577484, "global_step": 3173, "epoch": 26, "lr": 9.964944033203789e-05} +{"train_loss": 0.02277507446706295, "global_step": 3174, "epoch": 26, "lr": 9.964917839141088e-05} +{"train_loss": 0.02386069856584072, "global_step": 3175, "epoch": 26, "lr": 9.964891635330302e-05} +{"train_loss": 0.026795830577611923, "global_step": 3176, "epoch": 26, "lr": 9.964865421771481e-05} +{"train_loss": 0.029447395354509354, "global_step": 3177, "epoch": 26, "lr": 9.964839198464677e-05} +{"train_loss": 0.01271680649369955, "global_step": 3178, "epoch": 26, "lr": 9.964812965409942e-05} +{"train_loss": 0.02266659587621689, "global_step": 3179, "epoch": 26, "lr": 9.964786722607329e-05} +{"train_loss": 0.014262853190302849, "global_step": 3180, "epoch": 26, "lr": 9.964760470056884e-05} +{"train_loss": 0.020569387823343277, "global_step": 3181, "epoch": 26, "lr": 9.964734207758665e-05} +{"train_loss": 0.018118616193532944, "global_step": 3182, "epoch": 26, "lr": 9.964707935712721e-05} +{"train_loss": 0.01619177870452404, "global_step": 3183, "epoch": 26, "lr": 9.964681653919101e-05} +{"train_loss": 0.02057279460132122, "global_step": 3184, "epoch": 26, "lr": 9.96465536237786e-05} +{"train_loss": 0.01815003901720047, "global_step": 3185, "epoch": 26, "lr": 9.96462906108905e-05} +{"train_loss": 0.023738181218504906, "global_step": 3186, "epoch": 26, "lr": 9.964602750052719e-05} +{"train_loss": 0.028557464480400085, "global_step": 3187, "epoch": 26, "lr": 9.964576429268921e-05} +{"train_loss": 0.021939164027571678, "global_step": 3188, "epoch": 26, "lr": 9.964550098737711e-05} +{"train_loss": 0.019384760409593582, "global_step": 3189, "epoch": 26, "lr": 9.964523758459134e-05} +{"train_loss": 0.020305974408984184, "global_step": 3190, "epoch": 26, "lr": 9.964497408433245e-05} +{"train_loss": 0.01815946213901043, "global_step": 3191, "epoch": 26, "lr": 9.964471048660097e-05} +{"train_loss": 0.02624819613993168, "global_step": 3192, "epoch": 26, "lr": 9.96444467913974e-05} +{"train_loss": 0.014873337931931019, "global_step": 3193, "epoch": 26, "lr": 9.964418299872225e-05} +{"train_loss": 0.016704188659787178, "global_step": 3194, "epoch": 26, "lr": 9.964391910857607e-05} +{"train_loss": 0.023473244160413742, "global_step": 3195, "epoch": 26, "lr": 9.964365512095935e-05} +{"train_loss": 0.02560940943658352, "global_step": 3196, "epoch": 26, "lr": 9.964339103587261e-05} +{"train_loss": 0.025014659389853477, "global_step": 3197, "epoch": 26, "lr": 9.964312685331639e-05} +{"train_loss": 0.017688607797026634, "global_step": 3198, "epoch": 26, "lr": 9.964286257329119e-05} +{"train_loss": 0.023356910794973373, "global_step": 3199, "epoch": 26, "lr": 9.964259819579754e-05} +{"train_loss": 0.018339132890105247, "global_step": 3200, "epoch": 26, "lr": 9.964233372083594e-05} +{"train_loss": 0.03147027641534805, "global_step": 3201, "epoch": 26, "lr": 9.964206914840691e-05} +{"train_loss": 0.01963457092642784, "global_step": 3202, "epoch": 26, "lr": 9.964180447851099e-05} +{"train_loss": 0.015632908791303635, "global_step": 3203, "epoch": 26, "lr": 9.96415397111487e-05} +{"train_loss": 0.020373575389385223, "global_step": 3204, "epoch": 26, "lr": 9.964127484632054e-05} +{"train_loss": 0.02202673628926277, "global_step": 3205, "epoch": 26, "lr": 9.964100988402705e-05} +{"train_loss": 0.01625550352036953, "global_step": 3206, "epoch": 26, "lr": 9.964074482426872e-05} +{"train_loss": 0.023699935525655746, "global_step": 3207, "epoch": 26, "lr": 9.964047966704613e-05} +{"train_loss": 0.018159622326493263, "global_step": 3208, "epoch": 26, "lr": 9.964021441235974e-05} +{"train_loss": 0.02434086613357067, "global_step": 3209, "epoch": 26, "lr": 9.963994906021009e-05} +{"train_loss": 0.020389162003993988, "global_step": 3210, "epoch": 26, "lr": 9.96396836105977e-05} +{"train_loss": 0.02751881070435047, "global_step": 3211, "epoch": 26, "lr": 9.963941806352308e-05} +{"train_loss": 0.02178917301646551, "global_step": 3212, "epoch": 26, "lr": 9.963915241898679e-05, "val_loss": 0.030967818573117256} +{"train_loss": 0.02142220176756382, "global_step": 3213, "epoch": 27, "lr": 9.963888667698933e-05} +{"train_loss": 0.024018041789531708, "global_step": 3214, "epoch": 27, "lr": 9.963862083753119e-05} +{"train_loss": 0.024587761610746384, "global_step": 3215, "epoch": 27, "lr": 9.963835490061295e-05} +{"train_loss": 0.024598343297839165, "global_step": 3216, "epoch": 27, "lr": 9.963808886623509e-05} +{"train_loss": 0.020733589306473732, "global_step": 3217, "epoch": 27, "lr": 9.963782273439816e-05} +{"train_loss": 0.020099136978387833, "global_step": 3218, "epoch": 27, "lr": 9.963755650510264e-05} +{"train_loss": 0.02085610292851925, "global_step": 3219, "epoch": 27, "lr": 9.96372901783491e-05} +{"train_loss": 0.018812958151102066, "global_step": 3220, "epoch": 27, "lr": 9.963702375413806e-05} +{"train_loss": 0.019939474761486053, "global_step": 3221, "epoch": 27, "lr": 9.963675723247e-05} +{"train_loss": 0.02725461684167385, "global_step": 3222, "epoch": 27, "lr": 9.963649061334547e-05} +{"train_loss": 0.024205971509218216, "global_step": 3223, "epoch": 27, "lr": 9.963622389676501e-05} +{"train_loss": 0.020504161715507507, "global_step": 3224, "epoch": 27, "lr": 9.963595708272913e-05} +{"train_loss": 0.02295432798564434, "global_step": 3225, "epoch": 27, "lr": 9.963569017123833e-05} +{"train_loss": 0.018685966730117798, "global_step": 3226, "epoch": 27, "lr": 9.963542316229317e-05} +{"train_loss": 0.024041797965765, "global_step": 3227, "epoch": 27, "lr": 9.963515605589415e-05} +{"train_loss": 0.016051508486270905, "global_step": 3228, "epoch": 27, "lr": 9.963488885204182e-05} +{"train_loss": 0.019105171784758568, "global_step": 3229, "epoch": 27, "lr": 9.963462155073668e-05} +{"train_loss": 0.018984919413924217, "global_step": 3230, "epoch": 27, "lr": 9.963435415197926e-05} +{"train_loss": 0.020646611228585243, "global_step": 3231, "epoch": 27, "lr": 9.963408665577007e-05} +{"train_loss": 0.024098537862300873, "global_step": 3232, "epoch": 27, "lr": 9.96338190621097e-05} +{"train_loss": 0.019730936735868454, "global_step": 3233, "epoch": 27, "lr": 9.96335513709986e-05} +{"train_loss": 0.016598735004663467, "global_step": 3234, "epoch": 27, "lr": 9.96332835824373e-05} +{"train_loss": 0.020986635237932205, "global_step": 3235, "epoch": 27, "lr": 9.963301569642639e-05} +{"train_loss": 0.016207877546548843, "global_step": 3236, "epoch": 27, "lr": 9.963274771296633e-05} +{"train_loss": 0.02603820525109768, "global_step": 3237, "epoch": 27, "lr": 9.96324796320577e-05} +{"train_loss": 0.02357451058924198, "global_step": 3238, "epoch": 27, "lr": 9.963221145370098e-05} +{"train_loss": 0.015134302899241447, "global_step": 3239, "epoch": 27, "lr": 9.963194317789673e-05} +{"train_loss": 0.019359124824404716, "global_step": 3240, "epoch": 27, "lr": 9.963167480464544e-05} +{"train_loss": 0.021057603880763054, "global_step": 3241, "epoch": 27, "lr": 9.963140633394767e-05} +{"train_loss": 0.021082628518342972, "global_step": 3242, "epoch": 27, "lr": 9.963113776580393e-05} +{"train_loss": 0.019515100866556168, "global_step": 3243, "epoch": 27, "lr": 9.963086910021476e-05} +{"train_loss": 0.018297238275408745, "global_step": 3244, "epoch": 27, "lr": 9.963060033718068e-05} +{"train_loss": 0.018695248290896416, "global_step": 3245, "epoch": 27, "lr": 9.963033147670223e-05} +{"train_loss": 0.02672029286623001, "global_step": 3246, "epoch": 27, "lr": 9.963006251877991e-05} +{"train_loss": 0.012520426884293556, "global_step": 3247, "epoch": 27, "lr": 9.962979346341425e-05} +{"train_loss": 0.021327150985598564, "global_step": 3248, "epoch": 27, "lr": 9.962952431060583e-05} +{"train_loss": 0.015552947297692299, "global_step": 3249, "epoch": 27, "lr": 9.962925506035512e-05} +{"train_loss": 0.02529098652303219, "global_step": 3250, "epoch": 27, "lr": 9.962898571266267e-05} +{"train_loss": 0.017363719642162323, "global_step": 3251, "epoch": 27, "lr": 9.962871626752901e-05} +{"train_loss": 0.016815802082419395, "global_step": 3252, "epoch": 27, "lr": 9.962844672495466e-05} +{"train_loss": 0.015680557116866112, "global_step": 3253, "epoch": 27, "lr": 9.962817708494017e-05} +{"train_loss": 0.019801903516054153, "global_step": 3254, "epoch": 27, "lr": 9.962790734748606e-05} +{"train_loss": 0.019692344591021538, "global_step": 3255, "epoch": 27, "lr": 9.962763751259285e-05} +{"train_loss": 0.021098937839269638, "global_step": 3256, "epoch": 27, "lr": 9.962736758026107e-05} +{"train_loss": 0.02100895717740059, "global_step": 3257, "epoch": 27, "lr": 9.962709755049126e-05} +{"train_loss": 0.019655657932162285, "global_step": 3258, "epoch": 27, "lr": 9.962682742328394e-05} +{"train_loss": 0.028965570032596588, "global_step": 3259, "epoch": 27, "lr": 9.962655719863964e-05} +{"train_loss": 0.014091698452830315, "global_step": 3260, "epoch": 27, "lr": 9.962628687655892e-05} +{"train_loss": 0.01763947494328022, "global_step": 3261, "epoch": 27, "lr": 9.962601645704228e-05} +{"train_loss": 0.026747407391667366, "global_step": 3262, "epoch": 27, "lr": 9.962574594009024e-05} +{"train_loss": 0.028443653136491776, "global_step": 3263, "epoch": 27, "lr": 9.962547532570337e-05} +{"train_loss": 0.024138344451785088, "global_step": 3264, "epoch": 27, "lr": 9.962520461388219e-05} +{"train_loss": 0.02029448002576828, "global_step": 3265, "epoch": 27, "lr": 9.962493380462719e-05} +{"train_loss": 0.023041773587465286, "global_step": 3266, "epoch": 27, "lr": 9.962466289793895e-05} +{"train_loss": 0.025821514427661896, "global_step": 3267, "epoch": 27, "lr": 9.9624391893818e-05} +{"train_loss": 0.02277747355401516, "global_step": 3268, "epoch": 27, "lr": 9.962412079226484e-05} +{"train_loss": 0.02181435376405716, "global_step": 3269, "epoch": 27, "lr": 9.962384959328001e-05} +{"train_loss": 0.023305092006921768, "global_step": 3270, "epoch": 27, "lr": 9.962357829686408e-05} +{"train_loss": 0.021968966349959373, "global_step": 3271, "epoch": 27, "lr": 9.962330690301754e-05} +{"train_loss": 0.025046320632100105, "global_step": 3272, "epoch": 27, "lr": 9.962303541174094e-05} +{"train_loss": 0.014858686365187168, "global_step": 3273, "epoch": 27, "lr": 9.962276382303481e-05} +{"train_loss": 0.019750958308577538, "global_step": 3274, "epoch": 27, "lr": 9.962249213689969e-05} +{"train_loss": 0.01912824623286724, "global_step": 3275, "epoch": 27, "lr": 9.962222035333611e-05} +{"train_loss": 0.026035625487565994, "global_step": 3276, "epoch": 27, "lr": 9.962194847234461e-05} +{"train_loss": 0.024558883160352707, "global_step": 3277, "epoch": 27, "lr": 9.96216764939257e-05} +{"train_loss": 0.0249814223498106, "global_step": 3278, "epoch": 27, "lr": 9.962140441807992e-05} +{"train_loss": 0.02075742743909359, "global_step": 3279, "epoch": 27, "lr": 9.962113224480784e-05} +{"train_loss": 0.01763054169714451, "global_step": 3280, "epoch": 27, "lr": 9.962085997410995e-05} +{"train_loss": 0.026475390419363976, "global_step": 3281, "epoch": 27, "lr": 9.96205876059868e-05} +{"train_loss": 0.02035447210073471, "global_step": 3282, "epoch": 27, "lr": 9.962031514043894e-05} +{"train_loss": 0.015980053693056107, "global_step": 3283, "epoch": 27, "lr": 9.962004257746689e-05} +{"train_loss": 0.01946074329316616, "global_step": 3284, "epoch": 27, "lr": 9.961976991707119e-05} +{"train_loss": 0.02760843187570572, "global_step": 3285, "epoch": 27, "lr": 9.961949715925236e-05} +{"train_loss": 0.019089290872216225, "global_step": 3286, "epoch": 27, "lr": 9.961922430401096e-05} +{"train_loss": 0.016936978325247765, "global_step": 3287, "epoch": 27, "lr": 9.961895135134751e-05} +{"train_loss": 0.01893416978418827, "global_step": 3288, "epoch": 27, "lr": 9.961867830126255e-05} +{"train_loss": 0.022334737703204155, "global_step": 3289, "epoch": 27, "lr": 9.961840515375662e-05} +{"train_loss": 0.029882019385695457, "global_step": 3290, "epoch": 27, "lr": 9.961813190883025e-05} +{"train_loss": 0.015601488761603832, "global_step": 3291, "epoch": 27, "lr": 9.961785856648397e-05} +{"train_loss": 0.019344840198755264, "global_step": 3292, "epoch": 27, "lr": 9.961758512671832e-05} +{"train_loss": 0.016771355643868446, "global_step": 3293, "epoch": 27, "lr": 9.961731158953387e-05} +{"train_loss": 0.025759857147932053, "global_step": 3294, "epoch": 27, "lr": 9.961703795493111e-05} +{"train_loss": 0.01969393528997898, "global_step": 3295, "epoch": 27, "lr": 9.961676422291061e-05} +{"train_loss": 0.01891220174729824, "global_step": 3296, "epoch": 27, "lr": 9.961649039347289e-05} +{"train_loss": 0.01484810933470726, "global_step": 3297, "epoch": 27, "lr": 9.961621646661848e-05} +{"train_loss": 0.016003385186195374, "global_step": 3298, "epoch": 27, "lr": 9.961594244234793e-05} +{"train_loss": 0.023254867643117905, "global_step": 3299, "epoch": 27, "lr": 9.961566832066179e-05} +{"train_loss": 0.020201468840241432, "global_step": 3300, "epoch": 27, "lr": 9.961539410156058e-05} +{"train_loss": 0.019330643117427826, "global_step": 3301, "epoch": 27, "lr": 9.961511978504485e-05} +{"train_loss": 0.018668342381715775, "global_step": 3302, "epoch": 27, "lr": 9.961484537111512e-05} +{"train_loss": 0.022147286683321, "global_step": 3303, "epoch": 27, "lr": 9.961457085977195e-05} +{"train_loss": 0.017516694962978363, "global_step": 3304, "epoch": 27, "lr": 9.961429625101588e-05} +{"train_loss": 0.01662507839500904, "global_step": 3305, "epoch": 27, "lr": 9.961402154484742e-05} +{"train_loss": 0.023577306419610977, "global_step": 3306, "epoch": 27, "lr": 9.961374674126715e-05} +{"train_loss": 0.022298239171504974, "global_step": 3307, "epoch": 27, "lr": 9.961347184027559e-05} +{"train_loss": 0.020108958706259727, "global_step": 3308, "epoch": 27, "lr": 9.961319684187326e-05} +{"train_loss": 0.016762441024184227, "global_step": 3309, "epoch": 27, "lr": 9.961292174606071e-05} +{"train_loss": 0.02214459516108036, "global_step": 3310, "epoch": 27, "lr": 9.961264655283851e-05} +{"train_loss": 0.018718566745519638, "global_step": 3311, "epoch": 27, "lr": 9.961237126220717e-05} +{"train_loss": 0.02332749031484127, "global_step": 3312, "epoch": 27, "lr": 9.961209587416724e-05} +{"train_loss": 0.02225722000002861, "global_step": 3313, "epoch": 27, "lr": 9.961182038871927e-05} +{"train_loss": 0.019343875348567963, "global_step": 3314, "epoch": 27, "lr": 9.961154480586379e-05} +{"train_loss": 0.01996348612010479, "global_step": 3315, "epoch": 27, "lr": 9.961126912560133e-05} +{"train_loss": 0.021240947768092155, "global_step": 3316, "epoch": 27, "lr": 9.961099334793245e-05} +{"train_loss": 0.030821779742836952, "global_step": 3317, "epoch": 27, "lr": 9.961071747285769e-05} +{"train_loss": 0.021604051813483238, "global_step": 3318, "epoch": 27, "lr": 9.961044150037757e-05} +{"train_loss": 0.016601238399744034, "global_step": 3319, "epoch": 27, "lr": 9.961016543049266e-05} +{"train_loss": 0.02195601537823677, "global_step": 3320, "epoch": 27, "lr": 9.960988926320348e-05} +{"train_loss": 0.022065790370106697, "global_step": 3321, "epoch": 27, "lr": 9.96096129985106e-05} +{"train_loss": 0.014589255675673485, "global_step": 3322, "epoch": 27, "lr": 9.960933663641453e-05} +{"train_loss": 0.020263953134417534, "global_step": 3323, "epoch": 27, "lr": 9.960906017691582e-05} +{"train_loss": 0.017551638185977936, "global_step": 3324, "epoch": 27, "lr": 9.960878362001504e-05} +{"train_loss": 0.019518962129950523, "global_step": 3325, "epoch": 27, "lr": 9.960850696571271e-05} +{"train_loss": 0.01866339147090912, "global_step": 3326, "epoch": 27, "lr": 9.960823021400938e-05} +{"train_loss": 0.016000015661120415, "global_step": 3327, "epoch": 27, "lr": 9.960795336490559e-05} +{"train_loss": 0.018838126212358475, "global_step": 3328, "epoch": 27, "lr": 9.960767641840186e-05} +{"train_loss": 0.018432890996336937, "global_step": 3329, "epoch": 27, "lr": 9.960739937449876e-05} +{"train_loss": 0.01484172884374857, "global_step": 3330, "epoch": 27, "lr": 9.960712223319685e-05} +{"train_loss": 0.020611940914404995, "global_step": 3331, "epoch": 27, "lr": 9.960684499449666e-05, "val_loss": 0.03112037107348442} +{"train_loss": 0.021074486896395683, "global_step": 3332, "epoch": 28, "lr": 9.96065676583987e-05} +{"train_loss": 0.01885039545595646, "global_step": 3333, "epoch": 28, "lr": 9.960629022490358e-05} +{"train_loss": 0.01861586421728134, "global_step": 3334, "epoch": 28, "lr": 9.96060126940118e-05} +{"train_loss": 0.023221321403980255, "global_step": 3335, "epoch": 28, "lr": 9.96057350657239e-05} +{"train_loss": 0.017978481948375702, "global_step": 3336, "epoch": 28, "lr": 9.960545734004044e-05} +{"train_loss": 0.015366753563284874, "global_step": 3337, "epoch": 28, "lr": 9.960517951696197e-05} +{"train_loss": 0.01823706552386284, "global_step": 3338, "epoch": 28, "lr": 9.960490159648903e-05} +{"train_loss": 0.016369780525565147, "global_step": 3339, "epoch": 28, "lr": 9.960462357862216e-05} +{"train_loss": 0.015369383618235588, "global_step": 3340, "epoch": 28, "lr": 9.960434546336191e-05} +{"train_loss": 0.019873861223459244, "global_step": 3341, "epoch": 28, "lr": 9.960406725070883e-05} +{"train_loss": 0.0181718897074461, "global_step": 3342, "epoch": 28, "lr": 9.960378894066346e-05} +{"train_loss": 0.024319525808095932, "global_step": 3343, "epoch": 28, "lr": 9.960351053322636e-05} +{"train_loss": 0.023079128935933113, "global_step": 3344, "epoch": 28, "lr": 9.960323202839807e-05} +{"train_loss": 0.024098636582493782, "global_step": 3345, "epoch": 28, "lr": 9.960295342617911e-05} +{"train_loss": 0.02035363018512726, "global_step": 3346, "epoch": 28, "lr": 9.960267472657008e-05} +{"train_loss": 0.01377180963754654, "global_step": 3347, "epoch": 28, "lr": 9.960239592957148e-05} +{"train_loss": 0.019373685121536255, "global_step": 3348, "epoch": 28, "lr": 9.960211703518387e-05} +{"train_loss": 0.016173072159290314, "global_step": 3349, "epoch": 28, "lr": 9.960183804340782e-05} +{"train_loss": 0.024885015562176704, "global_step": 3350, "epoch": 28, "lr": 9.960155895424384e-05} +{"train_loss": 0.024309299886226654, "global_step": 3351, "epoch": 28, "lr": 9.960127976769252e-05} +{"train_loss": 0.022460533306002617, "global_step": 3352, "epoch": 28, "lr": 9.960100048375436e-05} +{"train_loss": 0.01828809827566147, "global_step": 3353, "epoch": 28, "lr": 9.960072110242995e-05} +{"train_loss": 0.017041068524122238, "global_step": 3354, "epoch": 28, "lr": 9.960044162371982e-05} +{"train_loss": 0.02421867474913597, "global_step": 3355, "epoch": 28, "lr": 9.960016204762453e-05} +{"train_loss": 0.022957241162657738, "global_step": 3356, "epoch": 28, "lr": 9.959988237414461e-05} +{"train_loss": 0.023691246286034584, "global_step": 3357, "epoch": 28, "lr": 9.959960260328062e-05} +{"train_loss": 0.018582966178655624, "global_step": 3358, "epoch": 28, "lr": 9.959932273503312e-05} +{"train_loss": 0.021461956202983856, "global_step": 3359, "epoch": 28, "lr": 9.959904276940264e-05} +{"train_loss": 0.015009493567049503, "global_step": 3360, "epoch": 28, "lr": 9.959876270638974e-05} +{"train_loss": 0.016869891434907913, "global_step": 3361, "epoch": 28, "lr": 9.959848254599496e-05} +{"train_loss": 0.02151319570839405, "global_step": 3362, "epoch": 28, "lr": 9.959820228821888e-05} +{"train_loss": 0.01828274130821228, "global_step": 3363, "epoch": 28, "lr": 9.959792193306201e-05} +{"train_loss": 0.024642447009682655, "global_step": 3364, "epoch": 28, "lr": 9.959764148052492e-05} +{"train_loss": 0.02721313200891018, "global_step": 3365, "epoch": 28, "lr": 9.959736093060816e-05} +{"train_loss": 0.015048367902636528, "global_step": 3366, "epoch": 28, "lr": 9.95970802833123e-05} +{"train_loss": 0.01559983380138874, "global_step": 3367, "epoch": 28, "lr": 9.959679953863785e-05} +{"train_loss": 0.0253896526992321, "global_step": 3368, "epoch": 28, "lr": 9.95965186965854e-05} +{"train_loss": 0.02182776667177677, "global_step": 3369, "epoch": 28, "lr": 9.959623775715546e-05} +{"train_loss": 0.020192183554172516, "global_step": 3370, "epoch": 28, "lr": 9.959595672034863e-05} +{"train_loss": 0.02185008116066456, "global_step": 3371, "epoch": 28, "lr": 9.959567558616542e-05} +{"train_loss": 0.014829576015472412, "global_step": 3372, "epoch": 28, "lr": 9.959539435460641e-05} +{"train_loss": 0.02117360197007656, "global_step": 3373, "epoch": 28, "lr": 9.959511302567213e-05} +{"train_loss": 0.01624743454158306, "global_step": 3374, "epoch": 28, "lr": 9.959483159936317e-05} +{"train_loss": 0.022227266803383827, "global_step": 3375, "epoch": 28, "lr": 9.959455007568002e-05} +{"train_loss": 0.018019046634435654, "global_step": 3376, "epoch": 28, "lr": 9.95942684546233e-05} +{"train_loss": 0.014472459442913532, "global_step": 3377, "epoch": 28, "lr": 9.95939867361935e-05} +{"train_loss": 0.019933832809329033, "global_step": 3378, "epoch": 28, "lr": 9.959370492039124e-05} +{"train_loss": 0.02225245162844658, "global_step": 3379, "epoch": 28, "lr": 9.959342300721702e-05} +{"train_loss": 0.02739279717206955, "global_step": 3380, "epoch": 28, "lr": 9.95931409966714e-05} +{"train_loss": 0.01770917698740959, "global_step": 3381, "epoch": 28, "lr": 9.959285888875498e-05} +{"train_loss": 0.023613495752215385, "global_step": 3382, "epoch": 28, "lr": 9.959257668346826e-05} +{"train_loss": 0.0202884953469038, "global_step": 3383, "epoch": 28, "lr": 9.959229438081182e-05} +{"train_loss": 0.0240520890802145, "global_step": 3384, "epoch": 28, "lr": 9.95920119807862e-05} +{"train_loss": 0.024795111268758774, "global_step": 3385, "epoch": 28, "lr": 9.959172948339198e-05} +{"train_loss": 0.025490788742899895, "global_step": 3386, "epoch": 28, "lr": 9.959144688862967e-05} +{"train_loss": 0.016023501753807068, "global_step": 3387, "epoch": 28, "lr": 9.959116419649986e-05} +{"train_loss": 0.018879270181059837, "global_step": 3388, "epoch": 28, "lr": 9.95908814070031e-05} +{"train_loss": 0.017614880576729774, "global_step": 3389, "epoch": 28, "lr": 9.959059852013994e-05} +{"train_loss": 0.020932061597704887, "global_step": 3390, "epoch": 28, "lr": 9.959031553591096e-05} +{"train_loss": 0.019262902438640594, "global_step": 3391, "epoch": 28, "lr": 9.959003245431667e-05} +{"train_loss": 0.02738017588853836, "global_step": 3392, "epoch": 28, "lr": 9.958974927535766e-05} +{"train_loss": 0.018271660432219505, "global_step": 3393, "epoch": 28, "lr": 9.958946599903447e-05} +{"train_loss": 0.014157101511955261, "global_step": 3394, "epoch": 28, "lr": 9.958918262534766e-05} +{"train_loss": 0.0181938037276268, "global_step": 3395, "epoch": 28, "lr": 9.95888991542978e-05} +{"train_loss": 0.02185114100575447, "global_step": 3396, "epoch": 28, "lr": 9.958861558588542e-05} +{"train_loss": 0.025663571432232857, "global_step": 3397, "epoch": 28, "lr": 9.958833192011109e-05} +{"train_loss": 0.017914094030857086, "global_step": 3398, "epoch": 28, "lr": 9.958804815697538e-05} +{"train_loss": 0.018368376418948174, "global_step": 3399, "epoch": 28, "lr": 9.958776429647883e-05} +{"train_loss": 0.012279266491532326, "global_step": 3400, "epoch": 28, "lr": 9.9587480338622e-05} +{"train_loss": 0.02413388341665268, "global_step": 3401, "epoch": 28, "lr": 9.958719628340544e-05} +{"train_loss": 0.02020227164030075, "global_step": 3402, "epoch": 28, "lr": 9.958691213082973e-05} +{"train_loss": 0.018678216263651848, "global_step": 3403, "epoch": 28, "lr": 9.958662788089541e-05} +{"train_loss": 0.019092585891485214, "global_step": 3404, "epoch": 28, "lr": 9.958634353360306e-05} +{"train_loss": 0.024064715951681137, "global_step": 3405, "epoch": 28, "lr": 9.95860590889532e-05} +{"train_loss": 0.014906421303749084, "global_step": 3406, "epoch": 28, "lr": 9.958577454694643e-05} +{"train_loss": 0.018002403900027275, "global_step": 3407, "epoch": 28, "lr": 9.958548990758327e-05} +{"train_loss": 0.01683766208589077, "global_step": 3408, "epoch": 28, "lr": 9.958520517086431e-05} +{"train_loss": 0.01513560488820076, "global_step": 3409, "epoch": 28, "lr": 9.95849203367901e-05} +{"train_loss": 0.022970078513026237, "global_step": 3410, "epoch": 28, "lr": 9.958463540536118e-05} +{"train_loss": 0.01978454925119877, "global_step": 3411, "epoch": 28, "lr": 9.958435037657813e-05} +{"train_loss": 0.01619165949523449, "global_step": 3412, "epoch": 28, "lr": 9.958406525044153e-05} +{"train_loss": 0.01956780254840851, "global_step": 3413, "epoch": 28, "lr": 9.95837800269519e-05} +{"train_loss": 0.01811929978430271, "global_step": 3414, "epoch": 28, "lr": 9.95834947061098e-05} +{"train_loss": 0.01662093959748745, "global_step": 3415, "epoch": 28, "lr": 9.958320928791583e-05} +{"train_loss": 0.024817628785967827, "global_step": 3416, "epoch": 28, "lr": 9.958292377237051e-05} +{"train_loss": 0.019527053460478783, "global_step": 3417, "epoch": 28, "lr": 9.958263815947441e-05} +{"train_loss": 0.023131821304559708, "global_step": 3418, "epoch": 28, "lr": 9.958235244922811e-05} +{"train_loss": 0.021558647975325584, "global_step": 3419, "epoch": 28, "lr": 9.958206664163215e-05} +{"train_loss": 0.016207385808229446, "global_step": 3420, "epoch": 28, "lr": 9.958178073668711e-05} +{"train_loss": 0.026840705424547195, "global_step": 3421, "epoch": 28, "lr": 9.958149473439353e-05} +{"train_loss": 0.01831609010696411, "global_step": 3422, "epoch": 28, "lr": 9.958120863475199e-05} +{"train_loss": 0.024400437250733376, "global_step": 3423, "epoch": 28, "lr": 9.958092243776305e-05} +{"train_loss": 0.0217804666608572, "global_step": 3424, "epoch": 28, "lr": 9.958063614342725e-05} +{"train_loss": 0.02702995017170906, "global_step": 3425, "epoch": 28, "lr": 9.958034975174518e-05} +{"train_loss": 0.021472472697496414, "global_step": 3426, "epoch": 28, "lr": 9.958006326271738e-05} +{"train_loss": 0.02306465432047844, "global_step": 3427, "epoch": 28, "lr": 9.957977667634443e-05} +{"train_loss": 0.02115483209490776, "global_step": 3428, "epoch": 28, "lr": 9.957948999262687e-05} +{"train_loss": 0.019818643108010292, "global_step": 3429, "epoch": 28, "lr": 9.95792032115653e-05} +{"train_loss": 0.01798650063574314, "global_step": 3430, "epoch": 28, "lr": 9.957891633316026e-05} +{"train_loss": 0.01984880492091179, "global_step": 3431, "epoch": 28, "lr": 9.95786293574123e-05} +{"train_loss": 0.02641572803258896, "global_step": 3432, "epoch": 28, "lr": 9.957834228432201e-05} +{"train_loss": 0.02360704354941845, "global_step": 3433, "epoch": 28, "lr": 9.957805511388992e-05} +{"train_loss": 0.02646816521883011, "global_step": 3434, "epoch": 28, "lr": 9.957776784611663e-05} +{"train_loss": 0.01815911754965782, "global_step": 3435, "epoch": 28, "lr": 9.95774804810027e-05} +{"train_loss": 0.02101496420800686, "global_step": 3436, "epoch": 28, "lr": 9.957719301854867e-05} +{"train_loss": 0.02232719026505947, "global_step": 3437, "epoch": 28, "lr": 9.957690545875512e-05} +{"train_loss": 0.02612585388123989, "global_step": 3438, "epoch": 28, "lr": 9.957661780162261e-05} +{"train_loss": 0.017036452889442444, "global_step": 3439, "epoch": 28, "lr": 9.957633004715173e-05} +{"train_loss": 0.020804513245821, "global_step": 3440, "epoch": 28, "lr": 9.9576042195343e-05} +{"train_loss": 0.024430353194475174, "global_step": 3441, "epoch": 28, "lr": 9.9575754246197e-05} +{"train_loss": 0.01800861395895481, "global_step": 3442, "epoch": 28, "lr": 9.957546619971431e-05} +{"train_loss": 0.01979670487344265, "global_step": 3443, "epoch": 28, "lr": 9.957517805589552e-05} +{"train_loss": 0.015975192189216614, "global_step": 3444, "epoch": 28, "lr": 9.957488981474113e-05} +{"train_loss": 0.018176564946770668, "global_step": 3445, "epoch": 28, "lr": 9.957460147625175e-05} +{"train_loss": 0.01872856169939041, "global_step": 3446, "epoch": 28, "lr": 9.957431304042792e-05} +{"train_loss": 0.03335253521800041, "global_step": 3447, "epoch": 28, "lr": 9.957402450727024e-05} +{"train_loss": 0.020169509574770927, "global_step": 3448, "epoch": 28, "lr": 9.957373587677926e-05} +{"train_loss": 0.016482604667544365, "global_step": 3449, "epoch": 28, "lr": 9.957344714895553e-05} +{"train_loss": 0.020368626294266275, "global_step": 3450, "epoch": 28, "lr": 9.957315832379966e-05, "val_loss": 0.020875632762908936} +{"train_loss": 0.013379625044763088, "global_step": 3451, "epoch": 29, "lr": 9.957286940131216e-05} +{"train_loss": 0.01940895989537239, "global_step": 3452, "epoch": 29, "lr": 9.957258038149365e-05} +{"train_loss": 0.01978488080203533, "global_step": 3453, "epoch": 29, "lr": 9.957229126434466e-05} +{"train_loss": 0.01830568164587021, "global_step": 3454, "epoch": 29, "lr": 9.957200204986579e-05} +{"train_loss": 0.024651234969496727, "global_step": 3455, "epoch": 29, "lr": 9.957171273805756e-05} +{"train_loss": 0.019958775490522385, "global_step": 3456, "epoch": 29, "lr": 9.95714233289206e-05} +{"train_loss": 0.022215303033590317, "global_step": 3457, "epoch": 29, "lr": 9.957113382245544e-05} +{"train_loss": 0.020008986815810204, "global_step": 3458, "epoch": 29, "lr": 9.957084421866263e-05} +{"train_loss": 0.013009251095354557, "global_step": 3459, "epoch": 29, "lr": 9.957055451754277e-05} +{"train_loss": 0.023641178384423256, "global_step": 3460, "epoch": 29, "lr": 9.957026471909645e-05} +{"train_loss": 0.013270161114633083, "global_step": 3461, "epoch": 29, "lr": 9.95699748233242e-05} +{"train_loss": 0.022221047431230545, "global_step": 3462, "epoch": 29, "lr": 9.956968483022658e-05} +{"train_loss": 0.022237207740545273, "global_step": 3463, "epoch": 29, "lr": 9.95693947398042e-05} +{"train_loss": 0.013288886286318302, "global_step": 3464, "epoch": 29, "lr": 9.95691045520576e-05} +{"train_loss": 0.022479215636849403, "global_step": 3465, "epoch": 29, "lr": 9.956881426698737e-05} +{"train_loss": 0.0167867299169302, "global_step": 3466, "epoch": 29, "lr": 9.956852388459405e-05} +{"train_loss": 0.017184868454933167, "global_step": 3467, "epoch": 29, "lr": 9.956823340487824e-05} +{"train_loss": 0.025817621499300003, "global_step": 3468, "epoch": 29, "lr": 9.95679428278405e-05} +{"train_loss": 0.018861234188079834, "global_step": 3469, "epoch": 29, "lr": 9.95676521534814e-05} +{"train_loss": 0.01985875330865383, "global_step": 3470, "epoch": 29, "lr": 9.95673613818015e-05} +{"train_loss": 0.01701347343623638, "global_step": 3471, "epoch": 29, "lr": 9.956707051280139e-05} +{"train_loss": 0.01865275949239731, "global_step": 3472, "epoch": 29, "lr": 9.956677954648164e-05} +{"train_loss": 0.021004242822527885, "global_step": 3473, "epoch": 29, "lr": 9.95664884828428e-05} +{"train_loss": 0.018766557797789574, "global_step": 3474, "epoch": 29, "lr": 9.956619732188546e-05} +{"train_loss": 0.012803955003619194, "global_step": 3475, "epoch": 29, "lr": 9.956590606361018e-05} +{"train_loss": 0.016042524948716164, "global_step": 3476, "epoch": 29, "lr": 9.956561470801755e-05} +{"train_loss": 0.02291041798889637, "global_step": 3477, "epoch": 29, "lr": 9.956532325510813e-05} +{"train_loss": 0.013645289465785027, "global_step": 3478, "epoch": 29, "lr": 9.95650317048825e-05} +{"train_loss": 0.024535058066248894, "global_step": 3479, "epoch": 29, "lr": 9.956474005734121e-05} +{"train_loss": 0.018153885379433632, "global_step": 3480, "epoch": 29, "lr": 9.956444831248486e-05} +{"train_loss": 0.01568031683564186, "global_step": 3481, "epoch": 29, "lr": 9.956415647031401e-05} +{"train_loss": 0.014106597751379013, "global_step": 3482, "epoch": 29, "lr": 9.956386453082922e-05} +{"train_loss": 0.015110688284039497, "global_step": 3483, "epoch": 29, "lr": 9.956357249403109e-05} +{"train_loss": 0.024379339069128036, "global_step": 3484, "epoch": 29, "lr": 9.956328035992017e-05} +{"train_loss": 0.018542852252721786, "global_step": 3485, "epoch": 29, "lr": 9.956298812849704e-05} +{"train_loss": 0.016746200621128082, "global_step": 3486, "epoch": 29, "lr": 9.95626957997623e-05} +{"train_loss": 0.018234752118587494, "global_step": 3487, "epoch": 29, "lr": 9.95624033737165e-05} +{"train_loss": 0.020064597949385643, "global_step": 3488, "epoch": 29, "lr": 9.95621108503602e-05} +{"train_loss": 0.024618498980998993, "global_step": 3489, "epoch": 29, "lr": 9.956181822969399e-05} +{"train_loss": 0.020316844806075096, "global_step": 3490, "epoch": 29, "lr": 9.956152551171846e-05} +{"train_loss": 0.013804455287754536, "global_step": 3491, "epoch": 29, "lr": 9.956123269643416e-05} +{"train_loss": 0.018399357795715332, "global_step": 3492, "epoch": 29, "lr": 9.956093978384166e-05} +{"train_loss": 0.015839796513319016, "global_step": 3493, "epoch": 29, "lr": 9.956064677394158e-05} +{"train_loss": 0.016999628394842148, "global_step": 3494, "epoch": 29, "lr": 9.956035366673444e-05} +{"train_loss": 0.014956668019294739, "global_step": 3495, "epoch": 29, "lr": 9.956006046222086e-05} +{"train_loss": 0.018388696014881134, "global_step": 3496, "epoch": 29, "lr": 9.955976716040138e-05} +{"train_loss": 0.015354218892753124, "global_step": 3497, "epoch": 29, "lr": 9.95594737612766e-05} +{"train_loss": 0.02149849571287632, "global_step": 3498, "epoch": 29, "lr": 9.955918026484709e-05} +{"train_loss": 0.016351982951164246, "global_step": 3499, "epoch": 29, "lr": 9.955888667111341e-05} +{"train_loss": 0.013725914061069489, "global_step": 3500, "epoch": 29, "lr": 9.955859298007617e-05} +{"train_loss": 0.018810003995895386, "global_step": 3501, "epoch": 29, "lr": 9.955829919173592e-05} +{"train_loss": 0.022288553416728973, "global_step": 3502, "epoch": 29, "lr": 9.955800530609324e-05} +{"train_loss": 0.018793409690260887, "global_step": 3503, "epoch": 29, "lr": 9.955771132314871e-05} +{"train_loss": 0.02813185751438141, "global_step": 3504, "epoch": 29, "lr": 9.95574172429029e-05} +{"train_loss": 0.015698038041591644, "global_step": 3505, "epoch": 29, "lr": 9.955712306535643e-05} +{"train_loss": 0.015332326292991638, "global_step": 3506, "epoch": 29, "lr": 9.955682879050981e-05} +{"train_loss": 0.011647392064332962, "global_step": 3507, "epoch": 29, "lr": 9.955653441836365e-05} +{"train_loss": 0.02130969986319542, "global_step": 3508, "epoch": 29, "lr": 9.955623994891856e-05} +{"train_loss": 0.017854314297437668, "global_step": 3509, "epoch": 29, "lr": 9.955594538217506e-05} +{"train_loss": 0.010152190923690796, "global_step": 3510, "epoch": 29, "lr": 9.955565071813376e-05} +{"train_loss": 0.01848536729812622, "global_step": 3511, "epoch": 29, "lr": 9.955535595679524e-05} +{"train_loss": 0.013532736338675022, "global_step": 3512, "epoch": 29, "lr": 9.955506109816006e-05} +{"train_loss": 0.02073647826910019, "global_step": 3513, "epoch": 29, "lr": 9.955476614222883e-05} +{"train_loss": 0.015237231738865376, "global_step": 3514, "epoch": 29, "lr": 9.95544710890021e-05} +{"train_loss": 0.02111557312309742, "global_step": 3515, "epoch": 29, "lr": 9.955417593848046e-05} +{"train_loss": 0.01630476303398609, "global_step": 3516, "epoch": 29, "lr": 9.955388069066449e-05} +{"train_loss": 0.01790587231516838, "global_step": 3517, "epoch": 29, "lr": 9.955358534555478e-05} +{"train_loss": 0.02057858556509018, "global_step": 3518, "epoch": 29, "lr": 9.955328990315189e-05} +{"train_loss": 0.01895212009549141, "global_step": 3519, "epoch": 29, "lr": 9.955299436345641e-05} +{"train_loss": 0.016731789335608482, "global_step": 3520, "epoch": 29, "lr": 9.955269872646892e-05} +{"train_loss": 0.021671820431947708, "global_step": 3521, "epoch": 29, "lr": 9.955240299218999e-05} +{"train_loss": 0.014967928640544415, "global_step": 3522, "epoch": 29, "lr": 9.955210716062022e-05} +{"train_loss": 0.02345420978963375, "global_step": 3523, "epoch": 29, "lr": 9.955181123176019e-05} +{"train_loss": 0.020066171884536743, "global_step": 3524, "epoch": 29, "lr": 9.955151520561046e-05} +{"train_loss": 0.022815575823187828, "global_step": 3525, "epoch": 29, "lr": 9.955121908217163e-05} +{"train_loss": 0.018008824437856674, "global_step": 3526, "epoch": 29, "lr": 9.955092286144427e-05} +{"train_loss": 0.01885460689663887, "global_step": 3527, "epoch": 29, "lr": 9.955062654342898e-05} +{"train_loss": 0.01852472685277462, "global_step": 3528, "epoch": 29, "lr": 9.955033012812631e-05} +{"train_loss": 0.017640236765146255, "global_step": 3529, "epoch": 29, "lr": 9.955003361553688e-05} +{"train_loss": 0.01871330849826336, "global_step": 3530, "epoch": 29, "lr": 9.954973700566123e-05} +{"train_loss": 0.01833929866552353, "global_step": 3531, "epoch": 29, "lr": 9.954944029849998e-05} +{"train_loss": 0.020993847399950027, "global_step": 3532, "epoch": 29, "lr": 9.954914349405368e-05} +{"train_loss": 0.017114028334617615, "global_step": 3533, "epoch": 29, "lr": 9.954884659232295e-05} +{"train_loss": 0.02207777462899685, "global_step": 3534, "epoch": 29, "lr": 9.954854959330835e-05} +{"train_loss": 0.020015083253383636, "global_step": 3535, "epoch": 29, "lr": 9.954825249701047e-05} +{"train_loss": 0.018358733505010605, "global_step": 3536, "epoch": 29, "lr": 9.954795530342988e-05} +{"train_loss": 0.021777115762233734, "global_step": 3537, "epoch": 29, "lr": 9.954765801256718e-05} +{"train_loss": 0.020938511937856674, "global_step": 3538, "epoch": 29, "lr": 9.954736062442293e-05} +{"train_loss": 0.015558053739368916, "global_step": 3539, "epoch": 29, "lr": 9.954706313899775e-05} +{"train_loss": 0.016272053122520447, "global_step": 3540, "epoch": 29, "lr": 9.954676555629221e-05} +{"train_loss": 0.019471991807222366, "global_step": 3541, "epoch": 29, "lr": 9.954646787630687e-05} +{"train_loss": 0.015260793268680573, "global_step": 3542, "epoch": 29, "lr": 9.954617009904234e-05} +{"train_loss": 0.02300703153014183, "global_step": 3543, "epoch": 29, "lr": 9.95458722244992e-05} +{"train_loss": 0.019803274422883987, "global_step": 3544, "epoch": 29, "lr": 9.954557425267803e-05} +{"train_loss": 0.021570684388279915, "global_step": 3545, "epoch": 29, "lr": 9.954527618357943e-05} +{"train_loss": 0.016144076362252235, "global_step": 3546, "epoch": 29, "lr": 9.954497801720396e-05} +{"train_loss": 0.017529696226119995, "global_step": 3547, "epoch": 29, "lr": 9.954467975355221e-05} +{"train_loss": 0.01706547848880291, "global_step": 3548, "epoch": 29, "lr": 9.95443813926248e-05} +{"train_loss": 0.022316303104162216, "global_step": 3549, "epoch": 29, "lr": 9.954408293442228e-05} +{"train_loss": 0.018276110291481018, "global_step": 3550, "epoch": 29, "lr": 9.954378437894525e-05} +{"train_loss": 0.018033910542726517, "global_step": 3551, "epoch": 29, "lr": 9.954348572619427e-05} +{"train_loss": 0.013673048466444016, "global_step": 3552, "epoch": 29, "lr": 9.954318697616997e-05} +{"train_loss": 0.018108299002051353, "global_step": 3553, "epoch": 29, "lr": 9.954288812887291e-05} +{"train_loss": 0.023011155426502228, "global_step": 3554, "epoch": 29, "lr": 9.954258918430368e-05} +{"train_loss": 0.01694454438984394, "global_step": 3555, "epoch": 29, "lr": 9.954229014246287e-05} +{"train_loss": 0.013960481621325016, "global_step": 3556, "epoch": 29, "lr": 9.954199100335108e-05} +{"train_loss": 0.02028482034802437, "global_step": 3557, "epoch": 29, "lr": 9.954169176696886e-05} +{"train_loss": 0.022347213700413704, "global_step": 3558, "epoch": 29, "lr": 9.954139243331684e-05} +{"train_loss": 0.021120255813002586, "global_step": 3559, "epoch": 29, "lr": 9.954109300239558e-05} +{"train_loss": 0.016721857711672783, "global_step": 3560, "epoch": 29, "lr": 9.954079347420568e-05} +{"train_loss": 0.021748604252934456, "global_step": 3561, "epoch": 29, "lr": 9.954049384874772e-05} +{"train_loss": 0.017298324033617973, "global_step": 3562, "epoch": 29, "lr": 9.954019412602229e-05} +{"train_loss": 0.019699333235621452, "global_step": 3563, "epoch": 29, "lr": 9.953989430602998e-05} +{"train_loss": 0.017885861918330193, "global_step": 3564, "epoch": 29, "lr": 9.953959438877138e-05} +{"train_loss": 0.017038648948073387, "global_step": 3565, "epoch": 29, "lr": 9.953929437424709e-05} +{"train_loss": 0.014007569290697575, "global_step": 3566, "epoch": 29, "lr": 9.953899426245769e-05} +{"train_loss": 0.013659171760082245, "global_step": 3567, "epoch": 29, "lr": 9.953869405340376e-05} +{"train_loss": 0.018703509122133255, "global_step": 3568, "epoch": 29, "lr": 9.953839374708589e-05} +{"train_loss": 0.018510405709888756, "global_step": 3569, "epoch": 29, "lr": 9.953809334350469e-05, "val_loss": 0.026270262897014618} +{"train_loss": 0.020689288154244423, "global_step": 3570, "epoch": 30, "lr": 9.953779284266074e-05} +{"train_loss": 0.01637282967567444, "global_step": 3571, "epoch": 30, "lr": 9.95374922445546e-05} +{"train_loss": 0.018296336755156517, "global_step": 3572, "epoch": 30, "lr": 9.95371915491869e-05} +{"train_loss": 0.015841159969568253, "global_step": 3573, "epoch": 30, "lr": 9.953689075655823e-05} +{"train_loss": 0.01831100694835186, "global_step": 3574, "epoch": 30, "lr": 9.953658986666914e-05} +{"train_loss": 0.020257899537682533, "global_step": 3575, "epoch": 30, "lr": 9.953628887952027e-05} +{"train_loss": 0.015146971680223942, "global_step": 3576, "epoch": 30, "lr": 9.95359877951122e-05} +{"train_loss": 0.018801361322402954, "global_step": 3577, "epoch": 30, "lr": 9.953568661344548e-05} +{"train_loss": 0.015440816059708595, "global_step": 3578, "epoch": 30, "lr": 9.953538533452074e-05} +{"train_loss": 0.014614206738770008, "global_step": 3579, "epoch": 30, "lr": 9.953508395833857e-05} +{"train_loss": 0.020646721124649048, "global_step": 3580, "epoch": 30, "lr": 9.953478248489956e-05} +{"train_loss": 0.019123593345284462, "global_step": 3581, "epoch": 30, "lr": 9.953448091420428e-05} +{"train_loss": 0.01864532195031643, "global_step": 3582, "epoch": 30, "lr": 9.953417924625335e-05} +{"train_loss": 0.015517516061663628, "global_step": 3583, "epoch": 30, "lr": 9.953387748104735e-05} +{"train_loss": 0.016560107469558716, "global_step": 3584, "epoch": 30, "lr": 9.953357561858688e-05} +{"train_loss": 0.0204286091029644, "global_step": 3585, "epoch": 30, "lr": 9.953327365887251e-05} +{"train_loss": 0.028169330209493637, "global_step": 3586, "epoch": 30, "lr": 9.953297160190484e-05} +{"train_loss": 0.022109810262918472, "global_step": 3587, "epoch": 30, "lr": 9.95326694476845e-05} +{"train_loss": 0.015302769839763641, "global_step": 3588, "epoch": 30, "lr": 9.953236719621204e-05} +{"train_loss": 0.02216639369726181, "global_step": 3589, "epoch": 30, "lr": 9.953206484748807e-05} +{"train_loss": 0.02572777308523655, "global_step": 3590, "epoch": 30, "lr": 9.95317624015132e-05} +{"train_loss": 0.014527389779686928, "global_step": 3591, "epoch": 30, "lr": 9.953145985828798e-05} +{"train_loss": 0.022372404113411903, "global_step": 3592, "epoch": 30, "lr": 9.953115721781305e-05} +{"train_loss": 0.01574036106467247, "global_step": 3593, "epoch": 30, "lr": 9.953085448008897e-05} +{"train_loss": 0.019799986854195595, "global_step": 3594, "epoch": 30, "lr": 9.953055164511635e-05} +{"train_loss": 0.015436733141541481, "global_step": 3595, "epoch": 30, "lr": 9.95302487128958e-05} +{"train_loss": 0.022130388766527176, "global_step": 3596, "epoch": 30, "lr": 9.952994568342788e-05} +{"train_loss": 0.020201873034238815, "global_step": 3597, "epoch": 30, "lr": 9.952964255671322e-05} +{"train_loss": 0.020381171256303787, "global_step": 3598, "epoch": 30, "lr": 9.952933933275238e-05} +{"train_loss": 0.019777366891503334, "global_step": 3599, "epoch": 30, "lr": 9.952903601154597e-05} +{"train_loss": 0.023452695459127426, "global_step": 3600, "epoch": 30, "lr": 9.952873259309461e-05} +{"train_loss": 0.023354357108473778, "global_step": 3601, "epoch": 30, "lr": 9.952842907739887e-05} +{"train_loss": 0.026659643277525902, "global_step": 3602, "epoch": 30, "lr": 9.952812546445934e-05} +{"train_loss": 0.012267340905964375, "global_step": 3603, "epoch": 30, "lr": 9.952782175427664e-05} +{"train_loss": 0.026468941941857338, "global_step": 3604, "epoch": 30, "lr": 9.952751794685134e-05} +{"train_loss": 0.015565501525998116, "global_step": 3605, "epoch": 30, "lr": 9.952721404218405e-05} +{"train_loss": 0.02412787266075611, "global_step": 3606, "epoch": 30, "lr": 9.952691004027539e-05} +{"train_loss": 0.01930660381913185, "global_step": 3607, "epoch": 30, "lr": 9.952660594112591e-05} +{"train_loss": 0.019035257399082184, "global_step": 3608, "epoch": 30, "lr": 9.952630174473623e-05} +{"train_loss": 0.02518909052014351, "global_step": 3609, "epoch": 30, "lr": 9.952599745110696e-05} +{"train_loss": 0.020675132051110268, "global_step": 3610, "epoch": 30, "lr": 9.952569306023868e-05} +{"train_loss": 0.02544633485376835, "global_step": 3611, "epoch": 30, "lr": 9.9525388572132e-05} +{"train_loss": 0.018900832161307335, "global_step": 3612, "epoch": 30, "lr": 9.952508398678749e-05} +{"train_loss": 0.017480572685599327, "global_step": 3613, "epoch": 30, "lr": 9.952477930420578e-05} +{"train_loss": 0.020978353917598724, "global_step": 3614, "epoch": 30, "lr": 9.952447452438747e-05} +{"train_loss": 0.013783241622149944, "global_step": 3615, "epoch": 30, "lr": 9.952416964733313e-05} +{"train_loss": 0.018573909997940063, "global_step": 3616, "epoch": 30, "lr": 9.952386467304337e-05} +{"train_loss": 0.02060428261756897, "global_step": 3617, "epoch": 30, "lr": 9.95235596015188e-05} +{"train_loss": 0.01621544174849987, "global_step": 3618, "epoch": 30, "lr": 9.952325443276002e-05} +{"train_loss": 0.012104512192308903, "global_step": 3619, "epoch": 30, "lr": 9.95229491667676e-05} +{"train_loss": 0.024935532361268997, "global_step": 3620, "epoch": 30, "lr": 9.952264380354218e-05} +{"train_loss": 0.023424912244081497, "global_step": 3621, "epoch": 30, "lr": 9.952233834308433e-05} +{"train_loss": 0.021068373695015907, "global_step": 3622, "epoch": 30, "lr": 9.952203278539465e-05} +{"train_loss": 0.015529075637459755, "global_step": 3623, "epoch": 30, "lr": 9.952172713047376e-05} +{"train_loss": 0.016560740768909454, "global_step": 3624, "epoch": 30, "lr": 9.952142137832226e-05} +{"train_loss": 0.02076565846800804, "global_step": 3625, "epoch": 30, "lr": 9.952111552894073e-05} +{"train_loss": 0.01446531806141138, "global_step": 3626, "epoch": 30, "lr": 9.952080958232977e-05} +{"train_loss": 0.02410239912569523, "global_step": 3627, "epoch": 30, "lr": 9.952050353849001e-05} +{"train_loss": 0.01920844055712223, "global_step": 3628, "epoch": 30, "lr": 9.952019739742203e-05} +{"train_loss": 0.019102659076452255, "global_step": 3629, "epoch": 30, "lr": 9.951989115912641e-05} +{"train_loss": 0.018729006871581078, "global_step": 3630, "epoch": 30, "lr": 9.951958482360379e-05} +{"train_loss": 0.022692779079079628, "global_step": 3631, "epoch": 30, "lr": 9.951927839085476e-05} +{"train_loss": 0.01427579764276743, "global_step": 3632, "epoch": 30, "lr": 9.95189718608799e-05} +{"train_loss": 0.013686315156519413, "global_step": 3633, "epoch": 30, "lr": 9.951866523367985e-05} +{"train_loss": 0.026837291195988655, "global_step": 3634, "epoch": 30, "lr": 9.951835850925518e-05} +{"train_loss": 0.01550541166216135, "global_step": 3635, "epoch": 30, "lr": 9.951805168760651e-05} +{"train_loss": 0.021205784752964973, "global_step": 3636, "epoch": 30, "lr": 9.951774476873444e-05} +{"train_loss": 0.019732965156435966, "global_step": 3637, "epoch": 30, "lr": 9.951743775263955e-05} +{"train_loss": 0.013470346108078957, "global_step": 3638, "epoch": 30, "lr": 9.951713063932247e-05} +{"train_loss": 0.015021026134490967, "global_step": 3639, "epoch": 30, "lr": 9.951682342878379e-05} +{"train_loss": 0.01407351903617382, "global_step": 3640, "epoch": 30, "lr": 9.951651612102413e-05} +{"train_loss": 0.01712287776172161, "global_step": 3641, "epoch": 30, "lr": 9.951620871604407e-05} +{"train_loss": 0.013536319136619568, "global_step": 3642, "epoch": 30, "lr": 9.951590121384422e-05} +{"train_loss": 0.024142760783433914, "global_step": 3643, "epoch": 30, "lr": 9.951559361442519e-05} +{"train_loss": 0.01999747008085251, "global_step": 3644, "epoch": 30, "lr": 9.95152859177876e-05} +{"train_loss": 0.014075801707804203, "global_step": 3645, "epoch": 30, "lr": 9.951497812393202e-05} +{"train_loss": 0.012795078568160534, "global_step": 3646, "epoch": 30, "lr": 9.951467023285908e-05} +{"train_loss": 0.01877540349960327, "global_step": 3647, "epoch": 30, "lr": 9.951436224456937e-05} +{"train_loss": 0.03199146315455437, "global_step": 3648, "epoch": 30, "lr": 9.951405415906349e-05} +{"train_loss": 0.019212093204259872, "global_step": 3649, "epoch": 30, "lr": 9.951374597634207e-05} +{"train_loss": 0.01615450344979763, "global_step": 3650, "epoch": 30, "lr": 9.951343769640568e-05} +{"train_loss": 0.016166161745786667, "global_step": 3651, "epoch": 30, "lr": 9.951312931925496e-05} +{"train_loss": 0.016369853168725967, "global_step": 3652, "epoch": 30, "lr": 9.951282084489049e-05} +{"train_loss": 0.018509186804294586, "global_step": 3653, "epoch": 30, "lr": 9.95125122733129e-05} +{"train_loss": 0.02328535169363022, "global_step": 3654, "epoch": 30, "lr": 9.951220360452277e-05} +{"train_loss": 0.021999962627887726, "global_step": 3655, "epoch": 30, "lr": 9.951189483852072e-05} +{"train_loss": 0.018388284370303154, "global_step": 3656, "epoch": 30, "lr": 9.951158597530737e-05} +{"train_loss": 0.024925919249653816, "global_step": 3657, "epoch": 30, "lr": 9.951127701488328e-05} +{"train_loss": 0.023287547752261162, "global_step": 3658, "epoch": 30, "lr": 9.95109679572491e-05} +{"train_loss": 0.021295614540576935, "global_step": 3659, "epoch": 30, "lr": 9.951065880240544e-05} +{"train_loss": 0.016656886786222458, "global_step": 3660, "epoch": 30, "lr": 9.951034955035288e-05} +{"train_loss": 0.01859826222062111, "global_step": 3661, "epoch": 30, "lr": 9.951004020109202e-05} +{"train_loss": 0.021896060556173325, "global_step": 3662, "epoch": 30, "lr": 9.95097307546235e-05} +{"train_loss": 0.018605804070830345, "global_step": 3663, "epoch": 30, "lr": 9.950942121094793e-05} +{"train_loss": 0.022147737443447113, "global_step": 3664, "epoch": 30, "lr": 9.950911157006589e-05} +{"train_loss": 0.01703503727912903, "global_step": 3665, "epoch": 30, "lr": 9.9508801831978e-05} +{"train_loss": 0.018862439319491386, "global_step": 3666, "epoch": 30, "lr": 9.950849199668484e-05} +{"train_loss": 0.02084147185087204, "global_step": 3667, "epoch": 30, "lr": 9.950818206418709e-05} +{"train_loss": 0.019537009298801422, "global_step": 3668, "epoch": 30, "lr": 9.950787203448528e-05} +{"train_loss": 0.02003752626478672, "global_step": 3669, "epoch": 30, "lr": 9.950756190758006e-05} +{"train_loss": 0.019317934289574623, "global_step": 3670, "epoch": 30, "lr": 9.950725168347203e-05} +{"train_loss": 0.016753017902374268, "global_step": 3671, "epoch": 30, "lr": 9.950694136216181e-05} +{"train_loss": 0.020266233012080193, "global_step": 3672, "epoch": 30, "lr": 9.950663094364999e-05} +{"train_loss": 0.01939852349460125, "global_step": 3673, "epoch": 30, "lr": 9.95063204279372e-05} +{"train_loss": 0.019882207736372948, "global_step": 3674, "epoch": 30, "lr": 9.950600981502403e-05} +{"train_loss": 0.024705985561013222, "global_step": 3675, "epoch": 30, "lr": 9.95056991049111e-05} +{"train_loss": 0.020530948415398598, "global_step": 3676, "epoch": 30, "lr": 9.950538829759901e-05} +{"train_loss": 0.021981341764330864, "global_step": 3677, "epoch": 30, "lr": 9.950507739308839e-05} +{"train_loss": 0.01159229688346386, "global_step": 3678, "epoch": 30, "lr": 9.950476639137984e-05} +{"train_loss": 0.0205836221575737, "global_step": 3679, "epoch": 30, "lr": 9.950445529247396e-05} +{"train_loss": 0.018055256456136703, "global_step": 3680, "epoch": 30, "lr": 9.950414409637139e-05} +{"train_loss": 0.027054497972130775, "global_step": 3681, "epoch": 30, "lr": 9.95038328030727e-05} +{"train_loss": 0.021855438128113747, "global_step": 3682, "epoch": 30, "lr": 9.950352141257853e-05} +{"train_loss": 0.019273271784186363, "global_step": 3683, "epoch": 30, "lr": 9.95032099248895e-05} +{"train_loss": 0.018559295684099197, "global_step": 3684, "epoch": 30, "lr": 9.95028983400062e-05} +{"train_loss": 0.02496108040213585, "global_step": 3685, "epoch": 30, "lr": 9.950258665792924e-05} +{"train_loss": 0.020021554082632065, "global_step": 3686, "epoch": 30, "lr": 9.950227487865925e-05} +{"train_loss": 0.02095925249159336, "global_step": 3687, "epoch": 30, "lr": 9.95019630021968e-05} +{"train_loss": 0.019481089506141778, "global_step": 3688, "epoch": 30, "lr": 9.950165102854257e-05, "val_loss": 0.024979159235954285, "train_action_mse_error": 0.001322242897003889} +{"train_loss": 0.021018262952566147, "global_step": 3689, "epoch": 31, "lr": 9.950133895769711e-05} +{"train_loss": 0.01671604812145233, "global_step": 3690, "epoch": 31, "lr": 9.950102678966107e-05} +{"train_loss": 0.021482443436980247, "global_step": 3691, "epoch": 31, "lr": 9.950071452443505e-05} +{"train_loss": 0.02187170460820198, "global_step": 3692, "epoch": 31, "lr": 9.950040216201968e-05} +{"train_loss": 0.013982455246150494, "global_step": 3693, "epoch": 31, "lr": 9.950008970241556e-05} +{"train_loss": 0.015765607357025146, "global_step": 3694, "epoch": 31, "lr": 9.949977714562329e-05} +{"train_loss": 0.019826237112283707, "global_step": 3695, "epoch": 31, "lr": 9.949946449164349e-05} +{"train_loss": 0.019414179027080536, "global_step": 3696, "epoch": 31, "lr": 9.94991517404768e-05} +{"train_loss": 0.022030958905816078, "global_step": 3697, "epoch": 31, "lr": 9.949883889212379e-05} +{"train_loss": 0.015258803963661194, "global_step": 3698, "epoch": 31, "lr": 9.949852594658511e-05} +{"train_loss": 0.029282070696353912, "global_step": 3699, "epoch": 31, "lr": 9.949821290386137e-05} +{"train_loss": 0.019002119079232216, "global_step": 3700, "epoch": 31, "lr": 9.949789976395316e-05} +{"train_loss": 0.01530393399298191, "global_step": 3701, "epoch": 31, "lr": 9.949758652686112e-05} +{"train_loss": 0.02262176387012005, "global_step": 3702, "epoch": 31, "lr": 9.949727319258586e-05} +{"train_loss": 0.02077118121087551, "global_step": 3703, "epoch": 31, "lr": 9.949695976112798e-05} +{"train_loss": 0.025487955659627914, "global_step": 3704, "epoch": 31, "lr": 9.949664623248812e-05} +{"train_loss": 0.015425045043230057, "global_step": 3705, "epoch": 31, "lr": 9.949633260666688e-05} +{"train_loss": 0.01640942133963108, "global_step": 3706, "epoch": 31, "lr": 9.949601888366489e-05} +{"train_loss": 0.024034438654780388, "global_step": 3707, "epoch": 31, "lr": 9.949570506348273e-05} +{"train_loss": 0.021123923361301422, "global_step": 3708, "epoch": 31, "lr": 9.949539114612105e-05} +{"train_loss": 0.023401372134685516, "global_step": 3709, "epoch": 31, "lr": 9.949507713158047e-05} +{"train_loss": 0.018295753747224808, "global_step": 3710, "epoch": 31, "lr": 9.949476301986157e-05} +{"train_loss": 0.02001882903277874, "global_step": 3711, "epoch": 31, "lr": 9.949444881096502e-05} +{"train_loss": 0.017643442377448082, "global_step": 3712, "epoch": 31, "lr": 9.94941345048914e-05} +{"train_loss": 0.0141880689188838, "global_step": 3713, "epoch": 31, "lr": 9.949382010164132e-05} +{"train_loss": 0.01425999402999878, "global_step": 3714, "epoch": 31, "lr": 9.949350560121543e-05} +{"train_loss": 0.024195995181798935, "global_step": 3715, "epoch": 31, "lr": 9.949319100361431e-05} +{"train_loss": 0.016884226351976395, "global_step": 3716, "epoch": 31, "lr": 9.94928763088386e-05} +{"train_loss": 0.01968427747488022, "global_step": 3717, "epoch": 31, "lr": 9.949256151688892e-05} +{"train_loss": 0.019610945135354996, "global_step": 3718, "epoch": 31, "lr": 9.94922466277659e-05} +{"train_loss": 0.020225971937179565, "global_step": 3719, "epoch": 31, "lr": 9.949193164147012e-05} +{"train_loss": 0.025631902739405632, "global_step": 3720, "epoch": 31, "lr": 9.949161655800222e-05} +{"train_loss": 0.021910984069108963, "global_step": 3721, "epoch": 31, "lr": 9.949130137736282e-05} +{"train_loss": 0.021996401250362396, "global_step": 3722, "epoch": 31, "lr": 9.949098609955254e-05} +{"train_loss": 0.01638946495950222, "global_step": 3723, "epoch": 31, "lr": 9.9490670724572e-05} +{"train_loss": 0.024779759347438812, "global_step": 3724, "epoch": 31, "lr": 9.949035525242181e-05} +{"train_loss": 0.014722649939358234, "global_step": 3725, "epoch": 31, "lr": 9.94900396831026e-05} +{"train_loss": 0.020750410854816437, "global_step": 3726, "epoch": 31, "lr": 9.948972401661498e-05} +{"train_loss": 0.020516538992524147, "global_step": 3727, "epoch": 31, "lr": 9.948940825295958e-05} +{"train_loss": 0.016583377495408058, "global_step": 3728, "epoch": 31, "lr": 9.9489092392137e-05} +{"train_loss": 0.016210108995437622, "global_step": 3729, "epoch": 31, "lr": 9.948877643414789e-05} +{"train_loss": 0.019095251336693764, "global_step": 3730, "epoch": 31, "lr": 9.948846037899284e-05} +{"train_loss": 0.02376619167625904, "global_step": 3731, "epoch": 31, "lr": 9.94881442266725e-05} +{"train_loss": 0.018054768443107605, "global_step": 3732, "epoch": 31, "lr": 9.948782797718748e-05} +{"train_loss": 0.017612559720873833, "global_step": 3733, "epoch": 31, "lr": 9.948751163053838e-05} +{"train_loss": 0.01957833021879196, "global_step": 3734, "epoch": 31, "lr": 9.948719518672584e-05} +{"train_loss": 0.01688305288553238, "global_step": 3735, "epoch": 31, "lr": 9.948687864575048e-05} +{"train_loss": 0.01735253445804119, "global_step": 3736, "epoch": 31, "lr": 9.948656200761292e-05} +{"train_loss": 0.016520865261554718, "global_step": 3737, "epoch": 31, "lr": 9.948624527231379e-05} +{"train_loss": 0.018198484554886818, "global_step": 3738, "epoch": 31, "lr": 9.94859284398537e-05} +{"train_loss": 0.01849604956805706, "global_step": 3739, "epoch": 31, "lr": 9.948561151023328e-05} +{"train_loss": 0.017349068075418472, "global_step": 3740, "epoch": 31, "lr": 9.948529448345314e-05} +{"train_loss": 0.013954395428299904, "global_step": 3741, "epoch": 31, "lr": 9.948497735951392e-05} +{"train_loss": 0.02505997009575367, "global_step": 3742, "epoch": 31, "lr": 9.948466013841622e-05} +{"train_loss": 0.02226453274488449, "global_step": 3743, "epoch": 31, "lr": 9.94843428201607e-05} +{"train_loss": 0.02814057655632496, "global_step": 3744, "epoch": 31, "lr": 9.948402540474792e-05} +{"train_loss": 0.016254400834441185, "global_step": 3745, "epoch": 31, "lr": 9.948370789217857e-05} +{"train_loss": 0.021910229697823524, "global_step": 3746, "epoch": 31, "lr": 9.948339028245326e-05} +{"train_loss": 0.017533451318740845, "global_step": 3747, "epoch": 31, "lr": 9.94830725755726e-05} +{"train_loss": 0.018048947677016258, "global_step": 3748, "epoch": 31, "lr": 9.948275477153717e-05} +{"train_loss": 0.015936443582177162, "global_step": 3749, "epoch": 31, "lr": 9.948243687034767e-05} +{"train_loss": 0.01931856945157051, "global_step": 3750, "epoch": 31, "lr": 9.94821188720047e-05} +{"train_loss": 0.01668686792254448, "global_step": 3751, "epoch": 31, "lr": 9.948180077650886e-05} +{"train_loss": 0.016170697286725044, "global_step": 3752, "epoch": 31, "lr": 9.948148258386079e-05} +{"train_loss": 0.021328110247850418, "global_step": 3753, "epoch": 31, "lr": 9.948116429406111e-05} +{"train_loss": 0.01897810772061348, "global_step": 3754, "epoch": 31, "lr": 9.948084590711046e-05} +{"train_loss": 0.01926935650408268, "global_step": 3755, "epoch": 31, "lr": 9.948052742300946e-05} +{"train_loss": 0.014694413170218468, "global_step": 3756, "epoch": 31, "lr": 9.948020884175872e-05} +{"train_loss": 0.019200963899493217, "global_step": 3757, "epoch": 31, "lr": 9.947989016335888e-05} +{"train_loss": 0.017975222319364548, "global_step": 3758, "epoch": 31, "lr": 9.947957138781056e-05} +{"train_loss": 0.019411766901612282, "global_step": 3759, "epoch": 31, "lr": 9.947925251511438e-05} +{"train_loss": 0.01746266707777977, "global_step": 3760, "epoch": 31, "lr": 9.9478933545271e-05} +{"train_loss": 0.013388123363256454, "global_step": 3761, "epoch": 31, "lr": 9.9478614478281e-05} +{"train_loss": 0.02161770686507225, "global_step": 3762, "epoch": 31, "lr": 9.947829531414503e-05} +{"train_loss": 0.014312309212982655, "global_step": 3763, "epoch": 31, "lr": 9.94779760528637e-05} +{"train_loss": 0.020916961133480072, "global_step": 3764, "epoch": 31, "lr": 9.947765669443768e-05} +{"train_loss": 0.018641192466020584, "global_step": 3765, "epoch": 31, "lr": 9.947733723886754e-05} +{"train_loss": 0.020732736214995384, "global_step": 3766, "epoch": 31, "lr": 9.947701768615396e-05} +{"train_loss": 0.0163408350199461, "global_step": 3767, "epoch": 31, "lr": 9.947669803629751e-05} +{"train_loss": 0.016541950404644012, "global_step": 3768, "epoch": 31, "lr": 9.947637828929887e-05} +{"train_loss": 0.015456397086381912, "global_step": 3769, "epoch": 31, "lr": 9.947605844515863e-05} +{"train_loss": 0.016352809965610504, "global_step": 3770, "epoch": 31, "lr": 9.947573850387745e-05} +{"train_loss": 0.02141757123172283, "global_step": 3771, "epoch": 31, "lr": 9.947541846545595e-05} +{"train_loss": 0.020974190905690193, "global_step": 3772, "epoch": 31, "lr": 9.947509832989474e-05} +{"train_loss": 0.02346142940223217, "global_step": 3773, "epoch": 31, "lr": 9.947477809719447e-05} +{"train_loss": 0.020588591694831848, "global_step": 3774, "epoch": 31, "lr": 9.947445776735575e-05} +{"train_loss": 0.0169462189078331, "global_step": 3775, "epoch": 31, "lr": 9.947413734037921e-05} +{"train_loss": 0.02067607268691063, "global_step": 3776, "epoch": 31, "lr": 9.94738168162655e-05} +{"train_loss": 0.014487411826848984, "global_step": 3777, "epoch": 31, "lr": 9.947349619501523e-05} +{"train_loss": 0.017731355503201485, "global_step": 3778, "epoch": 31, "lr": 9.947317547662904e-05} +{"train_loss": 0.019424237310886383, "global_step": 3779, "epoch": 31, "lr": 9.947285466110755e-05} +{"train_loss": 0.019581150263547897, "global_step": 3780, "epoch": 31, "lr": 9.94725337484514e-05} +{"train_loss": 0.01844559982419014, "global_step": 3781, "epoch": 31, "lr": 9.947221273866121e-05} +{"train_loss": 0.01590670645236969, "global_step": 3782, "epoch": 31, "lr": 9.947189163173762e-05} +{"train_loss": 0.0195974949747324, "global_step": 3783, "epoch": 31, "lr": 9.947157042768124e-05} +{"train_loss": 0.017949961125850677, "global_step": 3784, "epoch": 31, "lr": 9.947124912649275e-05} +{"train_loss": 0.016659487038850784, "global_step": 3785, "epoch": 31, "lr": 9.947092772817272e-05} +{"train_loss": 0.01778910681605339, "global_step": 3786, "epoch": 31, "lr": 9.947060623272181e-05} +{"train_loss": 0.023445092141628265, "global_step": 3787, "epoch": 31, "lr": 9.947028464014068e-05} +{"train_loss": 0.018499916419386864, "global_step": 3788, "epoch": 31, "lr": 9.946996295042989e-05} +{"train_loss": 0.016306210309267044, "global_step": 3789, "epoch": 31, "lr": 9.946964116359015e-05} +{"train_loss": 0.02170167677104473, "global_step": 3790, "epoch": 31, "lr": 9.946931927962203e-05} +{"train_loss": 0.012950214557349682, "global_step": 3791, "epoch": 31, "lr": 9.94689972985262e-05} +{"train_loss": 0.017220674082636833, "global_step": 3792, "epoch": 31, "lr": 9.946867522030326e-05} +{"train_loss": 0.02466491423547268, "global_step": 3793, "epoch": 31, "lr": 9.946835304495387e-05} +{"train_loss": 0.015863779932260513, "global_step": 3794, "epoch": 31, "lr": 9.946803077247866e-05} +{"train_loss": 0.020983370020985603, "global_step": 3795, "epoch": 31, "lr": 9.946770840287826e-05} +{"train_loss": 0.01990595832467079, "global_step": 3796, "epoch": 31, "lr": 9.946738593615329e-05} +{"train_loss": 0.01694592647254467, "global_step": 3797, "epoch": 31, "lr": 9.946706337230441e-05} +{"train_loss": 0.018174929544329643, "global_step": 3798, "epoch": 31, "lr": 9.946674071133221e-05} +{"train_loss": 0.017529509961605072, "global_step": 3799, "epoch": 31, "lr": 9.946641795323735e-05} +{"train_loss": 0.02125570923089981, "global_step": 3800, "epoch": 31, "lr": 9.946609509802047e-05} +{"train_loss": 0.02272476814687252, "global_step": 3801, "epoch": 31, "lr": 9.94657721456822e-05} +{"train_loss": 0.02407180517911911, "global_step": 3802, "epoch": 31, "lr": 9.946544909622318e-05} +{"train_loss": 0.015136840753257275, "global_step": 3803, "epoch": 31, "lr": 9.946512594964404e-05} +{"train_loss": 0.023201635107398033, "global_step": 3804, "epoch": 31, "lr": 9.946480270594538e-05} +{"train_loss": 0.018845388665795326, "global_step": 3805, "epoch": 31, "lr": 9.946447936512788e-05} +{"train_loss": 0.01713475212454796, "global_step": 3806, "epoch": 31, "lr": 9.946415592719216e-05} +{"train_loss": 0.019063339247798718, "global_step": 3807, "epoch": 31, "lr": 9.946383239213885e-05, "val_loss": 0.026903994381427765} +{"train_loss": 0.01493237167596817, "global_step": 3808, "epoch": 32, "lr": 9.946350875996861e-05} +{"train_loss": 0.023136289790272713, "global_step": 3809, "epoch": 32, "lr": 9.946318503068204e-05} +{"train_loss": 0.014116649515926838, "global_step": 3810, "epoch": 32, "lr": 9.946286120427978e-05} +{"train_loss": 0.014829704537987709, "global_step": 3811, "epoch": 32, "lr": 9.946253728076249e-05} +{"train_loss": 0.0192429032176733, "global_step": 3812, "epoch": 32, "lr": 9.946221326013079e-05} +{"train_loss": 0.012172797694802284, "global_step": 3813, "epoch": 32, "lr": 9.946188914238532e-05} +{"train_loss": 0.01710658147931099, "global_step": 3814, "epoch": 32, "lr": 9.946156492752669e-05} +{"train_loss": 0.014589080587029457, "global_step": 3815, "epoch": 32, "lr": 9.94612406155556e-05} +{"train_loss": 0.02356940135359764, "global_step": 3816, "epoch": 32, "lr": 9.946091620647261e-05} +{"train_loss": 0.014926613308489323, "global_step": 3817, "epoch": 32, "lr": 9.946059170027844e-05} +{"train_loss": 0.02302207425236702, "global_step": 3818, "epoch": 32, "lr": 9.946026709697365e-05} +{"train_loss": 0.02205202914774418, "global_step": 3819, "epoch": 32, "lr": 9.945994239655891e-05} +{"train_loss": 0.018680334091186523, "global_step": 3820, "epoch": 32, "lr": 9.945961759903489e-05} +{"train_loss": 0.017528865486383438, "global_step": 3821, "epoch": 32, "lr": 9.945929270440215e-05} +{"train_loss": 0.017576107755303383, "global_step": 3822, "epoch": 32, "lr": 9.94589677126614e-05} +{"train_loss": 0.01823769323527813, "global_step": 3823, "epoch": 32, "lr": 9.945864262381323e-05} +{"train_loss": 0.021007725968956947, "global_step": 3824, "epoch": 32, "lr": 9.945831743785832e-05} +{"train_loss": 0.01922261156141758, "global_step": 3825, "epoch": 32, "lr": 9.945799215479729e-05} +{"train_loss": 0.016024034470319748, "global_step": 3826, "epoch": 32, "lr": 9.945766677463075e-05} +{"train_loss": 0.022862274199724197, "global_step": 3827, "epoch": 32, "lr": 9.94573412973594e-05} +{"train_loss": 0.0196380577981472, "global_step": 3828, "epoch": 32, "lr": 9.945701572298382e-05} +{"train_loss": 0.017365621402859688, "global_step": 3829, "epoch": 32, "lr": 9.945669005150467e-05} +{"train_loss": 0.01840611919760704, "global_step": 3830, "epoch": 32, "lr": 9.945636428292261e-05} +{"train_loss": 0.019174065440893173, "global_step": 3831, "epoch": 32, "lr": 9.945603841723825e-05} +{"train_loss": 0.021330101415514946, "global_step": 3832, "epoch": 32, "lr": 9.945571245445225e-05} +{"train_loss": 0.015110846608877182, "global_step": 3833, "epoch": 32, "lr": 9.945538639456524e-05} +{"train_loss": 0.016567829996347427, "global_step": 3834, "epoch": 32, "lr": 9.945506023757785e-05} +{"train_loss": 0.016569634899497032, "global_step": 3835, "epoch": 32, "lr": 9.945473398349074e-05} +{"train_loss": 0.016964973881840706, "global_step": 3836, "epoch": 32, "lr": 9.945440763230455e-05} +{"train_loss": 0.023950321599841118, "global_step": 3837, "epoch": 32, "lr": 9.945408118401992e-05} +{"train_loss": 0.012181395664811134, "global_step": 3838, "epoch": 32, "lr": 9.945375463863748e-05} +{"train_loss": 0.017835764214396477, "global_step": 3839, "epoch": 32, "lr": 9.945342799615787e-05} +{"train_loss": 0.011977036483585835, "global_step": 3840, "epoch": 32, "lr": 9.945310125658174e-05} +{"train_loss": 0.013387655839323997, "global_step": 3841, "epoch": 32, "lr": 9.945277441990972e-05} +{"train_loss": 0.017563484609127045, "global_step": 3842, "epoch": 32, "lr": 9.945244748614247e-05} +{"train_loss": 0.018898162990808487, "global_step": 3843, "epoch": 32, "lr": 9.945212045528063e-05} +{"train_loss": 0.017575083300471306, "global_step": 3844, "epoch": 32, "lr": 9.945179332732482e-05} +{"train_loss": 0.014632787555456161, "global_step": 3845, "epoch": 32, "lr": 9.94514661022757e-05} +{"train_loss": 0.01996087282896042, "global_step": 3846, "epoch": 32, "lr": 9.945113878013392e-05} +{"train_loss": 0.021921945735812187, "global_step": 3847, "epoch": 32, "lr": 9.945081136090012e-05} +{"train_loss": 0.01675277017056942, "global_step": 3848, "epoch": 32, "lr": 9.94504838445749e-05} +{"train_loss": 0.015723075717687607, "global_step": 3849, "epoch": 32, "lr": 9.945015623115897e-05} +{"train_loss": 0.014415335841476917, "global_step": 3850, "epoch": 32, "lr": 9.944982852065293e-05} +{"train_loss": 0.017887435853481293, "global_step": 3851, "epoch": 32, "lr": 9.944950071305742e-05} +{"train_loss": 0.022060859948396683, "global_step": 3852, "epoch": 32, "lr": 9.944917280837311e-05} +{"train_loss": 0.016865549609065056, "global_step": 3853, "epoch": 32, "lr": 9.944884480660064e-05} +{"train_loss": 0.018109267577528954, "global_step": 3854, "epoch": 32, "lr": 9.944851670774064e-05} +{"train_loss": 0.01738964393734932, "global_step": 3855, "epoch": 32, "lr": 9.944818851179375e-05} +{"train_loss": 0.01599055901169777, "global_step": 3856, "epoch": 32, "lr": 9.944786021876064e-05} +{"train_loss": 0.016673654317855835, "global_step": 3857, "epoch": 32, "lr": 9.944753182864194e-05} +{"train_loss": 0.016582144424319267, "global_step": 3858, "epoch": 32, "lr": 9.944720334143829e-05} +{"train_loss": 0.01292321179062128, "global_step": 3859, "epoch": 32, "lr": 9.944687475715034e-05} +{"train_loss": 0.023883497342467308, "global_step": 3860, "epoch": 32, "lr": 9.944654607577872e-05} +{"train_loss": 0.021288776770234108, "global_step": 3861, "epoch": 32, "lr": 9.94462172973241e-05} +{"train_loss": 0.01919913850724697, "global_step": 3862, "epoch": 32, "lr": 9.944588842178711e-05} +{"train_loss": 0.013301103375852108, "global_step": 3863, "epoch": 32, "lr": 9.944555944916841e-05} +{"train_loss": 0.01995972916483879, "global_step": 3864, "epoch": 32, "lr": 9.944523037946863e-05} +{"train_loss": 0.020706629380583763, "global_step": 3865, "epoch": 32, "lr": 9.944490121268844e-05} +{"train_loss": 0.016059936955571175, "global_step": 3866, "epoch": 32, "lr": 9.944457194882843e-05} +{"train_loss": 0.015799425542354584, "global_step": 3867, "epoch": 32, "lr": 9.944424258788932e-05} +{"train_loss": 0.012833688408136368, "global_step": 3868, "epoch": 32, "lr": 9.944391312987171e-05} +{"train_loss": 0.015845095738768578, "global_step": 3869, "epoch": 32, "lr": 9.944358357477626e-05} +{"train_loss": 0.015195329673588276, "global_step": 3870, "epoch": 32, "lr": 9.944325392260362e-05} +{"train_loss": 0.019689369946718216, "global_step": 3871, "epoch": 32, "lr": 9.944292417335442e-05} +{"train_loss": 0.017824022099375725, "global_step": 3872, "epoch": 32, "lr": 9.944259432702934e-05} +{"train_loss": 0.017739657312631607, "global_step": 3873, "epoch": 32, "lr": 9.944226438362899e-05} +{"train_loss": 0.01413089781999588, "global_step": 3874, "epoch": 32, "lr": 9.944193434315405e-05} +{"train_loss": 0.0197746679186821, "global_step": 3875, "epoch": 32, "lr": 9.944160420560514e-05} +{"train_loss": 0.018313979730010033, "global_step": 3876, "epoch": 32, "lr": 9.944127397098293e-05} +{"train_loss": 0.021442610770463943, "global_step": 3877, "epoch": 32, "lr": 9.944094363928807e-05} +{"train_loss": 0.013798829168081284, "global_step": 3878, "epoch": 32, "lr": 9.944061321052119e-05} +{"train_loss": 0.017427384853363037, "global_step": 3879, "epoch": 32, "lr": 9.944028268468294e-05} +{"train_loss": 0.013964913785457611, "global_step": 3880, "epoch": 32, "lr": 9.943995206177399e-05} +{"train_loss": 0.01734185591340065, "global_step": 3881, "epoch": 32, "lr": 9.943962134179496e-05} +{"train_loss": 0.020610176026821136, "global_step": 3882, "epoch": 32, "lr": 9.943929052474653e-05} +{"train_loss": 0.016181310638785362, "global_step": 3883, "epoch": 32, "lr": 9.943895961062934e-05} +{"train_loss": 0.014673976227641106, "global_step": 3884, "epoch": 32, "lr": 9.943862859944401e-05} +{"train_loss": 0.022492635995149612, "global_step": 3885, "epoch": 32, "lr": 9.943829749119123e-05} +{"train_loss": 0.014850100502371788, "global_step": 3886, "epoch": 32, "lr": 9.943796628587165e-05} +{"train_loss": 0.012083126232028008, "global_step": 3887, "epoch": 32, "lr": 9.943763498348588e-05} +{"train_loss": 0.014862465672194958, "global_step": 3888, "epoch": 32, "lr": 9.94373035840346e-05} +{"train_loss": 0.02280428074300289, "global_step": 3889, "epoch": 32, "lr": 9.943697208751846e-05} +{"train_loss": 0.013018355704843998, "global_step": 3890, "epoch": 32, "lr": 9.943664049393811e-05} +{"train_loss": 0.01535478513687849, "global_step": 3891, "epoch": 32, "lr": 9.94363088032942e-05} +{"train_loss": 0.021367229521274567, "global_step": 3892, "epoch": 32, "lr": 9.943597701558738e-05} +{"train_loss": 0.01661611720919609, "global_step": 3893, "epoch": 32, "lr": 9.943564513081829e-05} +{"train_loss": 0.01766594499349594, "global_step": 3894, "epoch": 32, "lr": 9.94353131489876e-05} +{"train_loss": 0.026757054030895233, "global_step": 3895, "epoch": 32, "lr": 9.943498107009594e-05} +{"train_loss": 0.015858791768550873, "global_step": 3896, "epoch": 32, "lr": 9.9434648894144e-05} +{"train_loss": 0.020940057933330536, "global_step": 3897, "epoch": 32, "lr": 9.943431662113239e-05} +{"train_loss": 0.012566016986966133, "global_step": 3898, "epoch": 32, "lr": 9.943398425106178e-05} +{"train_loss": 0.020806673914194107, "global_step": 3899, "epoch": 32, "lr": 9.943365178393284e-05} +{"train_loss": 0.015171313658356667, "global_step": 3900, "epoch": 32, "lr": 9.943331921974619e-05} +{"train_loss": 0.01540936529636383, "global_step": 3901, "epoch": 32, "lr": 9.94329865585025e-05} +{"train_loss": 0.01696660742163658, "global_step": 3902, "epoch": 32, "lr": 9.943265380020243e-05} +{"train_loss": 0.03082340583205223, "global_step": 3903, "epoch": 32, "lr": 9.943232094484662e-05} +{"train_loss": 0.015117119997739792, "global_step": 3904, "epoch": 32, "lr": 9.943198799243574e-05} +{"train_loss": 0.012584758922457695, "global_step": 3905, "epoch": 32, "lr": 9.943165494297043e-05} +{"train_loss": 0.021782267838716507, "global_step": 3906, "epoch": 32, "lr": 9.943132179645132e-05} +{"train_loss": 0.02239142172038555, "global_step": 3907, "epoch": 32, "lr": 9.943098855287911e-05} +{"train_loss": 0.018631018698215485, "global_step": 3908, "epoch": 32, "lr": 9.943065521225444e-05} +{"train_loss": 0.03013530559837818, "global_step": 3909, "epoch": 32, "lr": 9.943032177457795e-05} +{"train_loss": 0.022189516574144363, "global_step": 3910, "epoch": 32, "lr": 9.942998823985032e-05} +{"train_loss": 0.015297824516892433, "global_step": 3911, "epoch": 32, "lr": 9.942965460807216e-05} +{"train_loss": 0.019642125815153122, "global_step": 3912, "epoch": 32, "lr": 9.942932087924418e-05} +{"train_loss": 0.019394375383853912, "global_step": 3913, "epoch": 32, "lr": 9.9428987053367e-05} +{"train_loss": 0.023555317893624306, "global_step": 3914, "epoch": 32, "lr": 9.942865313044129e-05} +{"train_loss": 0.023141277953982353, "global_step": 3915, "epoch": 32, "lr": 9.942831911046769e-05} +{"train_loss": 0.020517073571681976, "global_step": 3916, "epoch": 32, "lr": 9.942798499344688e-05} +{"train_loss": 0.025897638872265816, "global_step": 3917, "epoch": 32, "lr": 9.942765077937948e-05} +{"train_loss": 0.022318225353956223, "global_step": 3918, "epoch": 32, "lr": 9.942731646826618e-05} +{"train_loss": 0.017992740496993065, "global_step": 3919, "epoch": 32, "lr": 9.942698206010763e-05} +{"train_loss": 0.020100286230444908, "global_step": 3920, "epoch": 32, "lr": 9.942664755490447e-05} +{"train_loss": 0.021554263308644295, "global_step": 3921, "epoch": 32, "lr": 9.942631295265738e-05} +{"train_loss": 0.022661613300442696, "global_step": 3922, "epoch": 32, "lr": 9.942597825336702e-05} +{"train_loss": 0.02125188335776329, "global_step": 3923, "epoch": 32, "lr": 9.9425643457034e-05} +{"train_loss": 0.015468315221369267, "global_step": 3924, "epoch": 32, "lr": 9.942530856365902e-05} +{"train_loss": 0.019652802497148514, "global_step": 3925, "epoch": 32, "lr": 9.942497357324272e-05} +{"train_loss": 0.01823609008477265, "global_step": 3926, "epoch": 32, "lr": 9.942463848578578e-05, "val_loss": 0.021965267136693} +{"train_loss": 0.018832091242074966, "global_step": 3927, "epoch": 33, "lr": 9.942430330128884e-05} +{"train_loss": 0.02314714901149273, "global_step": 3928, "epoch": 33, "lr": 9.942396801975256e-05} +{"train_loss": 0.020137766376137733, "global_step": 3929, "epoch": 33, "lr": 9.94236326411776e-05} +{"train_loss": 0.020302295684814453, "global_step": 3930, "epoch": 33, "lr": 9.94232971655646e-05} +{"train_loss": 0.018285684287548065, "global_step": 3931, "epoch": 33, "lr": 9.942296159291426e-05} +{"train_loss": 0.02688463032245636, "global_step": 3932, "epoch": 33, "lr": 9.94226259232272e-05} +{"train_loss": 0.022621773183345795, "global_step": 3933, "epoch": 33, "lr": 9.94222901565041e-05} +{"train_loss": 0.012102781794965267, "global_step": 3934, "epoch": 33, "lr": 9.942195429274561e-05} +{"train_loss": 0.018097469583153725, "global_step": 3935, "epoch": 33, "lr": 9.94216183319524e-05} +{"train_loss": 0.02421620860695839, "global_step": 3936, "epoch": 33, "lr": 9.94212822741251e-05} +{"train_loss": 0.009718013927340508, "global_step": 3937, "epoch": 33, "lr": 9.942094611926443e-05} +{"train_loss": 0.029980357736349106, "global_step": 3938, "epoch": 33, "lr": 9.942060986737098e-05} +{"train_loss": 0.01260469015687704, "global_step": 3939, "epoch": 33, "lr": 9.942027351844545e-05} +{"train_loss": 0.017155088484287262, "global_step": 3940, "epoch": 33, "lr": 9.94199370724885e-05} +{"train_loss": 0.017142485827207565, "global_step": 3941, "epoch": 33, "lr": 9.941960052950078e-05} +{"train_loss": 0.019035007804632187, "global_step": 3942, "epoch": 33, "lr": 9.941926388948296e-05} +{"train_loss": 0.018499035388231277, "global_step": 3943, "epoch": 33, "lr": 9.941892715243568e-05} +{"train_loss": 0.014904029667377472, "global_step": 3944, "epoch": 33, "lr": 9.941859031835963e-05} +{"train_loss": 0.027025319635868073, "global_step": 3945, "epoch": 33, "lr": 9.941825338725546e-05} +{"train_loss": 0.015297828242182732, "global_step": 3946, "epoch": 33, "lr": 9.941791635912381e-05} +{"train_loss": 0.017619218677282333, "global_step": 3947, "epoch": 33, "lr": 9.941757923396537e-05} +{"train_loss": 0.015782438218593597, "global_step": 3948, "epoch": 33, "lr": 9.94172420117808e-05} +{"train_loss": 0.0201709121465683, "global_step": 3949, "epoch": 33, "lr": 9.941690469257075e-05} +{"train_loss": 0.020643793046474457, "global_step": 3950, "epoch": 33, "lr": 9.941656727633588e-05} +{"train_loss": 0.02079462632536888, "global_step": 3951, "epoch": 33, "lr": 9.941622976307688e-05} +{"train_loss": 0.01604827120900154, "global_step": 3952, "epoch": 33, "lr": 9.941589215279437e-05} +{"train_loss": 0.01838870905339718, "global_step": 3953, "epoch": 33, "lr": 9.941555444548904e-05} +{"train_loss": 0.018684890121221542, "global_step": 3954, "epoch": 33, "lr": 9.941521664116156e-05} +{"train_loss": 0.015815984457731247, "global_step": 3955, "epoch": 33, "lr": 9.941487873981257e-05} +{"train_loss": 0.014251035638153553, "global_step": 3956, "epoch": 33, "lr": 9.941454074144275e-05} +{"train_loss": 0.015868350863456726, "global_step": 3957, "epoch": 33, "lr": 9.941420264605275e-05} +{"train_loss": 0.012902098707854748, "global_step": 3958, "epoch": 33, "lr": 9.941386445364325e-05} +{"train_loss": 0.01773100718855858, "global_step": 3959, "epoch": 33, "lr": 9.94135261642149e-05} +{"train_loss": 0.01593257486820221, "global_step": 3960, "epoch": 33, "lr": 9.941318777776838e-05} +{"train_loss": 0.01458224467933178, "global_step": 3961, "epoch": 33, "lr": 9.941284929430433e-05} +{"train_loss": 0.016362948343157768, "global_step": 3962, "epoch": 33, "lr": 9.941251071382345e-05} +{"train_loss": 0.020711911842226982, "global_step": 3963, "epoch": 33, "lr": 9.941217203632636e-05} +{"train_loss": 0.014937769621610641, "global_step": 3964, "epoch": 33, "lr": 9.941183326181377e-05} +{"train_loss": 0.020539548248052597, "global_step": 3965, "epoch": 33, "lr": 9.941149439028632e-05} +{"train_loss": 0.016341589391231537, "global_step": 3966, "epoch": 33, "lr": 9.941115542174468e-05} +{"train_loss": 0.023375341668725014, "global_step": 3967, "epoch": 33, "lr": 9.94108163561895e-05} +{"train_loss": 0.017124010249972343, "global_step": 3968, "epoch": 33, "lr": 9.941047719362148e-05} +{"train_loss": 0.020970823243260384, "global_step": 3969, "epoch": 33, "lr": 9.941013793404126e-05} +{"train_loss": 0.01789732091128826, "global_step": 3970, "epoch": 33, "lr": 9.94097985774495e-05} +{"train_loss": 0.013526956550776958, "global_step": 3971, "epoch": 33, "lr": 9.940945912384689e-05} +{"train_loss": 0.019415244460105896, "global_step": 3972, "epoch": 33, "lr": 9.940911957323408e-05} +{"train_loss": 0.017138071358203888, "global_step": 3973, "epoch": 33, "lr": 9.940877992561176e-05} +{"train_loss": 0.016820160672068596, "global_step": 3974, "epoch": 33, "lr": 9.940844018098057e-05} +{"train_loss": 0.02011336199939251, "global_step": 3975, "epoch": 33, "lr": 9.940810033934119e-05} +{"train_loss": 0.02164522372186184, "global_step": 3976, "epoch": 33, "lr": 9.940776040069427e-05} +{"train_loss": 0.01633995771408081, "global_step": 3977, "epoch": 33, "lr": 9.94074203650405e-05} +{"train_loss": 0.019237173721194267, "global_step": 3978, "epoch": 33, "lr": 9.940708023238055e-05} +{"train_loss": 0.013111838139593601, "global_step": 3979, "epoch": 33, "lr": 9.940674000271505e-05} +{"train_loss": 0.019289886578917503, "global_step": 3980, "epoch": 33, "lr": 9.94063996760447e-05} +{"train_loss": 0.017797641456127167, "global_step": 3981, "epoch": 33, "lr": 9.940605925237017e-05} +{"train_loss": 0.02075081132352352, "global_step": 3982, "epoch": 33, "lr": 9.940571873169214e-05} +{"train_loss": 0.02312135510146618, "global_step": 3983, "epoch": 33, "lr": 9.940537811401123e-05} +{"train_loss": 0.012752484530210495, "global_step": 3984, "epoch": 33, "lr": 9.940503739932816e-05} +{"train_loss": 0.0185439120978117, "global_step": 3985, "epoch": 33, "lr": 9.940469658764355e-05} +{"train_loss": 0.018035510554909706, "global_step": 3986, "epoch": 33, "lr": 9.940435567895811e-05} +{"train_loss": 0.016995035111904144, "global_step": 3987, "epoch": 33, "lr": 9.940401467327251e-05} +{"train_loss": 0.024213526397943497, "global_step": 3988, "epoch": 33, "lr": 9.940367357058739e-05} +{"train_loss": 0.015797479078173637, "global_step": 3989, "epoch": 33, "lr": 9.940333237090345e-05} +{"train_loss": 0.016700580716133118, "global_step": 3990, "epoch": 33, "lr": 9.940299107422133e-05} +{"train_loss": 0.0126098757609725, "global_step": 3991, "epoch": 33, "lr": 9.940264968054171e-05} +{"train_loss": 0.021253475919365883, "global_step": 3992, "epoch": 33, "lr": 9.940230818986526e-05} +{"train_loss": 0.024228377267718315, "global_step": 3993, "epoch": 33, "lr": 9.940196660219267e-05} +{"train_loss": 0.02436595782637596, "global_step": 3994, "epoch": 33, "lr": 9.940162491752461e-05} +{"train_loss": 0.014766045846045017, "global_step": 3995, "epoch": 33, "lr": 9.940128313586173e-05} +{"train_loss": 0.02263142727315426, "global_step": 3996, "epoch": 33, "lr": 9.94009412572047e-05} +{"train_loss": 0.016096627339720726, "global_step": 3997, "epoch": 33, "lr": 9.94005992815542e-05} +{"train_loss": 0.021695103496313095, "global_step": 3998, "epoch": 33, "lr": 9.94002572089109e-05} +{"train_loss": 0.01125921867787838, "global_step": 3999, "epoch": 33, "lr": 9.939991503927547e-05} +{"train_loss": 0.01947042904794216, "global_step": 4000, "epoch": 33, "lr": 9.93995727726486e-05} +{"train_loss": 0.017921485006809235, "global_step": 4001, "epoch": 33, "lr": 9.939923040903091e-05} +{"train_loss": 0.01986895501613617, "global_step": 4002, "epoch": 33, "lr": 9.939888794842315e-05} +{"train_loss": 0.019017690792679787, "global_step": 4003, "epoch": 33, "lr": 9.939854539082594e-05} +{"train_loss": 0.016123853623867035, "global_step": 4004, "epoch": 33, "lr": 9.939820273623996e-05} +{"train_loss": 0.012562716379761696, "global_step": 4005, "epoch": 33, "lr": 9.939785998466587e-05} +{"train_loss": 0.02110319584608078, "global_step": 4006, "epoch": 33, "lr": 9.939751713610438e-05} +{"train_loss": 0.017088020220398903, "global_step": 4007, "epoch": 33, "lr": 9.939717419055614e-05} +{"train_loss": 0.021987207233905792, "global_step": 4008, "epoch": 33, "lr": 9.939683114802182e-05} +{"train_loss": 0.013737999834120274, "global_step": 4009, "epoch": 33, "lr": 9.939648800850209e-05} +{"train_loss": 0.015282721258699894, "global_step": 4010, "epoch": 33, "lr": 9.939614477199766e-05} +{"train_loss": 0.015773935243487358, "global_step": 4011, "epoch": 33, "lr": 9.939580143850915e-05} +{"train_loss": 0.02066165581345558, "global_step": 4012, "epoch": 33, "lr": 9.939545800803728e-05} +{"train_loss": 0.020840980112552643, "global_step": 4013, "epoch": 33, "lr": 9.93951144805827e-05} +{"train_loss": 0.012646949850022793, "global_step": 4014, "epoch": 33, "lr": 9.939477085614608e-05} +{"train_loss": 0.013473929837346077, "global_step": 4015, "epoch": 33, "lr": 9.939442713472812e-05} +{"train_loss": 0.017742319032549858, "global_step": 4016, "epoch": 33, "lr": 9.939408331632947e-05} +{"train_loss": 0.019310632720589638, "global_step": 4017, "epoch": 33, "lr": 9.939373940095081e-05} +{"train_loss": 0.018807953223586082, "global_step": 4018, "epoch": 33, "lr": 9.939339538859283e-05} +{"train_loss": 0.024116072803735733, "global_step": 4019, "epoch": 33, "lr": 9.939305127925619e-05} +{"train_loss": 0.016197433695197105, "global_step": 4020, "epoch": 33, "lr": 9.939270707294157e-05} +{"train_loss": 0.015608144924044609, "global_step": 4021, "epoch": 33, "lr": 9.939236276964965e-05} +{"train_loss": 0.014190243557095528, "global_step": 4022, "epoch": 33, "lr": 9.93920183693811e-05} +{"train_loss": 0.02406293898820877, "global_step": 4023, "epoch": 33, "lr": 9.939167387213661e-05} +{"train_loss": 0.022093122825026512, "global_step": 4024, "epoch": 33, "lr": 9.939132927791683e-05} +{"train_loss": 0.022138601168990135, "global_step": 4025, "epoch": 33, "lr": 9.939098458672245e-05} +{"train_loss": 0.018391404300928116, "global_step": 4026, "epoch": 33, "lr": 9.939063979855415e-05} +{"train_loss": 0.02345312014222145, "global_step": 4027, "epoch": 33, "lr": 9.93902949134126e-05} +{"train_loss": 0.01841181516647339, "global_step": 4028, "epoch": 33, "lr": 9.93899499312985e-05} +{"train_loss": 0.023550352081656456, "global_step": 4029, "epoch": 33, "lr": 9.938960485221251e-05} +{"train_loss": 0.022664131596684456, "global_step": 4030, "epoch": 33, "lr": 9.93892596761553e-05} +{"train_loss": 0.016598422080278397, "global_step": 4031, "epoch": 33, "lr": 9.938891440312755e-05} +{"train_loss": 0.026071177795529366, "global_step": 4032, "epoch": 33, "lr": 9.938856903312995e-05} +{"train_loss": 0.020963389426469803, "global_step": 4033, "epoch": 33, "lr": 9.938822356616317e-05} +{"train_loss": 0.015548723749816418, "global_step": 4034, "epoch": 33, "lr": 9.938787800222789e-05} +{"train_loss": 0.01785369962453842, "global_step": 4035, "epoch": 33, "lr": 9.938753234132478e-05} +{"train_loss": 0.022372327744960785, "global_step": 4036, "epoch": 33, "lr": 9.938718658345454e-05} +{"train_loss": 0.01965051144361496, "global_step": 4037, "epoch": 33, "lr": 9.938684072861783e-05} +{"train_loss": 0.03091464936733246, "global_step": 4038, "epoch": 33, "lr": 9.938649477681532e-05} +{"train_loss": 0.0272048432379961, "global_step": 4039, "epoch": 33, "lr": 9.938614872804773e-05} +{"train_loss": 0.021983793005347252, "global_step": 4040, "epoch": 33, "lr": 9.93858025823157e-05} +{"train_loss": 0.020577341318130493, "global_step": 4041, "epoch": 33, "lr": 9.938545633961991e-05} +{"train_loss": 0.014149191789329052, "global_step": 4042, "epoch": 33, "lr": 9.938510999996107e-05} +{"train_loss": 0.015121021308004856, "global_step": 4043, "epoch": 33, "lr": 9.938476356333983e-05} +{"train_loss": 0.023825310170650482, "global_step": 4044, "epoch": 33, "lr": 9.938441702975689e-05} +{"train_loss": 0.01872933267795739, "global_step": 4045, "epoch": 33, "lr": 9.938407039921293e-05, "val_loss": 0.02705894038081169} +{"train_loss": 0.016200095415115356, "global_step": 4046, "epoch": 34, "lr": 9.938372367170861e-05} +{"train_loss": 0.01803094521164894, "global_step": 4047, "epoch": 34, "lr": 9.938337684724463e-05} +{"train_loss": 0.01681794971227646, "global_step": 4048, "epoch": 34, "lr": 9.938302992582167e-05} +{"train_loss": 0.01485341228544712, "global_step": 4049, "epoch": 34, "lr": 9.93826829074404e-05} +{"train_loss": 0.018512193113565445, "global_step": 4050, "epoch": 34, "lr": 9.938233579210151e-05} +{"train_loss": 0.02002536505460739, "global_step": 4051, "epoch": 34, "lr": 9.938198857980568e-05} +{"train_loss": 0.018169647082686424, "global_step": 4052, "epoch": 34, "lr": 9.938164127055359e-05} +{"train_loss": 0.02421359159052372, "global_step": 4053, "epoch": 34, "lr": 9.938129386434593e-05} +{"train_loss": 0.013439055532217026, "global_step": 4054, "epoch": 34, "lr": 9.938094636118336e-05} +{"train_loss": 0.01915609836578369, "global_step": 4055, "epoch": 34, "lr": 9.93805987610666e-05} +{"train_loss": 0.021216560155153275, "global_step": 4056, "epoch": 34, "lr": 9.93802510639963e-05} +{"train_loss": 0.015241638757288456, "global_step": 4057, "epoch": 34, "lr": 9.937990326997313e-05} +{"train_loss": 0.021539535373449326, "global_step": 4058, "epoch": 34, "lr": 9.937955537899781e-05} +{"train_loss": 0.014490386471152306, "global_step": 4059, "epoch": 34, "lr": 9.937920739107103e-05} +{"train_loss": 0.017976069822907448, "global_step": 4060, "epoch": 34, "lr": 9.937885930619343e-05} +{"train_loss": 0.01614310033619404, "global_step": 4061, "epoch": 34, "lr": 9.937851112436571e-05} +{"train_loss": 0.016884760931134224, "global_step": 4062, "epoch": 34, "lr": 9.937816284558857e-05} +{"train_loss": 0.012909776531159878, "global_step": 4063, "epoch": 34, "lr": 9.937781446986268e-05} +{"train_loss": 0.01230370718985796, "global_step": 4064, "epoch": 34, "lr": 9.937746599718873e-05} +{"train_loss": 0.015893155708909035, "global_step": 4065, "epoch": 34, "lr": 9.93771174275674e-05} +{"train_loss": 0.018320851027965546, "global_step": 4066, "epoch": 34, "lr": 9.937676876099938e-05} +{"train_loss": 0.014249402098357677, "global_step": 4067, "epoch": 34, "lr": 9.937641999748534e-05} +{"train_loss": 0.018689332529902458, "global_step": 4068, "epoch": 34, "lr": 9.937607113702598e-05} +{"train_loss": 0.028291622176766396, "global_step": 4069, "epoch": 34, "lr": 9.937572217962196e-05} +{"train_loss": 0.02517613396048546, "global_step": 4070, "epoch": 34, "lr": 9.937537312527401e-05} +{"train_loss": 0.018746832385659218, "global_step": 4071, "epoch": 34, "lr": 9.937502397398278e-05} +{"train_loss": 0.012240124866366386, "global_step": 4072, "epoch": 34, "lr": 9.937467472574897e-05} +{"train_loss": 0.012030106037855148, "global_step": 4073, "epoch": 34, "lr": 9.937432538057325e-05} +{"train_loss": 0.01846723072230816, "global_step": 4074, "epoch": 34, "lr": 9.937397593845634e-05} +{"train_loss": 0.01794295944273472, "global_step": 4075, "epoch": 34, "lr": 9.937362639939888e-05} +{"train_loss": 0.017423562705516815, "global_step": 4076, "epoch": 34, "lr": 9.937327676340158e-05} +{"train_loss": 0.020960349589586258, "global_step": 4077, "epoch": 34, "lr": 9.937292703046515e-05} +{"train_loss": 0.014744075946509838, "global_step": 4078, "epoch": 34, "lr": 9.937257720059022e-05} +{"train_loss": 0.016684353351593018, "global_step": 4079, "epoch": 34, "lr": 9.937222727377753e-05} +{"train_loss": 0.01995374634861946, "global_step": 4080, "epoch": 34, "lr": 9.937187725002774e-05} +{"train_loss": 0.017871404066681862, "global_step": 4081, "epoch": 34, "lr": 9.937152712934154e-05} +{"train_loss": 0.012587634846568108, "global_step": 4082, "epoch": 34, "lr": 9.937117691171962e-05} +{"train_loss": 0.018493860960006714, "global_step": 4083, "epoch": 34, "lr": 9.937082659716269e-05} +{"train_loss": 0.018596453592181206, "global_step": 4084, "epoch": 34, "lr": 9.937047618567138e-05} +{"train_loss": 0.017748797312378883, "global_step": 4085, "epoch": 34, "lr": 9.937012567724645e-05} +{"train_loss": 0.014394392259418964, "global_step": 4086, "epoch": 34, "lr": 9.936977507188854e-05} +{"train_loss": 0.01655319146811962, "global_step": 4087, "epoch": 34, "lr": 9.936942436959836e-05} +{"train_loss": 0.020188424736261368, "global_step": 4088, "epoch": 34, "lr": 9.936907357037657e-05} +{"train_loss": 0.01629573293030262, "global_step": 4089, "epoch": 34, "lr": 9.936872267422388e-05} +{"train_loss": 0.017586957663297653, "global_step": 4090, "epoch": 34, "lr": 9.9368371681141e-05} +{"train_loss": 0.015984613448381424, "global_step": 4091, "epoch": 34, "lr": 9.936802059112856e-05} +{"train_loss": 0.019393466413021088, "global_step": 4092, "epoch": 34, "lr": 9.936766940418731e-05} +{"train_loss": 0.019645189866423607, "global_step": 4093, "epoch": 34, "lr": 9.936731812031792e-05} +{"train_loss": 0.019710596650838852, "global_step": 4094, "epoch": 34, "lr": 9.936696673952106e-05} +{"train_loss": 0.020362457260489464, "global_step": 4095, "epoch": 34, "lr": 9.936661526179745e-05} +{"train_loss": 0.0163729265332222, "global_step": 4096, "epoch": 34, "lr": 9.936626368714774e-05} +{"train_loss": 0.024822648614645004, "global_step": 4097, "epoch": 34, "lr": 9.936591201557268e-05} +{"train_loss": 0.01535908691585064, "global_step": 4098, "epoch": 34, "lr": 9.93655602470729e-05} +{"train_loss": 0.0151201281696558, "global_step": 4099, "epoch": 34, "lr": 9.936520838164912e-05} +{"train_loss": 0.016453733667731285, "global_step": 4100, "epoch": 34, "lr": 9.936485641930203e-05} +{"train_loss": 0.019314100965857506, "global_step": 4101, "epoch": 34, "lr": 9.936450436003233e-05} +{"train_loss": 0.01763417385518551, "global_step": 4102, "epoch": 34, "lr": 9.936415220384068e-05} +{"train_loss": 0.020910145714879036, "global_step": 4103, "epoch": 34, "lr": 9.93637999507278e-05} +{"train_loss": 0.020242704078555107, "global_step": 4104, "epoch": 34, "lr": 9.936344760069437e-05} +{"train_loss": 0.020751366391777992, "global_step": 4105, "epoch": 34, "lr": 9.936309515374109e-05} +{"train_loss": 0.019907105714082718, "global_step": 4106, "epoch": 34, "lr": 9.936274260986865e-05} +{"train_loss": 0.01887076534330845, "global_step": 4107, "epoch": 34, "lr": 9.936238996907772e-05} +{"train_loss": 0.014549186453223228, "global_step": 4108, "epoch": 34, "lr": 9.936203723136903e-05} +{"train_loss": 0.01958698034286499, "global_step": 4109, "epoch": 34, "lr": 9.936168439674324e-05} +{"train_loss": 0.022732233628630638, "global_step": 4110, "epoch": 34, "lr": 9.936133146520106e-05} +{"train_loss": 0.01938779093325138, "global_step": 4111, "epoch": 34, "lr": 9.936097843674319e-05} +{"train_loss": 0.019383680075407028, "global_step": 4112, "epoch": 34, "lr": 9.93606253113703e-05} +{"train_loss": 0.01778186485171318, "global_step": 4113, "epoch": 34, "lr": 9.93602720890831e-05} +{"train_loss": 0.013665099628269672, "global_step": 4114, "epoch": 34, "lr": 9.935991876988227e-05} +{"train_loss": 0.025085123255848885, "global_step": 4115, "epoch": 34, "lr": 9.935956535376853e-05} +{"train_loss": 0.016464723274111748, "global_step": 4116, "epoch": 34, "lr": 9.935921184074255e-05} +{"train_loss": 0.020710622891783714, "global_step": 4117, "epoch": 34, "lr": 9.935885823080502e-05} +{"train_loss": 0.01652589999139309, "global_step": 4118, "epoch": 34, "lr": 9.935850452395665e-05} +{"train_loss": 0.020784329622983932, "global_step": 4119, "epoch": 34, "lr": 9.935815072019814e-05} +{"train_loss": 0.015814879909157753, "global_step": 4120, "epoch": 34, "lr": 9.935779681953018e-05} +{"train_loss": 0.015412503853440285, "global_step": 4121, "epoch": 34, "lr": 9.935744282195343e-05} +{"train_loss": 0.01868802309036255, "global_step": 4122, "epoch": 34, "lr": 9.935708872746863e-05} +{"train_loss": 0.01701154001057148, "global_step": 4123, "epoch": 34, "lr": 9.935673453607647e-05} +{"train_loss": 0.017764929682016373, "global_step": 4124, "epoch": 34, "lr": 9.935638024777763e-05} +{"train_loss": 0.016432583332061768, "global_step": 4125, "epoch": 34, "lr": 9.93560258625728e-05} +{"train_loss": 0.016430765390396118, "global_step": 4126, "epoch": 34, "lr": 9.935567138046269e-05} +{"train_loss": 0.015602372586727142, "global_step": 4127, "epoch": 34, "lr": 9.935531680144799e-05} +{"train_loss": 0.016987737268209457, "global_step": 4128, "epoch": 34, "lr": 9.935496212552939e-05} +{"train_loss": 0.015862800180912018, "global_step": 4129, "epoch": 34, "lr": 9.935460735270762e-05} +{"train_loss": 0.021531717851758003, "global_step": 4130, "epoch": 34, "lr": 9.935425248298333e-05} +{"train_loss": 0.016026385128498077, "global_step": 4131, "epoch": 34, "lr": 9.935389751635724e-05} +{"train_loss": 0.01546353381127119, "global_step": 4132, "epoch": 34, "lr": 9.935354245283006e-05} +{"train_loss": 0.01771526224911213, "global_step": 4133, "epoch": 34, "lr": 9.935318729240246e-05} +{"train_loss": 0.011202718131244183, "global_step": 4134, "epoch": 34, "lr": 9.935283203507515e-05} +{"train_loss": 0.018747935071587563, "global_step": 4135, "epoch": 34, "lr": 9.935247668084884e-05} +{"train_loss": 0.018557662144303322, "global_step": 4136, "epoch": 34, "lr": 9.93521212297242e-05} +{"train_loss": 0.016040440648794174, "global_step": 4137, "epoch": 34, "lr": 9.935176568170195e-05} +{"train_loss": 0.01576046645641327, "global_step": 4138, "epoch": 34, "lr": 9.935141003678277e-05} +{"train_loss": 0.01175337191671133, "global_step": 4139, "epoch": 34, "lr": 9.935105429496737e-05} +{"train_loss": 0.013487868010997772, "global_step": 4140, "epoch": 34, "lr": 9.935069845625646e-05} +{"train_loss": 0.017510665580630302, "global_step": 4141, "epoch": 34, "lr": 9.935034252065072e-05} +{"train_loss": 0.015246153809130192, "global_step": 4142, "epoch": 34, "lr": 9.934998648815085e-05} +{"train_loss": 0.013416014611721039, "global_step": 4143, "epoch": 34, "lr": 9.934963035875756e-05} +{"train_loss": 0.015549489296972752, "global_step": 4144, "epoch": 34, "lr": 9.934927413247152e-05} +{"train_loss": 0.014077846892178059, "global_step": 4145, "epoch": 34, "lr": 9.934891780929349e-05} +{"train_loss": 0.025240132585167885, "global_step": 4146, "epoch": 34, "lr": 9.93485613892241e-05} +{"train_loss": 0.01740342192351818, "global_step": 4147, "epoch": 34, "lr": 9.93482048722641e-05} +{"train_loss": 0.0210585854947567, "global_step": 4148, "epoch": 34, "lr": 9.934784825841416e-05} +{"train_loss": 0.014000642113387585, "global_step": 4149, "epoch": 34, "lr": 9.934749154767502e-05} +{"train_loss": 0.022758297622203827, "global_step": 4150, "epoch": 34, "lr": 9.934713474004734e-05} +{"train_loss": 0.020164791494607925, "global_step": 4151, "epoch": 34, "lr": 9.934677783553182e-05} +{"train_loss": 0.011722364462912083, "global_step": 4152, "epoch": 34, "lr": 9.934642083412918e-05} +{"train_loss": 0.02000395394861698, "global_step": 4153, "epoch": 34, "lr": 9.93460637358401e-05} +{"train_loss": 0.014542898163199425, "global_step": 4154, "epoch": 34, "lr": 9.934570654066531e-05} +{"train_loss": 0.01770378090441227, "global_step": 4155, "epoch": 34, "lr": 9.93453492486055e-05} +{"train_loss": 0.014600795693695545, "global_step": 4156, "epoch": 34, "lr": 9.934499185966137e-05} +{"train_loss": 0.02070305310189724, "global_step": 4157, "epoch": 34, "lr": 9.934463437383362e-05} +{"train_loss": 0.016132742166519165, "global_step": 4158, "epoch": 34, "lr": 9.934427679112293e-05} +{"train_loss": 0.018800966441631317, "global_step": 4159, "epoch": 34, "lr": 9.934391911153005e-05} +{"train_loss": 0.011513282544910908, "global_step": 4160, "epoch": 34, "lr": 9.934356133505564e-05} +{"train_loss": 0.021944431588053703, "global_step": 4161, "epoch": 34, "lr": 9.934320346170042e-05} +{"train_loss": 0.014797280542552471, "global_step": 4162, "epoch": 34, "lr": 9.934284549146511e-05} +{"train_loss": 0.020171549171209335, "global_step": 4163, "epoch": 34, "lr": 9.934248742435038e-05} +{"train_loss": 0.017624539299672393, "global_step": 4164, "epoch": 34, "lr": 9.934212926035695e-05, "val_loss": 0.030122894793748856} +{"train_loss": 0.01513589359819889, "global_step": 4165, "epoch": 35, "lr": 9.934177099948551e-05} +{"train_loss": 0.01921643689274788, "global_step": 4166, "epoch": 35, "lr": 9.93414126417368e-05} +{"train_loss": 0.01831076107919216, "global_step": 4167, "epoch": 35, "lr": 9.934105418711149e-05} +{"train_loss": 0.01706971973180771, "global_step": 4168, "epoch": 35, "lr": 9.934069563561027e-05} +{"train_loss": 0.01564962789416313, "global_step": 4169, "epoch": 35, "lr": 9.934033698723389e-05} +{"train_loss": 0.01865130290389061, "global_step": 4170, "epoch": 35, "lr": 9.9339978241983e-05} +{"train_loss": 0.022359563037753105, "global_step": 4171, "epoch": 35, "lr": 9.933961939985837e-05} +{"train_loss": 0.022380510345101357, "global_step": 4172, "epoch": 35, "lr": 9.933926046086064e-05} +{"train_loss": 0.01410638727247715, "global_step": 4173, "epoch": 35, "lr": 9.933890142499056e-05} +{"train_loss": 0.017489973455667496, "global_step": 4174, "epoch": 35, "lr": 9.93385422922488e-05} +{"train_loss": 0.016821566969156265, "global_step": 4175, "epoch": 35, "lr": 9.93381830626361e-05} +{"train_loss": 0.014291472733020782, "global_step": 4176, "epoch": 35, "lr": 9.933782373615314e-05} +{"train_loss": 0.01534789614379406, "global_step": 4177, "epoch": 35, "lr": 9.933746431280064e-05} +{"train_loss": 0.017876992002129555, "global_step": 4178, "epoch": 35, "lr": 9.933710479257929e-05} +{"train_loss": 0.01740240305662155, "global_step": 4179, "epoch": 35, "lr": 9.933674517548983e-05} +{"train_loss": 0.016765113919973373, "global_step": 4180, "epoch": 35, "lr": 9.933638546153292e-05} +{"train_loss": 0.02240418829023838, "global_step": 4181, "epoch": 35, "lr": 9.93360256507093e-05} +{"train_loss": 0.012885911390185356, "global_step": 4182, "epoch": 35, "lr": 9.933566574301964e-05} +{"train_loss": 0.01624394953250885, "global_step": 4183, "epoch": 35, "lr": 9.933530573846471e-05} +{"train_loss": 0.018221460282802582, "global_step": 4184, "epoch": 35, "lr": 9.933494563704516e-05} +{"train_loss": 0.013301202096045017, "global_step": 4185, "epoch": 35, "lr": 9.93345854387617e-05} +{"train_loss": 0.021070854738354683, "global_step": 4186, "epoch": 35, "lr": 9.933422514361505e-05} +{"train_loss": 0.013251650147140026, "global_step": 4187, "epoch": 35, "lr": 9.933386475160594e-05} +{"train_loss": 0.012232263572514057, "global_step": 4188, "epoch": 35, "lr": 9.933350426273505e-05} +{"train_loss": 0.01820340007543564, "global_step": 4189, "epoch": 35, "lr": 9.933314367700311e-05} +{"train_loss": 0.015854567289352417, "global_step": 4190, "epoch": 35, "lr": 9.933278299441078e-05} +{"train_loss": 0.016458427533507347, "global_step": 4191, "epoch": 35, "lr": 9.933242221495883e-05} +{"train_loss": 0.02275073155760765, "global_step": 4192, "epoch": 35, "lr": 9.933206133864792e-05} +{"train_loss": 0.022249814122915268, "global_step": 4193, "epoch": 35, "lr": 9.933170036547879e-05} +{"train_loss": 0.018944192677736282, "global_step": 4194, "epoch": 35, "lr": 9.933133929545213e-05} +{"train_loss": 0.02497991733253002, "global_step": 4195, "epoch": 35, "lr": 9.933097812856866e-05} +{"train_loss": 0.014817384071648121, "global_step": 4196, "epoch": 35, "lr": 9.933061686482909e-05} +{"train_loss": 0.020205659791827202, "global_step": 4197, "epoch": 35, "lr": 9.933025550423412e-05} +{"train_loss": 0.020525390282273293, "global_step": 4198, "epoch": 35, "lr": 9.932989404678445e-05} +{"train_loss": 0.021052677184343338, "global_step": 4199, "epoch": 35, "lr": 9.932953249248081e-05} +{"train_loss": 0.02241435833275318, "global_step": 4200, "epoch": 35, "lr": 9.932917084132391e-05} +{"train_loss": 0.012423532083630562, "global_step": 4201, "epoch": 35, "lr": 9.932880909331445e-05} +{"train_loss": 0.01721321977674961, "global_step": 4202, "epoch": 35, "lr": 9.932844724845314e-05} +{"train_loss": 0.02190283127129078, "global_step": 4203, "epoch": 35, "lr": 9.93280853067407e-05} +{"train_loss": 0.022471774369478226, "global_step": 4204, "epoch": 35, "lr": 9.932772326817783e-05} +{"train_loss": 0.023836098611354828, "global_step": 4205, "epoch": 35, "lr": 9.932736113276525e-05} +{"train_loss": 0.01787964254617691, "global_step": 4206, "epoch": 35, "lr": 9.932699890050367e-05} +{"train_loss": 0.018814275041222572, "global_step": 4207, "epoch": 35, "lr": 9.932663657139379e-05} +{"train_loss": 0.021320955827832222, "global_step": 4208, "epoch": 35, "lr": 9.932627414543631e-05} +{"train_loss": 0.020722314715385437, "global_step": 4209, "epoch": 35, "lr": 9.932591162263199e-05} +{"train_loss": 0.016424506902694702, "global_step": 4210, "epoch": 35, "lr": 9.93255490029815e-05} +{"train_loss": 0.020685797557234764, "global_step": 4211, "epoch": 35, "lr": 9.932518628648557e-05} +{"train_loss": 0.018883060663938522, "global_step": 4212, "epoch": 35, "lr": 9.93248234731449e-05} +{"train_loss": 0.01418511662632227, "global_step": 4213, "epoch": 35, "lr": 9.93244605629602e-05} +{"train_loss": 0.022203024476766586, "global_step": 4214, "epoch": 35, "lr": 9.932409755593222e-05} +{"train_loss": 0.023623548448085785, "global_step": 4215, "epoch": 35, "lr": 9.932373445206163e-05} +{"train_loss": 0.014640421606600285, "global_step": 4216, "epoch": 35, "lr": 9.932337125134915e-05} +{"train_loss": 0.01947234943509102, "global_step": 4217, "epoch": 35, "lr": 9.93230079537955e-05} +{"train_loss": 0.016908664256334305, "global_step": 4218, "epoch": 35, "lr": 9.932264455940139e-05} +{"train_loss": 0.01979975961148739, "global_step": 4219, "epoch": 35, "lr": 9.932228106816754e-05} +{"train_loss": 0.014466915279626846, "global_step": 4220, "epoch": 35, "lr": 9.932191748009467e-05} +{"train_loss": 0.016260845586657524, "global_step": 4221, "epoch": 35, "lr": 9.932155379518349e-05} +{"train_loss": 0.017942991107702255, "global_step": 4222, "epoch": 35, "lr": 9.932119001343468e-05} +{"train_loss": 0.017623376101255417, "global_step": 4223, "epoch": 35, "lr": 9.932082613484901e-05} +{"train_loss": 0.018676389008760452, "global_step": 4224, "epoch": 35, "lr": 9.932046215942715e-05} +{"train_loss": 0.014030832797288895, "global_step": 4225, "epoch": 35, "lr": 9.932009808716985e-05} +{"train_loss": 0.017777394503355026, "global_step": 4226, "epoch": 35, "lr": 9.931973391807779e-05} +{"train_loss": 0.012602015398442745, "global_step": 4227, "epoch": 35, "lr": 9.931936965215169e-05} +{"train_loss": 0.020056385546922684, "global_step": 4228, "epoch": 35, "lr": 9.931900528939231e-05} +{"train_loss": 0.01505344733595848, "global_step": 4229, "epoch": 35, "lr": 9.93186408298003e-05} +{"train_loss": 0.018701935186982155, "global_step": 4230, "epoch": 35, "lr": 9.931827627337642e-05} +{"train_loss": 0.014133181422948837, "global_step": 4231, "epoch": 35, "lr": 9.931791162012139e-05} +{"train_loss": 0.015086645260453224, "global_step": 4232, "epoch": 35, "lr": 9.93175468700359e-05} +{"train_loss": 0.018653269857168198, "global_step": 4233, "epoch": 35, "lr": 9.931718202312065e-05} +{"train_loss": 0.01825389824807644, "global_step": 4234, "epoch": 35, "lr": 9.931681707937642e-05} +{"train_loss": 0.014490448869764805, "global_step": 4235, "epoch": 35, "lr": 9.931645203880386e-05} +{"train_loss": 0.017740193754434586, "global_step": 4236, "epoch": 35, "lr": 9.931608690140373e-05} +{"train_loss": 0.022999299690127373, "global_step": 4237, "epoch": 35, "lr": 9.931572166717674e-05} +{"train_loss": 0.017565393820405006, "global_step": 4238, "epoch": 35, "lr": 9.931535633612357e-05} +{"train_loss": 0.013569576665759087, "global_step": 4239, "epoch": 35, "lr": 9.931499090824499e-05} +{"train_loss": 0.01673409715294838, "global_step": 4240, "epoch": 35, "lr": 9.931462538354168e-05} +{"train_loss": 0.013718690723180771, "global_step": 4241, "epoch": 35, "lr": 9.931425976201438e-05} +{"train_loss": 0.01707642897963524, "global_step": 4242, "epoch": 35, "lr": 9.93138940436638e-05} +{"train_loss": 0.01747460663318634, "global_step": 4243, "epoch": 35, "lr": 9.931352822849065e-05} +{"train_loss": 0.011601035483181477, "global_step": 4244, "epoch": 35, "lr": 9.931316231649566e-05} +{"train_loss": 0.01447996310889721, "global_step": 4245, "epoch": 35, "lr": 9.931279630767956e-05} +{"train_loss": 0.018706945702433586, "global_step": 4246, "epoch": 35, "lr": 9.931243020204303e-05} +{"train_loss": 0.010529699735343456, "global_step": 4247, "epoch": 35, "lr": 9.931206399958681e-05} +{"train_loss": 0.012996428646147251, "global_step": 4248, "epoch": 35, "lr": 9.931169770031164e-05} +{"train_loss": 0.01649704948067665, "global_step": 4249, "epoch": 35, "lr": 9.931133130421822e-05} +{"train_loss": 0.017925765365362167, "global_step": 4250, "epoch": 35, "lr": 9.931096481130725e-05} +{"train_loss": 0.011109982617199421, "global_step": 4251, "epoch": 35, "lr": 9.931059822157947e-05} +{"train_loss": 0.021242721006274223, "global_step": 4252, "epoch": 35, "lr": 9.93102315350356e-05} +{"train_loss": 0.015721524134278297, "global_step": 4253, "epoch": 35, "lr": 9.930986475167637e-05} +{"train_loss": 0.01444966346025467, "global_step": 4254, "epoch": 35, "lr": 9.930949787150248e-05} +{"train_loss": 0.017452847212553024, "global_step": 4255, "epoch": 35, "lr": 9.930913089451466e-05} +{"train_loss": 0.018231788650155067, "global_step": 4256, "epoch": 35, "lr": 9.930876382071363e-05} +{"train_loss": 0.023985961452126503, "global_step": 4257, "epoch": 35, "lr": 9.930839665010013e-05} +{"train_loss": 0.02167925052344799, "global_step": 4258, "epoch": 35, "lr": 9.930802938267483e-05} +{"train_loss": 0.013492914848029613, "global_step": 4259, "epoch": 35, "lr": 9.930766201843851e-05} +{"train_loss": 0.018565906211733818, "global_step": 4260, "epoch": 35, "lr": 9.930729455739184e-05} +{"train_loss": 0.01754235289990902, "global_step": 4261, "epoch": 35, "lr": 9.930692699953557e-05} +{"train_loss": 0.014002900570631027, "global_step": 4262, "epoch": 35, "lr": 9.930655934487042e-05} +{"train_loss": 0.018385913223028183, "global_step": 4263, "epoch": 35, "lr": 9.930619159339711e-05} +{"train_loss": 0.013868078589439392, "global_step": 4264, "epoch": 35, "lr": 9.930582374511636e-05} +{"train_loss": 0.022797944024205208, "global_step": 4265, "epoch": 35, "lr": 9.930545580002888e-05} +{"train_loss": 0.011655997484922409, "global_step": 4266, "epoch": 35, "lr": 9.930508775813543e-05} +{"train_loss": 0.017599796876311302, "global_step": 4267, "epoch": 35, "lr": 9.930471961943668e-05} +{"train_loss": 0.015992801636457443, "global_step": 4268, "epoch": 35, "lr": 9.93043513839334e-05} +{"train_loss": 0.020957101136446, "global_step": 4269, "epoch": 35, "lr": 9.930398305162629e-05} +{"train_loss": 0.01963885873556137, "global_step": 4270, "epoch": 35, "lr": 9.930361462251607e-05} +{"train_loss": 0.01531602069735527, "global_step": 4271, "epoch": 35, "lr": 9.930324609660347e-05} +{"train_loss": 0.022345658391714096, "global_step": 4272, "epoch": 35, "lr": 9.930287747388922e-05} +{"train_loss": 0.015199706889688969, "global_step": 4273, "epoch": 35, "lr": 9.930250875437403e-05} +{"train_loss": 0.01655673235654831, "global_step": 4274, "epoch": 35, "lr": 9.930213993805864e-05} +{"train_loss": 0.020092733204364777, "global_step": 4275, "epoch": 35, "lr": 9.930177102494375e-05} +{"train_loss": 0.017821213230490685, "global_step": 4276, "epoch": 35, "lr": 9.930140201503013e-05} +{"train_loss": 0.013166953809559345, "global_step": 4277, "epoch": 35, "lr": 9.930103290831845e-05} +{"train_loss": 0.012569157406687737, "global_step": 4278, "epoch": 35, "lr": 9.930066370480946e-05} +{"train_loss": 0.015866024419665337, "global_step": 4279, "epoch": 35, "lr": 9.93002944045039e-05} +{"train_loss": 0.014367761090397835, "global_step": 4280, "epoch": 35, "lr": 9.929992500740246e-05} +{"train_loss": 0.014941513538360596, "global_step": 4281, "epoch": 35, "lr": 9.92995555135059e-05} +{"train_loss": 0.015807069838047028, "global_step": 4282, "epoch": 35, "lr": 9.92991859228149e-05} +{"train_loss": 0.017429742985600682, "global_step": 4283, "epoch": 35, "lr": 9.929881623533024e-05, "val_loss": 0.02045135572552681, "train_action_mse_error": 0.0014016530476510525} +{"train_loss": 0.02209480293095112, "global_step": 4284, "epoch": 36, "lr": 9.929844645105262e-05} +{"train_loss": 0.016789648681879044, "global_step": 4285, "epoch": 36, "lr": 9.929807656998277e-05} +{"train_loss": 0.01669246517121792, "global_step": 4286, "epoch": 36, "lr": 9.929770659212141e-05} +{"train_loss": 0.024386120960116386, "global_step": 4287, "epoch": 36, "lr": 9.929733651746927e-05} +{"train_loss": 0.015259452164173126, "global_step": 4288, "epoch": 36, "lr": 9.929696634602708e-05} +{"train_loss": 0.013147057965397835, "global_step": 4289, "epoch": 36, "lr": 9.929659607779555e-05} +{"train_loss": 0.01692887395620346, "global_step": 4290, "epoch": 36, "lr": 9.929622571277542e-05} +{"train_loss": 0.015394756570458412, "global_step": 4291, "epoch": 36, "lr": 9.929585525096744e-05} +{"train_loss": 0.01365652959793806, "global_step": 4292, "epoch": 36, "lr": 9.929548469237229e-05} +{"train_loss": 0.01915830932557583, "global_step": 4293, "epoch": 36, "lr": 9.929511403699074e-05} +{"train_loss": 0.019254140555858612, "global_step": 4294, "epoch": 36, "lr": 9.929474328482349e-05} +{"train_loss": 0.020487535744905472, "global_step": 4295, "epoch": 36, "lr": 9.929437243587128e-05} +{"train_loss": 0.01505235768854618, "global_step": 4296, "epoch": 36, "lr": 9.929400149013484e-05} +{"train_loss": 0.01764742285013199, "global_step": 4297, "epoch": 36, "lr": 9.929363044761489e-05} +{"train_loss": 0.013488687574863434, "global_step": 4298, "epoch": 36, "lr": 9.929325930831215e-05} +{"train_loss": 0.019823335111141205, "global_step": 4299, "epoch": 36, "lr": 9.929288807222738e-05} +{"train_loss": 0.01853366009891033, "global_step": 4300, "epoch": 36, "lr": 9.929251673936129e-05} +{"train_loss": 0.013418078422546387, "global_step": 4301, "epoch": 36, "lr": 9.92921453097146e-05} +{"train_loss": 0.02383512817323208, "global_step": 4302, "epoch": 36, "lr": 9.929177378328805e-05} +{"train_loss": 0.013538965955376625, "global_step": 4303, "epoch": 36, "lr": 9.929140216008237e-05} +{"train_loss": 0.016361985355615616, "global_step": 4304, "epoch": 36, "lr": 9.929103044009829e-05} +{"train_loss": 0.01771908812224865, "global_step": 4305, "epoch": 36, "lr": 9.929065862333653e-05} +{"train_loss": 0.021957237273454666, "global_step": 4306, "epoch": 36, "lr": 9.929028670979784e-05} +{"train_loss": 0.019314710050821304, "global_step": 4307, "epoch": 36, "lr": 9.928991469948294e-05} +{"train_loss": 0.0158910620957613, "global_step": 4308, "epoch": 36, "lr": 9.928954259239254e-05} +{"train_loss": 0.018955612555146217, "global_step": 4309, "epoch": 36, "lr": 9.92891703885274e-05} +{"train_loss": 0.023107998073101044, "global_step": 4310, "epoch": 36, "lr": 9.928879808788825e-05} +{"train_loss": 0.014367373660206795, "global_step": 4311, "epoch": 36, "lr": 9.928842569047579e-05} +{"train_loss": 0.014448394067585468, "global_step": 4312, "epoch": 36, "lr": 9.928805319629079e-05} +{"train_loss": 0.020445555448532104, "global_step": 4313, "epoch": 36, "lr": 9.928768060533396e-05} +{"train_loss": 0.020606381818652153, "global_step": 4314, "epoch": 36, "lr": 9.928730791760602e-05} +{"train_loss": 0.012519178912043571, "global_step": 4315, "epoch": 36, "lr": 9.928693513310773e-05} +{"train_loss": 0.02054314687848091, "global_step": 4316, "epoch": 36, "lr": 9.928656225183981e-05} +{"train_loss": 0.013914366252720356, "global_step": 4317, "epoch": 36, "lr": 9.928618927380298e-05} +{"train_loss": 0.021708564832806587, "global_step": 4318, "epoch": 36, "lr": 9.928581619899798e-05} +{"train_loss": 0.009411584585905075, "global_step": 4319, "epoch": 36, "lr": 9.928544302742555e-05} +{"train_loss": 0.02218247391283512, "global_step": 4320, "epoch": 36, "lr": 9.928506975908643e-05} +{"train_loss": 0.01956983655691147, "global_step": 4321, "epoch": 36, "lr": 9.928469639398133e-05} +{"train_loss": 0.014361188746988773, "global_step": 4322, "epoch": 36, "lr": 9.9284322932111e-05} +{"train_loss": 0.016459817066788673, "global_step": 4323, "epoch": 36, "lr": 9.928394937347616e-05} +{"train_loss": 0.018322881311178207, "global_step": 4324, "epoch": 36, "lr": 9.928357571807756e-05} +{"train_loss": 0.017140060663223267, "global_step": 4325, "epoch": 36, "lr": 9.928320196591592e-05} +{"train_loss": 0.015928778797388077, "global_step": 4326, "epoch": 36, "lr": 9.928282811699196e-05} +{"train_loss": 0.013255398720502853, "global_step": 4327, "epoch": 36, "lr": 9.928245417130645e-05} +{"train_loss": 0.01984752155840397, "global_step": 4328, "epoch": 36, "lr": 9.92820801288601e-05} +{"train_loss": 0.014515199698507786, "global_step": 4329, "epoch": 36, "lr": 9.928170598965367e-05} +{"train_loss": 0.0138486223295331, "global_step": 4330, "epoch": 36, "lr": 9.928133175368786e-05} +{"train_loss": 0.021407103165984154, "global_step": 4331, "epoch": 36, "lr": 9.928095742096342e-05} +{"train_loss": 0.017877347767353058, "global_step": 4332, "epoch": 36, "lr": 9.928058299148108e-05} +{"train_loss": 0.01772547885775566, "global_step": 4333, "epoch": 36, "lr": 9.92802084652416e-05} +{"train_loss": 0.015643926337361336, "global_step": 4334, "epoch": 36, "lr": 9.927983384224567e-05} +{"train_loss": 0.014993442222476006, "global_step": 4335, "epoch": 36, "lr": 9.927945912249406e-05} +{"train_loss": 0.014761887490749359, "global_step": 4336, "epoch": 36, "lr": 9.927908430598751e-05} +{"train_loss": 0.017432376742362976, "global_step": 4337, "epoch": 36, "lr": 9.927870939272674e-05} +{"train_loss": 0.016496047377586365, "global_step": 4338, "epoch": 36, "lr": 9.927833438271247e-05} +{"train_loss": 0.016462858766317368, "global_step": 4339, "epoch": 36, "lr": 9.927795927594547e-05} +{"train_loss": 0.01833166927099228, "global_step": 4340, "epoch": 36, "lr": 9.927758407242646e-05} +{"train_loss": 0.016301462426781654, "global_step": 4341, "epoch": 36, "lr": 9.927720877215616e-05} +{"train_loss": 0.012857687659561634, "global_step": 4342, "epoch": 36, "lr": 9.927683337513534e-05} +{"train_loss": 0.015101226046681404, "global_step": 4343, "epoch": 36, "lr": 9.927645788136473e-05} +{"train_loss": 0.018077310174703598, "global_step": 4344, "epoch": 36, "lr": 9.927608229084505e-05} +{"train_loss": 0.01889387145638466, "global_step": 4345, "epoch": 36, "lr": 9.927570660357706e-05} +{"train_loss": 0.01055933814495802, "global_step": 4346, "epoch": 36, "lr": 9.927533081956146e-05} +{"train_loss": 0.015383297577500343, "global_step": 4347, "epoch": 36, "lr": 9.927495493879904e-05} +{"train_loss": 0.027049470692873, "global_step": 4348, "epoch": 36, "lr": 9.927457896129049e-05} +{"train_loss": 0.0208729337900877, "global_step": 4349, "epoch": 36, "lr": 9.927420288703657e-05} +{"train_loss": 0.020799150690436363, "global_step": 4350, "epoch": 36, "lr": 9.927382671603802e-05} +{"train_loss": 0.01652580499649048, "global_step": 4351, "epoch": 36, "lr": 9.927345044829558e-05} +{"train_loss": 0.019647737964987755, "global_step": 4352, "epoch": 36, "lr": 9.927307408380998e-05} +{"train_loss": 0.013180623762309551, "global_step": 4353, "epoch": 36, "lr": 9.927269762258196e-05} +{"train_loss": 0.015651563182473183, "global_step": 4354, "epoch": 36, "lr": 9.927232106461225e-05} +{"train_loss": 0.01632499322295189, "global_step": 4355, "epoch": 36, "lr": 9.927194440990165e-05} +{"train_loss": 0.016013972461223602, "global_step": 4356, "epoch": 36, "lr": 9.927156765845081e-05} +{"train_loss": 0.013781712390482426, "global_step": 4357, "epoch": 36, "lr": 9.92711908102605e-05} +{"train_loss": 0.022757282480597496, "global_step": 4358, "epoch": 36, "lr": 9.927081386533151e-05} +{"train_loss": 0.014642645604908466, "global_step": 4359, "epoch": 36, "lr": 9.927043682366451e-05} +{"train_loss": 0.018033139407634735, "global_step": 4360, "epoch": 36, "lr": 9.927005968526029e-05} +{"train_loss": 0.015607270412147045, "global_step": 4361, "epoch": 36, "lr": 9.926968245011956e-05} +{"train_loss": 0.009434748440980911, "global_step": 4362, "epoch": 36, "lr": 9.926930511824308e-05} +{"train_loss": 0.02184356190264225, "global_step": 4363, "epoch": 36, "lr": 9.926892768963157e-05} +{"train_loss": 0.014881078153848648, "global_step": 4364, "epoch": 36, "lr": 9.92685501642858e-05} +{"train_loss": 0.0165228471159935, "global_step": 4365, "epoch": 36, "lr": 9.926817254220649e-05} +{"train_loss": 0.021146606653928757, "global_step": 4366, "epoch": 36, "lr": 9.926779482339438e-05} +{"train_loss": 0.019594743847846985, "global_step": 4367, "epoch": 36, "lr": 9.926741700785023e-05} +{"train_loss": 0.01302836462855339, "global_step": 4368, "epoch": 36, "lr": 9.926703909557476e-05} +{"train_loss": 0.020064929500222206, "global_step": 4369, "epoch": 36, "lr": 9.926666108656873e-05} +{"train_loss": 0.018116770312190056, "global_step": 4370, "epoch": 36, "lr": 9.926628298083285e-05} +{"train_loss": 0.012702560983598232, "global_step": 4371, "epoch": 36, "lr": 9.926590477836792e-05} +{"train_loss": 0.014079057611525059, "global_step": 4372, "epoch": 36, "lr": 9.926552647917463e-05} +{"train_loss": 0.021385271102190018, "global_step": 4373, "epoch": 36, "lr": 9.926514808325374e-05} +{"train_loss": 0.014432787895202637, "global_step": 4374, "epoch": 36, "lr": 9.926476959060601e-05} +{"train_loss": 0.012251745909452438, "global_step": 4375, "epoch": 36, "lr": 9.926439100123216e-05} +{"train_loss": 0.019685858860611916, "global_step": 4376, "epoch": 36, "lr": 9.926401231513294e-05} +{"train_loss": 0.014078851789236069, "global_step": 4377, "epoch": 36, "lr": 9.92636335323091e-05} +{"train_loss": 0.014160717837512493, "global_step": 4378, "epoch": 36, "lr": 9.926325465276139e-05} +{"train_loss": 0.01812898740172386, "global_step": 4379, "epoch": 36, "lr": 9.92628756764905e-05} +{"train_loss": 0.026424022391438484, "global_step": 4380, "epoch": 36, "lr": 9.926249660349726e-05} +{"train_loss": 0.01843782514333725, "global_step": 4381, "epoch": 36, "lr": 9.926211743378236e-05} +{"train_loss": 0.012716061435639858, "global_step": 4382, "epoch": 36, "lr": 9.926173816734654e-05} +{"train_loss": 0.013969223946332932, "global_step": 4383, "epoch": 36, "lr": 9.926135880419058e-05} +{"train_loss": 0.015672970563173294, "global_step": 4384, "epoch": 36, "lr": 9.926097934431519e-05} +{"train_loss": 0.01360298041254282, "global_step": 4385, "epoch": 36, "lr": 9.926059978772113e-05} +{"train_loss": 0.016920235008001328, "global_step": 4386, "epoch": 36, "lr": 9.926022013440915e-05} +{"train_loss": 0.024333788082003593, "global_step": 4387, "epoch": 36, "lr": 9.925984038438e-05} +{"train_loss": 0.016407569870352745, "global_step": 4388, "epoch": 36, "lr": 9.92594605376344e-05} +{"train_loss": 0.019481008872389793, "global_step": 4389, "epoch": 36, "lr": 9.925908059417312e-05} +{"train_loss": 0.018687186762690544, "global_step": 4390, "epoch": 36, "lr": 9.92587005539969e-05} +{"train_loss": 0.025400476530194283, "global_step": 4391, "epoch": 36, "lr": 9.925832041710648e-05} +{"train_loss": 0.021499117836356163, "global_step": 4392, "epoch": 36, "lr": 9.925794018350261e-05} +{"train_loss": 0.020615888759493828, "global_step": 4393, "epoch": 36, "lr": 9.925755985318603e-05} +{"train_loss": 0.02159837819635868, "global_step": 4394, "epoch": 36, "lr": 9.925717942615751e-05} +{"train_loss": 0.013307911343872547, "global_step": 4395, "epoch": 36, "lr": 9.925679890241777e-05} +{"train_loss": 0.015662644058465958, "global_step": 4396, "epoch": 36, "lr": 9.925641828196756e-05} +{"train_loss": 0.019163204357028008, "global_step": 4397, "epoch": 36, "lr": 9.925603756480766e-05} +{"train_loss": 0.019562337547540665, "global_step": 4398, "epoch": 36, "lr": 9.925565675093877e-05} +{"train_loss": 0.01659460924565792, "global_step": 4399, "epoch": 36, "lr": 9.925527584036167e-05} +{"train_loss": 0.016909552738070488, "global_step": 4400, "epoch": 36, "lr": 9.92548948330771e-05} +{"train_loss": 0.01934691146016121, "global_step": 4401, "epoch": 36, "lr": 9.92545137290858e-05} +{"train_loss": 0.017361051082110203, "global_step": 4402, "epoch": 36, "lr": 9.925413252838853e-05, "val_loss": 0.027870459482073784} +{"train_loss": 0.015920108184218407, "global_step": 4403, "epoch": 37, "lr": 9.925375123098601e-05} +{"train_loss": 0.016025397926568985, "global_step": 4404, "epoch": 37, "lr": 9.925336983687904e-05} +{"train_loss": 0.017653916031122208, "global_step": 4405, "epoch": 37, "lr": 9.925298834606834e-05} +{"train_loss": 0.02595963142812252, "global_step": 4406, "epoch": 37, "lr": 9.925260675855463e-05} +{"train_loss": 0.015027208253741264, "global_step": 4407, "epoch": 37, "lr": 9.925222507433871e-05} +{"train_loss": 0.01404907088726759, "global_step": 4408, "epoch": 37, "lr": 9.925184329342132e-05} +{"train_loss": 0.020810944959521294, "global_step": 4409, "epoch": 37, "lr": 9.925146141580316e-05} +{"train_loss": 0.013553679920732975, "global_step": 4410, "epoch": 37, "lr": 9.925107944148506e-05} +{"train_loss": 0.01751633733510971, "global_step": 4411, "epoch": 37, "lr": 9.92506973704677e-05} +{"train_loss": 0.01813535764813423, "global_step": 4412, "epoch": 37, "lr": 9.925031520275188e-05} +{"train_loss": 0.018343620002269745, "global_step": 4413, "epoch": 37, "lr": 9.92499329383383e-05} +{"train_loss": 0.01603051833808422, "global_step": 4414, "epoch": 37, "lr": 9.924955057722776e-05} +{"train_loss": 0.017535319551825523, "global_step": 4415, "epoch": 37, "lr": 9.924916811942097e-05} +{"train_loss": 0.015367306768894196, "global_step": 4416, "epoch": 37, "lr": 9.924878556491871e-05} +{"train_loss": 0.018451564013957977, "global_step": 4417, "epoch": 37, "lr": 9.924840291372172e-05} +{"train_loss": 0.020000586286187172, "global_step": 4418, "epoch": 37, "lr": 9.924802016583075e-05} +{"train_loss": 0.01763727329671383, "global_step": 4419, "epoch": 37, "lr": 9.924763732124655e-05} +{"train_loss": 0.014448655769228935, "global_step": 4420, "epoch": 37, "lr": 9.92472543799699e-05} +{"train_loss": 0.01184671651571989, "global_step": 4421, "epoch": 37, "lr": 9.92468713420015e-05} +{"train_loss": 0.01576620526611805, "global_step": 4422, "epoch": 37, "lr": 9.924648820734215e-05} +{"train_loss": 0.018650228157639503, "global_step": 4423, "epoch": 37, "lr": 9.924610497599256e-05} +{"train_loss": 0.01414200197905302, "global_step": 4424, "epoch": 37, "lr": 9.924572164795351e-05} +{"train_loss": 0.011710398830473423, "global_step": 4425, "epoch": 37, "lr": 9.924533822322577e-05} +{"train_loss": 0.017504312098026276, "global_step": 4426, "epoch": 37, "lr": 9.924495470181004e-05} +{"train_loss": 0.016960371285676956, "global_step": 4427, "epoch": 37, "lr": 9.924457108370711e-05} +{"train_loss": 0.022914452478289604, "global_step": 4428, "epoch": 37, "lr": 9.924418736891774e-05} +{"train_loss": 0.016293831169605255, "global_step": 4429, "epoch": 37, "lr": 9.924380355744264e-05} +{"train_loss": 0.01324089989066124, "global_step": 4430, "epoch": 37, "lr": 9.924341964928263e-05} +{"train_loss": 0.01537652499973774, "global_step": 4431, "epoch": 37, "lr": 9.92430356444384e-05} +{"train_loss": 0.016760477796196938, "global_step": 4432, "epoch": 37, "lr": 9.924265154291075e-05} +{"train_loss": 0.011314276605844498, "global_step": 4433, "epoch": 37, "lr": 9.92422673447004e-05} +{"train_loss": 0.01378634199500084, "global_step": 4434, "epoch": 37, "lr": 9.924188304980812e-05} +{"train_loss": 0.013843327760696411, "global_step": 4435, "epoch": 37, "lr": 9.924149865823467e-05} +{"train_loss": 0.018088124692440033, "global_step": 4436, "epoch": 37, "lr": 9.924111416998078e-05} +{"train_loss": 0.019969290122389793, "global_step": 4437, "epoch": 37, "lr": 9.924072958504725e-05} +{"train_loss": 0.01474605780094862, "global_step": 4438, "epoch": 37, "lr": 9.924034490343478e-05} +{"train_loss": 0.016625938937067986, "global_step": 4439, "epoch": 37, "lr": 9.923996012514416e-05} +{"train_loss": 0.019927984103560448, "global_step": 4440, "epoch": 37, "lr": 9.923957525017615e-05} +{"train_loss": 0.015608507208526134, "global_step": 4441, "epoch": 37, "lr": 9.923919027853149e-05} +{"train_loss": 0.01332162693142891, "global_step": 4442, "epoch": 37, "lr": 9.923880521021094e-05} +{"train_loss": 0.018741915002465248, "global_step": 4443, "epoch": 37, "lr": 9.923842004521526e-05} +{"train_loss": 0.019649464637041092, "global_step": 4444, "epoch": 37, "lr": 9.92380347835452e-05} +{"train_loss": 0.012825331650674343, "global_step": 4445, "epoch": 37, "lr": 9.923764942520152e-05} +{"train_loss": 0.01647249609231949, "global_step": 4446, "epoch": 37, "lr": 9.923726397018498e-05} +{"train_loss": 0.013524720445275307, "global_step": 4447, "epoch": 37, "lr": 9.923687841849632e-05} +{"train_loss": 0.015265977010130882, "global_step": 4448, "epoch": 37, "lr": 9.923649277013631e-05} +{"train_loss": 0.010992110706865788, "global_step": 4449, "epoch": 37, "lr": 9.923610702510572e-05} +{"train_loss": 0.021265769377350807, "global_step": 4450, "epoch": 37, "lr": 9.923572118340528e-05} +{"train_loss": 0.019253313541412354, "global_step": 4451, "epoch": 37, "lr": 9.923533524503576e-05} +{"train_loss": 0.018303655087947845, "global_step": 4452, "epoch": 37, "lr": 9.923494920999793e-05} +{"train_loss": 0.011603744700551033, "global_step": 4453, "epoch": 37, "lr": 9.923456307829254e-05} +{"train_loss": 0.014525056816637516, "global_step": 4454, "epoch": 37, "lr": 9.923417684992033e-05} +{"train_loss": 0.018408674746751785, "global_step": 4455, "epoch": 37, "lr": 9.923379052488209e-05} +{"train_loss": 0.01936197653412819, "global_step": 4456, "epoch": 37, "lr": 9.923340410317856e-05} +{"train_loss": 0.021022729575634003, "global_step": 4457, "epoch": 37, "lr": 9.92330175848105e-05} +{"train_loss": 0.016799114644527435, "global_step": 4458, "epoch": 37, "lr": 9.923263096977866e-05} +{"train_loss": 0.014456219971179962, "global_step": 4459, "epoch": 37, "lr": 9.923224425808381e-05} +{"train_loss": 0.019932812079787254, "global_step": 4460, "epoch": 37, "lr": 9.923185744972671e-05} +{"train_loss": 0.012579789385199547, "global_step": 4461, "epoch": 37, "lr": 9.923147054470814e-05} +{"train_loss": 0.015701761469244957, "global_step": 4462, "epoch": 37, "lr": 9.923108354302882e-05} +{"train_loss": 0.02316197007894516, "global_step": 4463, "epoch": 37, "lr": 9.923069644468951e-05} +{"train_loss": 0.014307710342109203, "global_step": 4464, "epoch": 37, "lr": 9.923030924969101e-05} +{"train_loss": 0.015563244000077248, "global_step": 4465, "epoch": 37, "lr": 9.922992195803404e-05} +{"train_loss": 0.017419788986444473, "global_step": 4466, "epoch": 37, "lr": 9.922953456971939e-05} +{"train_loss": 0.023269496858119965, "global_step": 4467, "epoch": 37, "lr": 9.92291470847478e-05} +{"train_loss": 0.011910850182175636, "global_step": 4468, "epoch": 37, "lr": 9.922875950312006e-05} +{"train_loss": 0.014633079059422016, "global_step": 4469, "epoch": 37, "lr": 9.922837182483689e-05} +{"train_loss": 0.021489324048161507, "global_step": 4470, "epoch": 37, "lr": 9.922798404989907e-05} +{"train_loss": 0.017252493649721146, "global_step": 4471, "epoch": 37, "lr": 9.922759617830737e-05} +{"train_loss": 0.018470022827386856, "global_step": 4472, "epoch": 37, "lr": 9.922720821006254e-05} +{"train_loss": 0.019391506910324097, "global_step": 4473, "epoch": 37, "lr": 9.922682014516535e-05} +{"train_loss": 0.011907055042684078, "global_step": 4474, "epoch": 37, "lr": 9.922643198361655e-05} +{"train_loss": 0.018002144992351532, "global_step": 4475, "epoch": 37, "lr": 9.922604372541691e-05} +{"train_loss": 0.01778898574411869, "global_step": 4476, "epoch": 37, "lr": 9.922565537056721e-05} +{"train_loss": 0.014383489266037941, "global_step": 4477, "epoch": 37, "lr": 9.922526691906817e-05} +{"train_loss": 0.019726587459445, "global_step": 4478, "epoch": 37, "lr": 9.92248783709206e-05} +{"train_loss": 0.013676841743290424, "global_step": 4479, "epoch": 37, "lr": 9.922448972612524e-05} +{"train_loss": 0.012255514971911907, "global_step": 4480, "epoch": 37, "lr": 9.922410098468284e-05} +{"train_loss": 0.018413996323943138, "global_step": 4481, "epoch": 37, "lr": 9.922371214659417e-05} +{"train_loss": 0.013085483573377132, "global_step": 4482, "epoch": 37, "lr": 9.922332321186001e-05} +{"train_loss": 0.018521901220083237, "global_step": 4483, "epoch": 37, "lr": 9.922293418048112e-05} +{"train_loss": 0.02177104540169239, "global_step": 4484, "epoch": 37, "lr": 9.922254505245825e-05} +{"train_loss": 0.016673840582370758, "global_step": 4485, "epoch": 37, "lr": 9.922215582779218e-05} +{"train_loss": 0.02512313239276409, "global_step": 4486, "epoch": 37, "lr": 9.922176650648366e-05} +{"train_loss": 0.021853316575288773, "global_step": 4487, "epoch": 37, "lr": 9.922137708853344e-05} +{"train_loss": 0.016390884295105934, "global_step": 4488, "epoch": 37, "lr": 9.922098757394233e-05} +{"train_loss": 0.01969827152788639, "global_step": 4489, "epoch": 37, "lr": 9.922059796271106e-05} +{"train_loss": 0.018193837255239487, "global_step": 4490, "epoch": 37, "lr": 9.922020825484039e-05} +{"train_loss": 0.017464449629187584, "global_step": 4491, "epoch": 37, "lr": 9.921981845033112e-05} +{"train_loss": 0.020136216655373573, "global_step": 4492, "epoch": 37, "lr": 9.9219428549184e-05} +{"train_loss": 0.021519558504223824, "global_step": 4493, "epoch": 37, "lr": 9.921903855139978e-05} +{"train_loss": 0.014856281690299511, "global_step": 4494, "epoch": 37, "lr": 9.921864845697923e-05} +{"train_loss": 0.014707310125231743, "global_step": 4495, "epoch": 37, "lr": 9.921825826592313e-05} +{"train_loss": 0.01877235621213913, "global_step": 4496, "epoch": 37, "lr": 9.921786797823225e-05} +{"train_loss": 0.01604856550693512, "global_step": 4497, "epoch": 37, "lr": 9.921747759390733e-05} +{"train_loss": 0.014748435467481613, "global_step": 4498, "epoch": 37, "lr": 9.921708711294915e-05} +{"train_loss": 0.019746994599699974, "global_step": 4499, "epoch": 37, "lr": 9.921669653535848e-05} +{"train_loss": 0.019856266677379608, "global_step": 4500, "epoch": 37, "lr": 9.921630586113608e-05} +{"train_loss": 0.014409807510674, "global_step": 4501, "epoch": 37, "lr": 9.921591509028272e-05} +{"train_loss": 0.01896287314593792, "global_step": 4502, "epoch": 37, "lr": 9.921552422279918e-05} +{"train_loss": 0.017133643850684166, "global_step": 4503, "epoch": 37, "lr": 9.921513325868621e-05} +{"train_loss": 0.02332206815481186, "global_step": 4504, "epoch": 37, "lr": 9.921474219794457e-05} +{"train_loss": 0.013888256624341011, "global_step": 4505, "epoch": 37, "lr": 9.921435104057507e-05} +{"train_loss": 0.011968771927058697, "global_step": 4506, "epoch": 37, "lr": 9.921395978657843e-05} +{"train_loss": 0.01483799796551466, "global_step": 4507, "epoch": 37, "lr": 9.921356843595545e-05} +{"train_loss": 0.020807679742574692, "global_step": 4508, "epoch": 37, "lr": 9.921317698870688e-05} +{"train_loss": 0.01850481890141964, "global_step": 4509, "epoch": 37, "lr": 9.921278544483349e-05} +{"train_loss": 0.015251453965902328, "global_step": 4510, "epoch": 37, "lr": 9.921239380433606e-05} +{"train_loss": 0.020544013008475304, "global_step": 4511, "epoch": 37, "lr": 9.921200206721535e-05} +{"train_loss": 0.015132587403059006, "global_step": 4512, "epoch": 37, "lr": 9.921161023347213e-05} +{"train_loss": 0.015642074868083, "global_step": 4513, "epoch": 37, "lr": 9.921121830310717e-05} +{"train_loss": 0.024296458810567856, "global_step": 4514, "epoch": 37, "lr": 9.921082627612123e-05} +{"train_loss": 0.011832740157842636, "global_step": 4515, "epoch": 37, "lr": 9.921043415251512e-05} +{"train_loss": 0.013264534994959831, "global_step": 4516, "epoch": 37, "lr": 9.921004193228956e-05} +{"train_loss": 0.014727235771715641, "global_step": 4517, "epoch": 37, "lr": 9.920964961544534e-05} +{"train_loss": 0.011711390689015388, "global_step": 4518, "epoch": 37, "lr": 9.920925720198323e-05} +{"train_loss": 0.022029003128409386, "global_step": 4519, "epoch": 37, "lr": 9.9208864691904e-05} +{"train_loss": 0.02444167248904705, "global_step": 4520, "epoch": 37, "lr": 9.920847208520843e-05} +{"train_loss": 0.017006529299464047, "global_step": 4521, "epoch": 37, "lr": 9.920807938189727e-05, "val_loss": 0.02169877104461193} +{"train_loss": 0.01774834655225277, "global_step": 4522, "epoch": 38, "lr": 9.92076865819713e-05} +{"train_loss": 0.01168275810778141, "global_step": 4523, "epoch": 38, "lr": 9.920729368543131e-05} +{"train_loss": 0.018481289967894554, "global_step": 4524, "epoch": 38, "lr": 9.920690069227804e-05} +{"train_loss": 0.019753403961658478, "global_step": 4525, "epoch": 38, "lr": 9.92065076025123e-05} +{"train_loss": 0.019672507420182228, "global_step": 4526, "epoch": 38, "lr": 9.920611441613484e-05} +{"train_loss": 0.01486913301050663, "global_step": 4527, "epoch": 38, "lr": 9.920572113314641e-05} +{"train_loss": 0.015501533634960651, "global_step": 4528, "epoch": 38, "lr": 9.920532775354781e-05} +{"train_loss": 0.020593935623764992, "global_step": 4529, "epoch": 38, "lr": 9.920493427733981e-05} +{"train_loss": 0.02818613499403, "global_step": 4530, "epoch": 38, "lr": 9.920454070452317e-05} +{"train_loss": 0.015577883459627628, "global_step": 4531, "epoch": 38, "lr": 9.920414703509868e-05} +{"train_loss": 0.01568959653377533, "global_step": 4532, "epoch": 38, "lr": 9.92037532690671e-05} +{"train_loss": 0.01960708200931549, "global_step": 4533, "epoch": 38, "lr": 9.92033594064292e-05} +{"train_loss": 0.023976054042577744, "global_step": 4534, "epoch": 38, "lr": 9.920296544718577e-05} +{"train_loss": 0.020703522488474846, "global_step": 4535, "epoch": 38, "lr": 9.920257139133757e-05} +{"train_loss": 0.01610325090587139, "global_step": 4536, "epoch": 38, "lr": 9.920217723888538e-05} +{"train_loss": 0.026557454839348793, "global_step": 4537, "epoch": 38, "lr": 9.920178298982997e-05} +{"train_loss": 0.019589193165302277, "global_step": 4538, "epoch": 38, "lr": 9.920138864417212e-05} +{"train_loss": 0.013243784196674824, "global_step": 4539, "epoch": 38, "lr": 9.92009942019126e-05} +{"train_loss": 0.015536430291831493, "global_step": 4540, "epoch": 38, "lr": 9.920059966305218e-05} +{"train_loss": 0.01992287114262581, "global_step": 4541, "epoch": 38, "lr": 9.920020502759164e-05} +{"train_loss": 0.017973676323890686, "global_step": 4542, "epoch": 38, "lr": 9.919981029553175e-05} +{"train_loss": 0.017328042536973953, "global_step": 4543, "epoch": 38, "lr": 9.919941546687329e-05} +{"train_loss": 0.024305330589413643, "global_step": 4544, "epoch": 38, "lr": 9.919902054161704e-05} +{"train_loss": 0.018113870173692703, "global_step": 4545, "epoch": 38, "lr": 9.919862551976376e-05} +{"train_loss": 0.018628716468811035, "global_step": 4546, "epoch": 38, "lr": 9.919823040131425e-05} +{"train_loss": 0.02296489104628563, "global_step": 4547, "epoch": 38, "lr": 9.919783518626924e-05} +{"train_loss": 0.021828465163707733, "global_step": 4548, "epoch": 38, "lr": 9.919743987462957e-05} +{"train_loss": 0.016429537907242775, "global_step": 4549, "epoch": 38, "lr": 9.919704446639597e-05} +{"train_loss": 0.016988836228847504, "global_step": 4550, "epoch": 38, "lr": 9.919664896156923e-05} +{"train_loss": 0.012154396623373032, "global_step": 4551, "epoch": 38, "lr": 9.919625336015012e-05} +{"train_loss": 0.015364136546850204, "global_step": 4552, "epoch": 38, "lr": 9.919585766213943e-05} +{"train_loss": 0.016664890572428703, "global_step": 4553, "epoch": 38, "lr": 9.919546186753792e-05} +{"train_loss": 0.014585310593247414, "global_step": 4554, "epoch": 38, "lr": 9.919506597634638e-05} +{"train_loss": 0.01427703071385622, "global_step": 4555, "epoch": 38, "lr": 9.919466998856559e-05} +{"train_loss": 0.0170887503772974, "global_step": 4556, "epoch": 38, "lr": 9.919427390419632e-05} +{"train_loss": 0.015537992119789124, "global_step": 4557, "epoch": 38, "lr": 9.919387772323934e-05} +{"train_loss": 0.025228412821888924, "global_step": 4558, "epoch": 38, "lr": 9.919348144569544e-05} +{"train_loss": 0.01666862517595291, "global_step": 4559, "epoch": 38, "lr": 9.919308507156542e-05} +{"train_loss": 0.013447646982967854, "global_step": 4560, "epoch": 38, "lr": 9.919268860085e-05} +{"train_loss": 0.02231050282716751, "global_step": 4561, "epoch": 38, "lr": 9.919229203355e-05} +{"train_loss": 0.019895559176802635, "global_step": 4562, "epoch": 38, "lr": 9.919189536966619e-05} +{"train_loss": 0.01225848775357008, "global_step": 4563, "epoch": 38, "lr": 9.919149860919936e-05} +{"train_loss": 0.018755992874503136, "global_step": 4564, "epoch": 38, "lr": 9.919110175215026e-05} +{"train_loss": 0.01646609976887703, "global_step": 4565, "epoch": 38, "lr": 9.919070479851971e-05} +{"train_loss": 0.012556055560708046, "global_step": 4566, "epoch": 38, "lr": 9.919030774830844e-05} +{"train_loss": 0.018789920955896378, "global_step": 4567, "epoch": 38, "lr": 9.918991060151727e-05} +{"train_loss": 0.014179416932165623, "global_step": 4568, "epoch": 38, "lr": 9.918951335814697e-05} +{"train_loss": 0.018097393214702606, "global_step": 4569, "epoch": 38, "lr": 9.91891160181983e-05} +{"train_loss": 0.0187841709703207, "global_step": 4570, "epoch": 38, "lr": 9.918871858167207e-05} +{"train_loss": 0.015372575260698795, "global_step": 4571, "epoch": 38, "lr": 9.918832104856904e-05} +{"train_loss": 0.020188113674521446, "global_step": 4572, "epoch": 38, "lr": 9.918792341889e-05} +{"train_loss": 0.013536393642425537, "global_step": 4573, "epoch": 38, "lr": 9.918752569263571e-05} +{"train_loss": 0.015225512906908989, "global_step": 4574, "epoch": 38, "lr": 9.9187127869807e-05} +{"train_loss": 0.013729169964790344, "global_step": 4575, "epoch": 38, "lr": 9.91867299504046e-05} +{"train_loss": 0.015461551025509834, "global_step": 4576, "epoch": 38, "lr": 9.91863319344293e-05} +{"train_loss": 0.014229219406843185, "global_step": 4577, "epoch": 38, "lr": 9.918593382188192e-05} +{"train_loss": 0.011331343092024326, "global_step": 4578, "epoch": 38, "lr": 9.91855356127632e-05} +{"train_loss": 0.011892781592905521, "global_step": 4579, "epoch": 38, "lr": 9.918513730707393e-05} +{"train_loss": 0.015734625980257988, "global_step": 4580, "epoch": 38, "lr": 9.91847389048149e-05} +{"train_loss": 0.013535628095269203, "global_step": 4581, "epoch": 38, "lr": 9.918434040598689e-05} +{"train_loss": 0.013917614705860615, "global_step": 4582, "epoch": 38, "lr": 9.91839418105907e-05} +{"train_loss": 0.014214801602065563, "global_step": 4583, "epoch": 38, "lr": 9.918354311862707e-05} +{"train_loss": 0.013629783876240253, "global_step": 4584, "epoch": 38, "lr": 9.918314433009681e-05} +{"train_loss": 0.01233517937362194, "global_step": 4585, "epoch": 38, "lr": 9.918274544500072e-05} +{"train_loss": 0.012594897300004959, "global_step": 4586, "epoch": 38, "lr": 9.918234646333954e-05} +{"train_loss": 0.016093533486127853, "global_step": 4587, "epoch": 38, "lr": 9.918194738511408e-05} +{"train_loss": 0.015669910237193108, "global_step": 4588, "epoch": 38, "lr": 9.918154821032514e-05} +{"train_loss": 0.01210702769458294, "global_step": 4589, "epoch": 38, "lr": 9.918114893897348e-05} +{"train_loss": 0.016355600208044052, "global_step": 4590, "epoch": 38, "lr": 9.918074957105987e-05} +{"train_loss": 0.011924322694540024, "global_step": 4591, "epoch": 38, "lr": 9.918035010658513e-05} +{"train_loss": 0.018220722675323486, "global_step": 4592, "epoch": 38, "lr": 9.917995054555002e-05} +{"train_loss": 0.011429991573095322, "global_step": 4593, "epoch": 38, "lr": 9.917955088795534e-05} +{"train_loss": 0.01383073441684246, "global_step": 4594, "epoch": 38, "lr": 9.917915113380185e-05} +{"train_loss": 0.01689934730529785, "global_step": 4595, "epoch": 38, "lr": 9.917875128309035e-05} +{"train_loss": 0.013992027379572392, "global_step": 4596, "epoch": 38, "lr": 9.917835133582163e-05} +{"train_loss": 0.011730192229151726, "global_step": 4597, "epoch": 38, "lr": 9.917795129199647e-05} +{"train_loss": 0.010264111682772636, "global_step": 4598, "epoch": 38, "lr": 9.917755115161567e-05} +{"train_loss": 0.012508037500083447, "global_step": 4599, "epoch": 38, "lr": 9.917715091467999e-05} +{"train_loss": 0.015230858698487282, "global_step": 4600, "epoch": 38, "lr": 9.917675058119023e-05} +{"train_loss": 0.01459437608718872, "global_step": 4601, "epoch": 38, "lr": 9.917635015114719e-05} +{"train_loss": 0.013759816065430641, "global_step": 4602, "epoch": 38, "lr": 9.917594962455163e-05} +{"train_loss": 0.013895092532038689, "global_step": 4603, "epoch": 38, "lr": 9.917554900140433e-05} +{"train_loss": 0.01378208864480257, "global_step": 4604, "epoch": 38, "lr": 9.917514828170611e-05} +{"train_loss": 0.014760160818696022, "global_step": 4605, "epoch": 38, "lr": 9.917474746545774e-05} +{"train_loss": 0.015393240377306938, "global_step": 4606, "epoch": 38, "lr": 9.917434655266e-05} +{"train_loss": 0.010852208361029625, "global_step": 4607, "epoch": 38, "lr": 9.917394554331368e-05} +{"train_loss": 0.015718229115009308, "global_step": 4608, "epoch": 38, "lr": 9.917354443741958e-05} +{"train_loss": 0.010394822806119919, "global_step": 4609, "epoch": 38, "lr": 9.917314323497848e-05} +{"train_loss": 0.012697641737759113, "global_step": 4610, "epoch": 38, "lr": 9.917274193599115e-05} +{"train_loss": 0.011977746151387691, "global_step": 4611, "epoch": 38, "lr": 9.917234054045841e-05} +{"train_loss": 0.016804005950689316, "global_step": 4612, "epoch": 38, "lr": 9.917193904838105e-05} +{"train_loss": 0.01345060020685196, "global_step": 4613, "epoch": 38, "lr": 9.91715374597598e-05} +{"train_loss": 0.010468533262610435, "global_step": 4614, "epoch": 38, "lr": 9.917113577459551e-05} +{"train_loss": 0.011838177219033241, "global_step": 4615, "epoch": 38, "lr": 9.917073399288897e-05} +{"train_loss": 0.013692141510546207, "global_step": 4616, "epoch": 38, "lr": 9.917033211464092e-05} +{"train_loss": 0.016806254163384438, "global_step": 4617, "epoch": 38, "lr": 9.916993013985218e-05} +{"train_loss": 0.010636168532073498, "global_step": 4618, "epoch": 38, "lr": 9.916952806852353e-05} +{"train_loss": 0.019475845620036125, "global_step": 4619, "epoch": 38, "lr": 9.916912590065578e-05} +{"train_loss": 0.014267743565142155, "global_step": 4620, "epoch": 38, "lr": 9.91687236362497e-05} +{"train_loss": 0.012119642458856106, "global_step": 4621, "epoch": 38, "lr": 9.916832127530608e-05} +{"train_loss": 0.013583436608314514, "global_step": 4622, "epoch": 38, "lr": 9.91679188178257e-05} +{"train_loss": 0.016324542462825775, "global_step": 4623, "epoch": 38, "lr": 9.916751626380938e-05} +{"train_loss": 0.013462645001709461, "global_step": 4624, "epoch": 38, "lr": 9.91671136132579e-05} +{"train_loss": 0.015472386963665485, "global_step": 4625, "epoch": 38, "lr": 9.916671086617204e-05} +{"train_loss": 0.012614612467586994, "global_step": 4626, "epoch": 38, "lr": 9.916630802255259e-05} +{"train_loss": 0.010071422904729843, "global_step": 4627, "epoch": 38, "lr": 9.916590508240036e-05} +{"train_loss": 0.017123565077781677, "global_step": 4628, "epoch": 38, "lr": 9.91655020457161e-05} +{"train_loss": 0.013375142589211464, "global_step": 4629, "epoch": 38, "lr": 9.916509891250066e-05} +{"train_loss": 0.01742110773921013, "global_step": 4630, "epoch": 38, "lr": 9.91646956827548e-05} +{"train_loss": 0.014714667573571205, "global_step": 4631, "epoch": 38, "lr": 9.916429235647928e-05} +{"train_loss": 0.01830216497182846, "global_step": 4632, "epoch": 38, "lr": 9.916388893367496e-05} +{"train_loss": 0.016214560717344284, "global_step": 4633, "epoch": 38, "lr": 9.916348541434258e-05} +{"train_loss": 0.013555670157074928, "global_step": 4634, "epoch": 38, "lr": 9.916308179848294e-05} +{"train_loss": 0.015596827492117882, "global_step": 4635, "epoch": 38, "lr": 9.916267808609686e-05} +{"train_loss": 0.016053736209869385, "global_step": 4636, "epoch": 38, "lr": 9.916227427718511e-05} +{"train_loss": 0.020734816789627075, "global_step": 4637, "epoch": 38, "lr": 9.916187037174848e-05} +{"train_loss": 0.017289837822318077, "global_step": 4638, "epoch": 38, "lr": 9.916146636978777e-05} +{"train_loss": 0.01799202896654606, "global_step": 4639, "epoch": 38, "lr": 9.916106227130378e-05} +{"train_loss": 0.015864714040976613, "global_step": 4640, "epoch": 38, "lr": 9.916065807629729e-05, "val_loss": 0.02327880822122097} +{"train_loss": 0.014799276366829872, "global_step": 4641, "epoch": 39, "lr": 9.91602537847691e-05} +{"train_loss": 0.019842490553855896, "global_step": 4642, "epoch": 39, "lr": 9.915984939672001e-05} +{"train_loss": 0.019342023879289627, "global_step": 4643, "epoch": 39, "lr": 9.915944491215079e-05} +{"train_loss": 0.016511375084519386, "global_step": 4644, "epoch": 39, "lr": 9.915904033106226e-05} +{"train_loss": 0.016998615115880966, "global_step": 4645, "epoch": 39, "lr": 9.915863565345522e-05} +{"train_loss": 0.019306831061840057, "global_step": 4646, "epoch": 39, "lr": 9.915823087933045e-05} +{"train_loss": 0.010428186506032944, "global_step": 4647, "epoch": 39, "lr": 9.915782600868872e-05} +{"train_loss": 0.017939135432243347, "global_step": 4648, "epoch": 39, "lr": 9.915742104153088e-05} +{"train_loss": 0.012670604512095451, "global_step": 4649, "epoch": 39, "lr": 9.915701597785768e-05} +{"train_loss": 0.01376822404563427, "global_step": 4650, "epoch": 39, "lr": 9.915661081766993e-05} +{"train_loss": 0.0161728672683239, "global_step": 4651, "epoch": 39, "lr": 9.915620556096843e-05} +{"train_loss": 0.010460708290338516, "global_step": 4652, "epoch": 39, "lr": 9.915580020775398e-05} +{"train_loss": 0.018012993037700653, "global_step": 4653, "epoch": 39, "lr": 9.915539475802735e-05} +{"train_loss": 0.013902941718697548, "global_step": 4654, "epoch": 39, "lr": 9.915498921178937e-05} +{"train_loss": 0.013697744347155094, "global_step": 4655, "epoch": 39, "lr": 9.915458356904082e-05} +{"train_loss": 0.010516067035496235, "global_step": 4656, "epoch": 39, "lr": 9.91541778297825e-05} +{"train_loss": 0.015094811096787453, "global_step": 4657, "epoch": 39, "lr": 9.915377199401517e-05} +{"train_loss": 0.009687259793281555, "global_step": 4658, "epoch": 39, "lr": 9.915336606173968e-05} +{"train_loss": 0.015691913664340973, "global_step": 4659, "epoch": 39, "lr": 9.915296003295682e-05} +{"train_loss": 0.01154540665447712, "global_step": 4660, "epoch": 39, "lr": 9.915255390766736e-05} +{"train_loss": 0.017631342634558678, "global_step": 4661, "epoch": 39, "lr": 9.915214768587212e-05} +{"train_loss": 0.015516767278313637, "global_step": 4662, "epoch": 39, "lr": 9.915174136757188e-05} +{"train_loss": 0.014561958611011505, "global_step": 4663, "epoch": 39, "lr": 9.915133495276747e-05} +{"train_loss": 0.01397630199790001, "global_step": 4664, "epoch": 39, "lr": 9.915092844145963e-05} +{"train_loss": 0.015482902526855469, "global_step": 4665, "epoch": 39, "lr": 9.91505218336492e-05} +{"train_loss": 0.02039244771003723, "global_step": 4666, "epoch": 39, "lr": 9.915011512933701e-05} +{"train_loss": 0.011859768070280552, "global_step": 4667, "epoch": 39, "lr": 9.914970832852379e-05} +{"train_loss": 0.01112310029566288, "global_step": 4668, "epoch": 39, "lr": 9.914930143121036e-05} +{"train_loss": 0.015511381439864635, "global_step": 4669, "epoch": 39, "lr": 9.914889443739754e-05} +{"train_loss": 0.01417210791260004, "global_step": 4670, "epoch": 39, "lr": 9.91484873470861e-05} +{"train_loss": 0.013551171869039536, "global_step": 4671, "epoch": 39, "lr": 9.914808016027687e-05} +{"train_loss": 0.016409553587436676, "global_step": 4672, "epoch": 39, "lr": 9.914767287697065e-05} +{"train_loss": 0.010732765309512615, "global_step": 4673, "epoch": 39, "lr": 9.91472654971682e-05} +{"train_loss": 0.012276948429644108, "global_step": 4674, "epoch": 39, "lr": 9.914685802087035e-05} +{"train_loss": 0.018155043944716454, "global_step": 4675, "epoch": 39, "lr": 9.914645044807792e-05} +{"train_loss": 0.011956336908042431, "global_step": 4676, "epoch": 39, "lr": 9.914604277879165e-05} +{"train_loss": 0.0135463522747159, "global_step": 4677, "epoch": 39, "lr": 9.914563501301239e-05} +{"train_loss": 0.010801177471876144, "global_step": 4678, "epoch": 39, "lr": 9.914522715074093e-05} +{"train_loss": 0.012883474119007587, "global_step": 4679, "epoch": 39, "lr": 9.914481919197807e-05} +{"train_loss": 0.014223478734493256, "global_step": 4680, "epoch": 39, "lr": 9.914441113672458e-05} +{"train_loss": 0.015917610377073288, "global_step": 4681, "epoch": 39, "lr": 9.914400298498132e-05} +{"train_loss": 0.01599392667412758, "global_step": 4682, "epoch": 39, "lr": 9.914359473674906e-05} +{"train_loss": 0.011197772808372974, "global_step": 4683, "epoch": 39, "lr": 9.914318639202858e-05} +{"train_loss": 0.013204594142735004, "global_step": 4684, "epoch": 39, "lr": 9.914277795082071e-05} +{"train_loss": 0.014246819540858269, "global_step": 4685, "epoch": 39, "lr": 9.914236941312626e-05} +{"train_loss": 0.012431162409484386, "global_step": 4686, "epoch": 39, "lr": 9.914196077894602e-05} +{"train_loss": 0.021156687289476395, "global_step": 4687, "epoch": 39, "lr": 9.914155204828078e-05} +{"train_loss": 0.012013515457510948, "global_step": 4688, "epoch": 39, "lr": 9.914114322113134e-05} +{"train_loss": 0.010963504202663898, "global_step": 4689, "epoch": 39, "lr": 9.914073429749853e-05} +{"train_loss": 0.01141061820089817, "global_step": 4690, "epoch": 39, "lr": 9.914032527738314e-05} +{"train_loss": 0.016223441809415817, "global_step": 4691, "epoch": 39, "lr": 9.913991616078598e-05} +{"train_loss": 0.01518489234149456, "global_step": 4692, "epoch": 39, "lr": 9.913950694770781e-05} +{"train_loss": 0.009046738967299461, "global_step": 4693, "epoch": 39, "lr": 9.91390976381495e-05} +{"train_loss": 0.014250796288251877, "global_step": 4694, "epoch": 39, "lr": 9.913868823211182e-05} +{"train_loss": 0.016670741140842438, "global_step": 4695, "epoch": 39, "lr": 9.913827872959556e-05} +{"train_loss": 0.020172318443655968, "global_step": 4696, "epoch": 39, "lr": 9.913786913060155e-05} +{"train_loss": 0.009881201200187206, "global_step": 4697, "epoch": 39, "lr": 9.913745943513057e-05} +{"train_loss": 0.01919085718691349, "global_step": 4698, "epoch": 39, "lr": 9.913704964318344e-05} +{"train_loss": 0.019818011671304703, "global_step": 4699, "epoch": 39, "lr": 9.913663975476097e-05} +{"train_loss": 0.016637077555060387, "global_step": 4700, "epoch": 39, "lr": 9.913622976986396e-05} +{"train_loss": 0.012340920977294445, "global_step": 4701, "epoch": 39, "lr": 9.913581968849322e-05} +{"train_loss": 0.018818408250808716, "global_step": 4702, "epoch": 39, "lr": 9.913540951064953e-05} +{"train_loss": 0.010250096209347248, "global_step": 4703, "epoch": 39, "lr": 9.913499923633371e-05} +{"train_loss": 0.015055414289236069, "global_step": 4704, "epoch": 39, "lr": 9.913458886554658e-05} +{"train_loss": 0.01760912872850895, "global_step": 4705, "epoch": 39, "lr": 9.913417839828893e-05} +{"train_loss": 0.015348049812018871, "global_step": 4706, "epoch": 39, "lr": 9.913376783456157e-05} +{"train_loss": 0.015614275820553303, "global_step": 4707, "epoch": 39, "lr": 9.913335717436532e-05} +{"train_loss": 0.01854952797293663, "global_step": 4708, "epoch": 39, "lr": 9.913294641770096e-05} +{"train_loss": 0.015435157343745232, "global_step": 4709, "epoch": 39, "lr": 9.91325355645693e-05} +{"train_loss": 0.017265787348151207, "global_step": 4710, "epoch": 39, "lr": 9.913212461497117e-05} +{"train_loss": 0.017117535695433617, "global_step": 4711, "epoch": 39, "lr": 9.913171356890736e-05} +{"train_loss": 0.010564659722149372, "global_step": 4712, "epoch": 39, "lr": 9.913130242637867e-05} +{"train_loss": 0.01586596854031086, "global_step": 4713, "epoch": 39, "lr": 9.913089118738593e-05} +{"train_loss": 0.02118251658976078, "global_step": 4714, "epoch": 39, "lr": 9.913047985192991e-05} +{"train_loss": 0.010951651260256767, "global_step": 4715, "epoch": 39, "lr": 9.913006842001147e-05} +{"train_loss": 0.01769610308110714, "global_step": 4716, "epoch": 39, "lr": 9.912965689163137e-05} +{"train_loss": 0.013128445483744144, "global_step": 4717, "epoch": 39, "lr": 9.912924526679044e-05} +{"train_loss": 0.016111042350530624, "global_step": 4718, "epoch": 39, "lr": 9.91288335454895e-05} +{"train_loss": 0.020808249711990356, "global_step": 4719, "epoch": 39, "lr": 9.912842172772933e-05} +{"train_loss": 0.012098783627152443, "global_step": 4720, "epoch": 39, "lr": 9.912800981351075e-05} +{"train_loss": 0.018633315339684486, "global_step": 4721, "epoch": 39, "lr": 9.912759780283458e-05} +{"train_loss": 0.013894269242882729, "global_step": 4722, "epoch": 39, "lr": 9.912718569570163e-05} +{"train_loss": 0.009396597743034363, "global_step": 4723, "epoch": 39, "lr": 9.912677349211269e-05} +{"train_loss": 0.014928136020898819, "global_step": 4724, "epoch": 39, "lr": 9.912636119206858e-05} +{"train_loss": 0.011636155657470226, "global_step": 4725, "epoch": 39, "lr": 9.912594879557009e-05} +{"train_loss": 0.019003132358193398, "global_step": 4726, "epoch": 39, "lr": 9.912553630261808e-05} +{"train_loss": 0.015231117606163025, "global_step": 4727, "epoch": 39, "lr": 9.91251237132133e-05} +{"train_loss": 0.013896055519580841, "global_step": 4728, "epoch": 39, "lr": 9.912471102735659e-05} +{"train_loss": 0.01625269651412964, "global_step": 4729, "epoch": 39, "lr": 9.912429824504877e-05} +{"train_loss": 0.017688868567347527, "global_step": 4730, "epoch": 39, "lr": 9.912388536629064e-05} +{"train_loss": 0.011462931521236897, "global_step": 4731, "epoch": 39, "lr": 9.912347239108299e-05} +{"train_loss": 0.017616955563426018, "global_step": 4732, "epoch": 39, "lr": 9.912305931942667e-05} +{"train_loss": 0.022525804117321968, "global_step": 4733, "epoch": 39, "lr": 9.912264615132247e-05} +{"train_loss": 0.019938750192523003, "global_step": 4734, "epoch": 39, "lr": 9.912223288677119e-05} +{"train_loss": 0.019232086837291718, "global_step": 4735, "epoch": 39, "lr": 9.912181952577366e-05} +{"train_loss": 0.01451015193015337, "global_step": 4736, "epoch": 39, "lr": 9.91214060683307e-05} +{"train_loss": 0.015908023342490196, "global_step": 4737, "epoch": 39, "lr": 9.91209925144431e-05} +{"train_loss": 0.015451672486960888, "global_step": 4738, "epoch": 39, "lr": 9.912057886411166e-05} +{"train_loss": 0.012727420777082443, "global_step": 4739, "epoch": 39, "lr": 9.912016511733722e-05} +{"train_loss": 0.01707746647298336, "global_step": 4740, "epoch": 39, "lr": 9.911975127412059e-05} +{"train_loss": 0.015466214157640934, "global_step": 4741, "epoch": 39, "lr": 9.911933733446257e-05} +{"train_loss": 0.017443310469388962, "global_step": 4742, "epoch": 39, "lr": 9.911892329836399e-05} +{"train_loss": 0.012223182246088982, "global_step": 4743, "epoch": 39, "lr": 9.911850916582564e-05} +{"train_loss": 0.0150667205452919, "global_step": 4744, "epoch": 39, "lr": 9.911809493684834e-05} +{"train_loss": 0.016037248075008392, "global_step": 4745, "epoch": 39, "lr": 9.911768061143291e-05} +{"train_loss": 0.021034378558397293, "global_step": 4746, "epoch": 39, "lr": 9.911726618958018e-05} +{"train_loss": 0.01274487841874361, "global_step": 4747, "epoch": 39, "lr": 9.911685167129094e-05} +{"train_loss": 0.016492031514644623, "global_step": 4748, "epoch": 39, "lr": 9.911643705656599e-05} +{"train_loss": 0.01604500412940979, "global_step": 4749, "epoch": 39, "lr": 9.911602234540618e-05} +{"train_loss": 0.02024422027170658, "global_step": 4750, "epoch": 39, "lr": 9.911560753781231e-05} +{"train_loss": 0.018264111131429672, "global_step": 4751, "epoch": 39, "lr": 9.911519263378517e-05} +{"train_loss": 0.01370531041175127, "global_step": 4752, "epoch": 39, "lr": 9.911477763332561e-05} +{"train_loss": 0.014103559777140617, "global_step": 4753, "epoch": 39, "lr": 9.911436253643445e-05} +{"train_loss": 0.014046890661120415, "global_step": 4754, "epoch": 39, "lr": 9.911394734311246e-05} +{"train_loss": 0.013576810248196125, "global_step": 4755, "epoch": 39, "lr": 9.911353205336049e-05} +{"train_loss": 0.015763457864522934, "global_step": 4756, "epoch": 39, "lr": 9.911311666717935e-05} +{"train_loss": 0.01541669201105833, "global_step": 4757, "epoch": 39, "lr": 9.911270118456985e-05} +{"train_loss": 0.017970353364944458, "global_step": 4758, "epoch": 39, "lr": 9.91122856055328e-05} +{"train_loss": 0.015194357646738781, "global_step": 4759, "epoch": 39, "lr": 9.911186993006903e-05, "val_loss": 0.0236833319067955} +{"train_loss": 0.01621217280626297, "global_step": 4760, "epoch": 40, "lr": 9.911145415817935e-05} +{"train_loss": 0.009801343083381653, "global_step": 4761, "epoch": 40, "lr": 9.911103828986459e-05} +{"train_loss": 0.015695661306381226, "global_step": 4762, "epoch": 40, "lr": 9.911062232512553e-05} +{"train_loss": 0.01580752804875374, "global_step": 4763, "epoch": 40, "lr": 9.911020626396303e-05} +{"train_loss": 0.015754519030451775, "global_step": 4764, "epoch": 40, "lr": 9.910979010637787e-05} +{"train_loss": 0.010089165531098843, "global_step": 4765, "epoch": 40, "lr": 9.910937385237088e-05} +{"train_loss": 0.01934596337378025, "global_step": 4766, "epoch": 40, "lr": 9.910895750194291e-05} +{"train_loss": 0.01424870453774929, "global_step": 4767, "epoch": 40, "lr": 9.910854105509473e-05} +{"train_loss": 0.019796589389443398, "global_step": 4768, "epoch": 40, "lr": 9.910812451182717e-05} +{"train_loss": 0.01673588715493679, "global_step": 4769, "epoch": 40, "lr": 9.910770787214107e-05} +{"train_loss": 0.01437988318502903, "global_step": 4770, "epoch": 40, "lr": 9.910729113603722e-05} +{"train_loss": 0.012835697270929813, "global_step": 4771, "epoch": 40, "lr": 9.910687430351645e-05} +{"train_loss": 0.01794959045946598, "global_step": 4772, "epoch": 40, "lr": 9.910645737457957e-05} +{"train_loss": 0.015659887343645096, "global_step": 4773, "epoch": 40, "lr": 9.910604034922744e-05} +{"train_loss": 0.020263085141777992, "global_step": 4774, "epoch": 40, "lr": 9.910562322746082e-05} +{"train_loss": 0.016875559464097023, "global_step": 4775, "epoch": 40, "lr": 9.910520600928055e-05} +{"train_loss": 0.015500007197260857, "global_step": 4776, "epoch": 40, "lr": 9.910478869468747e-05} +{"train_loss": 0.013724787160754204, "global_step": 4777, "epoch": 40, "lr": 9.910437128368238e-05} +{"train_loss": 0.009977933950722218, "global_step": 4778, "epoch": 40, "lr": 9.910395377626609e-05} +{"train_loss": 0.013249063864350319, "global_step": 4779, "epoch": 40, "lr": 9.910353617243944e-05} +{"train_loss": 0.017774013802409172, "global_step": 4780, "epoch": 40, "lr": 9.910311847220326e-05} +{"train_loss": 0.012816586531698704, "global_step": 4781, "epoch": 40, "lr": 9.910270067555833e-05} +{"train_loss": 0.013096030801534653, "global_step": 4782, "epoch": 40, "lr": 9.91022827825055e-05} +{"train_loss": 0.018058251589536667, "global_step": 4783, "epoch": 40, "lr": 9.910186479304559e-05} +{"train_loss": 0.011281165294349194, "global_step": 4784, "epoch": 40, "lr": 9.910144670717941e-05} +{"train_loss": 0.015969224274158478, "global_step": 4785, "epoch": 40, "lr": 9.910102852490779e-05} +{"train_loss": 0.013149122707545757, "global_step": 4786, "epoch": 40, "lr": 9.910061024623154e-05} +{"train_loss": 0.013995920307934284, "global_step": 4787, "epoch": 40, "lr": 9.910019187115149e-05} +{"train_loss": 0.013873194344341755, "global_step": 4788, "epoch": 40, "lr": 9.909977339966845e-05} +{"train_loss": 0.011766474694013596, "global_step": 4789, "epoch": 40, "lr": 9.909935483178325e-05} +{"train_loss": 0.014563473872840405, "global_step": 4790, "epoch": 40, "lr": 9.909893616749672e-05} +{"train_loss": 0.02009204961359501, "global_step": 4791, "epoch": 40, "lr": 9.909851740680969e-05} +{"train_loss": 0.010939639993011951, "global_step": 4792, "epoch": 40, "lr": 9.909809854972294e-05} +{"train_loss": 0.016820332035422325, "global_step": 4793, "epoch": 40, "lr": 9.909767959623732e-05} +{"train_loss": 0.01878664270043373, "global_step": 4794, "epoch": 40, "lr": 9.909726054635367e-05} +{"train_loss": 0.015217815525829792, "global_step": 4795, "epoch": 40, "lr": 9.909684140007279e-05} +{"train_loss": 0.017977217212319374, "global_step": 4796, "epoch": 40, "lr": 9.90964221573955e-05} +{"train_loss": 0.015593571588397026, "global_step": 4797, "epoch": 40, "lr": 9.909600281832263e-05} +{"train_loss": 0.02254127338528633, "global_step": 4798, "epoch": 40, "lr": 9.9095583382855e-05} +{"train_loss": 0.015857940539717674, "global_step": 4799, "epoch": 40, "lr": 9.909516385099345e-05} +{"train_loss": 0.019040195271372795, "global_step": 4800, "epoch": 40, "lr": 9.909474422273878e-05} +{"train_loss": 0.015260639600455761, "global_step": 4801, "epoch": 40, "lr": 9.909432449809185e-05} +{"train_loss": 0.011729518882930279, "global_step": 4802, "epoch": 40, "lr": 9.909390467705341e-05} +{"train_loss": 0.012144477106630802, "global_step": 4803, "epoch": 40, "lr": 9.909348475962436e-05} +{"train_loss": 0.014243364334106445, "global_step": 4804, "epoch": 40, "lr": 9.909306474580551e-05} +{"train_loss": 0.01963389478623867, "global_step": 4805, "epoch": 40, "lr": 9.909264463559766e-05} +{"train_loss": 0.01581004075706005, "global_step": 4806, "epoch": 40, "lr": 9.909222442900166e-05} +{"train_loss": 0.021960748359560966, "global_step": 4807, "epoch": 40, "lr": 9.909180412601831e-05} +{"train_loss": 0.015034845098853111, "global_step": 4808, "epoch": 40, "lr": 9.909138372664843e-05} +{"train_loss": 0.013808885589241982, "global_step": 4809, "epoch": 40, "lr": 9.909096323089289e-05} +{"train_loss": 0.010238038375973701, "global_step": 4810, "epoch": 40, "lr": 9.909054263875247e-05} +{"train_loss": 0.0130379069596529, "global_step": 4811, "epoch": 40, "lr": 9.909012195022802e-05} +{"train_loss": 0.020660346373915672, "global_step": 4812, "epoch": 40, "lr": 9.908970116532037e-05} +{"train_loss": 0.01600024849176407, "global_step": 4813, "epoch": 40, "lr": 9.908928028403033e-05} +{"train_loss": 0.018564939498901367, "global_step": 4814, "epoch": 40, "lr": 9.908885930635872e-05} +{"train_loss": 0.016055157408118248, "global_step": 4815, "epoch": 40, "lr": 9.90884382323064e-05} +{"train_loss": 0.015112238936126232, "global_step": 4816, "epoch": 40, "lr": 9.908801706187415e-05} +{"train_loss": 0.014063267037272453, "global_step": 4817, "epoch": 40, "lr": 9.908759579506284e-05} +{"train_loss": 0.018652819097042084, "global_step": 4818, "epoch": 40, "lr": 9.908717443187329e-05} +{"train_loss": 0.015180043876171112, "global_step": 4819, "epoch": 40, "lr": 9.90867529723063e-05} +{"train_loss": 0.021910328418016434, "global_step": 4820, "epoch": 40, "lr": 9.908633141636272e-05} +{"train_loss": 0.016609014943242073, "global_step": 4821, "epoch": 40, "lr": 9.908590976404337e-05} +{"train_loss": 0.011381256394088268, "global_step": 4822, "epoch": 40, "lr": 9.90854880153491e-05} +{"train_loss": 0.019085906445980072, "global_step": 4823, "epoch": 40, "lr": 9.908506617028068e-05} +{"train_loss": 0.011128260754048824, "global_step": 4824, "epoch": 40, "lr": 9.9084644228839e-05} +{"train_loss": 0.01642150990664959, "global_step": 4825, "epoch": 40, "lr": 9.908422219102487e-05} +{"train_loss": 0.013347385451197624, "global_step": 4826, "epoch": 40, "lr": 9.908380005683911e-05} +{"train_loss": 0.01662786491215229, "global_step": 4827, "epoch": 40, "lr": 9.908337782628254e-05} +{"train_loss": 0.016960706561803818, "global_step": 4828, "epoch": 40, "lr": 9.908295549935601e-05} +{"train_loss": 0.011112522333860397, "global_step": 4829, "epoch": 40, "lr": 9.908253307606034e-05} +{"train_loss": 0.015826314687728882, "global_step": 4830, "epoch": 40, "lr": 9.908211055639635e-05} +{"train_loss": 0.014077129773795605, "global_step": 4831, "epoch": 40, "lr": 9.90816879403649e-05} +{"train_loss": 0.01568502001464367, "global_step": 4832, "epoch": 40, "lr": 9.90812652279668e-05} +{"train_loss": 0.011634016409516335, "global_step": 4833, "epoch": 40, "lr": 9.908084241920286e-05} +{"train_loss": 0.01872175931930542, "global_step": 4834, "epoch": 40, "lr": 9.908041951407394e-05} +{"train_loss": 0.014138762839138508, "global_step": 4835, "epoch": 40, "lr": 9.907999651258086e-05} +{"train_loss": 0.017511337995529175, "global_step": 4836, "epoch": 40, "lr": 9.907957341472445e-05} +{"train_loss": 0.021152373403310776, "global_step": 4837, "epoch": 40, "lr": 9.907915022050554e-05} +{"train_loss": 0.017669010907411575, "global_step": 4838, "epoch": 40, "lr": 9.907872692992496e-05} +{"train_loss": 0.01888393424451351, "global_step": 4839, "epoch": 40, "lr": 9.907830354298354e-05} +{"train_loss": 0.012844578363001347, "global_step": 4840, "epoch": 40, "lr": 9.907788005968213e-05} +{"train_loss": 0.01420037541538477, "global_step": 4841, "epoch": 40, "lr": 9.907745648002152e-05} +{"train_loss": 0.017787238582968712, "global_step": 4842, "epoch": 40, "lr": 9.907703280400258e-05} +{"train_loss": 0.013772646896541119, "global_step": 4843, "epoch": 40, "lr": 9.907660903162614e-05} +{"train_loss": 0.02130080945789814, "global_step": 4844, "epoch": 40, "lr": 9.9076185162893e-05} +{"train_loss": 0.021112043410539627, "global_step": 4845, "epoch": 40, "lr": 9.907576119780404e-05} +{"train_loss": 0.009925773367285728, "global_step": 4846, "epoch": 40, "lr": 9.907533713636003e-05} +{"train_loss": 0.01691761240363121, "global_step": 4847, "epoch": 40, "lr": 9.907491297856187e-05} +{"train_loss": 0.02058349922299385, "global_step": 4848, "epoch": 40, "lr": 9.907448872441035e-05} +{"train_loss": 0.025561001151800156, "global_step": 4849, "epoch": 40, "lr": 9.907406437390632e-05} +{"train_loss": 0.017077069729566574, "global_step": 4850, "epoch": 40, "lr": 9.90736399270506e-05} +{"train_loss": 0.011902724392712116, "global_step": 4851, "epoch": 40, "lr": 9.907321538384404e-05} +{"train_loss": 0.016534212976694107, "global_step": 4852, "epoch": 40, "lr": 9.907279074428746e-05} +{"train_loss": 0.01592624932527542, "global_step": 4853, "epoch": 40, "lr": 9.907236600838169e-05} +{"train_loss": 0.021441062912344933, "global_step": 4854, "epoch": 40, "lr": 9.907194117612757e-05} +{"train_loss": 0.01676274836063385, "global_step": 4855, "epoch": 40, "lr": 9.907151624752596e-05} +{"train_loss": 0.01248810812830925, "global_step": 4856, "epoch": 40, "lr": 9.907109122257766e-05} +{"train_loss": 0.014148732647299767, "global_step": 4857, "epoch": 40, "lr": 9.907066610128349e-05} +{"train_loss": 0.017320483922958374, "global_step": 4858, "epoch": 40, "lr": 9.907024088364433e-05} +{"train_loss": 0.013324031606316566, "global_step": 4859, "epoch": 40, "lr": 9.9069815569661e-05} +{"train_loss": 0.015877123922109604, "global_step": 4860, "epoch": 40, "lr": 9.906939015933432e-05} +{"train_loss": 0.02089007943868637, "global_step": 4861, "epoch": 40, "lr": 9.906896465266513e-05} +{"train_loss": 0.014237921684980392, "global_step": 4862, "epoch": 40, "lr": 9.906853904965427e-05} +{"train_loss": 0.01573135331273079, "global_step": 4863, "epoch": 40, "lr": 9.90681133503026e-05} +{"train_loss": 0.015719469636678696, "global_step": 4864, "epoch": 40, "lr": 9.906768755461091e-05} +{"train_loss": 0.01878378354012966, "global_step": 4865, "epoch": 40, "lr": 9.906726166258006e-05} +{"train_loss": 0.012549717910587788, "global_step": 4866, "epoch": 40, "lr": 9.906683567421089e-05} +{"train_loss": 0.016044853255152702, "global_step": 4867, "epoch": 40, "lr": 9.906640958950422e-05} +{"train_loss": 0.017948083579540253, "global_step": 4868, "epoch": 40, "lr": 9.906598340846091e-05} +{"train_loss": 0.02178121544420719, "global_step": 4869, "epoch": 40, "lr": 9.906555713108176e-05} +{"train_loss": 0.013163996860384941, "global_step": 4870, "epoch": 40, "lr": 9.906513075736765e-05} +{"train_loss": 0.0166177861392498, "global_step": 4871, "epoch": 40, "lr": 9.90647042873194e-05} +{"train_loss": 0.016660140827298164, "global_step": 4872, "epoch": 40, "lr": 9.906427772093784e-05} +{"train_loss": 0.014506806619465351, "global_step": 4873, "epoch": 40, "lr": 9.906385105822381e-05} +{"train_loss": 0.016223832964897156, "global_step": 4874, "epoch": 40, "lr": 9.906342429917816e-05} +{"train_loss": 0.016755729913711548, "global_step": 4875, "epoch": 40, "lr": 9.90629974438017e-05} +{"train_loss": 0.02230164036154747, "global_step": 4876, "epoch": 40, "lr": 9.906257049209529e-05} +{"train_loss": 0.01524893008172512, "global_step": 4877, "epoch": 40, "lr": 9.906214344405978e-05} +{"train_loss": 0.01595842292798417, "global_step": 4878, "epoch": 40, "lr": 9.906171629969598e-05, "val_loss": 0.030263058841228485, "train_action_mse_error": 0.0008767992258071899} +{"train_loss": 0.015444117598235607, "global_step": 4879, "epoch": 41, "lr": 9.906128905900475e-05} +{"train_loss": 0.013562541455030441, "global_step": 4880, "epoch": 41, "lr": 9.906086172198692e-05} +{"train_loss": 0.02196488156914711, "global_step": 4881, "epoch": 41, "lr": 9.906043428864331e-05} +{"train_loss": 0.012909851036965847, "global_step": 4882, "epoch": 41, "lr": 9.90600067589748e-05} +{"train_loss": 0.016021301969885826, "global_step": 4883, "epoch": 41, "lr": 9.90595791329822e-05} +{"train_loss": 0.014580768533051014, "global_step": 4884, "epoch": 41, "lr": 9.905915141066635e-05} +{"train_loss": 0.015280396677553654, "global_step": 4885, "epoch": 41, "lr": 9.905872359202812e-05} +{"train_loss": 0.015154304914176464, "global_step": 4886, "epoch": 41, "lr": 9.90582956770683e-05} +{"train_loss": 0.013948582112789154, "global_step": 4887, "epoch": 41, "lr": 9.905786766578778e-05} +{"train_loss": 0.011652610264718533, "global_step": 4888, "epoch": 41, "lr": 9.905743955818737e-05} +{"train_loss": 0.015589216724038124, "global_step": 4889, "epoch": 41, "lr": 9.905701135426792e-05} +{"train_loss": 0.011931494809687138, "global_step": 4890, "epoch": 41, "lr": 9.905658305403026e-05} +{"train_loss": 0.013897704891860485, "global_step": 4891, "epoch": 41, "lr": 9.905615465747524e-05} +{"train_loss": 0.018506456166505814, "global_step": 4892, "epoch": 41, "lr": 9.905572616460373e-05} +{"train_loss": 0.014127025380730629, "global_step": 4893, "epoch": 41, "lr": 9.90552975754165e-05} +{"train_loss": 0.019052982330322266, "global_step": 4894, "epoch": 41, "lr": 9.905486888991446e-05} +{"train_loss": 0.012432186864316463, "global_step": 4895, "epoch": 41, "lr": 9.905444010809842e-05} +{"train_loss": 0.013729863800108433, "global_step": 4896, "epoch": 41, "lr": 9.905401122996923e-05} +{"train_loss": 0.011787878349423409, "global_step": 4897, "epoch": 41, "lr": 9.905358225552772e-05} +{"train_loss": 0.01176205463707447, "global_step": 4898, "epoch": 41, "lr": 9.905315318477475e-05} +{"train_loss": 0.01410539261996746, "global_step": 4899, "epoch": 41, "lr": 9.905272401771115e-05} +{"train_loss": 0.01894201710820198, "global_step": 4900, "epoch": 41, "lr": 9.905229475433777e-05} +{"train_loss": 0.021160386502742767, "global_step": 4901, "epoch": 41, "lr": 9.905186539465546e-05} +{"train_loss": 0.012371564283967018, "global_step": 4902, "epoch": 41, "lr": 9.905143593866503e-05} +{"train_loss": 0.018009811639785767, "global_step": 4903, "epoch": 41, "lr": 9.905100638636737e-05} +{"train_loss": 0.020375218242406845, "global_step": 4904, "epoch": 41, "lr": 9.90505767377633e-05} +{"train_loss": 0.014255326241254807, "global_step": 4905, "epoch": 41, "lr": 9.905014699285365e-05} +{"train_loss": 0.022768838331103325, "global_step": 4906, "epoch": 41, "lr": 9.904971715163927e-05} +{"train_loss": 0.016115255653858185, "global_step": 4907, "epoch": 41, "lr": 9.904928721412101e-05} +{"train_loss": 0.01599007286131382, "global_step": 4908, "epoch": 41, "lr": 9.904885718029973e-05} +{"train_loss": 0.011568835005164146, "global_step": 4909, "epoch": 41, "lr": 9.904842705017625e-05} +{"train_loss": 0.015322353690862656, "global_step": 4910, "epoch": 41, "lr": 9.904799682375142e-05} +{"train_loss": 0.01685597561299801, "global_step": 4911, "epoch": 41, "lr": 9.904756650102609e-05} +{"train_loss": 0.013980702497065067, "global_step": 4912, "epoch": 41, "lr": 9.904713608200111e-05} +{"train_loss": 0.018348632380366325, "global_step": 4913, "epoch": 41, "lr": 9.904670556667732e-05} +{"train_loss": 0.016335776075720787, "global_step": 4914, "epoch": 41, "lr": 9.904627495505556e-05} +{"train_loss": 0.010665546171367168, "global_step": 4915, "epoch": 41, "lr": 9.904584424713668e-05} +{"train_loss": 0.01893768459558487, "global_step": 4916, "epoch": 41, "lr": 9.904541344292151e-05} +{"train_loss": 0.02047649957239628, "global_step": 4917, "epoch": 41, "lr": 9.904498254241093e-05} +{"train_loss": 0.014585107564926147, "global_step": 4918, "epoch": 41, "lr": 9.904455154560576e-05} +{"train_loss": 0.01253525074571371, "global_step": 4919, "epoch": 41, "lr": 9.904412045250685e-05} +{"train_loss": 0.01708807609975338, "global_step": 4920, "epoch": 41, "lr": 9.904368926311504e-05} +{"train_loss": 0.012938138097524643, "global_step": 4921, "epoch": 41, "lr": 9.90432579774312e-05} +{"train_loss": 0.018089180812239647, "global_step": 4922, "epoch": 41, "lr": 9.904282659545616e-05} +{"train_loss": 0.013891080394387245, "global_step": 4923, "epoch": 41, "lr": 9.904239511719077e-05} +{"train_loss": 0.0162351056933403, "global_step": 4924, "epoch": 41, "lr": 9.904196354263587e-05} +{"train_loss": 0.013945827260613441, "global_step": 4925, "epoch": 41, "lr": 9.904153187179233e-05} +{"train_loss": 0.012168443761765957, "global_step": 4926, "epoch": 41, "lr": 9.904110010466097e-05} +{"train_loss": 0.012933095917105675, "global_step": 4927, "epoch": 41, "lr": 9.904066824124266e-05} +{"train_loss": 0.0174824558198452, "global_step": 4928, "epoch": 41, "lr": 9.904023628153821e-05} +{"train_loss": 0.021938344463706017, "global_step": 4929, "epoch": 41, "lr": 9.90398042255485e-05} +{"train_loss": 0.015420198440551758, "global_step": 4930, "epoch": 41, "lr": 9.90393720732744e-05} +{"train_loss": 0.012783383019268513, "global_step": 4931, "epoch": 41, "lr": 9.903893982471672e-05} +{"train_loss": 0.011835549958050251, "global_step": 4932, "epoch": 41, "lr": 9.903850747987631e-05} +{"train_loss": 0.01798832044005394, "global_step": 4933, "epoch": 41, "lr": 9.903807503875404e-05} +{"train_loss": 0.010344460606575012, "global_step": 4934, "epoch": 41, "lr": 9.903764250135074e-05} +{"train_loss": 0.013118686154484749, "global_step": 4935, "epoch": 41, "lr": 9.903720986766728e-05} +{"train_loss": 0.012425611726939678, "global_step": 4936, "epoch": 41, "lr": 9.90367771377045e-05} +{"train_loss": 0.01564241759479046, "global_step": 4937, "epoch": 41, "lr": 9.903634431146323e-05} +{"train_loss": 0.012783144600689411, "global_step": 4938, "epoch": 41, "lr": 9.903591138894435e-05} +{"train_loss": 0.0128799919039011, "global_step": 4939, "epoch": 41, "lr": 9.903547837014869e-05} +{"train_loss": 0.016409432515501976, "global_step": 4940, "epoch": 41, "lr": 9.90350452550771e-05} +{"train_loss": 0.012764290906488895, "global_step": 4941, "epoch": 41, "lr": 9.903461204373045e-05} +{"train_loss": 0.015762649476528168, "global_step": 4942, "epoch": 41, "lr": 9.903417873610957e-05} +{"train_loss": 0.012681666761636734, "global_step": 4943, "epoch": 41, "lr": 9.903374533221532e-05} +{"train_loss": 0.015060449950397015, "global_step": 4944, "epoch": 41, "lr": 9.903331183204856e-05} +{"train_loss": 0.01178482361137867, "global_step": 4945, "epoch": 41, "lr": 9.903287823561011e-05} +{"train_loss": 0.014886917546391487, "global_step": 4946, "epoch": 41, "lr": 9.903244454290086e-05} +{"train_loss": 0.015703493729233742, "global_step": 4947, "epoch": 41, "lr": 9.903201075392163e-05} +{"train_loss": 0.011986766941845417, "global_step": 4948, "epoch": 41, "lr": 9.903157686867331e-05} +{"train_loss": 0.0127669433131814, "global_step": 4949, "epoch": 41, "lr": 9.90311428871567e-05} +{"train_loss": 0.015147490426898003, "global_step": 4950, "epoch": 41, "lr": 9.903070880937268e-05} +{"train_loss": 0.011140813119709492, "global_step": 4951, "epoch": 41, "lr": 9.903027463532213e-05} +{"train_loss": 0.010583379305899143, "global_step": 4952, "epoch": 41, "lr": 9.902984036500584e-05} +{"train_loss": 0.011427406221628189, "global_step": 4953, "epoch": 41, "lr": 9.902940599842472e-05} +{"train_loss": 0.01804305426776409, "global_step": 4954, "epoch": 41, "lr": 9.90289715355796e-05} +{"train_loss": 0.013517488725483418, "global_step": 4955, "epoch": 41, "lr": 9.90285369764713e-05} +{"train_loss": 0.0115963164716959, "global_step": 4956, "epoch": 41, "lr": 9.902810232110073e-05} +{"train_loss": 0.012697710655629635, "global_step": 4957, "epoch": 41, "lr": 9.902766756946872e-05} +{"train_loss": 0.010311365127563477, "global_step": 4958, "epoch": 41, "lr": 9.902723272157613e-05} +{"train_loss": 0.012980998493731022, "global_step": 4959, "epoch": 41, "lr": 9.902679777742379e-05} +{"train_loss": 0.01826753094792366, "global_step": 4960, "epoch": 41, "lr": 9.902636273701258e-05} +{"train_loss": 0.016655832529067993, "global_step": 4961, "epoch": 41, "lr": 9.902592760034333e-05} +{"train_loss": 0.015505818650126457, "global_step": 4962, "epoch": 41, "lr": 9.902549236741693e-05} +{"train_loss": 0.01876811683177948, "global_step": 4963, "epoch": 41, "lr": 9.90250570382342e-05} +{"train_loss": 0.014331289567053318, "global_step": 4964, "epoch": 41, "lr": 9.9024621612796e-05} +{"train_loss": 0.019293611869215965, "global_step": 4965, "epoch": 41, "lr": 9.902418609110323e-05} +{"train_loss": 0.013171822763979435, "global_step": 4966, "epoch": 41, "lr": 9.902375047315666e-05} +{"train_loss": 0.01358499750494957, "global_step": 4967, "epoch": 41, "lr": 9.902331475895722e-05} +{"train_loss": 0.017377901822328568, "global_step": 4968, "epoch": 41, "lr": 9.902287894850574e-05} +{"train_loss": 0.014736322686076164, "global_step": 4969, "epoch": 41, "lr": 9.902244304180306e-05} +{"train_loss": 0.013295430690050125, "global_step": 4970, "epoch": 41, "lr": 9.902200703885007e-05} +{"train_loss": 0.019463393837213516, "global_step": 4971, "epoch": 41, "lr": 9.90215709396476e-05} +{"train_loss": 0.013051819056272507, "global_step": 4972, "epoch": 41, "lr": 9.90211347441965e-05} +{"train_loss": 0.017788676545023918, "global_step": 4973, "epoch": 41, "lr": 9.902069845249764e-05} +{"train_loss": 0.017338989302515984, "global_step": 4974, "epoch": 41, "lr": 9.902026206455189e-05} +{"train_loss": 0.020463109016418457, "global_step": 4975, "epoch": 41, "lr": 9.901982558036009e-05} +{"train_loss": 0.01755039393901825, "global_step": 4976, "epoch": 41, "lr": 9.901938899992309e-05} +{"train_loss": 0.012847189791500568, "global_step": 4977, "epoch": 41, "lr": 9.901895232324177e-05} +{"train_loss": 0.021183717995882034, "global_step": 4978, "epoch": 41, "lr": 9.901851555031696e-05} +{"train_loss": 0.01647537760436535, "global_step": 4979, "epoch": 41, "lr": 9.901807868114953e-05} +{"train_loss": 0.012343773618340492, "global_step": 4980, "epoch": 41, "lr": 9.901764171574035e-05} +{"train_loss": 0.01394694298505783, "global_step": 4981, "epoch": 41, "lr": 9.901720465409026e-05} +{"train_loss": 0.018313461914658546, "global_step": 4982, "epoch": 41, "lr": 9.901676749620013e-05} +{"train_loss": 0.01101064495742321, "global_step": 4983, "epoch": 41, "lr": 9.901633024207082e-05} +{"train_loss": 0.013162964954972267, "global_step": 4984, "epoch": 41, "lr": 9.901589289170316e-05} +{"train_loss": 0.018650438636541367, "global_step": 4985, "epoch": 41, "lr": 9.901545544509804e-05} +{"train_loss": 0.02163732796907425, "global_step": 4986, "epoch": 41, "lr": 9.901501790225634e-05} +{"train_loss": 0.018558314070105553, "global_step": 4987, "epoch": 41, "lr": 9.901458026317885e-05} +{"train_loss": 0.02214660495519638, "global_step": 4988, "epoch": 41, "lr": 9.901414252786649e-05} +{"train_loss": 0.014371158555150032, "global_step": 4989, "epoch": 41, "lr": 9.901370469632009e-05} +{"train_loss": 0.017025461420416832, "global_step": 4990, "epoch": 41, "lr": 9.901326676854051e-05} +{"train_loss": 0.017141280695796013, "global_step": 4991, "epoch": 41, "lr": 9.901282874452863e-05} +{"train_loss": 0.015787901356816292, "global_step": 4992, "epoch": 41, "lr": 9.901239062428528e-05} +{"train_loss": 0.014917011372745037, "global_step": 4993, "epoch": 41, "lr": 9.901195240781135e-05} +{"train_loss": 0.017889171838760376, "global_step": 4994, "epoch": 41, "lr": 9.901151409510769e-05} +{"train_loss": 0.015369733795523643, "global_step": 4995, "epoch": 41, "lr": 9.901107568617516e-05} +{"train_loss": 0.016734767705202103, "global_step": 4996, "epoch": 41, "lr": 9.901063718101462e-05} +{"train_loss": 0.015339152143970757, "global_step": 4997, "epoch": 41, "lr": 9.901019857962692e-05, "val_loss": 0.019614536315202713} +{"train_loss": 0.020512819290161133, "global_step": 4998, "epoch": 42, "lr": 9.900975988201293e-05} +{"train_loss": 0.019981496036052704, "global_step": 4999, "epoch": 42, "lr": 9.90093210881735e-05} +{"train_loss": 0.012108875438570976, "global_step": 5000, "epoch": 42, "lr": 9.900888219810954e-05} +{"train_loss": 0.016287801787257195, "global_step": 5001, "epoch": 42, "lr": 9.900844321182186e-05} +{"train_loss": 0.017048131674528122, "global_step": 5002, "epoch": 42, "lr": 9.900800412931133e-05} +{"train_loss": 0.015424149110913277, "global_step": 5003, "epoch": 42, "lr": 9.900756495057881e-05} +{"train_loss": 0.01556527242064476, "global_step": 5004, "epoch": 42, "lr": 9.90071256756252e-05} +{"train_loss": 0.01827351190149784, "global_step": 5005, "epoch": 42, "lr": 9.900668630445132e-05} +{"train_loss": 0.015161499381065369, "global_step": 5006, "epoch": 42, "lr": 9.900624683705803e-05} +{"train_loss": 0.01523342914879322, "global_step": 5007, "epoch": 42, "lr": 9.900580727344624e-05} +{"train_loss": 0.017848161980509758, "global_step": 5008, "epoch": 42, "lr": 9.900536761361676e-05} +{"train_loss": 0.017428908497095108, "global_step": 5009, "epoch": 42, "lr": 9.90049278575705e-05} +{"train_loss": 0.020818106830120087, "global_step": 5010, "epoch": 42, "lr": 9.900448800530829e-05} +{"train_loss": 0.01518442202359438, "global_step": 5011, "epoch": 42, "lr": 9.900404805683099e-05} +{"train_loss": 0.017483685165643692, "global_step": 5012, "epoch": 42, "lr": 9.900360801213948e-05} +{"train_loss": 0.009764309972524643, "global_step": 5013, "epoch": 42, "lr": 9.900316787123463e-05} +{"train_loss": 0.015793567523360252, "global_step": 5014, "epoch": 42, "lr": 9.900272763411729e-05} +{"train_loss": 0.01463385671377182, "global_step": 5015, "epoch": 42, "lr": 9.900228730078833e-05} +{"train_loss": 0.012269078753888607, "global_step": 5016, "epoch": 42, "lr": 9.900184687124862e-05} +{"train_loss": 0.02266726642847061, "global_step": 5017, "epoch": 42, "lr": 9.900140634549902e-05} +{"train_loss": 0.011555229313671589, "global_step": 5018, "epoch": 42, "lr": 9.900096572354037e-05} +{"train_loss": 0.02223796583712101, "global_step": 5019, "epoch": 42, "lr": 9.900052500537357e-05} +{"train_loss": 0.014547296799719334, "global_step": 5020, "epoch": 42, "lr": 9.900008419099949e-05} +{"train_loss": 0.021400712430477142, "global_step": 5021, "epoch": 42, "lr": 9.899964328041897e-05} +{"train_loss": 0.016104184091091156, "global_step": 5022, "epoch": 42, "lr": 9.899920227363288e-05} +{"train_loss": 0.014813319779932499, "global_step": 5023, "epoch": 42, "lr": 9.89987611706421e-05} +{"train_loss": 0.013305594213306904, "global_step": 5024, "epoch": 42, "lr": 9.899831997144748e-05} +{"train_loss": 0.012903247959911823, "global_step": 5025, "epoch": 42, "lr": 9.89978786760499e-05} +{"train_loss": 0.016667146235704422, "global_step": 5026, "epoch": 42, "lr": 9.899743728445021e-05} +{"train_loss": 0.01395419705659151, "global_step": 5027, "epoch": 42, "lr": 9.89969957966493e-05} +{"train_loss": 0.014026920311152935, "global_step": 5028, "epoch": 42, "lr": 9.899655421264802e-05} +{"train_loss": 0.015395648777484894, "global_step": 5029, "epoch": 42, "lr": 9.899611253244723e-05} +{"train_loss": 0.011764529161155224, "global_step": 5030, "epoch": 42, "lr": 9.899567075604782e-05} +{"train_loss": 0.015079514123499393, "global_step": 5031, "epoch": 42, "lr": 9.899522888345063e-05} +{"train_loss": 0.014743761159479618, "global_step": 5032, "epoch": 42, "lr": 9.899478691465656e-05} +{"train_loss": 0.01265482883900404, "global_step": 5033, "epoch": 42, "lr": 9.899434484966645e-05} +{"train_loss": 0.0174160934984684, "global_step": 5034, "epoch": 42, "lr": 9.899390268848118e-05} +{"train_loss": 0.017110338434576988, "global_step": 5035, "epoch": 42, "lr": 9.899346043110162e-05} +{"train_loss": 0.020002583041787148, "global_step": 5036, "epoch": 42, "lr": 9.899301807752863e-05} +{"train_loss": 0.017272192984819412, "global_step": 5037, "epoch": 42, "lr": 9.899257562776307e-05} +{"train_loss": 0.0125857163220644, "global_step": 5038, "epoch": 42, "lr": 9.899213308180583e-05} +{"train_loss": 0.022724518552422523, "global_step": 5039, "epoch": 42, "lr": 9.899169043965779e-05} +{"train_loss": 0.013200937770307064, "global_step": 5040, "epoch": 42, "lr": 9.899124770131978e-05} +{"train_loss": 0.020589714869856834, "global_step": 5041, "epoch": 42, "lr": 9.89908048667927e-05} +{"train_loss": 0.015427176840603352, "global_step": 5042, "epoch": 42, "lr": 9.899036193607741e-05} +{"train_loss": 0.01488158106803894, "global_step": 5043, "epoch": 42, "lr": 9.898991890917477e-05} +{"train_loss": 0.012558958493173122, "global_step": 5044, "epoch": 42, "lr": 9.898947578608566e-05} +{"train_loss": 0.01887844316661358, "global_step": 5045, "epoch": 42, "lr": 9.898903256681095e-05} +{"train_loss": 0.016718527302145958, "global_step": 5046, "epoch": 42, "lr": 9.898858925135151e-05} +{"train_loss": 0.020077791064977646, "global_step": 5047, "epoch": 42, "lr": 9.898814583970818e-05} +{"train_loss": 0.013142828829586506, "global_step": 5048, "epoch": 42, "lr": 9.898770233188191e-05} +{"train_loss": 0.0190740879625082, "global_step": 5049, "epoch": 42, "lr": 9.898725872787348e-05} +{"train_loss": 0.014514517039060593, "global_step": 5050, "epoch": 42, "lr": 9.898681502768382e-05} +{"train_loss": 0.017357274889945984, "global_step": 5051, "epoch": 42, "lr": 9.898637123131377e-05} +{"train_loss": 0.013170983642339706, "global_step": 5052, "epoch": 42, "lr": 9.898592733876422e-05} +{"train_loss": 0.016086066141724586, "global_step": 5053, "epoch": 42, "lr": 9.898548335003605e-05} +{"train_loss": 0.020100951194763184, "global_step": 5054, "epoch": 42, "lr": 9.89850392651301e-05} +{"train_loss": 0.014695072546601295, "global_step": 5055, "epoch": 42, "lr": 9.898459508404726e-05} +{"train_loss": 0.016012510284781456, "global_step": 5056, "epoch": 42, "lr": 9.89841508067884e-05} +{"train_loss": 0.014641236513853073, "global_step": 5057, "epoch": 42, "lr": 9.89837064333544e-05} +{"train_loss": 0.014710947871208191, "global_step": 5058, "epoch": 42, "lr": 9.898326196374612e-05} +{"train_loss": 0.02105610817670822, "global_step": 5059, "epoch": 42, "lr": 9.898281739796444e-05} +{"train_loss": 0.018747199326753616, "global_step": 5060, "epoch": 42, "lr": 9.898237273601024e-05} +{"train_loss": 0.011787045747041702, "global_step": 5061, "epoch": 42, "lr": 9.898192797788437e-05} +{"train_loss": 0.020841369405388832, "global_step": 5062, "epoch": 42, "lr": 9.898148312358772e-05} +{"train_loss": 0.020494848489761353, "global_step": 5063, "epoch": 42, "lr": 9.898103817312115e-05} +{"train_loss": 0.015774551779031754, "global_step": 5064, "epoch": 42, "lr": 9.898059312648557e-05} +{"train_loss": 0.019298534840345383, "global_step": 5065, "epoch": 42, "lr": 9.89801479836818e-05} +{"train_loss": 0.018884476274251938, "global_step": 5066, "epoch": 42, "lr": 9.897970274471077e-05} +{"train_loss": 0.012357017956674099, "global_step": 5067, "epoch": 42, "lr": 9.897925740957331e-05} +{"train_loss": 0.01861295849084854, "global_step": 5068, "epoch": 42, "lr": 9.897881197827032e-05} +{"train_loss": 0.018680527806282043, "global_step": 5069, "epoch": 42, "lr": 9.897836645080265e-05} +{"train_loss": 0.018943404778838158, "global_step": 5070, "epoch": 42, "lr": 9.897792082717121e-05} +{"train_loss": 0.017532387748360634, "global_step": 5071, "epoch": 42, "lr": 9.897747510737683e-05} +{"train_loss": 0.021880947053432465, "global_step": 5072, "epoch": 42, "lr": 9.897702929142043e-05} +{"train_loss": 0.01756155490875244, "global_step": 5073, "epoch": 42, "lr": 9.897658337930287e-05} +{"train_loss": 0.011618168093264103, "global_step": 5074, "epoch": 42, "lr": 9.8976137371025e-05} +{"train_loss": 0.019027646631002426, "global_step": 5075, "epoch": 42, "lr": 9.897569126658773e-05} +{"train_loss": 0.01799129694700241, "global_step": 5076, "epoch": 42, "lr": 9.897524506599192e-05} +{"train_loss": 0.015554339624941349, "global_step": 5077, "epoch": 42, "lr": 9.897479876923845e-05} +{"train_loss": 0.017553385347127914, "global_step": 5078, "epoch": 42, "lr": 9.89743523763282e-05} +{"train_loss": 0.018343139439821243, "global_step": 5079, "epoch": 42, "lr": 9.897390588726203e-05} +{"train_loss": 0.012040168978273869, "global_step": 5080, "epoch": 42, "lr": 9.897345930204083e-05} +{"train_loss": 0.017027396708726883, "global_step": 5081, "epoch": 42, "lr": 9.897301262066547e-05} +{"train_loss": 0.016604190692305565, "global_step": 5082, "epoch": 42, "lr": 9.897256584313686e-05} +{"train_loss": 0.012554937973618507, "global_step": 5083, "epoch": 42, "lr": 9.897211896945581e-05} +{"train_loss": 0.015933414921164513, "global_step": 5084, "epoch": 42, "lr": 9.897167199962326e-05} +{"train_loss": 0.017820676788687706, "global_step": 5085, "epoch": 42, "lr": 9.897122493364006e-05} +{"train_loss": 0.016581831499934196, "global_step": 5086, "epoch": 42, "lr": 9.89707777715071e-05} +{"train_loss": 0.014960777014493942, "global_step": 5087, "epoch": 42, "lr": 9.897033051322522e-05} +{"train_loss": 0.018282633274793625, "global_step": 5088, "epoch": 42, "lr": 9.896988315879536e-05} +{"train_loss": 0.014077265746891499, "global_step": 5089, "epoch": 42, "lr": 9.896943570821835e-05} +{"train_loss": 0.018336648121476173, "global_step": 5090, "epoch": 42, "lr": 9.896898816149509e-05} +{"train_loss": 0.01417867187410593, "global_step": 5091, "epoch": 42, "lr": 9.896854051862646e-05} +{"train_loss": 0.020625753328204155, "global_step": 5092, "epoch": 42, "lr": 9.89680927796133e-05} +{"train_loss": 0.01429071743041277, "global_step": 5093, "epoch": 42, "lr": 9.896764494445657e-05} +{"train_loss": 0.014234675094485283, "global_step": 5094, "epoch": 42, "lr": 9.896719701315707e-05} +{"train_loss": 0.016366902738809586, "global_step": 5095, "epoch": 42, "lr": 9.896674898571571e-05} +{"train_loss": 0.01573815383017063, "global_step": 5096, "epoch": 42, "lr": 9.896630086213337e-05} +{"train_loss": 0.021722758188843727, "global_step": 5097, "epoch": 42, "lr": 9.896585264241094e-05} +{"train_loss": 0.012008399702608585, "global_step": 5098, "epoch": 42, "lr": 9.896540432654928e-05} +{"train_loss": 0.014542756602168083, "global_step": 5099, "epoch": 42, "lr": 9.896495591454928e-05} +{"train_loss": 0.016103653237223625, "global_step": 5100, "epoch": 42, "lr": 9.896450740641183e-05} +{"train_loss": 0.01726696826517582, "global_step": 5101, "epoch": 42, "lr": 9.89640588021378e-05} +{"train_loss": 0.020115522667765617, "global_step": 5102, "epoch": 42, "lr": 9.896361010172806e-05} +{"train_loss": 0.017003830522298813, "global_step": 5103, "epoch": 42, "lr": 9.89631613051835e-05} +{"train_loss": 0.022473778575658798, "global_step": 5104, "epoch": 42, "lr": 9.896271241250502e-05} +{"train_loss": 0.015439866110682487, "global_step": 5105, "epoch": 42, "lr": 9.896226342369348e-05} +{"train_loss": 0.015180046670138836, "global_step": 5106, "epoch": 42, "lr": 9.896181433874976e-05} +{"train_loss": 0.012713705189526081, "global_step": 5107, "epoch": 42, "lr": 9.896136515767476e-05} +{"train_loss": 0.02182616852223873, "global_step": 5108, "epoch": 42, "lr": 9.896091588046934e-05} +{"train_loss": 0.014830153435468674, "global_step": 5109, "epoch": 42, "lr": 9.89604665071344e-05} +{"train_loss": 0.013199608772993088, "global_step": 5110, "epoch": 42, "lr": 9.896001703767081e-05} +{"train_loss": 0.012643805705010891, "global_step": 5111, "epoch": 42, "lr": 9.895956747207944e-05} +{"train_loss": 0.012798277661204338, "global_step": 5112, "epoch": 42, "lr": 9.895911781036122e-05} +{"train_loss": 0.013670657761394978, "global_step": 5113, "epoch": 42, "lr": 9.895866805251699e-05} +{"train_loss": 0.009446606040000916, "global_step": 5114, "epoch": 42, "lr": 9.895821819854765e-05} +{"train_loss": 0.01828840747475624, "global_step": 5115, "epoch": 42, "lr": 9.895776824845406e-05} +{"train_loss": 0.016338304569553427, "global_step": 5116, "epoch": 42, "lr": 9.895731820223715e-05, "val_loss": 0.026246268302202225} +{"train_loss": 0.014129983261227608, "global_step": 5117, "epoch": 43, "lr": 9.895686805989776e-05} +{"train_loss": 0.013922902755439281, "global_step": 5118, "epoch": 43, "lr": 9.895641782143678e-05} +{"train_loss": 0.022278374060988426, "global_step": 5119, "epoch": 43, "lr": 9.895596748685513e-05} +{"train_loss": 0.00892159529030323, "global_step": 5120, "epoch": 43, "lr": 9.895551705615365e-05} +{"train_loss": 0.01537149678915739, "global_step": 5121, "epoch": 43, "lr": 9.895506652933325e-05} +{"train_loss": 0.014974264428019524, "global_step": 5122, "epoch": 43, "lr": 9.895461590639482e-05} +{"train_loss": 0.009260505437850952, "global_step": 5123, "epoch": 43, "lr": 9.89541651873392e-05} +{"train_loss": 0.017855988815426826, "global_step": 5124, "epoch": 43, "lr": 9.895371437216732e-05} +{"train_loss": 0.014988663606345654, "global_step": 5125, "epoch": 43, "lr": 9.895326346088005e-05} +{"train_loss": 0.01926831528544426, "global_step": 5126, "epoch": 43, "lr": 9.89528124534783e-05} +{"train_loss": 0.014660777524113655, "global_step": 5127, "epoch": 43, "lr": 9.89523613499629e-05} +{"train_loss": 0.016473902389407158, "global_step": 5128, "epoch": 43, "lr": 9.895191015033479e-05} +{"train_loss": 0.010298793204128742, "global_step": 5129, "epoch": 43, "lr": 9.895145885459483e-05} +{"train_loss": 0.013482675887644291, "global_step": 5130, "epoch": 43, "lr": 9.895100746274389e-05} +{"train_loss": 0.012475109659135342, "global_step": 5131, "epoch": 43, "lr": 9.89505559747829e-05} +{"train_loss": 0.01724802888929844, "global_step": 5132, "epoch": 43, "lr": 9.89501043907127e-05} +{"train_loss": 0.01713545434176922, "global_step": 5133, "epoch": 43, "lr": 9.894965271053423e-05} +{"train_loss": 0.019102884456515312, "global_step": 5134, "epoch": 43, "lr": 9.894920093424833e-05} +{"train_loss": 0.01543465070426464, "global_step": 5135, "epoch": 43, "lr": 9.89487490618559e-05} +{"train_loss": 0.01741359755396843, "global_step": 5136, "epoch": 43, "lr": 9.894829709335784e-05} +{"train_loss": 0.013890944421291351, "global_step": 5137, "epoch": 43, "lr": 9.894784502875503e-05} +{"train_loss": 0.016873179003596306, "global_step": 5138, "epoch": 43, "lr": 9.894739286804836e-05} +{"train_loss": 0.018320556730031967, "global_step": 5139, "epoch": 43, "lr": 9.894694061123868e-05} +{"train_loss": 0.01732845976948738, "global_step": 5140, "epoch": 43, "lr": 9.894648825832694e-05} +{"train_loss": 0.015032771043479443, "global_step": 5141, "epoch": 43, "lr": 9.8946035809314e-05} +{"train_loss": 0.015250349417328835, "global_step": 5142, "epoch": 43, "lr": 9.894558326420074e-05} +{"train_loss": 0.020103558897972107, "global_step": 5143, "epoch": 43, "lr": 9.894513062298805e-05} +{"train_loss": 0.017187979072332382, "global_step": 5144, "epoch": 43, "lr": 9.894467788567684e-05} +{"train_loss": 0.02079745940864086, "global_step": 5145, "epoch": 43, "lr": 9.894422505226797e-05} +{"train_loss": 0.018067894503474236, "global_step": 5146, "epoch": 43, "lr": 9.894377212276235e-05} +{"train_loss": 0.013038835488259792, "global_step": 5147, "epoch": 43, "lr": 9.894331909716086e-05} +{"train_loss": 0.01851467229425907, "global_step": 5148, "epoch": 43, "lr": 9.894286597546441e-05} +{"train_loss": 0.017478294670581818, "global_step": 5149, "epoch": 43, "lr": 9.894241275767384e-05} +{"train_loss": 0.018222499638795853, "global_step": 5150, "epoch": 43, "lr": 9.894195944379008e-05} +{"train_loss": 0.015372497029602528, "global_step": 5151, "epoch": 43, "lr": 9.894150603381403e-05} +{"train_loss": 0.013008727692067623, "global_step": 5152, "epoch": 43, "lr": 9.894105252774654e-05} +{"train_loss": 0.016453472897410393, "global_step": 5153, "epoch": 43, "lr": 9.894059892558854e-05} +{"train_loss": 0.017589859664440155, "global_step": 5154, "epoch": 43, "lr": 9.89401452273409e-05} +{"train_loss": 0.015268308110535145, "global_step": 5155, "epoch": 43, "lr": 9.89396914330045e-05} +{"train_loss": 0.012758990749716759, "global_step": 5156, "epoch": 43, "lr": 9.893923754258026e-05} +{"train_loss": 0.013874942436814308, "global_step": 5157, "epoch": 43, "lr": 9.893878355606903e-05} +{"train_loss": 0.016567079350352287, "global_step": 5158, "epoch": 43, "lr": 9.893832947347175e-05} +{"train_loss": 0.013924781233072281, "global_step": 5159, "epoch": 43, "lr": 9.893787529478929e-05} +{"train_loss": 0.01464033592492342, "global_step": 5160, "epoch": 43, "lr": 9.893742102002252e-05} +{"train_loss": 0.017687875777482986, "global_step": 5161, "epoch": 43, "lr": 9.893696664917237e-05} +{"train_loss": 0.010206273756921291, "global_step": 5162, "epoch": 43, "lr": 9.893651218223971e-05} +{"train_loss": 0.015777593478560448, "global_step": 5163, "epoch": 43, "lr": 9.893605761922545e-05} +{"train_loss": 0.012762160040438175, "global_step": 5164, "epoch": 43, "lr": 9.893560296013043e-05} +{"train_loss": 0.016736295074224472, "global_step": 5165, "epoch": 43, "lr": 9.893514820495562e-05} +{"train_loss": 0.011782761663198471, "global_step": 5166, "epoch": 43, "lr": 9.893469335370184e-05} +{"train_loss": 0.017288267612457275, "global_step": 5167, "epoch": 43, "lr": 9.893423840637006e-05} +{"train_loss": 0.016339613124728203, "global_step": 5168, "epoch": 43, "lr": 9.89337833629611e-05} +{"train_loss": 0.024580752477049828, "global_step": 5169, "epoch": 43, "lr": 9.89333282234759e-05} +{"train_loss": 0.01789877377450466, "global_step": 5170, "epoch": 43, "lr": 9.893287298791531e-05} +{"train_loss": 0.016794942319393158, "global_step": 5171, "epoch": 43, "lr": 9.893241765628027e-05} +{"train_loss": 0.015926547348499298, "global_step": 5172, "epoch": 43, "lr": 9.893196222857166e-05} +{"train_loss": 0.015049228444695473, "global_step": 5173, "epoch": 43, "lr": 9.893150670479038e-05} +{"train_loss": 0.011637713760137558, "global_step": 5174, "epoch": 43, "lr": 9.89310510849373e-05} +{"train_loss": 0.0228286013007164, "global_step": 5175, "epoch": 43, "lr": 9.893059536901333e-05} +{"train_loss": 0.014818374998867512, "global_step": 5176, "epoch": 43, "lr": 9.893013955701935e-05} +{"train_loss": 0.016619782894849777, "global_step": 5177, "epoch": 43, "lr": 9.89296836489563e-05} +{"train_loss": 0.020438004285097122, "global_step": 5178, "epoch": 43, "lr": 9.892922764482502e-05} +{"train_loss": 0.014383068308234215, "global_step": 5179, "epoch": 43, "lr": 9.892877154462643e-05} +{"train_loss": 0.013876472599804401, "global_step": 5180, "epoch": 43, "lr": 9.892831534836142e-05} +{"train_loss": 0.010413187555968761, "global_step": 5181, "epoch": 43, "lr": 9.89278590560309e-05} +{"train_loss": 0.009286110289394855, "global_step": 5182, "epoch": 43, "lr": 9.892740266763576e-05} +{"train_loss": 0.016824133694171906, "global_step": 5183, "epoch": 43, "lr": 9.892694618317689e-05} +{"train_loss": 0.01619982160627842, "global_step": 5184, "epoch": 43, "lr": 9.892648960265518e-05} +{"train_loss": 0.009321595542132854, "global_step": 5185, "epoch": 43, "lr": 9.892603292607155e-05} +{"train_loss": 0.023872515186667442, "global_step": 5186, "epoch": 43, "lr": 9.892557615342685e-05} +{"train_loss": 0.01637827791273594, "global_step": 5187, "epoch": 43, "lr": 9.892511928472204e-05} +{"train_loss": 0.015567426569759846, "global_step": 5188, "epoch": 43, "lr": 9.892466231995797e-05} +{"train_loss": 0.01742151938378811, "global_step": 5189, "epoch": 43, "lr": 9.892420525913557e-05} +{"train_loss": 0.013319049961864948, "global_step": 5190, "epoch": 43, "lr": 9.89237481022557e-05} +{"train_loss": 0.012060687877237797, "global_step": 5191, "epoch": 43, "lr": 9.892329084931928e-05} +{"train_loss": 0.015642773360013962, "global_step": 5192, "epoch": 43, "lr": 9.89228335003272e-05} +{"train_loss": 0.01905452087521553, "global_step": 5193, "epoch": 43, "lr": 9.892237605528038e-05} +{"train_loss": 0.01653239317238331, "global_step": 5194, "epoch": 43, "lr": 9.892191851417968e-05} +{"train_loss": 0.01978798769414425, "global_step": 5195, "epoch": 43, "lr": 9.892146087702605e-05} +{"train_loss": 0.013665882870554924, "global_step": 5196, "epoch": 43, "lr": 9.892100314382034e-05} +{"train_loss": 0.016124270856380463, "global_step": 5197, "epoch": 43, "lr": 9.892054531456346e-05} +{"train_loss": 0.01285457331687212, "global_step": 5198, "epoch": 43, "lr": 9.892008738925634e-05} +{"train_loss": 0.013630202040076256, "global_step": 5199, "epoch": 43, "lr": 9.891962936789983e-05} +{"train_loss": 0.01575828157365322, "global_step": 5200, "epoch": 43, "lr": 9.891917125049486e-05} +{"train_loss": 0.01178902667015791, "global_step": 5201, "epoch": 43, "lr": 9.891871303704232e-05} +{"train_loss": 0.013939091004431248, "global_step": 5202, "epoch": 43, "lr": 9.891825472754313e-05} +{"train_loss": 0.0174561720341444, "global_step": 5203, "epoch": 43, "lr": 9.891779632199814e-05} +{"train_loss": 0.012298808433115482, "global_step": 5204, "epoch": 43, "lr": 9.891733782040831e-05} +{"train_loss": 0.021205725148320198, "global_step": 5205, "epoch": 43, "lr": 9.89168792227745e-05} +{"train_loss": 0.01768469624221325, "global_step": 5206, "epoch": 43, "lr": 9.891642052909764e-05} +{"train_loss": 0.014727268368005753, "global_step": 5207, "epoch": 43, "lr": 9.89159617393786e-05} +{"train_loss": 0.011826125904917717, "global_step": 5208, "epoch": 43, "lr": 9.891550285361831e-05} +{"train_loss": 0.011255821213126183, "global_step": 5209, "epoch": 43, "lr": 9.891504387181765e-05} +{"train_loss": 0.017204951494932175, "global_step": 5210, "epoch": 43, "lr": 9.891458479397752e-05} +{"train_loss": 0.013563130050897598, "global_step": 5211, "epoch": 43, "lr": 9.891412562009883e-05} +{"train_loss": 0.01230836845934391, "global_step": 5212, "epoch": 43, "lr": 9.891366635018248e-05} +{"train_loss": 0.013821885921061039, "global_step": 5213, "epoch": 43, "lr": 9.891320698422936e-05} +{"train_loss": 0.016610099002718925, "global_step": 5214, "epoch": 43, "lr": 9.891274752224041e-05} +{"train_loss": 0.018609410151839256, "global_step": 5215, "epoch": 43, "lr": 9.89122879642165e-05} +{"train_loss": 0.00974587257951498, "global_step": 5216, "epoch": 43, "lr": 9.891182831015853e-05} +{"train_loss": 0.010794539004564285, "global_step": 5217, "epoch": 43, "lr": 9.891136856006741e-05} +{"train_loss": 0.02107100747525692, "global_step": 5218, "epoch": 43, "lr": 9.891090871394404e-05} +{"train_loss": 0.018387446179986, "global_step": 5219, "epoch": 43, "lr": 9.891044877178933e-05} +{"train_loss": 0.013679571449756622, "global_step": 5220, "epoch": 43, "lr": 9.890998873360418e-05} +{"train_loss": 0.014830545522272587, "global_step": 5221, "epoch": 43, "lr": 9.890952859938949e-05} +{"train_loss": 0.02104904316365719, "global_step": 5222, "epoch": 43, "lr": 9.890906836914617e-05} +{"train_loss": 0.015289668925106525, "global_step": 5223, "epoch": 43, "lr": 9.890860804287512e-05} +{"train_loss": 0.0120463902130723, "global_step": 5224, "epoch": 43, "lr": 9.890814762057726e-05} +{"train_loss": 0.015400076285004616, "global_step": 5225, "epoch": 43, "lr": 9.890768710225344e-05} +{"train_loss": 0.01512379664927721, "global_step": 5226, "epoch": 43, "lr": 9.890722648790462e-05} +{"train_loss": 0.01511357817798853, "global_step": 5227, "epoch": 43, "lr": 9.890676577753168e-05} +{"train_loss": 0.014166430570185184, "global_step": 5228, "epoch": 43, "lr": 9.890630497113555e-05} +{"train_loss": 0.016971418634057045, "global_step": 5229, "epoch": 43, "lr": 9.89058440687171e-05} +{"train_loss": 0.01767955906689167, "global_step": 5230, "epoch": 43, "lr": 9.890538307027724e-05} +{"train_loss": 0.010332486592233181, "global_step": 5231, "epoch": 43, "lr": 9.89049219758169e-05} +{"train_loss": 0.013222419656813145, "global_step": 5232, "epoch": 43, "lr": 9.890446078533697e-05} +{"train_loss": 0.012271111831068993, "global_step": 5233, "epoch": 43, "lr": 9.890399949883835e-05} +{"train_loss": 0.015302211046218872, "global_step": 5234, "epoch": 43, "lr": 9.890353811632195e-05} +{"train_loss": 0.015530098417476445, "global_step": 5235, "epoch": 43, "lr": 9.890307663778868e-05, "val_loss": 0.0218149833381176} +{"train_loss": 0.021436555311083794, "global_step": 5236, "epoch": 44, "lr": 9.890261506323946e-05} +{"train_loss": 0.01262377854436636, "global_step": 5237, "epoch": 44, "lr": 9.890215339267516e-05} +{"train_loss": 0.017182691022753716, "global_step": 5238, "epoch": 44, "lr": 9.89016916260967e-05} +{"train_loss": 0.014673599041998386, "global_step": 5239, "epoch": 44, "lr": 9.890122976350501e-05} +{"train_loss": 0.01567530632019043, "global_step": 5240, "epoch": 44, "lr": 9.890076780490098e-05} +{"train_loss": 0.013137297704815865, "global_step": 5241, "epoch": 44, "lr": 9.89003057502855e-05} +{"train_loss": 0.014397725462913513, "global_step": 5242, "epoch": 44, "lr": 9.889984359965952e-05} +{"train_loss": 0.013705054298043251, "global_step": 5243, "epoch": 44, "lr": 9.88993813530239e-05} +{"train_loss": 0.015500904060900211, "global_step": 5244, "epoch": 44, "lr": 9.889891901037957e-05} +{"train_loss": 0.01425888016819954, "global_step": 5245, "epoch": 44, "lr": 9.889845657172743e-05} +{"train_loss": 0.018774135038256645, "global_step": 5246, "epoch": 44, "lr": 9.889799403706841e-05} +{"train_loss": 0.014176912605762482, "global_step": 5247, "epoch": 44, "lr": 9.88975314064034e-05} +{"train_loss": 0.012727594934403896, "global_step": 5248, "epoch": 44, "lr": 9.889706867973331e-05} +{"train_loss": 0.01652585342526436, "global_step": 5249, "epoch": 44, "lr": 9.889660585705904e-05} +{"train_loss": 0.013372981920838356, "global_step": 5250, "epoch": 44, "lr": 9.889614293838153e-05} +{"train_loss": 0.02155318483710289, "global_step": 5251, "epoch": 44, "lr": 9.889567992370166e-05} +{"train_loss": 0.014918055385351181, "global_step": 5252, "epoch": 44, "lr": 9.889521681302033e-05} +{"train_loss": 0.015851551666855812, "global_step": 5253, "epoch": 44, "lr": 9.889475360633848e-05} +{"train_loss": 0.015405161306262016, "global_step": 5254, "epoch": 44, "lr": 9.8894290303657e-05} +{"train_loss": 0.015712466090917587, "global_step": 5255, "epoch": 44, "lr": 9.88938269049768e-05} +{"train_loss": 0.01940998062491417, "global_step": 5256, "epoch": 44, "lr": 9.88933634102988e-05} +{"train_loss": 0.011186046525835991, "global_step": 5257, "epoch": 44, "lr": 9.889289981962391e-05} +{"train_loss": 0.012890194542706013, "global_step": 5258, "epoch": 44, "lr": 9.889243613295302e-05} +{"train_loss": 0.015935592353343964, "global_step": 5259, "epoch": 44, "lr": 9.889197235028706e-05} +{"train_loss": 0.014802088029682636, "global_step": 5260, "epoch": 44, "lr": 9.889150847162694e-05} +{"train_loss": 0.01692947745323181, "global_step": 5261, "epoch": 44, "lr": 9.889104449697357e-05} +{"train_loss": 0.015674080699682236, "global_step": 5262, "epoch": 44, "lr": 9.889058042632786e-05} +{"train_loss": 0.011317462660372257, "global_step": 5263, "epoch": 44, "lr": 9.889011625969071e-05} +{"train_loss": 0.015181638300418854, "global_step": 5264, "epoch": 44, "lr": 9.888965199706304e-05} +{"train_loss": 0.011540989391505718, "global_step": 5265, "epoch": 44, "lr": 9.888918763844576e-05} +{"train_loss": 0.014156993478536606, "global_step": 5266, "epoch": 44, "lr": 9.888872318383979e-05} +{"train_loss": 0.015686018392443657, "global_step": 5267, "epoch": 44, "lr": 9.888825863324604e-05} +{"train_loss": 0.013263382948935032, "global_step": 5268, "epoch": 44, "lr": 9.88877939866654e-05} +{"train_loss": 0.012724768370389938, "global_step": 5269, "epoch": 44, "lr": 9.88873292440988e-05} +{"train_loss": 0.01703498512506485, "global_step": 5270, "epoch": 44, "lr": 9.888686440554717e-05} +{"train_loss": 0.01247361395508051, "global_step": 5271, "epoch": 44, "lr": 9.888639947101139e-05} +{"train_loss": 0.016443829983472824, "global_step": 5272, "epoch": 44, "lr": 9.888593444049239e-05} +{"train_loss": 0.011295528151094913, "global_step": 5273, "epoch": 44, "lr": 9.888546931399108e-05} +{"train_loss": 0.013017314486205578, "global_step": 5274, "epoch": 44, "lr": 9.888500409150838e-05} +{"train_loss": 0.010936380364000797, "global_step": 5275, "epoch": 44, "lr": 9.88845387730452e-05} +{"train_loss": 0.01731657236814499, "global_step": 5276, "epoch": 44, "lr": 9.888407335860243e-05} +{"train_loss": 0.018039938062429428, "global_step": 5277, "epoch": 44, "lr": 9.888360784818103e-05} +{"train_loss": 0.015259847976267338, "global_step": 5278, "epoch": 44, "lr": 9.888314224178187e-05} +{"train_loss": 0.01864667236804962, "global_step": 5279, "epoch": 44, "lr": 9.888267653940588e-05} +{"train_loss": 0.012194710783660412, "global_step": 5280, "epoch": 44, "lr": 9.8882210741054e-05} +{"train_loss": 0.018906986340880394, "global_step": 5281, "epoch": 44, "lr": 9.888174484672709e-05} +{"train_loss": 0.01610136590898037, "global_step": 5282, "epoch": 44, "lr": 9.888127885642613e-05} +{"train_loss": 0.013388855382800102, "global_step": 5283, "epoch": 44, "lr": 9.888081277015198e-05} +{"train_loss": 0.02046840265393257, "global_step": 5284, "epoch": 44, "lr": 9.888034658790558e-05} +{"train_loss": 0.009260140359401703, "global_step": 5285, "epoch": 44, "lr": 9.887988030968784e-05} +{"train_loss": 0.016844822093844414, "global_step": 5286, "epoch": 44, "lr": 9.887941393549969e-05} +{"train_loss": 0.011728144250810146, "global_step": 5287, "epoch": 44, "lr": 9.8878947465342e-05} +{"train_loss": 0.01528091449290514, "global_step": 5288, "epoch": 44, "lr": 9.887848089921575e-05} +{"train_loss": 0.014993207529187202, "global_step": 5289, "epoch": 44, "lr": 9.887801423712181e-05} +{"train_loss": 0.013064738363027573, "global_step": 5290, "epoch": 44, "lr": 9.887754747906113e-05} +{"train_loss": 0.017146192491054535, "global_step": 5291, "epoch": 44, "lr": 9.887708062503458e-05} +{"train_loss": 0.011292023584246635, "global_step": 5292, "epoch": 44, "lr": 9.887661367504313e-05} +{"train_loss": 0.01573711819946766, "global_step": 5293, "epoch": 44, "lr": 9.887614662908766e-05} +{"train_loss": 0.017810020595788956, "global_step": 5294, "epoch": 44, "lr": 9.887567948716909e-05} +{"train_loss": 0.013933480717241764, "global_step": 5295, "epoch": 44, "lr": 9.887521224928835e-05} +{"train_loss": 0.011972093023359776, "global_step": 5296, "epoch": 44, "lr": 9.887474491544635e-05} +{"train_loss": 0.015124042518436909, "global_step": 5297, "epoch": 44, "lr": 9.887427748564402e-05} +{"train_loss": 0.013660456985235214, "global_step": 5298, "epoch": 44, "lr": 9.887380995988226e-05} +{"train_loss": 0.014792934991419315, "global_step": 5299, "epoch": 44, "lr": 9.8873342338162e-05} +{"train_loss": 0.01601908914744854, "global_step": 5300, "epoch": 44, "lr": 9.887287462048415e-05} +{"train_loss": 0.01081812009215355, "global_step": 5301, "epoch": 44, "lr": 9.887240680684962e-05} +{"train_loss": 0.016021396964788437, "global_step": 5302, "epoch": 44, "lr": 9.887193889725936e-05} +{"train_loss": 0.015379290096461773, "global_step": 5303, "epoch": 44, "lr": 9.887147089171426e-05} +{"train_loss": 0.01675262860953808, "global_step": 5304, "epoch": 44, "lr": 9.887100279021525e-05} +{"train_loss": 0.011561383493244648, "global_step": 5305, "epoch": 44, "lr": 9.887053459276325e-05} +{"train_loss": 0.01568838581442833, "global_step": 5306, "epoch": 44, "lr": 9.887006629935917e-05} +{"train_loss": 0.015145081095397472, "global_step": 5307, "epoch": 44, "lr": 9.886959791000394e-05} +{"train_loss": 0.014078477397561073, "global_step": 5308, "epoch": 44, "lr": 9.886912942469848e-05} +{"train_loss": 0.01197057031095028, "global_step": 5309, "epoch": 44, "lr": 9.886866084344369e-05} +{"train_loss": 0.009218316525220871, "global_step": 5310, "epoch": 44, "lr": 9.886819216624052e-05} +{"train_loss": 0.014604573138058186, "global_step": 5311, "epoch": 44, "lr": 9.886772339308987e-05} +{"train_loss": 0.011825965717434883, "global_step": 5312, "epoch": 44, "lr": 9.886725452399266e-05} +{"train_loss": 0.013366344384849072, "global_step": 5313, "epoch": 44, "lr": 9.886678555894982e-05} +{"train_loss": 0.011811544187366962, "global_step": 5314, "epoch": 44, "lr": 9.886631649796228e-05} +{"train_loss": 0.011665171943604946, "global_step": 5315, "epoch": 44, "lr": 9.886584734103094e-05} +{"train_loss": 0.018600251525640488, "global_step": 5316, "epoch": 44, "lr": 9.886537808815673e-05} +{"train_loss": 0.009115559048950672, "global_step": 5317, "epoch": 44, "lr": 9.886490873934055e-05} +{"train_loss": 0.018031341955065727, "global_step": 5318, "epoch": 44, "lr": 9.886443929458338e-05} +{"train_loss": 0.017351318150758743, "global_step": 5319, "epoch": 44, "lr": 9.886396975388607e-05} +{"train_loss": 0.010293504223227501, "global_step": 5320, "epoch": 44, "lr": 9.88635001172496e-05} +{"train_loss": 0.014087515883147717, "global_step": 5321, "epoch": 44, "lr": 9.886303038467486e-05} +{"train_loss": 0.01983831636607647, "global_step": 5322, "epoch": 44, "lr": 9.886256055616277e-05} +{"train_loss": 0.017021894454956055, "global_step": 5323, "epoch": 44, "lr": 9.886209063171428e-05} +{"train_loss": 0.012964247725903988, "global_step": 5324, "epoch": 44, "lr": 9.886162061133027e-05} +{"train_loss": 0.01732485741376877, "global_step": 5325, "epoch": 44, "lr": 9.88611504950117e-05} +{"train_loss": 0.011526749469339848, "global_step": 5326, "epoch": 44, "lr": 9.88606802827595e-05} +{"train_loss": 0.013073470443487167, "global_step": 5327, "epoch": 44, "lr": 9.886020997457455e-05} +{"train_loss": 0.018473757430911064, "global_step": 5328, "epoch": 44, "lr": 9.885973957045781e-05} +{"train_loss": 0.016307927668094635, "global_step": 5329, "epoch": 44, "lr": 9.885926907041018e-05} +{"train_loss": 0.019576026126742363, "global_step": 5330, "epoch": 44, "lr": 9.88587984744326e-05} +{"train_loss": 0.013351392932236195, "global_step": 5331, "epoch": 44, "lr": 9.8858327782526e-05} +{"train_loss": 0.012456483207643032, "global_step": 5332, "epoch": 44, "lr": 9.885785699469128e-05} +{"train_loss": 0.019551826640963554, "global_step": 5333, "epoch": 44, "lr": 9.885738611092938e-05} +{"train_loss": 0.015534237958490849, "global_step": 5334, "epoch": 44, "lr": 9.885691513124123e-05} +{"train_loss": 0.016240395605564117, "global_step": 5335, "epoch": 44, "lr": 9.885644405562773e-05} +{"train_loss": 0.018666347488760948, "global_step": 5336, "epoch": 44, "lr": 9.885597288408985e-05} +{"train_loss": 0.019832756370306015, "global_step": 5337, "epoch": 44, "lr": 9.885550161662847e-05} +{"train_loss": 0.014824861660599709, "global_step": 5338, "epoch": 44, "lr": 9.885503025324452e-05} +{"train_loss": 0.017422035336494446, "global_step": 5339, "epoch": 44, "lr": 9.885455879393896e-05} +{"train_loss": 0.01270404551178217, "global_step": 5340, "epoch": 44, "lr": 9.885408723871267e-05} +{"train_loss": 0.013194097205996513, "global_step": 5341, "epoch": 44, "lr": 9.885361558756662e-05} +{"train_loss": 0.019359776750206947, "global_step": 5342, "epoch": 44, "lr": 9.885314384050171e-05} +{"train_loss": 0.01610870659351349, "global_step": 5343, "epoch": 44, "lr": 9.885267199751886e-05} +{"train_loss": 0.014168037101626396, "global_step": 5344, "epoch": 44, "lr": 9.885220005861901e-05} +{"train_loss": 0.014697562903165817, "global_step": 5345, "epoch": 44, "lr": 9.885172802380309e-05} +{"train_loss": 0.016011539846658707, "global_step": 5346, "epoch": 44, "lr": 9.885125589307202e-05} +{"train_loss": 0.013787622563540936, "global_step": 5347, "epoch": 44, "lr": 9.885078366642673e-05} +{"train_loss": 0.016904406249523163, "global_step": 5348, "epoch": 44, "lr": 9.885031134386816e-05} +{"train_loss": 0.015175499953329563, "global_step": 5349, "epoch": 44, "lr": 9.884983892539718e-05} +{"train_loss": 0.011848116293549538, "global_step": 5350, "epoch": 44, "lr": 9.88493664110148e-05} +{"train_loss": 0.015661058947443962, "global_step": 5351, "epoch": 44, "lr": 9.884889380072188e-05} +{"train_loss": 0.021300723776221275, "global_step": 5352, "epoch": 44, "lr": 9.884842109451939e-05} +{"train_loss": 0.015214601531624794, "global_step": 5353, "epoch": 44, "lr": 9.884794829240826e-05} +{"train_loss": 0.014951358056243728, "global_step": 5354, "epoch": 44, "lr": 9.884747539438939e-05, "val_loss": 0.022471686825156212} +{"train_loss": 0.0211081113666296, "global_step": 5355, "epoch": 45, "lr": 9.884700240046371e-05} +{"train_loss": 0.022990994155406952, "global_step": 5356, "epoch": 45, "lr": 9.884652931063216e-05} +{"train_loss": 0.01264707837253809, "global_step": 5357, "epoch": 45, "lr": 9.884605612489567e-05} +{"train_loss": 0.015975341200828552, "global_step": 5358, "epoch": 45, "lr": 9.884558284325518e-05} +{"train_loss": 0.011206451803445816, "global_step": 5359, "epoch": 45, "lr": 9.88451094657116e-05} +{"train_loss": 0.009691617451608181, "global_step": 5360, "epoch": 45, "lr": 9.884463599226585e-05} +{"train_loss": 0.016544101759791374, "global_step": 5361, "epoch": 45, "lr": 9.88441624229189e-05} +{"train_loss": 0.0182778462767601, "global_step": 5362, "epoch": 45, "lr": 9.884368875767165e-05} +{"train_loss": 0.016518406569957733, "global_step": 5363, "epoch": 45, "lr": 9.884321499652502e-05} +{"train_loss": 0.013299825601279736, "global_step": 5364, "epoch": 45, "lr": 9.884274113947996e-05} +{"train_loss": 0.015793224796652794, "global_step": 5365, "epoch": 45, "lr": 9.884226718653741e-05} +{"train_loss": 0.009881239384412766, "global_step": 5366, "epoch": 45, "lr": 9.884179313769828e-05} +{"train_loss": 0.012740490958094597, "global_step": 5367, "epoch": 45, "lr": 9.88413189929635e-05} +{"train_loss": 0.014904174022376537, "global_step": 5368, "epoch": 45, "lr": 9.884084475233401e-05} +{"train_loss": 0.014522157609462738, "global_step": 5369, "epoch": 45, "lr": 9.884037041581074e-05} +{"train_loss": 0.01584218069911003, "global_step": 5370, "epoch": 45, "lr": 9.883989598339462e-05} +{"train_loss": 0.01423989050090313, "global_step": 5371, "epoch": 45, "lr": 9.88394214550866e-05} +{"train_loss": 0.009257740341126919, "global_step": 5372, "epoch": 45, "lr": 9.883894683088757e-05} +{"train_loss": 0.015071794390678406, "global_step": 5373, "epoch": 45, "lr": 9.88384721107985e-05} +{"train_loss": 0.01584019511938095, "global_step": 5374, "epoch": 45, "lr": 9.88379972948203e-05} +{"train_loss": 0.009676851332187653, "global_step": 5375, "epoch": 45, "lr": 9.883752238295391e-05} +{"train_loss": 0.01891326904296875, "global_step": 5376, "epoch": 45, "lr": 9.883704737520026e-05} +{"train_loss": 0.012233162298798561, "global_step": 5377, "epoch": 45, "lr": 9.883657227156029e-05} +{"train_loss": 0.013007118366658688, "global_step": 5378, "epoch": 45, "lr": 9.883609707203493e-05} +{"train_loss": 0.018834475427865982, "global_step": 5379, "epoch": 45, "lr": 9.883562177662511e-05} +{"train_loss": 0.018915215507149696, "global_step": 5380, "epoch": 45, "lr": 9.883514638533175e-05} +{"train_loss": 0.011203283444046974, "global_step": 5381, "epoch": 45, "lr": 9.88346708981558e-05} +{"train_loss": 0.012362814508378506, "global_step": 5382, "epoch": 45, "lr": 9.883419531509821e-05} +{"train_loss": 0.015752997249364853, "global_step": 5383, "epoch": 45, "lr": 9.883371963615989e-05} +{"train_loss": 0.015629341825842857, "global_step": 5384, "epoch": 45, "lr": 9.883324386134176e-05} +{"train_loss": 0.01681574247777462, "global_step": 5385, "epoch": 45, "lr": 9.88327679906448e-05} +{"train_loss": 0.014154551550745964, "global_step": 5386, "epoch": 45, "lr": 9.883229202406989e-05} +{"train_loss": 0.012406034395098686, "global_step": 5387, "epoch": 45, "lr": 9.883181596161802e-05} +{"train_loss": 0.012182346545159817, "global_step": 5388, "epoch": 45, "lr": 9.883133980329007e-05} +{"train_loss": 0.013857407495379448, "global_step": 5389, "epoch": 45, "lr": 9.883086354908702e-05} +{"train_loss": 0.01039785798639059, "global_step": 5390, "epoch": 45, "lr": 9.883038719900977e-05} +{"train_loss": 0.016730897128582, "global_step": 5391, "epoch": 45, "lr": 9.882991075305927e-05} +{"train_loss": 0.01763462834060192, "global_step": 5392, "epoch": 45, "lr": 9.882943421123648e-05} +{"train_loss": 0.010993930511176586, "global_step": 5393, "epoch": 45, "lr": 9.882895757354229e-05} +{"train_loss": 0.012420998886227608, "global_step": 5394, "epoch": 45, "lr": 9.882848083997767e-05} +{"train_loss": 0.016108060255646706, "global_step": 5395, "epoch": 45, "lr": 9.882800401054353e-05} +{"train_loss": 0.01109930220991373, "global_step": 5396, "epoch": 45, "lr": 9.882752708524083e-05} +{"train_loss": 0.012428892776370049, "global_step": 5397, "epoch": 45, "lr": 9.882705006407052e-05} +{"train_loss": 0.011926143430173397, "global_step": 5398, "epoch": 45, "lr": 9.882657294703348e-05} +{"train_loss": 0.010802037082612514, "global_step": 5399, "epoch": 45, "lr": 9.88260957341307e-05} +{"train_loss": 0.011099886149168015, "global_step": 5400, "epoch": 45, "lr": 9.882561842536309e-05} +{"train_loss": 0.011156211607158184, "global_step": 5401, "epoch": 45, "lr": 9.88251410207316e-05} +{"train_loss": 0.00956930872052908, "global_step": 5402, "epoch": 45, "lr": 9.882466352023715e-05} +{"train_loss": 0.019977539777755737, "global_step": 5403, "epoch": 45, "lr": 9.88241859238807e-05} +{"train_loss": 0.018811076879501343, "global_step": 5404, "epoch": 45, "lr": 9.882370823166316e-05} +{"train_loss": 0.011335056275129318, "global_step": 5405, "epoch": 45, "lr": 9.88232304435855e-05} +{"train_loss": 0.014977002516388893, "global_step": 5406, "epoch": 45, "lr": 9.882275255964864e-05} +{"train_loss": 0.010786117054522038, "global_step": 5407, "epoch": 45, "lr": 9.882227457985352e-05} +{"train_loss": 0.009800035506486893, "global_step": 5408, "epoch": 45, "lr": 9.882179650420109e-05} +{"train_loss": 0.014715835452079773, "global_step": 5409, "epoch": 45, "lr": 9.882131833269227e-05} +{"train_loss": 0.016206640750169754, "global_step": 5410, "epoch": 45, "lr": 9.882084006532802e-05} +{"train_loss": 0.015318883582949638, "global_step": 5411, "epoch": 45, "lr": 9.882036170210924e-05} +{"train_loss": 0.011230370961129665, "global_step": 5412, "epoch": 45, "lr": 9.88198832430369e-05} +{"train_loss": 0.016763359308242798, "global_step": 5413, "epoch": 45, "lr": 9.881940468811195e-05} +{"train_loss": 0.018985487520694733, "global_step": 5414, "epoch": 45, "lr": 9.881892603733532e-05} +{"train_loss": 0.012575222179293633, "global_step": 5415, "epoch": 45, "lr": 9.881844729070793e-05} +{"train_loss": 0.014472735114395618, "global_step": 5416, "epoch": 45, "lr": 9.881796844823072e-05} +{"train_loss": 0.01550380140542984, "global_step": 5417, "epoch": 45, "lr": 9.881748950990468e-05} +{"train_loss": 0.010246869176626205, "global_step": 5418, "epoch": 45, "lr": 9.881701047573069e-05} +{"train_loss": 0.020465990528464317, "global_step": 5419, "epoch": 45, "lr": 9.881653134570971e-05} +{"train_loss": 0.020278772339224815, "global_step": 5420, "epoch": 45, "lr": 9.88160521198427e-05} +{"train_loss": 0.018832499161362648, "global_step": 5421, "epoch": 45, "lr": 9.881557279813059e-05} +{"train_loss": 0.013689227402210236, "global_step": 5422, "epoch": 45, "lr": 9.88150933805743e-05} +{"train_loss": 0.014637444168329239, "global_step": 5423, "epoch": 45, "lr": 9.88146138671748e-05} +{"train_loss": 0.011105376295745373, "global_step": 5424, "epoch": 45, "lr": 9.881413425793304e-05} +{"train_loss": 0.019623195752501488, "global_step": 5425, "epoch": 45, "lr": 9.881365455284993e-05} +{"train_loss": 0.015464995056390762, "global_step": 5426, "epoch": 45, "lr": 9.881317475192642e-05} +{"train_loss": 0.01423108670860529, "global_step": 5427, "epoch": 45, "lr": 9.881269485516344e-05} +{"train_loss": 0.01573471538722515, "global_step": 5428, "epoch": 45, "lr": 9.881221486256198e-05} +{"train_loss": 0.015689667314291, "global_step": 5429, "epoch": 45, "lr": 9.881173477412293e-05} +{"train_loss": 0.011700666509568691, "global_step": 5430, "epoch": 45, "lr": 9.881125458984726e-05} +{"train_loss": 0.020420532673597336, "global_step": 5431, "epoch": 45, "lr": 9.88107743097359e-05} +{"train_loss": 0.01271698996424675, "global_step": 5432, "epoch": 45, "lr": 9.88102939337898e-05} +{"train_loss": 0.01669883355498314, "global_step": 5433, "epoch": 45, "lr": 9.88098134620099e-05} +{"train_loss": 0.01713668741285801, "global_step": 5434, "epoch": 45, "lr": 9.880933289439717e-05} +{"train_loss": 0.02012140303850174, "global_step": 5435, "epoch": 45, "lr": 9.880885223095251e-05} +{"train_loss": 0.01170123741030693, "global_step": 5436, "epoch": 45, "lr": 9.880837147167687e-05} +{"train_loss": 0.016716910526156425, "global_step": 5437, "epoch": 45, "lr": 9.880789061657123e-05} +{"train_loss": 0.012930737808346748, "global_step": 5438, "epoch": 45, "lr": 9.88074096656365e-05} +{"train_loss": 0.013111572712659836, "global_step": 5439, "epoch": 45, "lr": 9.880692861887364e-05} +{"train_loss": 0.02000230923295021, "global_step": 5440, "epoch": 45, "lr": 9.88064474762836e-05} +{"train_loss": 0.01254244800657034, "global_step": 5441, "epoch": 45, "lr": 9.880596623786729e-05} +{"train_loss": 0.013283280655741692, "global_step": 5442, "epoch": 45, "lr": 9.880548490362569e-05} +{"train_loss": 0.017232028767466545, "global_step": 5443, "epoch": 45, "lr": 9.880500347355974e-05} +{"train_loss": 0.012898063287138939, "global_step": 5444, "epoch": 45, "lr": 9.880452194767039e-05} +{"train_loss": 0.012999610044062138, "global_step": 5445, "epoch": 45, "lr": 9.880404032595855e-05} +{"train_loss": 0.013618932105600834, "global_step": 5446, "epoch": 45, "lr": 9.88035586084252e-05} +{"train_loss": 0.013605383224785328, "global_step": 5447, "epoch": 45, "lr": 9.880307679507127e-05} +{"train_loss": 0.014525452628731728, "global_step": 5448, "epoch": 45, "lr": 9.880259488589774e-05} +{"train_loss": 0.011083140037953854, "global_step": 5449, "epoch": 45, "lr": 9.88021128809055e-05} +{"train_loss": 0.01684541441500187, "global_step": 5450, "epoch": 45, "lr": 9.880163078009555e-05} +{"train_loss": 0.013560411520302296, "global_step": 5451, "epoch": 45, "lr": 9.880114858346879e-05} +{"train_loss": 0.01259987335652113, "global_step": 5452, "epoch": 45, "lr": 9.88006662910262e-05} +{"train_loss": 0.017540685832500458, "global_step": 5453, "epoch": 45, "lr": 9.880018390276871e-05} +{"train_loss": 0.01631079614162445, "global_step": 5454, "epoch": 45, "lr": 9.879970141869727e-05} +{"train_loss": 0.014805281534790993, "global_step": 5455, "epoch": 45, "lr": 9.879921883881282e-05} +{"train_loss": 0.018072020262479782, "global_step": 5456, "epoch": 45, "lr": 9.879873616311634e-05} +{"train_loss": 0.013974563218653202, "global_step": 5457, "epoch": 45, "lr": 9.879825339160875e-05} +{"train_loss": 0.01337627787142992, "global_step": 5458, "epoch": 45, "lr": 9.879777052429099e-05} +{"train_loss": 0.01597375050187111, "global_step": 5459, "epoch": 45, "lr": 9.879728756116403e-05} +{"train_loss": 0.00957122165709734, "global_step": 5460, "epoch": 45, "lr": 9.879680450222881e-05} +{"train_loss": 0.01194761972874403, "global_step": 5461, "epoch": 45, "lr": 9.879632134748628e-05} +{"train_loss": 0.01573937013745308, "global_step": 5462, "epoch": 45, "lr": 9.879583809693738e-05} +{"train_loss": 0.012950499542057514, "global_step": 5463, "epoch": 45, "lr": 9.879535475058305e-05} +{"train_loss": 0.013416420668363571, "global_step": 5464, "epoch": 45, "lr": 9.879487130842429e-05} +{"train_loss": 0.0208696611225605, "global_step": 5465, "epoch": 45, "lr": 9.879438777046198e-05} +{"train_loss": 0.014315376989543438, "global_step": 5466, "epoch": 45, "lr": 9.879390413669711e-05} +{"train_loss": 0.012271489948034286, "global_step": 5467, "epoch": 45, "lr": 9.879342040713064e-05} +{"train_loss": 0.010146645829081535, "global_step": 5468, "epoch": 45, "lr": 9.879293658176349e-05} +{"train_loss": 0.014162791892886162, "global_step": 5469, "epoch": 45, "lr": 9.879245266059663e-05} +{"train_loss": 0.014464647509157658, "global_step": 5470, "epoch": 45, "lr": 9.879196864363099e-05} +{"train_loss": 0.009239345788955688, "global_step": 5471, "epoch": 45, "lr": 9.879148453086753e-05} +{"train_loss": 0.009159665554761887, "global_step": 5472, "epoch": 45, "lr": 9.879100032230721e-05} +{"train_loss": 0.014440761495600729, "global_step": 5473, "epoch": 45, "lr": 9.879051601795098e-05, "val_loss": 0.02193647064268589, "train_action_mse_error": 0.0007924311212264001} +{"train_loss": 0.01435060240328312, "global_step": 5474, "epoch": 46, "lr": 9.879003161779976e-05} +{"train_loss": 0.014568393118679523, "global_step": 5475, "epoch": 46, "lr": 9.878954712185455e-05} +{"train_loss": 0.011745011433959007, "global_step": 5476, "epoch": 46, "lr": 9.878906253011626e-05} +{"train_loss": 0.011120232753455639, "global_step": 5477, "epoch": 46, "lr": 9.878857784258588e-05} +{"train_loss": 0.01388260256499052, "global_step": 5478, "epoch": 46, "lr": 9.878809305926432e-05} +{"train_loss": 0.013374350033700466, "global_step": 5479, "epoch": 46, "lr": 9.878760818015256e-05} +{"train_loss": 0.010849318467080593, "global_step": 5480, "epoch": 46, "lr": 9.878712320525154e-05} +{"train_loss": 0.016631830483675003, "global_step": 5481, "epoch": 46, "lr": 9.878663813456221e-05} +{"train_loss": 0.014749989844858646, "global_step": 5482, "epoch": 46, "lr": 9.878615296808554e-05} +{"train_loss": 0.012832725420594215, "global_step": 5483, "epoch": 46, "lr": 9.878566770582247e-05} +{"train_loss": 0.012362794019281864, "global_step": 5484, "epoch": 46, "lr": 9.878518234777394e-05} +{"train_loss": 0.013216801919043064, "global_step": 5485, "epoch": 46, "lr": 9.878469689394093e-05} +{"train_loss": 0.013303459621965885, "global_step": 5486, "epoch": 46, "lr": 9.878421134432439e-05} +{"train_loss": 0.013133244588971138, "global_step": 5487, "epoch": 46, "lr": 9.878372569892523e-05} +{"train_loss": 0.013084701262414455, "global_step": 5488, "epoch": 46, "lr": 9.878323995774445e-05} +{"train_loss": 0.014753473922610283, "global_step": 5489, "epoch": 46, "lr": 9.8782754120783e-05} +{"train_loss": 0.01542429905384779, "global_step": 5490, "epoch": 46, "lr": 9.878226818804182e-05} +{"train_loss": 0.025084378197789192, "global_step": 5491, "epoch": 46, "lr": 9.878178215952187e-05} +{"train_loss": 0.013659952208399773, "global_step": 5492, "epoch": 46, "lr": 9.87812960352241e-05} +{"train_loss": 0.018899045884609222, "global_step": 5493, "epoch": 46, "lr": 9.878080981514945e-05} +{"train_loss": 0.014294857159256935, "global_step": 5494, "epoch": 46, "lr": 9.878032349929891e-05} +{"train_loss": 0.01662066951394081, "global_step": 5495, "epoch": 46, "lr": 9.877983708767343e-05} +{"train_loss": 0.01387084275484085, "global_step": 5496, "epoch": 46, "lr": 9.877935058027391e-05} +{"train_loss": 0.019506841897964478, "global_step": 5497, "epoch": 46, "lr": 9.877886397710139e-05} +{"train_loss": 0.012417674995958805, "global_step": 5498, "epoch": 46, "lr": 9.877837727815675e-05} +{"train_loss": 0.015559801831841469, "global_step": 5499, "epoch": 46, "lr": 9.877789048344099e-05} +{"train_loss": 0.008945069275796413, "global_step": 5500, "epoch": 46, "lr": 9.877740359295507e-05} +{"train_loss": 0.014115286991000175, "global_step": 5501, "epoch": 46, "lr": 9.87769166066999e-05} +{"train_loss": 0.013950016349554062, "global_step": 5502, "epoch": 46, "lr": 9.877642952467648e-05} +{"train_loss": 0.012590141035616398, "global_step": 5503, "epoch": 46, "lr": 9.877594234688575e-05} +{"train_loss": 0.01773567870259285, "global_step": 5504, "epoch": 46, "lr": 9.877545507332866e-05} +{"train_loss": 0.012653624638915062, "global_step": 5505, "epoch": 46, "lr": 9.877496770400619e-05} +{"train_loss": 0.011713062413036823, "global_step": 5506, "epoch": 46, "lr": 9.877448023891927e-05} +{"train_loss": 0.016532085835933685, "global_step": 5507, "epoch": 46, "lr": 9.877399267806888e-05} +{"train_loss": 0.016779623925685883, "global_step": 5508, "epoch": 46, "lr": 9.877350502145595e-05} +{"train_loss": 0.013400468975305557, "global_step": 5509, "epoch": 46, "lr": 9.877301726908145e-05} +{"train_loss": 0.013584349304437637, "global_step": 5510, "epoch": 46, "lr": 9.877252942094637e-05} +{"train_loss": 0.01328787487000227, "global_step": 5511, "epoch": 46, "lr": 9.877204147705162e-05} +{"train_loss": 0.011054816655814648, "global_step": 5512, "epoch": 46, "lr": 9.877155343739818e-05} +{"train_loss": 0.014546656049787998, "global_step": 5513, "epoch": 46, "lr": 9.877106530198701e-05} +{"train_loss": 0.01380757987499237, "global_step": 5514, "epoch": 46, "lr": 9.877057707081905e-05} +{"train_loss": 0.011947057209908962, "global_step": 5515, "epoch": 46, "lr": 9.877008874389528e-05} +{"train_loss": 0.010205703787505627, "global_step": 5516, "epoch": 46, "lr": 9.876960032121666e-05} +{"train_loss": 0.017615966498851776, "global_step": 5517, "epoch": 46, "lr": 9.876911180278413e-05} +{"train_loss": 0.010249942541122437, "global_step": 5518, "epoch": 46, "lr": 9.876862318859867e-05} +{"train_loss": 0.01153613906353712, "global_step": 5519, "epoch": 46, "lr": 9.876813447866121e-05} +{"train_loss": 0.014899533241987228, "global_step": 5520, "epoch": 46, "lr": 9.876764567297274e-05} +{"train_loss": 0.016778355464339256, "global_step": 5521, "epoch": 46, "lr": 9.87671567715342e-05} +{"train_loss": 0.01318336185067892, "global_step": 5522, "epoch": 46, "lr": 9.876666777434657e-05} +{"train_loss": 0.013742872513830662, "global_step": 5523, "epoch": 46, "lr": 9.876617868141078e-05} +{"train_loss": 0.01442623883485794, "global_step": 5524, "epoch": 46, "lr": 9.876568949272783e-05} +{"train_loss": 0.010494592599570751, "global_step": 5525, "epoch": 46, "lr": 9.876520020829865e-05} +{"train_loss": 0.020902924239635468, "global_step": 5526, "epoch": 46, "lr": 9.876471082812419e-05} +{"train_loss": 0.015049026347696781, "global_step": 5527, "epoch": 46, "lr": 9.876422135220546e-05} +{"train_loss": 0.013375853188335896, "global_step": 5528, "epoch": 46, "lr": 9.876373178054338e-05} +{"train_loss": 0.015274547971785069, "global_step": 5529, "epoch": 46, "lr": 9.876324211313892e-05} +{"train_loss": 0.012307754717767239, "global_step": 5530, "epoch": 46, "lr": 9.876275234999304e-05} +{"train_loss": 0.012249517254531384, "global_step": 5531, "epoch": 46, "lr": 9.876226249110672e-05} +{"train_loss": 0.010865656659007072, "global_step": 5532, "epoch": 46, "lr": 9.876177253648088e-05} +{"train_loss": 0.010994515381753445, "global_step": 5533, "epoch": 46, "lr": 9.876128248611654e-05} +{"train_loss": 0.018856151029467583, "global_step": 5534, "epoch": 46, "lr": 9.876079234001461e-05} +{"train_loss": 0.014610209502279758, "global_step": 5535, "epoch": 46, "lr": 9.876030209817609e-05} +{"train_loss": 0.01254646759480238, "global_step": 5536, "epoch": 46, "lr": 9.87598117606019e-05} +{"train_loss": 0.013955357484519482, "global_step": 5537, "epoch": 46, "lr": 9.875932132729306e-05} +{"train_loss": 0.014883997850120068, "global_step": 5538, "epoch": 46, "lr": 9.875883079825047e-05} +{"train_loss": 0.009743745438754559, "global_step": 5539, "epoch": 46, "lr": 9.875834017347516e-05} +{"train_loss": 0.014166095294058323, "global_step": 5540, "epoch": 46, "lr": 9.875784945296804e-05} +{"train_loss": 0.01531203556805849, "global_step": 5541, "epoch": 46, "lr": 9.875735863673009e-05} +{"train_loss": 0.012734482996165752, "global_step": 5542, "epoch": 46, "lr": 9.875686772476227e-05} +{"train_loss": 0.013467803597450256, "global_step": 5543, "epoch": 46, "lr": 9.875637671706554e-05} +{"train_loss": 0.018411530181765556, "global_step": 5544, "epoch": 46, "lr": 9.87558856136409e-05} +{"train_loss": 0.009890928864479065, "global_step": 5545, "epoch": 46, "lr": 9.875539441448928e-05} +{"train_loss": 0.01573001779615879, "global_step": 5546, "epoch": 46, "lr": 9.875490311961164e-05} +{"train_loss": 0.009991667233407497, "global_step": 5547, "epoch": 46, "lr": 9.875441172900897e-05} +{"train_loss": 0.014579410664737225, "global_step": 5548, "epoch": 46, "lr": 9.875392024268222e-05} +{"train_loss": 0.009877732954919338, "global_step": 5549, "epoch": 46, "lr": 9.875342866063235e-05} +{"train_loss": 0.010644680820405483, "global_step": 5550, "epoch": 46, "lr": 9.875293698286034e-05} +{"train_loss": 0.018447335809469223, "global_step": 5551, "epoch": 46, "lr": 9.875244520936713e-05} +{"train_loss": 0.01606932282447815, "global_step": 5552, "epoch": 46, "lr": 9.875195334015372e-05} +{"train_loss": 0.010129017755389214, "global_step": 5553, "epoch": 46, "lr": 9.875146137522105e-05} +{"train_loss": 0.020777564495801926, "global_step": 5554, "epoch": 46, "lr": 9.875096931457009e-05} +{"train_loss": 0.010546392761170864, "global_step": 5555, "epoch": 46, "lr": 9.875047715820181e-05} +{"train_loss": 0.01120703388005495, "global_step": 5556, "epoch": 46, "lr": 9.874998490611719e-05} +{"train_loss": 0.01052586454898119, "global_step": 5557, "epoch": 46, "lr": 9.874949255831717e-05} +{"train_loss": 0.011374465189874172, "global_step": 5558, "epoch": 46, "lr": 9.874900011480273e-05} +{"train_loss": 0.013274949975311756, "global_step": 5559, "epoch": 46, "lr": 9.874850757557483e-05} +{"train_loss": 0.01137212011963129, "global_step": 5560, "epoch": 46, "lr": 9.874801494063446e-05} +{"train_loss": 0.01275319792330265, "global_step": 5561, "epoch": 46, "lr": 9.874752220998257e-05} +{"train_loss": 0.016973648220300674, "global_step": 5562, "epoch": 46, "lr": 9.874702938362011e-05} +{"train_loss": 0.014145801775157452, "global_step": 5563, "epoch": 46, "lr": 9.874653646154808e-05} +{"train_loss": 0.01299014501273632, "global_step": 5564, "epoch": 46, "lr": 9.874604344376743e-05} +{"train_loss": 0.02026747167110443, "global_step": 5565, "epoch": 46, "lr": 9.874555033027914e-05} +{"train_loss": 0.014591054059565067, "global_step": 5566, "epoch": 46, "lr": 9.874505712108417e-05} +{"train_loss": 0.021690798923373222, "global_step": 5567, "epoch": 46, "lr": 9.874456381618347e-05} +{"train_loss": 0.013247217983007431, "global_step": 5568, "epoch": 46, "lr": 9.874407041557803e-05} +{"train_loss": 0.012902355752885342, "global_step": 5569, "epoch": 46, "lr": 9.874357691926883e-05} +{"train_loss": 0.01628817245364189, "global_step": 5570, "epoch": 46, "lr": 9.874308332725681e-05} +{"train_loss": 0.01418508030474186, "global_step": 5571, "epoch": 46, "lr": 9.874258963954296e-05} +{"train_loss": 0.01428182888776064, "global_step": 5572, "epoch": 46, "lr": 9.874209585612824e-05} +{"train_loss": 0.015052182599902153, "global_step": 5573, "epoch": 46, "lr": 9.874160197701363e-05} +{"train_loss": 0.014547680504620075, "global_step": 5574, "epoch": 46, "lr": 9.874110800220007e-05} +{"train_loss": 0.015456117689609528, "global_step": 5575, "epoch": 46, "lr": 9.874061393168857e-05} +{"train_loss": 0.01331789419054985, "global_step": 5576, "epoch": 46, "lr": 9.874011976548009e-05} +{"train_loss": 0.009893890470266342, "global_step": 5577, "epoch": 46, "lr": 9.873962550357559e-05} +{"train_loss": 0.018276002258062363, "global_step": 5578, "epoch": 46, "lr": 9.873913114597601e-05} +{"train_loss": 0.015035872347652912, "global_step": 5579, "epoch": 46, "lr": 9.873863669268238e-05} +{"train_loss": 0.013603711500763893, "global_step": 5580, "epoch": 46, "lr": 9.873814214369565e-05} +{"train_loss": 0.017053935676813126, "global_step": 5581, "epoch": 46, "lr": 9.873764749901677e-05} +{"train_loss": 0.01994132436811924, "global_step": 5582, "epoch": 46, "lr": 9.873715275864673e-05} +{"train_loss": 0.01594431884586811, "global_step": 5583, "epoch": 46, "lr": 9.873665792258651e-05} +{"train_loss": 0.01201749686151743, "global_step": 5584, "epoch": 46, "lr": 9.873616299083704e-05} +{"train_loss": 0.01305986288934946, "global_step": 5585, "epoch": 46, "lr": 9.873566796339935e-05} +{"train_loss": 0.013999399729073048, "global_step": 5586, "epoch": 46, "lr": 9.873517284027436e-05} +{"train_loss": 0.012773435562849045, "global_step": 5587, "epoch": 46, "lr": 9.873467762146308e-05} +{"train_loss": 0.015543458983302116, "global_step": 5588, "epoch": 46, "lr": 9.873418230696646e-05} +{"train_loss": 0.01422970462590456, "global_step": 5589, "epoch": 46, "lr": 9.873368689678548e-05} +{"train_loss": 0.013160092756152153, "global_step": 5590, "epoch": 46, "lr": 9.873319139092112e-05} +{"train_loss": 0.017105605453252792, "global_step": 5591, "epoch": 46, "lr": 9.873269578937433e-05} +{"train_loss": 0.01412144538891666, "global_step": 5592, "epoch": 46, "lr": 9.873220009214612e-05, "val_loss": 0.029864493757486343} +{"train_loss": 0.01643824577331543, "global_step": 5593, "epoch": 47, "lr": 9.873170429923742e-05} +{"train_loss": 0.015115298330783844, "global_step": 5594, "epoch": 47, "lr": 9.873120841064924e-05} +{"train_loss": 0.017145883291959763, "global_step": 5595, "epoch": 47, "lr": 9.873071242638252e-05} +{"train_loss": 0.014761917293071747, "global_step": 5596, "epoch": 47, "lr": 9.873021634643827e-05} +{"train_loss": 0.00970777589827776, "global_step": 5597, "epoch": 47, "lr": 9.872972017081743e-05} +{"train_loss": 0.011387085542082787, "global_step": 5598, "epoch": 47, "lr": 9.8729223899521e-05} +{"train_loss": 0.015421513468027115, "global_step": 5599, "epoch": 47, "lr": 9.872872753254996e-05} +{"train_loss": 0.010745782405138016, "global_step": 5600, "epoch": 47, "lr": 9.872823106990526e-05} +{"train_loss": 0.013761389069259167, "global_step": 5601, "epoch": 47, "lr": 9.872773451158787e-05} +{"train_loss": 0.015183662064373493, "global_step": 5602, "epoch": 47, "lr": 9.872723785759879e-05} +{"train_loss": 0.013522488996386528, "global_step": 5603, "epoch": 47, "lr": 9.872674110793898e-05} +{"train_loss": 0.020281801000237465, "global_step": 5604, "epoch": 47, "lr": 9.872624426260941e-05} +{"train_loss": 0.016097141429781914, "global_step": 5605, "epoch": 47, "lr": 9.872574732161109e-05} +{"train_loss": 0.011727092787623405, "global_step": 5606, "epoch": 47, "lr": 9.872525028494495e-05} +{"train_loss": 0.011799302883446217, "global_step": 5607, "epoch": 47, "lr": 9.8724753152612e-05} +{"train_loss": 0.013156956993043423, "global_step": 5608, "epoch": 47, "lr": 9.872425592461318e-05} +{"train_loss": 0.016069525852799416, "global_step": 5609, "epoch": 47, "lr": 9.872375860094951e-05} +{"train_loss": 0.015133594162762165, "global_step": 5610, "epoch": 47, "lr": 9.872326118162194e-05} +{"train_loss": 0.016050398349761963, "global_step": 5611, "epoch": 47, "lr": 9.872276366663147e-05} +{"train_loss": 0.017077190801501274, "global_step": 5612, "epoch": 47, "lr": 9.872226605597903e-05} +{"train_loss": 0.01864435337483883, "global_step": 5613, "epoch": 47, "lr": 9.872176834966565e-05} +{"train_loss": 0.01326413732022047, "global_step": 5614, "epoch": 47, "lr": 9.872127054769227e-05} +{"train_loss": 0.012713068164885044, "global_step": 5615, "epoch": 47, "lr": 9.872077265005988e-05} +{"train_loss": 0.01452701911330223, "global_step": 5616, "epoch": 47, "lr": 9.872027465676945e-05} +{"train_loss": 0.01641990803182125, "global_step": 5617, "epoch": 47, "lr": 9.871977656782197e-05} +{"train_loss": 0.009462211281061172, "global_step": 5618, "epoch": 47, "lr": 9.871927838321842e-05} +{"train_loss": 0.011502997018396854, "global_step": 5619, "epoch": 47, "lr": 9.871878010295977e-05} +{"train_loss": 0.018138667568564415, "global_step": 5620, "epoch": 47, "lr": 9.8718281727047e-05} +{"train_loss": 0.011609728448092937, "global_step": 5621, "epoch": 47, "lr": 9.871778325548109e-05} +{"train_loss": 0.013175351545214653, "global_step": 5622, "epoch": 47, "lr": 9.871728468826302e-05} +{"train_loss": 0.020480748265981674, "global_step": 5623, "epoch": 47, "lr": 9.871678602539376e-05} +{"train_loss": 0.019266486167907715, "global_step": 5624, "epoch": 47, "lr": 9.871628726687429e-05} +{"train_loss": 0.010142184793949127, "global_step": 5625, "epoch": 47, "lr": 9.871578841270561e-05} +{"train_loss": 0.012510105036199093, "global_step": 5626, "epoch": 47, "lr": 9.871528946288868e-05} +{"train_loss": 0.022685779258608818, "global_step": 5627, "epoch": 47, "lr": 9.871479041742447e-05} +{"train_loss": 0.017864082008600235, "global_step": 5628, "epoch": 47, "lr": 9.871429127631399e-05} +{"train_loss": 0.016521859914064407, "global_step": 5629, "epoch": 47, "lr": 9.87137920395582e-05} +{"train_loss": 0.025373129174113274, "global_step": 5630, "epoch": 47, "lr": 9.871329270715807e-05} +{"train_loss": 0.010962646454572678, "global_step": 5631, "epoch": 47, "lr": 9.87127932791146e-05} +{"train_loss": 0.015032249502837658, "global_step": 5632, "epoch": 47, "lr": 9.871229375542878e-05} +{"train_loss": 0.020889228209853172, "global_step": 5633, "epoch": 47, "lr": 9.871179413610156e-05} +{"train_loss": 0.020627163350582123, "global_step": 5634, "epoch": 47, "lr": 9.871129442113394e-05} +{"train_loss": 0.012047408148646355, "global_step": 5635, "epoch": 47, "lr": 9.871079461052691e-05} +{"train_loss": 0.02224579080939293, "global_step": 5636, "epoch": 47, "lr": 9.871029470428141e-05} +{"train_loss": 0.019285261631011963, "global_step": 5637, "epoch": 47, "lr": 9.870979470239847e-05} +{"train_loss": 0.016667146235704422, "global_step": 5638, "epoch": 47, "lr": 9.870929460487906e-05} +{"train_loss": 0.016336066648364067, "global_step": 5639, "epoch": 47, "lr": 9.870879441172414e-05} +{"train_loss": 0.016457878053188324, "global_step": 5640, "epoch": 47, "lr": 9.87082941229347e-05} +{"train_loss": 0.01786666177213192, "global_step": 5641, "epoch": 47, "lr": 9.870779373851173e-05} +{"train_loss": 0.01981452852487564, "global_step": 5642, "epoch": 47, "lr": 9.870729325845622e-05} +{"train_loss": 0.018952857702970505, "global_step": 5643, "epoch": 47, "lr": 9.870679268276914e-05} +{"train_loss": 0.015676941722631454, "global_step": 5644, "epoch": 47, "lr": 9.870629201145149e-05} +{"train_loss": 0.017624689266085625, "global_step": 5645, "epoch": 47, "lr": 9.870579124450421e-05} +{"train_loss": 0.020377827808260918, "global_step": 5646, "epoch": 47, "lr": 9.870529038192833e-05} +{"train_loss": 0.016965575516223907, "global_step": 5647, "epoch": 47, "lr": 9.870478942372482e-05} +{"train_loss": 0.018631339073181152, "global_step": 5648, "epoch": 47, "lr": 9.870428836989465e-05} +{"train_loss": 0.013554905541241169, "global_step": 5649, "epoch": 47, "lr": 9.870378722043883e-05} +{"train_loss": 0.018319962546229362, "global_step": 5650, "epoch": 47, "lr": 9.870328597535831e-05} +{"train_loss": 0.020079655572772026, "global_step": 5651, "epoch": 47, "lr": 9.870278463465409e-05} +{"train_loss": 0.013483154587447643, "global_step": 5652, "epoch": 47, "lr": 9.870228319832715e-05} +{"train_loss": 0.01897994615137577, "global_step": 5653, "epoch": 47, "lr": 9.870178166637849e-05} +{"train_loss": 0.012643813155591488, "global_step": 5654, "epoch": 47, "lr": 9.870128003880909e-05} +{"train_loss": 0.016909245401620865, "global_step": 5655, "epoch": 47, "lr": 9.870077831561992e-05} +{"train_loss": 0.014414866454899311, "global_step": 5656, "epoch": 47, "lr": 9.870027649681198e-05} +{"train_loss": 0.013567008078098297, "global_step": 5657, "epoch": 47, "lr": 9.869977458238627e-05} +{"train_loss": 0.023303935304284096, "global_step": 5658, "epoch": 47, "lr": 9.869927257234372e-05} +{"train_loss": 0.017758194357156754, "global_step": 5659, "epoch": 47, "lr": 9.869877046668536e-05} +{"train_loss": 0.014270397834479809, "global_step": 5660, "epoch": 47, "lr": 9.869826826541217e-05} +{"train_loss": 0.017611663788557053, "global_step": 5661, "epoch": 47, "lr": 9.869776596852513e-05} +{"train_loss": 0.013018067926168442, "global_step": 5662, "epoch": 47, "lr": 9.869726357602524e-05} +{"train_loss": 0.01732814311981201, "global_step": 5663, "epoch": 47, "lr": 9.869676108791348e-05} +{"train_loss": 0.015177617780864239, "global_step": 5664, "epoch": 47, "lr": 9.869625850419082e-05} +{"train_loss": 0.017533479258418083, "global_step": 5665, "epoch": 47, "lr": 9.869575582485826e-05} +{"train_loss": 0.01582525297999382, "global_step": 5666, "epoch": 47, "lr": 9.869525304991678e-05} +{"train_loss": 0.020308876410126686, "global_step": 5667, "epoch": 47, "lr": 9.869475017936738e-05} +{"train_loss": 0.01423816941678524, "global_step": 5668, "epoch": 47, "lr": 9.869424721321104e-05} +{"train_loss": 0.016698315739631653, "global_step": 5669, "epoch": 47, "lr": 9.869374415144875e-05} +{"train_loss": 0.014574868604540825, "global_step": 5670, "epoch": 47, "lr": 9.86932409940815e-05} +{"train_loss": 0.010365118272602558, "global_step": 5671, "epoch": 47, "lr": 9.869273774111026e-05} +{"train_loss": 0.013546274043619633, "global_step": 5672, "epoch": 47, "lr": 9.869223439253604e-05} +{"train_loss": 0.009667202830314636, "global_step": 5673, "epoch": 47, "lr": 9.869173094835982e-05} +{"train_loss": 0.017112158238887787, "global_step": 5674, "epoch": 47, "lr": 9.869122740858259e-05} +{"train_loss": 0.01574678160250187, "global_step": 5675, "epoch": 47, "lr": 9.869072377320533e-05} +{"train_loss": 0.01744745299220085, "global_step": 5676, "epoch": 47, "lr": 9.869022004222903e-05} +{"train_loss": 0.012934712693095207, "global_step": 5677, "epoch": 47, "lr": 9.86897162156547e-05} +{"train_loss": 0.013220689259469509, "global_step": 5678, "epoch": 47, "lr": 9.868921229348332e-05} +{"train_loss": 0.01711048185825348, "global_step": 5679, "epoch": 47, "lr": 9.868870827571584e-05} +{"train_loss": 0.014015814289450645, "global_step": 5680, "epoch": 47, "lr": 9.868820416235331e-05} +{"train_loss": 0.016262495890259743, "global_step": 5681, "epoch": 47, "lr": 9.868769995339669e-05} +{"train_loss": 0.013218970969319344, "global_step": 5682, "epoch": 47, "lr": 9.868719564884696e-05} +{"train_loss": 0.010050284676253796, "global_step": 5683, "epoch": 47, "lr": 9.868669124870514e-05} +{"train_loss": 0.013074970804154873, "global_step": 5684, "epoch": 47, "lr": 9.868618675297219e-05} +{"train_loss": 0.012322443537414074, "global_step": 5685, "epoch": 47, "lr": 9.868568216164913e-05} +{"train_loss": 0.02045854926109314, "global_step": 5686, "epoch": 47, "lr": 9.868517747473691e-05} +{"train_loss": 0.013408457860350609, "global_step": 5687, "epoch": 47, "lr": 9.868467269223656e-05} +{"train_loss": 0.012928825803101063, "global_step": 5688, "epoch": 47, "lr": 9.868416781414907e-05} +{"train_loss": 0.015166020020842552, "global_step": 5689, "epoch": 47, "lr": 9.868366284047538e-05} +{"train_loss": 0.014787796884775162, "global_step": 5690, "epoch": 47, "lr": 9.868315777121655e-05} +{"train_loss": 0.01467572245746851, "global_step": 5691, "epoch": 47, "lr": 9.868265260637352e-05} +{"train_loss": 0.015701165422797203, "global_step": 5692, "epoch": 47, "lr": 9.868214734594733e-05} +{"train_loss": 0.010459925048053265, "global_step": 5693, "epoch": 47, "lr": 9.868164198993892e-05} +{"train_loss": 0.01161467656493187, "global_step": 5694, "epoch": 47, "lr": 9.868113653834932e-05} +{"train_loss": 0.01355293020606041, "global_step": 5695, "epoch": 47, "lr": 9.868063099117951e-05} +{"train_loss": 0.015284367837011814, "global_step": 5696, "epoch": 47, "lr": 9.868012534843047e-05} +{"train_loss": 0.011882399208843708, "global_step": 5697, "epoch": 47, "lr": 9.867961961010321e-05} +{"train_loss": 0.015800664201378822, "global_step": 5698, "epoch": 47, "lr": 9.867911377619873e-05} +{"train_loss": 0.011830384843051434, "global_step": 5699, "epoch": 47, "lr": 9.8678607846718e-05} +{"train_loss": 0.01513373851776123, "global_step": 5700, "epoch": 47, "lr": 9.867810182166202e-05} +{"train_loss": 0.011862348765134811, "global_step": 5701, "epoch": 47, "lr": 9.867759570103179e-05} +{"train_loss": 0.010202502831816673, "global_step": 5702, "epoch": 47, "lr": 9.86770894848283e-05} +{"train_loss": 0.010419799014925957, "global_step": 5703, "epoch": 47, "lr": 9.867658317305255e-05} +{"train_loss": 0.0140666039660573, "global_step": 5704, "epoch": 47, "lr": 9.867607676570554e-05} +{"train_loss": 0.017071858048439026, "global_step": 5705, "epoch": 47, "lr": 9.867557026278823e-05} +{"train_loss": 0.013527164235711098, "global_step": 5706, "epoch": 47, "lr": 9.867506366430165e-05} +{"train_loss": 0.01631106063723564, "global_step": 5707, "epoch": 47, "lr": 9.867455697024679e-05} +{"train_loss": 0.012895438820123672, "global_step": 5708, "epoch": 47, "lr": 9.867405018062463e-05} +{"train_loss": 0.010832345113158226, "global_step": 5709, "epoch": 47, "lr": 9.867354329543617e-05} +{"train_loss": 0.00922179501503706, "global_step": 5710, "epoch": 47, "lr": 9.86730363146824e-05} +{"train_loss": 0.015204071020316175, "global_step": 5711, "epoch": 47, "lr": 9.867252923836435e-05, "val_loss": 0.018701786175370216} +{"train_loss": 0.014774715527892113, "global_step": 5712, "epoch": 48, "lr": 9.867202206648297e-05} +{"train_loss": 0.01580127887427807, "global_step": 5713, "epoch": 48, "lr": 9.867151479903927e-05} +{"train_loss": 0.01214480772614479, "global_step": 5714, "epoch": 48, "lr": 9.867100743603424e-05} +{"train_loss": 0.014364885166287422, "global_step": 5715, "epoch": 48, "lr": 9.86704999774689e-05} +{"train_loss": 0.009793701581656933, "global_step": 5716, "epoch": 48, "lr": 9.866999242334426e-05} +{"train_loss": 0.01313698198646307, "global_step": 5717, "epoch": 48, "lr": 9.866948477366125e-05} +{"train_loss": 0.02043825015425682, "global_step": 5718, "epoch": 48, "lr": 9.866897702842093e-05} +{"train_loss": 0.01462253276258707, "global_step": 5719, "epoch": 48, "lr": 9.866846918762426e-05} +{"train_loss": 0.014364984817802906, "global_step": 5720, "epoch": 48, "lr": 9.866796125127225e-05} +{"train_loss": 0.014394226484000683, "global_step": 5721, "epoch": 48, "lr": 9.86674532193659e-05} +{"train_loss": 0.014048580080270767, "global_step": 5722, "epoch": 48, "lr": 9.866694509190622e-05} +{"train_loss": 0.01969146355986595, "global_step": 5723, "epoch": 48, "lr": 9.866643686889418e-05} +{"train_loss": 0.011619357392191887, "global_step": 5724, "epoch": 48, "lr": 9.866592855033079e-05} +{"train_loss": 0.012557823210954666, "global_step": 5725, "epoch": 48, "lr": 9.866542013621704e-05} +{"train_loss": 0.012493336573243141, "global_step": 5726, "epoch": 48, "lr": 9.866491162655395e-05} +{"train_loss": 0.015902377665042877, "global_step": 5727, "epoch": 48, "lr": 9.86644030213425e-05} +{"train_loss": 0.013723541982471943, "global_step": 5728, "epoch": 48, "lr": 9.86638943205837e-05} +{"train_loss": 0.015063537284731865, "global_step": 5729, "epoch": 48, "lr": 9.866338552427853e-05} +{"train_loss": 0.017182067036628723, "global_step": 5730, "epoch": 48, "lr": 9.866287663242801e-05} +{"train_loss": 0.016723159700632095, "global_step": 5731, "epoch": 48, "lr": 9.866236764503312e-05} +{"train_loss": 0.011963849887251854, "global_step": 5732, "epoch": 48, "lr": 9.866185856209488e-05} +{"train_loss": 0.012570220045745373, "global_step": 5733, "epoch": 48, "lr": 9.86613493836143e-05} +{"train_loss": 0.013305007480084896, "global_step": 5734, "epoch": 48, "lr": 9.86608401095923e-05} +{"train_loss": 0.013696539215743542, "global_step": 5735, "epoch": 48, "lr": 9.866033074002999e-05} +{"train_loss": 0.011591512709856033, "global_step": 5736, "epoch": 48, "lr": 9.86598212749283e-05} +{"train_loss": 0.009346927516162395, "global_step": 5737, "epoch": 48, "lr": 9.865931171428826e-05} +{"train_loss": 0.014908852055668831, "global_step": 5738, "epoch": 48, "lr": 9.865880205811086e-05} +{"train_loss": 0.01727159135043621, "global_step": 5739, "epoch": 48, "lr": 9.86582923063971e-05} +{"train_loss": 0.01639876887202263, "global_step": 5740, "epoch": 48, "lr": 9.865778245914797e-05} +{"train_loss": 0.01895810477435589, "global_step": 5741, "epoch": 48, "lr": 9.86572725163645e-05} +{"train_loss": 0.013321262784302235, "global_step": 5742, "epoch": 48, "lr": 9.865676247804764e-05} +{"train_loss": 0.010497457347810268, "global_step": 5743, "epoch": 48, "lr": 9.865625234419846e-05} +{"train_loss": 0.017075322568416595, "global_step": 5744, "epoch": 48, "lr": 9.865574211481792e-05} +{"train_loss": 0.012400257401168346, "global_step": 5745, "epoch": 48, "lr": 9.865523178990702e-05} +{"train_loss": 0.011835996992886066, "global_step": 5746, "epoch": 48, "lr": 9.865472136946679e-05} +{"train_loss": 0.02134901098906994, "global_step": 5747, "epoch": 48, "lr": 9.865421085349818e-05} +{"train_loss": 0.014503483660519123, "global_step": 5748, "epoch": 48, "lr": 9.865370024200225e-05} +{"train_loss": 0.013954837806522846, "global_step": 5749, "epoch": 48, "lr": 9.865318953497996e-05} +{"train_loss": 0.016267046332359314, "global_step": 5750, "epoch": 48, "lr": 9.865267873243234e-05} +{"train_loss": 0.014833644963800907, "global_step": 5751, "epoch": 48, "lr": 9.865216783436037e-05} +{"train_loss": 0.01203917060047388, "global_step": 5752, "epoch": 48, "lr": 9.865165684076509e-05} +{"train_loss": 0.014945531263947487, "global_step": 5753, "epoch": 48, "lr": 9.865114575164746e-05} +{"train_loss": 0.01951375976204872, "global_step": 5754, "epoch": 48, "lr": 9.865063456700852e-05} +{"train_loss": 0.020465770736336708, "global_step": 5755, "epoch": 48, "lr": 9.865012328684925e-05} +{"train_loss": 0.010387874208390713, "global_step": 5756, "epoch": 48, "lr": 9.864961191117066e-05} +{"train_loss": 0.01052522286772728, "global_step": 5757, "epoch": 48, "lr": 9.864910043997376e-05} +{"train_loss": 0.014789996668696404, "global_step": 5758, "epoch": 48, "lr": 9.864858887325953e-05} +{"train_loss": 0.012945244088768959, "global_step": 5759, "epoch": 48, "lr": 9.8648077211029e-05} +{"train_loss": 0.00822348054498434, "global_step": 5760, "epoch": 48, "lr": 9.864756545328317e-05} +{"train_loss": 0.014999102801084518, "global_step": 5761, "epoch": 48, "lr": 9.864705360002304e-05} +{"train_loss": 0.01659790426492691, "global_step": 5762, "epoch": 48, "lr": 9.864654165124963e-05} +{"train_loss": 0.010391694493591785, "global_step": 5763, "epoch": 48, "lr": 9.864602960696392e-05} +{"train_loss": 0.011792344972491264, "global_step": 5764, "epoch": 48, "lr": 9.864551746716694e-05} +{"train_loss": 0.011792509816586971, "global_step": 5765, "epoch": 48, "lr": 9.864500523185967e-05} +{"train_loss": 0.012459727004170418, "global_step": 5766, "epoch": 48, "lr": 9.864449290104314e-05} +{"train_loss": 0.013620239682495594, "global_step": 5767, "epoch": 48, "lr": 9.864398047471834e-05} +{"train_loss": 0.012846053577959538, "global_step": 5768, "epoch": 48, "lr": 9.864346795288628e-05} +{"train_loss": 0.015416063368320465, "global_step": 5769, "epoch": 48, "lr": 9.864295533554797e-05} +{"train_loss": 0.013036008924245834, "global_step": 5770, "epoch": 48, "lr": 9.864244262270441e-05} +{"train_loss": 0.0118377935141325, "global_step": 5771, "epoch": 48, "lr": 9.86419298143566e-05} +{"train_loss": 0.014366915449500084, "global_step": 5772, "epoch": 48, "lr": 9.864141691050558e-05} +{"train_loss": 0.014879395253956318, "global_step": 5773, "epoch": 48, "lr": 9.864090391115233e-05} +{"train_loss": 0.012027398683130741, "global_step": 5774, "epoch": 48, "lr": 9.864039081629785e-05} +{"train_loss": 0.011286740191280842, "global_step": 5775, "epoch": 48, "lr": 9.863987762594317e-05} +{"train_loss": 0.013363623060286045, "global_step": 5776, "epoch": 48, "lr": 9.863936434008927e-05} +{"train_loss": 0.009939396753907204, "global_step": 5777, "epoch": 48, "lr": 9.863885095873719e-05} +{"train_loss": 0.00940164178609848, "global_step": 5778, "epoch": 48, "lr": 9.863833748188792e-05} +{"train_loss": 0.013047846034169197, "global_step": 5779, "epoch": 48, "lr": 9.863782390954248e-05} +{"train_loss": 0.011891954578459263, "global_step": 5780, "epoch": 48, "lr": 9.863731024170185e-05} +{"train_loss": 0.01167617179453373, "global_step": 5781, "epoch": 48, "lr": 9.863679647836706e-05} +{"train_loss": 0.013125528581440449, "global_step": 5782, "epoch": 48, "lr": 9.863628261953912e-05} +{"train_loss": 0.010357453487813473, "global_step": 5783, "epoch": 48, "lr": 9.863576866521905e-05} +{"train_loss": 0.016489427536725998, "global_step": 5784, "epoch": 48, "lr": 9.863525461540784e-05} +{"train_loss": 0.012592937797307968, "global_step": 5785, "epoch": 48, "lr": 9.863474047010647e-05} +{"train_loss": 0.017502767965197563, "global_step": 5786, "epoch": 48, "lr": 9.863422622931602e-05} +{"train_loss": 0.012038367800414562, "global_step": 5787, "epoch": 48, "lr": 9.863371189303746e-05} +{"train_loss": 0.009404649958014488, "global_step": 5788, "epoch": 48, "lr": 9.863319746127178e-05} +{"train_loss": 0.015568838454782963, "global_step": 5789, "epoch": 48, "lr": 9.863268293402003e-05} +{"train_loss": 0.016834799200296402, "global_step": 5790, "epoch": 48, "lr": 9.863216831128319e-05} +{"train_loss": 0.014218609780073166, "global_step": 5791, "epoch": 48, "lr": 9.86316535930623e-05} +{"train_loss": 0.011379610747098923, "global_step": 5792, "epoch": 48, "lr": 9.863113877935835e-05} +{"train_loss": 0.01909099891781807, "global_step": 5793, "epoch": 48, "lr": 9.863062387017234e-05} +{"train_loss": 0.0123011264950037, "global_step": 5794, "epoch": 48, "lr": 9.863010886550531e-05} +{"train_loss": 0.01039215363562107, "global_step": 5795, "epoch": 48, "lr": 9.862959376535826e-05} +{"train_loss": 0.014219525270164013, "global_step": 5796, "epoch": 48, "lr": 9.862907856973218e-05} +{"train_loss": 0.008831227198243141, "global_step": 5797, "epoch": 48, "lr": 9.86285632786281e-05} +{"train_loss": 0.011394870467483997, "global_step": 5798, "epoch": 48, "lr": 9.862804789204705e-05} +{"train_loss": 0.0100166080519557, "global_step": 5799, "epoch": 48, "lr": 9.862753240999001e-05} +{"train_loss": 0.011238854378461838, "global_step": 5800, "epoch": 48, "lr": 9.862701683245801e-05} +{"train_loss": 0.008764544501900673, "global_step": 5801, "epoch": 48, "lr": 9.862650115945206e-05} +{"train_loss": 0.01577964425086975, "global_step": 5802, "epoch": 48, "lr": 9.862598539097316e-05} +{"train_loss": 0.01338158454746008, "global_step": 5803, "epoch": 48, "lr": 9.862546952702234e-05} +{"train_loss": 0.014410555362701416, "global_step": 5804, "epoch": 48, "lr": 9.86249535676006e-05} +{"train_loss": 0.011394361034035683, "global_step": 5805, "epoch": 48, "lr": 9.862443751270897e-05} +{"train_loss": 0.010181865654885769, "global_step": 5806, "epoch": 48, "lr": 9.862392136234844e-05} +{"train_loss": 0.010627464391291142, "global_step": 5807, "epoch": 48, "lr": 9.862340511652004e-05} +{"train_loss": 0.013968919403851032, "global_step": 5808, "epoch": 48, "lr": 9.862288877522478e-05} +{"train_loss": 0.01166932936757803, "global_step": 5809, "epoch": 48, "lr": 9.862237233846367e-05} +{"train_loss": 0.013280821032822132, "global_step": 5810, "epoch": 48, "lr": 9.862185580623773e-05} +{"train_loss": 0.013574166223406792, "global_step": 5811, "epoch": 48, "lr": 9.862133917854796e-05} +{"train_loss": 0.014472436159849167, "global_step": 5812, "epoch": 48, "lr": 9.862082245539539e-05} +{"train_loss": 0.01574617251753807, "global_step": 5813, "epoch": 48, "lr": 9.862030563678104e-05} +{"train_loss": 0.014738932251930237, "global_step": 5814, "epoch": 48, "lr": 9.861978872270589e-05} +{"train_loss": 0.0165090411901474, "global_step": 5815, "epoch": 48, "lr": 9.8619271713171e-05} +{"train_loss": 0.013600073754787445, "global_step": 5816, "epoch": 48, "lr": 9.861875460817736e-05} +{"train_loss": 0.016141364350914955, "global_step": 5817, "epoch": 48, "lr": 9.8618237407726e-05} +{"train_loss": 0.014757911674678326, "global_step": 5818, "epoch": 48, "lr": 9.861772011181791e-05} +{"train_loss": 0.01463822741061449, "global_step": 5819, "epoch": 48, "lr": 9.861720272045412e-05} +{"train_loss": 0.01679135113954544, "global_step": 5820, "epoch": 48, "lr": 9.861668523363565e-05} +{"train_loss": 0.012935396283864975, "global_step": 5821, "epoch": 48, "lr": 9.861616765136353e-05} +{"train_loss": 0.014852406457066536, "global_step": 5822, "epoch": 48, "lr": 9.861564997363873e-05} +{"train_loss": 0.014810176566243172, "global_step": 5823, "epoch": 48, "lr": 9.86151322004623e-05} +{"train_loss": 0.010915171355009079, "global_step": 5824, "epoch": 48, "lr": 9.861461433183527e-05} +{"train_loss": 0.015507818199694157, "global_step": 5825, "epoch": 48, "lr": 9.861409636775862e-05} +{"train_loss": 0.016785992309451103, "global_step": 5826, "epoch": 48, "lr": 9.861357830823339e-05} +{"train_loss": 0.011844946071505547, "global_step": 5827, "epoch": 48, "lr": 9.86130601532606e-05} +{"train_loss": 0.012177051045000553, "global_step": 5828, "epoch": 48, "lr": 9.861254190284125e-05} +{"train_loss": 0.013606289401650429, "global_step": 5829, "epoch": 48, "lr": 9.861202355697638e-05} +{"train_loss": 0.013665945574390787, "global_step": 5830, "epoch": 48, "lr": 9.8611505115667e-05, "val_loss": 0.014516489580273628} +{"train_loss": 0.015526838600635529, "global_step": 5831, "epoch": 49, "lr": 9.86109865789141e-05} +{"train_loss": 0.019130945205688477, "global_step": 5832, "epoch": 49, "lr": 9.861046794671873e-05} +{"train_loss": 0.009030239656567574, "global_step": 5833, "epoch": 49, "lr": 9.860994921908191e-05} +{"train_loss": 0.012562748044729233, "global_step": 5834, "epoch": 49, "lr": 9.860943039600463e-05} +{"train_loss": 0.016946513205766678, "global_step": 5835, "epoch": 49, "lr": 9.860891147748794e-05} +{"train_loss": 0.009767075069248676, "global_step": 5836, "epoch": 49, "lr": 9.860839246353284e-05} +{"train_loss": 0.013112509623169899, "global_step": 5837, "epoch": 49, "lr": 9.860787335414036e-05} +{"train_loss": 0.013455387204885483, "global_step": 5838, "epoch": 49, "lr": 9.86073541493115e-05} +{"train_loss": 0.018722182139754295, "global_step": 5839, "epoch": 49, "lr": 9.860683484904731e-05} +{"train_loss": 0.014926783740520477, "global_step": 5840, "epoch": 49, "lr": 9.860631545334877e-05} +{"train_loss": 0.016045011579990387, "global_step": 5841, "epoch": 49, "lr": 9.860579596221695e-05} +{"train_loss": 0.012762255035340786, "global_step": 5842, "epoch": 49, "lr": 9.860527637565283e-05} +{"train_loss": 0.014151357114315033, "global_step": 5843, "epoch": 49, "lr": 9.860475669365745e-05} +{"train_loss": 0.01707093045115471, "global_step": 5844, "epoch": 49, "lr": 9.860423691623181e-05} +{"train_loss": 0.012527773156762123, "global_step": 5845, "epoch": 49, "lr": 9.860371704337694e-05} +{"train_loss": 0.014933891594409943, "global_step": 5846, "epoch": 49, "lr": 9.860319707509388e-05} +{"train_loss": 0.01654912531375885, "global_step": 5847, "epoch": 49, "lr": 9.860267701138363e-05} +{"train_loss": 0.011539539322257042, "global_step": 5848, "epoch": 49, "lr": 9.86021568522472e-05} +{"train_loss": 0.016427721828222275, "global_step": 5849, "epoch": 49, "lr": 9.860163659768566e-05} +{"train_loss": 0.011099088005721569, "global_step": 5850, "epoch": 49, "lr": 9.860111624769997e-05} +{"train_loss": 0.01604640483856201, "global_step": 5851, "epoch": 49, "lr": 9.86005958022912e-05} +{"train_loss": 0.016090085729956627, "global_step": 5852, "epoch": 49, "lr": 9.860007526146034e-05} +{"train_loss": 0.01188756711781025, "global_step": 5853, "epoch": 49, "lr": 9.859955462520843e-05} +{"train_loss": 0.016983576118946075, "global_step": 5854, "epoch": 49, "lr": 9.859903389353649e-05} +{"train_loss": 0.014200441539287567, "global_step": 5855, "epoch": 49, "lr": 9.859851306644552e-05} +{"train_loss": 0.01472785696387291, "global_step": 5856, "epoch": 49, "lr": 9.859799214393658e-05} +{"train_loss": 0.017009522765874863, "global_step": 5857, "epoch": 49, "lr": 9.859747112601066e-05} +{"train_loss": 0.008653913624584675, "global_step": 5858, "epoch": 49, "lr": 9.859695001266882e-05} +{"train_loss": 0.01789524219930172, "global_step": 5859, "epoch": 49, "lr": 9.859642880391204e-05} +{"train_loss": 0.008490387350320816, "global_step": 5860, "epoch": 49, "lr": 9.859590749974137e-05} +{"train_loss": 0.01745237037539482, "global_step": 5861, "epoch": 49, "lr": 9.859538610015783e-05} +{"train_loss": 0.014718150720000267, "global_step": 5862, "epoch": 49, "lr": 9.859486460516245e-05} +{"train_loss": 0.014168808236718178, "global_step": 5863, "epoch": 49, "lr": 9.859434301475623e-05} +{"train_loss": 0.016022490337491035, "global_step": 5864, "epoch": 49, "lr": 9.859382132894021e-05} +{"train_loss": 0.010674522258341312, "global_step": 5865, "epoch": 49, "lr": 9.859329954771542e-05} +{"train_loss": 0.016968749463558197, "global_step": 5866, "epoch": 49, "lr": 9.859277767108287e-05} +{"train_loss": 0.01699667237699032, "global_step": 5867, "epoch": 49, "lr": 9.859225569904358e-05} +{"train_loss": 0.024382861331105232, "global_step": 5868, "epoch": 49, "lr": 9.859173363159862e-05} +{"train_loss": 0.011280057020485401, "global_step": 5869, "epoch": 49, "lr": 9.859121146874897e-05} +{"train_loss": 0.012730794958770275, "global_step": 5870, "epoch": 49, "lr": 9.859068921049566e-05} +{"train_loss": 0.01682518981397152, "global_step": 5871, "epoch": 49, "lr": 9.859016685683972e-05} +{"train_loss": 0.018166769295930862, "global_step": 5872, "epoch": 49, "lr": 9.85896444077822e-05} +{"train_loss": 0.011949540115892887, "global_step": 5873, "epoch": 49, "lr": 9.858912186332408e-05} +{"train_loss": 0.017291761934757233, "global_step": 5874, "epoch": 49, "lr": 9.858859922346642e-05} +{"train_loss": 0.01615198887884617, "global_step": 5875, "epoch": 49, "lr": 9.858807648821023e-05} +{"train_loss": 0.01605972647666931, "global_step": 5876, "epoch": 49, "lr": 9.858755365755655e-05} +{"train_loss": 0.01695662923157215, "global_step": 5877, "epoch": 49, "lr": 9.858703073150639e-05} +{"train_loss": 0.011331142857670784, "global_step": 5878, "epoch": 49, "lr": 9.85865077100608e-05} +{"train_loss": 0.01352381519973278, "global_step": 5879, "epoch": 49, "lr": 9.858598459322079e-05} +{"train_loss": 0.018326427787542343, "global_step": 5880, "epoch": 49, "lr": 9.858546138098739e-05} +{"train_loss": 0.012842091731727123, "global_step": 5881, "epoch": 49, "lr": 9.858493807336163e-05} +{"train_loss": 0.013780194334685802, "global_step": 5882, "epoch": 49, "lr": 9.858441467034452e-05} +{"train_loss": 0.01905997470021248, "global_step": 5883, "epoch": 49, "lr": 9.858389117193711e-05} +{"train_loss": 0.01606012135744095, "global_step": 5884, "epoch": 49, "lr": 9.858336757814041e-05} +{"train_loss": 0.0126179289072752, "global_step": 5885, "epoch": 49, "lr": 9.858284388895547e-05} +{"train_loss": 0.01799345575273037, "global_step": 5886, "epoch": 49, "lr": 9.85823201043833e-05} +{"train_loss": 0.017858412116765976, "global_step": 5887, "epoch": 49, "lr": 9.858179622442494e-05} +{"train_loss": 0.01813860982656479, "global_step": 5888, "epoch": 49, "lr": 9.858127224908143e-05} +{"train_loss": 0.023974234238266945, "global_step": 5889, "epoch": 49, "lr": 9.858074817835377e-05} +{"train_loss": 0.012179332785308361, "global_step": 5890, "epoch": 49, "lr": 9.858022401224298e-05} +{"train_loss": 0.015276342630386353, "global_step": 5891, "epoch": 49, "lr": 9.857969975075013e-05} +{"train_loss": 0.012927868403494358, "global_step": 5892, "epoch": 49, "lr": 9.857917539387623e-05} +{"train_loss": 0.010337303392589092, "global_step": 5893, "epoch": 49, "lr": 9.85786509416223e-05} +{"train_loss": 0.026371216401457787, "global_step": 5894, "epoch": 49, "lr": 9.857812639398938e-05} +{"train_loss": 0.013189942575991154, "global_step": 5895, "epoch": 49, "lr": 9.85776017509785e-05} +{"train_loss": 0.022858327254652977, "global_step": 5896, "epoch": 49, "lr": 9.85770770125907e-05} +{"train_loss": 0.014487923122942448, "global_step": 5897, "epoch": 49, "lr": 9.857655217882698e-05} +{"train_loss": 0.012831267900764942, "global_step": 5898, "epoch": 49, "lr": 9.857602724968841e-05} +{"train_loss": 0.01244044117629528, "global_step": 5899, "epoch": 49, "lr": 9.857550222517598e-05} +{"train_loss": 0.011921227909624577, "global_step": 5900, "epoch": 49, "lr": 9.857497710529076e-05} +{"train_loss": 0.014592273160815239, "global_step": 5901, "epoch": 49, "lr": 9.857445189003374e-05} +{"train_loss": 0.011851665563881397, "global_step": 5902, "epoch": 49, "lr": 9.8573926579406e-05} +{"train_loss": 0.012272639200091362, "global_step": 5903, "epoch": 49, "lr": 9.857340117340852e-05} +{"train_loss": 0.017395472154021263, "global_step": 5904, "epoch": 49, "lr": 9.857287567204237e-05} +{"train_loss": 0.015424516052007675, "global_step": 5905, "epoch": 49, "lr": 9.857235007530856e-05} +{"train_loss": 0.015454856678843498, "global_step": 5906, "epoch": 49, "lr": 9.857182438320813e-05} +{"train_loss": 0.01459411345422268, "global_step": 5907, "epoch": 49, "lr": 9.857129859574213e-05} +{"train_loss": 0.018045520409941673, "global_step": 5908, "epoch": 49, "lr": 9.857077271291155e-05} +{"train_loss": 0.014258025214076042, "global_step": 5909, "epoch": 49, "lr": 9.857024673471747e-05} +{"train_loss": 0.016230685636401176, "global_step": 5910, "epoch": 49, "lr": 9.856972066116088e-05} +{"train_loss": 0.012057336047291756, "global_step": 5911, "epoch": 49, "lr": 9.856919449224284e-05} +{"train_loss": 0.01885749213397503, "global_step": 5912, "epoch": 49, "lr": 9.856866822796437e-05} +{"train_loss": 0.01295651588588953, "global_step": 5913, "epoch": 49, "lr": 9.856814186832652e-05} +{"train_loss": 0.015839822590351105, "global_step": 5914, "epoch": 49, "lr": 9.85676154133303e-05} +{"train_loss": 0.016216248273849487, "global_step": 5915, "epoch": 49, "lr": 9.856708886297676e-05} +{"train_loss": 0.01947150193154812, "global_step": 5916, "epoch": 49, "lr": 9.856656221726693e-05} +{"train_loss": 0.013884317129850388, "global_step": 5917, "epoch": 49, "lr": 9.856603547620184e-05} +{"train_loss": 0.013184514828026295, "global_step": 5918, "epoch": 49, "lr": 9.856550863978253e-05} +{"train_loss": 0.012668686918914318, "global_step": 5919, "epoch": 49, "lr": 9.856498170801004e-05} +{"train_loss": 0.012369167059659958, "global_step": 5920, "epoch": 49, "lr": 9.856445468088539e-05} +{"train_loss": 0.018626146018505096, "global_step": 5921, "epoch": 49, "lr": 9.856392755840962e-05} +{"train_loss": 0.01493245828896761, "global_step": 5922, "epoch": 49, "lr": 9.856340034058377e-05} +{"train_loss": 0.015494871884584427, "global_step": 5923, "epoch": 49, "lr": 9.856287302740888e-05} +{"train_loss": 0.016585176810622215, "global_step": 5924, "epoch": 49, "lr": 9.856234561888595e-05} +{"train_loss": 0.010340566746890545, "global_step": 5925, "epoch": 49, "lr": 9.856181811501607e-05} +{"train_loss": 0.017959222197532654, "global_step": 5926, "epoch": 49, "lr": 9.856129051580024e-05} +{"train_loss": 0.014080311171710491, "global_step": 5927, "epoch": 49, "lr": 9.856076282123949e-05} +{"train_loss": 0.017516732215881348, "global_step": 5928, "epoch": 49, "lr": 9.85602350313349e-05} +{"train_loss": 0.015702692791819572, "global_step": 5929, "epoch": 49, "lr": 9.855970714608746e-05} +{"train_loss": 0.012127223424613476, "global_step": 5930, "epoch": 49, "lr": 9.855917916549822e-05} +{"train_loss": 0.015898481011390686, "global_step": 5931, "epoch": 49, "lr": 9.85586510895682e-05} +{"train_loss": 0.017786243930459023, "global_step": 5932, "epoch": 49, "lr": 9.855812291829849e-05} +{"train_loss": 0.011105780489742756, "global_step": 5933, "epoch": 49, "lr": 9.855759465169008e-05} +{"train_loss": 0.01382816769182682, "global_step": 5934, "epoch": 49, "lr": 9.855706628974402e-05} +{"train_loss": 0.015849027782678604, "global_step": 5935, "epoch": 49, "lr": 9.855653783246136e-05} +{"train_loss": 0.015587938949465752, "global_step": 5936, "epoch": 49, "lr": 9.855600927984313e-05} +{"train_loss": 0.01478596031665802, "global_step": 5937, "epoch": 49, "lr": 9.855548063189033e-05} +{"train_loss": 0.01934804394841194, "global_step": 5938, "epoch": 49, "lr": 9.855495188860405e-05} +{"train_loss": 0.011660037562251091, "global_step": 5939, "epoch": 49, "lr": 9.855442304998531e-05} +{"train_loss": 0.017596889287233353, "global_step": 5940, "epoch": 49, "lr": 9.855389411603515e-05} +{"train_loss": 0.012165357358753681, "global_step": 5941, "epoch": 49, "lr": 9.855336508675459e-05} +{"train_loss": 0.018338441848754883, "global_step": 5942, "epoch": 49, "lr": 9.855283596214471e-05} +{"train_loss": 0.014780459925532341, "global_step": 5943, "epoch": 49, "lr": 9.85523067422065e-05} +{"train_loss": 0.015355887822806835, "global_step": 5944, "epoch": 49, "lr": 9.855177742694103e-05} +{"train_loss": 0.017457768321037292, "global_step": 5945, "epoch": 49, "lr": 9.855124801634935e-05} +{"train_loss": 0.011254838667809963, "global_step": 5946, "epoch": 49, "lr": 9.855071851043248e-05} +{"train_loss": 0.016436783596873283, "global_step": 5947, "epoch": 49, "lr": 9.855018890919143e-05} +{"train_loss": 0.01166228111833334, "global_step": 5948, "epoch": 49, "lr": 9.854965921262728e-05} +{"train_loss": 0.015091352180397812, "global_step": 5949, "epoch": 49, "lr": 9.854912942074109e-05, "val_loss": 0.03011769987642765} +{"train_loss": 0.017327485606074333, "global_step": 5950, "epoch": 50, "lr": 9.854859953353384e-05} +{"train_loss": 0.01675298623740673, "global_step": 5951, "epoch": 50, "lr": 9.854806955100662e-05} +{"train_loss": 0.01207214780151844, "global_step": 5952, "epoch": 50, "lr": 9.854753947316044e-05} +{"train_loss": 0.011613714508712292, "global_step": 5953, "epoch": 50, "lr": 9.854700929999636e-05} +{"train_loss": 0.01890776865184307, "global_step": 5954, "epoch": 50, "lr": 9.854647903151541e-05} +{"train_loss": 0.014203274622559547, "global_step": 5955, "epoch": 50, "lr": 9.854594866771864e-05} +{"train_loss": 0.01369271520525217, "global_step": 5956, "epoch": 50, "lr": 9.854541820860708e-05} +{"train_loss": 0.015945283696055412, "global_step": 5957, "epoch": 50, "lr": 9.854488765418178e-05} +{"train_loss": 0.015193718485534191, "global_step": 5958, "epoch": 50, "lr": 9.854435700444377e-05} +{"train_loss": 0.012216526083648205, "global_step": 5959, "epoch": 50, "lr": 9.854382625939411e-05} +{"train_loss": 0.01022236980497837, "global_step": 5960, "epoch": 50, "lr": 9.854329541903385e-05} +{"train_loss": 0.01742561161518097, "global_step": 5961, "epoch": 50, "lr": 9.854276448336399e-05} +{"train_loss": 0.01353775430470705, "global_step": 5962, "epoch": 50, "lr": 9.85422334523856e-05} +{"train_loss": 0.01414740551263094, "global_step": 5963, "epoch": 50, "lr": 9.854170232609973e-05} +{"train_loss": 0.01546777505427599, "global_step": 5964, "epoch": 50, "lr": 9.854117110450742e-05} +{"train_loss": 0.014957865700125694, "global_step": 5965, "epoch": 50, "lr": 9.85406397876097e-05} +{"train_loss": 0.010749286971986294, "global_step": 5966, "epoch": 50, "lr": 9.854010837540761e-05} +{"train_loss": 0.01613239198923111, "global_step": 5967, "epoch": 50, "lr": 9.85395768679022e-05} +{"train_loss": 0.010514369234442711, "global_step": 5968, "epoch": 50, "lr": 9.853904526509454e-05} +{"train_loss": 0.014822719618678093, "global_step": 5969, "epoch": 50, "lr": 9.853851356698563e-05} +{"train_loss": 0.012643950060009956, "global_step": 5970, "epoch": 50, "lr": 9.853798177357653e-05} +{"train_loss": 0.014050735160708427, "global_step": 5971, "epoch": 50, "lr": 9.853744988486831e-05} +{"train_loss": 0.015280215069651604, "global_step": 5972, "epoch": 50, "lr": 9.853691790086199e-05} +{"train_loss": 0.013430026359856129, "global_step": 5973, "epoch": 50, "lr": 9.853638582155861e-05} +{"train_loss": 0.01277477853000164, "global_step": 5974, "epoch": 50, "lr": 9.853585364695921e-05} +{"train_loss": 0.01971546746790409, "global_step": 5975, "epoch": 50, "lr": 9.853532137706487e-05} +{"train_loss": 0.01520448736846447, "global_step": 5976, "epoch": 50, "lr": 9.853478901187659e-05} +{"train_loss": 0.012900707311928272, "global_step": 5977, "epoch": 50, "lr": 9.853425655139546e-05} +{"train_loss": 0.012484027072787285, "global_step": 5978, "epoch": 50, "lr": 9.853372399562249e-05} +{"train_loss": 0.01587524265050888, "global_step": 5979, "epoch": 50, "lr": 9.853319134455871e-05} +{"train_loss": 0.013598261401057243, "global_step": 5980, "epoch": 50, "lr": 9.853265859820524e-05} +{"train_loss": 0.010715917684137821, "global_step": 5981, "epoch": 50, "lr": 9.853212575656305e-05} +{"train_loss": 0.018622061237692833, "global_step": 5982, "epoch": 50, "lr": 9.853159281963324e-05} +{"train_loss": 0.01358216442167759, "global_step": 5983, "epoch": 50, "lr": 9.853105978741681e-05} +{"train_loss": 0.012517424300312996, "global_step": 5984, "epoch": 50, "lr": 9.853052665991485e-05} +{"train_loss": 0.010920650325715542, "global_step": 5985, "epoch": 50, "lr": 9.852999343712837e-05} +{"train_loss": 0.018096692860126495, "global_step": 5986, "epoch": 50, "lr": 9.852946011905842e-05} +{"train_loss": 0.01090018730610609, "global_step": 5987, "epoch": 50, "lr": 9.852892670570609e-05} +{"train_loss": 0.013823227025568485, "global_step": 5988, "epoch": 50, "lr": 9.852839319707237e-05} +{"train_loss": 0.012505418621003628, "global_step": 5989, "epoch": 50, "lr": 9.852785959315836e-05} +{"train_loss": 0.014521334320306778, "global_step": 5990, "epoch": 50, "lr": 9.852732589396507e-05} +{"train_loss": 0.012426948174834251, "global_step": 5991, "epoch": 50, "lr": 9.852679209949355e-05} +{"train_loss": 0.011199391447007656, "global_step": 5992, "epoch": 50, "lr": 9.852625820974486e-05} +{"train_loss": 0.016310296952724457, "global_step": 5993, "epoch": 50, "lr": 9.852572422472007e-05} +{"train_loss": 0.01889563351869583, "global_step": 5994, "epoch": 50, "lr": 9.852519014442017e-05} +{"train_loss": 0.015062195248901844, "global_step": 5995, "epoch": 50, "lr": 9.852465596884627e-05} +{"train_loss": 0.010150891728699207, "global_step": 5996, "epoch": 50, "lr": 9.852412169799938e-05} +{"train_loss": 0.011796560138463974, "global_step": 5997, "epoch": 50, "lr": 9.852358733188056e-05} +{"train_loss": 0.01188965979963541, "global_step": 5998, "epoch": 50, "lr": 9.852305287049087e-05} +{"train_loss": 0.013085692189633846, "global_step": 5999, "epoch": 50, "lr": 9.852251831383135e-05} +{"train_loss": 0.009894183836877346, "global_step": 6000, "epoch": 50, "lr": 9.852198366190304e-05} +{"train_loss": 0.014429436065256596, "global_step": 6001, "epoch": 50, "lr": 9.8521448914707e-05} +{"train_loss": 0.013538491912186146, "global_step": 6002, "epoch": 50, "lr": 9.852091407224429e-05} +{"train_loss": 0.015008043497800827, "global_step": 6003, "epoch": 50, "lr": 9.852037913451592e-05} +{"train_loss": 0.010828123427927494, "global_step": 6004, "epoch": 50, "lr": 9.8519844101523e-05} +{"train_loss": 0.013441605493426323, "global_step": 6005, "epoch": 50, "lr": 9.851930897326654e-05} +{"train_loss": 0.013676656410098076, "global_step": 6006, "epoch": 50, "lr": 9.851877374974759e-05} +{"train_loss": 0.013101334683597088, "global_step": 6007, "epoch": 50, "lr": 9.851823843096724e-05} +{"train_loss": 0.01726173795759678, "global_step": 6008, "epoch": 50, "lr": 9.851770301692648e-05} +{"train_loss": 0.009891241788864136, "global_step": 6009, "epoch": 50, "lr": 9.85171675076264e-05} +{"train_loss": 0.010942270047962666, "global_step": 6010, "epoch": 50, "lr": 9.851663190306806e-05} +{"train_loss": 0.011946422979235649, "global_step": 6011, "epoch": 50, "lr": 9.851609620325248e-05} +{"train_loss": 0.014649847522377968, "global_step": 6012, "epoch": 50, "lr": 9.851556040818075e-05} +{"train_loss": 0.01693383976817131, "global_step": 6013, "epoch": 50, "lr": 9.851502451785388e-05} +{"train_loss": 0.01009735930711031, "global_step": 6014, "epoch": 50, "lr": 9.851448853227294e-05} +{"train_loss": 0.01193801686167717, "global_step": 6015, "epoch": 50, "lr": 9.851395245143899e-05} +{"train_loss": 0.01535630039870739, "global_step": 6016, "epoch": 50, "lr": 9.851341627535309e-05} +{"train_loss": 0.010510751977562904, "global_step": 6017, "epoch": 50, "lr": 9.851288000401627e-05} +{"train_loss": 0.014690540730953217, "global_step": 6018, "epoch": 50, "lr": 9.85123436374296e-05} +{"train_loss": 0.013307297602295876, "global_step": 6019, "epoch": 50, "lr": 9.851180717559411e-05} +{"train_loss": 0.011724087409675121, "global_step": 6020, "epoch": 50, "lr": 9.851127061851088e-05} +{"train_loss": 0.014655220322310925, "global_step": 6021, "epoch": 50, "lr": 9.851073396618095e-05} +{"train_loss": 0.009396749548614025, "global_step": 6022, "epoch": 50, "lr": 9.851019721860538e-05} +{"train_loss": 0.01159477885812521, "global_step": 6023, "epoch": 50, "lr": 9.850966037578521e-05} +{"train_loss": 0.014282326214015484, "global_step": 6024, "epoch": 50, "lr": 9.850912343772151e-05} +{"train_loss": 0.016856838017702103, "global_step": 6025, "epoch": 50, "lr": 9.850858640441534e-05} +{"train_loss": 0.0185987651348114, "global_step": 6026, "epoch": 50, "lr": 9.850804927586774e-05} +{"train_loss": 0.011004065163433552, "global_step": 6027, "epoch": 50, "lr": 9.850751205207976e-05} +{"train_loss": 0.010116597637534142, "global_step": 6028, "epoch": 50, "lr": 9.850697473305246e-05} +{"train_loss": 0.01468094065785408, "global_step": 6029, "epoch": 50, "lr": 9.85064373187869e-05} +{"train_loss": 0.01525653526186943, "global_step": 6030, "epoch": 50, "lr": 9.850589980928414e-05} +{"train_loss": 0.01281225960701704, "global_step": 6031, "epoch": 50, "lr": 9.850536220454523e-05} +{"train_loss": 0.01178942434489727, "global_step": 6032, "epoch": 50, "lr": 9.850482450457122e-05} +{"train_loss": 0.00898892804980278, "global_step": 6033, "epoch": 50, "lr": 9.850428670936316e-05} +{"train_loss": 0.013072827830910683, "global_step": 6034, "epoch": 50, "lr": 9.850374881892211e-05} +{"train_loss": 0.013056865893304348, "global_step": 6035, "epoch": 50, "lr": 9.850321083324914e-05} +{"train_loss": 0.007939916104078293, "global_step": 6036, "epoch": 50, "lr": 9.85026727523453e-05} +{"train_loss": 0.015414332039654255, "global_step": 6037, "epoch": 50, "lr": 9.850213457621165e-05} +{"train_loss": 0.014261492528021336, "global_step": 6038, "epoch": 50, "lr": 9.850159630484923e-05} +{"train_loss": 0.016167111694812775, "global_step": 6039, "epoch": 50, "lr": 9.85010579382591e-05} +{"train_loss": 0.013538680970668793, "global_step": 6040, "epoch": 50, "lr": 9.850051947644234e-05} +{"train_loss": 0.014584831893444061, "global_step": 6041, "epoch": 50, "lr": 9.849998091939998e-05} +{"train_loss": 0.01388122420758009, "global_step": 6042, "epoch": 50, "lr": 9.84994422671331e-05} +{"train_loss": 0.011358316987752914, "global_step": 6043, "epoch": 50, "lr": 9.849890351964273e-05} +{"train_loss": 0.00806583371013403, "global_step": 6044, "epoch": 50, "lr": 9.849836467692996e-05} +{"train_loss": 0.018001753836870193, "global_step": 6045, "epoch": 50, "lr": 9.849782573899583e-05} +{"train_loss": 0.0111139677464962, "global_step": 6046, "epoch": 50, "lr": 9.84972867058414e-05} +{"train_loss": 0.015869900584220886, "global_step": 6047, "epoch": 50, "lr": 9.849674757746772e-05} +{"train_loss": 0.013176748529076576, "global_step": 6048, "epoch": 50, "lr": 9.849620835387586e-05} +{"train_loss": 0.012719808146357536, "global_step": 6049, "epoch": 50, "lr": 9.849566903506689e-05} +{"train_loss": 0.014884994365274906, "global_step": 6050, "epoch": 50, "lr": 9.849512962104184e-05} +{"train_loss": 0.010763945989310741, "global_step": 6051, "epoch": 50, "lr": 9.849459011180179e-05} +{"train_loss": 0.01440564263612032, "global_step": 6052, "epoch": 50, "lr": 9.849405050734778e-05} +{"train_loss": 0.011299225501716137, "global_step": 6053, "epoch": 50, "lr": 9.84935108076809e-05} +{"train_loss": 0.010062932968139648, "global_step": 6054, "epoch": 50, "lr": 9.849297101280219e-05} +{"train_loss": 0.009881004691123962, "global_step": 6055, "epoch": 50, "lr": 9.849243112271272e-05} +{"train_loss": 0.015180458314716816, "global_step": 6056, "epoch": 50, "lr": 9.849189113741351e-05} +{"train_loss": 0.014512773603200912, "global_step": 6057, "epoch": 50, "lr": 9.849135105690568e-05} +{"train_loss": 0.011255752295255661, "global_step": 6058, "epoch": 50, "lr": 9.849081088119025e-05} +{"train_loss": 0.010833917185664177, "global_step": 6059, "epoch": 50, "lr": 9.84902706102683e-05} +{"train_loss": 0.013661960139870644, "global_step": 6060, "epoch": 50, "lr": 9.848973024414088e-05} +{"train_loss": 0.01244084071367979, "global_step": 6061, "epoch": 50, "lr": 9.848918978280907e-05} +{"train_loss": 0.01198619231581688, "global_step": 6062, "epoch": 50, "lr": 9.848864922627389e-05} +{"train_loss": 0.01558133214712143, "global_step": 6063, "epoch": 50, "lr": 9.848810857453646e-05} +{"train_loss": 0.01632559299468994, "global_step": 6064, "epoch": 50, "lr": 9.848756782759779e-05} +{"train_loss": 0.013420271687209606, "global_step": 6065, "epoch": 50, "lr": 9.848702698545895e-05} +{"train_loss": 0.014587105251848698, "global_step": 6066, "epoch": 50, "lr": 9.848648604812103e-05} +{"train_loss": 0.019433286041021347, "global_step": 6067, "epoch": 50, "lr": 9.848594501558506e-05} +{"train_loss": 0.013518581354693204, "global_step": 6068, "epoch": 50, "lr": 9.848540388785213e-05, "val_loss": 0.020799003541469574, "train_action_mse_error": 0.0007373442640528083} +{"train_loss": 0.012448640540242195, "global_step": 6069, "epoch": 51, "lr": 9.848486266492329e-05} +{"train_loss": 0.012151768431067467, "global_step": 6070, "epoch": 51, "lr": 9.84843213467996e-05} +{"train_loss": 0.010203376412391663, "global_step": 6071, "epoch": 51, "lr": 9.848377993348212e-05} +{"train_loss": 0.00943789817392826, "global_step": 6072, "epoch": 51, "lr": 9.848323842497192e-05} +{"train_loss": 0.009335845708847046, "global_step": 6073, "epoch": 51, "lr": 9.848269682127006e-05} +{"train_loss": 0.017735829576849937, "global_step": 6074, "epoch": 51, "lr": 9.84821551223776e-05} +{"train_loss": 0.015755977481603622, "global_step": 6075, "epoch": 51, "lr": 9.848161332829562e-05} +{"train_loss": 0.020955849438905716, "global_step": 6076, "epoch": 51, "lr": 9.848107143902517e-05} +{"train_loss": 0.010850819759070873, "global_step": 6077, "epoch": 51, "lr": 9.84805294545673e-05} +{"train_loss": 0.010670812800526619, "global_step": 6078, "epoch": 51, "lr": 9.84799873749231e-05} +{"train_loss": 0.0068854377605021, "global_step": 6079, "epoch": 51, "lr": 9.847944520009362e-05} +{"train_loss": 0.009896332398056984, "global_step": 6080, "epoch": 51, "lr": 9.847890293007994e-05} +{"train_loss": 0.020628968253731728, "global_step": 6081, "epoch": 51, "lr": 9.847836056488311e-05} +{"train_loss": 0.013213719241321087, "global_step": 6082, "epoch": 51, "lr": 9.847781810450418e-05} +{"train_loss": 0.011359849944710732, "global_step": 6083, "epoch": 51, "lr": 9.847727554894426e-05} +{"train_loss": 0.015129263512790203, "global_step": 6084, "epoch": 51, "lr": 9.847673289820438e-05} +{"train_loss": 0.014447281137108803, "global_step": 6085, "epoch": 51, "lr": 9.84761901522856e-05} +{"train_loss": 0.010061471723020077, "global_step": 6086, "epoch": 51, "lr": 9.8475647311189e-05} +{"train_loss": 0.015819713473320007, "global_step": 6087, "epoch": 51, "lr": 9.847510437491567e-05} +{"train_loss": 0.018158458173274994, "global_step": 6088, "epoch": 51, "lr": 9.847456134346663e-05} +{"train_loss": 0.009733939543366432, "global_step": 6089, "epoch": 51, "lr": 9.847401821684298e-05} +{"train_loss": 0.011099660769104958, "global_step": 6090, "epoch": 51, "lr": 9.847347499504577e-05} +{"train_loss": 0.014095187187194824, "global_step": 6091, "epoch": 51, "lr": 9.847293167807607e-05} +{"train_loss": 0.01243296917527914, "global_step": 6092, "epoch": 51, "lr": 9.847238826593495e-05} +{"train_loss": 0.014145759865641594, "global_step": 6093, "epoch": 51, "lr": 9.847184475862346e-05} +{"train_loss": 0.01371469721198082, "global_step": 6094, "epoch": 51, "lr": 9.84713011561427e-05} +{"train_loss": 0.012989197857677937, "global_step": 6095, "epoch": 51, "lr": 9.84707574584937e-05} +{"train_loss": 0.013176841661334038, "global_step": 6096, "epoch": 51, "lr": 9.847021366567754e-05} +{"train_loss": 0.010493422858417034, "global_step": 6097, "epoch": 51, "lr": 9.846966977769532e-05} +{"train_loss": 0.012970615178346634, "global_step": 6098, "epoch": 51, "lr": 9.846912579454807e-05} +{"train_loss": 0.01134657021611929, "global_step": 6099, "epoch": 51, "lr": 9.846858171623687e-05} +{"train_loss": 0.019094595685601234, "global_step": 6100, "epoch": 51, "lr": 9.84680375427628e-05} +{"train_loss": 0.014920872636139393, "global_step": 6101, "epoch": 51, "lr": 9.84674932741269e-05} +{"train_loss": 0.0119865033775568, "global_step": 6102, "epoch": 51, "lr": 9.846694891033026e-05} +{"train_loss": 0.007775886915624142, "global_step": 6103, "epoch": 51, "lr": 9.846640445137394e-05} +{"train_loss": 0.0118181137368083, "global_step": 6104, "epoch": 51, "lr": 9.846585989725902e-05} +{"train_loss": 0.012193954549729824, "global_step": 6105, "epoch": 51, "lr": 9.846531524798656e-05} +{"train_loss": 0.009845500811934471, "global_step": 6106, "epoch": 51, "lr": 9.846477050355763e-05} +{"train_loss": 0.01251622661948204, "global_step": 6107, "epoch": 51, "lr": 9.846422566397329e-05} +{"train_loss": 0.01523102167993784, "global_step": 6108, "epoch": 51, "lr": 9.846368072923464e-05} +{"train_loss": 0.014240529388189316, "global_step": 6109, "epoch": 51, "lr": 9.846313569934271e-05} +{"train_loss": 0.013597768731415272, "global_step": 6110, "epoch": 51, "lr": 9.84625905742986e-05} +{"train_loss": 0.014520220458507538, "global_step": 6111, "epoch": 51, "lr": 9.846204535410339e-05} +{"train_loss": 0.013900760561227798, "global_step": 6112, "epoch": 51, "lr": 9.846150003875811e-05} +{"train_loss": 0.011863398365676403, "global_step": 6113, "epoch": 51, "lr": 9.846095462826385e-05} +{"train_loss": 0.015903135761618614, "global_step": 6114, "epoch": 51, "lr": 9.846040912262169e-05} +{"train_loss": 0.013697062619030476, "global_step": 6115, "epoch": 51, "lr": 9.84598635218327e-05} +{"train_loss": 0.012001139111816883, "global_step": 6116, "epoch": 51, "lr": 9.845931782589794e-05} +{"train_loss": 0.009867265820503235, "global_step": 6117, "epoch": 51, "lr": 9.845877203481848e-05} +{"train_loss": 0.019999483600258827, "global_step": 6118, "epoch": 51, "lr": 9.84582261485954e-05} +{"train_loss": 0.011387280188500881, "global_step": 6119, "epoch": 51, "lr": 9.845768016722979e-05} +{"train_loss": 0.012913051061332226, "global_step": 6120, "epoch": 51, "lr": 9.845713409072267e-05} +{"train_loss": 0.011461271904408932, "global_step": 6121, "epoch": 51, "lr": 9.845658791907515e-05} +{"train_loss": 0.012145069427788258, "global_step": 6122, "epoch": 51, "lr": 9.845604165228832e-05} +{"train_loss": 0.013400363735854626, "global_step": 6123, "epoch": 51, "lr": 9.845549529036321e-05} +{"train_loss": 0.0177360400557518, "global_step": 6124, "epoch": 51, "lr": 9.845494883330091e-05} +{"train_loss": 0.01148574985563755, "global_step": 6125, "epoch": 51, "lr": 9.84544022811025e-05} +{"train_loss": 0.009464869275689125, "global_step": 6126, "epoch": 51, "lr": 9.845385563376905e-05} +{"train_loss": 0.012452898547053337, "global_step": 6127, "epoch": 51, "lr": 9.845330889130163e-05} +{"train_loss": 0.012524438090622425, "global_step": 6128, "epoch": 51, "lr": 9.845276205370131e-05} +{"train_loss": 0.014141839928925037, "global_step": 6129, "epoch": 51, "lr": 9.845221512096919e-05} +{"train_loss": 0.015939241275191307, "global_step": 6130, "epoch": 51, "lr": 9.845166809310629e-05} +{"train_loss": 0.014142843894660473, "global_step": 6131, "epoch": 51, "lr": 9.845112097011372e-05} +{"train_loss": 0.019142601639032364, "global_step": 6132, "epoch": 51, "lr": 9.845057375199257e-05} +{"train_loss": 0.012792023830115795, "global_step": 6133, "epoch": 51, "lr": 9.845002643874388e-05} +{"train_loss": 0.015210856683552265, "global_step": 6134, "epoch": 51, "lr": 9.844947903036874e-05} +{"train_loss": 0.016629738733172417, "global_step": 6135, "epoch": 51, "lr": 9.844893152686823e-05} +{"train_loss": 0.009030740708112717, "global_step": 6136, "epoch": 51, "lr": 9.844838392824342e-05} +{"train_loss": 0.019577065482735634, "global_step": 6137, "epoch": 51, "lr": 9.844783623449539e-05} +{"train_loss": 0.011126684956252575, "global_step": 6138, "epoch": 51, "lr": 9.84472884456252e-05} +{"train_loss": 0.01719137467443943, "global_step": 6139, "epoch": 51, "lr": 9.844674056163393e-05} +{"train_loss": 0.010063900612294674, "global_step": 6140, "epoch": 51, "lr": 9.844619258252267e-05} +{"train_loss": 0.01814206689596176, "global_step": 6141, "epoch": 51, "lr": 9.844564450829248e-05} +{"train_loss": 0.011430907063186169, "global_step": 6142, "epoch": 51, "lr": 9.844509633894444e-05} +{"train_loss": 0.01360243372619152, "global_step": 6143, "epoch": 51, "lr": 9.844454807447963e-05} +{"train_loss": 0.011534016579389572, "global_step": 6144, "epoch": 51, "lr": 9.844399971489914e-05} +{"train_loss": 0.011086156591773033, "global_step": 6145, "epoch": 51, "lr": 9.844345126020403e-05} +{"train_loss": 0.015423666685819626, "global_step": 6146, "epoch": 51, "lr": 9.844290271039536e-05} +{"train_loss": 0.010184429585933685, "global_step": 6147, "epoch": 51, "lr": 9.844235406547424e-05} +{"train_loss": 0.012808619067072868, "global_step": 6148, "epoch": 51, "lr": 9.844180532544172e-05} +{"train_loss": 0.012450648471713066, "global_step": 6149, "epoch": 51, "lr": 9.84412564902989e-05} +{"train_loss": 0.014683039858937263, "global_step": 6150, "epoch": 51, "lr": 9.844070756004685e-05} +{"train_loss": 0.012495147995650768, "global_step": 6151, "epoch": 51, "lr": 9.844015853468664e-05} +{"train_loss": 0.014222773723304272, "global_step": 6152, "epoch": 51, "lr": 9.843960941421938e-05} +{"train_loss": 0.009385133162140846, "global_step": 6153, "epoch": 51, "lr": 9.843906019864609e-05} +{"train_loss": 0.01661449298262596, "global_step": 6154, "epoch": 51, "lr": 9.843851088796788e-05} +{"train_loss": 0.015212136320769787, "global_step": 6155, "epoch": 51, "lr": 9.843796148218585e-05} +{"train_loss": 0.016114257276058197, "global_step": 6156, "epoch": 51, "lr": 9.843741198130104e-05} +{"train_loss": 0.013161974959075451, "global_step": 6157, "epoch": 51, "lr": 9.843686238531456e-05} +{"train_loss": 0.016373954713344574, "global_step": 6158, "epoch": 51, "lr": 9.843631269422746e-05} +{"train_loss": 0.015212517231702805, "global_step": 6159, "epoch": 51, "lr": 9.843576290804083e-05} +{"train_loss": 0.01497283112257719, "global_step": 6160, "epoch": 51, "lr": 9.843521302675578e-05} +{"train_loss": 0.012155777774751186, "global_step": 6161, "epoch": 51, "lr": 9.843466305037334e-05} +{"train_loss": 0.012794007547199726, "global_step": 6162, "epoch": 51, "lr": 9.843411297889463e-05} +{"train_loss": 0.012697873637080193, "global_step": 6163, "epoch": 51, "lr": 9.84335628123207e-05} +{"train_loss": 0.012494167312979698, "global_step": 6164, "epoch": 51, "lr": 9.843301255065265e-05} +{"train_loss": 0.01332014985382557, "global_step": 6165, "epoch": 51, "lr": 9.843246219389157e-05} +{"train_loss": 0.014722980558872223, "global_step": 6166, "epoch": 51, "lr": 9.843191174203851e-05} +{"train_loss": 0.012076840735971928, "global_step": 6167, "epoch": 51, "lr": 9.843136119509457e-05} +{"train_loss": 0.011267449706792831, "global_step": 6168, "epoch": 51, "lr": 9.843081055306082e-05} +{"train_loss": 0.01922234334051609, "global_step": 6169, "epoch": 51, "lr": 9.843025981593834e-05} +{"train_loss": 0.011811125092208385, "global_step": 6170, "epoch": 51, "lr": 9.842970898372823e-05} +{"train_loss": 0.0146992402151227, "global_step": 6171, "epoch": 51, "lr": 9.842915805643155e-05} +{"train_loss": 0.011967884376645088, "global_step": 6172, "epoch": 51, "lr": 9.842860703404941e-05} +{"train_loss": 0.015770548954606056, "global_step": 6173, "epoch": 51, "lr": 9.842805591658286e-05} +{"train_loss": 0.009467457421123981, "global_step": 6174, "epoch": 51, "lr": 9.842750470403301e-05} +{"train_loss": 0.014940913766622543, "global_step": 6175, "epoch": 51, "lr": 9.842695339640091e-05} +{"train_loss": 0.016947168856859207, "global_step": 6176, "epoch": 51, "lr": 9.842640199368768e-05} +{"train_loss": 0.012174393981695175, "global_step": 6177, "epoch": 51, "lr": 9.842585049589437e-05} +{"train_loss": 0.01945791207253933, "global_step": 6178, "epoch": 51, "lr": 9.842529890302208e-05} +{"train_loss": 0.012394175864756107, "global_step": 6179, "epoch": 51, "lr": 9.842474721507189e-05} +{"train_loss": 0.015325655229389668, "global_step": 6180, "epoch": 51, "lr": 9.842419543204487e-05} +{"train_loss": 0.01238841749727726, "global_step": 6181, "epoch": 51, "lr": 9.842364355394214e-05} +{"train_loss": 0.018069278448820114, "global_step": 6182, "epoch": 51, "lr": 9.842309158076474e-05} +{"train_loss": 0.011094914749264717, "global_step": 6183, "epoch": 51, "lr": 9.842253951251378e-05} +{"train_loss": 0.013278139755129814, "global_step": 6184, "epoch": 51, "lr": 9.842198734919032e-05} +{"train_loss": 0.01512750331312418, "global_step": 6185, "epoch": 51, "lr": 9.842143509079549e-05} +{"train_loss": 0.01736803911626339, "global_step": 6186, "epoch": 51, "lr": 9.842088273733032e-05} +{"train_loss": 0.013513580782479849, "global_step": 6187, "epoch": 51, "lr": 9.842033028879594e-05, "val_loss": 0.014004286378622055} +{"train_loss": 0.013733966276049614, "global_step": 6188, "epoch": 52, "lr": 9.84197777451934e-05} +{"train_loss": 0.016908083111047745, "global_step": 6189, "epoch": 52, "lr": 9.841922510652382e-05} +{"train_loss": 0.012439805082976818, "global_step": 6190, "epoch": 52, "lr": 9.841867237278823e-05} +{"train_loss": 0.020359359681606293, "global_step": 6191, "epoch": 52, "lr": 9.841811954398779e-05} +{"train_loss": 0.012561453506350517, "global_step": 6192, "epoch": 52, "lr": 9.841756662012352e-05} +{"train_loss": 0.019410070031881332, "global_step": 6193, "epoch": 52, "lr": 9.841701360119653e-05} +{"train_loss": 0.018540693446993828, "global_step": 6194, "epoch": 52, "lr": 9.841646048720791e-05} +{"train_loss": 0.013325583189725876, "global_step": 6195, "epoch": 52, "lr": 9.841590727815874e-05} +{"train_loss": 0.018033761531114578, "global_step": 6196, "epoch": 52, "lr": 9.84153539740501e-05} +{"train_loss": 0.01222783699631691, "global_step": 6197, "epoch": 52, "lr": 9.84148005748831e-05} +{"train_loss": 0.016381194815039635, "global_step": 6198, "epoch": 52, "lr": 9.841424708065881e-05} +{"train_loss": 0.016757406294345856, "global_step": 6199, "epoch": 52, "lr": 9.841369349137832e-05} +{"train_loss": 0.02019142359495163, "global_step": 6200, "epoch": 52, "lr": 9.841313980704271e-05} +{"train_loss": 0.013092691078782082, "global_step": 6201, "epoch": 52, "lr": 9.841258602765307e-05} +{"train_loss": 0.018610835075378418, "global_step": 6202, "epoch": 52, "lr": 9.841203215321049e-05} +{"train_loss": 0.020570585504174232, "global_step": 6203, "epoch": 52, "lr": 9.841147818371607e-05} +{"train_loss": 0.011793664656579494, "global_step": 6204, "epoch": 52, "lr": 9.841092411917088e-05} +{"train_loss": 0.01996329054236412, "global_step": 6205, "epoch": 52, "lr": 9.8410369959576e-05} +{"train_loss": 0.015427064150571823, "global_step": 6206, "epoch": 52, "lr": 9.840981570493253e-05} +{"train_loss": 0.018493756651878357, "global_step": 6207, "epoch": 52, "lr": 9.840926135524158e-05} +{"train_loss": 0.0108745526522398, "global_step": 6208, "epoch": 52, "lr": 9.840870691050418e-05} +{"train_loss": 0.016913753002882004, "global_step": 6209, "epoch": 52, "lr": 9.840815237072149e-05} +{"train_loss": 0.012789861299097538, "global_step": 6210, "epoch": 52, "lr": 9.840759773589456e-05} +{"train_loss": 0.013036017306149006, "global_step": 6211, "epoch": 52, "lr": 9.840704300602448e-05} +{"train_loss": 0.016385825350880623, "global_step": 6212, "epoch": 52, "lr": 9.840648818111234e-05} +{"train_loss": 0.020657189190387726, "global_step": 6213, "epoch": 52, "lr": 9.840593326115922e-05} +{"train_loss": 0.01252327486872673, "global_step": 6214, "epoch": 52, "lr": 9.840537824616623e-05} +{"train_loss": 0.007857323624193668, "global_step": 6215, "epoch": 52, "lr": 9.840482313613446e-05} +{"train_loss": 0.017260808497667313, "global_step": 6216, "epoch": 52, "lr": 9.840426793106499e-05} +{"train_loss": 0.01225199829787016, "global_step": 6217, "epoch": 52, "lr": 9.84037126309589e-05} +{"train_loss": 0.010955051518976688, "global_step": 6218, "epoch": 52, "lr": 9.84031572358173e-05} +{"train_loss": 0.013297623954713345, "global_step": 6219, "epoch": 52, "lr": 9.840260174564127e-05} +{"train_loss": 0.012573013082146645, "global_step": 6220, "epoch": 52, "lr": 9.840204616043189e-05} +{"train_loss": 0.010866323485970497, "global_step": 6221, "epoch": 52, "lr": 9.840149048019028e-05} +{"train_loss": 0.01359399501234293, "global_step": 6222, "epoch": 52, "lr": 9.840093470491752e-05} +{"train_loss": 0.01743795908987522, "global_step": 6223, "epoch": 52, "lr": 9.840037883461469e-05} +{"train_loss": 0.010161049664020538, "global_step": 6224, "epoch": 52, "lr": 9.839982286928286e-05} +{"train_loss": 0.012470105662941933, "global_step": 6225, "epoch": 52, "lr": 9.839926680892317e-05} +{"train_loss": 0.011900250799953938, "global_step": 6226, "epoch": 52, "lr": 9.83987106535367e-05} +{"train_loss": 0.011406979523599148, "global_step": 6227, "epoch": 52, "lr": 9.839815440312452e-05} +{"train_loss": 0.00971738900989294, "global_step": 6228, "epoch": 52, "lr": 9.839759805768774e-05} +{"train_loss": 0.014445915818214417, "global_step": 6229, "epoch": 52, "lr": 9.839704161722745e-05} +{"train_loss": 0.011089683510363102, "global_step": 6230, "epoch": 52, "lr": 9.839648508174472e-05} +{"train_loss": 0.015727557241916656, "global_step": 6231, "epoch": 52, "lr": 9.839592845124068e-05} +{"train_loss": 0.01080601941794157, "global_step": 6232, "epoch": 52, "lr": 9.83953717257164e-05} +{"train_loss": 0.017208557575941086, "global_step": 6233, "epoch": 52, "lr": 9.839481490517298e-05} +{"train_loss": 0.008247505873441696, "global_step": 6234, "epoch": 52, "lr": 9.839425798961152e-05} +{"train_loss": 0.012221326120197773, "global_step": 6235, "epoch": 52, "lr": 9.839370097903308e-05} +{"train_loss": 0.011145086027681828, "global_step": 6236, "epoch": 52, "lr": 9.83931438734388e-05} +{"train_loss": 0.013541844673454762, "global_step": 6237, "epoch": 52, "lr": 9.839258667282974e-05} +{"train_loss": 0.008787578903138638, "global_step": 6238, "epoch": 52, "lr": 9.839202937720702e-05} +{"train_loss": 0.01549385953694582, "global_step": 6239, "epoch": 52, "lr": 9.839147198657171e-05} +{"train_loss": 0.0101451575756073, "global_step": 6240, "epoch": 52, "lr": 9.839091450092491e-05} +{"train_loss": 0.010026361793279648, "global_step": 6241, "epoch": 52, "lr": 9.839035692026773e-05} +{"train_loss": 0.017629524692893028, "global_step": 6242, "epoch": 52, "lr": 9.838979924460124e-05} +{"train_loss": 0.012109548784792423, "global_step": 6243, "epoch": 52, "lr": 9.838924147392656e-05} +{"train_loss": 0.015705350786447525, "global_step": 6244, "epoch": 52, "lr": 9.838868360824477e-05} +{"train_loss": 0.011544028297066689, "global_step": 6245, "epoch": 52, "lr": 9.838812564755697e-05} +{"train_loss": 0.0112569909542799, "global_step": 6246, "epoch": 52, "lr": 9.838756759186425e-05} +{"train_loss": 0.011928758583962917, "global_step": 6247, "epoch": 52, "lr": 9.838700944116771e-05} +{"train_loss": 0.01545059122145176, "global_step": 6248, "epoch": 52, "lr": 9.838645119546847e-05} +{"train_loss": 0.012223177589476109, "global_step": 6249, "epoch": 52, "lr": 9.838589285476758e-05} +{"train_loss": 0.010739685036242008, "global_step": 6250, "epoch": 52, "lr": 9.838533441906617e-05} +{"train_loss": 0.010081363841891289, "global_step": 6251, "epoch": 52, "lr": 9.838477588836531e-05} +{"train_loss": 0.012200447730720043, "global_step": 6252, "epoch": 52, "lr": 9.838421726266612e-05} +{"train_loss": 0.011531771160662174, "global_step": 6253, "epoch": 52, "lr": 9.838365854196969e-05} +{"train_loss": 0.017277423292398453, "global_step": 6254, "epoch": 52, "lr": 9.83830997262771e-05} +{"train_loss": 0.010841947048902512, "global_step": 6255, "epoch": 52, "lr": 9.838254081558949e-05} +{"train_loss": 0.01599913090467453, "global_step": 6256, "epoch": 52, "lr": 9.838198180990792e-05} +{"train_loss": 0.011722940020263195, "global_step": 6257, "epoch": 52, "lr": 9.83814227092335e-05} +{"train_loss": 0.016297049820423126, "global_step": 6258, "epoch": 52, "lr": 9.838086351356731e-05} +{"train_loss": 0.013178455643355846, "global_step": 6259, "epoch": 52, "lr": 9.838030422291047e-05} +{"train_loss": 0.009643387980759144, "global_step": 6260, "epoch": 52, "lr": 9.837974483726408e-05} +{"train_loss": 0.011386933736503124, "global_step": 6261, "epoch": 52, "lr": 9.837918535662922e-05} +{"train_loss": 0.01108027808368206, "global_step": 6262, "epoch": 52, "lr": 9.837862578100701e-05} +{"train_loss": 0.013459749519824982, "global_step": 6263, "epoch": 52, "lr": 9.837806611039853e-05} +{"train_loss": 0.013902314007282257, "global_step": 6264, "epoch": 52, "lr": 9.837750634480487e-05} +{"train_loss": 0.011000584810972214, "global_step": 6265, "epoch": 52, "lr": 9.837694648422716e-05} +{"train_loss": 0.013350207358598709, "global_step": 6266, "epoch": 52, "lr": 9.837638652866649e-05} +{"train_loss": 0.013095232658088207, "global_step": 6267, "epoch": 52, "lr": 9.837582647812394e-05} +{"train_loss": 0.012503473088145256, "global_step": 6268, "epoch": 52, "lr": 9.837526633260063e-05} +{"train_loss": 0.013136387802660465, "global_step": 6269, "epoch": 52, "lr": 9.837470609209765e-05} +{"train_loss": 0.014914649538695812, "global_step": 6270, "epoch": 52, "lr": 9.83741457566161e-05} +{"train_loss": 0.017962897196412086, "global_step": 6271, "epoch": 52, "lr": 9.83735853261571e-05} +{"train_loss": 0.015222663059830666, "global_step": 6272, "epoch": 52, "lr": 9.837302480072171e-05} +{"train_loss": 0.01384520810097456, "global_step": 6273, "epoch": 52, "lr": 9.837246418031108e-05} +{"train_loss": 0.014170002192258835, "global_step": 6274, "epoch": 52, "lr": 9.837190346492627e-05} +{"train_loss": 0.013510020449757576, "global_step": 6275, "epoch": 52, "lr": 9.837134265456837e-05} +{"train_loss": 0.018268590793013573, "global_step": 6276, "epoch": 52, "lr": 9.837078174923854e-05} +{"train_loss": 0.011379140429198742, "global_step": 6277, "epoch": 52, "lr": 9.837022074893784e-05} +{"train_loss": 0.016936160624027252, "global_step": 6278, "epoch": 52, "lr": 9.836965965366738e-05} +{"train_loss": 0.010260484181344509, "global_step": 6279, "epoch": 52, "lr": 9.836909846342825e-05} +{"train_loss": 0.013958689756691456, "global_step": 6280, "epoch": 52, "lr": 9.836853717822157e-05} +{"train_loss": 0.011473941616714, "global_step": 6281, "epoch": 52, "lr": 9.836797579804844e-05} +{"train_loss": 0.010795651003718376, "global_step": 6282, "epoch": 52, "lr": 9.836741432290994e-05} +{"train_loss": 0.012130704708397388, "global_step": 6283, "epoch": 52, "lr": 9.836685275280721e-05} +{"train_loss": 0.015104242600500584, "global_step": 6284, "epoch": 52, "lr": 9.836629108774133e-05} +{"train_loss": 0.014146448113024235, "global_step": 6285, "epoch": 52, "lr": 9.83657293277134e-05} +{"train_loss": 0.012770033441483974, "global_step": 6286, "epoch": 52, "lr": 9.836516747272452e-05} +{"train_loss": 0.009405704215168953, "global_step": 6287, "epoch": 52, "lr": 9.83646055227758e-05} +{"train_loss": 0.013257178477942944, "global_step": 6288, "epoch": 52, "lr": 9.836404347786835e-05} +{"train_loss": 0.013098685070872307, "global_step": 6289, "epoch": 52, "lr": 9.836348133800328e-05} +{"train_loss": 0.01532209012657404, "global_step": 6290, "epoch": 52, "lr": 9.836291910318166e-05} +{"train_loss": 0.014136905781924725, "global_step": 6291, "epoch": 52, "lr": 9.836235677340462e-05} +{"train_loss": 0.017436092719435692, "global_step": 6292, "epoch": 52, "lr": 9.836179434867328e-05} +{"train_loss": 0.013451342470943928, "global_step": 6293, "epoch": 52, "lr": 9.83612318289887e-05} +{"train_loss": 0.009762566536664963, "global_step": 6294, "epoch": 52, "lr": 9.836066921435201e-05} +{"train_loss": 0.009478467516601086, "global_step": 6295, "epoch": 52, "lr": 9.836010650476432e-05} +{"train_loss": 0.015925507992506027, "global_step": 6296, "epoch": 52, "lr": 9.835954370022672e-05} +{"train_loss": 0.010622463189065456, "global_step": 6297, "epoch": 52, "lr": 9.835898080074033e-05} +{"train_loss": 0.012524639256298542, "global_step": 6298, "epoch": 52, "lr": 9.835841780630624e-05} +{"train_loss": 0.013734669424593449, "global_step": 6299, "epoch": 52, "lr": 9.835785471692558e-05} +{"train_loss": 0.02294222265481949, "global_step": 6300, "epoch": 52, "lr": 9.835729153259942e-05} +{"train_loss": 0.011343556456267834, "global_step": 6301, "epoch": 52, "lr": 9.835672825332889e-05} +{"train_loss": 0.01967793144285679, "global_step": 6302, "epoch": 52, "lr": 9.83561648791151e-05} +{"train_loss": 0.01643826812505722, "global_step": 6303, "epoch": 52, "lr": 9.835560140995912e-05} +{"train_loss": 0.010513843037188053, "global_step": 6304, "epoch": 52, "lr": 9.835503784586211e-05} +{"train_loss": 0.020018775016069412, "global_step": 6305, "epoch": 52, "lr": 9.835447418682513e-05} +{"train_loss": 0.013823093541216951, "global_step": 6306, "epoch": 52, "lr": 9.835391043284932e-05, "val_loss": 0.021226953715085983} +{"train_loss": 0.012008370831608772, "global_step": 6307, "epoch": 53, "lr": 9.835334658393577e-05} +{"train_loss": 0.013636457733809948, "global_step": 6308, "epoch": 53, "lr": 9.835278264008559e-05} +{"train_loss": 0.015218449756503105, "global_step": 6309, "epoch": 53, "lr": 9.835221860129989e-05} +{"train_loss": 0.01417433563619852, "global_step": 6310, "epoch": 53, "lr": 9.835165446757976e-05} +{"train_loss": 0.010913818143308163, "global_step": 6311, "epoch": 53, "lr": 9.835109023892632e-05} +{"train_loss": 0.016194073483347893, "global_step": 6312, "epoch": 53, "lr": 9.83505259153407e-05} +{"train_loss": 0.012010408565402031, "global_step": 6313, "epoch": 53, "lr": 9.834996149682399e-05} +{"train_loss": 0.013059567660093307, "global_step": 6314, "epoch": 53, "lr": 9.834939698337727e-05} +{"train_loss": 0.016418281942605972, "global_step": 6315, "epoch": 53, "lr": 9.83488323750017e-05} +{"train_loss": 0.014798296615481377, "global_step": 6316, "epoch": 53, "lr": 9.834826767169835e-05} +{"train_loss": 0.014292525127530098, "global_step": 6317, "epoch": 53, "lr": 9.834770287346834e-05} +{"train_loss": 0.013595650903880596, "global_step": 6318, "epoch": 53, "lr": 9.834713798031279e-05} +{"train_loss": 0.019379403442144394, "global_step": 6319, "epoch": 53, "lr": 9.834657299223279e-05} +{"train_loss": 0.008893809281289577, "global_step": 6320, "epoch": 53, "lr": 9.834600790922945e-05} +{"train_loss": 0.015054626390337944, "global_step": 6321, "epoch": 53, "lr": 9.834544273130391e-05} +{"train_loss": 0.014158813282847404, "global_step": 6322, "epoch": 53, "lr": 9.834487745845726e-05} +{"train_loss": 0.013241116888821125, "global_step": 6323, "epoch": 53, "lr": 9.834431209069059e-05} +{"train_loss": 0.01313877385109663, "global_step": 6324, "epoch": 53, "lr": 9.834374662800503e-05} +{"train_loss": 0.007953444495797157, "global_step": 6325, "epoch": 53, "lr": 9.83431810704017e-05} +{"train_loss": 0.011425619944930077, "global_step": 6326, "epoch": 53, "lr": 9.83426154178817e-05} +{"train_loss": 0.013733914121985435, "global_step": 6327, "epoch": 53, "lr": 9.834204967044613e-05} +{"train_loss": 0.015184839256107807, "global_step": 6328, "epoch": 53, "lr": 9.83414838280961e-05} +{"train_loss": 0.01710951142013073, "global_step": 6329, "epoch": 53, "lr": 9.834091789083276e-05} +{"train_loss": 0.015776678919792175, "global_step": 6330, "epoch": 53, "lr": 9.834035185865716e-05} +{"train_loss": 0.018634065985679626, "global_step": 6331, "epoch": 53, "lr": 9.833978573157046e-05} +{"train_loss": 0.013091628439724445, "global_step": 6332, "epoch": 53, "lr": 9.833921950957375e-05} +{"train_loss": 0.011896989308297634, "global_step": 6333, "epoch": 53, "lr": 9.833865319266815e-05} +{"train_loss": 0.013960707001388073, "global_step": 6334, "epoch": 53, "lr": 9.833808678085477e-05} +{"train_loss": 0.01434013806283474, "global_step": 6335, "epoch": 53, "lr": 9.833752027413472e-05} +{"train_loss": 0.017282726243138313, "global_step": 6336, "epoch": 53, "lr": 9.833695367250912e-05} +{"train_loss": 0.012229605577886105, "global_step": 6337, "epoch": 53, "lr": 9.833638697597907e-05} +{"train_loss": 0.013383457437157631, "global_step": 6338, "epoch": 53, "lr": 9.833582018454567e-05} +{"train_loss": 0.013272088952362537, "global_step": 6339, "epoch": 53, "lr": 9.833525329821007e-05} +{"train_loss": 0.0143271554261446, "global_step": 6340, "epoch": 53, "lr": 9.833468631697337e-05} +{"train_loss": 0.015024092048406601, "global_step": 6341, "epoch": 53, "lr": 9.833411924083667e-05} +{"train_loss": 0.014776164665818214, "global_step": 6342, "epoch": 53, "lr": 9.833355206980108e-05} +{"train_loss": 0.016926810145378113, "global_step": 6343, "epoch": 53, "lr": 9.833298480386775e-05} +{"train_loss": 0.012540722265839577, "global_step": 6344, "epoch": 53, "lr": 9.833241744303774e-05} +{"train_loss": 0.01736467517912388, "global_step": 6345, "epoch": 53, "lr": 9.83318499873122e-05} +{"train_loss": 0.012093625031411648, "global_step": 6346, "epoch": 53, "lr": 9.833128243669226e-05} +{"train_loss": 0.009563799947500229, "global_step": 6347, "epoch": 53, "lr": 9.833071479117898e-05} +{"train_loss": 0.017369654029607773, "global_step": 6348, "epoch": 53, "lr": 9.833014705077351e-05} +{"train_loss": 0.019149798899888992, "global_step": 6349, "epoch": 53, "lr": 9.832957921547696e-05} +{"train_loss": 0.011122825555503368, "global_step": 6350, "epoch": 53, "lr": 9.832901128529046e-05} +{"train_loss": 0.016764987260103226, "global_step": 6351, "epoch": 53, "lr": 9.832844326021508e-05} +{"train_loss": 0.01858505606651306, "global_step": 6352, "epoch": 53, "lr": 9.8327875140252e-05} +{"train_loss": 0.017302582040429115, "global_step": 6353, "epoch": 53, "lr": 9.832730692540228e-05} +{"train_loss": 0.01780565455555916, "global_step": 6354, "epoch": 53, "lr": 9.832673861566706e-05} +{"train_loss": 0.009332532063126564, "global_step": 6355, "epoch": 53, "lr": 9.832617021104745e-05} +{"train_loss": 0.011144890449941158, "global_step": 6356, "epoch": 53, "lr": 9.832560171154457e-05} +{"train_loss": 0.017614562064409256, "global_step": 6357, "epoch": 53, "lr": 9.832503311715953e-05} +{"train_loss": 0.016748636960983276, "global_step": 6358, "epoch": 53, "lr": 9.832446442789344e-05} +{"train_loss": 0.014630348421633244, "global_step": 6359, "epoch": 53, "lr": 9.832389564374745e-05} +{"train_loss": 0.014196460135281086, "global_step": 6360, "epoch": 53, "lr": 9.832332676472265e-05} +{"train_loss": 0.012797165662050247, "global_step": 6361, "epoch": 53, "lr": 9.832275779082014e-05} +{"train_loss": 0.014201872050762177, "global_step": 6362, "epoch": 53, "lr": 9.832218872204109e-05} +{"train_loss": 0.017831481993198395, "global_step": 6363, "epoch": 53, "lr": 9.832161955838655e-05} +{"train_loss": 0.015138709917664528, "global_step": 6364, "epoch": 53, "lr": 9.83210502998577e-05} +{"train_loss": 0.017377622425556183, "global_step": 6365, "epoch": 53, "lr": 9.83204809464556e-05} +{"train_loss": 0.0164346843957901, "global_step": 6366, "epoch": 53, "lr": 9.831991149818142e-05} +{"train_loss": 0.010499754920601845, "global_step": 6367, "epoch": 53, "lr": 9.831934195503627e-05} +{"train_loss": 0.014643835835158825, "global_step": 6368, "epoch": 53, "lr": 9.831877231702122e-05} +{"train_loss": 0.01325553935021162, "global_step": 6369, "epoch": 53, "lr": 9.831820258413744e-05} +{"train_loss": 0.02302704192698002, "global_step": 6370, "epoch": 53, "lr": 9.831763275638604e-05} +{"train_loss": 0.011099737137556076, "global_step": 6371, "epoch": 53, "lr": 9.831706283376811e-05} +{"train_loss": 0.01812012866139412, "global_step": 6372, "epoch": 53, "lr": 9.831649281628481e-05} +{"train_loss": 0.01318978238850832, "global_step": 6373, "epoch": 53, "lr": 9.831592270393723e-05} +{"train_loss": 0.015141201205551624, "global_step": 6374, "epoch": 53, "lr": 9.831535249672649e-05} +{"train_loss": 0.010317414999008179, "global_step": 6375, "epoch": 53, "lr": 9.831478219465373e-05} +{"train_loss": 0.016799014061689377, "global_step": 6376, "epoch": 53, "lr": 9.831421179772005e-05} +{"train_loss": 0.01465457770973444, "global_step": 6377, "epoch": 53, "lr": 9.831364130592657e-05} +{"train_loss": 0.015034976415336132, "global_step": 6378, "epoch": 53, "lr": 9.831307071927442e-05} +{"train_loss": 0.010496987961232662, "global_step": 6379, "epoch": 53, "lr": 9.831250003776474e-05} +{"train_loss": 0.012763453647494316, "global_step": 6380, "epoch": 53, "lr": 9.83119292613986e-05} +{"train_loss": 0.013194490224123001, "global_step": 6381, "epoch": 53, "lr": 9.831135839017716e-05} +{"train_loss": 0.012019469402730465, "global_step": 6382, "epoch": 53, "lr": 9.831078742410151e-05} +{"train_loss": 0.01952524110674858, "global_step": 6383, "epoch": 53, "lr": 9.831021636317282e-05} +{"train_loss": 0.011159788817167282, "global_step": 6384, "epoch": 53, "lr": 9.830964520739216e-05} +{"train_loss": 0.009319735690951347, "global_step": 6385, "epoch": 53, "lr": 9.830907395676067e-05} +{"train_loss": 0.013333204202353954, "global_step": 6386, "epoch": 53, "lr": 9.830850261127948e-05} +{"train_loss": 0.01297850999981165, "global_step": 6387, "epoch": 53, "lr": 9.830793117094972e-05} +{"train_loss": 0.014559872448444366, "global_step": 6388, "epoch": 53, "lr": 9.830735963577249e-05} +{"train_loss": 0.010255645960569382, "global_step": 6389, "epoch": 53, "lr": 9.830678800574891e-05} +{"train_loss": 0.011571763083338737, "global_step": 6390, "epoch": 53, "lr": 9.830621628088013e-05} +{"train_loss": 0.012981685809791088, "global_step": 6391, "epoch": 53, "lr": 9.830564446116724e-05} +{"train_loss": 0.009669801220297813, "global_step": 6392, "epoch": 53, "lr": 9.830507254661139e-05} +{"train_loss": 0.014660285785794258, "global_step": 6393, "epoch": 53, "lr": 9.830450053721369e-05} +{"train_loss": 0.01650770753622055, "global_step": 6394, "epoch": 53, "lr": 9.830392843297525e-05} +{"train_loss": 0.01347741112112999, "global_step": 6395, "epoch": 53, "lr": 9.830335623389721e-05} +{"train_loss": 0.018564239144325256, "global_step": 6396, "epoch": 53, "lr": 9.83027839399807e-05} +{"train_loss": 0.017463931813836098, "global_step": 6397, "epoch": 53, "lr": 9.830221155122684e-05} +{"train_loss": 0.011160566471517086, "global_step": 6398, "epoch": 53, "lr": 9.830163906763673e-05} +{"train_loss": 0.00829855352640152, "global_step": 6399, "epoch": 53, "lr": 9.830106648921151e-05} +{"train_loss": 0.010192754678428173, "global_step": 6400, "epoch": 53, "lr": 9.830049381595233e-05} +{"train_loss": 0.012923735193908215, "global_step": 6401, "epoch": 53, "lr": 9.829992104786028e-05} +{"train_loss": 0.015948455780744553, "global_step": 6402, "epoch": 53, "lr": 9.829934818493648e-05} +{"train_loss": 0.012617501430213451, "global_step": 6403, "epoch": 53, "lr": 9.829877522718208e-05} +{"train_loss": 0.01288523618131876, "global_step": 6404, "epoch": 53, "lr": 9.82982021745982e-05} +{"train_loss": 0.014602895826101303, "global_step": 6405, "epoch": 53, "lr": 9.829762902718595e-05} +{"train_loss": 0.014454107731580734, "global_step": 6406, "epoch": 53, "lr": 9.829705578494648e-05} +{"train_loss": 0.015833666548132896, "global_step": 6407, "epoch": 53, "lr": 9.829648244788089e-05} +{"train_loss": 0.008564949035644531, "global_step": 6408, "epoch": 53, "lr": 9.829590901599032e-05} +{"train_loss": 0.017636850476264954, "global_step": 6409, "epoch": 53, "lr": 9.829533548927589e-05} +{"train_loss": 0.010659920983016491, "global_step": 6410, "epoch": 53, "lr": 9.829476186773873e-05} +{"train_loss": 0.01193634606897831, "global_step": 6411, "epoch": 53, "lr": 9.829418815137997e-05} +{"train_loss": 0.01735345460474491, "global_step": 6412, "epoch": 53, "lr": 9.829361434020073e-05} +{"train_loss": 0.0162983275949955, "global_step": 6413, "epoch": 53, "lr": 9.829304043420212e-05} +{"train_loss": 0.008121021091938019, "global_step": 6414, "epoch": 53, "lr": 9.82924664333853e-05} +{"train_loss": 0.01557418517768383, "global_step": 6415, "epoch": 53, "lr": 9.829189233775138e-05} +{"train_loss": 0.013928401283919811, "global_step": 6416, "epoch": 53, "lr": 9.829131814730148e-05} +{"train_loss": 0.010999654419720173, "global_step": 6417, "epoch": 53, "lr": 9.829074386203674e-05} +{"train_loss": 0.012979191727936268, "global_step": 6418, "epoch": 53, "lr": 9.829016948195829e-05} +{"train_loss": 0.018903788179159164, "global_step": 6419, "epoch": 53, "lr": 9.828959500706725e-05} +{"train_loss": 0.019773537293076515, "global_step": 6420, "epoch": 53, "lr": 9.828902043736474e-05} +{"train_loss": 0.015250634402036667, "global_step": 6421, "epoch": 53, "lr": 9.828844577285192e-05} +{"train_loss": 0.019097954034805298, "global_step": 6422, "epoch": 53, "lr": 9.828787101352987e-05} +{"train_loss": 0.014576800167560577, "global_step": 6423, "epoch": 53, "lr": 9.828729615939975e-05} +{"train_loss": 0.012116317637264729, "global_step": 6424, "epoch": 53, "lr": 9.828672121046269e-05} +{"train_loss": 0.014139154652024017, "global_step": 6425, "epoch": 53, "lr": 9.82861461667198e-05, "val_loss": 0.02822892554104328} +{"train_loss": 0.011788611300289631, "global_step": 6426, "epoch": 54, "lr": 9.828557102817224e-05} +{"train_loss": 0.015504222363233566, "global_step": 6427, "epoch": 54, "lr": 9.828499579482111e-05} +{"train_loss": 0.015638820827007294, "global_step": 6428, "epoch": 54, "lr": 9.828442046666754e-05} +{"train_loss": 0.015028250403702259, "global_step": 6429, "epoch": 54, "lr": 9.828384504371268e-05} +{"train_loss": 0.013514296151697636, "global_step": 6430, "epoch": 54, "lr": 9.828326952595766e-05} +{"train_loss": 0.012162487022578716, "global_step": 6431, "epoch": 54, "lr": 9.828269391340356e-05} +{"train_loss": 0.009367445483803749, "global_step": 6432, "epoch": 54, "lr": 9.828211820605157e-05} +{"train_loss": 0.010122793726623058, "global_step": 6433, "epoch": 54, "lr": 9.828154240390281e-05} +{"train_loss": 0.015923775732517242, "global_step": 6434, "epoch": 54, "lr": 9.82809665069584e-05} +{"train_loss": 0.01280560065060854, "global_step": 6435, "epoch": 54, "lr": 9.828039051521947e-05} +{"train_loss": 0.012414638884365559, "global_step": 6436, "epoch": 54, "lr": 9.827981442868713e-05} +{"train_loss": 0.01379269827157259, "global_step": 6437, "epoch": 54, "lr": 9.827923824736255e-05} +{"train_loss": 0.011881453916430473, "global_step": 6438, "epoch": 54, "lr": 9.827866197124684e-05} +{"train_loss": 0.014905255287885666, "global_step": 6439, "epoch": 54, "lr": 9.827808560034113e-05} +{"train_loss": 0.013956415466964245, "global_step": 6440, "epoch": 54, "lr": 9.827750913464656e-05} +{"train_loss": 0.012163977138698101, "global_step": 6441, "epoch": 54, "lr": 9.827693257416426e-05} +{"train_loss": 0.01732044667005539, "global_step": 6442, "epoch": 54, "lr": 9.827635591889537e-05} +{"train_loss": 0.012226301245391369, "global_step": 6443, "epoch": 54, "lr": 9.827577916884098e-05} +{"train_loss": 0.012060893699526787, "global_step": 6444, "epoch": 54, "lr": 9.82752023240023e-05} +{"train_loss": 0.016868464648723602, "global_step": 6445, "epoch": 54, "lr": 9.827462538438039e-05} +{"train_loss": 0.011928514577448368, "global_step": 6446, "epoch": 54, "lr": 9.827404834997641e-05} +{"train_loss": 0.017157312482595444, "global_step": 6447, "epoch": 54, "lr": 9.82734712207915e-05} +{"train_loss": 0.015044436790049076, "global_step": 6448, "epoch": 54, "lr": 9.827289399682679e-05} +{"train_loss": 0.010507187806069851, "global_step": 6449, "epoch": 54, "lr": 9.827231667808341e-05} +{"train_loss": 0.014885252341628075, "global_step": 6450, "epoch": 54, "lr": 9.827173926456248e-05} +{"train_loss": 0.014607817865908146, "global_step": 6451, "epoch": 54, "lr": 9.827116175626516e-05} +{"train_loss": 0.011893156915903091, "global_step": 6452, "epoch": 54, "lr": 9.827058415319257e-05} +{"train_loss": 0.011082079261541367, "global_step": 6453, "epoch": 54, "lr": 9.827000645534583e-05} +{"train_loss": 0.010277310386300087, "global_step": 6454, "epoch": 54, "lr": 9.82694286627261e-05} +{"train_loss": 0.013209016062319279, "global_step": 6455, "epoch": 54, "lr": 9.826885077533452e-05} +{"train_loss": 0.008498527109622955, "global_step": 6456, "epoch": 54, "lr": 9.82682727931722e-05} +{"train_loss": 0.015973782166838646, "global_step": 6457, "epoch": 54, "lr": 9.826769471624026e-05} +{"train_loss": 0.013621550984680653, "global_step": 6458, "epoch": 54, "lr": 9.826711654453987e-05} +{"train_loss": 0.008654569275677204, "global_step": 6459, "epoch": 54, "lr": 9.826653827807215e-05} +{"train_loss": 0.012733272276818752, "global_step": 6460, "epoch": 54, "lr": 9.826595991683826e-05} +{"train_loss": 0.008806753903627396, "global_step": 6461, "epoch": 54, "lr": 9.82653814608393e-05} +{"train_loss": 0.014729577116668224, "global_step": 6462, "epoch": 54, "lr": 9.826480291007642e-05} +{"train_loss": 0.012366119772195816, "global_step": 6463, "epoch": 54, "lr": 9.826422426455076e-05} +{"train_loss": 0.010710131376981735, "global_step": 6464, "epoch": 54, "lr": 9.826364552426344e-05} +{"train_loss": 0.012088689021766186, "global_step": 6465, "epoch": 54, "lr": 9.826306668921561e-05} +{"train_loss": 0.00892466027289629, "global_step": 6466, "epoch": 54, "lr": 9.82624877594084e-05} +{"train_loss": 0.01589873433113098, "global_step": 6467, "epoch": 54, "lr": 9.826190873484298e-05} +{"train_loss": 0.009202693589031696, "global_step": 6468, "epoch": 54, "lr": 9.826132961552044e-05} +{"train_loss": 0.013104435987770557, "global_step": 6469, "epoch": 54, "lr": 9.826075040144194e-05} +{"train_loss": 0.012284344993531704, "global_step": 6470, "epoch": 54, "lr": 9.82601710926086e-05} +{"train_loss": 0.015060923993587494, "global_step": 6471, "epoch": 54, "lr": 9.825959168902159e-05} +{"train_loss": 0.011450291611254215, "global_step": 6472, "epoch": 54, "lr": 9.825901219068201e-05} +{"train_loss": 0.01048152707517147, "global_step": 6473, "epoch": 54, "lr": 9.825843259759102e-05} +{"train_loss": 0.017951050773262978, "global_step": 6474, "epoch": 54, "lr": 9.825785290974975e-05} +{"train_loss": 0.008201183751225471, "global_step": 6475, "epoch": 54, "lr": 9.825727312715935e-05} +{"train_loss": 0.013070996850728989, "global_step": 6476, "epoch": 54, "lr": 9.825669324982094e-05} +{"train_loss": 0.00977643858641386, "global_step": 6477, "epoch": 54, "lr": 9.825611327773568e-05} +{"train_loss": 0.013177512213587761, "global_step": 6478, "epoch": 54, "lr": 9.825553321090468e-05} +{"train_loss": 0.007985102944076061, "global_step": 6479, "epoch": 54, "lr": 9.82549530493291e-05} +{"train_loss": 0.01330468151718378, "global_step": 6480, "epoch": 54, "lr": 9.825437279301008e-05} +{"train_loss": 0.010118282400071621, "global_step": 6481, "epoch": 54, "lr": 9.825379244194877e-05} +{"train_loss": 0.010626604780554771, "global_step": 6482, "epoch": 54, "lr": 9.825321199614627e-05} +{"train_loss": 0.011008201166987419, "global_step": 6483, "epoch": 54, "lr": 9.825263145560376e-05} +{"train_loss": 0.014977659098803997, "global_step": 6484, "epoch": 54, "lr": 9.825205082032235e-05} +{"train_loss": 0.013180381618440151, "global_step": 6485, "epoch": 54, "lr": 9.82514700903032e-05} +{"train_loss": 0.015243550762534142, "global_step": 6486, "epoch": 54, "lr": 9.825088926554745e-05} +{"train_loss": 0.01080994587391615, "global_step": 6487, "epoch": 54, "lr": 9.825030834605622e-05} +{"train_loss": 0.018243832513689995, "global_step": 6488, "epoch": 54, "lr": 9.824972733183067e-05} +{"train_loss": 0.011006332002580166, "global_step": 6489, "epoch": 54, "lr": 9.824914622287193e-05} +{"train_loss": 0.010925067588686943, "global_step": 6490, "epoch": 54, "lr": 9.824856501918117e-05} +{"train_loss": 0.013372218236327171, "global_step": 6491, "epoch": 54, "lr": 9.824798372075947e-05} +{"train_loss": 0.01169641874730587, "global_step": 6492, "epoch": 54, "lr": 9.824740232760803e-05} +{"train_loss": 0.017177103087306023, "global_step": 6493, "epoch": 54, "lr": 9.824682083972796e-05} +{"train_loss": 0.0175042524933815, "global_step": 6494, "epoch": 54, "lr": 9.824623925712042e-05} +{"train_loss": 0.022023353725671768, "global_step": 6495, "epoch": 54, "lr": 9.824565757978654e-05} +{"train_loss": 0.013592950999736786, "global_step": 6496, "epoch": 54, "lr": 9.824507580772746e-05} +{"train_loss": 0.013066453859210014, "global_step": 6497, "epoch": 54, "lr": 9.824449394094434e-05} +{"train_loss": 0.00935408752411604, "global_step": 6498, "epoch": 54, "lr": 9.824391197943833e-05} +{"train_loss": 0.014441220089793205, "global_step": 6499, "epoch": 54, "lr": 9.824332992321051e-05} +{"train_loss": 0.011355746537446976, "global_step": 6500, "epoch": 54, "lr": 9.824274777226209e-05} +{"train_loss": 0.011685646139085293, "global_step": 6501, "epoch": 54, "lr": 9.824216552659418e-05} +{"train_loss": 0.019782787188887596, "global_step": 6502, "epoch": 54, "lr": 9.824158318620793e-05} +{"train_loss": 0.021516527980566025, "global_step": 6503, "epoch": 54, "lr": 9.82410007511045e-05} +{"train_loss": 0.013328904286026955, "global_step": 6504, "epoch": 54, "lr": 9.8240418221285e-05} +{"train_loss": 0.012976175174117088, "global_step": 6505, "epoch": 54, "lr": 9.823983559675061e-05} +{"train_loss": 0.015362019650638103, "global_step": 6506, "epoch": 54, "lr": 9.823925287750245e-05} +{"train_loss": 0.012793160043656826, "global_step": 6507, "epoch": 54, "lr": 9.823867006354167e-05} +{"train_loss": 0.013170621357858181, "global_step": 6508, "epoch": 54, "lr": 9.823808715486941e-05} +{"train_loss": 0.0134065430611372, "global_step": 6509, "epoch": 54, "lr": 9.823750415148682e-05} +{"train_loss": 0.014929890632629395, "global_step": 6510, "epoch": 54, "lr": 9.823692105339507e-05} +{"train_loss": 0.011183549650013447, "global_step": 6511, "epoch": 54, "lr": 9.823633786059524e-05} +{"train_loss": 0.015179228037595749, "global_step": 6512, "epoch": 54, "lr": 9.823575457308854e-05} +{"train_loss": 0.018231084570288658, "global_step": 6513, "epoch": 54, "lr": 9.823517119087606e-05} +{"train_loss": 0.011705887503921986, "global_step": 6514, "epoch": 54, "lr": 9.8234587713959e-05} +{"train_loss": 0.011714731343090534, "global_step": 6515, "epoch": 54, "lr": 9.823400414233847e-05} +{"train_loss": 0.009109186939895153, "global_step": 6516, "epoch": 54, "lr": 9.823342047601564e-05} +{"train_loss": 0.013478507287800312, "global_step": 6517, "epoch": 54, "lr": 9.823283671499162e-05} +{"train_loss": 0.01402854174375534, "global_step": 6518, "epoch": 54, "lr": 9.82322528592676e-05} +{"train_loss": 0.013638094998896122, "global_step": 6519, "epoch": 54, "lr": 9.82316689088447e-05} +{"train_loss": 0.019266827031970024, "global_step": 6520, "epoch": 54, "lr": 9.823108486372406e-05} +{"train_loss": 0.01046826969832182, "global_step": 6521, "epoch": 54, "lr": 9.823050072390684e-05} +{"train_loss": 0.013142170384526253, "global_step": 6522, "epoch": 54, "lr": 9.82299164893942e-05} +{"train_loss": 0.01644134521484375, "global_step": 6523, "epoch": 54, "lr": 9.822933216018724e-05} +{"train_loss": 0.01655798964202404, "global_step": 6524, "epoch": 54, "lr": 9.822874773628716e-05} +{"train_loss": 0.014610321260988712, "global_step": 6525, "epoch": 54, "lr": 9.822816321769508e-05} +{"train_loss": 0.014123710803687572, "global_step": 6526, "epoch": 54, "lr": 9.822757860441216e-05} +{"train_loss": 0.01606687158346176, "global_step": 6527, "epoch": 54, "lr": 9.822699389643955e-05} +{"train_loss": 0.01079864613711834, "global_step": 6528, "epoch": 54, "lr": 9.822640909377838e-05} +{"train_loss": 0.011890733614563942, "global_step": 6529, "epoch": 54, "lr": 9.82258241964298e-05} +{"train_loss": 0.010595128871500492, "global_step": 6530, "epoch": 54, "lr": 9.822523920439497e-05} +{"train_loss": 0.01794835738837719, "global_step": 6531, "epoch": 54, "lr": 9.822465411767504e-05} +{"train_loss": 0.012701413594186306, "global_step": 6532, "epoch": 54, "lr": 9.822406893627116e-05} +{"train_loss": 0.013300728052854538, "global_step": 6533, "epoch": 54, "lr": 9.822348366018445e-05} +{"train_loss": 0.013511279597878456, "global_step": 6534, "epoch": 54, "lr": 9.822289828941611e-05} +{"train_loss": 0.011749530211091042, "global_step": 6535, "epoch": 54, "lr": 9.822231282396725e-05} +{"train_loss": 0.01502622663974762, "global_step": 6536, "epoch": 54, "lr": 9.822172726383903e-05} +{"train_loss": 0.012297001667320728, "global_step": 6537, "epoch": 54, "lr": 9.82211416090326e-05} +{"train_loss": 0.012229238636791706, "global_step": 6538, "epoch": 54, "lr": 9.82205558595491e-05} +{"train_loss": 0.01952303759753704, "global_step": 6539, "epoch": 54, "lr": 9.82199700153897e-05} +{"train_loss": 0.012645943090319633, "global_step": 6540, "epoch": 54, "lr": 9.821938407655553e-05} +{"train_loss": 0.011033926159143448, "global_step": 6541, "epoch": 54, "lr": 9.821879804304777e-05} +{"train_loss": 0.011155194602906704, "global_step": 6542, "epoch": 54, "lr": 9.821821191486754e-05} +{"train_loss": 0.009133318439126015, "global_step": 6543, "epoch": 54, "lr": 9.8217625692016e-05} +{"train_loss": 0.01326217213567315, "global_step": 6544, "epoch": 54, "lr": 9.821703937449432e-05, "val_loss": 0.01839665323495865} +{"train_loss": 0.012691914103925228, "global_step": 6545, "epoch": 55, "lr": 9.821645296230362e-05} +{"train_loss": 0.014718987047672272, "global_step": 6546, "epoch": 55, "lr": 9.821586645544507e-05} +{"train_loss": 0.012525239959359169, "global_step": 6547, "epoch": 55, "lr": 9.82152798539198e-05} +{"train_loss": 0.014398391358554363, "global_step": 6548, "epoch": 55, "lr": 9.8214693157729e-05} +{"train_loss": 0.011371258646249771, "global_step": 6549, "epoch": 55, "lr": 9.82141063668738e-05} +{"train_loss": 0.012944044545292854, "global_step": 6550, "epoch": 55, "lr": 9.821351948135533e-05} +{"train_loss": 0.014845945872366428, "global_step": 6551, "epoch": 55, "lr": 9.821293250117479e-05} +{"train_loss": 0.015568120405077934, "global_step": 6552, "epoch": 55, "lr": 9.82123454263333e-05} +{"train_loss": 0.012162656523287296, "global_step": 6553, "epoch": 55, "lr": 9.821175825683202e-05} +{"train_loss": 0.013260831125080585, "global_step": 6554, "epoch": 55, "lr": 9.821117099267211e-05} +{"train_loss": 0.011982678435742855, "global_step": 6555, "epoch": 55, "lr": 9.821058363385472e-05} +{"train_loss": 0.014119379222393036, "global_step": 6556, "epoch": 55, "lr": 9.820999618038098e-05} +{"train_loss": 0.013020152226090431, "global_step": 6557, "epoch": 55, "lr": 9.820940863225208e-05} +{"train_loss": 0.015089821070432663, "global_step": 6558, "epoch": 55, "lr": 9.820882098946915e-05} +{"train_loss": 0.00848880223929882, "global_step": 6559, "epoch": 55, "lr": 9.820823325203335e-05} +{"train_loss": 0.010770460590720177, "global_step": 6560, "epoch": 55, "lr": 9.820764541994583e-05} +{"train_loss": 0.010970759205520153, "global_step": 6561, "epoch": 55, "lr": 9.820705749320775e-05} +{"train_loss": 0.012000438757240772, "global_step": 6562, "epoch": 55, "lr": 9.820646947182027e-05} +{"train_loss": 0.012923438102006912, "global_step": 6563, "epoch": 55, "lr": 9.820588135578454e-05} +{"train_loss": 0.016368817538022995, "global_step": 6564, "epoch": 55, "lr": 9.82052931451017e-05} +{"train_loss": 0.0126276146620512, "global_step": 6565, "epoch": 55, "lr": 9.820470483977292e-05} +{"train_loss": 0.011604899540543556, "global_step": 6566, "epoch": 55, "lr": 9.820411643979935e-05} +{"train_loss": 0.012963163666427135, "global_step": 6567, "epoch": 55, "lr": 9.820352794518215e-05} +{"train_loss": 0.010995331220328808, "global_step": 6568, "epoch": 55, "lr": 9.820293935592248e-05} +{"train_loss": 0.009812399744987488, "global_step": 6569, "epoch": 55, "lr": 9.820235067202148e-05} +{"train_loss": 0.017627617344260216, "global_step": 6570, "epoch": 55, "lr": 9.820176189348032e-05} +{"train_loss": 0.01033477857708931, "global_step": 6571, "epoch": 55, "lr": 9.820117302030014e-05} +{"train_loss": 0.013145332224667072, "global_step": 6572, "epoch": 55, "lr": 9.820058405248212e-05} +{"train_loss": 0.011822056025266647, "global_step": 6573, "epoch": 55, "lr": 9.81999949900274e-05} +{"train_loss": 0.015933886170387268, "global_step": 6574, "epoch": 55, "lr": 9.819940583293713e-05} +{"train_loss": 0.010325532406568527, "global_step": 6575, "epoch": 55, "lr": 9.819881658121248e-05} +{"train_loss": 0.014202965423464775, "global_step": 6576, "epoch": 55, "lr": 9.81982272348546e-05} +{"train_loss": 0.01198847871273756, "global_step": 6577, "epoch": 55, "lr": 9.819763779386466e-05} +{"train_loss": 0.013523543253540993, "global_step": 6578, "epoch": 55, "lr": 9.819704825824379e-05} +{"train_loss": 0.00824206043034792, "global_step": 6579, "epoch": 55, "lr": 9.819645862799319e-05} +{"train_loss": 0.015483297407627106, "global_step": 6580, "epoch": 55, "lr": 9.819586890311397e-05} +{"train_loss": 0.011890312656760216, "global_step": 6581, "epoch": 55, "lr": 9.819527908360733e-05} +{"train_loss": 0.017181722447276115, "global_step": 6582, "epoch": 55, "lr": 9.819468916947438e-05} +{"train_loss": 0.012533722445368767, "global_step": 6583, "epoch": 55, "lr": 9.819409916071633e-05} +{"train_loss": 0.013032132759690285, "global_step": 6584, "epoch": 55, "lr": 9.81935090573343e-05} +{"train_loss": 0.009733621962368488, "global_step": 6585, "epoch": 55, "lr": 9.819291885932948e-05} +{"train_loss": 0.009139453060925007, "global_step": 6586, "epoch": 55, "lr": 9.8192328566703e-05} +{"train_loss": 0.014721211045980453, "global_step": 6587, "epoch": 55, "lr": 9.819173817945603e-05} +{"train_loss": 0.012739310972392559, "global_step": 6588, "epoch": 55, "lr": 9.819114769758975e-05} +{"train_loss": 0.010108250193297863, "global_step": 6589, "epoch": 55, "lr": 9.819055712110529e-05} +{"train_loss": 0.018601614981889725, "global_step": 6590, "epoch": 55, "lr": 9.818996645000382e-05} +{"train_loss": 0.011985892429947853, "global_step": 6591, "epoch": 55, "lr": 9.81893756842865e-05} +{"train_loss": 0.014312568120658398, "global_step": 6592, "epoch": 55, "lr": 9.818878482395448e-05} +{"train_loss": 0.008844634518027306, "global_step": 6593, "epoch": 55, "lr": 9.818819386900893e-05} +{"train_loss": 0.009662500582635403, "global_step": 6594, "epoch": 55, "lr": 9.818760281945101e-05} +{"train_loss": 0.016165388748049736, "global_step": 6595, "epoch": 55, "lr": 9.818701167528189e-05} +{"train_loss": 0.01549249142408371, "global_step": 6596, "epoch": 55, "lr": 9.818642043650271e-05} +{"train_loss": 0.01331652794033289, "global_step": 6597, "epoch": 55, "lr": 9.818582910311465e-05} +{"train_loss": 0.014109781011939049, "global_step": 6598, "epoch": 55, "lr": 9.818523767511885e-05} +{"train_loss": 0.0082694748416543, "global_step": 6599, "epoch": 55, "lr": 9.81846461525165e-05} +{"train_loss": 0.01257871650159359, "global_step": 6600, "epoch": 55, "lr": 9.818405453530874e-05} +{"train_loss": 0.013054026290774345, "global_step": 6601, "epoch": 55, "lr": 9.818346282349674e-05} +{"train_loss": 0.014952433295547962, "global_step": 6602, "epoch": 55, "lr": 9.818287101708164e-05} +{"train_loss": 0.012287753634154797, "global_step": 6603, "epoch": 55, "lr": 9.818227911606464e-05} +{"train_loss": 0.012982611544430256, "global_step": 6604, "epoch": 55, "lr": 9.818168712044686e-05} +{"train_loss": 0.011499011889100075, "global_step": 6605, "epoch": 55, "lr": 9.818109503022951e-05} +{"train_loss": 0.016645535826683044, "global_step": 6606, "epoch": 55, "lr": 9.818050284541372e-05} +{"train_loss": 0.011512938886880875, "global_step": 6607, "epoch": 55, "lr": 9.817991056600065e-05} +{"train_loss": 0.015568929724395275, "global_step": 6608, "epoch": 55, "lr": 9.817931819199148e-05} +{"train_loss": 0.011308164335787296, "global_step": 6609, "epoch": 55, "lr": 9.817872572338737e-05} +{"train_loss": 0.009798738174140453, "global_step": 6610, "epoch": 55, "lr": 9.817813316018947e-05} +{"train_loss": 0.010247217491269112, "global_step": 6611, "epoch": 55, "lr": 9.817754050239896e-05} +{"train_loss": 0.011672714725136757, "global_step": 6612, "epoch": 55, "lr": 9.8176947750017e-05} +{"train_loss": 0.008426844142377377, "global_step": 6613, "epoch": 55, "lr": 9.817635490304473e-05} +{"train_loss": 0.02064594067633152, "global_step": 6614, "epoch": 55, "lr": 9.817576196148334e-05} +{"train_loss": 0.016155855730175972, "global_step": 6615, "epoch": 55, "lr": 9.817516892533401e-05} +{"train_loss": 0.014490117318928242, "global_step": 6616, "epoch": 55, "lr": 9.817457579459787e-05} +{"train_loss": 0.01671874150633812, "global_step": 6617, "epoch": 55, "lr": 9.81739825692761e-05} +{"train_loss": 0.01247699186205864, "global_step": 6618, "epoch": 55, "lr": 9.817338924936985e-05} +{"train_loss": 0.014460891485214233, "global_step": 6619, "epoch": 55, "lr": 9.81727958348803e-05} +{"train_loss": 0.01478362362831831, "global_step": 6620, "epoch": 55, "lr": 9.817220232580862e-05} +{"train_loss": 0.014732692390680313, "global_step": 6621, "epoch": 55, "lr": 9.817160872215597e-05} +{"train_loss": 0.013579728081822395, "global_step": 6622, "epoch": 55, "lr": 9.817101502392349e-05} +{"train_loss": 0.013697237707674503, "global_step": 6623, "epoch": 55, "lr": 9.81704212311124e-05} +{"train_loss": 0.012283789925277233, "global_step": 6624, "epoch": 55, "lr": 9.816982734372382e-05} +{"train_loss": 0.016395866870880127, "global_step": 6625, "epoch": 55, "lr": 9.816923336175891e-05} +{"train_loss": 0.012231514789164066, "global_step": 6626, "epoch": 55, "lr": 9.816863928521889e-05} +{"train_loss": 0.012620832771062851, "global_step": 6627, "epoch": 55, "lr": 9.816804511410487e-05} +{"train_loss": 0.016094369813799858, "global_step": 6628, "epoch": 55, "lr": 9.816745084841806e-05} +{"train_loss": 0.014439341612160206, "global_step": 6629, "epoch": 55, "lr": 9.816685648815959e-05} +{"train_loss": 0.011943492107093334, "global_step": 6630, "epoch": 55, "lr": 9.816626203333064e-05} +{"train_loss": 0.011990946717560291, "global_step": 6631, "epoch": 55, "lr": 9.816566748393239e-05} +{"train_loss": 0.011119889095425606, "global_step": 6632, "epoch": 55, "lr": 9.816507283996599e-05} +{"train_loss": 0.010058542713522911, "global_step": 6633, "epoch": 55, "lr": 9.816447810143263e-05} +{"train_loss": 0.010830993764102459, "global_step": 6634, "epoch": 55, "lr": 9.816388326833346e-05} +{"train_loss": 0.015206397511065006, "global_step": 6635, "epoch": 55, "lr": 9.816328834066963e-05} +{"train_loss": 0.008755920454859734, "global_step": 6636, "epoch": 55, "lr": 9.816269331844234e-05} +{"train_loss": 0.011121897026896477, "global_step": 6637, "epoch": 55, "lr": 9.816209820165276e-05} +{"train_loss": 0.01629999466240406, "global_step": 6638, "epoch": 55, "lr": 9.816150299030202e-05} +{"train_loss": 0.012271125800907612, "global_step": 6639, "epoch": 55, "lr": 9.816090768439135e-05} +{"train_loss": 0.012183834798634052, "global_step": 6640, "epoch": 55, "lr": 9.816031228392185e-05} +{"train_loss": 0.012204545550048351, "global_step": 6641, "epoch": 55, "lr": 9.815971678889473e-05} +{"train_loss": 0.010971653275191784, "global_step": 6642, "epoch": 55, "lr": 9.815912119931116e-05} +{"train_loss": 0.012393238954246044, "global_step": 6643, "epoch": 55, "lr": 9.815852551517229e-05} +{"train_loss": 0.009294267743825912, "global_step": 6644, "epoch": 55, "lr": 9.815792973647931e-05} +{"train_loss": 0.013442489318549633, "global_step": 6645, "epoch": 55, "lr": 9.815733386323338e-05} +{"train_loss": 0.012222763150930405, "global_step": 6646, "epoch": 55, "lr": 9.815673789543567e-05} +{"train_loss": 0.00939017254859209, "global_step": 6647, "epoch": 55, "lr": 9.815614183308735e-05} +{"train_loss": 0.0179127287119627, "global_step": 6648, "epoch": 55, "lr": 9.815554567618958e-05} +{"train_loss": 0.011181284673511982, "global_step": 6649, "epoch": 55, "lr": 9.815494942474353e-05} +{"train_loss": 0.011437821201980114, "global_step": 6650, "epoch": 55, "lr": 9.815435307875041e-05} +{"train_loss": 0.013515855185687542, "global_step": 6651, "epoch": 55, "lr": 9.815375663821135e-05} +{"train_loss": 0.012019401416182518, "global_step": 6652, "epoch": 55, "lr": 9.815316010312754e-05} +{"train_loss": 0.011927461251616478, "global_step": 6653, "epoch": 55, "lr": 9.815256347350012e-05} +{"train_loss": 0.010300293564796448, "global_step": 6654, "epoch": 55, "lr": 9.815196674933032e-05} +{"train_loss": 0.01616602949798107, "global_step": 6655, "epoch": 55, "lr": 9.815136993061925e-05} +{"train_loss": 0.015176968649029732, "global_step": 6656, "epoch": 55, "lr": 9.815077301736812e-05} +{"train_loss": 0.011671869084239006, "global_step": 6657, "epoch": 55, "lr": 9.81501760095781e-05} +{"train_loss": 0.008001787588000298, "global_step": 6658, "epoch": 55, "lr": 9.814957890725034e-05} +{"train_loss": 0.008625649847090244, "global_step": 6659, "epoch": 55, "lr": 9.814898171038603e-05} +{"train_loss": 0.006671061739325523, "global_step": 6660, "epoch": 55, "lr": 9.814838441898634e-05} +{"train_loss": 0.017282657325267792, "global_step": 6661, "epoch": 55, "lr": 9.814778703305245e-05} +{"train_loss": 0.011648348532617092, "global_step": 6662, "epoch": 55, "lr": 9.814718955258551e-05} +{"train_loss": 0.01273008029000098, "global_step": 6663, "epoch": 55, "lr": 9.81465919775867e-05, "val_loss": 0.0152872484177351, "train_action_mse_error": 0.0006704121478833258} +{"train_loss": 0.011128056794404984, "global_step": 6664, "epoch": 56, "lr": 9.814599430805722e-05} +{"train_loss": 0.010726121254265308, "global_step": 6665, "epoch": 56, "lr": 9.814539654399823e-05} +{"train_loss": 0.010340292938053608, "global_step": 6666, "epoch": 56, "lr": 9.814479868541087e-05} +{"train_loss": 0.006614792160689831, "global_step": 6667, "epoch": 56, "lr": 9.814420073229636e-05} +{"train_loss": 0.011068877764046192, "global_step": 6668, "epoch": 56, "lr": 9.814360268465586e-05} +{"train_loss": 0.017559383064508438, "global_step": 6669, "epoch": 56, "lr": 9.814300454249053e-05} +{"train_loss": 0.013323674909770489, "global_step": 6670, "epoch": 56, "lr": 9.814240630580154e-05} +{"train_loss": 0.011243891902267933, "global_step": 6671, "epoch": 56, "lr": 9.81418079745901e-05} +{"train_loss": 0.01275165006518364, "global_step": 6672, "epoch": 56, "lr": 9.814120954885735e-05} +{"train_loss": 0.011133930645883083, "global_step": 6673, "epoch": 56, "lr": 9.81406110286045e-05} +{"train_loss": 0.018035901710391045, "global_step": 6674, "epoch": 56, "lr": 9.814001241383268e-05} +{"train_loss": 0.01173342578113079, "global_step": 6675, "epoch": 56, "lr": 9.813941370454309e-05} +{"train_loss": 0.012689882889389992, "global_step": 6676, "epoch": 56, "lr": 9.813881490073691e-05} +{"train_loss": 0.015112762339413166, "global_step": 6677, "epoch": 56, "lr": 9.813821600241531e-05} +{"train_loss": 0.01387719251215458, "global_step": 6678, "epoch": 56, "lr": 9.813761700957947e-05} +{"train_loss": 0.016043582931160927, "global_step": 6679, "epoch": 56, "lr": 9.813701792223055e-05} +{"train_loss": 0.009968693368136883, "global_step": 6680, "epoch": 56, "lr": 9.813641874036974e-05} +{"train_loss": 0.014582376927137375, "global_step": 6681, "epoch": 56, "lr": 9.813581946399823e-05} +{"train_loss": 0.012293754145503044, "global_step": 6682, "epoch": 56, "lr": 9.813522009311716e-05} +{"train_loss": 0.016143295913934708, "global_step": 6683, "epoch": 56, "lr": 9.813462062772774e-05} +{"train_loss": 0.011632190085947514, "global_step": 6684, "epoch": 56, "lr": 9.813402106783113e-05} +{"train_loss": 0.01077684573829174, "global_step": 6685, "epoch": 56, "lr": 9.813342141342852e-05} +{"train_loss": 0.015717148780822754, "global_step": 6686, "epoch": 56, "lr": 9.813282166452106e-05} +{"train_loss": 0.012462244369089603, "global_step": 6687, "epoch": 56, "lr": 9.813222182110997e-05} +{"train_loss": 0.012001359835267067, "global_step": 6688, "epoch": 56, "lr": 9.81316218831964e-05} +{"train_loss": 0.0121553223580122, "global_step": 6689, "epoch": 56, "lr": 9.813102185078153e-05} +{"train_loss": 0.014818285591900349, "global_step": 6690, "epoch": 56, "lr": 9.813042172386655e-05} +{"train_loss": 0.015893738716840744, "global_step": 6691, "epoch": 56, "lr": 9.81298215024526e-05} +{"train_loss": 0.013895322568714619, "global_step": 6692, "epoch": 56, "lr": 9.812922118654091e-05} +{"train_loss": 0.014247611165046692, "global_step": 6693, "epoch": 56, "lr": 9.812862077613263e-05} +{"train_loss": 0.009939362294971943, "global_step": 6694, "epoch": 56, "lr": 9.812802027122896e-05} +{"train_loss": 0.017470549792051315, "global_step": 6695, "epoch": 56, "lr": 9.812741967183105e-05} +{"train_loss": 0.015007326379418373, "global_step": 6696, "epoch": 56, "lr": 9.81268189779401e-05} +{"train_loss": 0.015840748324990273, "global_step": 6697, "epoch": 56, "lr": 9.812621818955726e-05} +{"train_loss": 0.008913561701774597, "global_step": 6698, "epoch": 56, "lr": 9.812561730668374e-05} +{"train_loss": 0.0196898952126503, "global_step": 6699, "epoch": 56, "lr": 9.812501632932074e-05} +{"train_loss": 0.015154828317463398, "global_step": 6700, "epoch": 56, "lr": 9.812441525746939e-05} +{"train_loss": 0.01242691557854414, "global_step": 6701, "epoch": 56, "lr": 9.812381409113089e-05} +{"train_loss": 0.00909940805286169, "global_step": 6702, "epoch": 56, "lr": 9.812321283030642e-05} +{"train_loss": 0.017496559768915176, "global_step": 6703, "epoch": 56, "lr": 9.812261147499718e-05} +{"train_loss": 0.009046284481883049, "global_step": 6704, "epoch": 56, "lr": 9.812201002520432e-05} +{"train_loss": 0.010683218948543072, "global_step": 6705, "epoch": 56, "lr": 9.812140848092903e-05} +{"train_loss": 0.008477476425468922, "global_step": 6706, "epoch": 56, "lr": 9.81208068421725e-05} +{"train_loss": 0.014699108898639679, "global_step": 6707, "epoch": 56, "lr": 9.812020510893591e-05} +{"train_loss": 0.015647228807210922, "global_step": 6708, "epoch": 56, "lr": 9.811960328122044e-05} +{"train_loss": 0.015691135078668594, "global_step": 6709, "epoch": 56, "lr": 9.811900135902727e-05} +{"train_loss": 0.0149312112480402, "global_step": 6710, "epoch": 56, "lr": 9.811839934235757e-05} +{"train_loss": 0.012698721140623093, "global_step": 6711, "epoch": 56, "lr": 9.811779723121255e-05} +{"train_loss": 0.011346598155796528, "global_step": 6712, "epoch": 56, "lr": 9.811719502559337e-05} +{"train_loss": 0.011019261553883553, "global_step": 6713, "epoch": 56, "lr": 9.811659272550122e-05} +{"train_loss": 0.011751918122172356, "global_step": 6714, "epoch": 56, "lr": 9.811599033093727e-05} +{"train_loss": 0.0081411711871624, "global_step": 6715, "epoch": 56, "lr": 9.811538784190272e-05} +{"train_loss": 0.012153676711022854, "global_step": 6716, "epoch": 56, "lr": 9.811478525839874e-05} +{"train_loss": 0.009743506088852882, "global_step": 6717, "epoch": 56, "lr": 9.811418258042653e-05} +{"train_loss": 0.011641579680144787, "global_step": 6718, "epoch": 56, "lr": 9.811357980798725e-05} +{"train_loss": 0.011886129155755043, "global_step": 6719, "epoch": 56, "lr": 9.811297694108211e-05} +{"train_loss": 0.016303233802318573, "global_step": 6720, "epoch": 56, "lr": 9.811237397971228e-05} +{"train_loss": 0.017340034246444702, "global_step": 6721, "epoch": 56, "lr": 9.811177092387893e-05} +{"train_loss": 0.01005448866635561, "global_step": 6722, "epoch": 56, "lr": 9.811116777358327e-05} +{"train_loss": 0.010872459970414639, "global_step": 6723, "epoch": 56, "lr": 9.811056452882647e-05} +{"train_loss": 0.013726051896810532, "global_step": 6724, "epoch": 56, "lr": 9.810996118960971e-05} +{"train_loss": 0.01100856438279152, "global_step": 6725, "epoch": 56, "lr": 9.810935775593419e-05} +{"train_loss": 0.009562007151544094, "global_step": 6726, "epoch": 56, "lr": 9.810875422780108e-05} +{"train_loss": 0.011546548455953598, "global_step": 6727, "epoch": 56, "lr": 9.810815060521157e-05} +{"train_loss": 0.012580109760165215, "global_step": 6728, "epoch": 56, "lr": 9.810754688816686e-05} +{"train_loss": 0.015363055281341076, "global_step": 6729, "epoch": 56, "lr": 9.81069430766681e-05} +{"train_loss": 0.011076304130256176, "global_step": 6730, "epoch": 56, "lr": 9.810633917071651e-05} +{"train_loss": 0.012418398633599281, "global_step": 6731, "epoch": 56, "lr": 9.810573517031325e-05} +{"train_loss": 0.007210367824882269, "global_step": 6732, "epoch": 56, "lr": 9.810513107545954e-05} +{"train_loss": 0.015697767958045006, "global_step": 6733, "epoch": 56, "lr": 9.810452688615653e-05} +{"train_loss": 0.00962144136428833, "global_step": 6734, "epoch": 56, "lr": 9.810392260240542e-05} +{"train_loss": 0.009762655012309551, "global_step": 6735, "epoch": 56, "lr": 9.81033182242074e-05} +{"train_loss": 0.011599472723901272, "global_step": 6736, "epoch": 56, "lr": 9.810271375156366e-05} +{"train_loss": 0.008854730986058712, "global_step": 6737, "epoch": 56, "lr": 9.810210918447536e-05} +{"train_loss": 0.00949450396001339, "global_step": 6738, "epoch": 56, "lr": 9.810150452294373e-05} +{"train_loss": 0.016432618722319603, "global_step": 6739, "epoch": 56, "lr": 9.810089976696993e-05} +{"train_loss": 0.01005010586231947, "global_step": 6740, "epoch": 56, "lr": 9.810029491655514e-05} +{"train_loss": 0.012509067542850971, "global_step": 6741, "epoch": 56, "lr": 9.809968997170055e-05} +{"train_loss": 0.01158602349460125, "global_step": 6742, "epoch": 56, "lr": 9.809908493240739e-05} +{"train_loss": 0.013953378424048424, "global_step": 6743, "epoch": 56, "lr": 9.80984797986768e-05} +{"train_loss": 0.016926176846027374, "global_step": 6744, "epoch": 56, "lr": 9.809787457050999e-05} +{"train_loss": 0.009566682390868664, "global_step": 6745, "epoch": 56, "lr": 9.809726924790813e-05} +{"train_loss": 0.011287678964436054, "global_step": 6746, "epoch": 56, "lr": 9.809666383087242e-05} +{"train_loss": 0.010871254839003086, "global_step": 6747, "epoch": 56, "lr": 9.809605831940407e-05} +{"train_loss": 0.006705013103783131, "global_step": 6748, "epoch": 56, "lr": 9.809545271350422e-05} +{"train_loss": 0.010806184262037277, "global_step": 6749, "epoch": 56, "lr": 9.80948470131741e-05} +{"train_loss": 0.01022314466536045, "global_step": 6750, "epoch": 56, "lr": 9.809424121841488e-05} +{"train_loss": 0.01368520874530077, "global_step": 6751, "epoch": 56, "lr": 9.809363532922777e-05} +{"train_loss": 0.015039720572531223, "global_step": 6752, "epoch": 56, "lr": 9.809302934561394e-05} +{"train_loss": 0.017218763008713722, "global_step": 6753, "epoch": 56, "lr": 9.809242326757458e-05} +{"train_loss": 0.012435929849743843, "global_step": 6754, "epoch": 56, "lr": 9.809181709511088e-05} +{"train_loss": 0.013763291761279106, "global_step": 6755, "epoch": 56, "lr": 9.809121082822404e-05} +{"train_loss": 0.013123269192874432, "global_step": 6756, "epoch": 56, "lr": 9.809060446691525e-05} +{"train_loss": 0.011402545496821404, "global_step": 6757, "epoch": 56, "lr": 9.808999801118569e-05} +{"train_loss": 0.012564334087073803, "global_step": 6758, "epoch": 56, "lr": 9.808939146103656e-05} +{"train_loss": 0.009789292700588703, "global_step": 6759, "epoch": 56, "lr": 9.808878481646904e-05} +{"train_loss": 0.010075685568153858, "global_step": 6760, "epoch": 56, "lr": 9.808817807748434e-05} +{"train_loss": 0.015247237868607044, "global_step": 6761, "epoch": 56, "lr": 9.808757124408364e-05} +{"train_loss": 0.014641673304140568, "global_step": 6762, "epoch": 56, "lr": 9.808696431626811e-05} +{"train_loss": 0.01488103810697794, "global_step": 6763, "epoch": 56, "lr": 9.808635729403898e-05} +{"train_loss": 0.019151607528328896, "global_step": 6764, "epoch": 56, "lr": 9.808575017739742e-05} +{"train_loss": 0.01330834161490202, "global_step": 6765, "epoch": 56, "lr": 9.808514296634463e-05} +{"train_loss": 0.01608792506158352, "global_step": 6766, "epoch": 56, "lr": 9.80845356608818e-05} +{"train_loss": 0.006539320107549429, "global_step": 6767, "epoch": 56, "lr": 9.808392826101013e-05} +{"train_loss": 0.01758708991110325, "global_step": 6768, "epoch": 56, "lr": 9.808332076673079e-05} +{"train_loss": 0.01599520444869995, "global_step": 6769, "epoch": 56, "lr": 9.8082713178045e-05} +{"train_loss": 0.014470131136476994, "global_step": 6770, "epoch": 56, "lr": 9.808210549495392e-05} +{"train_loss": 0.01033661887049675, "global_step": 6771, "epoch": 56, "lr": 9.808149771745878e-05} +{"train_loss": 0.01199333742260933, "global_step": 6772, "epoch": 56, "lr": 9.808088984556074e-05} +{"train_loss": 0.01710762269794941, "global_step": 6773, "epoch": 56, "lr": 9.808028187926103e-05} +{"train_loss": 0.013697986491024494, "global_step": 6774, "epoch": 56, "lr": 9.80796738185608e-05} +{"train_loss": 0.014319140464067459, "global_step": 6775, "epoch": 56, "lr": 9.807906566346128e-05} +{"train_loss": 0.013185584917664528, "global_step": 6776, "epoch": 56, "lr": 9.807845741396366e-05} +{"train_loss": 0.010042769834399223, "global_step": 6777, "epoch": 56, "lr": 9.807784907006911e-05} +{"train_loss": 0.01347365789115429, "global_step": 6778, "epoch": 56, "lr": 9.807724063177884e-05} +{"train_loss": 0.015835564583539963, "global_step": 6779, "epoch": 56, "lr": 9.807663209909406e-05} +{"train_loss": 0.015503671020269394, "global_step": 6780, "epoch": 56, "lr": 9.807602347201593e-05} +{"train_loss": 0.010240674018859863, "global_step": 6781, "epoch": 56, "lr": 9.807541475054567e-05} +{"train_loss": 0.01278404043126507, "global_step": 6782, "epoch": 56, "lr": 9.807480593468448e-05, "val_loss": 0.018235497176647186} +{"train_loss": 0.01110196765512228, "global_step": 6783, "epoch": 57, "lr": 9.807419702443352e-05} +{"train_loss": 0.013749186880886555, "global_step": 6784, "epoch": 57, "lr": 9.807358801979404e-05} +{"train_loss": 0.02082013711333275, "global_step": 6785, "epoch": 57, "lr": 9.80729789207672e-05} +{"train_loss": 0.017860230058431625, "global_step": 6786, "epoch": 57, "lr": 9.807236972735418e-05} +{"train_loss": 0.009646128863096237, "global_step": 6787, "epoch": 57, "lr": 9.807176043955622e-05} +{"train_loss": 0.01569492369890213, "global_step": 6788, "epoch": 57, "lr": 9.807115105737447e-05} +{"train_loss": 0.011882723309099674, "global_step": 6789, "epoch": 57, "lr": 9.807054158081017e-05} +{"train_loss": 0.016549566760659218, "global_step": 6790, "epoch": 57, "lr": 9.80699320098645e-05} +{"train_loss": 0.008963379077613354, "global_step": 6791, "epoch": 57, "lr": 9.806932234453865e-05} +{"train_loss": 0.012292636558413506, "global_step": 6792, "epoch": 57, "lr": 9.806871258483381e-05} +{"train_loss": 0.009428825229406357, "global_step": 6793, "epoch": 57, "lr": 9.80681027307512e-05} +{"train_loss": 0.011962893418967724, "global_step": 6794, "epoch": 57, "lr": 9.8067492782292e-05} +{"train_loss": 0.011386648751795292, "global_step": 6795, "epoch": 57, "lr": 9.806688273945741e-05} +{"train_loss": 0.01656274124979973, "global_step": 6796, "epoch": 57, "lr": 9.806627260224864e-05} +{"train_loss": 0.013553964905440807, "global_step": 6797, "epoch": 57, "lr": 9.806566237066688e-05} +{"train_loss": 0.013515634462237358, "global_step": 6798, "epoch": 57, "lr": 9.806505204471332e-05} +{"train_loss": 0.011175188235938549, "global_step": 6799, "epoch": 57, "lr": 9.806444162438917e-05} +{"train_loss": 0.015444175340235233, "global_step": 6800, "epoch": 57, "lr": 9.806383110969562e-05} +{"train_loss": 0.021917123347520828, "global_step": 6801, "epoch": 57, "lr": 9.806322050063388e-05} +{"train_loss": 0.013640683144330978, "global_step": 6802, "epoch": 57, "lr": 9.806260979720512e-05} +{"train_loss": 0.008805557154119015, "global_step": 6803, "epoch": 57, "lr": 9.806199899941057e-05} +{"train_loss": 0.019064126536250114, "global_step": 6804, "epoch": 57, "lr": 9.806138810725144e-05} +{"train_loss": 0.01059730164706707, "global_step": 6805, "epoch": 57, "lr": 9.80607771207289e-05} +{"train_loss": 0.00960435252636671, "global_step": 6806, "epoch": 57, "lr": 9.806016603984414e-05} +{"train_loss": 0.017196981236338615, "global_step": 6807, "epoch": 57, "lr": 9.805955486459839e-05} +{"train_loss": 0.017676331102848053, "global_step": 6808, "epoch": 57, "lr": 9.805894359499285e-05} +{"train_loss": 0.011346451006829739, "global_step": 6809, "epoch": 57, "lr": 9.805833223102869e-05} +{"train_loss": 0.021069880574941635, "global_step": 6810, "epoch": 57, "lr": 9.805772077270714e-05} +{"train_loss": 0.013492199592292309, "global_step": 6811, "epoch": 57, "lr": 9.805710922002938e-05} +{"train_loss": 0.013903261162340641, "global_step": 6812, "epoch": 57, "lr": 9.805649757299664e-05} +{"train_loss": 0.014311492443084717, "global_step": 6813, "epoch": 57, "lr": 9.805588583161009e-05} +{"train_loss": 0.010672582313418388, "global_step": 6814, "epoch": 57, "lr": 9.805527399587094e-05} +{"train_loss": 0.012999435886740685, "global_step": 6815, "epoch": 57, "lr": 9.805466206578038e-05} +{"train_loss": 0.013594144955277443, "global_step": 6816, "epoch": 57, "lr": 9.805405004133965e-05} +{"train_loss": 0.013421342708170414, "global_step": 6817, "epoch": 57, "lr": 9.805343792254991e-05} +{"train_loss": 0.006495146080851555, "global_step": 6818, "epoch": 57, "lr": 9.805282570941239e-05} +{"train_loss": 0.022712649777531624, "global_step": 6819, "epoch": 57, "lr": 9.805221340192828e-05} +{"train_loss": 0.012322413735091686, "global_step": 6820, "epoch": 57, "lr": 9.805160100009875e-05} +{"train_loss": 0.010092562064528465, "global_step": 6821, "epoch": 57, "lr": 9.805098850392506e-05} +{"train_loss": 0.014818300493061543, "global_step": 6822, "epoch": 57, "lr": 9.80503759134084e-05} +{"train_loss": 0.010880068875849247, "global_step": 6823, "epoch": 57, "lr": 9.804976322854995e-05} +{"train_loss": 0.011735426262021065, "global_step": 6824, "epoch": 57, "lr": 9.804915044935092e-05} +{"train_loss": 0.008319936692714691, "global_step": 6825, "epoch": 57, "lr": 9.804853757581251e-05} +{"train_loss": 0.012177829630672932, "global_step": 6826, "epoch": 57, "lr": 9.804792460793594e-05} +{"train_loss": 0.01531457994133234, "global_step": 6827, "epoch": 57, "lr": 9.804731154572243e-05} +{"train_loss": 0.013211819343268871, "global_step": 6828, "epoch": 57, "lr": 9.804669838917312e-05} +{"train_loss": 0.009646226651966572, "global_step": 6829, "epoch": 57, "lr": 9.804608513828926e-05} +{"train_loss": 0.012753326445817947, "global_step": 6830, "epoch": 57, "lr": 9.804547179307204e-05} +{"train_loss": 0.011795679107308388, "global_step": 6831, "epoch": 57, "lr": 9.804485835352266e-05} +{"train_loss": 0.011583218351006508, "global_step": 6832, "epoch": 57, "lr": 9.804424481964237e-05} +{"train_loss": 0.010204005055129528, "global_step": 6833, "epoch": 57, "lr": 9.80436311914323e-05} +{"train_loss": 0.01195948850363493, "global_step": 6834, "epoch": 57, "lr": 9.80430174688937e-05} +{"train_loss": 0.012438316829502583, "global_step": 6835, "epoch": 57, "lr": 9.804240365202779e-05} +{"train_loss": 0.011282808147370815, "global_step": 6836, "epoch": 57, "lr": 9.804178974083573e-05} +{"train_loss": 0.013798050582408905, "global_step": 6837, "epoch": 57, "lr": 9.804117573531876e-05} +{"train_loss": 0.011687234975397587, "global_step": 6838, "epoch": 57, "lr": 9.804056163547808e-05} +{"train_loss": 0.015524214133620262, "global_step": 6839, "epoch": 57, "lr": 9.803994744131487e-05} +{"train_loss": 0.01622009463608265, "global_step": 6840, "epoch": 57, "lr": 9.803933315283036e-05} +{"train_loss": 0.013001972809433937, "global_step": 6841, "epoch": 57, "lr": 9.803871877002577e-05} +{"train_loss": 0.013191093690693378, "global_step": 6842, "epoch": 57, "lr": 9.803810429290228e-05} +{"train_loss": 0.010901867412030697, "global_step": 6843, "epoch": 57, "lr": 9.803748972146109e-05} +{"train_loss": 0.012217001058161259, "global_step": 6844, "epoch": 57, "lr": 9.803687505570343e-05} +{"train_loss": 0.016557415947318077, "global_step": 6845, "epoch": 57, "lr": 9.80362602956305e-05} +{"train_loss": 0.008904742076992989, "global_step": 6846, "epoch": 57, "lr": 9.803564544124351e-05} +{"train_loss": 0.010573428124189377, "global_step": 6847, "epoch": 57, "lr": 9.803503049254365e-05} +{"train_loss": 0.013349618762731552, "global_step": 6848, "epoch": 57, "lr": 9.803441544953213e-05} +{"train_loss": 0.0119051244109869, "global_step": 6849, "epoch": 57, "lr": 9.80338003122102e-05} +{"train_loss": 0.008964238688349724, "global_step": 6850, "epoch": 57, "lr": 9.803318508057901e-05} +{"train_loss": 0.014757656492292881, "global_step": 6851, "epoch": 57, "lr": 9.803256975463979e-05} +{"train_loss": 0.010078049264848232, "global_step": 6852, "epoch": 57, "lr": 9.803195433439377e-05} +{"train_loss": 0.013528907671570778, "global_step": 6853, "epoch": 57, "lr": 9.803133881984212e-05} +{"train_loss": 0.010372662916779518, "global_step": 6854, "epoch": 57, "lr": 9.803072321098609e-05} +{"train_loss": 0.013045324012637138, "global_step": 6855, "epoch": 57, "lr": 9.803010750782684e-05} +{"train_loss": 0.016874652355909348, "global_step": 6856, "epoch": 57, "lr": 9.802949171036563e-05} +{"train_loss": 0.012184442020952702, "global_step": 6857, "epoch": 57, "lr": 9.802887581860363e-05} +{"train_loss": 0.011350493878126144, "global_step": 6858, "epoch": 57, "lr": 9.802825983254207e-05} +{"train_loss": 0.00860568042844534, "global_step": 6859, "epoch": 57, "lr": 9.802764375218214e-05} +{"train_loss": 0.011897524818778038, "global_step": 6860, "epoch": 57, "lr": 9.802702757752508e-05} +{"train_loss": 0.011412350460886955, "global_step": 6861, "epoch": 57, "lr": 9.802641130857207e-05} +{"train_loss": 0.010840837843716145, "global_step": 6862, "epoch": 57, "lr": 9.802579494532434e-05} +{"train_loss": 0.009918699972331524, "global_step": 6863, "epoch": 57, "lr": 9.802517848778308e-05} +{"train_loss": 0.008555756881833076, "global_step": 6864, "epoch": 57, "lr": 9.802456193594952e-05} +{"train_loss": 0.017958741635084152, "global_step": 6865, "epoch": 57, "lr": 9.802394528982487e-05} +{"train_loss": 0.016826579347252846, "global_step": 6866, "epoch": 57, "lr": 9.802332854941033e-05} +{"train_loss": 0.015508088283240795, "global_step": 6867, "epoch": 57, "lr": 9.802271171470711e-05} +{"train_loss": 0.012457403354346752, "global_step": 6868, "epoch": 57, "lr": 9.802209478571642e-05} +{"train_loss": 0.009780592285096645, "global_step": 6869, "epoch": 57, "lr": 9.802147776243949e-05} +{"train_loss": 0.012794550508260727, "global_step": 6870, "epoch": 57, "lr": 9.802086064487752e-05} +{"train_loss": 0.011472934857010841, "global_step": 6871, "epoch": 57, "lr": 9.802024343303171e-05} +{"train_loss": 0.016410205513238907, "global_step": 6872, "epoch": 57, "lr": 9.801962612690329e-05} +{"train_loss": 0.014532728120684624, "global_step": 6873, "epoch": 57, "lr": 9.801900872649347e-05} +{"train_loss": 0.01093616895377636, "global_step": 6874, "epoch": 57, "lr": 9.801839123180345e-05} +{"train_loss": 0.010409696027636528, "global_step": 6875, "epoch": 57, "lr": 9.801777364283444e-05} +{"train_loss": 0.011363198049366474, "global_step": 6876, "epoch": 57, "lr": 9.801715595958767e-05} +{"train_loss": 0.011758153326809406, "global_step": 6877, "epoch": 57, "lr": 9.801653818206435e-05} +{"train_loss": 0.012845853343605995, "global_step": 6878, "epoch": 57, "lr": 9.801592031026567e-05} +{"train_loss": 0.014467538334429264, "global_step": 6879, "epoch": 57, "lr": 9.801530234419287e-05} +{"train_loss": 0.014489805325865746, "global_step": 6880, "epoch": 57, "lr": 9.801468428384716e-05} +{"train_loss": 0.009671248495578766, "global_step": 6881, "epoch": 57, "lr": 9.801406612922974e-05} +{"train_loss": 0.015341196209192276, "global_step": 6882, "epoch": 57, "lr": 9.801344788034183e-05} +{"train_loss": 0.008821303024888039, "global_step": 6883, "epoch": 57, "lr": 9.801282953718465e-05} +{"train_loss": 0.013005408458411694, "global_step": 6884, "epoch": 57, "lr": 9.80122110997594e-05} +{"train_loss": 0.012998824007809162, "global_step": 6885, "epoch": 57, "lr": 9.801159256806731e-05} +{"train_loss": 0.010879934765398502, "global_step": 6886, "epoch": 57, "lr": 9.801097394210958e-05} +{"train_loss": 0.008331402204930782, "global_step": 6887, "epoch": 57, "lr": 9.801035522188745e-05} +{"train_loss": 0.010314585641026497, "global_step": 6888, "epoch": 57, "lr": 9.80097364074021e-05} +{"train_loss": 0.015724975615739822, "global_step": 6889, "epoch": 57, "lr": 9.800911749865476e-05} +{"train_loss": 0.016872746869921684, "global_step": 6890, "epoch": 57, "lr": 9.800849849564664e-05} +{"train_loss": 0.013036119751632214, "global_step": 6891, "epoch": 57, "lr": 9.800787939837899e-05} +{"train_loss": 0.014235329814255238, "global_step": 6892, "epoch": 57, "lr": 9.800726020685298e-05} +{"train_loss": 0.011240932159125805, "global_step": 6893, "epoch": 57, "lr": 9.800664092106983e-05} +{"train_loss": 0.011453716084361076, "global_step": 6894, "epoch": 57, "lr": 9.80060215410308e-05} +{"train_loss": 0.012731482274830341, "global_step": 6895, "epoch": 57, "lr": 9.800540206673705e-05} +{"train_loss": 0.010375856421887875, "global_step": 6896, "epoch": 57, "lr": 9.800478249818984e-05} +{"train_loss": 0.014610186219215393, "global_step": 6897, "epoch": 57, "lr": 9.800416283539036e-05} +{"train_loss": 0.01140532921999693, "global_step": 6898, "epoch": 57, "lr": 9.800354307833983e-05} +{"train_loss": 0.011285609565675259, "global_step": 6899, "epoch": 57, "lr": 9.800292322703948e-05} +{"train_loss": 0.012001391500234604, "global_step": 6900, "epoch": 57, "lr": 9.800230328149051e-05} +{"train_loss": 0.012847258020661959, "global_step": 6901, "epoch": 57, "lr": 9.800168324169415e-05, "val_loss": 0.01606767624616623} +{"train_loss": 0.0069113122299313545, "global_step": 6902, "epoch": 58, "lr": 9.800106310765163e-05} +{"train_loss": 0.010427514091134071, "global_step": 6903, "epoch": 58, "lr": 9.800044287936412e-05} +{"train_loss": 0.013139511458575726, "global_step": 6904, "epoch": 58, "lr": 9.799982255683289e-05} +{"train_loss": 0.010510970838367939, "global_step": 6905, "epoch": 58, "lr": 9.799920214005912e-05} +{"train_loss": 0.006816212087869644, "global_step": 6906, "epoch": 58, "lr": 9.799858162904405e-05} +{"train_loss": 0.010285194963216782, "global_step": 6907, "epoch": 58, "lr": 9.799796102378891e-05} +{"train_loss": 0.008675020188093185, "global_step": 6908, "epoch": 58, "lr": 9.799734032429489e-05} +{"train_loss": 0.010240957140922546, "global_step": 6909, "epoch": 58, "lr": 9.799671953056321e-05} +{"train_loss": 0.02012011408805847, "global_step": 6910, "epoch": 58, "lr": 9.799609864259511e-05} +{"train_loss": 0.008123574778437614, "global_step": 6911, "epoch": 58, "lr": 9.799547766039179e-05} +{"train_loss": 0.013856083154678345, "global_step": 6912, "epoch": 58, "lr": 9.799485658395448e-05} +{"train_loss": 0.011165482923388481, "global_step": 6913, "epoch": 58, "lr": 9.79942354132844e-05} +{"train_loss": 0.012988452799618244, "global_step": 6914, "epoch": 58, "lr": 9.799361414838278e-05} +{"train_loss": 0.013403882272541523, "global_step": 6915, "epoch": 58, "lr": 9.79929927892508e-05} +{"train_loss": 0.009385650046169758, "global_step": 6916, "epoch": 58, "lr": 9.799237133588972e-05} +{"train_loss": 0.012177339754998684, "global_step": 6917, "epoch": 58, "lr": 9.799174978830073e-05} +{"train_loss": 0.008597288280725479, "global_step": 6918, "epoch": 58, "lr": 9.799112814648507e-05} +{"train_loss": 0.009409013204276562, "global_step": 6919, "epoch": 58, "lr": 9.799050641044398e-05} +{"train_loss": 0.009387440979480743, "global_step": 6920, "epoch": 58, "lr": 9.798988458017865e-05} +{"train_loss": 0.013632144778966904, "global_step": 6921, "epoch": 58, "lr": 9.79892626556903e-05} +{"train_loss": 0.009039848111569881, "global_step": 6922, "epoch": 58, "lr": 9.798864063698016e-05} +{"train_loss": 0.015474777668714523, "global_step": 6923, "epoch": 58, "lr": 9.798801852404947e-05} +{"train_loss": 0.011788245290517807, "global_step": 6924, "epoch": 58, "lr": 9.798739631689939e-05} +{"train_loss": 0.015926389023661613, "global_step": 6925, "epoch": 58, "lr": 9.798677401553123e-05} +{"train_loss": 0.00963155459612608, "global_step": 6926, "epoch": 58, "lr": 9.798615161994614e-05} +{"train_loss": 0.012142674997448921, "global_step": 6927, "epoch": 58, "lr": 9.798552913014537e-05} +{"train_loss": 0.010349269956350327, "global_step": 6928, "epoch": 58, "lr": 9.798490654613014e-05} +{"train_loss": 0.014530356973409653, "global_step": 6929, "epoch": 58, "lr": 9.798428386790168e-05} +{"train_loss": 0.008006619289517403, "global_step": 6930, "epoch": 58, "lr": 9.79836610954612e-05} +{"train_loss": 0.010314935818314552, "global_step": 6931, "epoch": 58, "lr": 9.798303822880992e-05} +{"train_loss": 0.0171703789383173, "global_step": 6932, "epoch": 58, "lr": 9.79824152679491e-05} +{"train_loss": 0.00845347810536623, "global_step": 6933, "epoch": 58, "lr": 9.798179221287991e-05} +{"train_loss": 0.011288351379334927, "global_step": 6934, "epoch": 58, "lr": 9.79811690636036e-05} +{"train_loss": 0.014520915225148201, "global_step": 6935, "epoch": 58, "lr": 9.798054582012138e-05} +{"train_loss": 0.012524407356977463, "global_step": 6936, "epoch": 58, "lr": 9.79799224824345e-05} +{"train_loss": 0.016793079674243927, "global_step": 6937, "epoch": 58, "lr": 9.797929905054417e-05} +{"train_loss": 0.01088415551930666, "global_step": 6938, "epoch": 58, "lr": 9.797867552445159e-05} +{"train_loss": 0.011183270253241062, "global_step": 6939, "epoch": 58, "lr": 9.797805190415803e-05} +{"train_loss": 0.025569431483745575, "global_step": 6940, "epoch": 58, "lr": 9.797742818966467e-05} +{"train_loss": 0.010182914324104786, "global_step": 6941, "epoch": 58, "lr": 9.797680438097277e-05} +{"train_loss": 0.01068172138184309, "global_step": 6942, "epoch": 58, "lr": 9.797618047808354e-05} +{"train_loss": 0.014423110522329807, "global_step": 6943, "epoch": 58, "lr": 9.797555648099821e-05} +{"train_loss": 0.010512718930840492, "global_step": 6944, "epoch": 58, "lr": 9.797493238971799e-05} +{"train_loss": 0.013424103148281574, "global_step": 6945, "epoch": 58, "lr": 9.797430820424412e-05} +{"train_loss": 0.012999486178159714, "global_step": 6946, "epoch": 58, "lr": 9.797368392457782e-05} +{"train_loss": 0.009958982467651367, "global_step": 6947, "epoch": 58, "lr": 9.797305955072032e-05} +{"train_loss": 0.012026308104395866, "global_step": 6948, "epoch": 58, "lr": 9.797243508267284e-05} +{"train_loss": 0.009533729404211044, "global_step": 6949, "epoch": 58, "lr": 9.79718105204366e-05} +{"train_loss": 0.009012937545776367, "global_step": 6950, "epoch": 58, "lr": 9.797118586401285e-05} +{"train_loss": 0.018500056117773056, "global_step": 6951, "epoch": 58, "lr": 9.79705611134028e-05} +{"train_loss": 0.011143929325044155, "global_step": 6952, "epoch": 58, "lr": 9.796993626860767e-05} +{"train_loss": 0.011064411140978336, "global_step": 6953, "epoch": 58, "lr": 9.79693113296287e-05} +{"train_loss": 0.011761934496462345, "global_step": 6954, "epoch": 58, "lr": 9.79686862964671e-05} +{"train_loss": 0.013333828188478947, "global_step": 6955, "epoch": 58, "lr": 9.796806116912412e-05} +{"train_loss": 0.011206294409930706, "global_step": 6956, "epoch": 58, "lr": 9.796743594760098e-05} +{"train_loss": 0.013071960769593716, "global_step": 6957, "epoch": 58, "lr": 9.79668106318989e-05} +{"train_loss": 0.014155171811580658, "global_step": 6958, "epoch": 58, "lr": 9.796618522201911e-05} +{"train_loss": 0.012540699914097786, "global_step": 6959, "epoch": 58, "lr": 9.796555971796284e-05} +{"train_loss": 0.014538929797708988, "global_step": 6960, "epoch": 58, "lr": 9.796493411973133e-05} +{"train_loss": 0.01154314260929823, "global_step": 6961, "epoch": 58, "lr": 9.796430842732578e-05} +{"train_loss": 0.010317651554942131, "global_step": 6962, "epoch": 58, "lr": 9.796368264074745e-05} +{"train_loss": 0.008181724697351456, "global_step": 6963, "epoch": 58, "lr": 9.796305675999752e-05} +{"train_loss": 0.010058458894491196, "global_step": 6964, "epoch": 58, "lr": 9.796243078507728e-05} +{"train_loss": 0.014115314930677414, "global_step": 6965, "epoch": 58, "lr": 9.796180471598793e-05} +{"train_loss": 0.011461224406957626, "global_step": 6966, "epoch": 58, "lr": 9.79611785527307e-05} +{"train_loss": 0.013275965116918087, "global_step": 6967, "epoch": 58, "lr": 9.796055229530682e-05} +{"train_loss": 0.01131105050444603, "global_step": 6968, "epoch": 58, "lr": 9.795992594371751e-05} +{"train_loss": 0.013154576532542706, "global_step": 6969, "epoch": 58, "lr": 9.795929949796402e-05} +{"train_loss": 0.00960827898234129, "global_step": 6970, "epoch": 58, "lr": 9.795867295804758e-05} +{"train_loss": 0.013761380687355995, "global_step": 6971, "epoch": 58, "lr": 9.795804632396937e-05} +{"train_loss": 0.011409043334424496, "global_step": 6972, "epoch": 58, "lr": 9.795741959573069e-05} +{"train_loss": 0.013495618477463722, "global_step": 6973, "epoch": 58, "lr": 9.795679277333273e-05} +{"train_loss": 0.01252876129001379, "global_step": 6974, "epoch": 58, "lr": 9.795616585677674e-05} +{"train_loss": 0.01191679760813713, "global_step": 6975, "epoch": 58, "lr": 9.795553884606394e-05} +{"train_loss": 0.009022857062518597, "global_step": 6976, "epoch": 58, "lr": 9.795491174119555e-05} +{"train_loss": 0.011453637853264809, "global_step": 6977, "epoch": 58, "lr": 9.795428454217284e-05} +{"train_loss": 0.0107607152312994, "global_step": 6978, "epoch": 58, "lr": 9.795365724899698e-05} +{"train_loss": 0.015097024850547314, "global_step": 6979, "epoch": 58, "lr": 9.795302986166925e-05} +{"train_loss": 0.011834998615086079, "global_step": 6980, "epoch": 58, "lr": 9.79524023801909e-05} +{"train_loss": 0.0115819638594985, "global_step": 6981, "epoch": 58, "lr": 9.795177480456309e-05} +{"train_loss": 0.015738502144813538, "global_step": 6982, "epoch": 58, "lr": 9.795114713478711e-05} +{"train_loss": 0.010491314344108105, "global_step": 6983, "epoch": 58, "lr": 9.795051937086417e-05} +{"train_loss": 0.01618460938334465, "global_step": 6984, "epoch": 58, "lr": 9.794989151279552e-05} +{"train_loss": 0.010519636794924736, "global_step": 6985, "epoch": 58, "lr": 9.794926356058236e-05} +{"train_loss": 0.01664290763437748, "global_step": 6986, "epoch": 58, "lr": 9.794863551422598e-05} +{"train_loss": 0.01225134078413248, "global_step": 6987, "epoch": 58, "lr": 9.794800737372753e-05} +{"train_loss": 0.011368251405656338, "global_step": 6988, "epoch": 58, "lr": 9.794737913908832e-05} +{"train_loss": 0.014911822974681854, "global_step": 6989, "epoch": 58, "lr": 9.794675081030955e-05} +{"train_loss": 0.014749908819794655, "global_step": 6990, "epoch": 58, "lr": 9.794612238739244e-05} +{"train_loss": 0.009108120575547218, "global_step": 6991, "epoch": 58, "lr": 9.794549387033827e-05} +{"train_loss": 0.014716686680912971, "global_step": 6992, "epoch": 58, "lr": 9.794486525914822e-05} +{"train_loss": 0.011604047380387783, "global_step": 6993, "epoch": 58, "lr": 9.794423655382356e-05} +{"train_loss": 0.013074437156319618, "global_step": 6994, "epoch": 58, "lr": 9.794360775436552e-05} +{"train_loss": 0.010896359570324421, "global_step": 6995, "epoch": 58, "lr": 9.794297886077532e-05} +{"train_loss": 0.012923206202685833, "global_step": 6996, "epoch": 58, "lr": 9.79423498730542e-05} +{"train_loss": 0.012047127820551395, "global_step": 6997, "epoch": 58, "lr": 9.79417207912034e-05} +{"train_loss": 0.012181579135358334, "global_step": 6998, "epoch": 58, "lr": 9.794109161522416e-05} +{"train_loss": 0.013522910885512829, "global_step": 6999, "epoch": 58, "lr": 9.79404623451177e-05} +{"train_loss": 0.008430576883256435, "global_step": 7000, "epoch": 58, "lr": 9.793983298088528e-05} +{"train_loss": 0.014768050983548164, "global_step": 7001, "epoch": 58, "lr": 9.79392035225281e-05} +{"train_loss": 0.011127554811537266, "global_step": 7002, "epoch": 58, "lr": 9.793857397004742e-05} +{"train_loss": 0.011015095748007298, "global_step": 7003, "epoch": 58, "lr": 9.793794432344447e-05} +{"train_loss": 0.008552903309464455, "global_step": 7004, "epoch": 58, "lr": 9.793731458272049e-05} +{"train_loss": 0.012795875780284405, "global_step": 7005, "epoch": 58, "lr": 9.793668474787672e-05} +{"train_loss": 0.010748091153800488, "global_step": 7006, "epoch": 58, "lr": 9.793605481891437e-05} +{"train_loss": 0.011510951444506645, "global_step": 7007, "epoch": 58, "lr": 9.793542479583471e-05} +{"train_loss": 0.010517148301005363, "global_step": 7008, "epoch": 58, "lr": 9.793479467863898e-05} +{"train_loss": 0.00786207802593708, "global_step": 7009, "epoch": 58, "lr": 9.793416446732839e-05} +{"train_loss": 0.010015666484832764, "global_step": 7010, "epoch": 58, "lr": 9.793353416190419e-05} +{"train_loss": 0.011796673759818077, "global_step": 7011, "epoch": 58, "lr": 9.79329037623676e-05} +{"train_loss": 0.008929576724767685, "global_step": 7012, "epoch": 58, "lr": 9.79322732687199e-05} +{"train_loss": 0.010662805289030075, "global_step": 7013, "epoch": 58, "lr": 9.793164268096229e-05} +{"train_loss": 0.01110985316336155, "global_step": 7014, "epoch": 58, "lr": 9.793101199909602e-05} +{"train_loss": 0.007922332733869553, "global_step": 7015, "epoch": 58, "lr": 9.793038122312233e-05} +{"train_loss": 0.007702638860791922, "global_step": 7016, "epoch": 58, "lr": 9.792975035304245e-05} +{"train_loss": 0.016140297055244446, "global_step": 7017, "epoch": 58, "lr": 9.792911938885765e-05} +{"train_loss": 0.016858255490660667, "global_step": 7018, "epoch": 58, "lr": 9.792848833056914e-05} +{"train_loss": 0.015429094433784485, "global_step": 7019, "epoch": 58, "lr": 9.792785717817814e-05} +{"train_loss": 0.011966660270514358, "global_step": 7020, "epoch": 58, "lr": 9.792722593168593e-05, "val_loss": 0.017246071249246597} +{"train_loss": 0.01279886532574892, "global_step": 7021, "epoch": 59, "lr": 9.792659459109372e-05} +{"train_loss": 0.008331852965056896, "global_step": 7022, "epoch": 59, "lr": 9.792596315640277e-05} +{"train_loss": 0.016023600473999977, "global_step": 7023, "epoch": 59, "lr": 9.792533162761431e-05} +{"train_loss": 0.012684856541454792, "global_step": 7024, "epoch": 59, "lr": 9.792470000472958e-05} +{"train_loss": 0.015122001059353352, "global_step": 7025, "epoch": 59, "lr": 9.792406828774982e-05} +{"train_loss": 0.01064413134008646, "global_step": 7026, "epoch": 59, "lr": 9.792343647667627e-05} +{"train_loss": 0.007043397054076195, "global_step": 7027, "epoch": 59, "lr": 9.792280457151018e-05} +{"train_loss": 0.01324156392365694, "global_step": 7028, "epoch": 59, "lr": 9.792217257225278e-05} +{"train_loss": 0.012572973035275936, "global_step": 7029, "epoch": 59, "lr": 9.792154047890531e-05} +{"train_loss": 0.009192690253257751, "global_step": 7030, "epoch": 59, "lr": 9.792090829146903e-05} +{"train_loss": 0.011981531046330929, "global_step": 7031, "epoch": 59, "lr": 9.792027600994516e-05} +{"train_loss": 0.009545236825942993, "global_step": 7032, "epoch": 59, "lr": 9.791964363433494e-05} +{"train_loss": 0.013050052337348461, "global_step": 7033, "epoch": 59, "lr": 9.791901116463962e-05} +{"train_loss": 0.009229558520019054, "global_step": 7034, "epoch": 59, "lr": 9.791837860086044e-05} +{"train_loss": 0.01099881250411272, "global_step": 7035, "epoch": 59, "lr": 9.791774594299865e-05} +{"train_loss": 0.013667271472513676, "global_step": 7036, "epoch": 59, "lr": 9.791711319105548e-05} +{"train_loss": 0.009803134016692638, "global_step": 7037, "epoch": 59, "lr": 9.791648034503218e-05} +{"train_loss": 0.008103953674435616, "global_step": 7038, "epoch": 59, "lr": 9.791584740492999e-05} +{"train_loss": 0.013713819906115532, "global_step": 7039, "epoch": 59, "lr": 9.791521437075016e-05} +{"train_loss": 0.009055803529918194, "global_step": 7040, "epoch": 59, "lr": 9.791458124249391e-05} +{"train_loss": 0.013367248699069023, "global_step": 7041, "epoch": 59, "lr": 9.791394802016249e-05} +{"train_loss": 0.013825108297169209, "global_step": 7042, "epoch": 59, "lr": 9.791331470375718e-05} +{"train_loss": 0.014412269927561283, "global_step": 7043, "epoch": 59, "lr": 9.791268129327918e-05} +{"train_loss": 0.010674062184989452, "global_step": 7044, "epoch": 59, "lr": 9.791204778872975e-05} +{"train_loss": 0.015165475197136402, "global_step": 7045, "epoch": 59, "lr": 9.791141419011013e-05} +{"train_loss": 0.010191291570663452, "global_step": 7046, "epoch": 59, "lr": 9.791078049742158e-05} +{"train_loss": 0.015487761236727238, "global_step": 7047, "epoch": 59, "lr": 9.791014671066532e-05} +{"train_loss": 0.0113391587510705, "global_step": 7048, "epoch": 59, "lr": 9.79095128298426e-05} +{"train_loss": 0.015821672976017, "global_step": 7049, "epoch": 59, "lr": 9.790887885495468e-05} +{"train_loss": 0.012486372143030167, "global_step": 7050, "epoch": 59, "lr": 9.790824478600279e-05} +{"train_loss": 0.01236169133335352, "global_step": 7051, "epoch": 59, "lr": 9.790761062298819e-05} +{"train_loss": 0.015758009627461433, "global_step": 7052, "epoch": 59, "lr": 9.79069763659121e-05} +{"train_loss": 0.015431895852088928, "global_step": 7053, "epoch": 59, "lr": 9.790634201477579e-05} +{"train_loss": 0.008099359460175037, "global_step": 7054, "epoch": 59, "lr": 9.790570756958049e-05} +{"train_loss": 0.014986301772296429, "global_step": 7055, "epoch": 59, "lr": 9.790507303032745e-05} +{"train_loss": 0.008317905478179455, "global_step": 7056, "epoch": 59, "lr": 9.790443839701792e-05} +{"train_loss": 0.012214289046823978, "global_step": 7057, "epoch": 59, "lr": 9.790380366965315e-05} +{"train_loss": 0.009773737750947475, "global_step": 7058, "epoch": 59, "lr": 9.790316884823436e-05} +{"train_loss": 0.010943317785859108, "global_step": 7059, "epoch": 59, "lr": 9.790253393276283e-05} +{"train_loss": 0.010640670545399189, "global_step": 7060, "epoch": 59, "lr": 9.79018989232398e-05} +{"train_loss": 0.009023334830999374, "global_step": 7061, "epoch": 59, "lr": 9.79012638196665e-05} +{"train_loss": 0.014276852831244469, "global_step": 7062, "epoch": 59, "lr": 9.790062862204418e-05} +{"train_loss": 0.010034550912678242, "global_step": 7063, "epoch": 59, "lr": 9.78999933303741e-05} +{"train_loss": 0.007230039685964584, "global_step": 7064, "epoch": 59, "lr": 9.78993579446575e-05} +{"train_loss": 0.011694874614477158, "global_step": 7065, "epoch": 59, "lr": 9.789872246489562e-05} +{"train_loss": 0.009291654452681541, "global_step": 7066, "epoch": 59, "lr": 9.789808689108972e-05} +{"train_loss": 0.009065840393304825, "global_step": 7067, "epoch": 59, "lr": 9.789745122324105e-05} +{"train_loss": 0.014024796895682812, "global_step": 7068, "epoch": 59, "lr": 9.789681546135086e-05} +{"train_loss": 0.011642144061625004, "global_step": 7069, "epoch": 59, "lr": 9.789617960542037e-05} +{"train_loss": 0.014445524662733078, "global_step": 7070, "epoch": 59, "lr": 9.789554365545085e-05} +{"train_loss": 0.010964149609208107, "global_step": 7071, "epoch": 59, "lr": 9.789490761144356e-05} +{"train_loss": 0.010879259556531906, "global_step": 7072, "epoch": 59, "lr": 9.789427147339972e-05} +{"train_loss": 0.009013472124934196, "global_step": 7073, "epoch": 59, "lr": 9.78936352413206e-05} +{"train_loss": 0.007792247459292412, "global_step": 7074, "epoch": 59, "lr": 9.789299891520746e-05} +{"train_loss": 0.013020158745348454, "global_step": 7075, "epoch": 59, "lr": 9.78923624950615e-05} +{"train_loss": 0.00986421387642622, "global_step": 7076, "epoch": 59, "lr": 9.789172598088403e-05} +{"train_loss": 0.006908649578690529, "global_step": 7077, "epoch": 59, "lr": 9.789108937267628e-05} +{"train_loss": 0.013476419262588024, "global_step": 7078, "epoch": 59, "lr": 9.789045267043948e-05} +{"train_loss": 0.008742314763367176, "global_step": 7079, "epoch": 59, "lr": 9.788981587417488e-05} +{"train_loss": 0.01007439661771059, "global_step": 7080, "epoch": 59, "lr": 9.788917898388376e-05} +{"train_loss": 0.009081433527171612, "global_step": 7081, "epoch": 59, "lr": 9.788854199956735e-05} +{"train_loss": 0.013408463448286057, "global_step": 7082, "epoch": 59, "lr": 9.78879049212269e-05} +{"train_loss": 0.016171330586075783, "global_step": 7083, "epoch": 59, "lr": 9.788726774886366e-05} +{"train_loss": 0.011363664641976357, "global_step": 7084, "epoch": 59, "lr": 9.788663048247888e-05} +{"train_loss": 0.012172099202871323, "global_step": 7085, "epoch": 59, "lr": 9.788599312207384e-05} +{"train_loss": 0.01188964769244194, "global_step": 7086, "epoch": 59, "lr": 9.788535566764975e-05} +{"train_loss": 0.015462933108210564, "global_step": 7087, "epoch": 59, "lr": 9.78847181192079e-05} +{"train_loss": 0.014109390787780285, "global_step": 7088, "epoch": 59, "lr": 9.788408047674949e-05} +{"train_loss": 0.009565186686813831, "global_step": 7089, "epoch": 59, "lr": 9.788344274027584e-05} +{"train_loss": 0.013683163560926914, "global_step": 7090, "epoch": 59, "lr": 9.788280490978814e-05} +{"train_loss": 0.009884227998554707, "global_step": 7091, "epoch": 59, "lr": 9.788216698528767e-05} +{"train_loss": 0.011731266044080257, "global_step": 7092, "epoch": 59, "lr": 9.788152896677569e-05} +{"train_loss": 0.011741232126951218, "global_step": 7093, "epoch": 59, "lr": 9.788089085425343e-05} +{"train_loss": 0.011979817412793636, "global_step": 7094, "epoch": 59, "lr": 9.788025264772218e-05} +{"train_loss": 0.014149636961519718, "global_step": 7095, "epoch": 59, "lr": 9.787961434718314e-05} +{"train_loss": 0.009495305828750134, "global_step": 7096, "epoch": 59, "lr": 9.787897595263762e-05} +{"train_loss": 0.013610457070171833, "global_step": 7097, "epoch": 59, "lr": 9.787833746408684e-05} +{"train_loss": 0.014254053123295307, "global_step": 7098, "epoch": 59, "lr": 9.787769888153204e-05} +{"train_loss": 0.01068157609552145, "global_step": 7099, "epoch": 59, "lr": 9.787706020497451e-05} +{"train_loss": 0.01175958476960659, "global_step": 7100, "epoch": 59, "lr": 9.787642143441548e-05} +{"train_loss": 0.011456168256700039, "global_step": 7101, "epoch": 59, "lr": 9.787578256985621e-05} +{"train_loss": 0.01386266015470028, "global_step": 7102, "epoch": 59, "lr": 9.787514361129796e-05} +{"train_loss": 0.009574946947395802, "global_step": 7103, "epoch": 59, "lr": 9.787450455874199e-05} +{"train_loss": 0.01038843858987093, "global_step": 7104, "epoch": 59, "lr": 9.787386541218953e-05} +{"train_loss": 0.013980185613036156, "global_step": 7105, "epoch": 59, "lr": 9.787322617164186e-05} +{"train_loss": 0.012378520332276821, "global_step": 7106, "epoch": 59, "lr": 9.787258683710021e-05} +{"train_loss": 0.014049299992620945, "global_step": 7107, "epoch": 59, "lr": 9.787194740856586e-05} +{"train_loss": 0.011385760270059109, "global_step": 7108, "epoch": 59, "lr": 9.787130788604007e-05} +{"train_loss": 0.01456709299236536, "global_step": 7109, "epoch": 59, "lr": 9.787066826952405e-05} +{"train_loss": 0.013003593310713768, "global_step": 7110, "epoch": 59, "lr": 9.78700285590191e-05} +{"train_loss": 0.01219384279102087, "global_step": 7111, "epoch": 59, "lr": 9.786938875452648e-05} +{"train_loss": 0.014745024964213371, "global_step": 7112, "epoch": 59, "lr": 9.786874885604742e-05} +{"train_loss": 0.00953077245503664, "global_step": 7113, "epoch": 59, "lr": 9.786810886358318e-05} +{"train_loss": 0.012498673051595688, "global_step": 7114, "epoch": 59, "lr": 9.786746877713502e-05} +{"train_loss": 0.008126987144351006, "global_step": 7115, "epoch": 59, "lr": 9.786682859670419e-05} +{"train_loss": 0.01170018594712019, "global_step": 7116, "epoch": 59, "lr": 9.786618832229198e-05} +{"train_loss": 0.01104727666825056, "global_step": 7117, "epoch": 59, "lr": 9.786554795389962e-05} +{"train_loss": 0.012802822515368462, "global_step": 7118, "epoch": 59, "lr": 9.786490749152836e-05} +{"train_loss": 0.019095638766884804, "global_step": 7119, "epoch": 59, "lr": 9.786426693517947e-05} +{"train_loss": 0.013907944783568382, "global_step": 7120, "epoch": 59, "lr": 9.78636262848542e-05} +{"train_loss": 0.009599958546459675, "global_step": 7121, "epoch": 59, "lr": 9.786298554055382e-05} +{"train_loss": 0.01593547873198986, "global_step": 7122, "epoch": 59, "lr": 9.786234470227957e-05} +{"train_loss": 0.010112252086400986, "global_step": 7123, "epoch": 59, "lr": 9.786170377003275e-05} +{"train_loss": 0.013907251879572868, "global_step": 7124, "epoch": 59, "lr": 9.786106274381456e-05} +{"train_loss": 0.010476022027432919, "global_step": 7125, "epoch": 59, "lr": 9.78604216236263e-05} +{"train_loss": 0.01362135261297226, "global_step": 7126, "epoch": 59, "lr": 9.78597804094692e-05} +{"train_loss": 0.014352075755596161, "global_step": 7127, "epoch": 59, "lr": 9.785913910134454e-05} +{"train_loss": 0.01634104922413826, "global_step": 7128, "epoch": 59, "lr": 9.785849769925357e-05} +{"train_loss": 0.012943225912749767, "global_step": 7129, "epoch": 59, "lr": 9.785785620319756e-05} +{"train_loss": 0.012107497081160545, "global_step": 7130, "epoch": 59, "lr": 9.785721461317777e-05} +{"train_loss": 0.010766142047941685, "global_step": 7131, "epoch": 59, "lr": 9.785657292919544e-05} +{"train_loss": 0.013938698917627335, "global_step": 7132, "epoch": 59, "lr": 9.785593115125184e-05} +{"train_loss": 0.010192912071943283, "global_step": 7133, "epoch": 59, "lr": 9.785528927934824e-05} +{"train_loss": 0.011317084543406963, "global_step": 7134, "epoch": 59, "lr": 9.785464731348591e-05} +{"train_loss": 0.0178394578397274, "global_step": 7135, "epoch": 59, "lr": 9.785400525366606e-05} +{"train_loss": 0.017209166660904884, "global_step": 7136, "epoch": 59, "lr": 9.785336309989e-05} +{"train_loss": 0.017063569277524948, "global_step": 7137, "epoch": 59, "lr": 9.785272085215897e-05} +{"train_loss": 0.01256223302334547, "global_step": 7138, "epoch": 59, "lr": 9.785207851047422e-05} +{"train_loss": 0.012086092079637432, "global_step": 7139, "epoch": 59, "lr": 9.785143607483704e-05, "val_loss": 0.021759554743766785} +{"train_loss": 0.014753397554159164, "global_step": 7140, "epoch": 60, "lr": 9.785079354524868e-05} +{"train_loss": 0.009801502339541912, "global_step": 7141, "epoch": 60, "lr": 9.78501509217104e-05} +{"train_loss": 0.012195611372590065, "global_step": 7142, "epoch": 60, "lr": 9.784950820422345e-05} +{"train_loss": 0.007202948443591595, "global_step": 7143, "epoch": 60, "lr": 9.784886539278912e-05} +{"train_loss": 0.013032191433012486, "global_step": 7144, "epoch": 60, "lr": 9.784822248740864e-05} +{"train_loss": 0.010625631548464298, "global_step": 7145, "epoch": 60, "lr": 9.784757948808329e-05} +{"train_loss": 0.017109135165810585, "global_step": 7146, "epoch": 60, "lr": 9.784693639481432e-05} +{"train_loss": 0.01149927917867899, "global_step": 7147, "epoch": 60, "lr": 9.784629320760302e-05} +{"train_loss": 0.013887044042348862, "global_step": 7148, "epoch": 60, "lr": 9.784564992645063e-05} +{"train_loss": 0.011544027365744114, "global_step": 7149, "epoch": 60, "lr": 9.784500655135842e-05} +{"train_loss": 0.012267260812222958, "global_step": 7150, "epoch": 60, "lr": 9.784436308232765e-05} +{"train_loss": 0.009304393082857132, "global_step": 7151, "epoch": 60, "lr": 9.784371951935957e-05} +{"train_loss": 0.010193385183811188, "global_step": 7152, "epoch": 60, "lr": 9.784307586245547e-05} +{"train_loss": 0.010442198254168034, "global_step": 7153, "epoch": 60, "lr": 9.78424321116166e-05} +{"train_loss": 0.011917655356228352, "global_step": 7154, "epoch": 60, "lr": 9.784178826684423e-05} +{"train_loss": 0.017344169318675995, "global_step": 7155, "epoch": 60, "lr": 9.784114432813962e-05} +{"train_loss": 0.013110650703310966, "global_step": 7156, "epoch": 60, "lr": 9.784050029550402e-05} +{"train_loss": 0.007343834266066551, "global_step": 7157, "epoch": 60, "lr": 9.783985616893872e-05} +{"train_loss": 0.011634440161287785, "global_step": 7158, "epoch": 60, "lr": 9.783921194844498e-05} +{"train_loss": 0.008390394039452076, "global_step": 7159, "epoch": 60, "lr": 9.783856763402406e-05} +{"train_loss": 0.013621101155877113, "global_step": 7160, "epoch": 60, "lr": 9.783792322567721e-05} +{"train_loss": 0.009942663833498955, "global_step": 7161, "epoch": 60, "lr": 9.783727872340572e-05} +{"train_loss": 0.013906341046094894, "global_step": 7162, "epoch": 60, "lr": 9.783663412721083e-05} +{"train_loss": 0.008795605972409248, "global_step": 7163, "epoch": 60, "lr": 9.783598943709382e-05} +{"train_loss": 0.012070396915078163, "global_step": 7164, "epoch": 60, "lr": 9.783534465305597e-05} +{"train_loss": 0.013433658517897129, "global_step": 7165, "epoch": 60, "lr": 9.783469977509852e-05} +{"train_loss": 0.008109662681818008, "global_step": 7166, "epoch": 60, "lr": 9.783405480322274e-05} +{"train_loss": 0.007103313691914082, "global_step": 7167, "epoch": 60, "lr": 9.783340973742992e-05} +{"train_loss": 0.01227275189012289, "global_step": 7168, "epoch": 60, "lr": 9.78327645777213e-05} +{"train_loss": 0.013758789747953415, "global_step": 7169, "epoch": 60, "lr": 9.783211932409818e-05} +{"train_loss": 0.012628499418497086, "global_step": 7170, "epoch": 60, "lr": 9.783147397656177e-05} +{"train_loss": 0.012067249976098537, "global_step": 7171, "epoch": 60, "lr": 9.783082853511338e-05} +{"train_loss": 0.009628135710954666, "global_step": 7172, "epoch": 60, "lr": 9.783018299975428e-05} +{"train_loss": 0.012977038510143757, "global_step": 7173, "epoch": 60, "lr": 9.782953737048573e-05} +{"train_loss": 0.010506383143365383, "global_step": 7174, "epoch": 60, "lr": 9.782889164730898e-05} +{"train_loss": 0.011639820411801338, "global_step": 7175, "epoch": 60, "lr": 9.78282458302253e-05} +{"train_loss": 0.009345905855298042, "global_step": 7176, "epoch": 60, "lr": 9.782759991923599e-05} +{"train_loss": 0.010724741034209728, "global_step": 7177, "epoch": 60, "lr": 9.782695391434229e-05} +{"train_loss": 0.009957874193787575, "global_step": 7178, "epoch": 60, "lr": 9.782630781554547e-05} +{"train_loss": 0.008224181830883026, "global_step": 7179, "epoch": 60, "lr": 9.78256616228468e-05} +{"train_loss": 0.0124811427667737, "global_step": 7180, "epoch": 60, "lr": 9.782501533624758e-05} +{"train_loss": 0.009855317883193493, "global_step": 7181, "epoch": 60, "lr": 9.782436895574903e-05} +{"train_loss": 0.009974784217774868, "global_step": 7182, "epoch": 60, "lr": 9.782372248135244e-05} +{"train_loss": 0.007324845064431429, "global_step": 7183, "epoch": 60, "lr": 9.782307591305908e-05} +{"train_loss": 0.00997504498809576, "global_step": 7184, "epoch": 60, "lr": 9.782242925087024e-05} +{"train_loss": 0.011596509255468845, "global_step": 7185, "epoch": 60, "lr": 9.782178249478716e-05} +{"train_loss": 0.009461525827646255, "global_step": 7186, "epoch": 60, "lr": 9.78211356448111e-05} +{"train_loss": 0.013808129355311394, "global_step": 7187, "epoch": 60, "lr": 9.782048870094336e-05} +{"train_loss": 0.012595477513968945, "global_step": 7188, "epoch": 60, "lr": 9.781984166318521e-05} +{"train_loss": 0.020596832036972046, "global_step": 7189, "epoch": 60, "lr": 9.78191945315379e-05} +{"train_loss": 0.015237787738442421, "global_step": 7190, "epoch": 60, "lr": 9.78185473060027e-05} +{"train_loss": 0.009179909713566303, "global_step": 7191, "epoch": 60, "lr": 9.781789998658091e-05} +{"train_loss": 0.010567697696387768, "global_step": 7192, "epoch": 60, "lr": 9.781725257327377e-05} +{"train_loss": 0.01090442854911089, "global_step": 7193, "epoch": 60, "lr": 9.781660506608256e-05} +{"train_loss": 0.011645903810858727, "global_step": 7194, "epoch": 60, "lr": 9.781595746500857e-05} +{"train_loss": 0.01686965674161911, "global_step": 7195, "epoch": 60, "lr": 9.781530977005304e-05} +{"train_loss": 0.012003454379737377, "global_step": 7196, "epoch": 60, "lr": 9.781466198121727e-05} +{"train_loss": 0.016492372378706932, "global_step": 7197, "epoch": 60, "lr": 9.781401409850253e-05} +{"train_loss": 0.013601548969745636, "global_step": 7198, "epoch": 60, "lr": 9.781336612191006e-05} +{"train_loss": 0.012255853973329067, "global_step": 7199, "epoch": 60, "lr": 9.781271805144116e-05} +{"train_loss": 0.011017021723091602, "global_step": 7200, "epoch": 60, "lr": 9.781206988709709e-05} +{"train_loss": 0.012098618783056736, "global_step": 7201, "epoch": 60, "lr": 9.781142162887912e-05} +{"train_loss": 0.012332586571574211, "global_step": 7202, "epoch": 60, "lr": 9.781077327678856e-05} +{"train_loss": 0.009459982626140118, "global_step": 7203, "epoch": 60, "lr": 9.781012483082664e-05} +{"train_loss": 0.011682077310979366, "global_step": 7204, "epoch": 60, "lr": 9.780947629099465e-05} +{"train_loss": 0.014852238819003105, "global_step": 7205, "epoch": 60, "lr": 9.780882765729387e-05} +{"train_loss": 0.0168879684060812, "global_step": 7206, "epoch": 60, "lr": 9.780817892972554e-05} +{"train_loss": 0.016230974346399307, "global_step": 7207, "epoch": 60, "lr": 9.780753010829098e-05} +{"train_loss": 0.012463939376175404, "global_step": 7208, "epoch": 60, "lr": 9.780688119299142e-05} +{"train_loss": 0.00960900355130434, "global_step": 7209, "epoch": 60, "lr": 9.780623218382819e-05} +{"train_loss": 0.015990890562534332, "global_step": 7210, "epoch": 60, "lr": 9.78055830808025e-05} +{"train_loss": 0.009962644428014755, "global_step": 7211, "epoch": 60, "lr": 9.780493388391568e-05} +{"train_loss": 0.015019429847598076, "global_step": 7212, "epoch": 60, "lr": 9.780428459316895e-05} +{"train_loss": 0.014496946707367897, "global_step": 7213, "epoch": 60, "lr": 9.780363520856364e-05} +{"train_loss": 0.00934681762009859, "global_step": 7214, "epoch": 60, "lr": 9.780298573010099e-05} +{"train_loss": 0.008830292150378227, "global_step": 7215, "epoch": 60, "lr": 9.780233615778227e-05} +{"train_loss": 0.01029204297810793, "global_step": 7216, "epoch": 60, "lr": 9.780168649160879e-05} +{"train_loss": 0.012595763429999352, "global_step": 7217, "epoch": 60, "lr": 9.78010367315818e-05} +{"train_loss": 0.0168070737272501, "global_step": 7218, "epoch": 60, "lr": 9.780038687770258e-05} +{"train_loss": 0.0175034012645483, "global_step": 7219, "epoch": 60, "lr": 9.77997369299724e-05} +{"train_loss": 0.013424110598862171, "global_step": 7220, "epoch": 60, "lr": 9.779908688839255e-05} +{"train_loss": 0.013829223811626434, "global_step": 7221, "epoch": 60, "lr": 9.779843675296431e-05} +{"train_loss": 0.012387323193252087, "global_step": 7222, "epoch": 60, "lr": 9.779778652368892e-05} +{"train_loss": 0.012907915748655796, "global_step": 7223, "epoch": 60, "lr": 9.779713620056771e-05} +{"train_loss": 0.013737212866544724, "global_step": 7224, "epoch": 60, "lr": 9.779648578360193e-05} +{"train_loss": 0.012825006619095802, "global_step": 7225, "epoch": 60, "lr": 9.779583527279283e-05} +{"train_loss": 0.009661823511123657, "global_step": 7226, "epoch": 60, "lr": 9.779518466814172e-05} +{"train_loss": 0.010735378600656986, "global_step": 7227, "epoch": 60, "lr": 9.779453396964989e-05} +{"train_loss": 0.009711853228509426, "global_step": 7228, "epoch": 60, "lr": 9.77938831773186e-05} +{"train_loss": 0.0058225481770932674, "global_step": 7229, "epoch": 60, "lr": 9.779323229114909e-05} +{"train_loss": 0.010505652986466885, "global_step": 7230, "epoch": 60, "lr": 9.779258131114271e-05} +{"train_loss": 0.013004150241613388, "global_step": 7231, "epoch": 60, "lr": 9.77919302373007e-05} +{"train_loss": 0.015805603936314583, "global_step": 7232, "epoch": 60, "lr": 9.779127906962432e-05} +{"train_loss": 0.010428261011838913, "global_step": 7233, "epoch": 60, "lr": 9.779062780811487e-05} +{"train_loss": 0.011953308247029781, "global_step": 7234, "epoch": 60, "lr": 9.778997645277365e-05} +{"train_loss": 0.011018818244338036, "global_step": 7235, "epoch": 60, "lr": 9.77893250036019e-05} +{"train_loss": 0.012789676897227764, "global_step": 7236, "epoch": 60, "lr": 9.778867346060092e-05} +{"train_loss": 0.013888800516724586, "global_step": 7237, "epoch": 60, "lr": 9.778802182377199e-05} +{"train_loss": 0.016155337914824486, "global_step": 7238, "epoch": 60, "lr": 9.778737009311638e-05} +{"train_loss": 0.010560957714915276, "global_step": 7239, "epoch": 60, "lr": 9.778671826863538e-05} +{"train_loss": 0.014911078847944736, "global_step": 7240, "epoch": 60, "lr": 9.778606635033025e-05} +{"train_loss": 0.012753257527947426, "global_step": 7241, "epoch": 60, "lr": 9.77854143382023e-05} +{"train_loss": 0.008421622216701508, "global_step": 7242, "epoch": 60, "lr": 9.778476223225279e-05} +{"train_loss": 0.012143319472670555, "global_step": 7243, "epoch": 60, "lr": 9.7784110032483e-05} +{"train_loss": 0.011884019710123539, "global_step": 7244, "epoch": 60, "lr": 9.778345773889421e-05} +{"train_loss": 0.009931014850735664, "global_step": 7245, "epoch": 60, "lr": 9.778280535148772e-05} +{"train_loss": 0.014410716481506824, "global_step": 7246, "epoch": 60, "lr": 9.77821528702648e-05} +{"train_loss": 0.011552531272172928, "global_step": 7247, "epoch": 60, "lr": 9.77815002952267e-05} +{"train_loss": 0.008517155423760414, "global_step": 7248, "epoch": 60, "lr": 9.778084762637474e-05} +{"train_loss": 0.012475652620196342, "global_step": 7249, "epoch": 60, "lr": 9.778019486371021e-05} +{"train_loss": 0.012069272808730602, "global_step": 7250, "epoch": 60, "lr": 9.777954200723436e-05} +{"train_loss": 0.012883833609521389, "global_step": 7251, "epoch": 60, "lr": 9.777888905694847e-05} +{"train_loss": 0.015358136035501957, "global_step": 7252, "epoch": 60, "lr": 9.777823601285386e-05} +{"train_loss": 0.00769607350230217, "global_step": 7253, "epoch": 60, "lr": 9.777758287495176e-05} +{"train_loss": 0.015269672498106956, "global_step": 7254, "epoch": 60, "lr": 9.77769296432435e-05} +{"train_loss": 0.011404509656131268, "global_step": 7255, "epoch": 60, "lr": 9.777627631773034e-05} +{"train_loss": 0.01374188344925642, "global_step": 7256, "epoch": 60, "lr": 9.777562289841357e-05} +{"train_loss": 0.01470732968300581, "global_step": 7257, "epoch": 60, "lr": 9.777496938529445e-05} +{"train_loss": 0.012033809790340792, "global_step": 7258, "epoch": 60, "lr": 9.77743157783743e-05, "val_loss": 0.01706315390765667, "train_action_mse_error": 0.0005693091079592705} +{"train_loss": 0.016806699335575104, "global_step": 7259, "epoch": 61, "lr": 9.777366207765438e-05} +{"train_loss": 0.010437256656587124, "global_step": 7260, "epoch": 61, "lr": 9.777300828313598e-05} +{"train_loss": 0.012243843637406826, "global_step": 7261, "epoch": 61, "lr": 9.777235439482037e-05} +{"train_loss": 0.009948251768946648, "global_step": 7262, "epoch": 61, "lr": 9.777170041270887e-05} +{"train_loss": 0.00971523579210043, "global_step": 7263, "epoch": 61, "lr": 9.777104633680272e-05} +{"train_loss": 0.01452963799238205, "global_step": 7264, "epoch": 61, "lr": 9.777039216710322e-05} +{"train_loss": 0.016537416726350784, "global_step": 7265, "epoch": 61, "lr": 9.776973790361169e-05} +{"train_loss": 0.011040098033845425, "global_step": 7266, "epoch": 61, "lr": 9.776908354632934e-05} +{"train_loss": 0.009731022641062737, "global_step": 7267, "epoch": 61, "lr": 9.776842909525753e-05} +{"train_loss": 0.017798740416765213, "global_step": 7268, "epoch": 61, "lr": 9.77677745503975e-05} +{"train_loss": 0.010426797904074192, "global_step": 7269, "epoch": 61, "lr": 9.776711991175053e-05} +{"train_loss": 0.008183843456208706, "global_step": 7270, "epoch": 61, "lr": 9.776646517931796e-05} +{"train_loss": 0.015554402954876423, "global_step": 7271, "epoch": 61, "lr": 9.776581035310101e-05} +{"train_loss": 0.01704130508005619, "global_step": 7272, "epoch": 61, "lr": 9.776515543310101e-05} +{"train_loss": 0.008805329911410809, "global_step": 7273, "epoch": 61, "lr": 9.776450041931923e-05} +{"train_loss": 0.009863781742751598, "global_step": 7274, "epoch": 61, "lr": 9.776384531175696e-05} +{"train_loss": 0.012217004783451557, "global_step": 7275, "epoch": 61, "lr": 9.776319011041545e-05} +{"train_loss": 0.012096972204744816, "global_step": 7276, "epoch": 61, "lr": 9.776253481529606e-05} +{"train_loss": 0.01817566715180874, "global_step": 7277, "epoch": 61, "lr": 9.776187942640002e-05} +{"train_loss": 0.012368280440568924, "global_step": 7278, "epoch": 61, "lr": 9.776122394372863e-05} +{"train_loss": 0.014193709939718246, "global_step": 7279, "epoch": 61, "lr": 9.776056836728318e-05} +{"train_loss": 0.012756098993122578, "global_step": 7280, "epoch": 61, "lr": 9.775991269706496e-05} +{"train_loss": 0.007025877479463816, "global_step": 7281, "epoch": 61, "lr": 9.775925693307525e-05} +{"train_loss": 0.01275444496423006, "global_step": 7282, "epoch": 61, "lr": 9.775860107531534e-05} +{"train_loss": 0.01717912219464779, "global_step": 7283, "epoch": 61, "lr": 9.775794512378653e-05} +{"train_loss": 0.014900223352015018, "global_step": 7284, "epoch": 61, "lr": 9.775728907849009e-05} +{"train_loss": 0.012726275250315666, "global_step": 7285, "epoch": 61, "lr": 9.77566329394273e-05} +{"train_loss": 0.014963001944124699, "global_step": 7286, "epoch": 61, "lr": 9.775597670659948e-05} +{"train_loss": 0.00899425707757473, "global_step": 7287, "epoch": 61, "lr": 9.77553203800079e-05} +{"train_loss": 0.007904290221631527, "global_step": 7288, "epoch": 61, "lr": 9.775466395965384e-05} +{"train_loss": 0.019489724189043045, "global_step": 7289, "epoch": 61, "lr": 9.775400744553862e-05} +{"train_loss": 0.014339916408061981, "global_step": 7290, "epoch": 61, "lr": 9.77533508376635e-05} +{"train_loss": 0.013416154310107231, "global_step": 7291, "epoch": 61, "lr": 9.775269413602976e-05} +{"train_loss": 0.012386954389512539, "global_step": 7292, "epoch": 61, "lr": 9.775203734063873e-05} +{"train_loss": 0.018246587365865707, "global_step": 7293, "epoch": 61, "lr": 9.775138045149166e-05} +{"train_loss": 0.009746326133608818, "global_step": 7294, "epoch": 61, "lr": 9.775072346858986e-05} +{"train_loss": 0.013268990442156792, "global_step": 7295, "epoch": 61, "lr": 9.775006639193462e-05} +{"train_loss": 0.012764480896294117, "global_step": 7296, "epoch": 61, "lr": 9.774940922152722e-05} +{"train_loss": 0.010474558919668198, "global_step": 7297, "epoch": 61, "lr": 9.774875195736897e-05} +{"train_loss": 0.010567380115389824, "global_step": 7298, "epoch": 61, "lr": 9.774809459946113e-05} +{"train_loss": 0.015245896764099598, "global_step": 7299, "epoch": 61, "lr": 9.774743714780503e-05} +{"train_loss": 0.01513221301138401, "global_step": 7300, "epoch": 61, "lr": 9.77467796024019e-05} +{"train_loss": 0.014249904081225395, "global_step": 7301, "epoch": 61, "lr": 9.77461219632531e-05} +{"train_loss": 0.009513571858406067, "global_step": 7302, "epoch": 61, "lr": 9.774546423035989e-05} +{"train_loss": 0.01262443047016859, "global_step": 7303, "epoch": 61, "lr": 9.774480640372356e-05} +{"train_loss": 0.009881293401122093, "global_step": 7304, "epoch": 61, "lr": 9.774414848334539e-05} +{"train_loss": 0.01618453860282898, "global_step": 7305, "epoch": 61, "lr": 9.774349046922668e-05} +{"train_loss": 0.010242273099720478, "global_step": 7306, "epoch": 61, "lr": 9.774283236136875e-05} +{"train_loss": 0.014381133951246738, "global_step": 7307, "epoch": 61, "lr": 9.774217415977285e-05} +{"train_loss": 0.010525447316467762, "global_step": 7308, "epoch": 61, "lr": 9.774151586444031e-05} +{"train_loss": 0.012119499035179615, "global_step": 7309, "epoch": 61, "lr": 9.77408574753724e-05} +{"train_loss": 0.01442914642393589, "global_step": 7310, "epoch": 61, "lr": 9.774019899257041e-05} +{"train_loss": 0.009991287253797054, "global_step": 7311, "epoch": 61, "lr": 9.773954041603563e-05} +{"train_loss": 0.01680763252079487, "global_step": 7312, "epoch": 61, "lr": 9.773888174576938e-05} +{"train_loss": 0.01039192732423544, "global_step": 7313, "epoch": 61, "lr": 9.773822298177293e-05} +{"train_loss": 0.01882309466600418, "global_step": 7314, "epoch": 61, "lr": 9.773756412404758e-05} +{"train_loss": 0.008717375807464123, "global_step": 7315, "epoch": 61, "lr": 9.773690517259462e-05} +{"train_loss": 0.010664097033441067, "global_step": 7316, "epoch": 61, "lr": 9.773624612741534e-05} +{"train_loss": 0.011483361013233662, "global_step": 7317, "epoch": 61, "lr": 9.773558698851106e-05} +{"train_loss": 0.014683561399579048, "global_step": 7318, "epoch": 61, "lr": 9.773492775588305e-05} +{"train_loss": 0.010563846677541733, "global_step": 7319, "epoch": 61, "lr": 9.77342684295326e-05} +{"train_loss": 0.010608414188027382, "global_step": 7320, "epoch": 61, "lr": 9.773360900946102e-05} +{"train_loss": 0.01399492472410202, "global_step": 7321, "epoch": 61, "lr": 9.773294949566958e-05} +{"train_loss": 0.015568502247333527, "global_step": 7322, "epoch": 61, "lr": 9.773228988815961e-05} +{"train_loss": 0.011941495351493359, "global_step": 7323, "epoch": 61, "lr": 9.773163018693239e-05} +{"train_loss": 0.01182502694427967, "global_step": 7324, "epoch": 61, "lr": 9.77309703919892e-05} +{"train_loss": 0.013949286192655563, "global_step": 7325, "epoch": 61, "lr": 9.773031050333137e-05} +{"train_loss": 0.010944013483822346, "global_step": 7326, "epoch": 61, "lr": 9.772965052096016e-05} +{"train_loss": 0.009107517078518867, "global_step": 7327, "epoch": 61, "lr": 9.77289904448769e-05} +{"train_loss": 0.008598106913268566, "global_step": 7328, "epoch": 61, "lr": 9.772833027508283e-05} +{"train_loss": 0.01515447348356247, "global_step": 7329, "epoch": 61, "lr": 9.772767001157931e-05} +{"train_loss": 0.015852611511945724, "global_step": 7330, "epoch": 61, "lr": 9.772700965436759e-05} +{"train_loss": 0.011494331993162632, "global_step": 7331, "epoch": 61, "lr": 9.772634920344901e-05} +{"train_loss": 0.009632114320993423, "global_step": 7332, "epoch": 61, "lr": 9.772568865882482e-05} +{"train_loss": 0.013773409649729729, "global_step": 7333, "epoch": 61, "lr": 9.772502802049634e-05} +{"train_loss": 0.013249342329800129, "global_step": 7334, "epoch": 61, "lr": 9.772436728846488e-05} +{"train_loss": 0.00935947522521019, "global_step": 7335, "epoch": 61, "lr": 9.772370646273172e-05} +{"train_loss": 0.01282479427754879, "global_step": 7336, "epoch": 61, "lr": 9.772304554329816e-05} +{"train_loss": 0.014838643372058868, "global_step": 7337, "epoch": 61, "lr": 9.772238453016549e-05} +{"train_loss": 0.010348248295485973, "global_step": 7338, "epoch": 61, "lr": 9.772172342333504e-05} +{"train_loss": 0.013313379138708115, "global_step": 7339, "epoch": 61, "lr": 9.772106222280806e-05} +{"train_loss": 0.011903652921319008, "global_step": 7340, "epoch": 61, "lr": 9.772040092858587e-05} +{"train_loss": 0.015285022556781769, "global_step": 7341, "epoch": 61, "lr": 9.771973954066978e-05} +{"train_loss": 0.014998958446085453, "global_step": 7342, "epoch": 61, "lr": 9.771907805906109e-05} +{"train_loss": 0.01084771566092968, "global_step": 7343, "epoch": 61, "lr": 9.771841648376108e-05} +{"train_loss": 0.013925023376941681, "global_step": 7344, "epoch": 61, "lr": 9.771775481477106e-05} +{"train_loss": 0.008368374779820442, "global_step": 7345, "epoch": 61, "lr": 9.771709305209232e-05} +{"train_loss": 0.020054753869771957, "global_step": 7346, "epoch": 61, "lr": 9.771643119572616e-05} +{"train_loss": 0.011803126893937588, "global_step": 7347, "epoch": 61, "lr": 9.77157692456739e-05} +{"train_loss": 0.014372160658240318, "global_step": 7348, "epoch": 61, "lr": 9.771510720193682e-05} +{"train_loss": 0.017975157126784325, "global_step": 7349, "epoch": 61, "lr": 9.771444506451621e-05} +{"train_loss": 0.013148674741387367, "global_step": 7350, "epoch": 61, "lr": 9.77137828334134e-05} +{"train_loss": 0.010582027956843376, "global_step": 7351, "epoch": 61, "lr": 9.771312050862968e-05} +{"train_loss": 0.007055670488625765, "global_step": 7352, "epoch": 61, "lr": 9.771245809016633e-05} +{"train_loss": 0.01091718953102827, "global_step": 7353, "epoch": 61, "lr": 9.771179557802468e-05} +{"train_loss": 0.014540818519890308, "global_step": 7354, "epoch": 61, "lr": 9.7711132972206e-05} +{"train_loss": 0.014066439121961594, "global_step": 7355, "epoch": 61, "lr": 9.771047027271163e-05} +{"train_loss": 0.01187338400632143, "global_step": 7356, "epoch": 61, "lr": 9.770980747954283e-05} +{"train_loss": 0.011108380742371082, "global_step": 7357, "epoch": 61, "lr": 9.770914459270093e-05} +{"train_loss": 0.015407728962600231, "global_step": 7358, "epoch": 61, "lr": 9.770848161218722e-05} +{"train_loss": 0.018831396475434303, "global_step": 7359, "epoch": 61, "lr": 9.7707818538003e-05} +{"train_loss": 0.01180937234312296, "global_step": 7360, "epoch": 61, "lr": 9.770715537014956e-05} +{"train_loss": 0.008234234526753426, "global_step": 7361, "epoch": 61, "lr": 9.770649210862824e-05} +{"train_loss": 0.012211454100906849, "global_step": 7362, "epoch": 61, "lr": 9.770582875344032e-05} +{"train_loss": 0.012413074262440205, "global_step": 7363, "epoch": 61, "lr": 9.770516530458709e-05} +{"train_loss": 0.013222914189100266, "global_step": 7364, "epoch": 61, "lr": 9.770450176206987e-05} +{"train_loss": 0.008372189477086067, "global_step": 7365, "epoch": 61, "lr": 9.770383812588995e-05} +{"train_loss": 0.014621134847402573, "global_step": 7366, "epoch": 61, "lr": 9.770317439604866e-05} +{"train_loss": 0.012205514125525951, "global_step": 7367, "epoch": 61, "lr": 9.770251057254726e-05} +{"train_loss": 0.011705364100635052, "global_step": 7368, "epoch": 61, "lr": 9.770184665538708e-05} +{"train_loss": 0.013869409449398518, "global_step": 7369, "epoch": 61, "lr": 9.770118264456944e-05} +{"train_loss": 0.011972312815487385, "global_step": 7370, "epoch": 61, "lr": 9.77005185400956e-05} +{"train_loss": 0.01312166079878807, "global_step": 7371, "epoch": 61, "lr": 9.76998543419669e-05} +{"train_loss": 0.01026334147900343, "global_step": 7372, "epoch": 61, "lr": 9.769919005018464e-05} +{"train_loss": 0.009815516881644726, "global_step": 7373, "epoch": 61, "lr": 9.76985256647501e-05} +{"train_loss": 0.011105735786259174, "global_step": 7374, "epoch": 61, "lr": 9.76978611856646e-05} +{"train_loss": 0.012170047499239445, "global_step": 7375, "epoch": 61, "lr": 9.769719661292947e-05} +{"train_loss": 0.01065221056342125, "global_step": 7376, "epoch": 61, "lr": 9.769653194654597e-05} +{"train_loss": 0.012623750229029595, "global_step": 7377, "epoch": 61, "lr": 9.769586718651542e-05, "val_loss": 0.021036183461546898} +{"train_loss": 0.011863053776323795, "global_step": 7378, "epoch": 62, "lr": 9.769520233283914e-05} +{"train_loss": 0.011391041800379753, "global_step": 7379, "epoch": 62, "lr": 9.769453738551843e-05} +{"train_loss": 0.012145085260272026, "global_step": 7380, "epoch": 62, "lr": 9.769387234455459e-05} +{"train_loss": 0.01691233552992344, "global_step": 7381, "epoch": 62, "lr": 9.769320720994892e-05} +{"train_loss": 0.013271155767142773, "global_step": 7382, "epoch": 62, "lr": 9.769254198170272e-05} +{"train_loss": 0.01112391147762537, "global_step": 7383, "epoch": 62, "lr": 9.769187665981734e-05} +{"train_loss": 0.01094913762062788, "global_step": 7384, "epoch": 62, "lr": 9.769121124429404e-05} +{"train_loss": 0.009105930104851723, "global_step": 7385, "epoch": 62, "lr": 9.769054573513415e-05} +{"train_loss": 0.012306212447583675, "global_step": 7386, "epoch": 62, "lr": 9.768988013233895e-05} +{"train_loss": 0.01023969054222107, "global_step": 7387, "epoch": 62, "lr": 9.768921443590978e-05} +{"train_loss": 0.016221780329942703, "global_step": 7388, "epoch": 62, "lr": 9.768854864584791e-05} +{"train_loss": 0.01170357596129179, "global_step": 7389, "epoch": 62, "lr": 9.76878827621547e-05} +{"train_loss": 0.010407715104520321, "global_step": 7390, "epoch": 62, "lr": 9.768721678483142e-05} +{"train_loss": 0.013787806034088135, "global_step": 7391, "epoch": 62, "lr": 9.768655071387938e-05} +{"train_loss": 0.010986356064677238, "global_step": 7392, "epoch": 62, "lr": 9.768588454929988e-05} +{"train_loss": 0.00956034380942583, "global_step": 7393, "epoch": 62, "lr": 9.768521829109425e-05} +{"train_loss": 0.010634343139827251, "global_step": 7394, "epoch": 62, "lr": 9.768455193926379e-05} +{"train_loss": 0.009507639333605766, "global_step": 7395, "epoch": 62, "lr": 9.768388549380981e-05} +{"train_loss": 0.013835886493325233, "global_step": 7396, "epoch": 62, "lr": 9.76832189547336e-05} +{"train_loss": 0.008658669888973236, "global_step": 7397, "epoch": 62, "lr": 9.76825523220365e-05} +{"train_loss": 0.013563067652285099, "global_step": 7398, "epoch": 62, "lr": 9.76818855957198e-05} +{"train_loss": 0.009338006377220154, "global_step": 7399, "epoch": 62, "lr": 9.76812187757848e-05} +{"train_loss": 0.009221136569976807, "global_step": 7400, "epoch": 62, "lr": 9.768055186223283e-05} +{"train_loss": 0.011153913103044033, "global_step": 7401, "epoch": 62, "lr": 9.76798848550652e-05} +{"train_loss": 0.007876269519329071, "global_step": 7402, "epoch": 62, "lr": 9.767921775428319e-05} +{"train_loss": 0.007843212224543095, "global_step": 7403, "epoch": 62, "lr": 9.767855055988815e-05} +{"train_loss": 0.01265785750001669, "global_step": 7404, "epoch": 62, "lr": 9.767788327188136e-05} +{"train_loss": 0.014398266561329365, "global_step": 7405, "epoch": 62, "lr": 9.767721589026413e-05} +{"train_loss": 0.008089873939752579, "global_step": 7406, "epoch": 62, "lr": 9.767654841503779e-05} +{"train_loss": 0.01261946838349104, "global_step": 7407, "epoch": 62, "lr": 9.767588084620365e-05} +{"train_loss": 0.009191743098199368, "global_step": 7408, "epoch": 62, "lr": 9.7675213183763e-05} +{"train_loss": 0.011313524097204208, "global_step": 7409, "epoch": 62, "lr": 9.767454542771717e-05} +{"train_loss": 0.014933476224541664, "global_step": 7410, "epoch": 62, "lr": 9.767387757806745e-05} +{"train_loss": 0.014168309979140759, "global_step": 7411, "epoch": 62, "lr": 9.767320963481516e-05} +{"train_loss": 0.01621648110449314, "global_step": 7412, "epoch": 62, "lr": 9.767254159796164e-05} +{"train_loss": 0.0122612239792943, "global_step": 7413, "epoch": 62, "lr": 9.767187346750817e-05} +{"train_loss": 0.01005503162741661, "global_step": 7414, "epoch": 62, "lr": 9.767120524345605e-05} +{"train_loss": 0.00625700643286109, "global_step": 7415, "epoch": 62, "lr": 9.767053692580664e-05} +{"train_loss": 0.012228061445057392, "global_step": 7416, "epoch": 62, "lr": 9.76698685145612e-05} +{"train_loss": 0.0212896429002285, "global_step": 7417, "epoch": 62, "lr": 9.766920000972108e-05} +{"train_loss": 0.01553305983543396, "global_step": 7418, "epoch": 62, "lr": 9.766853141128757e-05} +{"train_loss": 0.00978358555585146, "global_step": 7419, "epoch": 62, "lr": 9.766786271926201e-05} +{"train_loss": 0.016586212441325188, "global_step": 7420, "epoch": 62, "lr": 9.766719393364567e-05} +{"train_loss": 0.007671147584915161, "global_step": 7421, "epoch": 62, "lr": 9.766652505443989e-05} +{"train_loss": 0.019604075700044632, "global_step": 7422, "epoch": 62, "lr": 9.7665856081646e-05} +{"train_loss": 0.011794797144830227, "global_step": 7423, "epoch": 62, "lr": 9.766518701526527e-05} +{"train_loss": 0.013841865584254265, "global_step": 7424, "epoch": 62, "lr": 9.766451785529905e-05} +{"train_loss": 0.013294635340571404, "global_step": 7425, "epoch": 62, "lr": 9.766384860174865e-05} +{"train_loss": 0.011678875423967838, "global_step": 7426, "epoch": 62, "lr": 9.766317925461537e-05} +{"train_loss": 0.013293656520545483, "global_step": 7427, "epoch": 62, "lr": 9.766250981390052e-05} +{"train_loss": 0.011912408284842968, "global_step": 7428, "epoch": 62, "lr": 9.766184027960543e-05} +{"train_loss": 0.016331203281879425, "global_step": 7429, "epoch": 62, "lr": 9.76611706517314e-05} +{"train_loss": 0.010061098262667656, "global_step": 7430, "epoch": 62, "lr": 9.766050093027977e-05} +{"train_loss": 0.010312042199075222, "global_step": 7431, "epoch": 62, "lr": 9.765983111525182e-05} +{"train_loss": 0.008140158839523792, "global_step": 7432, "epoch": 62, "lr": 9.76591612066489e-05} +{"train_loss": 0.0134782325476408, "global_step": 7433, "epoch": 62, "lr": 9.76584912044723e-05} +{"train_loss": 0.012724391184747219, "global_step": 7434, "epoch": 62, "lr": 9.765782110872335e-05} +{"train_loss": 0.011008239351212978, "global_step": 7435, "epoch": 62, "lr": 9.765715091940335e-05} +{"train_loss": 0.01645437441766262, "global_step": 7436, "epoch": 62, "lr": 9.765648063651362e-05} +{"train_loss": 0.00946772750467062, "global_step": 7437, "epoch": 62, "lr": 9.76558102600555e-05} +{"train_loss": 0.014508695341646671, "global_step": 7438, "epoch": 62, "lr": 9.765513979003029e-05} +{"train_loss": 0.010268486104905605, "global_step": 7439, "epoch": 62, "lr": 9.765446922643928e-05} +{"train_loss": 0.013420813716948032, "global_step": 7440, "epoch": 62, "lr": 9.765379856928383e-05} +{"train_loss": 0.016533056274056435, "global_step": 7441, "epoch": 62, "lr": 9.765312781856524e-05} +{"train_loss": 0.013493130914866924, "global_step": 7442, "epoch": 62, "lr": 9.76524569742848e-05} +{"train_loss": 0.014813038520514965, "global_step": 7443, "epoch": 62, "lr": 9.765178603644386e-05} +{"train_loss": 0.0077287377789616585, "global_step": 7444, "epoch": 62, "lr": 9.765111500504375e-05} +{"train_loss": 0.009625464677810669, "global_step": 7445, "epoch": 62, "lr": 9.765044388008575e-05} +{"train_loss": 0.016985520720481873, "global_step": 7446, "epoch": 62, "lr": 9.76497726615712e-05} +{"train_loss": 0.013965134508907795, "global_step": 7447, "epoch": 62, "lr": 9.764910134950141e-05} +{"train_loss": 0.009462927468121052, "global_step": 7448, "epoch": 62, "lr": 9.764842994387771e-05} +{"train_loss": 0.01076638512313366, "global_step": 7449, "epoch": 62, "lr": 9.76477584447014e-05} +{"train_loss": 0.01260207500308752, "global_step": 7450, "epoch": 62, "lr": 9.76470868519738e-05} +{"train_loss": 0.01145890448242426, "global_step": 7451, "epoch": 62, "lr": 9.764641516569623e-05} +{"train_loss": 0.014034656807780266, "global_step": 7452, "epoch": 62, "lr": 9.764574338587004e-05} +{"train_loss": 0.013396110385656357, "global_step": 7453, "epoch": 62, "lr": 9.764507151249652e-05} +{"train_loss": 0.01467023603618145, "global_step": 7454, "epoch": 62, "lr": 9.764439954557696e-05} +{"train_loss": 0.00881554838269949, "global_step": 7455, "epoch": 62, "lr": 9.764372748511273e-05} +{"train_loss": 0.011254909448325634, "global_step": 7456, "epoch": 62, "lr": 9.764305533110514e-05} +{"train_loss": 0.014171188697218895, "global_step": 7457, "epoch": 62, "lr": 9.764238308355549e-05} +{"train_loss": 0.013862412422895432, "global_step": 7458, "epoch": 62, "lr": 9.764171074246511e-05} +{"train_loss": 0.011753044091165066, "global_step": 7459, "epoch": 62, "lr": 9.764103830783533e-05} +{"train_loss": 0.01271754689514637, "global_step": 7460, "epoch": 62, "lr": 9.764036577966745e-05} +{"train_loss": 0.015371191315352917, "global_step": 7461, "epoch": 62, "lr": 9.763969315796282e-05} +{"train_loss": 0.011638407595455647, "global_step": 7462, "epoch": 62, "lr": 9.763902044272273e-05} +{"train_loss": 0.010067317634820938, "global_step": 7463, "epoch": 62, "lr": 9.76383476339485e-05} +{"train_loss": 0.01490742526948452, "global_step": 7464, "epoch": 62, "lr": 9.763767473164148e-05} +{"train_loss": 0.012745896354317665, "global_step": 7465, "epoch": 62, "lr": 9.763700173580296e-05} +{"train_loss": 0.01299689058214426, "global_step": 7466, "epoch": 62, "lr": 9.763632864643431e-05} +{"train_loss": 0.009006381034851074, "global_step": 7467, "epoch": 62, "lr": 9.76356554635368e-05} +{"train_loss": 0.012475060299038887, "global_step": 7468, "epoch": 62, "lr": 9.763498218711175e-05} +{"train_loss": 0.013692803680896759, "global_step": 7469, "epoch": 62, "lr": 9.763430881716052e-05} +{"train_loss": 0.012039571069180965, "global_step": 7470, "epoch": 62, "lr": 9.763363535368441e-05} +{"train_loss": 0.009575027041137218, "global_step": 7471, "epoch": 62, "lr": 9.763296179668474e-05} +{"train_loss": 0.014211012050509453, "global_step": 7472, "epoch": 62, "lr": 9.763228814616284e-05} +{"train_loss": 0.011086257174611092, "global_step": 7473, "epoch": 62, "lr": 9.763161440212003e-05} +{"train_loss": 0.009739152155816555, "global_step": 7474, "epoch": 62, "lr": 9.763094056455765e-05} +{"train_loss": 0.016099730506539345, "global_step": 7475, "epoch": 62, "lr": 9.763026663347699e-05} +{"train_loss": 0.009294611401855946, "global_step": 7476, "epoch": 62, "lr": 9.76295926088794e-05} +{"train_loss": 0.011503605172038078, "global_step": 7477, "epoch": 62, "lr": 9.762891849076619e-05} +{"train_loss": 0.010765505954623222, "global_step": 7478, "epoch": 62, "lr": 9.762824427913869e-05} +{"train_loss": 0.011939405463635921, "global_step": 7479, "epoch": 62, "lr": 9.762756997399821e-05} +{"train_loss": 0.015223534777760506, "global_step": 7480, "epoch": 62, "lr": 9.76268955753461e-05} +{"train_loss": 0.012058022432029247, "global_step": 7481, "epoch": 62, "lr": 9.762622108318364e-05} +{"train_loss": 0.009929433465003967, "global_step": 7482, "epoch": 62, "lr": 9.762554649751222e-05} +{"train_loss": 0.014392887242138386, "global_step": 7483, "epoch": 62, "lr": 9.762487181833311e-05} +{"train_loss": 0.013902564533054829, "global_step": 7484, "epoch": 62, "lr": 9.762419704564765e-05} +{"train_loss": 0.01191659364849329, "global_step": 7485, "epoch": 62, "lr": 9.762352217945716e-05} +{"train_loss": 0.009689431637525558, "global_step": 7486, "epoch": 62, "lr": 9.7622847219763e-05} +{"train_loss": 0.01088764425367117, "global_step": 7487, "epoch": 62, "lr": 9.762217216656644e-05} +{"train_loss": 0.015539675951004028, "global_step": 7488, "epoch": 62, "lr": 9.762149701986884e-05} +{"train_loss": 0.010957040823996067, "global_step": 7489, "epoch": 62, "lr": 9.762082177967152e-05} +{"train_loss": 0.011311186477541924, "global_step": 7490, "epoch": 62, "lr": 9.76201464459758e-05} +{"train_loss": 0.010477903299033642, "global_step": 7491, "epoch": 62, "lr": 9.761947101878302e-05} +{"train_loss": 0.009098696522414684, "global_step": 7492, "epoch": 62, "lr": 9.761879549809448e-05} +{"train_loss": 0.011402548290789127, "global_step": 7493, "epoch": 62, "lr": 9.761811988391154e-05} +{"train_loss": 0.010019092820584774, "global_step": 7494, "epoch": 62, "lr": 9.76174441762355e-05} +{"train_loss": 0.015173103660345078, "global_step": 7495, "epoch": 62, "lr": 9.76167683750677e-05} +{"train_loss": 0.012193597786660706, "global_step": 7496, "epoch": 62, "lr": 9.761609248040946e-05, "val_loss": 0.01529121957719326} +{"train_loss": 0.010388056747615337, "global_step": 7497, "epoch": 63, "lr": 9.76154164922621e-05} +{"train_loss": 0.010053077712655067, "global_step": 7498, "epoch": 63, "lr": 9.761474041062697e-05} +{"train_loss": 0.018489545211195946, "global_step": 7499, "epoch": 63, "lr": 9.761406423550537e-05} +{"train_loss": 0.01014778297394514, "global_step": 7500, "epoch": 63, "lr": 9.761338796689867e-05} +{"train_loss": 0.008313044905662537, "global_step": 7501, "epoch": 63, "lr": 9.761271160480813e-05} +{"train_loss": 0.009975514374673367, "global_step": 7502, "epoch": 63, "lr": 9.761203514923515e-05} +{"train_loss": 0.009049554355442524, "global_step": 7503, "epoch": 63, "lr": 9.7611358600181e-05} +{"train_loss": 0.012229458428919315, "global_step": 7504, "epoch": 63, "lr": 9.761068195764706e-05} +{"train_loss": 0.010999801568686962, "global_step": 7505, "epoch": 63, "lr": 9.761000522163462e-05} +{"train_loss": 0.013625852763652802, "global_step": 7506, "epoch": 63, "lr": 9.760932839214501e-05} +{"train_loss": 0.0116297397762537, "global_step": 7507, "epoch": 63, "lr": 9.760865146917959e-05} +{"train_loss": 0.01565982960164547, "global_step": 7508, "epoch": 63, "lr": 9.760797445273965e-05} +{"train_loss": 0.014141333289444447, "global_step": 7509, "epoch": 63, "lr": 9.760729734282655e-05} +{"train_loss": 0.012048103846609592, "global_step": 7510, "epoch": 63, "lr": 9.760662013944162e-05} +{"train_loss": 0.014641554094851017, "global_step": 7511, "epoch": 63, "lr": 9.760594284258615e-05} +{"train_loss": 0.013959781266748905, "global_step": 7512, "epoch": 63, "lr": 9.760526545226152e-05} +{"train_loss": 0.007669283077120781, "global_step": 7513, "epoch": 63, "lr": 9.760458796846903e-05} +{"train_loss": 0.010922438465058804, "global_step": 7514, "epoch": 63, "lr": 9.760391039121e-05} +{"train_loss": 0.00906828511506319, "global_step": 7515, "epoch": 63, "lr": 9.760323272048579e-05} +{"train_loss": 0.014813828282058239, "global_step": 7516, "epoch": 63, "lr": 9.760255495629773e-05} +{"train_loss": 0.00996868871152401, "global_step": 7517, "epoch": 63, "lr": 9.760187709864713e-05} +{"train_loss": 0.01087358221411705, "global_step": 7518, "epoch": 63, "lr": 9.760119914753534e-05} +{"train_loss": 0.01272585615515709, "global_step": 7519, "epoch": 63, "lr": 9.760052110296366e-05} +{"train_loss": 0.012005100958049297, "global_step": 7520, "epoch": 63, "lr": 9.759984296493345e-05} +{"train_loss": 0.013476329855620861, "global_step": 7521, "epoch": 63, "lr": 9.759916473344604e-05} +{"train_loss": 0.008875732310116291, "global_step": 7522, "epoch": 63, "lr": 9.759848640850276e-05} +{"train_loss": 0.013207349926233292, "global_step": 7523, "epoch": 63, "lr": 9.759780799010491e-05} +{"train_loss": 0.009748917073011398, "global_step": 7524, "epoch": 63, "lr": 9.759712947825388e-05} +{"train_loss": 0.012029493227601051, "global_step": 7525, "epoch": 63, "lr": 9.759645087295095e-05} +{"train_loss": 0.0143510727211833, "global_step": 7526, "epoch": 63, "lr": 9.759577217419748e-05} +{"train_loss": 0.00826739426702261, "global_step": 7527, "epoch": 63, "lr": 9.759509338199482e-05} +{"train_loss": 0.013859336264431477, "global_step": 7528, "epoch": 63, "lr": 9.759441449634424e-05} +{"train_loss": 0.012417872436344624, "global_step": 7529, "epoch": 63, "lr": 9.759373551724714e-05} +{"train_loss": 0.019292496144771576, "global_step": 7530, "epoch": 63, "lr": 9.759305644470481e-05} +{"train_loss": 0.010958787053823471, "global_step": 7531, "epoch": 63, "lr": 9.759237727871861e-05} +{"train_loss": 0.010071133263409138, "global_step": 7532, "epoch": 63, "lr": 9.759169801928985e-05} +{"train_loss": 0.012097982689738274, "global_step": 7533, "epoch": 63, "lr": 9.759101866641989e-05} +{"train_loss": 0.008258271031081676, "global_step": 7534, "epoch": 63, "lr": 9.759033922011003e-05} +{"train_loss": 0.006838453467935324, "global_step": 7535, "epoch": 63, "lr": 9.758965968036162e-05} +{"train_loss": 0.012134948745369911, "global_step": 7536, "epoch": 63, "lr": 9.758898004717602e-05} +{"train_loss": 0.016316143795847893, "global_step": 7537, "epoch": 63, "lr": 9.758830032055453e-05} +{"train_loss": 0.011410665698349476, "global_step": 7538, "epoch": 63, "lr": 9.75876205004985e-05} +{"train_loss": 0.01452329009771347, "global_step": 7539, "epoch": 63, "lr": 9.758694058700925e-05} +{"train_loss": 0.015325577929615974, "global_step": 7540, "epoch": 63, "lr": 9.758626058008816e-05} +{"train_loss": 0.006600182969123125, "global_step": 7541, "epoch": 63, "lr": 9.75855804797365e-05} +{"train_loss": 0.011917758733034134, "global_step": 7542, "epoch": 63, "lr": 9.758490028595564e-05} +{"train_loss": 0.012325027026236057, "global_step": 7543, "epoch": 63, "lr": 9.75842199987469e-05} +{"train_loss": 0.010727700777351856, "global_step": 7544, "epoch": 63, "lr": 9.758353961811165e-05} +{"train_loss": 0.013485431671142578, "global_step": 7545, "epoch": 63, "lr": 9.758285914405119e-05} +{"train_loss": 0.007368526421487331, "global_step": 7546, "epoch": 63, "lr": 9.758217857656688e-05} +{"train_loss": 0.023873446509242058, "global_step": 7547, "epoch": 63, "lr": 9.758149791566005e-05} +{"train_loss": 0.011822461150586605, "global_step": 7548, "epoch": 63, "lr": 9.758081716133202e-05} +{"train_loss": 0.018199143931269646, "global_step": 7549, "epoch": 63, "lr": 9.758013631358414e-05} +{"train_loss": 0.008465397171676159, "global_step": 7550, "epoch": 63, "lr": 9.757945537241775e-05} +{"train_loss": 0.010389085859060287, "global_step": 7551, "epoch": 63, "lr": 9.757877433783418e-05} +{"train_loss": 0.015544016845524311, "global_step": 7552, "epoch": 63, "lr": 9.757809320983477e-05} +{"train_loss": 0.013403832912445068, "global_step": 7553, "epoch": 63, "lr": 9.757741198842085e-05} +{"train_loss": 0.008521497249603271, "global_step": 7554, "epoch": 63, "lr": 9.757673067359378e-05} +{"train_loss": 0.01129049714654684, "global_step": 7555, "epoch": 63, "lr": 9.757604926535486e-05} +{"train_loss": 0.010506452061235905, "global_step": 7556, "epoch": 63, "lr": 9.757536776370548e-05} +{"train_loss": 0.011005030013620853, "global_step": 7557, "epoch": 63, "lr": 9.757468616864692e-05} +{"train_loss": 0.015418336726725101, "global_step": 7558, "epoch": 63, "lr": 9.757400448018056e-05} +{"train_loss": 0.012133954092860222, "global_step": 7559, "epoch": 63, "lr": 9.757332269830773e-05} +{"train_loss": 0.009202959947288036, "global_step": 7560, "epoch": 63, "lr": 9.757264082302975e-05} +{"train_loss": 0.014277876354753971, "global_step": 7561, "epoch": 63, "lr": 9.757195885434798e-05} +{"train_loss": 0.013611160218715668, "global_step": 7562, "epoch": 63, "lr": 9.757127679226374e-05} +{"train_loss": 0.013291754759848118, "global_step": 7563, "epoch": 63, "lr": 9.75705946367784e-05} +{"train_loss": 0.0145869180560112, "global_step": 7564, "epoch": 63, "lr": 9.756991238789326e-05} +{"train_loss": 0.011064281687140465, "global_step": 7565, "epoch": 63, "lr": 9.756923004560969e-05} +{"train_loss": 0.010358785279095173, "global_step": 7566, "epoch": 63, "lr": 9.756854760992901e-05} +{"train_loss": 0.012398620136082172, "global_step": 7567, "epoch": 63, "lr": 9.756786508085258e-05} +{"train_loss": 0.013387936167418957, "global_step": 7568, "epoch": 63, "lr": 9.756718245838172e-05} +{"train_loss": 0.010380364954471588, "global_step": 7569, "epoch": 63, "lr": 9.756649974251779e-05} +{"train_loss": 0.008773870766162872, "global_step": 7570, "epoch": 63, "lr": 9.756581693326212e-05} +{"train_loss": 0.011136895976960659, "global_step": 7571, "epoch": 63, "lr": 9.756513403061605e-05} +{"train_loss": 0.012991022318601608, "global_step": 7572, "epoch": 63, "lr": 9.75644510345809e-05} +{"train_loss": 0.01066627912223339, "global_step": 7573, "epoch": 63, "lr": 9.756376794515804e-05} +{"train_loss": 0.010838372632861137, "global_step": 7574, "epoch": 63, "lr": 9.75630847623488e-05} +{"train_loss": 0.009997440502047539, "global_step": 7575, "epoch": 63, "lr": 9.756240148615456e-05} +{"train_loss": 0.01249267440289259, "global_step": 7576, "epoch": 63, "lr": 9.756171811657659e-05} +{"train_loss": 0.009668072685599327, "global_step": 7577, "epoch": 63, "lr": 9.756103465361628e-05} +{"train_loss": 0.006964352447539568, "global_step": 7578, "epoch": 63, "lr": 9.756035109727495e-05} +{"train_loss": 0.011695354245603085, "global_step": 7579, "epoch": 63, "lr": 9.755966744755396e-05} +{"train_loss": 0.01339862309396267, "global_step": 7580, "epoch": 63, "lr": 9.755898370445465e-05} +{"train_loss": 0.009953871369361877, "global_step": 7581, "epoch": 63, "lr": 9.755829986797835e-05} +{"train_loss": 0.014667002484202385, "global_step": 7582, "epoch": 63, "lr": 9.75576159381264e-05} +{"train_loss": 0.012709331698715687, "global_step": 7583, "epoch": 63, "lr": 9.755693191490016e-05} +{"train_loss": 0.009904379025101662, "global_step": 7584, "epoch": 63, "lr": 9.755624779830097e-05} +{"train_loss": 0.008561382070183754, "global_step": 7585, "epoch": 63, "lr": 9.755556358833016e-05} +{"train_loss": 0.012701207771897316, "global_step": 7586, "epoch": 63, "lr": 9.755487928498909e-05} +{"train_loss": 0.011101389303803444, "global_step": 7587, "epoch": 63, "lr": 9.755419488827908e-05} +{"train_loss": 0.014974410645663738, "global_step": 7588, "epoch": 63, "lr": 9.75535103982015e-05} +{"train_loss": 0.009754321537911892, "global_step": 7589, "epoch": 63, "lr": 9.755282581475769e-05} +{"train_loss": 0.013834775425493717, "global_step": 7590, "epoch": 63, "lr": 9.755214113794897e-05} +{"train_loss": 0.01414773240685463, "global_step": 7591, "epoch": 63, "lr": 9.755145636777671e-05} +{"train_loss": 0.013121481984853745, "global_step": 7592, "epoch": 63, "lr": 9.755077150424225e-05} +{"train_loss": 0.00861472636461258, "global_step": 7593, "epoch": 63, "lr": 9.755008654734693e-05} +{"train_loss": 0.016793718561530113, "global_step": 7594, "epoch": 63, "lr": 9.754940149709208e-05} +{"train_loss": 0.008710291236639023, "global_step": 7595, "epoch": 63, "lr": 9.754871635347907e-05} +{"train_loss": 0.013333206064999104, "global_step": 7596, "epoch": 63, "lr": 9.754803111650923e-05} +{"train_loss": 0.014426302164793015, "global_step": 7597, "epoch": 63, "lr": 9.754734578618391e-05} +{"train_loss": 0.01059319730848074, "global_step": 7598, "epoch": 63, "lr": 9.754666036250446e-05} +{"train_loss": 0.017592858523130417, "global_step": 7599, "epoch": 63, "lr": 9.754597484547224e-05} +{"train_loss": 0.01225992664694786, "global_step": 7600, "epoch": 63, "lr": 9.754528923508856e-05} +{"train_loss": 0.007680505979806185, "global_step": 7601, "epoch": 63, "lr": 9.754460353135478e-05} +{"train_loss": 0.013433058746159077, "global_step": 7602, "epoch": 63, "lr": 9.754391773427225e-05} +{"train_loss": 0.015218133106827736, "global_step": 7603, "epoch": 63, "lr": 9.754323184384233e-05} +{"train_loss": 0.012508693151175976, "global_step": 7604, "epoch": 63, "lr": 9.754254586006634e-05} +{"train_loss": 0.01652943715453148, "global_step": 7605, "epoch": 63, "lr": 9.754185978294565e-05} +{"train_loss": 0.01343503687530756, "global_step": 7606, "epoch": 63, "lr": 9.754117361248159e-05} +{"train_loss": 0.012640104629099369, "global_step": 7607, "epoch": 63, "lr": 9.754048734867553e-05} +{"train_loss": 0.008809302933514118, "global_step": 7608, "epoch": 63, "lr": 9.753980099152879e-05} +{"train_loss": 0.007433631923049688, "global_step": 7609, "epoch": 63, "lr": 9.753911454104272e-05} +{"train_loss": 0.013445739634335041, "global_step": 7610, "epoch": 63, "lr": 9.753842799721868e-05} +{"train_loss": 0.012633947655558586, "global_step": 7611, "epoch": 63, "lr": 9.753774136005803e-05} +{"train_loss": 0.01149427704513073, "global_step": 7612, "epoch": 63, "lr": 9.75370546295621e-05} +{"train_loss": 0.010200231336057186, "global_step": 7613, "epoch": 63, "lr": 9.753636780573224e-05} +{"train_loss": 0.01657695323228836, "global_step": 7614, "epoch": 63, "lr": 9.753568088856979e-05} +{"train_loss": 0.012010116368813925, "global_step": 7615, "epoch": 63, "lr": 9.753499387807612e-05, "val_loss": 0.016605045646429062} +{"train_loss": 0.012117045931518078, "global_step": 7616, "epoch": 64, "lr": 9.753430677425257e-05} +{"train_loss": 0.010256770066916943, "global_step": 7617, "epoch": 64, "lr": 9.753361957710048e-05} +{"train_loss": 0.010810709558427334, "global_step": 7618, "epoch": 64, "lr": 9.753293228662122e-05} +{"train_loss": 0.017757462337613106, "global_step": 7619, "epoch": 64, "lr": 9.753224490281611e-05} +{"train_loss": 0.017097238451242447, "global_step": 7620, "epoch": 64, "lr": 9.753155742568651e-05} +{"train_loss": 0.009008001536130905, "global_step": 7621, "epoch": 64, "lr": 9.753086985523379e-05} +{"train_loss": 0.013731030747294426, "global_step": 7622, "epoch": 64, "lr": 9.753018219145929e-05} +{"train_loss": 0.010652721859514713, "global_step": 7623, "epoch": 64, "lr": 9.752949443436435e-05} +{"train_loss": 0.013677318580448627, "global_step": 7624, "epoch": 64, "lr": 9.752880658395031e-05} +{"train_loss": 0.011009033769369125, "global_step": 7625, "epoch": 64, "lr": 9.752811864021853e-05} +{"train_loss": 0.010357190854847431, "global_step": 7626, "epoch": 64, "lr": 9.75274306031704e-05} +{"train_loss": 0.01674375869333744, "global_step": 7627, "epoch": 64, "lr": 9.752674247280722e-05} +{"train_loss": 0.0084049291908741, "global_step": 7628, "epoch": 64, "lr": 9.752605424913035e-05} +{"train_loss": 0.006764983758330345, "global_step": 7629, "epoch": 64, "lr": 9.752536593214117e-05} +{"train_loss": 0.009948192164301872, "global_step": 7630, "epoch": 64, "lr": 9.7524677521841e-05} +{"train_loss": 0.009455032646656036, "global_step": 7631, "epoch": 64, "lr": 9.75239890182312e-05} +{"train_loss": 0.010749460197985172, "global_step": 7632, "epoch": 64, "lr": 9.752330042131312e-05} +{"train_loss": 0.009932592511177063, "global_step": 7633, "epoch": 64, "lr": 9.752261173108813e-05} +{"train_loss": 0.016689365729689598, "global_step": 7634, "epoch": 64, "lr": 9.752192294755756e-05} +{"train_loss": 0.018589910119771957, "global_step": 7635, "epoch": 64, "lr": 9.752123407072278e-05} +{"train_loss": 0.014710972085595131, "global_step": 7636, "epoch": 64, "lr": 9.752054510058513e-05} +{"train_loss": 0.01185282226651907, "global_step": 7637, "epoch": 64, "lr": 9.751985603714597e-05} +{"train_loss": 0.010657957755029202, "global_step": 7638, "epoch": 64, "lr": 9.751916688040663e-05} +{"train_loss": 0.012079386971890926, "global_step": 7639, "epoch": 64, "lr": 9.75184776303685e-05} +{"train_loss": 0.015124726109206676, "global_step": 7640, "epoch": 64, "lr": 9.751778828703292e-05} +{"train_loss": 0.012852247804403305, "global_step": 7641, "epoch": 64, "lr": 9.751709885040123e-05} +{"train_loss": 0.00888456217944622, "global_step": 7642, "epoch": 64, "lr": 9.751640932047479e-05} +{"train_loss": 0.012388701550662518, "global_step": 7643, "epoch": 64, "lr": 9.751571969725497e-05} +{"train_loss": 0.015354328788816929, "global_step": 7644, "epoch": 64, "lr": 9.75150299807431e-05} +{"train_loss": 0.014778191223740578, "global_step": 7645, "epoch": 64, "lr": 9.751434017094054e-05} +{"train_loss": 0.0109336469322443, "global_step": 7646, "epoch": 64, "lr": 9.751365026784867e-05} +{"train_loss": 0.012236857786774635, "global_step": 7647, "epoch": 64, "lr": 9.75129602714688e-05} +{"train_loss": 0.012488281354308128, "global_step": 7648, "epoch": 64, "lr": 9.751227018180233e-05} +{"train_loss": 0.013318882323801517, "global_step": 7649, "epoch": 64, "lr": 9.751157999885056e-05} +{"train_loss": 0.009972083382308483, "global_step": 7650, "epoch": 64, "lr": 9.751088972261491e-05} +{"train_loss": 0.010795234702527523, "global_step": 7651, "epoch": 64, "lr": 9.75101993530967e-05} +{"train_loss": 0.010910475626587868, "global_step": 7652, "epoch": 64, "lr": 9.750950889029728e-05} +{"train_loss": 0.00940350629389286, "global_step": 7653, "epoch": 64, "lr": 9.750881833421802e-05} +{"train_loss": 0.012847432866692543, "global_step": 7654, "epoch": 64, "lr": 9.750812768486027e-05} +{"train_loss": 0.010340221226215363, "global_step": 7655, "epoch": 64, "lr": 9.750743694222539e-05} +{"train_loss": 0.014254821464419365, "global_step": 7656, "epoch": 64, "lr": 9.750674610631472e-05} +{"train_loss": 0.011007332243025303, "global_step": 7657, "epoch": 64, "lr": 9.750605517712965e-05} +{"train_loss": 0.009420307353138924, "global_step": 7658, "epoch": 64, "lr": 9.75053641546715e-05} +{"train_loss": 0.010078679770231247, "global_step": 7659, "epoch": 64, "lr": 9.750467303894164e-05} +{"train_loss": 0.007753737270832062, "global_step": 7660, "epoch": 64, "lr": 9.750398182994145e-05} +{"train_loss": 0.01065039075911045, "global_step": 7661, "epoch": 64, "lr": 9.750329052767224e-05} +{"train_loss": 0.010686223395168781, "global_step": 7662, "epoch": 64, "lr": 9.750259913213541e-05} +{"train_loss": 0.0124592250213027, "global_step": 7663, "epoch": 64, "lr": 9.750190764333232e-05} +{"train_loss": 0.011061266995966434, "global_step": 7664, "epoch": 64, "lr": 9.750121606126427e-05} +{"train_loss": 0.011634288355708122, "global_step": 7665, "epoch": 64, "lr": 9.750052438593268e-05} +{"train_loss": 0.012396457605063915, "global_step": 7666, "epoch": 64, "lr": 9.749983261733888e-05} +{"train_loss": 0.011125330813229084, "global_step": 7667, "epoch": 64, "lr": 9.749914075548424e-05} +{"train_loss": 0.011111641302704811, "global_step": 7668, "epoch": 64, "lr": 9.749844880037008e-05} +{"train_loss": 0.021059313789010048, "global_step": 7669, "epoch": 64, "lr": 9.749775675199784e-05} +{"train_loss": 0.008388600312173367, "global_step": 7670, "epoch": 64, "lr": 9.74970646103688e-05} +{"train_loss": 0.012139137834310532, "global_step": 7671, "epoch": 64, "lr": 9.749637237548435e-05} +{"train_loss": 0.012076329439878464, "global_step": 7672, "epoch": 64, "lr": 9.749568004734586e-05} +{"train_loss": 0.009636964648962021, "global_step": 7673, "epoch": 64, "lr": 9.749498762595466e-05} +{"train_loss": 0.010533045046031475, "global_step": 7674, "epoch": 64, "lr": 9.749429511131212e-05} +{"train_loss": 0.013768082484602928, "global_step": 7675, "epoch": 64, "lr": 9.749360250341963e-05} +{"train_loss": 0.014299356378614902, "global_step": 7676, "epoch": 64, "lr": 9.749290980227851e-05} +{"train_loss": 0.00863731186836958, "global_step": 7677, "epoch": 64, "lr": 9.749221700789013e-05} +{"train_loss": 0.015081176534295082, "global_step": 7678, "epoch": 64, "lr": 9.749152412025587e-05} +{"train_loss": 0.010598698630928993, "global_step": 7679, "epoch": 64, "lr": 9.749083113937707e-05} +{"train_loss": 0.007709761615842581, "global_step": 7680, "epoch": 64, "lr": 9.74901380652551e-05} +{"train_loss": 0.01489637978374958, "global_step": 7681, "epoch": 64, "lr": 9.748944489789132e-05} +{"train_loss": 0.009820070117712021, "global_step": 7682, "epoch": 64, "lr": 9.748875163728708e-05} +{"train_loss": 0.015097953379154205, "global_step": 7683, "epoch": 64, "lr": 9.748805828344374e-05} +{"train_loss": 0.010111238807439804, "global_step": 7684, "epoch": 64, "lr": 9.74873648363627e-05} +{"train_loss": 0.012651938013732433, "global_step": 7685, "epoch": 64, "lr": 9.748667129604528e-05} +{"train_loss": 0.011045842431485653, "global_step": 7686, "epoch": 64, "lr": 9.748597766249284e-05} +{"train_loss": 0.013553820550441742, "global_step": 7687, "epoch": 64, "lr": 9.748528393570677e-05} +{"train_loss": 0.008810354396700859, "global_step": 7688, "epoch": 64, "lr": 9.74845901156884e-05} +{"train_loss": 0.012845366261899471, "global_step": 7689, "epoch": 64, "lr": 9.748389620243913e-05} +{"train_loss": 0.011944206431508064, "global_step": 7690, "epoch": 64, "lr": 9.74832021959603e-05} +{"train_loss": 0.014633568935096264, "global_step": 7691, "epoch": 64, "lr": 9.748250809625326e-05} +{"train_loss": 0.012865345925092697, "global_step": 7692, "epoch": 64, "lr": 9.748181390331941e-05} +{"train_loss": 0.013883395120501518, "global_step": 7693, "epoch": 64, "lr": 9.748111961716009e-05} +{"train_loss": 0.009339823387563229, "global_step": 7694, "epoch": 64, "lr": 9.748042523777665e-05} +{"train_loss": 0.012677007354795933, "global_step": 7695, "epoch": 64, "lr": 9.747973076517047e-05} +{"train_loss": 0.007819673046469688, "global_step": 7696, "epoch": 64, "lr": 9.747903619934291e-05} +{"train_loss": 0.011088209226727486, "global_step": 7697, "epoch": 64, "lr": 9.747834154029533e-05} +{"train_loss": 0.009989436715841293, "global_step": 7698, "epoch": 64, "lr": 9.747764678802912e-05} +{"train_loss": 0.010619262233376503, "global_step": 7699, "epoch": 64, "lr": 9.747695194254561e-05} +{"train_loss": 0.01071635540574789, "global_step": 7700, "epoch": 64, "lr": 9.747625700384617e-05} +{"train_loss": 0.014481772668659687, "global_step": 7701, "epoch": 64, "lr": 9.747556197193219e-05} +{"train_loss": 0.01325763389468193, "global_step": 7702, "epoch": 64, "lr": 9.7474866846805e-05} +{"train_loss": 0.008999934419989586, "global_step": 7703, "epoch": 64, "lr": 9.747417162846599e-05} +{"train_loss": 0.010769708082079887, "global_step": 7704, "epoch": 64, "lr": 9.747347631691651e-05} +{"train_loss": 0.014461237005889416, "global_step": 7705, "epoch": 64, "lr": 9.747278091215794e-05} +{"train_loss": 0.011005734093487263, "global_step": 7706, "epoch": 64, "lr": 9.747208541419162e-05} +{"train_loss": 0.010534357279539108, "global_step": 7707, "epoch": 64, "lr": 9.747138982301895e-05} +{"train_loss": 0.010160095058381557, "global_step": 7708, "epoch": 64, "lr": 9.747069413864126e-05} +{"train_loss": 0.009929440915584564, "global_step": 7709, "epoch": 64, "lr": 9.746999836105995e-05} +{"train_loss": 0.013078262098133564, "global_step": 7710, "epoch": 64, "lr": 9.746930249027636e-05} +{"train_loss": 0.013821804895997047, "global_step": 7711, "epoch": 64, "lr": 9.746860652629186e-05} +{"train_loss": 0.013902468606829643, "global_step": 7712, "epoch": 64, "lr": 9.746791046910784e-05} +{"train_loss": 0.014766870066523552, "global_step": 7713, "epoch": 64, "lr": 9.746721431872563e-05} +{"train_loss": 0.011983152478933334, "global_step": 7714, "epoch": 64, "lr": 9.746651807514663e-05} +{"train_loss": 0.011407734826207161, "global_step": 7715, "epoch": 64, "lr": 9.746582173837219e-05} +{"train_loss": 0.009722795337438583, "global_step": 7716, "epoch": 64, "lr": 9.746512530840368e-05} +{"train_loss": 0.013634161092340946, "global_step": 7717, "epoch": 64, "lr": 9.746442878524246e-05} +{"train_loss": 0.011966818943619728, "global_step": 7718, "epoch": 64, "lr": 9.746373216888991e-05} +{"train_loss": 0.007396841887384653, "global_step": 7719, "epoch": 64, "lr": 9.74630354593474e-05} +{"train_loss": 0.01470700092613697, "global_step": 7720, "epoch": 64, "lr": 9.746233865661628e-05} +{"train_loss": 0.0115458182990551, "global_step": 7721, "epoch": 64, "lr": 9.746164176069794e-05} +{"train_loss": 0.010289931669831276, "global_step": 7722, "epoch": 64, "lr": 9.746094477159373e-05} +{"train_loss": 0.009431949816644192, "global_step": 7723, "epoch": 64, "lr": 9.746024768930501e-05} +{"train_loss": 0.011331499554216862, "global_step": 7724, "epoch": 64, "lr": 9.745955051383319e-05} +{"train_loss": 0.016299856826663017, "global_step": 7725, "epoch": 64, "lr": 9.745885324517959e-05} +{"train_loss": 0.008983230218291283, "global_step": 7726, "epoch": 64, "lr": 9.745815588334562e-05} +{"train_loss": 0.012416350655257702, "global_step": 7727, "epoch": 64, "lr": 9.745745842833262e-05} +{"train_loss": 0.011998968198895454, "global_step": 7728, "epoch": 64, "lr": 9.745676088014197e-05} +{"train_loss": 0.01684771664440632, "global_step": 7729, "epoch": 64, "lr": 9.745606323877505e-05} +{"train_loss": 0.012346742674708366, "global_step": 7730, "epoch": 64, "lr": 9.745536550423322e-05} +{"train_loss": 0.010342873632907867, "global_step": 7731, "epoch": 64, "lr": 9.745466767651784e-05} +{"train_loss": 0.011891776695847511, "global_step": 7732, "epoch": 64, "lr": 9.745396975563031e-05} +{"train_loss": 0.012581685557961464, "global_step": 7733, "epoch": 64, "lr": 9.745327174157196e-05} +{"train_loss": 0.011903138400814613, "global_step": 7734, "epoch": 64, "lr": 9.745257363434417e-05, "val_loss": 0.022232163697481155} +{"train_loss": 0.010283896699547768, "global_step": 7735, "epoch": 65, "lr": 9.745187543394834e-05} +{"train_loss": 0.012329479679465294, "global_step": 7736, "epoch": 65, "lr": 9.745117714038581e-05} +{"train_loss": 0.010375972837209702, "global_step": 7737, "epoch": 65, "lr": 9.745047875365798e-05} +{"train_loss": 0.016692345961928368, "global_step": 7738, "epoch": 65, "lr": 9.74497802737662e-05} +{"train_loss": 0.009168028831481934, "global_step": 7739, "epoch": 65, "lr": 9.744908170071182e-05} +{"train_loss": 0.012834043242037296, "global_step": 7740, "epoch": 65, "lr": 9.744838303449628e-05} +{"train_loss": 0.009640302509069443, "global_step": 7741, "epoch": 65, "lr": 9.744768427512088e-05} +{"train_loss": 0.0078015513718128204, "global_step": 7742, "epoch": 65, "lr": 9.744698542258704e-05} +{"train_loss": 0.014043837785720825, "global_step": 7743, "epoch": 65, "lr": 9.744628647689608e-05} +{"train_loss": 0.01717490330338478, "global_step": 7744, "epoch": 65, "lr": 9.744558743804943e-05} +{"train_loss": 0.009389961138367653, "global_step": 7745, "epoch": 65, "lr": 9.744488830604844e-05} +{"train_loss": 0.008564691059291363, "global_step": 7746, "epoch": 65, "lr": 9.744418908089448e-05} +{"train_loss": 0.015254679135978222, "global_step": 7747, "epoch": 65, "lr": 9.744348976258892e-05} +{"train_loss": 0.0115250488743186, "global_step": 7748, "epoch": 65, "lr": 9.744279035113312e-05} +{"train_loss": 0.007889634929597378, "global_step": 7749, "epoch": 65, "lr": 9.74420908465285e-05} +{"train_loss": 0.0073230876587331295, "global_step": 7750, "epoch": 65, "lr": 9.744139124877638e-05} +{"train_loss": 0.012718002311885357, "global_step": 7751, "epoch": 65, "lr": 9.744069155787817e-05} +{"train_loss": 0.008062783628702164, "global_step": 7752, "epoch": 65, "lr": 9.743999177383523e-05} +{"train_loss": 0.012867727316915989, "global_step": 7753, "epoch": 65, "lr": 9.743929189664893e-05} +{"train_loss": 0.01427934505045414, "global_step": 7754, "epoch": 65, "lr": 9.743859192632065e-05} +{"train_loss": 0.012782675214111805, "global_step": 7755, "epoch": 65, "lr": 9.743789186285175e-05} +{"train_loss": 0.012707483023405075, "global_step": 7756, "epoch": 65, "lr": 9.743719170624364e-05} +{"train_loss": 0.011290197260677814, "global_step": 7757, "epoch": 65, "lr": 9.743649145649764e-05} +{"train_loss": 0.012032587081193924, "global_step": 7758, "epoch": 65, "lr": 9.743579111361519e-05} +{"train_loss": 0.009377635084092617, "global_step": 7759, "epoch": 65, "lr": 9.743509067759762e-05} +{"train_loss": 0.01140077318996191, "global_step": 7760, "epoch": 65, "lr": 9.743439014844631e-05} +{"train_loss": 0.01374401431530714, "global_step": 7761, "epoch": 65, "lr": 9.743368952616265e-05} +{"train_loss": 0.015129901468753815, "global_step": 7762, "epoch": 65, "lr": 9.7432988810748e-05} +{"train_loss": 0.013479270040988922, "global_step": 7763, "epoch": 65, "lr": 9.743228800220376e-05} +{"train_loss": 0.007370440289378166, "global_step": 7764, "epoch": 65, "lr": 9.743158710053129e-05} +{"train_loss": 0.012265215627849102, "global_step": 7765, "epoch": 65, "lr": 9.743088610573194e-05} +{"train_loss": 0.010955270379781723, "global_step": 7766, "epoch": 65, "lr": 9.743018501780714e-05} +{"train_loss": 0.009460519067943096, "global_step": 7767, "epoch": 65, "lr": 9.742948383675823e-05} +{"train_loss": 0.015852026641368866, "global_step": 7768, "epoch": 65, "lr": 9.742878256258658e-05} +{"train_loss": 0.008582141250371933, "global_step": 7769, "epoch": 65, "lr": 9.74280811952936e-05} +{"train_loss": 0.022711915895342827, "global_step": 7770, "epoch": 65, "lr": 9.742737973488065e-05} +{"train_loss": 0.009936465881764889, "global_step": 7771, "epoch": 65, "lr": 9.742667818134909e-05} +{"train_loss": 0.010956373065710068, "global_step": 7772, "epoch": 65, "lr": 9.742597653470034e-05} +{"train_loss": 0.011693776585161686, "global_step": 7773, "epoch": 65, "lr": 9.742527479493573e-05} +{"train_loss": 0.013905845582485199, "global_step": 7774, "epoch": 65, "lr": 9.742457296205667e-05} +{"train_loss": 0.011842330917716026, "global_step": 7775, "epoch": 65, "lr": 9.742387103606452e-05} +{"train_loss": 0.011141159571707249, "global_step": 7776, "epoch": 65, "lr": 9.742316901696067e-05} +{"train_loss": 0.011616487056016922, "global_step": 7777, "epoch": 65, "lr": 9.74224669047465e-05} +{"train_loss": 0.013042601756751537, "global_step": 7778, "epoch": 65, "lr": 9.742176469942337e-05} +{"train_loss": 0.008612691424787045, "global_step": 7779, "epoch": 65, "lr": 9.742106240099269e-05} +{"train_loss": 0.012961653992533684, "global_step": 7780, "epoch": 65, "lr": 9.74203600094558e-05} +{"train_loss": 0.010167631320655346, "global_step": 7781, "epoch": 65, "lr": 9.741965752481412e-05} +{"train_loss": 0.010848123580217361, "global_step": 7782, "epoch": 65, "lr": 9.741895494706898e-05} +{"train_loss": 0.012156043201684952, "global_step": 7783, "epoch": 65, "lr": 9.741825227622181e-05} +{"train_loss": 0.013382361270487309, "global_step": 7784, "epoch": 65, "lr": 9.741754951227397e-05} +{"train_loss": 0.011770001612603664, "global_step": 7785, "epoch": 65, "lr": 9.741684665522683e-05} +{"train_loss": 0.009934064000844955, "global_step": 7786, "epoch": 65, "lr": 9.741614370508177e-05} +{"train_loss": 0.014178255572915077, "global_step": 7787, "epoch": 65, "lr": 9.741544066184019e-05} +{"train_loss": 0.012181693688035011, "global_step": 7788, "epoch": 65, "lr": 9.741473752550345e-05} +{"train_loss": 0.008866514079272747, "global_step": 7789, "epoch": 65, "lr": 9.741403429607294e-05} +{"train_loss": 0.01412984449416399, "global_step": 7790, "epoch": 65, "lr": 9.741333097355004e-05} +{"train_loss": 0.013745971024036407, "global_step": 7791, "epoch": 65, "lr": 9.741262755793613e-05} +{"train_loss": 0.013515912927687168, "global_step": 7792, "epoch": 65, "lr": 9.741192404923259e-05} +{"train_loss": 0.013033485971391201, "global_step": 7793, "epoch": 65, "lr": 9.74112204474408e-05} +{"train_loss": 0.011601106263697147, "global_step": 7794, "epoch": 65, "lr": 9.741051675256216e-05} +{"train_loss": 0.015212398022413254, "global_step": 7795, "epoch": 65, "lr": 9.740981296459801e-05} +{"train_loss": 0.016367042437195778, "global_step": 7796, "epoch": 65, "lr": 9.740910908354977e-05} +{"train_loss": 0.0075806789100170135, "global_step": 7797, "epoch": 65, "lr": 9.740840510941882e-05} +{"train_loss": 0.010367406532168388, "global_step": 7798, "epoch": 65, "lr": 9.740770104220652e-05} +{"train_loss": 0.0117255924269557, "global_step": 7799, "epoch": 65, "lr": 9.740699688191425e-05} +{"train_loss": 0.009206715039908886, "global_step": 7800, "epoch": 65, "lr": 9.740629262854342e-05} +{"train_loss": 0.013964432291686535, "global_step": 7801, "epoch": 65, "lr": 9.740558828209541e-05} +{"train_loss": 0.015263525769114494, "global_step": 7802, "epoch": 65, "lr": 9.740488384257158e-05} +{"train_loss": 0.0095804613083601, "global_step": 7803, "epoch": 65, "lr": 9.740417930997331e-05} +{"train_loss": 0.012491000816226006, "global_step": 7804, "epoch": 65, "lr": 9.740347468430203e-05} +{"train_loss": 0.008787109516561031, "global_step": 7805, "epoch": 65, "lr": 9.740276996555908e-05} +{"train_loss": 0.00967762153595686, "global_step": 7806, "epoch": 65, "lr": 9.740206515374584e-05} +{"train_loss": 0.010662409476935863, "global_step": 7807, "epoch": 65, "lr": 9.740136024886372e-05} +{"train_loss": 0.011273574084043503, "global_step": 7808, "epoch": 65, "lr": 9.740065525091411e-05} +{"train_loss": 0.008243687450885773, "global_step": 7809, "epoch": 65, "lr": 9.739995015989836e-05} +{"train_loss": 0.01178571954369545, "global_step": 7810, "epoch": 65, "lr": 9.739924497581788e-05} +{"train_loss": 0.005531849339604378, "global_step": 7811, "epoch": 65, "lr": 9.739853969867403e-05} +{"train_loss": 0.014695590361952782, "global_step": 7812, "epoch": 65, "lr": 9.739783432846821e-05} +{"train_loss": 0.010711411014199257, "global_step": 7813, "epoch": 65, "lr": 9.739712886520182e-05} +{"train_loss": 0.00995221920311451, "global_step": 7814, "epoch": 65, "lr": 9.739642330887623e-05} +{"train_loss": 0.010952210985124111, "global_step": 7815, "epoch": 65, "lr": 9.739571765949283e-05} +{"train_loss": 0.011878917925059795, "global_step": 7816, "epoch": 65, "lr": 9.739501191705301e-05} +{"train_loss": 0.008692332543432713, "global_step": 7817, "epoch": 65, "lr": 9.739430608155811e-05} +{"train_loss": 0.016665294766426086, "global_step": 7818, "epoch": 65, "lr": 9.739360015300959e-05} +{"train_loss": 0.008717907592654228, "global_step": 7819, "epoch": 65, "lr": 9.739289413140878e-05} +{"train_loss": 0.007367685902863741, "global_step": 7820, "epoch": 65, "lr": 9.739218801675709e-05} +{"train_loss": 0.014495174400508404, "global_step": 7821, "epoch": 65, "lr": 9.739148180905591e-05} +{"train_loss": 0.010144971311092377, "global_step": 7822, "epoch": 65, "lr": 9.739077550830662e-05} +{"train_loss": 0.009008878841996193, "global_step": 7823, "epoch": 65, "lr": 9.739006911451058e-05} +{"train_loss": 0.011447187513113022, "global_step": 7824, "epoch": 65, "lr": 9.738936262766922e-05} +{"train_loss": 0.014707548543810844, "global_step": 7825, "epoch": 65, "lr": 9.738865604778392e-05} +{"train_loss": 0.007634177803993225, "global_step": 7826, "epoch": 65, "lr": 9.738794937485604e-05} +{"train_loss": 0.010747809894382954, "global_step": 7827, "epoch": 65, "lr": 9.7387242608887e-05} +{"train_loss": 0.010617773048579693, "global_step": 7828, "epoch": 65, "lr": 9.738653574987816e-05} +{"train_loss": 0.01476758997887373, "global_step": 7829, "epoch": 65, "lr": 9.738582879783092e-05} +{"train_loss": 0.008271561935544014, "global_step": 7830, "epoch": 65, "lr": 9.738512175274667e-05} +{"train_loss": 0.010775847360491753, "global_step": 7831, "epoch": 65, "lr": 9.73844146146268e-05} +{"train_loss": 0.013908572494983673, "global_step": 7832, "epoch": 65, "lr": 9.738370738347269e-05} +{"train_loss": 0.01256883330643177, "global_step": 7833, "epoch": 65, "lr": 9.738300005928572e-05} +{"train_loss": 0.010772389359772205, "global_step": 7834, "epoch": 65, "lr": 9.738229264206731e-05} +{"train_loss": 0.006788498256355524, "global_step": 7835, "epoch": 65, "lr": 9.738158513181882e-05} +{"train_loss": 0.012120871804654598, "global_step": 7836, "epoch": 65, "lr": 9.738087752854166e-05} +{"train_loss": 0.012347135692834854, "global_step": 7837, "epoch": 65, "lr": 9.738016983223719e-05} +{"train_loss": 0.013820135965943336, "global_step": 7838, "epoch": 65, "lr": 9.737946204290683e-05} +{"train_loss": 0.01081645954400301, "global_step": 7839, "epoch": 65, "lr": 9.737875416055196e-05} +{"train_loss": 0.015119921416044235, "global_step": 7840, "epoch": 65, "lr": 9.737804618517396e-05} +{"train_loss": 0.010108845308423042, "global_step": 7841, "epoch": 65, "lr": 9.737733811677424e-05} +{"train_loss": 0.013149674981832504, "global_step": 7842, "epoch": 65, "lr": 9.737662995535417e-05} +{"train_loss": 0.011544805951416492, "global_step": 7843, "epoch": 65, "lr": 9.737592170091516e-05} +{"train_loss": 0.009819714352488518, "global_step": 7844, "epoch": 65, "lr": 9.737521335345858e-05} +{"train_loss": 0.00958100613206625, "global_step": 7845, "epoch": 65, "lr": 9.737450491298583e-05} +{"train_loss": 0.00938195176422596, "global_step": 7846, "epoch": 65, "lr": 9.73737963794983e-05} +{"train_loss": 0.012483608908951283, "global_step": 7847, "epoch": 65, "lr": 9.737308775299738e-05} +{"train_loss": 0.013087543658912182, "global_step": 7848, "epoch": 65, "lr": 9.737237903348446e-05} +{"train_loss": 0.01814253069460392, "global_step": 7849, "epoch": 65, "lr": 9.737167022096094e-05} +{"train_loss": 0.01294412836432457, "global_step": 7850, "epoch": 65, "lr": 9.73709613154282e-05} +{"train_loss": 0.01679937168955803, "global_step": 7851, "epoch": 65, "lr": 9.737025231688765e-05} +{"train_loss": 0.014498922973871231, "global_step": 7852, "epoch": 65, "lr": 9.736954322534068e-05} +{"train_loss": 0.011695040792946806, "global_step": 7853, "epoch": 65, "lr": 9.736883404078864e-05, "val_loss": 0.023177001625299454, "train_action_mse_error": 0.00047918822383508086} +{"train_loss": 0.009735116735100746, "global_step": 7854, "epoch": 66, "lr": 9.736812476323298e-05} +{"train_loss": 0.016140468418598175, "global_step": 7855, "epoch": 66, "lr": 9.736741539267507e-05} +{"train_loss": 0.009913317859172821, "global_step": 7856, "epoch": 66, "lr": 9.736670592911629e-05} +{"train_loss": 0.012136470526456833, "global_step": 7857, "epoch": 66, "lr": 9.736599637255804e-05} +{"train_loss": 0.01170895155519247, "global_step": 7858, "epoch": 66, "lr": 9.736528672300172e-05} +{"train_loss": 0.014029962942004204, "global_step": 7859, "epoch": 66, "lr": 9.736457698044871e-05} +{"train_loss": 0.013418905436992645, "global_step": 7860, "epoch": 66, "lr": 9.736386714490045e-05} +{"train_loss": 0.012886659242212772, "global_step": 7861, "epoch": 66, "lr": 9.736315721635825e-05} +{"train_loss": 0.01149182952940464, "global_step": 7862, "epoch": 66, "lr": 9.736244719482358e-05} +{"train_loss": 0.017507513985037804, "global_step": 7863, "epoch": 66, "lr": 9.736173708029779e-05} +{"train_loss": 0.007313946262001991, "global_step": 7864, "epoch": 66, "lr": 9.73610268727823e-05} +{"train_loss": 0.01195172592997551, "global_step": 7865, "epoch": 66, "lr": 9.736031657227849e-05} +{"train_loss": 0.020942561328411102, "global_step": 7866, "epoch": 66, "lr": 9.735960617878776e-05} +{"train_loss": 0.015390479005873203, "global_step": 7867, "epoch": 66, "lr": 9.73588956923115e-05} +{"train_loss": 0.015017109923064709, "global_step": 7868, "epoch": 66, "lr": 9.735818511285111e-05} +{"train_loss": 0.013192589394748211, "global_step": 7869, "epoch": 66, "lr": 9.735747444040796e-05} +{"train_loss": 0.01686953939497471, "global_step": 7870, "epoch": 66, "lr": 9.735676367498351e-05} +{"train_loss": 0.012350635603070259, "global_step": 7871, "epoch": 66, "lr": 9.73560528165791e-05} +{"train_loss": 0.011256466619670391, "global_step": 7872, "epoch": 66, "lr": 9.735534186519612e-05} +{"train_loss": 0.016715144738554955, "global_step": 7873, "epoch": 66, "lr": 9.7354630820836e-05} +{"train_loss": 0.015919633209705353, "global_step": 7874, "epoch": 66, "lr": 9.735391968350012e-05} +{"train_loss": 0.014666725881397724, "global_step": 7875, "epoch": 66, "lr": 9.735320845318986e-05} +{"train_loss": 0.014703628607094288, "global_step": 7876, "epoch": 66, "lr": 9.735249712990667e-05} +{"train_loss": 0.013396153226494789, "global_step": 7877, "epoch": 66, "lr": 9.735178571365189e-05} +{"train_loss": 0.018050700426101685, "global_step": 7878, "epoch": 66, "lr": 9.735107420442694e-05} +{"train_loss": 0.010871726088225842, "global_step": 7879, "epoch": 66, "lr": 9.735036260223321e-05} +{"train_loss": 0.011098283343017101, "global_step": 7880, "epoch": 66, "lr": 9.73496509070721e-05} +{"train_loss": 0.013099277392029762, "global_step": 7881, "epoch": 66, "lr": 9.734893911894502e-05} +{"train_loss": 0.011517403647303581, "global_step": 7882, "epoch": 66, "lr": 9.734822723785335e-05} +{"train_loss": 0.01229055318981409, "global_step": 7883, "epoch": 66, "lr": 9.734751526379851e-05} +{"train_loss": 0.015675831586122513, "global_step": 7884, "epoch": 66, "lr": 9.734680319678187e-05} +{"train_loss": 0.01298100408166647, "global_step": 7885, "epoch": 66, "lr": 9.734609103680483e-05} +{"train_loss": 0.014698725193738937, "global_step": 7886, "epoch": 66, "lr": 9.73453787838688e-05} +{"train_loss": 0.010940729640424252, "global_step": 7887, "epoch": 66, "lr": 9.73446664379752e-05} +{"train_loss": 0.014999196864664555, "global_step": 7888, "epoch": 66, "lr": 9.734395399912538e-05} +{"train_loss": 0.014880123548209667, "global_step": 7889, "epoch": 66, "lr": 9.734324146732077e-05} +{"train_loss": 0.012529682368040085, "global_step": 7890, "epoch": 66, "lr": 9.734252884256276e-05} +{"train_loss": 0.008573989383876324, "global_step": 7891, "epoch": 66, "lr": 9.734181612485276e-05} +{"train_loss": 0.013942431658506393, "global_step": 7892, "epoch": 66, "lr": 9.734110331419218e-05} +{"train_loss": 0.008878188207745552, "global_step": 7893, "epoch": 66, "lr": 9.734039041058238e-05} +{"train_loss": 0.012014338746666908, "global_step": 7894, "epoch": 66, "lr": 9.733967741402476e-05} +{"train_loss": 0.013515033759176731, "global_step": 7895, "epoch": 66, "lr": 9.733896432452077e-05} +{"train_loss": 0.009622949175536633, "global_step": 7896, "epoch": 66, "lr": 9.733825114207177e-05} +{"train_loss": 0.009958346374332905, "global_step": 7897, "epoch": 66, "lr": 9.733753786667918e-05} +{"train_loss": 0.013500858098268509, "global_step": 7898, "epoch": 66, "lr": 9.733682449834439e-05} +{"train_loss": 0.007630776613950729, "global_step": 7899, "epoch": 66, "lr": 9.733611103706881e-05} +{"train_loss": 0.01127308513969183, "global_step": 7900, "epoch": 66, "lr": 9.733539748285382e-05} +{"train_loss": 0.012598131783306599, "global_step": 7901, "epoch": 66, "lr": 9.733468383570083e-05} +{"train_loss": 0.013498129323124886, "global_step": 7902, "epoch": 66, "lr": 9.733397009561125e-05} +{"train_loss": 0.012805699370801449, "global_step": 7903, "epoch": 66, "lr": 9.73332562625865e-05} +{"train_loss": 0.009702485054731369, "global_step": 7904, "epoch": 66, "lr": 9.733254233662791e-05} +{"train_loss": 0.018450120463967323, "global_step": 7905, "epoch": 66, "lr": 9.733182831773697e-05} +{"train_loss": 0.008394061587750912, "global_step": 7906, "epoch": 66, "lr": 9.733111420591504e-05} +{"train_loss": 0.01590607315301895, "global_step": 7907, "epoch": 66, "lr": 9.73304000011635e-05} +{"train_loss": 0.008774449117481709, "global_step": 7908, "epoch": 66, "lr": 9.73296857034838e-05} +{"train_loss": 0.011219876818358898, "global_step": 7909, "epoch": 66, "lr": 9.73289713128773e-05} +{"train_loss": 0.007832926698029041, "global_step": 7910, "epoch": 66, "lr": 9.732825682934543e-05} +{"train_loss": 0.010865570046007633, "global_step": 7911, "epoch": 66, "lr": 9.732754225288958e-05} +{"train_loss": 0.009515486657619476, "global_step": 7912, "epoch": 66, "lr": 9.732682758351116e-05} +{"train_loss": 0.014108877629041672, "global_step": 7913, "epoch": 66, "lr": 9.732611282121157e-05} +{"train_loss": 0.011318535543978214, "global_step": 7914, "epoch": 66, "lr": 9.73253979659922e-05} +{"train_loss": 0.008578548207879066, "global_step": 7915, "epoch": 66, "lr": 9.732468301785449e-05} +{"train_loss": 0.010743137449026108, "global_step": 7916, "epoch": 66, "lr": 9.73239679767998e-05} +{"train_loss": 0.011153159663081169, "global_step": 7917, "epoch": 66, "lr": 9.732325284282958e-05} +{"train_loss": 0.010623132809996605, "global_step": 7918, "epoch": 66, "lr": 9.732253761594518e-05} +{"train_loss": 0.011387289501726627, "global_step": 7919, "epoch": 66, "lr": 9.732182229614806e-05} +{"train_loss": 0.013304049149155617, "global_step": 7920, "epoch": 66, "lr": 9.732110688343958e-05} +{"train_loss": 0.014790879562497139, "global_step": 7921, "epoch": 66, "lr": 9.732039137782117e-05} +{"train_loss": 0.011689428240060806, "global_step": 7922, "epoch": 66, "lr": 9.731967577929421e-05} +{"train_loss": 0.009280018508434296, "global_step": 7923, "epoch": 66, "lr": 9.731896008786014e-05} +{"train_loss": 0.008206183090806007, "global_step": 7924, "epoch": 66, "lr": 9.731824430352036e-05} +{"train_loss": 0.0127340666949749, "global_step": 7925, "epoch": 66, "lr": 9.731752842627624e-05} +{"train_loss": 0.014276783913373947, "global_step": 7926, "epoch": 66, "lr": 9.731681245612922e-05} +{"train_loss": 0.012379115447402, "global_step": 7927, "epoch": 66, "lr": 9.731609639308068e-05} +{"train_loss": 0.009446525946259499, "global_step": 7928, "epoch": 66, "lr": 9.731538023713205e-05} +{"train_loss": 0.012608981691300869, "global_step": 7929, "epoch": 66, "lr": 9.731466398828472e-05} +{"train_loss": 0.009107230231165886, "global_step": 7930, "epoch": 66, "lr": 9.73139476465401e-05} +{"train_loss": 0.007865425199270248, "global_step": 7931, "epoch": 66, "lr": 9.731323121189961e-05} +{"train_loss": 0.0096710454672575, "global_step": 7932, "epoch": 66, "lr": 9.731251468436465e-05} +{"train_loss": 0.013547301292419434, "global_step": 7933, "epoch": 66, "lr": 9.73117980639366e-05} +{"train_loss": 0.009437410160899162, "global_step": 7934, "epoch": 66, "lr": 9.731108135061691e-05} +{"train_loss": 0.01141597144305706, "global_step": 7935, "epoch": 66, "lr": 9.731036454440694e-05} +{"train_loss": 0.016827881336212158, "global_step": 7936, "epoch": 66, "lr": 9.730964764530815e-05} +{"train_loss": 0.015864280983805656, "global_step": 7937, "epoch": 66, "lr": 9.73089306533219e-05} +{"train_loss": 0.012808974832296371, "global_step": 7938, "epoch": 66, "lr": 9.730821356844964e-05} +{"train_loss": 0.010725126601755619, "global_step": 7939, "epoch": 66, "lr": 9.730749639069275e-05} +{"train_loss": 0.01169119868427515, "global_step": 7940, "epoch": 66, "lr": 9.730677912005263e-05} +{"train_loss": 0.012122740037739277, "global_step": 7941, "epoch": 66, "lr": 9.730606175653072e-05} +{"train_loss": 0.01581384614109993, "global_step": 7942, "epoch": 66, "lr": 9.730534430012841e-05} +{"train_loss": 0.013797695748507977, "global_step": 7943, "epoch": 66, "lr": 9.73046267508471e-05} +{"train_loss": 0.011898590251803398, "global_step": 7944, "epoch": 66, "lr": 9.730390910868822e-05} +{"train_loss": 0.007947628386318684, "global_step": 7945, "epoch": 66, "lr": 9.730319137365316e-05} +{"train_loss": 0.01777442917227745, "global_step": 7946, "epoch": 66, "lr": 9.730247354574335e-05} +{"train_loss": 0.0131519865244627, "global_step": 7947, "epoch": 66, "lr": 9.730175562496018e-05} +{"train_loss": 0.01579313725233078, "global_step": 7948, "epoch": 66, "lr": 9.730103761130506e-05} +{"train_loss": 0.0095036830753088, "global_step": 7949, "epoch": 66, "lr": 9.73003195047794e-05} +{"train_loss": 0.009697088971734047, "global_step": 7950, "epoch": 66, "lr": 9.729960130538464e-05} +{"train_loss": 0.011021781712770462, "global_step": 7951, "epoch": 66, "lr": 9.729888301312214e-05} +{"train_loss": 0.015032852999866009, "global_step": 7952, "epoch": 66, "lr": 9.729816462799336e-05} +{"train_loss": 0.014663208276033401, "global_step": 7953, "epoch": 66, "lr": 9.729744614999968e-05} +{"train_loss": 0.012292184866964817, "global_step": 7954, "epoch": 66, "lr": 9.72967275791425e-05} +{"train_loss": 0.01634858176112175, "global_step": 7955, "epoch": 66, "lr": 9.729600891542326e-05} +{"train_loss": 0.011997089721262455, "global_step": 7956, "epoch": 66, "lr": 9.729529015884337e-05} +{"train_loss": 0.010732700116932392, "global_step": 7957, "epoch": 66, "lr": 9.729457130940421e-05} +{"train_loss": 0.008300386369228363, "global_step": 7958, "epoch": 66, "lr": 9.729385236710723e-05} +{"train_loss": 0.011646485887467861, "global_step": 7959, "epoch": 66, "lr": 9.729313333195383e-05} +{"train_loss": 0.014034926891326904, "global_step": 7960, "epoch": 66, "lr": 9.72924142039454e-05} +{"train_loss": 0.01036222092807293, "global_step": 7961, "epoch": 66, "lr": 9.729169498308334e-05} +{"train_loss": 0.010438751429319382, "global_step": 7962, "epoch": 66, "lr": 9.729097566936913e-05} +{"train_loss": 0.007888957858085632, "global_step": 7963, "epoch": 66, "lr": 9.729025626280412e-05} +{"train_loss": 0.012631235644221306, "global_step": 7964, "epoch": 66, "lr": 9.728953676338977e-05} +{"train_loss": 0.01148508582264185, "global_step": 7965, "epoch": 66, "lr": 9.728881717112746e-05} +{"train_loss": 0.01266800332814455, "global_step": 7966, "epoch": 66, "lr": 9.728809748601859e-05} +{"train_loss": 0.011009952053427696, "global_step": 7967, "epoch": 66, "lr": 9.728737770806459e-05} +{"train_loss": 0.014297948218882084, "global_step": 7968, "epoch": 66, "lr": 9.72866578372669e-05} +{"train_loss": 0.009452147409319878, "global_step": 7969, "epoch": 66, "lr": 9.728593787362689e-05} +{"train_loss": 0.015237526036798954, "global_step": 7970, "epoch": 66, "lr": 9.728521781714601e-05} +{"train_loss": 0.00843233522027731, "global_step": 7971, "epoch": 66, "lr": 9.728449766782564e-05} +{"train_loss": 0.012302964330971743, "global_step": 7972, "epoch": 66, "lr": 9.728377742566723e-05, "val_loss": 0.02083118073642254} +{"train_loss": 0.009053672663867474, "global_step": 7973, "epoch": 67, "lr": 9.728305709067215e-05} +{"train_loss": 0.015390835702419281, "global_step": 7974, "epoch": 67, "lr": 9.728233666284186e-05} +{"train_loss": 0.010878448374569416, "global_step": 7975, "epoch": 67, "lr": 9.728161614217773e-05} +{"train_loss": 0.010319461114704609, "global_step": 7976, "epoch": 67, "lr": 9.728089552868123e-05} +{"train_loss": 0.009385181590914726, "global_step": 7977, "epoch": 67, "lr": 9.728017482235371e-05} +{"train_loss": 0.010449092835187912, "global_step": 7978, "epoch": 67, "lr": 9.727945402319663e-05} +{"train_loss": 0.007800178602337837, "global_step": 7979, "epoch": 67, "lr": 9.72787331312114e-05} +{"train_loss": 0.016298998147249222, "global_step": 7980, "epoch": 67, "lr": 9.727801214639942e-05} +{"train_loss": 0.010450963862240314, "global_step": 7981, "epoch": 67, "lr": 9.727729106876213e-05} +{"train_loss": 0.0075554572977125645, "global_step": 7982, "epoch": 67, "lr": 9.727656989830092e-05} +{"train_loss": 0.01316930539906025, "global_step": 7983, "epoch": 67, "lr": 9.72758486350172e-05} +{"train_loss": 0.008256789296865463, "global_step": 7984, "epoch": 67, "lr": 9.727512727891242e-05} +{"train_loss": 0.010617820546030998, "global_step": 7985, "epoch": 67, "lr": 9.727440582998797e-05} +{"train_loss": 0.010144585743546486, "global_step": 7986, "epoch": 67, "lr": 9.727368428824528e-05} +{"train_loss": 0.012790772132575512, "global_step": 7987, "epoch": 67, "lr": 9.727296265368576e-05} +{"train_loss": 0.010467964224517345, "global_step": 7988, "epoch": 67, "lr": 9.727224092631083e-05} +{"train_loss": 0.011405630968511105, "global_step": 7989, "epoch": 67, "lr": 9.727151910612191e-05} +{"train_loss": 0.01753072254359722, "global_step": 7990, "epoch": 67, "lr": 9.72707971931204e-05} +{"train_loss": 0.01230688113719225, "global_step": 7991, "epoch": 67, "lr": 9.727007518730772e-05} +{"train_loss": 0.012018167413771152, "global_step": 7992, "epoch": 67, "lr": 9.726935308868533e-05} +{"train_loss": 0.011225811205804348, "global_step": 7993, "epoch": 67, "lr": 9.72686308972546e-05} +{"train_loss": 0.014169053174555302, "global_step": 7994, "epoch": 67, "lr": 9.726790861301695e-05} +{"train_loss": 0.016162719577550888, "global_step": 7995, "epoch": 67, "lr": 9.726718623597384e-05} +{"train_loss": 0.006352712400257587, "global_step": 7996, "epoch": 67, "lr": 9.726646376612663e-05} +{"train_loss": 0.012006967328488827, "global_step": 7997, "epoch": 67, "lr": 9.726574120347678e-05} +{"train_loss": 0.013636542484164238, "global_step": 7998, "epoch": 67, "lr": 9.72650185480257e-05} +{"train_loss": 0.013998243026435375, "global_step": 7999, "epoch": 67, "lr": 9.726429579977481e-05} +{"train_loss": 0.011364788748323917, "global_step": 8000, "epoch": 67, "lr": 9.726357295872552e-05} +{"train_loss": 0.012570527382194996, "global_step": 8001, "epoch": 67, "lr": 9.726285002487925e-05} +{"train_loss": 0.01632997766137123, "global_step": 8002, "epoch": 67, "lr": 9.726212699823742e-05} +{"train_loss": 0.011618540622293949, "global_step": 8003, "epoch": 67, "lr": 9.726140387880146e-05} +{"train_loss": 0.00757077569141984, "global_step": 8004, "epoch": 67, "lr": 9.726068066657278e-05} +{"train_loss": 0.01770499162375927, "global_step": 8005, "epoch": 67, "lr": 9.72599573615528e-05} +{"train_loss": 0.01635369099676609, "global_step": 8006, "epoch": 67, "lr": 9.725923396374295e-05} +{"train_loss": 0.007815036922693253, "global_step": 8007, "epoch": 67, "lr": 9.725851047314463e-05} +{"train_loss": 0.013392971828579903, "global_step": 8008, "epoch": 67, "lr": 9.725778688975928e-05} +{"train_loss": 0.011398179456591606, "global_step": 8009, "epoch": 67, "lr": 9.725706321358832e-05} +{"train_loss": 0.014839592389762402, "global_step": 8010, "epoch": 67, "lr": 9.725633944463317e-05} +{"train_loss": 0.012458646669983864, "global_step": 8011, "epoch": 67, "lr": 9.725561558289524e-05} +{"train_loss": 0.013752015307545662, "global_step": 8012, "epoch": 67, "lr": 9.725489162837594e-05} +{"train_loss": 0.01250433549284935, "global_step": 8013, "epoch": 67, "lr": 9.725416758107673e-05} +{"train_loss": 0.011873859912157059, "global_step": 8014, "epoch": 67, "lr": 9.725344344099901e-05} +{"train_loss": 0.016509177163243294, "global_step": 8015, "epoch": 67, "lr": 9.725271920814418e-05} +{"train_loss": 0.013324162922799587, "global_step": 8016, "epoch": 67, "lr": 9.725199488251371e-05} +{"train_loss": 0.010778955183923244, "global_step": 8017, "epoch": 67, "lr": 9.725127046410898e-05} +{"train_loss": 0.010031851939857006, "global_step": 8018, "epoch": 67, "lr": 9.725054595293144e-05} +{"train_loss": 0.011970026418566704, "global_step": 8019, "epoch": 67, "lr": 9.72498213489825e-05} +{"train_loss": 0.01924203149974346, "global_step": 8020, "epoch": 67, "lr": 9.724909665226358e-05} +{"train_loss": 0.013848402537405491, "global_step": 8021, "epoch": 67, "lr": 9.72483718627761e-05} +{"train_loss": 0.008574149571359158, "global_step": 8022, "epoch": 67, "lr": 9.724764698052148e-05} +{"train_loss": 0.017094921320676804, "global_step": 8023, "epoch": 67, "lr": 9.724692200550119e-05} +{"train_loss": 0.016561411321163177, "global_step": 8024, "epoch": 67, "lr": 9.724619693771658e-05} +{"train_loss": 0.010397316887974739, "global_step": 8025, "epoch": 67, "lr": 9.724547177716912e-05} +{"train_loss": 0.010852939449250698, "global_step": 8026, "epoch": 67, "lr": 9.724474652386025e-05} +{"train_loss": 0.009239849634468555, "global_step": 8027, "epoch": 67, "lr": 9.724402117779134e-05} +{"train_loss": 0.01570061594247818, "global_step": 8028, "epoch": 67, "lr": 9.724329573896385e-05} +{"train_loss": 0.011883566156029701, "global_step": 8029, "epoch": 67, "lr": 9.724257020737919e-05} +{"train_loss": 0.010517912916839123, "global_step": 8030, "epoch": 67, "lr": 9.724184458303879e-05} +{"train_loss": 0.010563171468675137, "global_step": 8031, "epoch": 67, "lr": 9.724111886594406e-05} +{"train_loss": 0.010075045749545097, "global_step": 8032, "epoch": 67, "lr": 9.724039305609647e-05} +{"train_loss": 0.012622182257473469, "global_step": 8033, "epoch": 67, "lr": 9.72396671534974e-05} +{"train_loss": 0.009702648967504501, "global_step": 8034, "epoch": 67, "lr": 9.72389411581483e-05} +{"train_loss": 0.012240443378686905, "global_step": 8035, "epoch": 67, "lr": 9.723821507005057e-05} +{"train_loss": 0.01047433540225029, "global_step": 8036, "epoch": 67, "lr": 9.723748888920568e-05} +{"train_loss": 0.012650650925934315, "global_step": 8037, "epoch": 67, "lr": 9.7236762615615e-05} +{"train_loss": 0.012470094487071037, "global_step": 8038, "epoch": 67, "lr": 9.723603624927999e-05} +{"train_loss": 0.006561023183166981, "global_step": 8039, "epoch": 67, "lr": 9.723530979020208e-05} +{"train_loss": 0.009877617470920086, "global_step": 8040, "epoch": 67, "lr": 9.723458323838268e-05} +{"train_loss": 0.008771871216595173, "global_step": 8041, "epoch": 67, "lr": 9.72338565938232e-05} +{"train_loss": 0.012939964421093464, "global_step": 8042, "epoch": 67, "lr": 9.723312985652512e-05} +{"train_loss": 0.014974711462855339, "global_step": 8043, "epoch": 67, "lr": 9.723240302648982e-05} +{"train_loss": 0.007662735879421234, "global_step": 8044, "epoch": 67, "lr": 9.723167610371875e-05} +{"train_loss": 0.011072378605604172, "global_step": 8045, "epoch": 67, "lr": 9.723094908821332e-05} +{"train_loss": 0.011486690491437912, "global_step": 8046, "epoch": 67, "lr": 9.723022197997497e-05} +{"train_loss": 0.014262315817177296, "global_step": 8047, "epoch": 67, "lr": 9.722949477900513e-05} +{"train_loss": 0.012672538869082928, "global_step": 8048, "epoch": 67, "lr": 9.722876748530523e-05} +{"train_loss": 0.009252031333744526, "global_step": 8049, "epoch": 67, "lr": 9.722804009887668e-05} +{"train_loss": 0.010723227635025978, "global_step": 8050, "epoch": 67, "lr": 9.722731261972092e-05} +{"train_loss": 0.019521374255418777, "global_step": 8051, "epoch": 67, "lr": 9.722658504783936e-05} +{"train_loss": 0.012059465982019901, "global_step": 8052, "epoch": 67, "lr": 9.722585738323347e-05} +{"train_loss": 0.012563071213662624, "global_step": 8053, "epoch": 67, "lr": 9.722512962590465e-05} +{"train_loss": 0.010000886395573616, "global_step": 8054, "epoch": 67, "lr": 9.722440177585433e-05} +{"train_loss": 0.006595246959477663, "global_step": 8055, "epoch": 67, "lr": 9.722367383308395e-05} +{"train_loss": 0.009483139961957932, "global_step": 8056, "epoch": 67, "lr": 9.722294579759492e-05} +{"train_loss": 0.010925572365522385, "global_step": 8057, "epoch": 67, "lr": 9.722221766938868e-05} +{"train_loss": 0.010183229111135006, "global_step": 8058, "epoch": 67, "lr": 9.722148944846667e-05} +{"train_loss": 0.013869554735720158, "global_step": 8059, "epoch": 67, "lr": 9.72207611348303e-05} +{"train_loss": 0.008750645443797112, "global_step": 8060, "epoch": 67, "lr": 9.722003272848101e-05} +{"train_loss": 0.02233673445880413, "global_step": 8061, "epoch": 67, "lr": 9.721930422942025e-05} +{"train_loss": 0.01128885243088007, "global_step": 8062, "epoch": 67, "lr": 9.721857563764942e-05} +{"train_loss": 0.012542416341602802, "global_step": 8063, "epoch": 67, "lr": 9.721784695316995e-05} +{"train_loss": 0.01071538683027029, "global_step": 8064, "epoch": 67, "lr": 9.72171181759833e-05} +{"train_loss": 0.011548968032002449, "global_step": 8065, "epoch": 67, "lr": 9.721638930609088e-05} +{"train_loss": 0.00950285978615284, "global_step": 8066, "epoch": 67, "lr": 9.72156603434941e-05} +{"train_loss": 0.009576629847288132, "global_step": 8067, "epoch": 67, "lr": 9.721493128819445e-05} +{"train_loss": 0.012452255934476852, "global_step": 8068, "epoch": 67, "lr": 9.72142021401933e-05} +{"train_loss": 0.007282237522304058, "global_step": 8069, "epoch": 67, "lr": 9.721347289949211e-05} +{"train_loss": 0.013978449627757072, "global_step": 8070, "epoch": 67, "lr": 9.721274356609233e-05} +{"train_loss": 0.0070711346343159676, "global_step": 8071, "epoch": 67, "lr": 9.721201413999536e-05} +{"train_loss": 0.013331456109881401, "global_step": 8072, "epoch": 67, "lr": 9.721128462120264e-05} +{"train_loss": 0.012276769615709782, "global_step": 8073, "epoch": 67, "lr": 9.721055500971561e-05} +{"train_loss": 0.007214425131678581, "global_step": 8074, "epoch": 67, "lr": 9.72098253055357e-05} +{"train_loss": 0.016367651522159576, "global_step": 8075, "epoch": 67, "lr": 9.720909550866436e-05} +{"train_loss": 0.014726100489497185, "global_step": 8076, "epoch": 67, "lr": 9.720836561910297e-05} +{"train_loss": 0.011942586861550808, "global_step": 8077, "epoch": 67, "lr": 9.720763563685301e-05} +{"train_loss": 0.015620943158864975, "global_step": 8078, "epoch": 67, "lr": 9.72069055619159e-05} +{"train_loss": 0.009744750335812569, "global_step": 8079, "epoch": 67, "lr": 9.720617539429309e-05} +{"train_loss": 0.009468774311244488, "global_step": 8080, "epoch": 67, "lr": 9.720544513398597e-05} +{"train_loss": 0.01438906043767929, "global_step": 8081, "epoch": 67, "lr": 9.720471478099602e-05} +{"train_loss": 0.010145477950572968, "global_step": 8082, "epoch": 67, "lr": 9.720398433532466e-05} +{"train_loss": 0.005981401074677706, "global_step": 8083, "epoch": 67, "lr": 9.720325379697332e-05} +{"train_loss": 0.014296600595116615, "global_step": 8084, "epoch": 67, "lr": 9.720252316594342e-05} +{"train_loss": 0.012885447591543198, "global_step": 8085, "epoch": 67, "lr": 9.720179244223642e-05} +{"train_loss": 0.008791974745690823, "global_step": 8086, "epoch": 67, "lr": 9.720106162585375e-05} +{"train_loss": 0.011939069256186485, "global_step": 8087, "epoch": 67, "lr": 9.720033071679682e-05} +{"train_loss": 0.009641405194997787, "global_step": 8088, "epoch": 67, "lr": 9.719959971506708e-05} +{"train_loss": 0.007771642412990332, "global_step": 8089, "epoch": 67, "lr": 9.719886862066598e-05} +{"train_loss": 0.01478962879627943, "global_step": 8090, "epoch": 67, "lr": 9.719813743359494e-05} +{"train_loss": 0.011872512511439434, "global_step": 8091, "epoch": 67, "lr": 9.71974061538554e-05, "val_loss": 0.02074369788169861} +{"train_loss": 0.009205708280205727, "global_step": 8092, "epoch": 68, "lr": 9.71966747814488e-05} +{"train_loss": 0.011259956285357475, "global_step": 8093, "epoch": 68, "lr": 9.719594331637657e-05} +{"train_loss": 0.011710633523762226, "global_step": 8094, "epoch": 68, "lr": 9.719521175864014e-05} +{"train_loss": 0.012288952246308327, "global_step": 8095, "epoch": 68, "lr": 9.719448010824097e-05} +{"train_loss": 0.016328418627381325, "global_step": 8096, "epoch": 68, "lr": 9.719374836518047e-05} +{"train_loss": 0.013796119019389153, "global_step": 8097, "epoch": 68, "lr": 9.71930165294601e-05} +{"train_loss": 0.01208141166716814, "global_step": 8098, "epoch": 68, "lr": 9.719228460108125e-05} +{"train_loss": 0.013414223678410053, "global_step": 8099, "epoch": 68, "lr": 9.719155258004543e-05} +{"train_loss": 0.016155514866113663, "global_step": 8100, "epoch": 68, "lr": 9.719082046635402e-05} +{"train_loss": 0.009294014424085617, "global_step": 8101, "epoch": 68, "lr": 9.719008826000846e-05} +{"train_loss": 0.012861407361924648, "global_step": 8102, "epoch": 68, "lr": 9.718935596101021e-05} +{"train_loss": 0.018813539296388626, "global_step": 8103, "epoch": 68, "lr": 9.718862356936073e-05} +{"train_loss": 0.013264971785247326, "global_step": 8104, "epoch": 68, "lr": 9.718789108506141e-05} +{"train_loss": 0.013425428420305252, "global_step": 8105, "epoch": 68, "lr": 9.71871585081137e-05} +{"train_loss": 0.012897166423499584, "global_step": 8106, "epoch": 68, "lr": 9.718642583851904e-05} +{"train_loss": 0.010895551182329655, "global_step": 8107, "epoch": 68, "lr": 9.718569307627889e-05} +{"train_loss": 0.017822708934545517, "global_step": 8108, "epoch": 68, "lr": 9.718496022139468e-05} +{"train_loss": 0.012263800948858261, "global_step": 8109, "epoch": 68, "lr": 9.718422727386783e-05} +{"train_loss": 0.011610855348408222, "global_step": 8110, "epoch": 68, "lr": 9.718349423369979e-05} +{"train_loss": 0.011254019103944302, "global_step": 8111, "epoch": 68, "lr": 9.718276110089199e-05} +{"train_loss": 0.022220442071557045, "global_step": 8112, "epoch": 68, "lr": 9.718202787544591e-05} +{"train_loss": 0.011831843294203281, "global_step": 8113, "epoch": 68, "lr": 9.718129455736293e-05} +{"train_loss": 0.017246661707758904, "global_step": 8114, "epoch": 68, "lr": 9.718056114664453e-05} +{"train_loss": 0.017884472385048866, "global_step": 8115, "epoch": 68, "lr": 9.717982764329213e-05} +{"train_loss": 0.01397189311683178, "global_step": 8116, "epoch": 68, "lr": 9.717909404730719e-05} +{"train_loss": 0.01241361629217863, "global_step": 8117, "epoch": 68, "lr": 9.717836035869113e-05} +{"train_loss": 0.012399503029882908, "global_step": 8118, "epoch": 68, "lr": 9.71776265774454e-05} +{"train_loss": 0.010649583302438259, "global_step": 8119, "epoch": 68, "lr": 9.717689270357144e-05} +{"train_loss": 0.00826318096369505, "global_step": 8120, "epoch": 68, "lr": 9.717615873707071e-05} +{"train_loss": 0.009869730100035667, "global_step": 8121, "epoch": 68, "lr": 9.717542467794462e-05} +{"train_loss": 0.011868486180901527, "global_step": 8122, "epoch": 68, "lr": 9.717469052619462e-05} +{"train_loss": 0.014599756337702274, "global_step": 8123, "epoch": 68, "lr": 9.717395628182215e-05} +{"train_loss": 0.016599230468273163, "global_step": 8124, "epoch": 68, "lr": 9.717322194482866e-05} +{"train_loss": 0.0132904639467597, "global_step": 8125, "epoch": 68, "lr": 9.71724875152156e-05} +{"train_loss": 0.010521295480430126, "global_step": 8126, "epoch": 68, "lr": 9.71717529929844e-05} +{"train_loss": 0.011711004190146923, "global_step": 8127, "epoch": 68, "lr": 9.717101837813649e-05} +{"train_loss": 0.013678007759153843, "global_step": 8128, "epoch": 68, "lr": 9.717028367067333e-05} +{"train_loss": 0.01002467330545187, "global_step": 8129, "epoch": 68, "lr": 9.716954887059634e-05} +{"train_loss": 0.01064135693013668, "global_step": 8130, "epoch": 68, "lr": 9.7168813977907e-05} +{"train_loss": 0.016309676691889763, "global_step": 8131, "epoch": 68, "lr": 9.716807899260674e-05} +{"train_loss": 0.008965576067566872, "global_step": 8132, "epoch": 68, "lr": 9.716734391469699e-05} +{"train_loss": 0.01848832331597805, "global_step": 8133, "epoch": 68, "lr": 9.71666087441792e-05} +{"train_loss": 0.008551405742764473, "global_step": 8134, "epoch": 68, "lr": 9.716587348105479e-05} +{"train_loss": 0.014051953330636024, "global_step": 8135, "epoch": 68, "lr": 9.716513812532525e-05} +{"train_loss": 0.009851673617959023, "global_step": 8136, "epoch": 68, "lr": 9.716440267699199e-05} +{"train_loss": 0.013135384768247604, "global_step": 8137, "epoch": 68, "lr": 9.716366713605647e-05} +{"train_loss": 0.012652973644435406, "global_step": 8138, "epoch": 68, "lr": 9.716293150252014e-05} +{"train_loss": 0.012315685860812664, "global_step": 8139, "epoch": 68, "lr": 9.716219577638442e-05} +{"train_loss": 0.008823655545711517, "global_step": 8140, "epoch": 68, "lr": 9.716145995765076e-05} +{"train_loss": 0.010449854657053947, "global_step": 8141, "epoch": 68, "lr": 9.716072404632062e-05} +{"train_loss": 0.010732774622738361, "global_step": 8142, "epoch": 68, "lr": 9.715998804239543e-05} +{"train_loss": 0.01028000470250845, "global_step": 8143, "epoch": 68, "lr": 9.715925194587665e-05} +{"train_loss": 0.008340294472873211, "global_step": 8144, "epoch": 68, "lr": 9.715851575676571e-05} +{"train_loss": 0.01334956381469965, "global_step": 8145, "epoch": 68, "lr": 9.715777947506408e-05} +{"train_loss": 0.012202964164316654, "global_step": 8146, "epoch": 68, "lr": 9.715704310077316e-05} +{"train_loss": 0.01113848015666008, "global_step": 8147, "epoch": 68, "lr": 9.715630663389444e-05} +{"train_loss": 0.014729158021509647, "global_step": 8148, "epoch": 68, "lr": 9.715557007442934e-05} +{"train_loss": 0.012951362878084183, "global_step": 8149, "epoch": 68, "lr": 9.715483342237934e-05} +{"train_loss": 0.012210262008011341, "global_step": 8150, "epoch": 68, "lr": 9.715409667774584e-05} +{"train_loss": 0.01078202947974205, "global_step": 8151, "epoch": 68, "lr": 9.715335984053031e-05} +{"train_loss": 0.014699378982186317, "global_step": 8152, "epoch": 68, "lr": 9.715262291073422e-05} +{"train_loss": 0.00921525340527296, "global_step": 8153, "epoch": 68, "lr": 9.715188588835896e-05} +{"train_loss": 0.014070791192352772, "global_step": 8154, "epoch": 68, "lr": 9.715114877340603e-05} +{"train_loss": 0.007544683292508125, "global_step": 8155, "epoch": 68, "lr": 9.715041156587685e-05} +{"train_loss": 0.009589994326233864, "global_step": 8156, "epoch": 68, "lr": 9.714967426577287e-05} +{"train_loss": 0.014246267266571522, "global_step": 8157, "epoch": 68, "lr": 9.714893687309554e-05} +{"train_loss": 0.011064188554883003, "global_step": 8158, "epoch": 68, "lr": 9.714819938784632e-05} +{"train_loss": 0.013111842796206474, "global_step": 8159, "epoch": 68, "lr": 9.714746181002666e-05} +{"train_loss": 0.009331072680652142, "global_step": 8160, "epoch": 68, "lr": 9.714672413963796e-05} +{"train_loss": 0.012820275500416756, "global_step": 8161, "epoch": 68, "lr": 9.714598637668173e-05} +{"train_loss": 0.01791001483798027, "global_step": 8162, "epoch": 68, "lr": 9.714524852115939e-05} +{"train_loss": 0.010092714801430702, "global_step": 8163, "epoch": 68, "lr": 9.714451057307238e-05} +{"train_loss": 0.008643408305943012, "global_step": 8164, "epoch": 68, "lr": 9.714377253242218e-05} +{"train_loss": 0.007681187242269516, "global_step": 8165, "epoch": 68, "lr": 9.71430343992102e-05} +{"train_loss": 0.011081928387284279, "global_step": 8166, "epoch": 68, "lr": 9.71422961734379e-05} +{"train_loss": 0.010721527971327305, "global_step": 8167, "epoch": 68, "lr": 9.714155785510675e-05} +{"train_loss": 0.008194642141461372, "global_step": 8168, "epoch": 68, "lr": 9.71408194442182e-05} +{"train_loss": 0.015671394765377045, "global_step": 8169, "epoch": 68, "lr": 9.714008094077366e-05} +{"train_loss": 0.013983914628624916, "global_step": 8170, "epoch": 68, "lr": 9.713934234477465e-05} +{"train_loss": 0.011010106652975082, "global_step": 8171, "epoch": 68, "lr": 9.713860365622253e-05} +{"train_loss": 0.011661423370242119, "global_step": 8172, "epoch": 68, "lr": 9.713786487511882e-05} +{"train_loss": 0.013969136402010918, "global_step": 8173, "epoch": 68, "lr": 9.713712600146496e-05} +{"train_loss": 0.008328566327691078, "global_step": 8174, "epoch": 68, "lr": 9.713638703526237e-05} +{"train_loss": 0.01369066908955574, "global_step": 8175, "epoch": 68, "lr": 9.713564797651253e-05} +{"train_loss": 0.008703062310814857, "global_step": 8176, "epoch": 68, "lr": 9.713490882521687e-05} +{"train_loss": 0.015024490654468536, "global_step": 8177, "epoch": 68, "lr": 9.713416958137686e-05} +{"train_loss": 0.011335956864058971, "global_step": 8178, "epoch": 68, "lr": 9.713343024499395e-05} +{"train_loss": 0.01374009344726801, "global_step": 8179, "epoch": 68, "lr": 9.713269081606957e-05} +{"train_loss": 0.008775981143116951, "global_step": 8180, "epoch": 68, "lr": 9.71319512946052e-05} +{"train_loss": 0.010914596728980541, "global_step": 8181, "epoch": 68, "lr": 9.713121168060228e-05} +{"train_loss": 0.011897454038262367, "global_step": 8182, "epoch": 68, "lr": 9.713047197406224e-05} +{"train_loss": 0.00825597159564495, "global_step": 8183, "epoch": 68, "lr": 9.712973217498657e-05} +{"train_loss": 0.011969790793955326, "global_step": 8184, "epoch": 68, "lr": 9.71289922833767e-05} +{"train_loss": 0.010834692977368832, "global_step": 8185, "epoch": 68, "lr": 9.71282522992341e-05} +{"train_loss": 0.007935348898172379, "global_step": 8186, "epoch": 68, "lr": 9.712751222256022e-05} +{"train_loss": 0.012705652043223381, "global_step": 8187, "epoch": 68, "lr": 9.712677205335647e-05} +{"train_loss": 0.013632223941385746, "global_step": 8188, "epoch": 68, "lr": 9.712603179162436e-05} +{"train_loss": 0.01134371105581522, "global_step": 8189, "epoch": 68, "lr": 9.712529143736533e-05} +{"train_loss": 0.009266044944524765, "global_step": 8190, "epoch": 68, "lr": 9.712455099058081e-05} +{"train_loss": 0.00883998442441225, "global_step": 8191, "epoch": 68, "lr": 9.712381045127228e-05} +{"train_loss": 0.006562441121786833, "global_step": 8192, "epoch": 68, "lr": 9.712306981944117e-05} +{"train_loss": 0.01279706135392189, "global_step": 8193, "epoch": 68, "lr": 9.712232909508894e-05} +{"train_loss": 0.01376758236438036, "global_step": 8194, "epoch": 68, "lr": 9.712158827821707e-05} +{"train_loss": 0.00947008840739727, "global_step": 8195, "epoch": 68, "lr": 9.712084736882698e-05} +{"train_loss": 0.010915971361100674, "global_step": 8196, "epoch": 68, "lr": 9.712010636692015e-05} +{"train_loss": 0.012411723844707012, "global_step": 8197, "epoch": 68, "lr": 9.711936527249803e-05} +{"train_loss": 0.011809790506958961, "global_step": 8198, "epoch": 68, "lr": 9.711862408556207e-05} +{"train_loss": 0.009776083752512932, "global_step": 8199, "epoch": 68, "lr": 9.711788280611372e-05} +{"train_loss": 0.015570690855383873, "global_step": 8200, "epoch": 68, "lr": 9.711714143415443e-05} +{"train_loss": 0.011674963869154453, "global_step": 8201, "epoch": 68, "lr": 9.711639996968568e-05} +{"train_loss": 0.007566729094833136, "global_step": 8202, "epoch": 68, "lr": 9.711565841270891e-05} +{"train_loss": 0.014319613575935364, "global_step": 8203, "epoch": 68, "lr": 9.711491676322557e-05} +{"train_loss": 0.00956120528280735, "global_step": 8204, "epoch": 68, "lr": 9.711417502123715e-05} +{"train_loss": 0.012659438885748386, "global_step": 8205, "epoch": 68, "lr": 9.711343318674504e-05} +{"train_loss": 0.01212329138070345, "global_step": 8206, "epoch": 68, "lr": 9.711269125975076e-05} +{"train_loss": 0.02013949118554592, "global_step": 8207, "epoch": 68, "lr": 9.711194924025575e-05} +{"train_loss": 0.00664921198040247, "global_step": 8208, "epoch": 68, "lr": 9.711120712826145e-05} +{"train_loss": 0.008459893055260181, "global_step": 8209, "epoch": 68, "lr": 9.711046492376933e-05} +{"train_loss": 0.01213802968566658, "global_step": 8210, "epoch": 68, "lr": 9.710972262678085e-05, "val_loss": 0.024862919002771378} +{"train_loss": 0.008670582436025143, "global_step": 8211, "epoch": 69, "lr": 9.710898023729747e-05} +{"train_loss": 0.009113982319831848, "global_step": 8212, "epoch": 69, "lr": 9.710823775532063e-05} +{"train_loss": 0.007677431218326092, "global_step": 8213, "epoch": 69, "lr": 9.71074951808518e-05} +{"train_loss": 0.009960240684449673, "global_step": 8214, "epoch": 69, "lr": 9.710675251389243e-05} +{"train_loss": 0.005989415105432272, "global_step": 8215, "epoch": 69, "lr": 9.710600975444399e-05} +{"train_loss": 0.014015172608196735, "global_step": 8216, "epoch": 69, "lr": 9.710526690250792e-05} +{"train_loss": 0.018626196309924126, "global_step": 8217, "epoch": 69, "lr": 9.710452395808571e-05} +{"train_loss": 0.012944391928613186, "global_step": 8218, "epoch": 69, "lr": 9.710378092117879e-05} +{"train_loss": 0.011412269435822964, "global_step": 8219, "epoch": 69, "lr": 9.710303779178861e-05} +{"train_loss": 0.013089514337480068, "global_step": 8220, "epoch": 69, "lr": 9.710229456991668e-05} +{"train_loss": 0.01262423675507307, "global_step": 8221, "epoch": 69, "lr": 9.710155125556442e-05} +{"train_loss": 0.014565576799213886, "global_step": 8222, "epoch": 69, "lr": 9.710080784873329e-05} +{"train_loss": 0.007233234588056803, "global_step": 8223, "epoch": 69, "lr": 9.710006434942476e-05} +{"train_loss": 0.012836637906730175, "global_step": 8224, "epoch": 69, "lr": 9.709932075764028e-05} +{"train_loss": 0.010388932190835476, "global_step": 8225, "epoch": 69, "lr": 9.70985770733813e-05} +{"train_loss": 0.01056020986288786, "global_step": 8226, "epoch": 69, "lr": 9.709783329664932e-05} +{"train_loss": 0.012941686436533928, "global_step": 8227, "epoch": 69, "lr": 9.709708942744578e-05} +{"train_loss": 0.014949554577469826, "global_step": 8228, "epoch": 69, "lr": 9.709634546577211e-05} +{"train_loss": 0.009550695307552814, "global_step": 8229, "epoch": 69, "lr": 9.709560141162981e-05} +{"train_loss": 0.01016977895051241, "global_step": 8230, "epoch": 69, "lr": 9.709485726502034e-05} +{"train_loss": 0.016411466524004936, "global_step": 8231, "epoch": 69, "lr": 9.709411302594513e-05} +{"train_loss": 0.01703481376171112, "global_step": 8232, "epoch": 69, "lr": 9.709336869440568e-05} +{"train_loss": 0.010846557095646858, "global_step": 8233, "epoch": 69, "lr": 9.709262427040342e-05} +{"train_loss": 0.008798690512776375, "global_step": 8234, "epoch": 69, "lr": 9.709187975393983e-05} +{"train_loss": 0.01672111265361309, "global_step": 8235, "epoch": 69, "lr": 9.709113514501635e-05} +{"train_loss": 0.010122808627784252, "global_step": 8236, "epoch": 69, "lr": 9.709039044363446e-05} +{"train_loss": 0.010075352154672146, "global_step": 8237, "epoch": 69, "lr": 9.708964564979564e-05} +{"train_loss": 0.009418641217052937, "global_step": 8238, "epoch": 69, "lr": 9.708890076350131e-05} +{"train_loss": 0.008567048236727715, "global_step": 8239, "epoch": 69, "lr": 9.708815578475297e-05} +{"train_loss": 0.009659118950366974, "global_step": 8240, "epoch": 69, "lr": 9.708741071355205e-05} +{"train_loss": 0.011051212437450886, "global_step": 8241, "epoch": 69, "lr": 9.708666554990005e-05} +{"train_loss": 0.015295659191906452, "global_step": 8242, "epoch": 69, "lr": 9.70859202937984e-05} +{"train_loss": 0.0136801078915596, "global_step": 8243, "epoch": 69, "lr": 9.708517494524856e-05} +{"train_loss": 0.011444922536611557, "global_step": 8244, "epoch": 69, "lr": 9.708442950425202e-05} +{"train_loss": 0.01974276266992092, "global_step": 8245, "epoch": 69, "lr": 9.708368397081025e-05} +{"train_loss": 0.010773565620183945, "global_step": 8246, "epoch": 69, "lr": 9.708293834492467e-05} +{"train_loss": 0.011270931921899319, "global_step": 8247, "epoch": 69, "lr": 9.70821926265968e-05} +{"train_loss": 0.012914787977933884, "global_step": 8248, "epoch": 69, "lr": 9.708144681582807e-05} +{"train_loss": 0.010032154619693756, "global_step": 8249, "epoch": 69, "lr": 9.708070091261994e-05} +{"train_loss": 0.009600292891263962, "global_step": 8250, "epoch": 69, "lr": 9.707995491697389e-05} +{"train_loss": 0.011797275394201279, "global_step": 8251, "epoch": 69, "lr": 9.707920882889136e-05} +{"train_loss": 0.008782850578427315, "global_step": 8252, "epoch": 69, "lr": 9.707846264837384e-05} +{"train_loss": 0.007934422232210636, "global_step": 8253, "epoch": 69, "lr": 9.70777163754228e-05} +{"train_loss": 0.00881162192672491, "global_step": 8254, "epoch": 69, "lr": 9.707697001003968e-05} +{"train_loss": 0.016125433146953583, "global_step": 8255, "epoch": 69, "lr": 9.707622355222597e-05} +{"train_loss": 0.016132108867168427, "global_step": 8256, "epoch": 69, "lr": 9.707547700198312e-05} +{"train_loss": 0.012259313836693764, "global_step": 8257, "epoch": 69, "lr": 9.70747303593126e-05} +{"train_loss": 0.00641837390139699, "global_step": 8258, "epoch": 69, "lr": 9.707398362421587e-05} +{"train_loss": 0.014517052099108696, "global_step": 8259, "epoch": 69, "lr": 9.70732367966944e-05} +{"train_loss": 0.012104567140340805, "global_step": 8260, "epoch": 69, "lr": 9.707248987674969e-05} +{"train_loss": 0.011928536929190159, "global_step": 8261, "epoch": 69, "lr": 9.707174286438315e-05} +{"train_loss": 0.01093523483723402, "global_step": 8262, "epoch": 69, "lr": 9.707099575959626e-05} +{"train_loss": 0.016659531742334366, "global_step": 8263, "epoch": 69, "lr": 9.707024856239052e-05} +{"train_loss": 0.007412059232592583, "global_step": 8264, "epoch": 69, "lr": 9.706950127276737e-05} +{"train_loss": 0.015190225094556808, "global_step": 8265, "epoch": 69, "lr": 9.706875389072827e-05} +{"train_loss": 0.01048219297081232, "global_step": 8266, "epoch": 69, "lr": 9.706800641627471e-05} +{"train_loss": 0.01561150886118412, "global_step": 8267, "epoch": 69, "lr": 9.706725884940815e-05} +{"train_loss": 0.00949386227875948, "global_step": 8268, "epoch": 69, "lr": 9.706651119013006e-05} +{"train_loss": 0.011561294086277485, "global_step": 8269, "epoch": 69, "lr": 9.706576343844189e-05} +{"train_loss": 0.009777727536857128, "global_step": 8270, "epoch": 69, "lr": 9.706501559434513e-05} +{"train_loss": 0.013021147809922695, "global_step": 8271, "epoch": 69, "lr": 9.706426765784125e-05} +{"train_loss": 0.011239747516810894, "global_step": 8272, "epoch": 69, "lr": 9.70635196289317e-05} +{"train_loss": 0.012406561523675919, "global_step": 8273, "epoch": 69, "lr": 9.706277150761795e-05} +{"train_loss": 0.011840825900435448, "global_step": 8274, "epoch": 69, "lr": 9.706202329390149e-05} +{"train_loss": 0.011931692250072956, "global_step": 8275, "epoch": 69, "lr": 9.706127498778376e-05} +{"train_loss": 0.013811501674354076, "global_step": 8276, "epoch": 69, "lr": 9.706052658926626e-05} +{"train_loss": 0.01586359366774559, "global_step": 8277, "epoch": 69, "lr": 9.705977809835043e-05} +{"train_loss": 0.01461697556078434, "global_step": 8278, "epoch": 69, "lr": 9.705902951503776e-05} +{"train_loss": 0.006895834114402533, "global_step": 8279, "epoch": 69, "lr": 9.70582808393297e-05} +{"train_loss": 0.010645733214914799, "global_step": 8280, "epoch": 69, "lr": 9.705753207122775e-05} +{"train_loss": 0.014752556569874287, "global_step": 8281, "epoch": 69, "lr": 9.705678321073336e-05} +{"train_loss": 0.011467421427369118, "global_step": 8282, "epoch": 69, "lr": 9.7056034257848e-05} +{"train_loss": 0.013585373759269714, "global_step": 8283, "epoch": 69, "lr": 9.705528521257315e-05} +{"train_loss": 0.012674261815845966, "global_step": 8284, "epoch": 69, "lr": 9.705453607491026e-05} +{"train_loss": 0.01229705847799778, "global_step": 8285, "epoch": 69, "lr": 9.705378684486084e-05} +{"train_loss": 0.011960070580244064, "global_step": 8286, "epoch": 69, "lr": 9.705303752242632e-05} +{"train_loss": 0.010162770748138428, "global_step": 8287, "epoch": 69, "lr": 9.705228810760818e-05} +{"train_loss": 0.011955659836530685, "global_step": 8288, "epoch": 69, "lr": 9.705153860040792e-05} +{"train_loss": 0.013842668384313583, "global_step": 8289, "epoch": 69, "lr": 9.705078900082697e-05} +{"train_loss": 0.01153523102402687, "global_step": 8290, "epoch": 69, "lr": 9.705003930886683e-05} +{"train_loss": 0.00877468567341566, "global_step": 8291, "epoch": 69, "lr": 9.704928952452897e-05} +{"train_loss": 0.00820923876017332, "global_step": 8292, "epoch": 69, "lr": 9.704853964781483e-05} +{"train_loss": 0.016075698658823967, "global_step": 8293, "epoch": 69, "lr": 9.704778967872594e-05} +{"train_loss": 0.010527270846068859, "global_step": 8294, "epoch": 69, "lr": 9.704703961726374e-05} +{"train_loss": 0.011491254903376102, "global_step": 8295, "epoch": 69, "lr": 9.70462894634297e-05} +{"train_loss": 0.008832426741719246, "global_step": 8296, "epoch": 69, "lr": 9.704553921722529e-05} +{"train_loss": 0.015249420888721943, "global_step": 8297, "epoch": 69, "lr": 9.704478887865199e-05} +{"train_loss": 0.01588086038827896, "global_step": 8298, "epoch": 69, "lr": 9.704403844771128e-05} +{"train_loss": 0.010369841009378433, "global_step": 8299, "epoch": 69, "lr": 9.704328792440463e-05} +{"train_loss": 0.009959762915968895, "global_step": 8300, "epoch": 69, "lr": 9.70425373087335e-05} +{"train_loss": 0.016008496284484863, "global_step": 8301, "epoch": 69, "lr": 9.704178660069937e-05} +{"train_loss": 0.01493439543992281, "global_step": 8302, "epoch": 69, "lr": 9.704103580030373e-05} +{"train_loss": 0.01154683344066143, "global_step": 8303, "epoch": 69, "lr": 9.704028490754803e-05} +{"train_loss": 0.012684730812907219, "global_step": 8304, "epoch": 69, "lr": 9.703953392243376e-05} +{"train_loss": 0.008969409391283989, "global_step": 8305, "epoch": 69, "lr": 9.70387828449624e-05} +{"train_loss": 0.0131813520565629, "global_step": 8306, "epoch": 69, "lr": 9.70380316751354e-05} +{"train_loss": 0.014626500196754932, "global_step": 8307, "epoch": 69, "lr": 9.703728041295426e-05} +{"train_loss": 0.012658107094466686, "global_step": 8308, "epoch": 69, "lr": 9.703652905842044e-05} +{"train_loss": 0.00853902380913496, "global_step": 8309, "epoch": 69, "lr": 9.703577761153542e-05} +{"train_loss": 0.013653923757374287, "global_step": 8310, "epoch": 69, "lr": 9.703502607230069e-05} +{"train_loss": 0.009383419528603554, "global_step": 8311, "epoch": 69, "lr": 9.703427444071769e-05} +{"train_loss": 0.011905747465789318, "global_step": 8312, "epoch": 69, "lr": 9.703352271678792e-05} +{"train_loss": 0.008500069379806519, "global_step": 8313, "epoch": 69, "lr": 9.703277090051287e-05} +{"train_loss": 0.010782811790704727, "global_step": 8314, "epoch": 69, "lr": 9.703201899189398e-05} +{"train_loss": 0.010869724676012993, "global_step": 8315, "epoch": 69, "lr": 9.703126699093277e-05} +{"train_loss": 0.011812668293714523, "global_step": 8316, "epoch": 69, "lr": 9.703051489763066e-05} +{"train_loss": 0.009187269024550915, "global_step": 8317, "epoch": 69, "lr": 9.702976271198918e-05} +{"train_loss": 0.01377440057694912, "global_step": 8318, "epoch": 69, "lr": 9.702901043400978e-05} +{"train_loss": 0.012582896277308464, "global_step": 8319, "epoch": 69, "lr": 9.702825806369394e-05} +{"train_loss": 0.013801639899611473, "global_step": 8320, "epoch": 69, "lr": 9.702750560104315e-05} +{"train_loss": 0.01461938489228487, "global_step": 8321, "epoch": 69, "lr": 9.702675304605886e-05} +{"train_loss": 0.010056528262794018, "global_step": 8322, "epoch": 69, "lr": 9.702600039874258e-05} +{"train_loss": 0.007407451514154673, "global_step": 8323, "epoch": 69, "lr": 9.702524765909576e-05} +{"train_loss": 0.008497589267790318, "global_step": 8324, "epoch": 69, "lr": 9.70244948271199e-05} +{"train_loss": 0.00833290908485651, "global_step": 8325, "epoch": 69, "lr": 9.702374190281647e-05} +{"train_loss": 0.015574796125292778, "global_step": 8326, "epoch": 69, "lr": 9.702298888618693e-05} +{"train_loss": 0.016436215490102768, "global_step": 8327, "epoch": 69, "lr": 9.702223577723279e-05} +{"train_loss": 0.009756944142282009, "global_step": 8328, "epoch": 69, "lr": 9.70214825759555e-05} +{"train_loss": 0.01185202958187511, "global_step": 8329, "epoch": 69, "lr": 9.702072928235657e-05, "val_loss": 0.02232266403734684} +{"train_loss": 0.011374550871551037, "global_step": 8330, "epoch": 70, "lr": 9.701997589643746e-05} +{"train_loss": 0.007916059345006943, "global_step": 8331, "epoch": 70, "lr": 9.701922241819964e-05} +{"train_loss": 0.015687022358179092, "global_step": 8332, "epoch": 70, "lr": 9.70184688476446e-05} +{"train_loss": 0.013975473120808601, "global_step": 8333, "epoch": 70, "lr": 9.701771518477381e-05} +{"train_loss": 0.010798578150570393, "global_step": 8334, "epoch": 70, "lr": 9.701696142958878e-05} +{"train_loss": 0.010248413309454918, "global_step": 8335, "epoch": 70, "lr": 9.701620758209096e-05} +{"train_loss": 0.013278764672577381, "global_step": 8336, "epoch": 70, "lr": 9.701545364228184e-05} +{"train_loss": 0.007312391884624958, "global_step": 8337, "epoch": 70, "lr": 9.70146996101629e-05} +{"train_loss": 0.011986472643911839, "global_step": 8338, "epoch": 70, "lr": 9.701394548573563e-05} +{"train_loss": 0.011718722991645336, "global_step": 8339, "epoch": 70, "lr": 9.701319126900148e-05} +{"train_loss": 0.011238873936235905, "global_step": 8340, "epoch": 70, "lr": 9.701243695996196e-05} +{"train_loss": 0.00978445541113615, "global_step": 8341, "epoch": 70, "lr": 9.701168255861855e-05} +{"train_loss": 0.009523470886051655, "global_step": 8342, "epoch": 70, "lr": 9.701092806497271e-05} +{"train_loss": 0.012925163842737675, "global_step": 8343, "epoch": 70, "lr": 9.701017347902595e-05} +{"train_loss": 0.010910396464169025, "global_step": 8344, "epoch": 70, "lr": 9.700941880077973e-05} +{"train_loss": 0.008323504589498043, "global_step": 8345, "epoch": 70, "lr": 9.700866403023555e-05} +{"train_loss": 0.011398720555007458, "global_step": 8346, "epoch": 70, "lr": 9.700790916739487e-05} +{"train_loss": 0.010308995842933655, "global_step": 8347, "epoch": 70, "lr": 9.700715421225917e-05} +{"train_loss": 0.010456722229719162, "global_step": 8348, "epoch": 70, "lr": 9.700639916482996e-05} +{"train_loss": 0.012848704122006893, "global_step": 8349, "epoch": 70, "lr": 9.700564402510871e-05} +{"train_loss": 0.012968305498361588, "global_step": 8350, "epoch": 70, "lr": 9.70048887930969e-05} +{"train_loss": 0.00784832239151001, "global_step": 8351, "epoch": 70, "lr": 9.7004133468796e-05} +{"train_loss": 0.010301465168595314, "global_step": 8352, "epoch": 70, "lr": 9.700337805220752e-05} +{"train_loss": 0.013201426714658737, "global_step": 8353, "epoch": 70, "lr": 9.700262254333291e-05} +{"train_loss": 0.016743648797273636, "global_step": 8354, "epoch": 70, "lr": 9.700186694217368e-05} +{"train_loss": 0.011327649466693401, "global_step": 8355, "epoch": 70, "lr": 9.700111124873131e-05} +{"train_loss": 0.014667997136712074, "global_step": 8356, "epoch": 70, "lr": 9.700035546300728e-05} +{"train_loss": 0.01337958499789238, "global_step": 8357, "epoch": 70, "lr": 9.699959958500306e-05} +{"train_loss": 0.012430856004357338, "global_step": 8358, "epoch": 70, "lr": 9.699884361472016e-05} +{"train_loss": 0.011849816888570786, "global_step": 8359, "epoch": 70, "lr": 9.699808755216007e-05} +{"train_loss": 0.011911329813301563, "global_step": 8360, "epoch": 70, "lr": 9.699733139732423e-05} +{"train_loss": 0.01744234375655651, "global_step": 8361, "epoch": 70, "lr": 9.699657515021415e-05} +{"train_loss": 0.012416132725775242, "global_step": 8362, "epoch": 70, "lr": 9.699581881083133e-05} +{"train_loss": 0.008923151530325413, "global_step": 8363, "epoch": 70, "lr": 9.699506237917724e-05} +{"train_loss": 0.013045068830251694, "global_step": 8364, "epoch": 70, "lr": 9.699430585525336e-05} +{"train_loss": 0.01154958177357912, "global_step": 8365, "epoch": 70, "lr": 9.699354923906117e-05} +{"train_loss": 0.011959646828472614, "global_step": 8366, "epoch": 70, "lr": 9.699279253060219e-05} +{"train_loss": 0.012438380159437656, "global_step": 8367, "epoch": 70, "lr": 9.699203572987785e-05} +{"train_loss": 0.008132480084896088, "global_step": 8368, "epoch": 70, "lr": 9.69912788368897e-05} +{"train_loss": 0.011417601257562637, "global_step": 8369, "epoch": 70, "lr": 9.699052185163918e-05} +{"train_loss": 0.01053258404135704, "global_step": 8370, "epoch": 70, "lr": 9.698976477412778e-05} +{"train_loss": 0.008457347750663757, "global_step": 8371, "epoch": 70, "lr": 9.6989007604357e-05} +{"train_loss": 0.009359230287373066, "global_step": 8372, "epoch": 70, "lr": 9.698825034232834e-05} +{"train_loss": 0.008639789186418056, "global_step": 8373, "epoch": 70, "lr": 9.698749298804328e-05} +{"train_loss": 0.011567790061235428, "global_step": 8374, "epoch": 70, "lr": 9.698673554150327e-05} +{"train_loss": 0.013817165978252888, "global_step": 8375, "epoch": 70, "lr": 9.698597800270983e-05} +{"train_loss": 0.0076819853857159615, "global_step": 8376, "epoch": 70, "lr": 9.698522037166445e-05} +{"train_loss": 0.009377269074320793, "global_step": 8377, "epoch": 70, "lr": 9.69844626483686e-05} +{"train_loss": 0.00858356524258852, "global_step": 8378, "epoch": 70, "lr": 9.69837048328238e-05} +{"train_loss": 0.011674413457512856, "global_step": 8379, "epoch": 70, "lr": 9.69829469250315e-05} +{"train_loss": 0.008969901129603386, "global_step": 8380, "epoch": 70, "lr": 9.698218892499319e-05} +{"train_loss": 0.010918596759438515, "global_step": 8381, "epoch": 70, "lr": 9.698143083271038e-05} +{"train_loss": 0.007743356749415398, "global_step": 8382, "epoch": 70, "lr": 9.698067264818456e-05} +{"train_loss": 0.014233153313398361, "global_step": 8383, "epoch": 70, "lr": 9.69799143714172e-05} +{"train_loss": 0.011133373714983463, "global_step": 8384, "epoch": 70, "lr": 9.697915600240978e-05} +{"train_loss": 0.011339525692164898, "global_step": 8385, "epoch": 70, "lr": 9.697839754116384e-05} +{"train_loss": 0.012028737924993038, "global_step": 8386, "epoch": 70, "lr": 9.697763898768082e-05} +{"train_loss": 0.012408846989274025, "global_step": 8387, "epoch": 70, "lr": 9.697688034196221e-05} +{"train_loss": 0.009932052344083786, "global_step": 8388, "epoch": 70, "lr": 9.697612160400954e-05} +{"train_loss": 0.009191390126943588, "global_step": 8389, "epoch": 70, "lr": 9.697536277382426e-05} +{"train_loss": 0.011660193093121052, "global_step": 8390, "epoch": 70, "lr": 9.697460385140789e-05} +{"train_loss": 0.00879519060254097, "global_step": 8391, "epoch": 70, "lr": 9.697384483676189e-05} +{"train_loss": 0.009601926431059837, "global_step": 8392, "epoch": 70, "lr": 9.697308572988774e-05} +{"train_loss": 0.011004189029335976, "global_step": 8393, "epoch": 70, "lr": 9.697232653078698e-05} +{"train_loss": 0.011385458521544933, "global_step": 8394, "epoch": 70, "lr": 9.697156723946108e-05} +{"train_loss": 0.010622827336192131, "global_step": 8395, "epoch": 70, "lr": 9.697080785591152e-05} +{"train_loss": 0.004195963032543659, "global_step": 8396, "epoch": 70, "lr": 9.69700483801398e-05} +{"train_loss": 0.011471977457404137, "global_step": 8397, "epoch": 70, "lr": 9.69692888121474e-05} +{"train_loss": 0.011117265559732914, "global_step": 8398, "epoch": 70, "lr": 9.696852915193582e-05} +{"train_loss": 0.012683792039752007, "global_step": 8399, "epoch": 70, "lr": 9.696776939950656e-05} +{"train_loss": 0.012393764220178127, "global_step": 8400, "epoch": 70, "lr": 9.69670095548611e-05} +{"train_loss": 0.016120927408337593, "global_step": 8401, "epoch": 70, "lr": 9.696624961800093e-05} +{"train_loss": 0.013667557388544083, "global_step": 8402, "epoch": 70, "lr": 9.696548958892755e-05} +{"train_loss": 0.013031461276113987, "global_step": 8403, "epoch": 70, "lr": 9.696472946764245e-05} +{"train_loss": 0.010729068890213966, "global_step": 8404, "epoch": 70, "lr": 9.696396925414712e-05} +{"train_loss": 0.01206183061003685, "global_step": 8405, "epoch": 70, "lr": 9.696320894844303e-05} +{"train_loss": 0.013947580941021442, "global_step": 8406, "epoch": 70, "lr": 9.696244855053173e-05} +{"train_loss": 0.0118938023224473, "global_step": 8407, "epoch": 70, "lr": 9.696168806041468e-05} +{"train_loss": 0.01638878509402275, "global_step": 8408, "epoch": 70, "lr": 9.696092747809336e-05} +{"train_loss": 0.01147350762039423, "global_step": 8409, "epoch": 70, "lr": 9.696016680356927e-05} +{"train_loss": 0.012443970888853073, "global_step": 8410, "epoch": 70, "lr": 9.695940603684391e-05} +{"train_loss": 0.009741333313286304, "global_step": 8411, "epoch": 70, "lr": 9.695864517791878e-05} +{"train_loss": 0.007730846293270588, "global_step": 8412, "epoch": 70, "lr": 9.695788422679537e-05} +{"train_loss": 0.009664489887654781, "global_step": 8413, "epoch": 70, "lr": 9.695712318347517e-05} +{"train_loss": 0.010659067891538143, "global_step": 8414, "epoch": 70, "lr": 9.695636204795966e-05} +{"train_loss": 0.01198657788336277, "global_step": 8415, "epoch": 70, "lr": 9.695560082025037e-05} +{"train_loss": 0.010060238651931286, "global_step": 8416, "epoch": 70, "lr": 9.695483950034876e-05} +{"train_loss": 0.010535427369177341, "global_step": 8417, "epoch": 70, "lr": 9.695407808825635e-05} +{"train_loss": 0.009650006890296936, "global_step": 8418, "epoch": 70, "lr": 9.695331658397462e-05} +{"train_loss": 0.018012767657637596, "global_step": 8419, "epoch": 70, "lr": 9.695255498750507e-05} +{"train_loss": 0.011839540675282478, "global_step": 8420, "epoch": 70, "lr": 9.695179329884918e-05} +{"train_loss": 0.009478534571826458, "global_step": 8421, "epoch": 70, "lr": 9.695103151800849e-05} +{"train_loss": 0.009143780916929245, "global_step": 8422, "epoch": 70, "lr": 9.695026964498444e-05} +{"train_loss": 0.01700568199157715, "global_step": 8423, "epoch": 70, "lr": 9.694950767977856e-05} +{"train_loss": 0.008761373348534107, "global_step": 8424, "epoch": 70, "lr": 9.694874562239233e-05} +{"train_loss": 0.01243884302675724, "global_step": 8425, "epoch": 70, "lr": 9.694798347282727e-05} +{"train_loss": 0.012064485810697079, "global_step": 8426, "epoch": 70, "lr": 9.694722123108483e-05} +{"train_loss": 0.009381454437971115, "global_step": 8427, "epoch": 70, "lr": 9.694645889716658e-05} +{"train_loss": 0.01353977620601654, "global_step": 8428, "epoch": 70, "lr": 9.694569647107394e-05} +{"train_loss": 0.010077622719109058, "global_step": 8429, "epoch": 70, "lr": 9.694493395280845e-05} +{"train_loss": 0.014285366982221603, "global_step": 8430, "epoch": 70, "lr": 9.69441713423716e-05} +{"train_loss": 0.014207986183464527, "global_step": 8431, "epoch": 70, "lr": 9.694340863976489e-05} +{"train_loss": 0.018143227323889732, "global_step": 8432, "epoch": 70, "lr": 9.69426458449898e-05} +{"train_loss": 0.01165167335420847, "global_step": 8433, "epoch": 70, "lr": 9.694188295804784e-05} +{"train_loss": 0.008951164782047272, "global_step": 8434, "epoch": 70, "lr": 9.694111997894053e-05} +{"train_loss": 0.00960918515920639, "global_step": 8435, "epoch": 70, "lr": 9.694035690766932e-05} +{"train_loss": 0.01464957743883133, "global_step": 8436, "epoch": 70, "lr": 9.693959374423574e-05} +{"train_loss": 0.009498359635472298, "global_step": 8437, "epoch": 70, "lr": 9.69388304886413e-05} +{"train_loss": 0.013608117587864399, "global_step": 8438, "epoch": 70, "lr": 9.693806714088747e-05} +{"train_loss": 0.009194975718855858, "global_step": 8439, "epoch": 70, "lr": 9.693730370097574e-05} +{"train_loss": 0.009872515685856342, "global_step": 8440, "epoch": 70, "lr": 9.693654016890766e-05} +{"train_loss": 0.008209736086428165, "global_step": 8441, "epoch": 70, "lr": 9.693577654468468e-05} +{"train_loss": 0.011698564514517784, "global_step": 8442, "epoch": 70, "lr": 9.693501282830831e-05} +{"train_loss": 0.01906014233827591, "global_step": 8443, "epoch": 70, "lr": 9.693424901978007e-05} +{"train_loss": 0.00943119265139103, "global_step": 8444, "epoch": 70, "lr": 9.693348511910145e-05} +{"train_loss": 0.007968883961439133, "global_step": 8445, "epoch": 70, "lr": 9.693272112627394e-05} +{"train_loss": 0.00828753225505352, "global_step": 8446, "epoch": 70, "lr": 9.693195704129904e-05} +{"train_loss": 0.011885962449014187, "global_step": 8447, "epoch": 70, "lr": 9.693119286417827e-05} +{"train_loss": 0.011360143694807501, "global_step": 8448, "epoch": 70, "lr": 9.693042859491311e-05, "val_loss": 0.017773382365703583, "train_action_mse_error": 0.0005117133259773254} +{"train_loss": 0.011356992647051811, "global_step": 8449, "epoch": 71, "lr": 9.692966423350505e-05} +{"train_loss": 0.012723135761916637, "global_step": 8450, "epoch": 71, "lr": 9.692889977995563e-05} +{"train_loss": 0.011557960882782936, "global_step": 8451, "epoch": 71, "lr": 9.692813523426632e-05} +{"train_loss": 0.012255305424332619, "global_step": 8452, "epoch": 71, "lr": 9.692737059643864e-05} +{"train_loss": 0.012557143345475197, "global_step": 8453, "epoch": 71, "lr": 9.692660586647407e-05} +{"train_loss": 0.008755892515182495, "global_step": 8454, "epoch": 71, "lr": 9.692584104437412e-05} +{"train_loss": 0.012737116776406765, "global_step": 8455, "epoch": 71, "lr": 9.69250761301403e-05} +{"train_loss": 0.014377767220139503, "global_step": 8456, "epoch": 71, "lr": 9.692431112377412e-05} +{"train_loss": 0.009485162794589996, "global_step": 8457, "epoch": 71, "lr": 9.692354602527704e-05} +{"train_loss": 0.008447442203760147, "global_step": 8458, "epoch": 71, "lr": 9.69227808346506e-05} +{"train_loss": 0.008243989199399948, "global_step": 8459, "epoch": 71, "lr": 9.692201555189631e-05} +{"train_loss": 0.01007295586168766, "global_step": 8460, "epoch": 71, "lr": 9.692125017701565e-05} +{"train_loss": 0.009373298846185207, "global_step": 8461, "epoch": 71, "lr": 9.692048471001011e-05} +{"train_loss": 0.012956633232533932, "global_step": 8462, "epoch": 71, "lr": 9.691971915088123e-05} +{"train_loss": 0.013118554838001728, "global_step": 8463, "epoch": 71, "lr": 9.69189534996305e-05} +{"train_loss": 0.006279626861214638, "global_step": 8464, "epoch": 71, "lr": 9.691818775625939e-05} +{"train_loss": 0.011747925542294979, "global_step": 8465, "epoch": 71, "lr": 9.691742192076945e-05} +{"train_loss": 0.010351277887821198, "global_step": 8466, "epoch": 71, "lr": 9.691665599316215e-05} +{"train_loss": 0.013481960631906986, "global_step": 8467, "epoch": 71, "lr": 9.691588997343902e-05} +{"train_loss": 0.0135330306366086, "global_step": 8468, "epoch": 71, "lr": 9.691512386160155e-05} +{"train_loss": 0.012804226018488407, "global_step": 8469, "epoch": 71, "lr": 9.691435765765124e-05} +{"train_loss": 0.01110532321035862, "global_step": 8470, "epoch": 71, "lr": 9.691359136158962e-05} +{"train_loss": 0.008077236823737621, "global_step": 8471, "epoch": 71, "lr": 9.691282497341816e-05} +{"train_loss": 0.011559100821614265, "global_step": 8472, "epoch": 71, "lr": 9.691205849313838e-05} +{"train_loss": 0.015326408669352531, "global_step": 8473, "epoch": 71, "lr": 9.69112919207518e-05} +{"train_loss": 0.008875335566699505, "global_step": 8474, "epoch": 71, "lr": 9.691052525625989e-05} +{"train_loss": 0.01258271373808384, "global_step": 8475, "epoch": 71, "lr": 9.690975849966418e-05} +{"train_loss": 0.008383860811591148, "global_step": 8476, "epoch": 71, "lr": 9.690899165096618e-05} +{"train_loss": 0.007679237984120846, "global_step": 8477, "epoch": 71, "lr": 9.690822471016737e-05} +{"train_loss": 0.008602963760495186, "global_step": 8478, "epoch": 71, "lr": 9.690745767726929e-05} +{"train_loss": 0.00698115723207593, "global_step": 8479, "epoch": 71, "lr": 9.690669055227341e-05} +{"train_loss": 0.012681229040026665, "global_step": 8480, "epoch": 71, "lr": 9.690592333518127e-05} +{"train_loss": 0.012445556931197643, "global_step": 8481, "epoch": 71, "lr": 9.690515602599437e-05} +{"train_loss": 0.008216827176511288, "global_step": 8482, "epoch": 71, "lr": 9.690438862471418e-05} +{"train_loss": 0.010289866477251053, "global_step": 8483, "epoch": 71, "lr": 9.690362113134225e-05} +{"train_loss": 0.010918407700955868, "global_step": 8484, "epoch": 71, "lr": 9.690285354588007e-05} +{"train_loss": 0.006449313834309578, "global_step": 8485, "epoch": 71, "lr": 9.690208586832915e-05} +{"train_loss": 0.008140084333717823, "global_step": 8486, "epoch": 71, "lr": 9.690131809869098e-05} +{"train_loss": 0.01075960323214531, "global_step": 8487, "epoch": 71, "lr": 9.69005502369671e-05} +{"train_loss": 0.010267246514558792, "global_step": 8488, "epoch": 71, "lr": 9.6899782283159e-05} +{"train_loss": 0.01018193643540144, "global_step": 8489, "epoch": 71, "lr": 9.689901423726817e-05} +{"train_loss": 0.008784759789705276, "global_step": 8490, "epoch": 71, "lr": 9.689824609929614e-05} +{"train_loss": 0.008741697296500206, "global_step": 8491, "epoch": 71, "lr": 9.689747786924444e-05} +{"train_loss": 0.010652834549546242, "global_step": 8492, "epoch": 71, "lr": 9.689670954711452e-05} +{"train_loss": 0.00877616461366415, "global_step": 8493, "epoch": 71, "lr": 9.689594113290795e-05} +{"train_loss": 0.01752299629151821, "global_step": 8494, "epoch": 71, "lr": 9.689517262662617e-05} +{"train_loss": 0.010843048803508282, "global_step": 8495, "epoch": 71, "lr": 9.689440402827077e-05} +{"train_loss": 0.009961917996406555, "global_step": 8496, "epoch": 71, "lr": 9.689363533784319e-05} +{"train_loss": 0.007064176257699728, "global_step": 8497, "epoch": 71, "lr": 9.689286655534498e-05} +{"train_loss": 0.01239113137125969, "global_step": 8498, "epoch": 71, "lr": 9.689209768077764e-05} +{"train_loss": 0.009682873263955116, "global_step": 8499, "epoch": 71, "lr": 9.689132871414266e-05} +{"train_loss": 0.012557100504636765, "global_step": 8500, "epoch": 71, "lr": 9.689055965544158e-05} +{"train_loss": 0.013791954144835472, "global_step": 8501, "epoch": 71, "lr": 9.688979050467589e-05} +{"train_loss": 0.008764715865254402, "global_step": 8502, "epoch": 71, "lr": 9.688902126184711e-05} +{"train_loss": 0.007538247853517532, "global_step": 8503, "epoch": 71, "lr": 9.688825192695674e-05} +{"train_loss": 0.008618100546300411, "global_step": 8504, "epoch": 71, "lr": 9.68874825000063e-05} +{"train_loss": 0.01089037861675024, "global_step": 8505, "epoch": 71, "lr": 9.68867129809973e-05} +{"train_loss": 0.007827243767678738, "global_step": 8506, "epoch": 71, "lr": 9.688594336993124e-05} +{"train_loss": 0.011817870661616325, "global_step": 8507, "epoch": 71, "lr": 9.688517366680964e-05} +{"train_loss": 0.009859186597168446, "global_step": 8508, "epoch": 71, "lr": 9.688440387163403e-05} +{"train_loss": 0.011176575906574726, "global_step": 8509, "epoch": 71, "lr": 9.688363398440588e-05} +{"train_loss": 0.006612048018723726, "global_step": 8510, "epoch": 71, "lr": 9.688286400512673e-05} +{"train_loss": 0.006459287367761135, "global_step": 8511, "epoch": 71, "lr": 9.688209393379808e-05} +{"train_loss": 0.014291594736278057, "global_step": 8512, "epoch": 71, "lr": 9.688132377042147e-05} +{"train_loss": 0.010273166000843048, "global_step": 8513, "epoch": 71, "lr": 9.688055351499836e-05} +{"train_loss": 0.008594565093517303, "global_step": 8514, "epoch": 71, "lr": 9.68797831675303e-05} +{"train_loss": 0.007658706977963448, "global_step": 8515, "epoch": 71, "lr": 9.68790127280188e-05} +{"train_loss": 0.011958969756960869, "global_step": 8516, "epoch": 71, "lr": 9.687824219646537e-05} +{"train_loss": 0.012543399818241596, "global_step": 8517, "epoch": 71, "lr": 9.68774715728715e-05} +{"train_loss": 0.00749981077387929, "global_step": 8518, "epoch": 71, "lr": 9.687670085723874e-05} +{"train_loss": 0.009558355435729027, "global_step": 8519, "epoch": 71, "lr": 9.687593004956859e-05} +{"train_loss": 0.007501280400902033, "global_step": 8520, "epoch": 71, "lr": 9.687515914986254e-05} +{"train_loss": 0.010588880628347397, "global_step": 8521, "epoch": 71, "lr": 9.687438815812215e-05} +{"train_loss": 0.007294998038560152, "global_step": 8522, "epoch": 71, "lr": 9.687361707434889e-05} +{"train_loss": 0.015051783993840218, "global_step": 8523, "epoch": 71, "lr": 9.687284589854429e-05} +{"train_loss": 0.011221598833799362, "global_step": 8524, "epoch": 71, "lr": 9.687207463070986e-05} +{"train_loss": 0.007030653301626444, "global_step": 8525, "epoch": 71, "lr": 9.687130327084713e-05} +{"train_loss": 0.012817920185625553, "global_step": 8526, "epoch": 71, "lr": 9.68705318189576e-05} +{"train_loss": 0.008126108907163143, "global_step": 8527, "epoch": 71, "lr": 9.686976027504279e-05} +{"train_loss": 0.0071326615288853645, "global_step": 8528, "epoch": 71, "lr": 9.686898863910421e-05} +{"train_loss": 0.013649185188114643, "global_step": 8529, "epoch": 71, "lr": 9.686821691114338e-05} +{"train_loss": 0.012267423793673515, "global_step": 8530, "epoch": 71, "lr": 9.686744509116181e-05} +{"train_loss": 0.00956551730632782, "global_step": 8531, "epoch": 71, "lr": 9.686667317916102e-05} +{"train_loss": 0.007377917878329754, "global_step": 8532, "epoch": 71, "lr": 9.686590117514251e-05} +{"train_loss": 0.007902438752353191, "global_step": 8533, "epoch": 71, "lr": 9.686512907910784e-05} +{"train_loss": 0.014145758002996445, "global_step": 8534, "epoch": 71, "lr": 9.686435689105848e-05} +{"train_loss": 0.00920194387435913, "global_step": 8535, "epoch": 71, "lr": 9.686358461099596e-05} +{"train_loss": 0.01583387702703476, "global_step": 8536, "epoch": 71, "lr": 9.68628122389218e-05} +{"train_loss": 0.014924618415534496, "global_step": 8537, "epoch": 71, "lr": 9.686203977483753e-05} +{"train_loss": 0.01047649048268795, "global_step": 8538, "epoch": 71, "lr": 9.686126721874463e-05} +{"train_loss": 0.012696060352027416, "global_step": 8539, "epoch": 71, "lr": 9.686049457064463e-05} +{"train_loss": 0.01390183437615633, "global_step": 8540, "epoch": 71, "lr": 9.685972183053907e-05} +{"train_loss": 0.009834196418523788, "global_step": 8541, "epoch": 71, "lr": 9.685894899842945e-05} +{"train_loss": 0.012872898951172829, "global_step": 8542, "epoch": 71, "lr": 9.68581760743173e-05} +{"train_loss": 0.01339813694357872, "global_step": 8543, "epoch": 71, "lr": 9.685740305820412e-05} +{"train_loss": 0.012956063263118267, "global_step": 8544, "epoch": 71, "lr": 9.685662995009144e-05} +{"train_loss": 0.010764642618596554, "global_step": 8545, "epoch": 71, "lr": 9.685585674998077e-05} +{"train_loss": 0.01280304603278637, "global_step": 8546, "epoch": 71, "lr": 9.685508345787362e-05} +{"train_loss": 0.015642328187823296, "global_step": 8547, "epoch": 71, "lr": 9.685431007377153e-05} +{"train_loss": 0.008460051380097866, "global_step": 8548, "epoch": 71, "lr": 9.6853536597676e-05} +{"train_loss": 0.009683904238045216, "global_step": 8549, "epoch": 71, "lr": 9.685276302958857e-05} +{"train_loss": 0.013088780455291271, "global_step": 8550, "epoch": 71, "lr": 9.685198936951073e-05} +{"train_loss": 0.010450429283082485, "global_step": 8551, "epoch": 71, "lr": 9.685121561744402e-05} +{"train_loss": 0.013266066089272499, "global_step": 8552, "epoch": 71, "lr": 9.685044177338996e-05} +{"train_loss": 0.012856034561991692, "global_step": 8553, "epoch": 71, "lr": 9.684966783735006e-05} +{"train_loss": 0.009063626639544964, "global_step": 8554, "epoch": 71, "lr": 9.684889380932583e-05} +{"train_loss": 0.007916625589132309, "global_step": 8555, "epoch": 71, "lr": 9.684811968931882e-05} +{"train_loss": 0.010075186379253864, "global_step": 8556, "epoch": 71, "lr": 9.684734547733052e-05} +{"train_loss": 0.014876598492264748, "global_step": 8557, "epoch": 71, "lr": 9.684657117336246e-05} +{"train_loss": 0.013841865584254265, "global_step": 8558, "epoch": 71, "lr": 9.684579677741619e-05} +{"train_loss": 0.011120880953967571, "global_step": 8559, "epoch": 71, "lr": 9.684502228949317e-05} +{"train_loss": 0.009908108040690422, "global_step": 8560, "epoch": 71, "lr": 9.684424770959497e-05} +{"train_loss": 0.00829132366925478, "global_step": 8561, "epoch": 71, "lr": 9.684347303772308e-05} +{"train_loss": 0.0069892569445073605, "global_step": 8562, "epoch": 71, "lr": 9.684269827387905e-05} +{"train_loss": 0.010660139843821526, "global_step": 8563, "epoch": 71, "lr": 9.684192341806437e-05} +{"train_loss": 0.011077114380896091, "global_step": 8564, "epoch": 71, "lr": 9.68411484702806e-05} +{"train_loss": 0.013887199573218822, "global_step": 8565, "epoch": 71, "lr": 9.684037343052923e-05} +{"train_loss": 0.014109043404459953, "global_step": 8566, "epoch": 71, "lr": 9.683959829881178e-05} +{"train_loss": 0.010705082857308267, "global_step": 8567, "epoch": 71, "lr": 9.683882307512979e-05, "val_loss": 0.017512738704681396} +{"train_loss": 0.009899644181132317, "global_step": 8568, "epoch": 72, "lr": 9.683804775948477e-05} +{"train_loss": 0.013850914314389229, "global_step": 8569, "epoch": 72, "lr": 9.683727235187825e-05} +{"train_loss": 0.007990199141204357, "global_step": 8570, "epoch": 72, "lr": 9.683649685231177e-05} +{"train_loss": 0.0080431392416358, "global_step": 8571, "epoch": 72, "lr": 9.683572126078682e-05} +{"train_loss": 0.01016094721853733, "global_step": 8572, "epoch": 72, "lr": 9.683494557730492e-05} +{"train_loss": 0.011708811856806278, "global_step": 8573, "epoch": 72, "lr": 9.683416980186761e-05} +{"train_loss": 0.009187374264001846, "global_step": 8574, "epoch": 72, "lr": 9.683339393447643e-05} +{"train_loss": 0.012386205606162548, "global_step": 8575, "epoch": 72, "lr": 9.683261797513288e-05} +{"train_loss": 0.008586197160184383, "global_step": 8576, "epoch": 72, "lr": 9.683184192383848e-05} +{"train_loss": 0.009412596933543682, "global_step": 8577, "epoch": 72, "lr": 9.683106578059475e-05} +{"train_loss": 0.01188961137086153, "global_step": 8578, "epoch": 72, "lr": 9.683028954540326e-05} +{"train_loss": 0.012681742198765278, "global_step": 8579, "epoch": 72, "lr": 9.682951321826546e-05} +{"train_loss": 0.00959083903580904, "global_step": 8580, "epoch": 72, "lr": 9.682873679918293e-05} +{"train_loss": 0.012886153534054756, "global_step": 8581, "epoch": 72, "lr": 9.682796028815718e-05} +{"train_loss": 0.009844410233199596, "global_step": 8582, "epoch": 72, "lr": 9.682718368518974e-05} +{"train_loss": 0.008573216386139393, "global_step": 8583, "epoch": 72, "lr": 9.682640699028212e-05} +{"train_loss": 0.014032742008566856, "global_step": 8584, "epoch": 72, "lr": 9.682563020343585e-05} +{"train_loss": 0.011605849489569664, "global_step": 8585, "epoch": 72, "lr": 9.682485332465245e-05} +{"train_loss": 0.015625959262251854, "global_step": 8586, "epoch": 72, "lr": 9.682407635393346e-05} +{"train_loss": 0.0067646559327840805, "global_step": 8587, "epoch": 72, "lr": 9.682329929128042e-05} +{"train_loss": 0.01060426700860262, "global_step": 8588, "epoch": 72, "lr": 9.682252213669482e-05} +{"train_loss": 0.009440264664590359, "global_step": 8589, "epoch": 72, "lr": 9.682174489017819e-05} +{"train_loss": 0.00952349603176117, "global_step": 8590, "epoch": 72, "lr": 9.682096755173206e-05} +{"train_loss": 0.008134367875754833, "global_step": 8591, "epoch": 72, "lr": 9.682019012135799e-05} +{"train_loss": 0.014195030555129051, "global_step": 8592, "epoch": 72, "lr": 9.681941259905745e-05} +{"train_loss": 0.009057609364390373, "global_step": 8593, "epoch": 72, "lr": 9.681863498483202e-05} +{"train_loss": 0.010757223702967167, "global_step": 8594, "epoch": 72, "lr": 9.681785727868319e-05} +{"train_loss": 0.010495929047465324, "global_step": 8595, "epoch": 72, "lr": 9.68170794806125e-05} +{"train_loss": 0.009835762903094292, "global_step": 8596, "epoch": 72, "lr": 9.681630159062147e-05} +{"train_loss": 0.011653843335807323, "global_step": 8597, "epoch": 72, "lr": 9.681552360871165e-05} +{"train_loss": 0.014177260920405388, "global_step": 8598, "epoch": 72, "lr": 9.681474553488453e-05} +{"train_loss": 0.008621731773018837, "global_step": 8599, "epoch": 72, "lr": 9.681396736914168e-05} +{"train_loss": 0.013443569652736187, "global_step": 8600, "epoch": 72, "lr": 9.681318911148458e-05} +{"train_loss": 0.010279016569256783, "global_step": 8601, "epoch": 72, "lr": 9.68124107619148e-05} +{"train_loss": 0.011738118715584278, "global_step": 8602, "epoch": 72, "lr": 9.681163232043387e-05} +{"train_loss": 0.01289952453225851, "global_step": 8603, "epoch": 72, "lr": 9.681085378704326e-05} +{"train_loss": 0.008195473812520504, "global_step": 8604, "epoch": 72, "lr": 9.681007516174457e-05} +{"train_loss": 0.010656077414751053, "global_step": 8605, "epoch": 72, "lr": 9.680929644453929e-05} +{"train_loss": 0.011181541718542576, "global_step": 8606, "epoch": 72, "lr": 9.680851763542896e-05} +{"train_loss": 0.013031190261244774, "global_step": 8607, "epoch": 72, "lr": 9.680773873441511e-05} +{"train_loss": 0.008469855412840843, "global_step": 8608, "epoch": 72, "lr": 9.680695974149925e-05} +{"train_loss": 0.010535502806305885, "global_step": 8609, "epoch": 72, "lr": 9.680618065668294e-05} +{"train_loss": 0.01004360057413578, "global_step": 8610, "epoch": 72, "lr": 9.68054014799677e-05} +{"train_loss": 0.008890531025826931, "global_step": 8611, "epoch": 72, "lr": 9.680462221135505e-05} +{"train_loss": 0.010489976033568382, "global_step": 8612, "epoch": 72, "lr": 9.680384285084652e-05} +{"train_loss": 0.01241208054125309, "global_step": 8613, "epoch": 72, "lr": 9.680306339844363e-05} +{"train_loss": 0.011575558222830296, "global_step": 8614, "epoch": 72, "lr": 9.680228385414795e-05} +{"train_loss": 0.01057365071028471, "global_step": 8615, "epoch": 72, "lr": 9.680150421796097e-05} +{"train_loss": 0.015681356191635132, "global_step": 8616, "epoch": 72, "lr": 9.680072448988424e-05} +{"train_loss": 0.007655561435967684, "global_step": 8617, "epoch": 72, "lr": 9.679994466991928e-05} +{"train_loss": 0.015286490321159363, "global_step": 8618, "epoch": 72, "lr": 9.679916475806766e-05} +{"train_loss": 0.010711184702813625, "global_step": 8619, "epoch": 72, "lr": 9.679838475433086e-05} +{"train_loss": 0.014778420329093933, "global_step": 8620, "epoch": 72, "lr": 9.679760465871042e-05} +{"train_loss": 0.010846951976418495, "global_step": 8621, "epoch": 72, "lr": 9.679682447120788e-05} +{"train_loss": 0.016407229006290436, "global_step": 8622, "epoch": 72, "lr": 9.67960441918248e-05} +{"train_loss": 0.008786444552242756, "global_step": 8623, "epoch": 72, "lr": 9.679526382056267e-05} +{"train_loss": 0.007683915086090565, "global_step": 8624, "epoch": 72, "lr": 9.679448335742304e-05} +{"train_loss": 0.008539385162293911, "global_step": 8625, "epoch": 72, "lr": 9.679370280240744e-05} +{"train_loss": 0.008954274468123913, "global_step": 8626, "epoch": 72, "lr": 9.679292215551741e-05} +{"train_loss": 0.011819357052445412, "global_step": 8627, "epoch": 72, "lr": 9.679214141675446e-05} +{"train_loss": 0.015417144633829594, "global_step": 8628, "epoch": 72, "lr": 9.679136058612016e-05} +{"train_loss": 0.007281016558408737, "global_step": 8629, "epoch": 72, "lr": 9.679057966361602e-05} +{"train_loss": 0.015587126836180687, "global_step": 8630, "epoch": 72, "lr": 9.678979864924355e-05} +{"train_loss": 0.00831995066255331, "global_step": 8631, "epoch": 72, "lr": 9.678901754300435e-05} +{"train_loss": 0.008651996031403542, "global_step": 8632, "epoch": 72, "lr": 9.678823634489989e-05} +{"train_loss": 0.010605065152049065, "global_step": 8633, "epoch": 72, "lr": 9.678745505493172e-05} +{"train_loss": 0.009202335961163044, "global_step": 8634, "epoch": 72, "lr": 9.678667367310138e-05} +{"train_loss": 0.010997838340699673, "global_step": 8635, "epoch": 72, "lr": 9.678589219941044e-05} +{"train_loss": 0.011987848207354546, "global_step": 8636, "epoch": 72, "lr": 9.678511063386035e-05} +{"train_loss": 0.015087713487446308, "global_step": 8637, "epoch": 72, "lr": 9.678432897645273e-05} +{"train_loss": 0.012245437130331993, "global_step": 8638, "epoch": 72, "lr": 9.678354722718907e-05} +{"train_loss": 0.013995267450809479, "global_step": 8639, "epoch": 72, "lr": 9.67827653860709e-05} +{"train_loss": 0.010717125609517097, "global_step": 8640, "epoch": 72, "lr": 9.678198345309977e-05} +{"train_loss": 0.01207617949694395, "global_step": 8641, "epoch": 72, "lr": 9.678120142827722e-05} +{"train_loss": 0.006602430250495672, "global_step": 8642, "epoch": 72, "lr": 9.678041931160477e-05} +{"train_loss": 0.009875436313450336, "global_step": 8643, "epoch": 72, "lr": 9.677963710308398e-05} +{"train_loss": 0.010992011986672878, "global_step": 8644, "epoch": 72, "lr": 9.677885480271636e-05} +{"train_loss": 0.013520859181880951, "global_step": 8645, "epoch": 72, "lr": 9.677807241050347e-05} +{"train_loss": 0.008035439066588879, "global_step": 8646, "epoch": 72, "lr": 9.677728992644681e-05} +{"train_loss": 0.009720134548842907, "global_step": 8647, "epoch": 72, "lr": 9.677650735054795e-05} +{"train_loss": 0.014009025879204273, "global_step": 8648, "epoch": 72, "lr": 9.677572468280843e-05} +{"train_loss": 0.009203193709254265, "global_step": 8649, "epoch": 72, "lr": 9.677494192322975e-05} +{"train_loss": 0.009668124839663506, "global_step": 8650, "epoch": 72, "lr": 9.677415907181348e-05} +{"train_loss": 0.008158544078469276, "global_step": 8651, "epoch": 72, "lr": 9.677337612856115e-05} +{"train_loss": 0.006879795808345079, "global_step": 8652, "epoch": 72, "lr": 9.677259309347428e-05} +{"train_loss": 0.010089061222970486, "global_step": 8653, "epoch": 72, "lr": 9.677180996655441e-05} +{"train_loss": 0.010999377816915512, "global_step": 8654, "epoch": 72, "lr": 9.677102674780311e-05} +{"train_loss": 0.009499385952949524, "global_step": 8655, "epoch": 72, "lr": 9.677024343722189e-05} +{"train_loss": 0.007194849196821451, "global_step": 8656, "epoch": 72, "lr": 9.676946003481228e-05} +{"train_loss": 0.011269993148744106, "global_step": 8657, "epoch": 72, "lr": 9.676867654057586e-05} +{"train_loss": 0.010998719371855259, "global_step": 8658, "epoch": 72, "lr": 9.676789295451411e-05} +{"train_loss": 0.010864798910915852, "global_step": 8659, "epoch": 72, "lr": 9.676710927662862e-05} +{"train_loss": 0.011484057642519474, "global_step": 8660, "epoch": 72, "lr": 9.67663255069209e-05} +{"train_loss": 0.012157469056546688, "global_step": 8661, "epoch": 72, "lr": 9.676554164539249e-05} +{"train_loss": 0.011676195077598095, "global_step": 8662, "epoch": 72, "lr": 9.676475769204494e-05} +{"train_loss": 0.011517898179590702, "global_step": 8663, "epoch": 72, "lr": 9.676397364687979e-05} +{"train_loss": 0.009819665923714638, "global_step": 8664, "epoch": 72, "lr": 9.676318950989857e-05} +{"train_loss": 0.012491384521126747, "global_step": 8665, "epoch": 72, "lr": 9.676240528110283e-05} +{"train_loss": 0.014819009229540825, "global_step": 8666, "epoch": 72, "lr": 9.676162096049409e-05} +{"train_loss": 0.010030400939285755, "global_step": 8667, "epoch": 72, "lr": 9.676083654807391e-05} +{"train_loss": 0.01139893475919962, "global_step": 8668, "epoch": 72, "lr": 9.676005204384382e-05} +{"train_loss": 0.01570884883403778, "global_step": 8669, "epoch": 72, "lr": 9.675926744780537e-05} +{"train_loss": 0.008310539647936821, "global_step": 8670, "epoch": 72, "lr": 9.675848275996008e-05} +{"train_loss": 0.010520650073885918, "global_step": 8671, "epoch": 72, "lr": 9.675769798030952e-05} +{"train_loss": 0.01363205537199974, "global_step": 8672, "epoch": 72, "lr": 9.67569131088552e-05} +{"train_loss": 0.012680976651608944, "global_step": 8673, "epoch": 72, "lr": 9.675612814559869e-05} +{"train_loss": 0.012471691705286503, "global_step": 8674, "epoch": 72, "lr": 9.675534309054151e-05} +{"train_loss": 0.011943389661610126, "global_step": 8675, "epoch": 72, "lr": 9.675455794368522e-05} +{"train_loss": 0.011026209220290184, "global_step": 8676, "epoch": 72, "lr": 9.675377270503135e-05} +{"train_loss": 0.01160979364067316, "global_step": 8677, "epoch": 72, "lr": 9.675298737458143e-05} +{"train_loss": 0.013651533052325249, "global_step": 8678, "epoch": 72, "lr": 9.675220195233701e-05} +{"train_loss": 0.008483151905238628, "global_step": 8679, "epoch": 72, "lr": 9.675141643829964e-05} +{"train_loss": 0.01139592844992876, "global_step": 8680, "epoch": 72, "lr": 9.675063083247086e-05} +{"train_loss": 0.009808744303882122, "global_step": 8681, "epoch": 72, "lr": 9.674984513485222e-05} +{"train_loss": 0.00878676027059555, "global_step": 8682, "epoch": 72, "lr": 9.674905934544524e-05} +{"train_loss": 0.008598005399107933, "global_step": 8683, "epoch": 72, "lr": 9.674827346425148e-05} +{"train_loss": 0.011419794522225857, "global_step": 8684, "epoch": 72, "lr": 9.674748749127249e-05} +{"train_loss": 0.007983422838151455, "global_step": 8685, "epoch": 72, "lr": 9.67467014265098e-05} +{"train_loss": 0.010867946961221574, "global_step": 8686, "epoch": 72, "lr": 9.674591526996494e-05, "val_loss": 0.012858789414167404} +{"train_loss": 0.009808885864913464, "global_step": 8687, "epoch": 73, "lr": 9.674512902163949e-05} +{"train_loss": 0.014955789782106876, "global_step": 8688, "epoch": 73, "lr": 9.674434268153496e-05} +{"train_loss": 0.012207574211061, "global_step": 8689, "epoch": 73, "lr": 9.674355624965293e-05} +{"train_loss": 0.007364329881966114, "global_step": 8690, "epoch": 73, "lr": 9.67427697259949e-05} +{"train_loss": 0.014142388477921486, "global_step": 8691, "epoch": 73, "lr": 9.674198311056243e-05} +{"train_loss": 0.011430295184254646, "global_step": 8692, "epoch": 73, "lr": 9.674119640335708e-05} +{"train_loss": 0.015048978850245476, "global_step": 8693, "epoch": 73, "lr": 9.674040960438037e-05} +{"train_loss": 0.009611664339900017, "global_step": 8694, "epoch": 73, "lr": 9.673962271363388e-05} +{"train_loss": 0.013793894089758396, "global_step": 8695, "epoch": 73, "lr": 9.673883573111912e-05} +{"train_loss": 0.008086836896836758, "global_step": 8696, "epoch": 73, "lr": 9.673804865683767e-05} +{"train_loss": 0.010287076234817505, "global_step": 8697, "epoch": 73, "lr": 9.673726149079104e-05} +{"train_loss": 0.012772692367434502, "global_step": 8698, "epoch": 73, "lr": 9.673647423298078e-05} +{"train_loss": 0.008844216354191303, "global_step": 8699, "epoch": 73, "lr": 9.673568688340846e-05} +{"train_loss": 0.014286084100604057, "global_step": 8700, "epoch": 73, "lr": 9.67348994420756e-05} +{"train_loss": 0.00859833788126707, "global_step": 8701, "epoch": 73, "lr": 9.673411190898376e-05} +{"train_loss": 0.012314390391111374, "global_step": 8702, "epoch": 73, "lr": 9.67333242841345e-05} +{"train_loss": 0.012026299722492695, "global_step": 8703, "epoch": 73, "lr": 9.673253656752933e-05} +{"train_loss": 0.012160391546785831, "global_step": 8704, "epoch": 73, "lr": 9.673174875916984e-05} +{"train_loss": 0.012222382239997387, "global_step": 8705, "epoch": 73, "lr": 9.673096085905753e-05} +{"train_loss": 0.008376333862543106, "global_step": 8706, "epoch": 73, "lr": 9.673017286719399e-05} +{"train_loss": 0.008961818180978298, "global_step": 8707, "epoch": 73, "lr": 9.672938478358073e-05} +{"train_loss": 0.01244290266185999, "global_step": 8708, "epoch": 73, "lr": 9.672859660821933e-05} +{"train_loss": 0.01364844013005495, "global_step": 8709, "epoch": 73, "lr": 9.672780834111132e-05} +{"train_loss": 0.009397704154253006, "global_step": 8710, "epoch": 73, "lr": 9.672701998225824e-05} +{"train_loss": 0.017130739986896515, "global_step": 8711, "epoch": 73, "lr": 9.672623153166166e-05} +{"train_loss": 0.009984683245420456, "global_step": 8712, "epoch": 73, "lr": 9.672544298932311e-05} +{"train_loss": 0.012267845682799816, "global_step": 8713, "epoch": 73, "lr": 9.672465435524415e-05} +{"train_loss": 0.010194267146289349, "global_step": 8714, "epoch": 73, "lr": 9.672386562942632e-05} +{"train_loss": 0.010820779018104076, "global_step": 8715, "epoch": 73, "lr": 9.672307681187117e-05} +{"train_loss": 0.01963043212890625, "global_step": 8716, "epoch": 73, "lr": 9.672228790258025e-05} +{"train_loss": 0.009559670463204384, "global_step": 8717, "epoch": 73, "lr": 9.67214989015551e-05} +{"train_loss": 0.012892753817141056, "global_step": 8718, "epoch": 73, "lr": 9.67207098087973e-05} +{"train_loss": 0.01034233532845974, "global_step": 8719, "epoch": 73, "lr": 9.671992062430837e-05} +{"train_loss": 0.011606755666434765, "global_step": 8720, "epoch": 73, "lr": 9.671913134808987e-05} +{"train_loss": 0.015272376127541065, "global_step": 8721, "epoch": 73, "lr": 9.671834198014333e-05} +{"train_loss": 0.010207561776041985, "global_step": 8722, "epoch": 73, "lr": 9.671755252047034e-05} +{"train_loss": 0.01119060255587101, "global_step": 8723, "epoch": 73, "lr": 9.671676296907242e-05} +{"train_loss": 0.011061138473451138, "global_step": 8724, "epoch": 73, "lr": 9.67159733259511e-05} +{"train_loss": 0.010873908177018166, "global_step": 8725, "epoch": 73, "lr": 9.671518359110799e-05} +{"train_loss": 0.00950328167527914, "global_step": 8726, "epoch": 73, "lr": 9.67143937645446e-05} +{"train_loss": 0.00718525517731905, "global_step": 8727, "epoch": 73, "lr": 9.671360384626248e-05} +{"train_loss": 0.012241377495229244, "global_step": 8728, "epoch": 73, "lr": 9.67128138362632e-05} +{"train_loss": 0.012777570635080338, "global_step": 8729, "epoch": 73, "lr": 9.671202373454828e-05} +{"train_loss": 0.00945043470710516, "global_step": 8730, "epoch": 73, "lr": 9.671123354111932e-05} +{"train_loss": 0.011325368657708168, "global_step": 8731, "epoch": 73, "lr": 9.671044325597782e-05} +{"train_loss": 0.016853606328368187, "global_step": 8732, "epoch": 73, "lr": 9.670965287912537e-05} +{"train_loss": 0.012862867675721645, "global_step": 8733, "epoch": 73, "lr": 9.67088624105635e-05} +{"train_loss": 0.007260858081281185, "global_step": 8734, "epoch": 73, "lr": 9.670807185029378e-05} +{"train_loss": 0.010011616162955761, "global_step": 8735, "epoch": 73, "lr": 9.670728119831773e-05} +{"train_loss": 0.009745649062097073, "global_step": 8736, "epoch": 73, "lr": 9.670649045463694e-05} +{"train_loss": 0.01068459078669548, "global_step": 8737, "epoch": 73, "lr": 9.670569961925294e-05} +{"train_loss": 0.009719389490783215, "global_step": 8738, "epoch": 73, "lr": 9.670490869216729e-05} +{"train_loss": 0.007768556475639343, "global_step": 8739, "epoch": 73, "lr": 9.670411767338154e-05} +{"train_loss": 0.01079613622277975, "global_step": 8740, "epoch": 73, "lr": 9.670332656289725e-05} +{"train_loss": 0.010274848900735378, "global_step": 8741, "epoch": 73, "lr": 9.670253536071596e-05} +{"train_loss": 0.013495810329914093, "global_step": 8742, "epoch": 73, "lr": 9.670174406683922e-05} +{"train_loss": 0.010530063882470131, "global_step": 8743, "epoch": 73, "lr": 9.670095268126862e-05} +{"train_loss": 0.0088388342410326, "global_step": 8744, "epoch": 73, "lr": 9.670016120400568e-05} +{"train_loss": 0.010323832742869854, "global_step": 8745, "epoch": 73, "lr": 9.669936963505197e-05} +{"train_loss": 0.013730313628911972, "global_step": 8746, "epoch": 73, "lr": 9.669857797440902e-05} +{"train_loss": 0.01044215727597475, "global_step": 8747, "epoch": 73, "lr": 9.669778622207841e-05} +{"train_loss": 0.00901554524898529, "global_step": 8748, "epoch": 73, "lr": 9.669699437806167e-05} +{"train_loss": 0.00747648673132062, "global_step": 8749, "epoch": 73, "lr": 9.66962024423604e-05} +{"train_loss": 0.009304165840148926, "global_step": 8750, "epoch": 73, "lr": 9.66954104149761e-05} +{"train_loss": 0.008051797747612, "global_step": 8751, "epoch": 73, "lr": 9.669461829591037e-05} +{"train_loss": 0.01516362838447094, "global_step": 8752, "epoch": 73, "lr": 9.669382608516473e-05} +{"train_loss": 0.009438703767955303, "global_step": 8753, "epoch": 73, "lr": 9.669303378274076e-05} +{"train_loss": 0.009642993099987507, "global_step": 8754, "epoch": 73, "lr": 9.669224138864e-05} +{"train_loss": 0.012944449670612812, "global_step": 8755, "epoch": 73, "lr": 9.669144890286402e-05} +{"train_loss": 0.011424658820033073, "global_step": 8756, "epoch": 73, "lr": 9.669065632541437e-05} +{"train_loss": 0.00873560830950737, "global_step": 8757, "epoch": 73, "lr": 9.66898636562926e-05} +{"train_loss": 0.012958530336618423, "global_step": 8758, "epoch": 73, "lr": 9.668907089550025e-05} +{"train_loss": 0.005675734020769596, "global_step": 8759, "epoch": 73, "lr": 9.668827804303893e-05} +{"train_loss": 0.010410209186375141, "global_step": 8760, "epoch": 73, "lr": 9.668748509891014e-05} +{"train_loss": 0.011835005134344101, "global_step": 8761, "epoch": 73, "lr": 9.668669206311546e-05} +{"train_loss": 0.010268101468682289, "global_step": 8762, "epoch": 73, "lr": 9.668589893565648e-05} +{"train_loss": 0.010051319375634193, "global_step": 8763, "epoch": 73, "lr": 9.66851057165347e-05} +{"train_loss": 0.012862241826951504, "global_step": 8764, "epoch": 73, "lr": 9.668431240575171e-05} +{"train_loss": 0.006028719712048769, "global_step": 8765, "epoch": 73, "lr": 9.668351900330905e-05} +{"train_loss": 0.01016857661306858, "global_step": 8766, "epoch": 73, "lr": 9.66827255092083e-05} +{"train_loss": 0.011536885984241962, "global_step": 8767, "epoch": 73, "lr": 9.6681931923451e-05} +{"train_loss": 0.008821064606308937, "global_step": 8768, "epoch": 73, "lr": 9.66811382460387e-05} +{"train_loss": 0.008975164964795113, "global_step": 8769, "epoch": 73, "lr": 9.6680344476973e-05} +{"train_loss": 0.016209453344345093, "global_step": 8770, "epoch": 73, "lr": 9.667955061625542e-05} +{"train_loss": 0.0077704270370304585, "global_step": 8771, "epoch": 73, "lr": 9.667875666388752e-05} +{"train_loss": 0.010898320935666561, "global_step": 8772, "epoch": 73, "lr": 9.667796261987088e-05} +{"train_loss": 0.013288794085383415, "global_step": 8773, "epoch": 73, "lr": 9.667716848420704e-05} +{"train_loss": 0.009928139857947826, "global_step": 8774, "epoch": 73, "lr": 9.667637425689758e-05} +{"train_loss": 0.014732730574905872, "global_step": 8775, "epoch": 73, "lr": 9.667557993794403e-05} +{"train_loss": 0.011822656728327274, "global_step": 8776, "epoch": 73, "lr": 9.667478552734796e-05} +{"train_loss": 0.011007022112607956, "global_step": 8777, "epoch": 73, "lr": 9.667399102511095e-05} +{"train_loss": 0.010136437602341175, "global_step": 8778, "epoch": 73, "lr": 9.667319643123453e-05} +{"train_loss": 0.012054722756147385, "global_step": 8779, "epoch": 73, "lr": 9.66724017457203e-05} +{"train_loss": 0.010111604817211628, "global_step": 8780, "epoch": 73, "lr": 9.667160696856978e-05} +{"train_loss": 0.008219823241233826, "global_step": 8781, "epoch": 73, "lr": 9.667081209978454e-05} +{"train_loss": 0.009838009253144264, "global_step": 8782, "epoch": 73, "lr": 9.667001713936615e-05} +{"train_loss": 0.014025172218680382, "global_step": 8783, "epoch": 73, "lr": 9.666922208731617e-05} +{"train_loss": 0.00862869806587696, "global_step": 8784, "epoch": 73, "lr": 9.666842694363616e-05} +{"train_loss": 0.011266801506280899, "global_step": 8785, "epoch": 73, "lr": 9.666763170832767e-05} +{"train_loss": 0.008166620507836342, "global_step": 8786, "epoch": 73, "lr": 9.666683638139228e-05} +{"train_loss": 0.011477160267531872, "global_step": 8787, "epoch": 73, "lr": 9.666604096283154e-05} +{"train_loss": 0.011401579715311527, "global_step": 8788, "epoch": 73, "lr": 9.666524545264701e-05} +{"train_loss": 0.012694177217781544, "global_step": 8789, "epoch": 73, "lr": 9.666444985084026e-05} +{"train_loss": 0.013360445387661457, "global_step": 8790, "epoch": 73, "lr": 9.666365415741286e-05} +{"train_loss": 0.01301026251167059, "global_step": 8791, "epoch": 73, "lr": 9.666285837236635e-05} +{"train_loss": 0.008922187611460686, "global_step": 8792, "epoch": 73, "lr": 9.66620624957023e-05} +{"train_loss": 0.00736782094463706, "global_step": 8793, "epoch": 73, "lr": 9.666126652742227e-05} +{"train_loss": 0.011860265396535397, "global_step": 8794, "epoch": 73, "lr": 9.666047046752784e-05} +{"train_loss": 0.010634402744472027, "global_step": 8795, "epoch": 73, "lr": 9.665967431602055e-05} +{"train_loss": 0.014511587098240852, "global_step": 8796, "epoch": 73, "lr": 9.6658878072902e-05} +{"train_loss": 0.010225607082247734, "global_step": 8797, "epoch": 73, "lr": 9.66580817381737e-05} +{"train_loss": 0.006578112952411175, "global_step": 8798, "epoch": 73, "lr": 9.665728531183725e-05} +{"train_loss": 0.01494460366666317, "global_step": 8799, "epoch": 73, "lr": 9.66564887938942e-05} +{"train_loss": 0.012459277175366879, "global_step": 8800, "epoch": 73, "lr": 9.665569218434612e-05} +{"train_loss": 0.011460812762379646, "global_step": 8801, "epoch": 73, "lr": 9.665489548319457e-05} +{"train_loss": 0.009218571707606316, "global_step": 8802, "epoch": 73, "lr": 9.665409869044113e-05} +{"train_loss": 0.011074374429881573, "global_step": 8803, "epoch": 73, "lr": 9.665330180608735e-05} +{"train_loss": 0.01044610608369112, "global_step": 8804, "epoch": 73, "lr": 9.665250483013479e-05} +{"train_loss": 0.011005654031050806, "global_step": 8805, "epoch": 73, "lr": 9.665170776258504e-05, "val_loss": 0.017579765990376472} +{"train_loss": 0.007502630818635225, "global_step": 8806, "epoch": 74, "lr": 9.665091060343961e-05} +{"train_loss": 0.007549153175204992, "global_step": 8807, "epoch": 74, "lr": 9.665011335270012e-05} +{"train_loss": 0.01543360948562622, "global_step": 8808, "epoch": 74, "lr": 9.66493160103681e-05} +{"train_loss": 0.01002176571637392, "global_step": 8809, "epoch": 74, "lr": 9.664851857644517e-05} +{"train_loss": 0.00879689957946539, "global_step": 8810, "epoch": 74, "lr": 9.664772105093283e-05} +{"train_loss": 0.010189766064286232, "global_step": 8811, "epoch": 74, "lr": 9.664692343383266e-05} +{"train_loss": 0.008854681625962257, "global_step": 8812, "epoch": 74, "lr": 9.664612572514626e-05} +{"train_loss": 0.010136783123016357, "global_step": 8813, "epoch": 74, "lr": 9.664532792487518e-05} +{"train_loss": 0.013463483192026615, "global_step": 8814, "epoch": 74, "lr": 9.664453003302098e-05} +{"train_loss": 0.011380747891962528, "global_step": 8815, "epoch": 74, "lr": 9.66437320495852e-05} +{"train_loss": 0.01564929634332657, "global_step": 8816, "epoch": 74, "lr": 9.664293397456948e-05} +{"train_loss": 0.007787161972373724, "global_step": 8817, "epoch": 74, "lr": 9.664213580797533e-05} +{"train_loss": 0.007398567162454128, "global_step": 8818, "epoch": 74, "lr": 9.664133754980431e-05} +{"train_loss": 0.007540237158536911, "global_step": 8819, "epoch": 74, "lr": 9.664053920005801e-05} +{"train_loss": 0.012668288312852383, "global_step": 8820, "epoch": 74, "lr": 9.663974075873801e-05} +{"train_loss": 0.009394188411533833, "global_step": 8821, "epoch": 74, "lr": 9.663894222584584e-05} +{"train_loss": 0.008138648234307766, "global_step": 8822, "epoch": 74, "lr": 9.66381436013831e-05} +{"train_loss": 0.011539647355675697, "global_step": 8823, "epoch": 74, "lr": 9.663734488535136e-05} +{"train_loss": 0.009387909434735775, "global_step": 8824, "epoch": 74, "lr": 9.663654607775216e-05} +{"train_loss": 0.011619621887803078, "global_step": 8825, "epoch": 74, "lr": 9.66357471785871e-05} +{"train_loss": 0.011089229956269264, "global_step": 8826, "epoch": 74, "lr": 9.663494818785771e-05} +{"train_loss": 0.010285265743732452, "global_step": 8827, "epoch": 74, "lr": 9.663414910556559e-05} +{"train_loss": 0.00984931644052267, "global_step": 8828, "epoch": 74, "lr": 9.663334993171232e-05} +{"train_loss": 0.011331062763929367, "global_step": 8829, "epoch": 74, "lr": 9.663255066629942e-05} +{"train_loss": 0.0135110542178154, "global_step": 8830, "epoch": 74, "lr": 9.66317513093285e-05} +{"train_loss": 0.012654509395360947, "global_step": 8831, "epoch": 74, "lr": 9.663095186080112e-05} +{"train_loss": 0.008935609832406044, "global_step": 8832, "epoch": 74, "lr": 9.663015232071885e-05} +{"train_loss": 0.016954567283391953, "global_step": 8833, "epoch": 74, "lr": 9.662935268908325e-05} +{"train_loss": 0.007169028278440237, "global_step": 8834, "epoch": 74, "lr": 9.66285529658959e-05} +{"train_loss": 0.014065012335777283, "global_step": 8835, "epoch": 74, "lr": 9.662775315115838e-05} +{"train_loss": 0.00813410896807909, "global_step": 8836, "epoch": 74, "lr": 9.662695324487223e-05} +{"train_loss": 0.014546411111950874, "global_step": 8837, "epoch": 74, "lr": 9.662615324703905e-05} +{"train_loss": 0.014105424284934998, "global_step": 8838, "epoch": 74, "lr": 9.66253531576604e-05} +{"train_loss": 0.010131027549505234, "global_step": 8839, "epoch": 74, "lr": 9.662455297673785e-05} +{"train_loss": 0.013965833000838757, "global_step": 8840, "epoch": 74, "lr": 9.662375270427297e-05} +{"train_loss": 0.010540385730564594, "global_step": 8841, "epoch": 74, "lr": 9.662295234026733e-05} +{"train_loss": 0.011772549711167812, "global_step": 8842, "epoch": 74, "lr": 9.66221518847225e-05} +{"train_loss": 0.012534857727587223, "global_step": 8843, "epoch": 74, "lr": 9.662135133764006e-05} +{"train_loss": 0.012931550852954388, "global_step": 8844, "epoch": 74, "lr": 9.662055069902159e-05} +{"train_loss": 0.012026830576360226, "global_step": 8845, "epoch": 74, "lr": 9.661974996886863e-05} +{"train_loss": 0.01320569682866335, "global_step": 8846, "epoch": 74, "lr": 9.661894914718278e-05} +{"train_loss": 0.010733443312346935, "global_step": 8847, "epoch": 74, "lr": 9.66181482339656e-05} +{"train_loss": 0.012859529815614223, "global_step": 8848, "epoch": 74, "lr": 9.661734722921867e-05} +{"train_loss": 0.00794222205877304, "global_step": 8849, "epoch": 74, "lr": 9.661654613294355e-05} +{"train_loss": 0.011309588328003883, "global_step": 8850, "epoch": 74, "lr": 9.661574494514184e-05} +{"train_loss": 0.012200649827718735, "global_step": 8851, "epoch": 74, "lr": 9.661494366581508e-05} +{"train_loss": 0.011823918670415878, "global_step": 8852, "epoch": 74, "lr": 9.661414229496485e-05} +{"train_loss": 0.008214669302105904, "global_step": 8853, "epoch": 74, "lr": 9.661334083259276e-05} +{"train_loss": 0.006946942303329706, "global_step": 8854, "epoch": 74, "lr": 9.661253927870034e-05} +{"train_loss": 0.011928381398320198, "global_step": 8855, "epoch": 74, "lr": 9.661173763328918e-05} +{"train_loss": 0.014252139255404472, "global_step": 8856, "epoch": 74, "lr": 9.661093589636086e-05} +{"train_loss": 0.0122156273573637, "global_step": 8857, "epoch": 74, "lr": 9.661013406791692e-05} +{"train_loss": 0.014994134195148945, "global_step": 8858, "epoch": 74, "lr": 9.6609332147959e-05} +{"train_loss": 0.009427467361092567, "global_step": 8859, "epoch": 74, "lr": 9.66085301364886e-05} +{"train_loss": 0.015468055382370949, "global_step": 8860, "epoch": 74, "lr": 9.660772803350735e-05} +{"train_loss": 0.012890485115349293, "global_step": 8861, "epoch": 74, "lr": 9.660692583901681e-05} +{"train_loss": 0.006462992634624243, "global_step": 8862, "epoch": 74, "lr": 9.660612355301854e-05} +{"train_loss": 0.0111621068790555, "global_step": 8863, "epoch": 74, "lr": 9.660532117551414e-05} +{"train_loss": 0.01207713596522808, "global_step": 8864, "epoch": 74, "lr": 9.660451870650514e-05} +{"train_loss": 0.009831099770963192, "global_step": 8865, "epoch": 74, "lr": 9.660371614599317e-05} +{"train_loss": 0.01119746919721365, "global_step": 8866, "epoch": 74, "lr": 9.660291349397977e-05} +{"train_loss": 0.011193777434527874, "global_step": 8867, "epoch": 74, "lr": 9.660211075046654e-05} +{"train_loss": 0.012419612146914005, "global_step": 8868, "epoch": 74, "lr": 9.660130791545505e-05} +{"train_loss": 0.012652850709855556, "global_step": 8869, "epoch": 74, "lr": 9.660050498894685e-05} +{"train_loss": 0.008487749844789505, "global_step": 8870, "epoch": 74, "lr": 9.659970197094355e-05} +{"train_loss": 0.005198235157877207, "global_step": 8871, "epoch": 74, "lr": 9.659889886144671e-05} +{"train_loss": 0.0077679394744336605, "global_step": 8872, "epoch": 74, "lr": 9.659809566045791e-05} +{"train_loss": 0.013758699409663677, "global_step": 8873, "epoch": 74, "lr": 9.659729236797871e-05} +{"train_loss": 0.019803758710622787, "global_step": 8874, "epoch": 74, "lr": 9.659648898401075e-05} +{"train_loss": 0.012208997271955013, "global_step": 8875, "epoch": 74, "lr": 9.659568550855554e-05} +{"train_loss": 0.01500806212425232, "global_step": 8876, "epoch": 74, "lr": 9.659488194161466e-05} +{"train_loss": 0.01094975695014, "global_step": 8877, "epoch": 74, "lr": 9.659407828318972e-05} +{"train_loss": 0.014729354530572891, "global_step": 8878, "epoch": 74, "lr": 9.659327453328229e-05} +{"train_loss": 0.014711655676364899, "global_step": 8879, "epoch": 74, "lr": 9.659247069189395e-05} +{"train_loss": 0.007450620178133249, "global_step": 8880, "epoch": 74, "lr": 9.659166675902626e-05} +{"train_loss": 0.013068131171166897, "global_step": 8881, "epoch": 74, "lr": 9.659086273468081e-05} +{"train_loss": 0.012717698700726032, "global_step": 8882, "epoch": 74, "lr": 9.659005861885916e-05} +{"train_loss": 0.00925828143954277, "global_step": 8883, "epoch": 74, "lr": 9.658925441156295e-05} +{"train_loss": 0.009874271228909492, "global_step": 8884, "epoch": 74, "lr": 9.65884501127937e-05} +{"train_loss": 0.014943046495318413, "global_step": 8885, "epoch": 74, "lr": 9.658764572255299e-05} +{"train_loss": 0.00783201027661562, "global_step": 8886, "epoch": 74, "lr": 9.658684124084242e-05} +{"train_loss": 0.011947701685130596, "global_step": 8887, "epoch": 74, "lr": 9.658603666766357e-05} +{"train_loss": 0.013278590515255928, "global_step": 8888, "epoch": 74, "lr": 9.658523200301802e-05} +{"train_loss": 0.013132394291460514, "global_step": 8889, "epoch": 74, "lr": 9.658442724690732e-05} +{"train_loss": 0.009657042101025581, "global_step": 8890, "epoch": 74, "lr": 9.65836223993331e-05} +{"train_loss": 0.015495273284614086, "global_step": 8891, "epoch": 74, "lr": 9.65828174602969e-05} +{"train_loss": 0.009299635887145996, "global_step": 8892, "epoch": 74, "lr": 9.658201242980032e-05} +{"train_loss": 0.013210455887019634, "global_step": 8893, "epoch": 74, "lr": 9.658120730784494e-05} +{"train_loss": 0.009202895686030388, "global_step": 8894, "epoch": 74, "lr": 9.658040209443234e-05} +{"train_loss": 0.013110708445310593, "global_step": 8895, "epoch": 74, "lr": 9.657959678956408e-05} +{"train_loss": 0.017358912155032158, "global_step": 8896, "epoch": 74, "lr": 9.657879139324175e-05} +{"train_loss": 0.009627243503928185, "global_step": 8897, "epoch": 74, "lr": 9.657798590546696e-05} +{"train_loss": 0.010462762787938118, "global_step": 8898, "epoch": 74, "lr": 9.657718032624125e-05} +{"train_loss": 0.010126238688826561, "global_step": 8899, "epoch": 74, "lr": 9.657637465556626e-05} +{"train_loss": 0.011521599255502224, "global_step": 8900, "epoch": 74, "lr": 9.65755688934435e-05} +{"train_loss": 0.010472971014678478, "global_step": 8901, "epoch": 74, "lr": 9.65747630398746e-05} +{"train_loss": 0.009342501871287823, "global_step": 8902, "epoch": 74, "lr": 9.657395709486113e-05} +{"train_loss": 0.010319167748093605, "global_step": 8903, "epoch": 74, "lr": 9.657315105840466e-05} +{"train_loss": 0.01215888001024723, "global_step": 8904, "epoch": 74, "lr": 9.65723449305068e-05} +{"train_loss": 0.010169416666030884, "global_step": 8905, "epoch": 74, "lr": 9.65715387111691e-05} +{"train_loss": 0.008691484108567238, "global_step": 8906, "epoch": 74, "lr": 9.657073240039317e-05} +{"train_loss": 0.009854432195425034, "global_step": 8907, "epoch": 74, "lr": 9.656992599818058e-05} +{"train_loss": 0.01211442332714796, "global_step": 8908, "epoch": 74, "lr": 9.656911950453291e-05} +{"train_loss": 0.01022946834564209, "global_step": 8909, "epoch": 74, "lr": 9.656831291945176e-05} +{"train_loss": 0.01034180261194706, "global_step": 8910, "epoch": 74, "lr": 9.656750624293868e-05} +{"train_loss": 0.007513483986258507, "global_step": 8911, "epoch": 74, "lr": 9.656669947499531e-05} +{"train_loss": 0.010996378026902676, "global_step": 8912, "epoch": 74, "lr": 9.656589261562317e-05} +{"train_loss": 0.0067382254637777805, "global_step": 8913, "epoch": 74, "lr": 9.656508566482389e-05} +{"train_loss": 0.013526225462555885, "global_step": 8914, "epoch": 74, "lr": 9.656427862259905e-05} +{"train_loss": 0.009311082772910595, "global_step": 8915, "epoch": 74, "lr": 9.65634714889502e-05} +{"train_loss": 0.006583085283637047, "global_step": 8916, "epoch": 74, "lr": 9.656266426387897e-05} +{"train_loss": 0.01430312916636467, "global_step": 8917, "epoch": 74, "lr": 9.656185694738691e-05} +{"train_loss": 0.011685797944664955, "global_step": 8918, "epoch": 74, "lr": 9.656104953947562e-05} +{"train_loss": 0.009982960298657417, "global_step": 8919, "epoch": 74, "lr": 9.656024204014667e-05} +{"train_loss": 0.015697918832302094, "global_step": 8920, "epoch": 74, "lr": 9.655943444940167e-05} +{"train_loss": 0.009654328227043152, "global_step": 8921, "epoch": 74, "lr": 9.655862676724221e-05} +{"train_loss": 0.009756064042448997, "global_step": 8922, "epoch": 74, "lr": 9.655781899366984e-05} +{"train_loss": 0.011345942504703999, "global_step": 8923, "epoch": 74, "lr": 9.655701112868618e-05} +{"train_loss": 0.011178410134646072, "global_step": 8924, "epoch": 74, "lr": 9.65562031722928e-05, "val_loss": 0.024413302540779114} +{"train_loss": 0.0071298470720648766, "global_step": 8925, "epoch": 75, "lr": 9.655539512449127e-05} +{"train_loss": 0.008248135447502136, "global_step": 8926, "epoch": 75, "lr": 9.655458698528323e-05} +{"train_loss": 0.014223612844944, "global_step": 8927, "epoch": 75, "lr": 9.65537787546702e-05} +{"train_loss": 0.009187798015773296, "global_step": 8928, "epoch": 75, "lr": 9.655297043265381e-05} +{"train_loss": 0.0074604107066988945, "global_step": 8929, "epoch": 75, "lr": 9.655216201923565e-05} +{"train_loss": 0.011451437138020992, "global_step": 8930, "epoch": 75, "lr": 9.655135351441727e-05} +{"train_loss": 0.013258134014904499, "global_step": 8931, "epoch": 75, "lr": 9.65505449182003e-05} +{"train_loss": 0.008576620370149612, "global_step": 8932, "epoch": 75, "lr": 9.65497362305863e-05} +{"train_loss": 0.009942923672497272, "global_step": 8933, "epoch": 75, "lr": 9.654892745157687e-05} +{"train_loss": 0.014511149376630783, "global_step": 8934, "epoch": 75, "lr": 9.654811858117359e-05} +{"train_loss": 0.01028876006603241, "global_step": 8935, "epoch": 75, "lr": 9.654730961937805e-05} +{"train_loss": 0.010660073719918728, "global_step": 8936, "epoch": 75, "lr": 9.654650056619183e-05} +{"train_loss": 0.010896923951804638, "global_step": 8937, "epoch": 75, "lr": 9.654569142161654e-05} +{"train_loss": 0.009614815935492516, "global_step": 8938, "epoch": 75, "lr": 9.654488218565377e-05} +{"train_loss": 0.011462508700788021, "global_step": 8939, "epoch": 75, "lr": 9.654407285830509e-05} +{"train_loss": 0.010397213511168957, "global_step": 8940, "epoch": 75, "lr": 9.654326343957209e-05} +{"train_loss": 0.016192486509680748, "global_step": 8941, "epoch": 75, "lr": 9.654245392945636e-05} +{"train_loss": 0.00810883566737175, "global_step": 8942, "epoch": 75, "lr": 9.654164432795949e-05} +{"train_loss": 0.01300144288688898, "global_step": 8943, "epoch": 75, "lr": 9.65408346350831e-05} +{"train_loss": 0.008291550911962986, "global_step": 8944, "epoch": 75, "lr": 9.654002485082873e-05} +{"train_loss": 0.013619892299175262, "global_step": 8945, "epoch": 75, "lr": 9.6539214975198e-05} +{"train_loss": 0.013262108899652958, "global_step": 8946, "epoch": 75, "lr": 9.653840500819249e-05} +{"train_loss": 0.012722629122436047, "global_step": 8947, "epoch": 75, "lr": 9.653759494981381e-05} +{"train_loss": 0.011972044594585896, "global_step": 8948, "epoch": 75, "lr": 9.65367848000635e-05} +{"train_loss": 0.009773707948625088, "global_step": 8949, "epoch": 75, "lr": 9.653597455894321e-05} +{"train_loss": 0.011549337767064571, "global_step": 8950, "epoch": 75, "lr": 9.65351642264545e-05} +{"train_loss": 0.010998483747243881, "global_step": 8951, "epoch": 75, "lr": 9.653435380259896e-05} +{"train_loss": 0.012581891380250454, "global_step": 8952, "epoch": 75, "lr": 9.65335432873782e-05} +{"train_loss": 0.011651406064629555, "global_step": 8953, "epoch": 75, "lr": 9.65327326807938e-05} +{"train_loss": 0.011112690903246403, "global_step": 8954, "epoch": 75, "lr": 9.653192198284736e-05} +{"train_loss": 0.011500275693833828, "global_step": 8955, "epoch": 75, "lr": 9.653111119354043e-05} +{"train_loss": 0.0114134531468153, "global_step": 8956, "epoch": 75, "lr": 9.653030031287466e-05} +{"train_loss": 0.01072094775736332, "global_step": 8957, "epoch": 75, "lr": 9.652948934085161e-05} +{"train_loss": 0.010342809371650219, "global_step": 8958, "epoch": 75, "lr": 9.652867827747288e-05} +{"train_loss": 0.010540018789470196, "global_step": 8959, "epoch": 75, "lr": 9.652786712274005e-05} +{"train_loss": 0.014538523741066456, "global_step": 8960, "epoch": 75, "lr": 9.652705587665474e-05} +{"train_loss": 0.011402885429561138, "global_step": 8961, "epoch": 75, "lr": 9.652624453921851e-05} +{"train_loss": 0.01143623422831297, "global_step": 8962, "epoch": 75, "lr": 9.652543311043298e-05} +{"train_loss": 0.009926581755280495, "global_step": 8963, "epoch": 75, "lr": 9.652462159029974e-05} +{"train_loss": 0.010156664066016674, "global_step": 8964, "epoch": 75, "lr": 9.652380997882035e-05} +{"train_loss": 0.01036433782428503, "global_step": 8965, "epoch": 75, "lr": 9.652299827599645e-05} +{"train_loss": 0.009230921044945717, "global_step": 8966, "epoch": 75, "lr": 9.652218648182961e-05} +{"train_loss": 0.009025831706821918, "global_step": 8967, "epoch": 75, "lr": 9.652137459632143e-05} +{"train_loss": 0.007462438195943832, "global_step": 8968, "epoch": 75, "lr": 9.652056261947349e-05} +{"train_loss": 0.013681423850357533, "global_step": 8969, "epoch": 75, "lr": 9.651975055128741e-05} +{"train_loss": 0.012147856876254082, "global_step": 8970, "epoch": 75, "lr": 9.651893839176475e-05} +{"train_loss": 0.005980752874165773, "global_step": 8971, "epoch": 75, "lr": 9.651812614090714e-05} +{"train_loss": 0.00848314817994833, "global_step": 8972, "epoch": 75, "lr": 9.651731379871616e-05} +{"train_loss": 0.009660151787102222, "global_step": 8973, "epoch": 75, "lr": 9.651650136519339e-05} +{"train_loss": 0.012404733337461948, "global_step": 8974, "epoch": 75, "lr": 9.651568884034046e-05} +{"train_loss": 0.007939338684082031, "global_step": 8975, "epoch": 75, "lr": 9.651487622415894e-05} +{"train_loss": 0.011411109939217567, "global_step": 8976, "epoch": 75, "lr": 9.651406351665041e-05} +{"train_loss": 0.008953533135354519, "global_step": 8977, "epoch": 75, "lr": 9.651325071781649e-05} +{"train_loss": 0.010330859571695328, "global_step": 8978, "epoch": 75, "lr": 9.65124378276588e-05} +{"train_loss": 0.008543932810425758, "global_step": 8979, "epoch": 75, "lr": 9.651162484617888e-05} +{"train_loss": 0.009118235670030117, "global_step": 8980, "epoch": 75, "lr": 9.651081177337834e-05} +{"train_loss": 0.010909791104495525, "global_step": 8981, "epoch": 75, "lr": 9.650999860925882e-05} +{"train_loss": 0.008436080068349838, "global_step": 8982, "epoch": 75, "lr": 9.650918535382188e-05} +{"train_loss": 0.010855207219719887, "global_step": 8983, "epoch": 75, "lr": 9.650837200706913e-05} +{"train_loss": 0.007731122896075249, "global_step": 8984, "epoch": 75, "lr": 9.650755856900216e-05} +{"train_loss": 0.007828658446669579, "global_step": 8985, "epoch": 75, "lr": 9.650674503962255e-05} +{"train_loss": 0.01322296541184187, "global_step": 8986, "epoch": 75, "lr": 9.650593141893192e-05} +{"train_loss": 0.007643884047865868, "global_step": 8987, "epoch": 75, "lr": 9.650511770693187e-05} +{"train_loss": 0.006449883803725243, "global_step": 8988, "epoch": 75, "lr": 9.650430390362397e-05} +{"train_loss": 0.009806538932025433, "global_step": 8989, "epoch": 75, "lr": 9.650349000900987e-05} +{"train_loss": 0.011435311287641525, "global_step": 8990, "epoch": 75, "lr": 9.650267602309111e-05} +{"train_loss": 0.011039036326110363, "global_step": 8991, "epoch": 75, "lr": 9.650186194586932e-05} +{"train_loss": 0.008239871822297573, "global_step": 8992, "epoch": 75, "lr": 9.65010477773461e-05} +{"train_loss": 0.012079647742211819, "global_step": 8993, "epoch": 75, "lr": 9.650023351752303e-05} +{"train_loss": 0.012561557814478874, "global_step": 8994, "epoch": 75, "lr": 9.649941916640173e-05} +{"train_loss": 0.013087240979075432, "global_step": 8995, "epoch": 75, "lr": 9.649860472398378e-05} +{"train_loss": 0.007666627876460552, "global_step": 8996, "epoch": 75, "lr": 9.649779019027078e-05} +{"train_loss": 0.013001377694308758, "global_step": 8997, "epoch": 75, "lr": 9.649697556526435e-05} +{"train_loss": 0.007877376861870289, "global_step": 8998, "epoch": 75, "lr": 9.649616084896607e-05} +{"train_loss": 0.01084194891154766, "global_step": 8999, "epoch": 75, "lr": 9.649534604137755e-05} +{"train_loss": 0.015034432522952557, "global_step": 9000, "epoch": 75, "lr": 9.649453114250037e-05} +{"train_loss": 0.009242537431418896, "global_step": 9001, "epoch": 75, "lr": 9.649371615233616e-05} +{"train_loss": 0.011971889063715935, "global_step": 9002, "epoch": 75, "lr": 9.649290107088651e-05} +{"train_loss": 0.01165006123483181, "global_step": 9003, "epoch": 75, "lr": 9.649208589815301e-05} +{"train_loss": 0.010472212918102741, "global_step": 9004, "epoch": 75, "lr": 9.649127063413726e-05} +{"train_loss": 0.012689268216490746, "global_step": 9005, "epoch": 75, "lr": 9.649045527884088e-05} +{"train_loss": 0.010286429896950722, "global_step": 9006, "epoch": 75, "lr": 9.648963983226545e-05} +{"train_loss": 0.011684331111609936, "global_step": 9007, "epoch": 75, "lr": 9.648882429441257e-05} +{"train_loss": 0.010754029266536236, "global_step": 9008, "epoch": 75, "lr": 9.648800866528386e-05} +{"train_loss": 0.013300258666276932, "global_step": 9009, "epoch": 75, "lr": 9.648719294488091e-05} +{"train_loss": 0.009130601771175861, "global_step": 9010, "epoch": 75, "lr": 9.648637713320533e-05} +{"train_loss": 0.009285504929721355, "global_step": 9011, "epoch": 75, "lr": 9.648556123025871e-05} +{"train_loss": 0.011474997736513615, "global_step": 9012, "epoch": 75, "lr": 9.648474523604266e-05} +{"train_loss": 0.011049812659621239, "global_step": 9013, "epoch": 75, "lr": 9.648392915055877e-05} +{"train_loss": 0.016980387270450592, "global_step": 9014, "epoch": 75, "lr": 9.648311297380866e-05} +{"train_loss": 0.011111496947705746, "global_step": 9015, "epoch": 75, "lr": 9.648229670579392e-05} +{"train_loss": 0.0083059286698699, "global_step": 9016, "epoch": 75, "lr": 9.648148034651614e-05} +{"train_loss": 0.012417001649737358, "global_step": 9017, "epoch": 75, "lr": 9.648066389597697e-05} +{"train_loss": 0.010629843920469284, "global_step": 9018, "epoch": 75, "lr": 9.647984735417795e-05} +{"train_loss": 0.00946829654276371, "global_step": 9019, "epoch": 75, "lr": 9.647903072112074e-05} +{"train_loss": 0.00964132510125637, "global_step": 9020, "epoch": 75, "lr": 9.647821399680691e-05} +{"train_loss": 0.008115939795970917, "global_step": 9021, "epoch": 75, "lr": 9.647739718123807e-05} +{"train_loss": 0.014985315501689911, "global_step": 9022, "epoch": 75, "lr": 9.647658027441583e-05} +{"train_loss": 0.01609538495540619, "global_step": 9023, "epoch": 75, "lr": 9.647576327634179e-05} +{"train_loss": 0.00944353174418211, "global_step": 9024, "epoch": 75, "lr": 9.647494618701756e-05} +{"train_loss": 0.013491181656718254, "global_step": 9025, "epoch": 75, "lr": 9.647412900644473e-05} +{"train_loss": 0.006253275088965893, "global_step": 9026, "epoch": 75, "lr": 9.64733117346249e-05} +{"train_loss": 0.009744352661073208, "global_step": 9027, "epoch": 75, "lr": 9.64724943715597e-05} +{"train_loss": 0.013377535156905651, "global_step": 9028, "epoch": 75, "lr": 9.647167691725073e-05} +{"train_loss": 0.009068803861737251, "global_step": 9029, "epoch": 75, "lr": 9.647085937169958e-05} +{"train_loss": 0.009662041440606117, "global_step": 9030, "epoch": 75, "lr": 9.647004173490785e-05} +{"train_loss": 0.011855987831950188, "global_step": 9031, "epoch": 75, "lr": 9.646922400687719e-05} +{"train_loss": 0.014959512278437614, "global_step": 9032, "epoch": 75, "lr": 9.646840618760915e-05} +{"train_loss": 0.011956343427300453, "global_step": 9033, "epoch": 75, "lr": 9.646758827710536e-05} +{"train_loss": 0.008680304512381554, "global_step": 9034, "epoch": 75, "lr": 9.646677027536744e-05} +{"train_loss": 0.014608071185648441, "global_step": 9035, "epoch": 75, "lr": 9.646595218239695e-05} +{"train_loss": 0.01079573668539524, "global_step": 9036, "epoch": 75, "lr": 9.646513399819555e-05} +{"train_loss": 0.012161409482359886, "global_step": 9037, "epoch": 75, "lr": 9.646431572276482e-05} +{"train_loss": 0.015706434845924377, "global_step": 9038, "epoch": 75, "lr": 9.646349735610637e-05} +{"train_loss": 0.01214288268238306, "global_step": 9039, "epoch": 75, "lr": 9.64626788982218e-05} +{"train_loss": 0.011870290152728558, "global_step": 9040, "epoch": 75, "lr": 9.646186034911274e-05} +{"train_loss": 0.007516919635236263, "global_step": 9041, "epoch": 75, "lr": 9.646104170878077e-05} +{"train_loss": 0.014379153028130531, "global_step": 9042, "epoch": 75, "lr": 9.64602229772275e-05} +{"train_loss": 0.01087256396940651, "global_step": 9043, "epoch": 75, "lr": 9.645940415445455e-05, "val_loss": 0.01864815503358841, "train_action_mse_error": 0.0004177363880444318} +{"train_loss": 0.008263937197625637, "global_step": 9044, "epoch": 76, "lr": 9.645858524046354e-05} +{"train_loss": 0.007880846969783306, "global_step": 9045, "epoch": 76, "lr": 9.645776623525605e-05} +{"train_loss": 0.010662795044481754, "global_step": 9046, "epoch": 76, "lr": 9.645694713883368e-05} +{"train_loss": 0.015249576419591904, "global_step": 9047, "epoch": 76, "lr": 9.645612795119808e-05} +{"train_loss": 0.0077298479154706, "global_step": 9048, "epoch": 76, "lr": 9.645530867235085e-05} +{"train_loss": 0.007221552077680826, "global_step": 9049, "epoch": 76, "lr": 9.645448930229354e-05} +{"train_loss": 0.009619339369237423, "global_step": 9050, "epoch": 76, "lr": 9.645366984102784e-05} +{"train_loss": 0.008709820918738842, "global_step": 9051, "epoch": 76, "lr": 9.645285028855531e-05} +{"train_loss": 0.011897492222487926, "global_step": 9052, "epoch": 76, "lr": 9.645203064487758e-05} +{"train_loss": 0.007980043068528175, "global_step": 9053, "epoch": 76, "lr": 9.645121090999624e-05} +{"train_loss": 0.014938474632799625, "global_step": 9054, "epoch": 76, "lr": 9.645039108391292e-05} +{"train_loss": 0.008759895339608192, "global_step": 9055, "epoch": 76, "lr": 9.644957116662921e-05} +{"train_loss": 0.00630187476053834, "global_step": 9056, "epoch": 76, "lr": 9.644875115814673e-05} +{"train_loss": 0.008504818193614483, "global_step": 9057, "epoch": 76, "lr": 9.644793105846709e-05} +{"train_loss": 0.009160567075014114, "global_step": 9058, "epoch": 76, "lr": 9.64471108675919e-05} +{"train_loss": 0.007231500931084156, "global_step": 9059, "epoch": 76, "lr": 9.644629058552277e-05} +{"train_loss": 0.014046733267605305, "global_step": 9060, "epoch": 76, "lr": 9.644547021226131e-05} +{"train_loss": 0.01145437266677618, "global_step": 9061, "epoch": 76, "lr": 9.644464974780913e-05} +{"train_loss": 0.010459943674504757, "global_step": 9062, "epoch": 76, "lr": 9.644382919216785e-05} +{"train_loss": 0.007264627609401941, "global_step": 9063, "epoch": 76, "lr": 9.644300854533906e-05} +{"train_loss": 0.008182073011994362, "global_step": 9064, "epoch": 76, "lr": 9.644218780732439e-05} +{"train_loss": 0.008150829933583736, "global_step": 9065, "epoch": 76, "lr": 9.644136697812545e-05} +{"train_loss": 0.010956919752061367, "global_step": 9066, "epoch": 76, "lr": 9.644054605774385e-05} +{"train_loss": 0.01010454073548317, "global_step": 9067, "epoch": 76, "lr": 9.643972504618119e-05} +{"train_loss": 0.009847315028309822, "global_step": 9068, "epoch": 76, "lr": 9.64389039434391e-05} +{"train_loss": 0.008349580690264702, "global_step": 9069, "epoch": 76, "lr": 9.643808274951918e-05} +{"train_loss": 0.011594964191317558, "global_step": 9070, "epoch": 76, "lr": 9.643726146442304e-05} +{"train_loss": 0.010163280181586742, "global_step": 9071, "epoch": 76, "lr": 9.643644008815232e-05} +{"train_loss": 0.013030720874667168, "global_step": 9072, "epoch": 76, "lr": 9.643561862070858e-05} +{"train_loss": 0.0066296691074967384, "global_step": 9073, "epoch": 76, "lr": 9.643479706209348e-05} +{"train_loss": 0.007810782641172409, "global_step": 9074, "epoch": 76, "lr": 9.643397541230861e-05} +{"train_loss": 0.012977140955626965, "global_step": 9075, "epoch": 76, "lr": 9.64331536713556e-05} +{"train_loss": 0.010414314456284046, "global_step": 9076, "epoch": 76, "lr": 9.643233183923606e-05} +{"train_loss": 0.009753814898431301, "global_step": 9077, "epoch": 76, "lr": 9.643150991595158e-05} +{"train_loss": 0.009554430842399597, "global_step": 9078, "epoch": 76, "lr": 9.64306879015038e-05} +{"train_loss": 0.012165997177362442, "global_step": 9079, "epoch": 76, "lr": 9.642986579589431e-05} +{"train_loss": 0.013120409101247787, "global_step": 9080, "epoch": 76, "lr": 9.642904359912475e-05} +{"train_loss": 0.01690071076154709, "global_step": 9081, "epoch": 76, "lr": 9.642822131119672e-05} +{"train_loss": 0.010707245208323002, "global_step": 9082, "epoch": 76, "lr": 9.642739893211185e-05} +{"train_loss": 0.011689482256770134, "global_step": 9083, "epoch": 76, "lr": 9.642657646187171e-05} +{"train_loss": 0.011406420730054379, "global_step": 9084, "epoch": 76, "lr": 9.642575390047799e-05} +{"train_loss": 0.0108122443780303, "global_step": 9085, "epoch": 76, "lr": 9.642493124793224e-05} +{"train_loss": 0.007800678256899118, "global_step": 9086, "epoch": 76, "lr": 9.642410850423608e-05} +{"train_loss": 0.010067884810268879, "global_step": 9087, "epoch": 76, "lr": 9.642328566939119e-05} +{"train_loss": 0.013085606507956982, "global_step": 9088, "epoch": 76, "lr": 9.64224627433991e-05} +{"train_loss": 0.01861431635916233, "global_step": 9089, "epoch": 76, "lr": 9.642163972626147e-05} +{"train_loss": 0.010840598493814468, "global_step": 9090, "epoch": 76, "lr": 9.642081661797992e-05} +{"train_loss": 0.009309104643762112, "global_step": 9091, "epoch": 76, "lr": 9.641999341855605e-05} +{"train_loss": 0.008608004078269005, "global_step": 9092, "epoch": 76, "lr": 9.641917012799146e-05} +{"train_loss": 0.015547391958534718, "global_step": 9093, "epoch": 76, "lr": 9.641834674628782e-05} +{"train_loss": 0.01448194868862629, "global_step": 9094, "epoch": 76, "lr": 9.64175232734467e-05} +{"train_loss": 0.01204033475369215, "global_step": 9095, "epoch": 76, "lr": 9.641669970946973e-05} +{"train_loss": 0.013287008740007877, "global_step": 9096, "epoch": 76, "lr": 9.641587605435855e-05} +{"train_loss": 0.009477771818637848, "global_step": 9097, "epoch": 76, "lr": 9.641505230811474e-05} +{"train_loss": 0.008749469183385372, "global_step": 9098, "epoch": 76, "lr": 9.641422847073994e-05} +{"train_loss": 0.007577054668217897, "global_step": 9099, "epoch": 76, "lr": 9.641340454223576e-05} +{"train_loss": 0.01422165147960186, "global_step": 9100, "epoch": 76, "lr": 9.641258052260381e-05} +{"train_loss": 0.00906859990209341, "global_step": 9101, "epoch": 76, "lr": 9.641175641184573e-05} +{"train_loss": 0.013339324854314327, "global_step": 9102, "epoch": 76, "lr": 9.64109322099631e-05} +{"train_loss": 0.008978493511676788, "global_step": 9103, "epoch": 76, "lr": 9.641010791695759e-05} +{"train_loss": 0.007934797555208206, "global_step": 9104, "epoch": 76, "lr": 9.640928353283079e-05} +{"train_loss": 0.009968859143555164, "global_step": 9105, "epoch": 76, "lr": 9.64084590575843e-05} +{"train_loss": 0.0077872080728411674, "global_step": 9106, "epoch": 76, "lr": 9.640763449121976e-05} +{"train_loss": 0.009837642312049866, "global_step": 9107, "epoch": 76, "lr": 9.64068098337388e-05} +{"train_loss": 0.012286714278161526, "global_step": 9108, "epoch": 76, "lr": 9.640598508514304e-05} +{"train_loss": 0.00888722576200962, "global_step": 9109, "epoch": 76, "lr": 9.640516024543406e-05} +{"train_loss": 0.010496007278561592, "global_step": 9110, "epoch": 76, "lr": 9.640433531461353e-05} +{"train_loss": 0.006670220755040646, "global_step": 9111, "epoch": 76, "lr": 9.640351029268302e-05} +{"train_loss": 0.00952295120805502, "global_step": 9112, "epoch": 76, "lr": 9.640268517964419e-05} +{"train_loss": 0.010101452469825745, "global_step": 9113, "epoch": 76, "lr": 9.640185997549864e-05} +{"train_loss": 0.007402668707072735, "global_step": 9114, "epoch": 76, "lr": 9.640103468024799e-05} +{"train_loss": 0.009335989132523537, "global_step": 9115, "epoch": 76, "lr": 9.640020929389389e-05} +{"train_loss": 0.01508919708430767, "global_step": 9116, "epoch": 76, "lr": 9.639938381643791e-05} +{"train_loss": 0.009246580302715302, "global_step": 9117, "epoch": 76, "lr": 9.63985582478817e-05} +{"train_loss": 0.014742826111614704, "global_step": 9118, "epoch": 76, "lr": 9.639773258822689e-05} +{"train_loss": 0.007771120872348547, "global_step": 9119, "epoch": 76, "lr": 9.639690683747507e-05} +{"train_loss": 0.01019755657762289, "global_step": 9120, "epoch": 76, "lr": 9.639608099562789e-05} +{"train_loss": 0.007658873684704304, "global_step": 9121, "epoch": 76, "lr": 9.639525506268696e-05} +{"train_loss": 0.011436155065894127, "global_step": 9122, "epoch": 76, "lr": 9.639442903865393e-05} +{"train_loss": 0.012023890390992165, "global_step": 9123, "epoch": 76, "lr": 9.639360292353035e-05} +{"train_loss": 0.010547105222940445, "global_step": 9124, "epoch": 76, "lr": 9.639277671731791e-05} +{"train_loss": 0.009549092501401901, "global_step": 9125, "epoch": 76, "lr": 9.63919504200182e-05} +{"train_loss": 0.010195660404860973, "global_step": 9126, "epoch": 76, "lr": 9.639112403163287e-05} +{"train_loss": 0.010930772870779037, "global_step": 9127, "epoch": 76, "lr": 9.639029755216351e-05} +{"train_loss": 0.00691183190792799, "global_step": 9128, "epoch": 76, "lr": 9.638947098161177e-05} +{"train_loss": 0.010586370714008808, "global_step": 9129, "epoch": 76, "lr": 9.638864431997925e-05} +{"train_loss": 0.009764465503394604, "global_step": 9130, "epoch": 76, "lr": 9.638781756726759e-05} +{"train_loss": 0.007532735355198383, "global_step": 9131, "epoch": 76, "lr": 9.638699072347839e-05} +{"train_loss": 0.010206830687820911, "global_step": 9132, "epoch": 76, "lr": 9.63861637886133e-05} +{"train_loss": 0.011084978468716145, "global_step": 9133, "epoch": 76, "lr": 9.638533676267393e-05} +{"train_loss": 0.009445120580494404, "global_step": 9134, "epoch": 76, "lr": 9.63845096456619e-05} +{"train_loss": 0.01298131700605154, "global_step": 9135, "epoch": 76, "lr": 9.638368243757886e-05} +{"train_loss": 0.009290646761655807, "global_step": 9136, "epoch": 76, "lr": 9.638285513842639e-05} +{"train_loss": 0.011937620118260384, "global_step": 9137, "epoch": 76, "lr": 9.638202774820617e-05} +{"train_loss": 0.014044376090168953, "global_step": 9138, "epoch": 76, "lr": 9.638120026691977e-05} +{"train_loss": 0.009264294989407063, "global_step": 9139, "epoch": 76, "lr": 9.638037269456886e-05} +{"train_loss": 0.00998220220208168, "global_step": 9140, "epoch": 76, "lr": 9.637954503115502e-05} +{"train_loss": 0.00784939806908369, "global_step": 9141, "epoch": 76, "lr": 9.637871727667991e-05} +{"train_loss": 0.009757472202181816, "global_step": 9142, "epoch": 76, "lr": 9.637788943114514e-05} +{"train_loss": 0.016375476494431496, "global_step": 9143, "epoch": 76, "lr": 9.637706149455233e-05} +{"train_loss": 0.012098078615963459, "global_step": 9144, "epoch": 76, "lr": 9.637623346690312e-05} +{"train_loss": 0.009239790961146355, "global_step": 9145, "epoch": 76, "lr": 9.637540534819914e-05} +{"train_loss": 0.011718557216227055, "global_step": 9146, "epoch": 76, "lr": 9.6374577138442e-05} +{"train_loss": 0.00957297720015049, "global_step": 9147, "epoch": 76, "lr": 9.637374883763332e-05} +{"train_loss": 0.009640688076615334, "global_step": 9148, "epoch": 76, "lr": 9.637292044577477e-05} +{"train_loss": 0.01058943010866642, "global_step": 9149, "epoch": 76, "lr": 9.637209196286792e-05} +{"train_loss": 0.010400399565696716, "global_step": 9150, "epoch": 76, "lr": 9.637126338891443e-05} +{"train_loss": 0.008698584511876106, "global_step": 9151, "epoch": 76, "lr": 9.637043472391591e-05} +{"train_loss": 0.008355467580258846, "global_step": 9152, "epoch": 76, "lr": 9.6369605967874e-05} +{"train_loss": 0.013033954426646233, "global_step": 9153, "epoch": 76, "lr": 9.636877712079034e-05} +{"train_loss": 0.011673327535390854, "global_step": 9154, "epoch": 76, "lr": 9.63679481826665e-05} +{"train_loss": 0.011051815934479237, "global_step": 9155, "epoch": 76, "lr": 9.636711915350418e-05} +{"train_loss": 0.005507193971425295, "global_step": 9156, "epoch": 76, "lr": 9.636629003330497e-05} +{"train_loss": 0.009711106307804585, "global_step": 9157, "epoch": 76, "lr": 9.63654608220705e-05} +{"train_loss": 0.007312459871172905, "global_step": 9158, "epoch": 76, "lr": 9.63646315198024e-05} +{"train_loss": 0.011345778591930866, "global_step": 9159, "epoch": 76, "lr": 9.636380212650229e-05} +{"train_loss": 0.011710436083376408, "global_step": 9160, "epoch": 76, "lr": 9.636297264217182e-05} +{"train_loss": 0.008760331198573112, "global_step": 9161, "epoch": 76, "lr": 9.63621430668126e-05} +{"train_loss": 0.010311059105922194, "global_step": 9162, "epoch": 76, "lr": 9.636131340042626e-05, "val_loss": 0.018288541585206985} +{"train_loss": 0.0076103610917925835, "global_step": 9163, "epoch": 77, "lr": 9.636048364301445e-05} +{"train_loss": 0.011262809857726097, "global_step": 9164, "epoch": 77, "lr": 9.635965379457878e-05} +{"train_loss": 0.010378938168287277, "global_step": 9165, "epoch": 77, "lr": 9.635882385512087e-05} +{"train_loss": 0.007520400453358889, "global_step": 9166, "epoch": 77, "lr": 9.635799382464237e-05} +{"train_loss": 0.008659208193421364, "global_step": 9167, "epoch": 77, "lr": 9.635716370314491e-05} +{"train_loss": 0.010287027806043625, "global_step": 9168, "epoch": 77, "lr": 9.63563334906301e-05} +{"train_loss": 0.011004823260009289, "global_step": 9169, "epoch": 77, "lr": 9.635550318709958e-05} +{"train_loss": 0.007676348555833101, "global_step": 9170, "epoch": 77, "lr": 9.635467279255499e-05} +{"train_loss": 0.007875203154981136, "global_step": 9171, "epoch": 77, "lr": 9.635384230699796e-05} +{"train_loss": 0.009244381450116634, "global_step": 9172, "epoch": 77, "lr": 9.63530117304301e-05} +{"train_loss": 0.008821167051792145, "global_step": 9173, "epoch": 77, "lr": 9.635218106285307e-05} +{"train_loss": 0.009041686542332172, "global_step": 9174, "epoch": 77, "lr": 9.635135030426845e-05} +{"train_loss": 0.009401912800967693, "global_step": 9175, "epoch": 77, "lr": 9.635051945467792e-05} +{"train_loss": 0.005942878779023886, "global_step": 9176, "epoch": 77, "lr": 9.634968851408312e-05} +{"train_loss": 0.012210807763040066, "global_step": 9177, "epoch": 77, "lr": 9.634885748248563e-05} +{"train_loss": 0.011368685401976109, "global_step": 9178, "epoch": 77, "lr": 9.634802635988714e-05} +{"train_loss": 0.01280246488749981, "global_step": 9179, "epoch": 77, "lr": 9.634719514628923e-05} +{"train_loss": 0.009222686290740967, "global_step": 9180, "epoch": 77, "lr": 9.634636384169355e-05} +{"train_loss": 0.010648428462445736, "global_step": 9181, "epoch": 77, "lr": 9.634553244610173e-05} +{"train_loss": 0.011246339417994022, "global_step": 9182, "epoch": 77, "lr": 9.634470095951543e-05} +{"train_loss": 0.010728562250733376, "global_step": 9183, "epoch": 77, "lr": 9.634386938193624e-05} +{"train_loss": 0.010164101608097553, "global_step": 9184, "epoch": 77, "lr": 9.634303771336583e-05} +{"train_loss": 0.01118498109281063, "global_step": 9185, "epoch": 77, "lr": 9.634220595380582e-05} +{"train_loss": 0.00706908293068409, "global_step": 9186, "epoch": 77, "lr": 9.634137410325783e-05} +{"train_loss": 0.008920778520405293, "global_step": 9187, "epoch": 77, "lr": 9.63405421617235e-05} +{"train_loss": 0.008438102900981903, "global_step": 9188, "epoch": 77, "lr": 9.633971012920448e-05} +{"train_loss": 0.008771040476858616, "global_step": 9189, "epoch": 77, "lr": 9.633887800570239e-05} +{"train_loss": 0.008826571516692638, "global_step": 9190, "epoch": 77, "lr": 9.633804579121884e-05} +{"train_loss": 0.008026680909097195, "global_step": 9191, "epoch": 77, "lr": 9.63372134857555e-05} +{"train_loss": 0.008835872635245323, "global_step": 9192, "epoch": 77, "lr": 9.6336381089314e-05} +{"train_loss": 0.008702563121914864, "global_step": 9193, "epoch": 77, "lr": 9.633554860189596e-05} +{"train_loss": 0.015711022540926933, "global_step": 9194, "epoch": 77, "lr": 9.633471602350301e-05} +{"train_loss": 0.01292066927999258, "global_step": 9195, "epoch": 77, "lr": 9.633388335413681e-05} +{"train_loss": 0.010088575072586536, "global_step": 9196, "epoch": 77, "lr": 9.633305059379898e-05} +{"train_loss": 0.010520746000111103, "global_step": 9197, "epoch": 77, "lr": 9.633221774249115e-05} +{"train_loss": 0.010120043531060219, "global_step": 9198, "epoch": 77, "lr": 9.633138480021495e-05} +{"train_loss": 0.009632905013859272, "global_step": 9199, "epoch": 77, "lr": 9.633055176697205e-05} +{"train_loss": 0.013653673231601715, "global_step": 9200, "epoch": 77, "lr": 9.632971864276405e-05} +{"train_loss": 0.00839173048734665, "global_step": 9201, "epoch": 77, "lr": 9.632888542759259e-05} +{"train_loss": 0.008640105836093426, "global_step": 9202, "epoch": 77, "lr": 9.632805212145932e-05} +{"train_loss": 0.01008232869207859, "global_step": 9203, "epoch": 77, "lr": 9.632721872436585e-05} +{"train_loss": 0.00848380010575056, "global_step": 9204, "epoch": 77, "lr": 9.632638523631386e-05} +{"train_loss": 0.011620085686445236, "global_step": 9205, "epoch": 77, "lr": 9.632555165730496e-05} +{"train_loss": 0.008342615328729153, "global_step": 9206, "epoch": 77, "lr": 9.632471798734077e-05} +{"train_loss": 0.015480482950806618, "global_step": 9207, "epoch": 77, "lr": 9.632388422642296e-05} +{"train_loss": 0.00837462954223156, "global_step": 9208, "epoch": 77, "lr": 9.632305037455315e-05} +{"train_loss": 0.009378457441926003, "global_step": 9209, "epoch": 77, "lr": 9.632221643173299e-05} +{"train_loss": 0.016473539173603058, "global_step": 9210, "epoch": 77, "lr": 9.632138239796408e-05} +{"train_loss": 0.011769931763410568, "global_step": 9211, "epoch": 77, "lr": 9.632054827324812e-05} +{"train_loss": 0.008515551686286926, "global_step": 9212, "epoch": 77, "lr": 9.631971405758668e-05} +{"train_loss": 0.009375184774398804, "global_step": 9213, "epoch": 77, "lr": 9.631887975098145e-05} +{"train_loss": 0.013007779605686665, "global_step": 9214, "epoch": 77, "lr": 9.631804535343404e-05} +{"train_loss": 0.010624049231410027, "global_step": 9215, "epoch": 77, "lr": 9.631721086494609e-05} +{"train_loss": 0.009675219655036926, "global_step": 9216, "epoch": 77, "lr": 9.631637628551925e-05} +{"train_loss": 0.007097456604242325, "global_step": 9217, "epoch": 77, "lr": 9.631554161515517e-05} +{"train_loss": 0.006682110019028187, "global_step": 9218, "epoch": 77, "lr": 9.631470685385545e-05} +{"train_loss": 0.0073497784323990345, "global_step": 9219, "epoch": 77, "lr": 9.631387200162176e-05} +{"train_loss": 0.00740513252094388, "global_step": 9220, "epoch": 77, "lr": 9.631303705845573e-05} +{"train_loss": 0.009249693714082241, "global_step": 9221, "epoch": 77, "lr": 9.6312202024359e-05} +{"train_loss": 0.011748719029128551, "global_step": 9222, "epoch": 77, "lr": 9.63113668993332e-05} +{"train_loss": 0.008809211663901806, "global_step": 9223, "epoch": 77, "lr": 9.631053168337999e-05} +{"train_loss": 0.011065890081226826, "global_step": 9224, "epoch": 77, "lr": 9.630969637650101e-05} +{"train_loss": 0.012002063915133476, "global_step": 9225, "epoch": 77, "lr": 9.630886097869787e-05} +{"train_loss": 0.007322516292333603, "global_step": 9226, "epoch": 77, "lr": 9.630802548997222e-05} +{"train_loss": 0.012490618973970413, "global_step": 9227, "epoch": 77, "lr": 9.630718991032572e-05} +{"train_loss": 0.010914614424109459, "global_step": 9228, "epoch": 77, "lr": 9.630635423976e-05} +{"train_loss": 0.010061553679406643, "global_step": 9229, "epoch": 77, "lr": 9.630551847827672e-05} +{"train_loss": 0.008864529430866241, "global_step": 9230, "epoch": 77, "lr": 9.630468262587746e-05} +{"train_loss": 0.004500445909798145, "global_step": 9231, "epoch": 77, "lr": 9.630384668256393e-05} +{"train_loss": 0.01276721153408289, "global_step": 9232, "epoch": 77, "lr": 9.630301064833774e-05} +{"train_loss": 0.012446588836610317, "global_step": 9233, "epoch": 77, "lr": 9.630217452320054e-05} +{"train_loss": 0.009340089745819569, "global_step": 9234, "epoch": 77, "lr": 9.630133830715395e-05} +{"train_loss": 0.00845417845994234, "global_step": 9235, "epoch": 77, "lr": 9.630050200019965e-05} +{"train_loss": 0.010651142336428165, "global_step": 9236, "epoch": 77, "lr": 9.629966560233926e-05} +{"train_loss": 0.00993811059743166, "global_step": 9237, "epoch": 77, "lr": 9.62988291135744e-05} +{"train_loss": 0.007704117801040411, "global_step": 9238, "epoch": 77, "lr": 9.629799253390676e-05} +{"train_loss": 0.008582456037402153, "global_step": 9239, "epoch": 77, "lr": 9.629715586333795e-05} +{"train_loss": 0.007456934545189142, "global_step": 9240, "epoch": 77, "lr": 9.629631910186962e-05} +{"train_loss": 0.014129010029137135, "global_step": 9241, "epoch": 77, "lr": 9.62954822495034e-05} +{"train_loss": 0.01246940903365612, "global_step": 9242, "epoch": 77, "lr": 9.629464530624098e-05} +{"train_loss": 0.011259634979069233, "global_step": 9243, "epoch": 77, "lr": 9.629380827208394e-05} +{"train_loss": 0.012836028821766376, "global_step": 9244, "epoch": 77, "lr": 9.629297114703394e-05} +{"train_loss": 0.012640619650483131, "global_step": 9245, "epoch": 77, "lr": 9.629213393109266e-05} +{"train_loss": 0.010052982717752457, "global_step": 9246, "epoch": 77, "lr": 9.629129662426172e-05} +{"train_loss": 0.011221951805055141, "global_step": 9247, "epoch": 77, "lr": 9.629045922654278e-05} +{"train_loss": 0.009122610092163086, "global_step": 9248, "epoch": 77, "lr": 9.628962173793745e-05} +{"train_loss": 0.009877949953079224, "global_step": 9249, "epoch": 77, "lr": 9.62887841584474e-05} +{"train_loss": 0.008687048219144344, "global_step": 9250, "epoch": 77, "lr": 9.628794648807426e-05} +{"train_loss": 0.009900783188641071, "global_step": 9251, "epoch": 77, "lr": 9.628710872681967e-05} +{"train_loss": 0.015211114659905434, "global_step": 9252, "epoch": 77, "lr": 9.628627087468532e-05} +{"train_loss": 0.011132155545055866, "global_step": 9253, "epoch": 77, "lr": 9.62854329316728e-05} +{"train_loss": 0.006898375693708658, "global_step": 9254, "epoch": 77, "lr": 9.628459489778377e-05} +{"train_loss": 0.006250809412449598, "global_step": 9255, "epoch": 77, "lr": 9.62837567730199e-05} +{"train_loss": 0.010567066259682178, "global_step": 9256, "epoch": 77, "lr": 9.628291855738281e-05} +{"train_loss": 0.011048289947211742, "global_step": 9257, "epoch": 77, "lr": 9.628208025087417e-05} +{"train_loss": 0.010934696532785892, "global_step": 9258, "epoch": 77, "lr": 9.628124185349559e-05} +{"train_loss": 0.008086620829999447, "global_step": 9259, "epoch": 77, "lr": 9.628040336524873e-05} +{"train_loss": 0.009123328141868114, "global_step": 9260, "epoch": 77, "lr": 9.627956478613526e-05} +{"train_loss": 0.011109433136880398, "global_step": 9261, "epoch": 77, "lr": 9.62787261161568e-05} +{"train_loss": 0.011616993695497513, "global_step": 9262, "epoch": 77, "lr": 9.627788735531503e-05} +{"train_loss": 0.013967390172183514, "global_step": 9263, "epoch": 77, "lr": 9.627704850361154e-05} +{"train_loss": 0.008481962606310844, "global_step": 9264, "epoch": 77, "lr": 9.627620956104801e-05} +{"train_loss": 0.010815338231623173, "global_step": 9265, "epoch": 77, "lr": 9.62753705276261e-05} +{"train_loss": 0.010616817511618137, "global_step": 9266, "epoch": 77, "lr": 9.627453140334744e-05} +{"train_loss": 0.011989651247859001, "global_step": 9267, "epoch": 77, "lr": 9.62736921882137e-05} +{"train_loss": 0.013155410066246986, "global_step": 9268, "epoch": 77, "lr": 9.627285288222647e-05} +{"train_loss": 0.011456543579697609, "global_step": 9269, "epoch": 77, "lr": 9.627201348538745e-05} +{"train_loss": 0.009129618294537067, "global_step": 9270, "epoch": 77, "lr": 9.627117399769829e-05} +{"train_loss": 0.007228192873299122, "global_step": 9271, "epoch": 77, "lr": 9.627033441916063e-05} +{"train_loss": 0.010269224643707275, "global_step": 9272, "epoch": 77, "lr": 9.62694947497761e-05} +{"train_loss": 0.01005149818956852, "global_step": 9273, "epoch": 77, "lr": 9.626865498954635e-05} +{"train_loss": 0.00934532843530178, "global_step": 9274, "epoch": 77, "lr": 9.626781513847306e-05} +{"train_loss": 0.012328235432505608, "global_step": 9275, "epoch": 77, "lr": 9.626697519655783e-05} +{"train_loss": 0.009211440570652485, "global_step": 9276, "epoch": 77, "lr": 9.626613516380235e-05} +{"train_loss": 0.011581302620470524, "global_step": 9277, "epoch": 77, "lr": 9.626529504020826e-05} +{"train_loss": 0.012875314801931381, "global_step": 9278, "epoch": 77, "lr": 9.62644548257772e-05} +{"train_loss": 0.007551392540335655, "global_step": 9279, "epoch": 77, "lr": 9.626361452051084e-05} +{"train_loss": 0.010745448060333729, "global_step": 9280, "epoch": 77, "lr": 9.626277412441081e-05} +{"train_loss": 0.010091411775494573, "global_step": 9281, "epoch": 77, "lr": 9.626193363747875e-05, "val_loss": 0.011087017133831978} +{"train_loss": 0.008289537392556667, "global_step": 9282, "epoch": 78, "lr": 9.626109305971634e-05} +{"train_loss": 0.010281701572239399, "global_step": 9283, "epoch": 78, "lr": 9.626025239112521e-05} +{"train_loss": 0.008477512747049332, "global_step": 9284, "epoch": 78, "lr": 9.625941163170702e-05} +{"train_loss": 0.007603306323289871, "global_step": 9285, "epoch": 78, "lr": 9.62585707814634e-05} +{"train_loss": 0.01401674933731556, "global_step": 9286, "epoch": 78, "lr": 9.625772984039606e-05} +{"train_loss": 0.010487700812518597, "global_step": 9287, "epoch": 78, "lr": 9.625688880850658e-05} +{"train_loss": 0.00745042460039258, "global_step": 9288, "epoch": 78, "lr": 9.625604768579663e-05} +{"train_loss": 0.013095158152282238, "global_step": 9289, "epoch": 78, "lr": 9.625520647226789e-05} +{"train_loss": 0.006976609583944082, "global_step": 9290, "epoch": 78, "lr": 9.625436516792199e-05} +{"train_loss": 0.008828768506646156, "global_step": 9291, "epoch": 78, "lr": 9.625352377276058e-05} +{"train_loss": 0.008405493572354317, "global_step": 9292, "epoch": 78, "lr": 9.625268228678534e-05} +{"train_loss": 0.012397530488669872, "global_step": 9293, "epoch": 78, "lr": 9.625184070999787e-05} +{"train_loss": 0.014005821198225021, "global_step": 9294, "epoch": 78, "lr": 9.625099904239987e-05} +{"train_loss": 0.010694808326661587, "global_step": 9295, "epoch": 78, "lr": 9.625015728399298e-05} +{"train_loss": 0.010998311452567577, "global_step": 9296, "epoch": 78, "lr": 9.624931543477884e-05} +{"train_loss": 0.010462593287229538, "global_step": 9297, "epoch": 78, "lr": 9.62484734947591e-05} +{"train_loss": 0.01259271614253521, "global_step": 9298, "epoch": 78, "lr": 9.624763146393542e-05} +{"train_loss": 0.011109967716038227, "global_step": 9299, "epoch": 78, "lr": 9.624678934230948e-05} +{"train_loss": 0.010706056840717793, "global_step": 9300, "epoch": 78, "lr": 9.624594712988289e-05} +{"train_loss": 0.007139911409467459, "global_step": 9301, "epoch": 78, "lr": 9.624510482665733e-05} +{"train_loss": 0.01078185997903347, "global_step": 9302, "epoch": 78, "lr": 9.624426243263444e-05} +{"train_loss": 0.010564463213086128, "global_step": 9303, "epoch": 78, "lr": 9.62434199478159e-05} +{"train_loss": 0.013391208834946156, "global_step": 9304, "epoch": 78, "lr": 9.624257737220333e-05} +{"train_loss": 0.013230354525148869, "global_step": 9305, "epoch": 78, "lr": 9.62417347057984e-05} +{"train_loss": 0.011072726920247078, "global_step": 9306, "epoch": 78, "lr": 9.624089194860277e-05} +{"train_loss": 0.008831002749502659, "global_step": 9307, "epoch": 78, "lr": 9.624004910061809e-05} +{"train_loss": 0.013073244132101536, "global_step": 9308, "epoch": 78, "lr": 9.6239206161846e-05} +{"train_loss": 0.009903967380523682, "global_step": 9309, "epoch": 78, "lr": 9.623836313228819e-05} +{"train_loss": 0.010654209181666374, "global_step": 9310, "epoch": 78, "lr": 9.623752001194628e-05} +{"train_loss": 0.014447526074945927, "global_step": 9311, "epoch": 78, "lr": 9.623667680082193e-05} +{"train_loss": 0.008932497352361679, "global_step": 9312, "epoch": 78, "lr": 9.623583349891683e-05} +{"train_loss": 0.010035832412540913, "global_step": 9313, "epoch": 78, "lr": 9.62349901062326e-05} +{"train_loss": 0.010072635486721992, "global_step": 9314, "epoch": 78, "lr": 9.62341466227709e-05} +{"train_loss": 0.008276786655187607, "global_step": 9315, "epoch": 78, "lr": 9.62333030485334e-05} +{"train_loss": 0.010707888752222061, "global_step": 9316, "epoch": 78, "lr": 9.623245938352175e-05} +{"train_loss": 0.007642665412276983, "global_step": 9317, "epoch": 78, "lr": 9.62316156277376e-05} +{"train_loss": 0.009749933145940304, "global_step": 9318, "epoch": 78, "lr": 9.62307717811826e-05} +{"train_loss": 0.008344431407749653, "global_step": 9319, "epoch": 78, "lr": 9.622992784385843e-05} +{"train_loss": 0.008554426021873951, "global_step": 9320, "epoch": 78, "lr": 9.622908381576674e-05} +{"train_loss": 0.00886467844247818, "global_step": 9321, "epoch": 78, "lr": 9.622823969690917e-05} +{"train_loss": 0.009712157770991325, "global_step": 9322, "epoch": 78, "lr": 9.622739548728741e-05} +{"train_loss": 0.010398605838418007, "global_step": 9323, "epoch": 78, "lr": 9.622655118690308e-05} +{"train_loss": 0.006046812515705824, "global_step": 9324, "epoch": 78, "lr": 9.622570679575786e-05} +{"train_loss": 0.007444691378623247, "global_step": 9325, "epoch": 78, "lr": 9.622486231385341e-05} +{"train_loss": 0.006178546231240034, "global_step": 9326, "epoch": 78, "lr": 9.622401774119137e-05} +{"train_loss": 0.0079563669860363, "global_step": 9327, "epoch": 78, "lr": 9.622317307777342e-05} +{"train_loss": 0.009824588894844055, "global_step": 9328, "epoch": 78, "lr": 9.62223283236012e-05} +{"train_loss": 0.009846260771155357, "global_step": 9329, "epoch": 78, "lr": 9.622148347867639e-05} +{"train_loss": 0.010657385922968388, "global_step": 9330, "epoch": 78, "lr": 9.622063854300062e-05} +{"train_loss": 0.007922397926449776, "global_step": 9331, "epoch": 78, "lr": 9.621979351657558e-05} +{"train_loss": 0.010407565161585808, "global_step": 9332, "epoch": 78, "lr": 9.621894839940288e-05} +{"train_loss": 0.010148631408810616, "global_step": 9333, "epoch": 78, "lr": 9.621810319148425e-05} +{"train_loss": 0.008832166902720928, "global_step": 9334, "epoch": 78, "lr": 9.62172578928213e-05} +{"train_loss": 0.008633371442556381, "global_step": 9335, "epoch": 78, "lr": 9.621641250341569e-05} +{"train_loss": 0.010216332040727139, "global_step": 9336, "epoch": 78, "lr": 9.62155670232691e-05} +{"train_loss": 0.0074516888707876205, "global_step": 9337, "epoch": 78, "lr": 9.621472145238318e-05} +{"train_loss": 0.011637398973107338, "global_step": 9338, "epoch": 78, "lr": 9.62138757907596e-05} +{"train_loss": 0.006274286191910505, "global_step": 9339, "epoch": 78, "lr": 9.621303003840001e-05} +{"train_loss": 0.012794388458132744, "global_step": 9340, "epoch": 78, "lr": 9.621218419530607e-05} +{"train_loss": 0.01076881866902113, "global_step": 9341, "epoch": 78, "lr": 9.621133826147943e-05} +{"train_loss": 0.009985513053834438, "global_step": 9342, "epoch": 78, "lr": 9.621049223692178e-05} +{"train_loss": 0.008475731126964092, "global_step": 9343, "epoch": 78, "lr": 9.620964612163477e-05} +{"train_loss": 0.011560911312699318, "global_step": 9344, "epoch": 78, "lr": 9.620879991562004e-05} +{"train_loss": 0.007804931607097387, "global_step": 9345, "epoch": 78, "lr": 9.620795361887928e-05} +{"train_loss": 0.0047632488422095776, "global_step": 9346, "epoch": 78, "lr": 9.620710723141413e-05} +{"train_loss": 0.005666519049555063, "global_step": 9347, "epoch": 78, "lr": 9.620626075322627e-05} +{"train_loss": 0.014402145519852638, "global_step": 9348, "epoch": 78, "lr": 9.620541418431735e-05} +{"train_loss": 0.009395618923008442, "global_step": 9349, "epoch": 78, "lr": 9.620456752468904e-05} +{"train_loss": 0.00868596974760294, "global_step": 9350, "epoch": 78, "lr": 9.6203720774343e-05} +{"train_loss": 0.010243749246001244, "global_step": 9351, "epoch": 78, "lr": 9.620287393328088e-05} +{"train_loss": 0.00809998344630003, "global_step": 9352, "epoch": 78, "lr": 9.620202700150436e-05} +{"train_loss": 0.006695957854390144, "global_step": 9353, "epoch": 78, "lr": 9.62011799790151e-05} +{"train_loss": 0.008771093562245369, "global_step": 9354, "epoch": 78, "lr": 9.620033286581475e-05} +{"train_loss": 0.006551552098244429, "global_step": 9355, "epoch": 78, "lr": 9.619948566190497e-05} +{"train_loss": 0.006241714581847191, "global_step": 9356, "epoch": 78, "lr": 9.619863836728746e-05} +{"train_loss": 0.009110423736274242, "global_step": 9357, "epoch": 78, "lr": 9.619779098196385e-05} +{"train_loss": 0.012770102359354496, "global_step": 9358, "epoch": 78, "lr": 9.619694350593581e-05} +{"train_loss": 0.006891237106174231, "global_step": 9359, "epoch": 78, "lr": 9.619609593920501e-05} +{"train_loss": 0.006470457185059786, "global_step": 9360, "epoch": 78, "lr": 9.619524828177311e-05} +{"train_loss": 0.008985240012407303, "global_step": 9361, "epoch": 78, "lr": 9.619440053364177e-05} +{"train_loss": 0.006491749081760645, "global_step": 9362, "epoch": 78, "lr": 9.619355269481268e-05} +{"train_loss": 0.00979702454060316, "global_step": 9363, "epoch": 78, "lr": 9.619270476528746e-05} +{"train_loss": 0.009621855802834034, "global_step": 9364, "epoch": 78, "lr": 9.619185674506781e-05} +{"train_loss": 0.006951966788619757, "global_step": 9365, "epoch": 78, "lr": 9.619100863415538e-05} +{"train_loss": 0.008550173602998257, "global_step": 9366, "epoch": 78, "lr": 9.619016043255185e-05} +{"train_loss": 0.008425100706517696, "global_step": 9367, "epoch": 78, "lr": 9.618931214025885e-05} +{"train_loss": 0.010848293080925941, "global_step": 9368, "epoch": 78, "lr": 9.61884637572781e-05} +{"train_loss": 0.008548829704523087, "global_step": 9369, "epoch": 78, "lr": 9.618761528361122e-05} +{"train_loss": 0.0075443945825099945, "global_step": 9370, "epoch": 78, "lr": 9.61867667192599e-05} +{"train_loss": 0.012592548504471779, "global_step": 9371, "epoch": 78, "lr": 9.618591806422578e-05} +{"train_loss": 0.010334981605410576, "global_step": 9372, "epoch": 78, "lr": 9.618506931851057e-05} +{"train_loss": 0.008129285648465157, "global_step": 9373, "epoch": 78, "lr": 9.618422048211591e-05} +{"train_loss": 0.01119818165898323, "global_step": 9374, "epoch": 78, "lr": 9.618337155504344e-05} +{"train_loss": 0.006432777736335993, "global_step": 9375, "epoch": 78, "lr": 9.618252253729487e-05} +{"train_loss": 0.005561656318604946, "global_step": 9376, "epoch": 78, "lr": 9.618167342887185e-05} +{"train_loss": 0.008412527851760387, "global_step": 9377, "epoch": 78, "lr": 9.618082422977604e-05} +{"train_loss": 0.011817208491265774, "global_step": 9378, "epoch": 78, "lr": 9.617997494000914e-05} +{"train_loss": 0.01047432515770197, "global_step": 9379, "epoch": 78, "lr": 9.617912555957276e-05} +{"train_loss": 0.009545463137328625, "global_step": 9380, "epoch": 78, "lr": 9.617827608846862e-05} +{"train_loss": 0.01172805204987526, "global_step": 9381, "epoch": 78, "lr": 9.617742652669837e-05} +{"train_loss": 0.011023017577826977, "global_step": 9382, "epoch": 78, "lr": 9.617657687426367e-05} +{"train_loss": 0.008656536228954792, "global_step": 9383, "epoch": 78, "lr": 9.61757271311662e-05} +{"train_loss": 0.011397999711334705, "global_step": 9384, "epoch": 78, "lr": 9.617487729740762e-05} +{"train_loss": 0.007548481225967407, "global_step": 9385, "epoch": 78, "lr": 9.61740273729896e-05} +{"train_loss": 0.008020385168492794, "global_step": 9386, "epoch": 78, "lr": 9.61731773579138e-05} +{"train_loss": 0.00886592548340559, "global_step": 9387, "epoch": 78, "lr": 9.617232725218191e-05} +{"train_loss": 0.00907126720994711, "global_step": 9388, "epoch": 78, "lr": 9.61714770557956e-05} +{"train_loss": 0.008345445618033409, "global_step": 9389, "epoch": 78, "lr": 9.61706267687565e-05} +{"train_loss": 0.008892321959137917, "global_step": 9390, "epoch": 78, "lr": 9.616977639106633e-05} +{"train_loss": 0.008059604093432426, "global_step": 9391, "epoch": 78, "lr": 9.616892592272672e-05} +{"train_loss": 0.008288407698273659, "global_step": 9392, "epoch": 78, "lr": 9.616807536373937e-05} +{"train_loss": 0.008158257231116295, "global_step": 9393, "epoch": 78, "lr": 9.616722471410593e-05} +{"train_loss": 0.015219936147332191, "global_step": 9394, "epoch": 78, "lr": 9.616637397382807e-05} +{"train_loss": 0.009746398776769638, "global_step": 9395, "epoch": 78, "lr": 9.616552314290748e-05} +{"train_loss": 0.013009446673095226, "global_step": 9396, "epoch": 78, "lr": 9.61646722213458e-05} +{"train_loss": 0.009632262401282787, "global_step": 9397, "epoch": 78, "lr": 9.616382120914473e-05} +{"train_loss": 0.009795529767870903, "global_step": 9398, "epoch": 78, "lr": 9.616297010630593e-05} +{"train_loss": 0.009850806556642056, "global_step": 9399, "epoch": 78, "lr": 9.616211891283108e-05} +{"train_loss": 0.009513733583745085, "global_step": 9400, "epoch": 78, "lr": 9.616126762872183e-05, "val_loss": 0.013250992633402348} +{"train_loss": 0.012185939587652683, "global_step": 9401, "epoch": 79, "lr": 9.616041625397987e-05} +{"train_loss": 0.014245559461414814, "global_step": 9402, "epoch": 79, "lr": 9.615956478860685e-05} +{"train_loss": 0.01190250739455223, "global_step": 9403, "epoch": 79, "lr": 9.615871323260446e-05} +{"train_loss": 0.01303925085812807, "global_step": 9404, "epoch": 79, "lr": 9.615786158597437e-05} +{"train_loss": 0.012676808051764965, "global_step": 9405, "epoch": 79, "lr": 9.615700984871824e-05} +{"train_loss": 0.0071038296446204185, "global_step": 9406, "epoch": 79, "lr": 9.615615802083777e-05} +{"train_loss": 0.013438213616609573, "global_step": 9407, "epoch": 79, "lr": 9.61553061023346e-05} +{"train_loss": 0.010783151723444462, "global_step": 9408, "epoch": 79, "lr": 9.615445409321045e-05} +{"train_loss": 0.011948798783123493, "global_step": 9409, "epoch": 79, "lr": 9.615360199346693e-05} +{"train_loss": 0.01020940113812685, "global_step": 9410, "epoch": 79, "lr": 9.615274980310574e-05} +{"train_loss": 0.012471044436097145, "global_step": 9411, "epoch": 79, "lr": 9.615189752212857e-05} +{"train_loss": 0.009399301372468472, "global_step": 9412, "epoch": 79, "lr": 9.615104515053707e-05} +{"train_loss": 0.0126624945551157, "global_step": 9413, "epoch": 79, "lr": 9.615019268833293e-05} +{"train_loss": 0.013803993351757526, "global_step": 9414, "epoch": 79, "lr": 9.614934013551782e-05} +{"train_loss": 0.009091127663850784, "global_step": 9415, "epoch": 79, "lr": 9.614848749209339e-05} +{"train_loss": 0.012745103798806667, "global_step": 9416, "epoch": 79, "lr": 9.614763475806137e-05} +{"train_loss": 0.012026181444525719, "global_step": 9417, "epoch": 79, "lr": 9.614678193342336e-05} +{"train_loss": 0.009720604866743088, "global_step": 9418, "epoch": 79, "lr": 9.614592901818112e-05} +{"train_loss": 0.014037267304956913, "global_step": 9419, "epoch": 79, "lr": 9.614507601233625e-05} +{"train_loss": 0.015592013485729694, "global_step": 9420, "epoch": 79, "lr": 9.614422291589045e-05} +{"train_loss": 0.011935083195567131, "global_step": 9421, "epoch": 79, "lr": 9.61433697288454e-05} +{"train_loss": 0.010559664107859135, "global_step": 9422, "epoch": 79, "lr": 9.614251645120278e-05} +{"train_loss": 0.008312579244375229, "global_step": 9423, "epoch": 79, "lr": 9.614166308296425e-05} +{"train_loss": 0.01152284536510706, "global_step": 9424, "epoch": 79, "lr": 9.61408096241315e-05} +{"train_loss": 0.009506828151643276, "global_step": 9425, "epoch": 79, "lr": 9.61399560747062e-05} +{"train_loss": 0.010012338869273663, "global_step": 9426, "epoch": 79, "lr": 9.613910243469003e-05} +{"train_loss": 0.017241772264242172, "global_step": 9427, "epoch": 79, "lr": 9.613824870408465e-05} +{"train_loss": 0.009597793221473694, "global_step": 9428, "epoch": 79, "lr": 9.613739488289176e-05} +{"train_loss": 0.01215240079909563, "global_step": 9429, "epoch": 79, "lr": 9.613654097111301e-05} +{"train_loss": 0.008169461041688919, "global_step": 9430, "epoch": 79, "lr": 9.61356869687501e-05} +{"train_loss": 0.013267994858324528, "global_step": 9431, "epoch": 79, "lr": 9.61348328758047e-05} +{"train_loss": 0.009817409329116344, "global_step": 9432, "epoch": 79, "lr": 9.613397869227849e-05} +{"train_loss": 0.01315899658948183, "global_step": 9433, "epoch": 79, "lr": 9.613312441817312e-05} +{"train_loss": 0.014736928977072239, "global_step": 9434, "epoch": 79, "lr": 9.61322700534903e-05} +{"train_loss": 0.00859084539115429, "global_step": 9435, "epoch": 79, "lr": 9.613141559823171e-05} +{"train_loss": 0.008406881242990494, "global_step": 9436, "epoch": 79, "lr": 9.6130561052399e-05} +{"train_loss": 0.013638947159051895, "global_step": 9437, "epoch": 79, "lr": 9.612970641599386e-05} +{"train_loss": 0.016193615272641182, "global_step": 9438, "epoch": 79, "lr": 9.612885168901797e-05} +{"train_loss": 0.008723333477973938, "global_step": 9439, "epoch": 79, "lr": 9.612799687147302e-05} +{"train_loss": 0.012616054154932499, "global_step": 9440, "epoch": 79, "lr": 9.612714196336067e-05} +{"train_loss": 0.011644302867352962, "global_step": 9441, "epoch": 79, "lr": 9.61262869646826e-05} +{"train_loss": 0.011522428132593632, "global_step": 9442, "epoch": 79, "lr": 9.61254318754405e-05} +{"train_loss": 0.01001304853707552, "global_step": 9443, "epoch": 79, "lr": 9.612457669563603e-05} +{"train_loss": 0.01164263766258955, "global_step": 9444, "epoch": 79, "lr": 9.612372142527088e-05} +{"train_loss": 0.009160305373370647, "global_step": 9445, "epoch": 79, "lr": 9.612286606434676e-05} +{"train_loss": 0.01173719484359026, "global_step": 9446, "epoch": 79, "lr": 9.61220106128653e-05} +{"train_loss": 0.009770608507096767, "global_step": 9447, "epoch": 79, "lr": 9.612115507082819e-05} +{"train_loss": 0.012012726627290249, "global_step": 9448, "epoch": 79, "lr": 9.612029943823713e-05} +{"train_loss": 0.010335519909858704, "global_step": 9449, "epoch": 79, "lr": 9.611944371509378e-05} +{"train_loss": 0.013726094737648964, "global_step": 9450, "epoch": 79, "lr": 9.611858790139985e-05} +{"train_loss": 0.008951153606176376, "global_step": 9451, "epoch": 79, "lr": 9.6117731997157e-05} +{"train_loss": 0.016085725277662277, "global_step": 9452, "epoch": 79, "lr": 9.611687600236688e-05} +{"train_loss": 0.009087017737329006, "global_step": 9453, "epoch": 79, "lr": 9.611601991703121e-05} +{"train_loss": 0.010731427930295467, "global_step": 9454, "epoch": 79, "lr": 9.611516374115168e-05} +{"train_loss": 0.010224414989352226, "global_step": 9455, "epoch": 79, "lr": 9.611430747472993e-05} +{"train_loss": 0.012489528395235538, "global_step": 9456, "epoch": 79, "lr": 9.611345111776769e-05} +{"train_loss": 0.01146530918776989, "global_step": 9457, "epoch": 79, "lr": 9.611259467026659e-05} +{"train_loss": 0.012597991153597832, "global_step": 9458, "epoch": 79, "lr": 9.611173813222836e-05} +{"train_loss": 0.012121916748583317, "global_step": 9459, "epoch": 79, "lr": 9.611088150365464e-05} +{"train_loss": 0.009590381756424904, "global_step": 9460, "epoch": 79, "lr": 9.611002478454714e-05} +{"train_loss": 0.012830372899770737, "global_step": 9461, "epoch": 79, "lr": 9.610916797490753e-05} +{"train_loss": 0.009399567730724812, "global_step": 9462, "epoch": 79, "lr": 9.61083110747375e-05} +{"train_loss": 0.013032599352300167, "global_step": 9463, "epoch": 79, "lr": 9.610745408403871e-05} +{"train_loss": 0.009282640181481838, "global_step": 9464, "epoch": 79, "lr": 9.610659700281289e-05} +{"train_loss": 0.009991569444537163, "global_step": 9465, "epoch": 79, "lr": 9.610573983106166e-05} +{"train_loss": 0.00942408200353384, "global_step": 9466, "epoch": 79, "lr": 9.610488256878674e-05} +{"train_loss": 0.008555098436772823, "global_step": 9467, "epoch": 79, "lr": 9.610402521598982e-05} +{"train_loss": 0.011830711737275124, "global_step": 9468, "epoch": 79, "lr": 9.610316777267257e-05} +{"train_loss": 0.0072905984707176685, "global_step": 9469, "epoch": 79, "lr": 9.610231023883668e-05} +{"train_loss": 0.010690064169466496, "global_step": 9470, "epoch": 79, "lr": 9.610145261448382e-05} +{"train_loss": 0.008875931613147259, "global_step": 9471, "epoch": 79, "lr": 9.61005948996157e-05} +{"train_loss": 0.014859129674732685, "global_step": 9472, "epoch": 79, "lr": 9.609973709423397e-05} +{"train_loss": 0.008256315253674984, "global_step": 9473, "epoch": 79, "lr": 9.609887919834033e-05} +{"train_loss": 0.009137166664004326, "global_step": 9474, "epoch": 79, "lr": 9.609802121193648e-05} +{"train_loss": 0.01215082872658968, "global_step": 9475, "epoch": 79, "lr": 9.609716313502408e-05} +{"train_loss": 0.00987002719193697, "global_step": 9476, "epoch": 79, "lr": 9.609630496760482e-05} +{"train_loss": 0.012847156263887882, "global_step": 9477, "epoch": 79, "lr": 9.60954467096804e-05} +{"train_loss": 0.012479592114686966, "global_step": 9478, "epoch": 79, "lr": 9.609458836125249e-05} +{"train_loss": 0.012836139649152756, "global_step": 9479, "epoch": 79, "lr": 9.609372992232278e-05} +{"train_loss": 0.011386191472411156, "global_step": 9480, "epoch": 79, "lr": 9.609287139289296e-05} +{"train_loss": 0.010723208077251911, "global_step": 9481, "epoch": 79, "lr": 9.609201277296471e-05} +{"train_loss": 0.008241075091063976, "global_step": 9482, "epoch": 79, "lr": 9.609115406253972e-05} +{"train_loss": 0.010261248797178268, "global_step": 9483, "epoch": 79, "lr": 9.609029526161966e-05} +{"train_loss": 0.009957273490726948, "global_step": 9484, "epoch": 79, "lr": 9.608943637020624e-05} +{"train_loss": 0.009793201461434364, "global_step": 9485, "epoch": 79, "lr": 9.608857738830113e-05} +{"train_loss": 0.01278176810592413, "global_step": 9486, "epoch": 79, "lr": 9.608771831590604e-05} +{"train_loss": 0.006316551472991705, "global_step": 9487, "epoch": 79, "lr": 9.608685915302263e-05} +{"train_loss": 0.010040460154414177, "global_step": 9488, "epoch": 79, "lr": 9.608599989965256e-05} +{"train_loss": 0.011222935281693935, "global_step": 9489, "epoch": 79, "lr": 9.60851405557976e-05} +{"train_loss": 0.010012457147240639, "global_step": 9490, "epoch": 79, "lr": 9.608428112145937e-05} +{"train_loss": 0.009294223040342331, "global_step": 9491, "epoch": 79, "lr": 9.608342159663959e-05} +{"train_loss": 0.009540682658553123, "global_step": 9492, "epoch": 79, "lr": 9.608256198133991e-05} +{"train_loss": 0.004946093540638685, "global_step": 9493, "epoch": 79, "lr": 9.608170227556208e-05} +{"train_loss": 0.015118559822440147, "global_step": 9494, "epoch": 79, "lr": 9.608084247930771e-05} +{"train_loss": 0.007307151798158884, "global_step": 9495, "epoch": 79, "lr": 9.607998259257855e-05} +{"train_loss": 0.012822975404560566, "global_step": 9496, "epoch": 79, "lr": 9.607912261537627e-05} +{"train_loss": 0.009618948213756084, "global_step": 9497, "epoch": 79, "lr": 9.607826254770254e-05} +{"train_loss": 0.015745339915156364, "global_step": 9498, "epoch": 79, "lr": 9.607740238955909e-05} +{"train_loss": 0.011206748895347118, "global_step": 9499, "epoch": 79, "lr": 9.607654214094757e-05} +{"train_loss": 0.01037229411303997, "global_step": 9500, "epoch": 79, "lr": 9.607568180186967e-05} +{"train_loss": 0.00857974961400032, "global_step": 9501, "epoch": 79, "lr": 9.60748213723271e-05} +{"train_loss": 0.013330434449017048, "global_step": 9502, "epoch": 79, "lr": 9.607396085232155e-05} +{"train_loss": 0.009162046015262604, "global_step": 9503, "epoch": 79, "lr": 9.607310024185468e-05} +{"train_loss": 0.010118802078068256, "global_step": 9504, "epoch": 79, "lr": 9.607223954092821e-05} +{"train_loss": 0.012154164724051952, "global_step": 9505, "epoch": 79, "lr": 9.607137874954382e-05} +{"train_loss": 0.008715523406863213, "global_step": 9506, "epoch": 79, "lr": 9.607051786770321e-05} +{"train_loss": 0.01065539475530386, "global_step": 9507, "epoch": 79, "lr": 9.606965689540806e-05} +{"train_loss": 0.010607532225549221, "global_step": 9508, "epoch": 79, "lr": 9.606879583266004e-05} +{"train_loss": 0.009493311867117882, "global_step": 9509, "epoch": 79, "lr": 9.606793467946086e-05} +{"train_loss": 0.005042861681431532, "global_step": 9510, "epoch": 79, "lr": 9.606707343581224e-05} +{"train_loss": 0.009959278628230095, "global_step": 9511, "epoch": 79, "lr": 9.606621210171583e-05} +{"train_loss": 0.011954186484217644, "global_step": 9512, "epoch": 79, "lr": 9.606535067717333e-05} +{"train_loss": 0.007784757763147354, "global_step": 9513, "epoch": 79, "lr": 9.606448916218644e-05} +{"train_loss": 0.01010057982057333, "global_step": 9514, "epoch": 79, "lr": 9.606362755675684e-05} +{"train_loss": 0.006719001103192568, "global_step": 9515, "epoch": 79, "lr": 9.606276586088623e-05} +{"train_loss": 0.014978939667344093, "global_step": 9516, "epoch": 79, "lr": 9.60619040745763e-05} +{"train_loss": 0.007825740613043308, "global_step": 9517, "epoch": 79, "lr": 9.606104219782874e-05} +{"train_loss": 0.007856212556362152, "global_step": 9518, "epoch": 79, "lr": 9.606018023064525e-05} +{"train_loss": 0.010902953271542778, "global_step": 9519, "epoch": 79, "lr": 9.605931817302753e-05, "val_loss": 0.01833386719226837} +{"train_loss": 0.007218444719910622, "global_step": 9520, "epoch": 80, "lr": 9.605845602497725e-05} +{"train_loss": 0.012480375356972218, "global_step": 9521, "epoch": 80, "lr": 9.60575937864961e-05} +{"train_loss": 0.012040356174111366, "global_step": 9522, "epoch": 80, "lr": 9.605673145758579e-05} +{"train_loss": 0.00898466445505619, "global_step": 9523, "epoch": 80, "lr": 9.605586903824801e-05} +{"train_loss": 0.009052787907421589, "global_step": 9524, "epoch": 80, "lr": 9.605500652848446e-05} +{"train_loss": 0.009336044080555439, "global_step": 9525, "epoch": 80, "lr": 9.605414392829681e-05} +{"train_loss": 0.0070524662733078, "global_step": 9526, "epoch": 80, "lr": 9.605328123768678e-05} +{"train_loss": 0.010992024093866348, "global_step": 9527, "epoch": 80, "lr": 9.605241845665604e-05} +{"train_loss": 0.013756789267063141, "global_step": 9528, "epoch": 80, "lr": 9.60515555852063e-05} +{"train_loss": 0.009731008671224117, "global_step": 9529, "epoch": 80, "lr": 9.605069262333927e-05} +{"train_loss": 0.008244074881076813, "global_step": 9530, "epoch": 80, "lr": 9.604982957105661e-05} +{"train_loss": 0.011673024855554104, "global_step": 9531, "epoch": 80, "lr": 9.604896642836003e-05} +{"train_loss": 0.009932714514434338, "global_step": 9532, "epoch": 80, "lr": 9.604810319525123e-05} +{"train_loss": 0.008967244997620583, "global_step": 9533, "epoch": 80, "lr": 9.604723987173189e-05} +{"train_loss": 0.009511321783065796, "global_step": 9534, "epoch": 80, "lr": 9.604637645780373e-05} +{"train_loss": 0.012017262168228626, "global_step": 9535, "epoch": 80, "lr": 9.60455129534684e-05} +{"train_loss": 0.00826459564268589, "global_step": 9536, "epoch": 80, "lr": 9.604464935872763e-05} +{"train_loss": 0.0070063453167676926, "global_step": 9537, "epoch": 80, "lr": 9.604378567358313e-05} +{"train_loss": 0.006083435378968716, "global_step": 9538, "epoch": 80, "lr": 9.604292189803656e-05} +{"train_loss": 0.011517227627336979, "global_step": 9539, "epoch": 80, "lr": 9.604205803208966e-05} +{"train_loss": 0.00834276620298624, "global_step": 9540, "epoch": 80, "lr": 9.604119407574405e-05} +{"train_loss": 0.008921952918171883, "global_step": 9541, "epoch": 80, "lr": 9.604033002900152e-05} +{"train_loss": 0.013084398582577705, "global_step": 9542, "epoch": 80, "lr": 9.60394658918637e-05} +{"train_loss": 0.0075063505209982395, "global_step": 9543, "epoch": 80, "lr": 9.603860166433229e-05} +{"train_loss": 0.008946418762207031, "global_step": 9544, "epoch": 80, "lr": 9.603773734640904e-05} +{"train_loss": 0.009128621779382229, "global_step": 9545, "epoch": 80, "lr": 9.603687293809559e-05} +{"train_loss": 0.008923130109906197, "global_step": 9546, "epoch": 80, "lr": 9.603600843939366e-05} +{"train_loss": 0.015266425907611847, "global_step": 9547, "epoch": 80, "lr": 9.603514385030494e-05} +{"train_loss": 0.010524390265345573, "global_step": 9548, "epoch": 80, "lr": 9.603427917083114e-05} +{"train_loss": 0.011564305052161217, "global_step": 9549, "epoch": 80, "lr": 9.603341440097395e-05} +{"train_loss": 0.007070540450513363, "global_step": 9550, "epoch": 80, "lr": 9.603254954073508e-05} +{"train_loss": 0.012373875826597214, "global_step": 9551, "epoch": 80, "lr": 9.60316845901162e-05} +{"train_loss": 0.008196263574063778, "global_step": 9552, "epoch": 80, "lr": 9.603081954911904e-05} +{"train_loss": 0.00822401512414217, "global_step": 9553, "epoch": 80, "lr": 9.602995441774527e-05} +{"train_loss": 0.006573328282684088, "global_step": 9554, "epoch": 80, "lr": 9.602908919599662e-05} +{"train_loss": 0.01190402265638113, "global_step": 9555, "epoch": 80, "lr": 9.602822388387476e-05} +{"train_loss": 0.006855024490505457, "global_step": 9556, "epoch": 80, "lr": 9.602735848138139e-05} +{"train_loss": 0.008082525804638863, "global_step": 9557, "epoch": 80, "lr": 9.602649298851822e-05} +{"train_loss": 0.008394036442041397, "global_step": 9558, "epoch": 80, "lr": 9.602562740528696e-05} +{"train_loss": 0.0076492419466376305, "global_step": 9559, "epoch": 80, "lr": 9.60247617316893e-05} +{"train_loss": 0.010354051366448402, "global_step": 9560, "epoch": 80, "lr": 9.602389596772692e-05} +{"train_loss": 0.009521177969872952, "global_step": 9561, "epoch": 80, "lr": 9.602303011340154e-05} +{"train_loss": 0.008274780586361885, "global_step": 9562, "epoch": 80, "lr": 9.602216416871487e-05} +{"train_loss": 0.00875774584710598, "global_step": 9563, "epoch": 80, "lr": 9.60212981336686e-05} +{"train_loss": 0.012342783622443676, "global_step": 9564, "epoch": 80, "lr": 9.602043200826443e-05} +{"train_loss": 0.007838696241378784, "global_step": 9565, "epoch": 80, "lr": 9.601956579250404e-05} +{"train_loss": 0.010848160833120346, "global_step": 9566, "epoch": 80, "lr": 9.601869948638915e-05} +{"train_loss": 0.007993075996637344, "global_step": 9567, "epoch": 80, "lr": 9.601783308992147e-05} +{"train_loss": 0.008779800496995449, "global_step": 9568, "epoch": 80, "lr": 9.601696660310269e-05} +{"train_loss": 0.010031028650701046, "global_step": 9569, "epoch": 80, "lr": 9.601610002593451e-05} +{"train_loss": 0.011118502356112003, "global_step": 9570, "epoch": 80, "lr": 9.601523335841864e-05} +{"train_loss": 0.008210104890167713, "global_step": 9571, "epoch": 80, "lr": 9.601436660055676e-05} +{"train_loss": 0.009286555461585522, "global_step": 9572, "epoch": 80, "lr": 9.601349975235062e-05} +{"train_loss": 0.012293512932956219, "global_step": 9573, "epoch": 80, "lr": 9.601263281380185e-05} +{"train_loss": 0.010528421960771084, "global_step": 9574, "epoch": 80, "lr": 9.60117657849122e-05} +{"train_loss": 0.009638181887567043, "global_step": 9575, "epoch": 80, "lr": 9.601089866568338e-05} +{"train_loss": 0.010204573161900043, "global_step": 9576, "epoch": 80, "lr": 9.601003145611707e-05} +{"train_loss": 0.014808794483542442, "global_step": 9577, "epoch": 80, "lr": 9.600916415621497e-05} +{"train_loss": 0.010349220596253872, "global_step": 9578, "epoch": 80, "lr": 9.60082967659788e-05} +{"train_loss": 0.011412105523049831, "global_step": 9579, "epoch": 80, "lr": 9.600742928541024e-05} +{"train_loss": 0.009675472974777222, "global_step": 9580, "epoch": 80, "lr": 9.600656171451103e-05} +{"train_loss": 0.008691822178661823, "global_step": 9581, "epoch": 80, "lr": 9.600569405328284e-05} +{"train_loss": 0.007088853046298027, "global_step": 9582, "epoch": 80, "lr": 9.600482630172738e-05} +{"train_loss": 0.007116979919373989, "global_step": 9583, "epoch": 80, "lr": 9.600395845984637e-05} +{"train_loss": 0.009374827146530151, "global_step": 9584, "epoch": 80, "lr": 9.600309052764149e-05} +{"train_loss": 0.014817413873970509, "global_step": 9585, "epoch": 80, "lr": 9.600222250511446e-05} +{"train_loss": 0.008963825181126595, "global_step": 9586, "epoch": 80, "lr": 9.600135439226699e-05} +{"train_loss": 0.010834804736077785, "global_step": 9587, "epoch": 80, "lr": 9.600048618910075e-05} +{"train_loss": 0.007667570374906063, "global_step": 9588, "epoch": 80, "lr": 9.59996178956175e-05} +{"train_loss": 0.01190200075507164, "global_step": 9589, "epoch": 80, "lr": 9.599874951181891e-05} +{"train_loss": 0.01008552685379982, "global_step": 9590, "epoch": 80, "lr": 9.599788103770668e-05} +{"train_loss": 0.005175404250621796, "global_step": 9591, "epoch": 80, "lr": 9.599701247328252e-05} +{"train_loss": 0.010642501525580883, "global_step": 9592, "epoch": 80, "lr": 9.599614381854816e-05} +{"train_loss": 0.012038475833833218, "global_step": 9593, "epoch": 80, "lr": 9.599527507350527e-05} +{"train_loss": 0.012940720655024052, "global_step": 9594, "epoch": 80, "lr": 9.599440623815557e-05} +{"train_loss": 0.009117616340517998, "global_step": 9595, "epoch": 80, "lr": 9.599353731250077e-05} +{"train_loss": 0.011177251115441322, "global_step": 9596, "epoch": 80, "lr": 9.599266829654256e-05} +{"train_loss": 0.007364796474575996, "global_step": 9597, "epoch": 80, "lr": 9.599179919028269e-05} +{"train_loss": 0.008409841917455196, "global_step": 9598, "epoch": 80, "lr": 9.599092999372281e-05} +{"train_loss": 0.010676799342036247, "global_step": 9599, "epoch": 80, "lr": 9.599006070686467e-05} +{"train_loss": 0.00908732134848833, "global_step": 9600, "epoch": 80, "lr": 9.598919132970995e-05} +{"train_loss": 0.011983765289187431, "global_step": 9601, "epoch": 80, "lr": 9.598832186226037e-05} +{"train_loss": 0.0063479626551270485, "global_step": 9602, "epoch": 80, "lr": 9.598745230451763e-05} +{"train_loss": 0.007862302474677563, "global_step": 9603, "epoch": 80, "lr": 9.598658265648343e-05} +{"train_loss": 0.011388363316655159, "global_step": 9604, "epoch": 80, "lr": 9.59857129181595e-05} +{"train_loss": 0.014167698100209236, "global_step": 9605, "epoch": 80, "lr": 9.598484308954754e-05} +{"train_loss": 0.009604573249816895, "global_step": 9606, "epoch": 80, "lr": 9.598397317064924e-05} +{"train_loss": 0.010560010559856892, "global_step": 9607, "epoch": 80, "lr": 9.598310316146633e-05} +{"train_loss": 0.006336026359349489, "global_step": 9608, "epoch": 80, "lr": 9.598223306200052e-05} +{"train_loss": 0.012887684628367424, "global_step": 9609, "epoch": 80, "lr": 9.598136287225349e-05} +{"train_loss": 0.01031993143260479, "global_step": 9610, "epoch": 80, "lr": 9.598049259222696e-05} +{"train_loss": 0.01083529181778431, "global_step": 9611, "epoch": 80, "lr": 9.597962222192268e-05} +{"train_loss": 0.00891247671097517, "global_step": 9612, "epoch": 80, "lr": 9.597875176134229e-05} +{"train_loss": 0.010684843175113201, "global_step": 9613, "epoch": 80, "lr": 9.597788121048755e-05} +{"train_loss": 0.010758614167571068, "global_step": 9614, "epoch": 80, "lr": 9.597701056936013e-05} +{"train_loss": 0.01025074440985918, "global_step": 9615, "epoch": 80, "lr": 9.597613983796178e-05} +{"train_loss": 0.007887148298323154, "global_step": 9616, "epoch": 80, "lr": 9.597526901629419e-05} +{"train_loss": 0.012947061099112034, "global_step": 9617, "epoch": 80, "lr": 9.597439810435908e-05} +{"train_loss": 0.009737836197018623, "global_step": 9618, "epoch": 80, "lr": 9.597352710215814e-05} +{"train_loss": 0.009800995700061321, "global_step": 9619, "epoch": 80, "lr": 9.59726560096931e-05} +{"train_loss": 0.012139583937823772, "global_step": 9620, "epoch": 80, "lr": 9.597178482696564e-05} +{"train_loss": 0.008748229593038559, "global_step": 9621, "epoch": 80, "lr": 9.597091355397752e-05} +{"train_loss": 0.013966311700642109, "global_step": 9622, "epoch": 80, "lr": 9.59700421907304e-05} +{"train_loss": 0.008287344127893448, "global_step": 9623, "epoch": 80, "lr": 9.596917073722602e-05} +{"train_loss": 0.008798581548035145, "global_step": 9624, "epoch": 80, "lr": 9.596829919346608e-05} +{"train_loss": 0.007398855872452259, "global_step": 9625, "epoch": 80, "lr": 9.59674275594523e-05} +{"train_loss": 0.009196851402521133, "global_step": 9626, "epoch": 80, "lr": 9.596655583518639e-05} +{"train_loss": 0.015236240811645985, "global_step": 9627, "epoch": 80, "lr": 9.596568402067007e-05} +{"train_loss": 0.0070066992193460464, "global_step": 9628, "epoch": 80, "lr": 9.596481211590502e-05} +{"train_loss": 0.009913158603012562, "global_step": 9629, "epoch": 80, "lr": 9.596394012089297e-05} +{"train_loss": 0.009992874227464199, "global_step": 9630, "epoch": 80, "lr": 9.596306803563565e-05} +{"train_loss": 0.011049922555685043, "global_step": 9631, "epoch": 80, "lr": 9.596219586013475e-05} +{"train_loss": 0.012243554927408695, "global_step": 9632, "epoch": 80, "lr": 9.596132359439199e-05} +{"train_loss": 0.00836996641010046, "global_step": 9633, "epoch": 80, "lr": 9.596045123840907e-05} +{"train_loss": 0.011233319528400898, "global_step": 9634, "epoch": 80, "lr": 9.595957879218773e-05} +{"train_loss": 0.008972627110779285, "global_step": 9635, "epoch": 80, "lr": 9.595870625572967e-05} +{"train_loss": 0.009124581702053547, "global_step": 9636, "epoch": 80, "lr": 9.595783362903659e-05} +{"train_loss": 0.010874600149691105, "global_step": 9637, "epoch": 80, "lr": 9.595696091211022e-05} +{"train_loss": 0.009861212364640557, "global_step": 9638, "epoch": 80, "lr": 9.595608810495225e-05, "val_loss": 0.02084166929125786, "train_action_mse_error": 0.0003131883859168738} +{"train_loss": 0.012445148080587387, "global_step": 9639, "epoch": 81, "lr": 9.595521520756443e-05} +{"train_loss": 0.011965782381594181, "global_step": 9640, "epoch": 81, "lr": 9.595434221994843e-05} +{"train_loss": 0.008060541935265064, "global_step": 9641, "epoch": 81, "lr": 9.595346914210602e-05} +{"train_loss": 0.008969644084572792, "global_step": 9642, "epoch": 81, "lr": 9.595259597403886e-05} +{"train_loss": 0.012416582554578781, "global_step": 9643, "epoch": 81, "lr": 9.59517227157487e-05} +{"train_loss": 0.008842000737786293, "global_step": 9644, "epoch": 81, "lr": 9.595084936723724e-05} +{"train_loss": 0.010966336354613304, "global_step": 9645, "epoch": 81, "lr": 9.594997592850618e-05} +{"train_loss": 0.008333700709044933, "global_step": 9646, "epoch": 81, "lr": 9.594910239955728e-05} +{"train_loss": 0.013472246937453747, "global_step": 9647, "epoch": 81, "lr": 9.59482287803922e-05} +{"train_loss": 0.007242273539304733, "global_step": 9648, "epoch": 81, "lr": 9.59473550710127e-05} +{"train_loss": 0.00914799328893423, "global_step": 9649, "epoch": 81, "lr": 9.594648127142047e-05} +{"train_loss": 0.009541776031255722, "global_step": 9650, "epoch": 81, "lr": 9.594560738161721e-05} +{"train_loss": 0.012090069241821766, "global_step": 9651, "epoch": 81, "lr": 9.594473340160471e-05} +{"train_loss": 0.010127576999366283, "global_step": 9652, "epoch": 81, "lr": 9.594385933138459e-05} +{"train_loss": 0.010699283331632614, "global_step": 9653, "epoch": 81, "lr": 9.594298517095863e-05} +{"train_loss": 0.012921897694468498, "global_step": 9654, "epoch": 81, "lr": 9.594211092032852e-05} +{"train_loss": 0.008626919239759445, "global_step": 9655, "epoch": 81, "lr": 9.594123657949598e-05} +{"train_loss": 0.009555133990943432, "global_step": 9656, "epoch": 81, "lr": 9.594036214846275e-05} +{"train_loss": 0.018071619793772697, "global_step": 9657, "epoch": 81, "lr": 9.593948762723051e-05} +{"train_loss": 0.014109119772911072, "global_step": 9658, "epoch": 81, "lr": 9.593861301580099e-05} +{"train_loss": 0.010607775300741196, "global_step": 9659, "epoch": 81, "lr": 9.593773831417592e-05} +{"train_loss": 0.008887013420462608, "global_step": 9660, "epoch": 81, "lr": 9.593686352235701e-05} +{"train_loss": 0.009229485876858234, "global_step": 9661, "epoch": 81, "lr": 9.593598864034598e-05} +{"train_loss": 0.008989457972347736, "global_step": 9662, "epoch": 81, "lr": 9.593511366814453e-05} +{"train_loss": 0.010878313332796097, "global_step": 9663, "epoch": 81, "lr": 9.593423860575438e-05} +{"train_loss": 0.014400888234376907, "global_step": 9664, "epoch": 81, "lr": 9.59333634531773e-05} +{"train_loss": 0.008102166466414928, "global_step": 9665, "epoch": 81, "lr": 9.593248821041494e-05} +{"train_loss": 0.015940696001052856, "global_step": 9666, "epoch": 81, "lr": 9.593161287746906e-05} +{"train_loss": 0.008969616144895554, "global_step": 9667, "epoch": 81, "lr": 9.593073745434135e-05} +{"train_loss": 0.015441404655575752, "global_step": 9668, "epoch": 81, "lr": 9.592986194103354e-05} +{"train_loss": 0.010090593248605728, "global_step": 9669, "epoch": 81, "lr": 9.592898633754738e-05} +{"train_loss": 0.012430139817297459, "global_step": 9670, "epoch": 81, "lr": 9.592811064388455e-05} +{"train_loss": 0.009030429646372795, "global_step": 9671, "epoch": 81, "lr": 9.592723486004678e-05} +{"train_loss": 0.013043788261711597, "global_step": 9672, "epoch": 81, "lr": 9.592635898603579e-05} +{"train_loss": 0.01497908029705286, "global_step": 9673, "epoch": 81, "lr": 9.59254830218533e-05} +{"train_loss": 0.008191801607608795, "global_step": 9674, "epoch": 81, "lr": 9.592460696750103e-05} +{"train_loss": 0.010623674839735031, "global_step": 9675, "epoch": 81, "lr": 9.59237308229807e-05} +{"train_loss": 0.01154414750635624, "global_step": 9676, "epoch": 81, "lr": 9.592285458829403e-05} +{"train_loss": 0.01164951641112566, "global_step": 9677, "epoch": 81, "lr": 9.592197826344275e-05} +{"train_loss": 0.008583607152104378, "global_step": 9678, "epoch": 81, "lr": 9.592110184842855e-05} +{"train_loss": 0.011263752356171608, "global_step": 9679, "epoch": 81, "lr": 9.59202253432532e-05} +{"train_loss": 0.015255862846970558, "global_step": 9680, "epoch": 81, "lr": 9.591934874791838e-05} +{"train_loss": 0.00803802814334631, "global_step": 9681, "epoch": 81, "lr": 9.591847206242582e-05} +{"train_loss": 0.007187879178673029, "global_step": 9682, "epoch": 81, "lr": 9.591759528677725e-05} +{"train_loss": 0.011744841001927853, "global_step": 9683, "epoch": 81, "lr": 9.59167184209744e-05} +{"train_loss": 0.008346560411155224, "global_step": 9684, "epoch": 81, "lr": 9.591584146501897e-05} +{"train_loss": 0.01202174462378025, "global_step": 9685, "epoch": 81, "lr": 9.591496441891268e-05} +{"train_loss": 0.008457652293145657, "global_step": 9686, "epoch": 81, "lr": 9.591408728265727e-05} +{"train_loss": 0.01086196769028902, "global_step": 9687, "epoch": 81, "lr": 9.591321005625446e-05} +{"train_loss": 0.012289894744753838, "global_step": 9688, "epoch": 81, "lr": 9.591233273970596e-05} +{"train_loss": 0.009212354198098183, "global_step": 9689, "epoch": 81, "lr": 9.59114553330135e-05} +{"train_loss": 0.010093748569488525, "global_step": 9690, "epoch": 81, "lr": 9.59105778361788e-05} +{"train_loss": 0.010913621634244919, "global_step": 9691, "epoch": 81, "lr": 9.59097002492036e-05} +{"train_loss": 0.011331219226121902, "global_step": 9692, "epoch": 81, "lr": 9.59088225720896e-05} +{"train_loss": 0.006763497833162546, "global_step": 9693, "epoch": 81, "lr": 9.590794480483852e-05} +{"train_loss": 0.015046224929392338, "global_step": 9694, "epoch": 81, "lr": 9.59070669474521e-05} +{"train_loss": 0.007613819558173418, "global_step": 9695, "epoch": 81, "lr": 9.590618899993206e-05} +{"train_loss": 0.007498761173337698, "global_step": 9696, "epoch": 81, "lr": 9.590531096228012e-05} +{"train_loss": 0.010733362287282944, "global_step": 9697, "epoch": 81, "lr": 9.590443283449803e-05} +{"train_loss": 0.012718490324914455, "global_step": 9698, "epoch": 81, "lr": 9.590355461658747e-05} +{"train_loss": 0.011944207362830639, "global_step": 9699, "epoch": 81, "lr": 9.590267630855018e-05} +{"train_loss": 0.006500551477074623, "global_step": 9700, "epoch": 81, "lr": 9.59017979103879e-05} +{"train_loss": 0.007662232965230942, "global_step": 9701, "epoch": 81, "lr": 9.590091942210234e-05} +{"train_loss": 0.006608310621231794, "global_step": 9702, "epoch": 81, "lr": 9.590004084369523e-05} +{"train_loss": 0.009299016557633877, "global_step": 9703, "epoch": 81, "lr": 9.589916217516827e-05} +{"train_loss": 0.014204745180904865, "global_step": 9704, "epoch": 81, "lr": 9.589828341652325e-05} +{"train_loss": 0.01308263000100851, "global_step": 9705, "epoch": 81, "lr": 9.589740456776183e-05} +{"train_loss": 0.011609761975705624, "global_step": 9706, "epoch": 81, "lr": 9.589652562888576e-05} +{"train_loss": 0.007381145842373371, "global_step": 9707, "epoch": 81, "lr": 9.589564659989677e-05} +{"train_loss": 0.01108689233660698, "global_step": 9708, "epoch": 81, "lr": 9.589476748079658e-05} +{"train_loss": 0.00904536247253418, "global_step": 9709, "epoch": 81, "lr": 9.589388827158691e-05} +{"train_loss": 0.011509268544614315, "global_step": 9710, "epoch": 81, "lr": 9.58930089722695e-05} +{"train_loss": 0.00877366028726101, "global_step": 9711, "epoch": 81, "lr": 9.589212958284608e-05} +{"train_loss": 0.008297109976410866, "global_step": 9712, "epoch": 81, "lr": 9.589125010331835e-05} +{"train_loss": 0.010046686045825481, "global_step": 9713, "epoch": 81, "lr": 9.589037053368806e-05} +{"train_loss": 0.00963097345083952, "global_step": 9714, "epoch": 81, "lr": 9.588949087395694e-05} +{"train_loss": 0.011064962483942509, "global_step": 9715, "epoch": 81, "lr": 9.588861112412669e-05} +{"train_loss": 0.010904223658144474, "global_step": 9716, "epoch": 81, "lr": 9.588773128419906e-05} +{"train_loss": 0.00904517900198698, "global_step": 9717, "epoch": 81, "lr": 9.588685135417578e-05} +{"train_loss": 0.011939769610762596, "global_step": 9718, "epoch": 81, "lr": 9.588597133405856e-05} +{"train_loss": 0.008217046037316322, "global_step": 9719, "epoch": 81, "lr": 9.588509122384915e-05} +{"train_loss": 0.010579178109765053, "global_step": 9720, "epoch": 81, "lr": 9.588421102354924e-05} +{"train_loss": 0.008816007524728775, "global_step": 9721, "epoch": 81, "lr": 9.58833307331606e-05} +{"train_loss": 0.008377354592084885, "global_step": 9722, "epoch": 81, "lr": 9.588245035268495e-05} +{"train_loss": 0.009608673863112926, "global_step": 9723, "epoch": 81, "lr": 9.5881569882124e-05} +{"train_loss": 0.006854879669845104, "global_step": 9724, "epoch": 81, "lr": 9.588068932147949e-05} +{"train_loss": 0.009823686443269253, "global_step": 9725, "epoch": 81, "lr": 9.587980867075314e-05} +{"train_loss": 0.011431943625211716, "global_step": 9726, "epoch": 81, "lr": 9.58789279299467e-05} +{"train_loss": 0.011517414823174477, "global_step": 9727, "epoch": 81, "lr": 9.58780470990619e-05} +{"train_loss": 0.012200047262012959, "global_step": 9728, "epoch": 81, "lr": 9.587716617810043e-05} +{"train_loss": 0.00826554000377655, "global_step": 9729, "epoch": 81, "lr": 9.587628516706406e-05} +{"train_loss": 0.00738801434636116, "global_step": 9730, "epoch": 81, "lr": 9.58754040659545e-05} +{"train_loss": 0.009304894134402275, "global_step": 9731, "epoch": 81, "lr": 9.587452287477348e-05} +{"train_loss": 0.009124553762376308, "global_step": 9732, "epoch": 81, "lr": 9.587364159352274e-05} +{"train_loss": 0.015185436233878136, "global_step": 9733, "epoch": 81, "lr": 9.587276022220402e-05} +{"train_loss": 0.009013738483190536, "global_step": 9734, "epoch": 81, "lr": 9.587187876081901e-05} +{"train_loss": 0.010168138891458511, "global_step": 9735, "epoch": 81, "lr": 9.587099720936947e-05} +{"train_loss": 0.013158591464161873, "global_step": 9736, "epoch": 81, "lr": 9.587011556785714e-05} +{"train_loss": 0.009408161044120789, "global_step": 9737, "epoch": 81, "lr": 9.586923383628375e-05} +{"train_loss": 0.012651899829506874, "global_step": 9738, "epoch": 81, "lr": 9.5868352014651e-05} +{"train_loss": 0.010129320435225964, "global_step": 9739, "epoch": 81, "lr": 9.586747010296064e-05} +{"train_loss": 0.009673014283180237, "global_step": 9740, "epoch": 81, "lr": 9.586658810121441e-05} +{"train_loss": 0.0071665700525045395, "global_step": 9741, "epoch": 81, "lr": 9.586570600941404e-05} +{"train_loss": 0.011043207719922066, "global_step": 9742, "epoch": 81, "lr": 9.586482382756124e-05} +{"train_loss": 0.007446862757205963, "global_step": 9743, "epoch": 81, "lr": 9.586394155565777e-05} +{"train_loss": 0.009587448090314865, "global_step": 9744, "epoch": 81, "lr": 9.586305919370536e-05} +{"train_loss": 0.012154358439147472, "global_step": 9745, "epoch": 81, "lr": 9.586217674170571e-05} +{"train_loss": 0.007462071720510721, "global_step": 9746, "epoch": 81, "lr": 9.586129419966059e-05} +{"train_loss": 0.008336115628480911, "global_step": 9747, "epoch": 81, "lr": 9.586041156757171e-05} +{"train_loss": 0.013535819947719574, "global_step": 9748, "epoch": 81, "lr": 9.585952884544082e-05} +{"train_loss": 0.010478531010448933, "global_step": 9749, "epoch": 81, "lr": 9.585864603326963e-05} +{"train_loss": 0.008877054788172245, "global_step": 9750, "epoch": 81, "lr": 9.58577631310599e-05} +{"train_loss": 0.011327991262078285, "global_step": 9751, "epoch": 81, "lr": 9.585688013881335e-05} +{"train_loss": 0.00790919829159975, "global_step": 9752, "epoch": 81, "lr": 9.585599705653172e-05} +{"train_loss": 0.01174834556877613, "global_step": 9753, "epoch": 81, "lr": 9.585511388421674e-05} +{"train_loss": 0.010306458920240402, "global_step": 9754, "epoch": 81, "lr": 9.585423062187013e-05} +{"train_loss": 0.008480883203446865, "global_step": 9755, "epoch": 81, "lr": 9.585334726949364e-05} +{"train_loss": 0.012643621303141117, "global_step": 9756, "epoch": 81, "lr": 9.585246382708902e-05} +{"train_loss": 0.010368727257146555, "global_step": 9757, "epoch": 81, "lr": 9.585158029465798e-05, "val_loss": 0.027001207694411278} +{"train_loss": 0.012953639961779118, "global_step": 9758, "epoch": 82, "lr": 9.585069667220224e-05} +{"train_loss": 0.008585833013057709, "global_step": 9759, "epoch": 82, "lr": 9.584981295972356e-05} +{"train_loss": 0.008808281272649765, "global_step": 9760, "epoch": 82, "lr": 9.584892915722368e-05} +{"train_loss": 0.011543403379619122, "global_step": 9761, "epoch": 82, "lr": 9.584804526470432e-05} +{"train_loss": 0.011239706538617611, "global_step": 9762, "epoch": 82, "lr": 9.584716128216723e-05} +{"train_loss": 0.010046365670859814, "global_step": 9763, "epoch": 82, "lr": 9.584627720961413e-05} +{"train_loss": 0.010155778378248215, "global_step": 9764, "epoch": 82, "lr": 9.584539304704676e-05} +{"train_loss": 0.00990414060652256, "global_step": 9765, "epoch": 82, "lr": 9.584450879446687e-05} +{"train_loss": 0.008424917235970497, "global_step": 9766, "epoch": 82, "lr": 9.584362445187618e-05} +{"train_loss": 0.006254090927541256, "global_step": 9767, "epoch": 82, "lr": 9.584274001927642e-05} +{"train_loss": 0.006224433425813913, "global_step": 9768, "epoch": 82, "lr": 9.584185549666935e-05} +{"train_loss": 0.005861050449311733, "global_step": 9769, "epoch": 82, "lr": 9.58409708840567e-05} +{"train_loss": 0.016201278194785118, "global_step": 9770, "epoch": 82, "lr": 9.584008618144018e-05} +{"train_loss": 0.014075199142098427, "global_step": 9771, "epoch": 82, "lr": 9.583920138882157e-05} +{"train_loss": 0.009133107028901577, "global_step": 9772, "epoch": 82, "lr": 9.583831650620257e-05} +{"train_loss": 0.01020103134214878, "global_step": 9773, "epoch": 82, "lr": 9.583743153358493e-05} +{"train_loss": 0.01316769141703844, "global_step": 9774, "epoch": 82, "lr": 9.58365464709704e-05} +{"train_loss": 0.009718500077724457, "global_step": 9775, "epoch": 82, "lr": 9.58356613183607e-05} +{"train_loss": 0.007052509114146233, "global_step": 9776, "epoch": 82, "lr": 9.583477607575759e-05} +{"train_loss": 0.010467903688549995, "global_step": 9777, "epoch": 82, "lr": 9.583389074316278e-05} +{"train_loss": 0.009247388690710068, "global_step": 9778, "epoch": 82, "lr": 9.583300532057805e-05} +{"train_loss": 0.009607132524251938, "global_step": 9779, "epoch": 82, "lr": 9.583211980800507e-05} +{"train_loss": 0.01281803473830223, "global_step": 9780, "epoch": 82, "lr": 9.583123420544564e-05} +{"train_loss": 0.011132956482470036, "global_step": 9781, "epoch": 82, "lr": 9.583034851290146e-05} +{"train_loss": 0.009104229509830475, "global_step": 9782, "epoch": 82, "lr": 9.582946273037432e-05} +{"train_loss": 0.009592603892087936, "global_step": 9783, "epoch": 82, "lr": 9.582857685786591e-05} +{"train_loss": 0.007932676933705807, "global_step": 9784, "epoch": 82, "lr": 9.582769089537798e-05} +{"train_loss": 0.015188758261501789, "global_step": 9785, "epoch": 82, "lr": 9.582680484291227e-05} +{"train_loss": 0.009981974959373474, "global_step": 9786, "epoch": 82, "lr": 9.582591870047054e-05} +{"train_loss": 0.011748667806386948, "global_step": 9787, "epoch": 82, "lr": 9.58250324680545e-05} +{"train_loss": 0.012484387494623661, "global_step": 9788, "epoch": 82, "lr": 9.582414614566592e-05} +{"train_loss": 0.009020998142659664, "global_step": 9789, "epoch": 82, "lr": 9.582325973330651e-05} +{"train_loss": 0.011521426029503345, "global_step": 9790, "epoch": 82, "lr": 9.582237323097803e-05} +{"train_loss": 0.011978095397353172, "global_step": 9791, "epoch": 82, "lr": 9.582148663868222e-05} +{"train_loss": 0.011506402865052223, "global_step": 9792, "epoch": 82, "lr": 9.582059995642081e-05} +{"train_loss": 0.00912030041217804, "global_step": 9793, "epoch": 82, "lr": 9.581971318419556e-05} +{"train_loss": 0.009480232372879982, "global_step": 9794, "epoch": 82, "lr": 9.581882632200818e-05} +{"train_loss": 0.011979728005826473, "global_step": 9795, "epoch": 82, "lr": 9.581793936986044e-05} +{"train_loss": 0.012802532874047756, "global_step": 9796, "epoch": 82, "lr": 9.581705232775408e-05} +{"train_loss": 0.0076693203300237656, "global_step": 9797, "epoch": 82, "lr": 9.58161651956908e-05} +{"train_loss": 0.013143536634743214, "global_step": 9798, "epoch": 82, "lr": 9.581527797367242e-05} +{"train_loss": 0.008169670589268208, "global_step": 9799, "epoch": 82, "lr": 9.581439066170061e-05} +{"train_loss": 0.006617235951125622, "global_step": 9800, "epoch": 82, "lr": 9.581350325977714e-05} +{"train_loss": 0.012103138491511345, "global_step": 9801, "epoch": 82, "lr": 9.581261576790375e-05} +{"train_loss": 0.010329185985028744, "global_step": 9802, "epoch": 82, "lr": 9.581172818608219e-05} +{"train_loss": 0.01284284982830286, "global_step": 9803, "epoch": 82, "lr": 9.581084051431419e-05} +{"train_loss": 0.009821908548474312, "global_step": 9804, "epoch": 82, "lr": 9.58099527526015e-05} +{"train_loss": 0.011884353123605251, "global_step": 9805, "epoch": 82, "lr": 9.580906490094585e-05} +{"train_loss": 0.010155437514185905, "global_step": 9806, "epoch": 82, "lr": 9.580817695934902e-05} +{"train_loss": 0.00848092045634985, "global_step": 9807, "epoch": 82, "lr": 9.58072889278127e-05} +{"train_loss": 0.009119311347603798, "global_step": 9808, "epoch": 82, "lr": 9.580640080633869e-05} +{"train_loss": 0.01337888278067112, "global_step": 9809, "epoch": 82, "lr": 9.58055125949287e-05} +{"train_loss": 0.007357897702604532, "global_step": 9810, "epoch": 82, "lr": 9.580462429358446e-05} +{"train_loss": 0.0074252597987651825, "global_step": 9811, "epoch": 82, "lr": 9.580373590230775e-05} +{"train_loss": 0.00971222948282957, "global_step": 9812, "epoch": 82, "lr": 9.58028474211003e-05} +{"train_loss": 0.012396513484418392, "global_step": 9813, "epoch": 82, "lr": 9.580195884996384e-05} +{"train_loss": 0.016008827835321426, "global_step": 9814, "epoch": 82, "lr": 9.580107018890013e-05} +{"train_loss": 0.015169625170528889, "global_step": 9815, "epoch": 82, "lr": 9.580018143791092e-05} +{"train_loss": 0.00865038763731718, "global_step": 9816, "epoch": 82, "lr": 9.579929259699794e-05} +{"train_loss": 0.008719577454030514, "global_step": 9817, "epoch": 82, "lr": 9.579840366616295e-05} +{"train_loss": 0.007561708800494671, "global_step": 9818, "epoch": 82, "lr": 9.579751464540767e-05} +{"train_loss": 0.01071662176400423, "global_step": 9819, "epoch": 82, "lr": 9.579662553473388e-05} +{"train_loss": 0.008505819365382195, "global_step": 9820, "epoch": 82, "lr": 9.57957363341433e-05} +{"train_loss": 0.008407548069953918, "global_step": 9821, "epoch": 82, "lr": 9.579484704363769e-05} +{"train_loss": 0.010128808207809925, "global_step": 9822, "epoch": 82, "lr": 9.57939576632188e-05} +{"train_loss": 0.01091520395129919, "global_step": 9823, "epoch": 82, "lr": 9.579306819288833e-05} +{"train_loss": 0.0097279017791152, "global_step": 9824, "epoch": 82, "lr": 9.57921786326481e-05} +{"train_loss": 0.009041251614689827, "global_step": 9825, "epoch": 82, "lr": 9.57912889824998e-05} +{"train_loss": 0.010417226701974869, "global_step": 9826, "epoch": 82, "lr": 9.57903992424452e-05} +{"train_loss": 0.011259532533586025, "global_step": 9827, "epoch": 82, "lr": 9.578950941248606e-05} +{"train_loss": 0.008475294336676598, "global_step": 9828, "epoch": 82, "lr": 9.57886194926241e-05} +{"train_loss": 0.0122762406244874, "global_step": 9829, "epoch": 82, "lr": 9.578772948286105e-05} +{"train_loss": 0.00840399693697691, "global_step": 9830, "epoch": 82, "lr": 9.578683938319872e-05} +{"train_loss": 0.012228244915604591, "global_step": 9831, "epoch": 82, "lr": 9.578594919363881e-05} +{"train_loss": 0.01000074204057455, "global_step": 9832, "epoch": 82, "lr": 9.578505891418308e-05} +{"train_loss": 0.009878023527562618, "global_step": 9833, "epoch": 82, "lr": 9.578416854483327e-05} +{"train_loss": 0.0066817705519497395, "global_step": 9834, "epoch": 82, "lr": 9.578327808559115e-05} +{"train_loss": 0.009739946573972702, "global_step": 9835, "epoch": 82, "lr": 9.578238753645845e-05} +{"train_loss": 0.01101667806506157, "global_step": 9836, "epoch": 82, "lr": 9.578149689743692e-05} +{"train_loss": 0.011796361766755581, "global_step": 9837, "epoch": 82, "lr": 9.578060616852833e-05} +{"train_loss": 0.008126961998641491, "global_step": 9838, "epoch": 82, "lr": 9.577971534973438e-05} +{"train_loss": 0.010514603927731514, "global_step": 9839, "epoch": 82, "lr": 9.577882444105686e-05} +{"train_loss": 0.008200336247682571, "global_step": 9840, "epoch": 82, "lr": 9.577793344249752e-05} +{"train_loss": 0.009313913062214851, "global_step": 9841, "epoch": 82, "lr": 9.57770423540581e-05} +{"train_loss": 0.011050606146454811, "global_step": 9842, "epoch": 82, "lr": 9.577615117574034e-05} +{"train_loss": 0.01159739214926958, "global_step": 9843, "epoch": 82, "lr": 9.5775259907546e-05} +{"train_loss": 0.00977228581905365, "global_step": 9844, "epoch": 82, "lr": 9.577436854947682e-05} +{"train_loss": 0.011484187096357346, "global_step": 9845, "epoch": 82, "lr": 9.577347710153457e-05} +{"train_loss": 0.013328982517123222, "global_step": 9846, "epoch": 82, "lr": 9.577258556372097e-05} +{"train_loss": 0.00960659608244896, "global_step": 9847, "epoch": 82, "lr": 9.577169393603781e-05} +{"train_loss": 0.006858621723949909, "global_step": 9848, "epoch": 82, "lr": 9.57708022184868e-05} +{"train_loss": 0.011706982739269733, "global_step": 9849, "epoch": 82, "lr": 9.576991041106973e-05} +{"train_loss": 0.010018125176429749, "global_step": 9850, "epoch": 82, "lr": 9.57690185137883e-05} +{"train_loss": 0.007500124163925648, "global_step": 9851, "epoch": 82, "lr": 9.576812652664433e-05} +{"train_loss": 0.010047033429145813, "global_step": 9852, "epoch": 82, "lr": 9.57672344496395e-05} +{"train_loss": 0.007790455594658852, "global_step": 9853, "epoch": 82, "lr": 9.576634228277561e-05} +{"train_loss": 0.0072304923087358475, "global_step": 9854, "epoch": 82, "lr": 9.576545002605439e-05} +{"train_loss": 0.006946431938558817, "global_step": 9855, "epoch": 82, "lr": 9.576455767947762e-05} +{"train_loss": 0.00745796225965023, "global_step": 9856, "epoch": 82, "lr": 9.576366524304701e-05} +{"train_loss": 0.0071245403960347176, "global_step": 9857, "epoch": 82, "lr": 9.576277271676432e-05} +{"train_loss": 0.007559033576399088, "global_step": 9858, "epoch": 82, "lr": 9.576188010063134e-05} +{"train_loss": 0.009966684505343437, "global_step": 9859, "epoch": 82, "lr": 9.57609873946498e-05} +{"train_loss": 0.010903320275247097, "global_step": 9860, "epoch": 82, "lr": 9.576009459882143e-05} +{"train_loss": 0.009726520627737045, "global_step": 9861, "epoch": 82, "lr": 9.5759201713148e-05} +{"train_loss": 0.01134481094777584, "global_step": 9862, "epoch": 82, "lr": 9.57583087376313e-05} +{"train_loss": 0.010999959893524647, "global_step": 9863, "epoch": 82, "lr": 9.575741567227301e-05} +{"train_loss": 0.006520248018205166, "global_step": 9864, "epoch": 82, "lr": 9.575652251707495e-05} +{"train_loss": 0.008687330409884453, "global_step": 9865, "epoch": 82, "lr": 9.575562927203882e-05} +{"train_loss": 0.008181980811059475, "global_step": 9866, "epoch": 82, "lr": 9.575473593716642e-05} +{"train_loss": 0.011212623678147793, "global_step": 9867, "epoch": 82, "lr": 9.575384251245949e-05} +{"train_loss": 0.015365881845355034, "global_step": 9868, "epoch": 82, "lr": 9.575294899791976e-05} +{"train_loss": 0.008948098868131638, "global_step": 9869, "epoch": 82, "lr": 9.575205539354901e-05} +{"train_loss": 0.008227791637182236, "global_step": 9870, "epoch": 82, "lr": 9.575116169934899e-05} +{"train_loss": 0.009069398045539856, "global_step": 9871, "epoch": 82, "lr": 9.575026791532145e-05} +{"train_loss": 0.009695415385067463, "global_step": 9872, "epoch": 82, "lr": 9.574937404146815e-05} +{"train_loss": 0.009237153455615044, "global_step": 9873, "epoch": 82, "lr": 9.574848007779084e-05} +{"train_loss": 0.012164292857050896, "global_step": 9874, "epoch": 82, "lr": 9.574758602429129e-05} +{"train_loss": 0.007546828594058752, "global_step": 9875, "epoch": 82, "lr": 9.57466918809712e-05} +{"train_loss": 0.010010409740214589, "global_step": 9876, "epoch": 82, "lr": 9.57457976478324e-05, "val_loss": 0.01927519217133522} +{"train_loss": 0.00736277038231492, "global_step": 9877, "epoch": 83, "lr": 9.574490332487661e-05} +{"train_loss": 0.010464934632182121, "global_step": 9878, "epoch": 83, "lr": 9.57440089121056e-05} +{"train_loss": 0.005520402919501066, "global_step": 9879, "epoch": 83, "lr": 9.574311440952109e-05} +{"train_loss": 0.008434801362454891, "global_step": 9880, "epoch": 83, "lr": 9.574221981712488e-05} +{"train_loss": 0.008869572542607784, "global_step": 9881, "epoch": 83, "lr": 9.574132513491871e-05} +{"train_loss": 0.009315267205238342, "global_step": 9882, "epoch": 83, "lr": 9.574043036290432e-05} +{"train_loss": 0.006289937533438206, "global_step": 9883, "epoch": 83, "lr": 9.57395355010835e-05} +{"train_loss": 0.008629422634840012, "global_step": 9884, "epoch": 83, "lr": 9.573864054945797e-05} +{"train_loss": 0.010438033379614353, "global_step": 9885, "epoch": 83, "lr": 9.573774550802952e-05} +{"train_loss": 0.006333019118756056, "global_step": 9886, "epoch": 83, "lr": 9.573685037679988e-05} +{"train_loss": 0.007159982807934284, "global_step": 9887, "epoch": 83, "lr": 9.573595515577083e-05} +{"train_loss": 0.0099006537348032, "global_step": 9888, "epoch": 83, "lr": 9.573505984494411e-05} +{"train_loss": 0.010406827554106712, "global_step": 9889, "epoch": 83, "lr": 9.573416444432151e-05} +{"train_loss": 0.01013559103012085, "global_step": 9890, "epoch": 83, "lr": 9.573326895390473e-05} +{"train_loss": 0.01231398619711399, "global_step": 9891, "epoch": 83, "lr": 9.573237337369558e-05} +{"train_loss": 0.006926063448190689, "global_step": 9892, "epoch": 83, "lr": 9.573147770369581e-05} +{"train_loss": 0.008064869791269302, "global_step": 9893, "epoch": 83, "lr": 9.573058194390715e-05} +{"train_loss": 0.007643142249435186, "global_step": 9894, "epoch": 83, "lr": 9.572968609433139e-05} +{"train_loss": 0.011361595243215561, "global_step": 9895, "epoch": 83, "lr": 9.572879015497026e-05} +{"train_loss": 0.010753295384347439, "global_step": 9896, "epoch": 83, "lr": 9.572789412582557e-05} +{"train_loss": 0.009458268992602825, "global_step": 9897, "epoch": 83, "lr": 9.572699800689902e-05} +{"train_loss": 0.006730107590556145, "global_step": 9898, "epoch": 83, "lr": 9.572610179819239e-05} +{"train_loss": 0.014711850322782993, "global_step": 9899, "epoch": 83, "lr": 9.572520549970746e-05} +{"train_loss": 0.006995557341724634, "global_step": 9900, "epoch": 83, "lr": 9.572430911144596e-05} +{"train_loss": 0.008702879771590233, "global_step": 9901, "epoch": 83, "lr": 9.572341263340966e-05} +{"train_loss": 0.007623388431966305, "global_step": 9902, "epoch": 83, "lr": 9.572251606560036e-05} +{"train_loss": 0.009698736481368542, "global_step": 9903, "epoch": 83, "lr": 9.572161940801976e-05} +{"train_loss": 0.007185005117207766, "global_step": 9904, "epoch": 83, "lr": 9.572072266066964e-05} +{"train_loss": 0.009004514664411545, "global_step": 9905, "epoch": 83, "lr": 9.571982582355176e-05} +{"train_loss": 0.012689025141298771, "global_step": 9906, "epoch": 83, "lr": 9.57189288966679e-05} +{"train_loss": 0.008981148712337017, "global_step": 9907, "epoch": 83, "lr": 9.57180318800198e-05} +{"train_loss": 0.009421955794095993, "global_step": 9908, "epoch": 83, "lr": 9.571713477360924e-05} +{"train_loss": 0.009566407650709152, "global_step": 9909, "epoch": 83, "lr": 9.571623757743796e-05} +{"train_loss": 0.007663148455321789, "global_step": 9910, "epoch": 83, "lr": 9.571534029150774e-05} +{"train_loss": 0.01065710000693798, "global_step": 9911, "epoch": 83, "lr": 9.571444291582032e-05} +{"train_loss": 0.006347829941660166, "global_step": 9912, "epoch": 83, "lr": 9.57135454503775e-05} +{"train_loss": 0.010179526172578335, "global_step": 9913, "epoch": 83, "lr": 9.5712647895181e-05} +{"train_loss": 0.008042072877287865, "global_step": 9914, "epoch": 83, "lr": 9.571175025023259e-05} +{"train_loss": 0.016722341999411583, "global_step": 9915, "epoch": 83, "lr": 9.571085251553404e-05} +{"train_loss": 0.005195422098040581, "global_step": 9916, "epoch": 83, "lr": 9.570995469108715e-05} +{"train_loss": 0.013048416003584862, "global_step": 9917, "epoch": 83, "lr": 9.570905677689361e-05} +{"train_loss": 0.008246873505413532, "global_step": 9918, "epoch": 83, "lr": 9.570815877295523e-05} +{"train_loss": 0.012230725958943367, "global_step": 9919, "epoch": 83, "lr": 9.570726067927378e-05} +{"train_loss": 0.011178376153111458, "global_step": 9920, "epoch": 83, "lr": 9.570636249585099e-05} +{"train_loss": 0.008951005525887012, "global_step": 9921, "epoch": 83, "lr": 9.570546422268864e-05} +{"train_loss": 0.009984229691326618, "global_step": 9922, "epoch": 83, "lr": 9.57045658597885e-05} +{"train_loss": 0.006997725926339626, "global_step": 9923, "epoch": 83, "lr": 9.570366740715233e-05} +{"train_loss": 0.007981489412486553, "global_step": 9924, "epoch": 83, "lr": 9.570276886478189e-05} +{"train_loss": 0.008516998030245304, "global_step": 9925, "epoch": 83, "lr": 9.570187023267894e-05} +{"train_loss": 0.00998009368777275, "global_step": 9926, "epoch": 83, "lr": 9.570097151084525e-05} +{"train_loss": 0.013059529475867748, "global_step": 9927, "epoch": 83, "lr": 9.57000726992826e-05} +{"train_loss": 0.008353151381015778, "global_step": 9928, "epoch": 83, "lr": 9.569917379799271e-05} +{"train_loss": 0.012400475330650806, "global_step": 9929, "epoch": 83, "lr": 9.56982748069774e-05} +{"train_loss": 0.012679250910878181, "global_step": 9930, "epoch": 83, "lr": 9.56973757262384e-05} +{"train_loss": 0.008106268011033535, "global_step": 9931, "epoch": 83, "lr": 9.569647655577749e-05} +{"train_loss": 0.009528303518891335, "global_step": 9932, "epoch": 83, "lr": 9.569557729559644e-05} +{"train_loss": 0.012438765726983547, "global_step": 9933, "epoch": 83, "lr": 9.569467794569699e-05} +{"train_loss": 0.009151767939329147, "global_step": 9934, "epoch": 83, "lr": 9.569377850608092e-05} +{"train_loss": 0.012851600535213947, "global_step": 9935, "epoch": 83, "lr": 9.569287897675e-05} +{"train_loss": 0.0065933107398450375, "global_step": 9936, "epoch": 83, "lr": 9.569197935770599e-05} +{"train_loss": 0.010640156455338001, "global_step": 9937, "epoch": 83, "lr": 9.569107964895067e-05} +{"train_loss": 0.011314361356198788, "global_step": 9938, "epoch": 83, "lr": 9.569017985048581e-05} +{"train_loss": 0.009870335459709167, "global_step": 9939, "epoch": 83, "lr": 9.568927996231314e-05} +{"train_loss": 0.011079346761107445, "global_step": 9940, "epoch": 83, "lr": 9.568837998443446e-05} +{"train_loss": 0.011124130338430405, "global_step": 9941, "epoch": 83, "lr": 9.568747991685152e-05} +{"train_loss": 0.009237358346581459, "global_step": 9942, "epoch": 83, "lr": 9.56865797595661e-05} +{"train_loss": 0.010446065105497837, "global_step": 9943, "epoch": 83, "lr": 9.568567951257996e-05} +{"train_loss": 0.011832169257104397, "global_step": 9944, "epoch": 83, "lr": 9.568477917589485e-05} +{"train_loss": 0.010742869228124619, "global_step": 9945, "epoch": 83, "lr": 9.56838787495126e-05} +{"train_loss": 0.010254505090415478, "global_step": 9946, "epoch": 83, "lr": 9.56829782334349e-05} +{"train_loss": 0.010627361945807934, "global_step": 9947, "epoch": 83, "lr": 9.568207762766354e-05} +{"train_loss": 0.009622368030250072, "global_step": 9948, "epoch": 83, "lr": 9.568117693220033e-05} +{"train_loss": 0.010371821001172066, "global_step": 9949, "epoch": 83, "lr": 9.568027614704701e-05} +{"train_loss": 0.00786904152482748, "global_step": 9950, "epoch": 83, "lr": 9.567937527220534e-05} +{"train_loss": 0.01356718223541975, "global_step": 9951, "epoch": 83, "lr": 9.567847430767709e-05} +{"train_loss": 0.01460862997919321, "global_step": 9952, "epoch": 83, "lr": 9.567757325346405e-05} +{"train_loss": 0.0099102221429348, "global_step": 9953, "epoch": 83, "lr": 9.567667210956796e-05} +{"train_loss": 0.013863088563084602, "global_step": 9954, "epoch": 83, "lr": 9.567577087599063e-05} +{"train_loss": 0.00932984333485365, "global_step": 9955, "epoch": 83, "lr": 9.567486955273377e-05} +{"train_loss": 0.013020183891057968, "global_step": 9956, "epoch": 83, "lr": 9.567396813979921e-05} +{"train_loss": 0.007429600227624178, "global_step": 9957, "epoch": 83, "lr": 9.567306663718866e-05} +{"train_loss": 0.012734318152070045, "global_step": 9958, "epoch": 83, "lr": 9.567216504490396e-05} +{"train_loss": 0.008009805344045162, "global_step": 9959, "epoch": 83, "lr": 9.567126336294683e-05} +{"train_loss": 0.008267729543149471, "global_step": 9960, "epoch": 83, "lr": 9.567036159131906e-05} +{"train_loss": 0.007442964240908623, "global_step": 9961, "epoch": 83, "lr": 9.56694597300224e-05} +{"train_loss": 0.010126888751983643, "global_step": 9962, "epoch": 83, "lr": 9.566855777905864e-05} +{"train_loss": 0.008432356640696526, "global_step": 9963, "epoch": 83, "lr": 9.566765573842956e-05} +{"train_loss": 0.008757869713008404, "global_step": 9964, "epoch": 83, "lr": 9.566675360813689e-05} +{"train_loss": 0.012109956704080105, "global_step": 9965, "epoch": 83, "lr": 9.566585138818245e-05} +{"train_loss": 0.013050112873315811, "global_step": 9966, "epoch": 83, "lr": 9.566494907856798e-05} +{"train_loss": 0.007831636816263199, "global_step": 9967, "epoch": 83, "lr": 9.566404667929525e-05} +{"train_loss": 0.006660829298198223, "global_step": 9968, "epoch": 83, "lr": 9.566314419036606e-05} +{"train_loss": 0.009176251478493214, "global_step": 9969, "epoch": 83, "lr": 9.566224161178217e-05} +{"train_loss": 0.009219581261277199, "global_step": 9970, "epoch": 83, "lr": 9.566133894354531e-05} +{"train_loss": 0.008259734138846397, "global_step": 9971, "epoch": 83, "lr": 9.566043618565734e-05} +{"train_loss": 0.008465863764286041, "global_step": 9972, "epoch": 83, "lr": 9.565953333811994e-05} +{"train_loss": 0.01029680110514164, "global_step": 9973, "epoch": 83, "lr": 9.565863040093494e-05} +{"train_loss": 0.010368123650550842, "global_step": 9974, "epoch": 83, "lr": 9.565772737410411e-05} +{"train_loss": 0.006161561701446772, "global_step": 9975, "epoch": 83, "lr": 9.56568242576292e-05} +{"train_loss": 0.005521436221897602, "global_step": 9976, "epoch": 83, "lr": 9.565592105151199e-05} +{"train_loss": 0.00858309492468834, "global_step": 9977, "epoch": 83, "lr": 9.565501775575426e-05} +{"train_loss": 0.008873553946614265, "global_step": 9978, "epoch": 83, "lr": 9.565411437035778e-05} +{"train_loss": 0.010982573963701725, "global_step": 9979, "epoch": 83, "lr": 9.565321089532432e-05} +{"train_loss": 0.012908216565847397, "global_step": 9980, "epoch": 83, "lr": 9.565230733065566e-05} +{"train_loss": 0.008991003036499023, "global_step": 9981, "epoch": 83, "lr": 9.565140367635357e-05} +{"train_loss": 0.013597178272902966, "global_step": 9982, "epoch": 83, "lr": 9.565049993241984e-05} +{"train_loss": 0.008061590604484081, "global_step": 9983, "epoch": 83, "lr": 9.564959609885622e-05} +{"train_loss": 0.010668712668120861, "global_step": 9984, "epoch": 83, "lr": 9.564869217566447e-05} +{"train_loss": 0.005814378149807453, "global_step": 9985, "epoch": 83, "lr": 9.564778816284643e-05} +{"train_loss": 0.011584104038774967, "global_step": 9986, "epoch": 83, "lr": 9.564688406040382e-05} +{"train_loss": 0.008585073053836823, "global_step": 9987, "epoch": 83, "lr": 9.564597986833843e-05} +{"train_loss": 0.010864096693694592, "global_step": 9988, "epoch": 83, "lr": 9.564507558665203e-05} +{"train_loss": 0.00950300320982933, "global_step": 9989, "epoch": 83, "lr": 9.56441712153464e-05} +{"train_loss": 0.008457218296825886, "global_step": 9990, "epoch": 83, "lr": 9.564326675442332e-05} +{"train_loss": 0.01513483002781868, "global_step": 9991, "epoch": 83, "lr": 9.564236220388456e-05} +{"train_loss": 0.009659554809331894, "global_step": 9992, "epoch": 83, "lr": 9.56414575637319e-05} +{"train_loss": 0.0072407471016049385, "global_step": 9993, "epoch": 83, "lr": 9.564055283396712e-05} +{"train_loss": 0.013934985734522343, "global_step": 9994, "epoch": 83, "lr": 9.563964801459199e-05} +{"train_loss": 0.009681719691813494, "global_step": 9995, "epoch": 83, "lr": 9.563874310560828e-05, "val_loss": 0.01821405254304409} +{"train_loss": 0.012432589195668697, "global_step": 9996, "epoch": 84, "lr": 9.563783810701778e-05} +{"train_loss": 0.009359284304082394, "global_step": 9997, "epoch": 84, "lr": 9.563693301882224e-05} +{"train_loss": 0.006398952100425959, "global_step": 9998, "epoch": 84, "lr": 9.563602784102348e-05} +{"train_loss": 0.013140257447957993, "global_step": 9999, "epoch": 84, "lr": 9.563512257362325e-05} +{"train_loss": 0.010002236813306808, "global_step": 10000, "epoch": 84, "lr": 9.563421721662334e-05} +{"train_loss": 0.008788732811808586, "global_step": 10001, "epoch": 84, "lr": 9.56333117700255e-05} +{"train_loss": 0.007530511822551489, "global_step": 10002, "epoch": 84, "lr": 9.563240623383154e-05} +{"train_loss": 0.010373112745583057, "global_step": 10003, "epoch": 84, "lr": 9.563150060804323e-05} +{"train_loss": 0.009290918707847595, "global_step": 10004, "epoch": 84, "lr": 9.563059489266233e-05} +{"train_loss": 0.0125581631436944, "global_step": 10005, "epoch": 84, "lr": 9.562968908769064e-05} +{"train_loss": 0.007006531115621328, "global_step": 10006, "epoch": 84, "lr": 9.562878319312994e-05} +{"train_loss": 0.01069026067852974, "global_step": 10007, "epoch": 84, "lr": 9.562787720898198e-05} +{"train_loss": 0.008142462931573391, "global_step": 10008, "epoch": 84, "lr": 9.562697113524856e-05} +{"train_loss": 0.008026785217225552, "global_step": 10009, "epoch": 84, "lr": 9.562606497193146e-05} +{"train_loss": 0.008391356095671654, "global_step": 10010, "epoch": 84, "lr": 9.562515871903246e-05} +{"train_loss": 0.010781494900584221, "global_step": 10011, "epoch": 84, "lr": 9.562425237655332e-05} +{"train_loss": 0.010724036954343319, "global_step": 10012, "epoch": 84, "lr": 9.562334594449587e-05} +{"train_loss": 0.01273958757519722, "global_step": 10013, "epoch": 84, "lr": 9.562243942286183e-05} +{"train_loss": 0.010645662434399128, "global_step": 10014, "epoch": 84, "lr": 9.5621532811653e-05} +{"train_loss": 0.00913555733859539, "global_step": 10015, "epoch": 84, "lr": 9.562062611087117e-05} +{"train_loss": 0.007753560785204172, "global_step": 10016, "epoch": 84, "lr": 9.561971932051811e-05} +{"train_loss": 0.008293014951050282, "global_step": 10017, "epoch": 84, "lr": 9.561881244059561e-05} +{"train_loss": 0.011122282594442368, "global_step": 10018, "epoch": 84, "lr": 9.561790547110545e-05} +{"train_loss": 0.011345949955284595, "global_step": 10019, "epoch": 84, "lr": 9.56169984120494e-05} +{"train_loss": 0.00625654635950923, "global_step": 10020, "epoch": 84, "lr": 9.561609126342926e-05} +{"train_loss": 0.007673053070902824, "global_step": 10021, "epoch": 84, "lr": 9.561518402524678e-05} +{"train_loss": 0.0098153380677104, "global_step": 10022, "epoch": 84, "lr": 9.561427669750377e-05} +{"train_loss": 0.00807643961161375, "global_step": 10023, "epoch": 84, "lr": 9.561336928020199e-05} +{"train_loss": 0.010528577491641045, "global_step": 10024, "epoch": 84, "lr": 9.561246177334324e-05} +{"train_loss": 0.0124672157689929, "global_step": 10025, "epoch": 84, "lr": 9.56115541769293e-05} +{"train_loss": 0.007161058951169252, "global_step": 10026, "epoch": 84, "lr": 9.561064649096195e-05} +{"train_loss": 0.008108234964311123, "global_step": 10027, "epoch": 84, "lr": 9.560973871544294e-05} +{"train_loss": 0.009674089960753918, "global_step": 10028, "epoch": 84, "lr": 9.56088308503741e-05} +{"train_loss": 0.011825785972177982, "global_step": 10029, "epoch": 84, "lr": 9.560792289575719e-05} +{"train_loss": 0.008247872814536095, "global_step": 10030, "epoch": 84, "lr": 9.5607014851594e-05} +{"train_loss": 0.004346308298408985, "global_step": 10031, "epoch": 84, "lr": 9.560610671788632e-05} +{"train_loss": 0.00784199871122837, "global_step": 10032, "epoch": 84, "lr": 9.56051984946359e-05} +{"train_loss": 0.007396571338176727, "global_step": 10033, "epoch": 84, "lr": 9.560429018184455e-05} +{"train_loss": 0.00863372441381216, "global_step": 10034, "epoch": 84, "lr": 9.560338177951406e-05} +{"train_loss": 0.009262431412935257, "global_step": 10035, "epoch": 84, "lr": 9.56024732876462e-05} +{"train_loss": 0.011152980849146843, "global_step": 10036, "epoch": 84, "lr": 9.560156470624275e-05} +{"train_loss": 0.008783649653196335, "global_step": 10037, "epoch": 84, "lr": 9.56006560353055e-05} +{"train_loss": 0.010198700241744518, "global_step": 10038, "epoch": 84, "lr": 9.559974727483623e-05} +{"train_loss": 0.01154004130512476, "global_step": 10039, "epoch": 84, "lr": 9.559883842483672e-05} +{"train_loss": 0.007566316984593868, "global_step": 10040, "epoch": 84, "lr": 9.559792948530877e-05} +{"train_loss": 0.009388966485857964, "global_step": 10041, "epoch": 84, "lr": 9.559702045625418e-05} +{"train_loss": 0.00829255860298872, "global_step": 10042, "epoch": 84, "lr": 9.559611133767467e-05} +{"train_loss": 0.012241555377840996, "global_step": 10043, "epoch": 84, "lr": 9.559520212957211e-05} +{"train_loss": 0.006112899165600538, "global_step": 10044, "epoch": 84, "lr": 9.55942928319482e-05} +{"train_loss": 0.011515998281538486, "global_step": 10045, "epoch": 84, "lr": 9.55933834448048e-05} +{"train_loss": 0.00887362565845251, "global_step": 10046, "epoch": 84, "lr": 9.559247396814365e-05} +{"train_loss": 0.009255025535821915, "global_step": 10047, "epoch": 84, "lr": 9.559156440196656e-05} +{"train_loss": 0.011752007529139519, "global_step": 10048, "epoch": 84, "lr": 9.559065474627527e-05} +{"train_loss": 0.009807044640183449, "global_step": 10049, "epoch": 84, "lr": 9.558974500107163e-05} +{"train_loss": 0.012409956194460392, "global_step": 10050, "epoch": 84, "lr": 9.55888351663574e-05} +{"train_loss": 0.013671888038516045, "global_step": 10051, "epoch": 84, "lr": 9.558792524213434e-05} +{"train_loss": 0.010734076611697674, "global_step": 10052, "epoch": 84, "lr": 9.558701522840428e-05} +{"train_loss": 0.010990173555910587, "global_step": 10053, "epoch": 84, "lr": 9.558610512516896e-05} +{"train_loss": 0.010248375125229359, "global_step": 10054, "epoch": 84, "lr": 9.558519493243021e-05} +{"train_loss": 0.008027861826121807, "global_step": 10055, "epoch": 84, "lr": 9.55842846501898e-05} +{"train_loss": 0.007471964228898287, "global_step": 10056, "epoch": 84, "lr": 9.558337427844952e-05} +{"train_loss": 0.008706938475370407, "global_step": 10057, "epoch": 84, "lr": 9.558246381721114e-05} +{"train_loss": 0.009415275417268276, "global_step": 10058, "epoch": 84, "lr": 9.558155326647647e-05} +{"train_loss": 0.007862260565161705, "global_step": 10059, "epoch": 84, "lr": 9.55806426262473e-05} +{"train_loss": 0.012078271247446537, "global_step": 10060, "epoch": 84, "lr": 9.55797318965254e-05} +{"train_loss": 0.011292589828372002, "global_step": 10061, "epoch": 84, "lr": 9.557882107731256e-05} +{"train_loss": 0.010191338136792183, "global_step": 10062, "epoch": 84, "lr": 9.557791016861059e-05} +{"train_loss": 0.008564569987356663, "global_step": 10063, "epoch": 84, "lr": 9.557699917042124e-05} +{"train_loss": 0.00983467511832714, "global_step": 10064, "epoch": 84, "lr": 9.557608808274635e-05} +{"train_loss": 0.008147342130541801, "global_step": 10065, "epoch": 84, "lr": 9.557517690558766e-05} +{"train_loss": 0.007798411883413792, "global_step": 10066, "epoch": 84, "lr": 9.557426563894699e-05} +{"train_loss": 0.012095624580979347, "global_step": 10067, "epoch": 84, "lr": 9.55733542828261e-05} +{"train_loss": 0.01255040429532528, "global_step": 10068, "epoch": 84, "lr": 9.557244283722681e-05} +{"train_loss": 0.0069464086554944515, "global_step": 10069, "epoch": 84, "lr": 9.557153130215089e-05} +{"train_loss": 0.010430751368403435, "global_step": 10070, "epoch": 84, "lr": 9.557061967760015e-05} +{"train_loss": 0.011013085022568703, "global_step": 10071, "epoch": 84, "lr": 9.556970796357636e-05} +{"train_loss": 0.0064015923999249935, "global_step": 10072, "epoch": 84, "lr": 9.556879616008131e-05} +{"train_loss": 0.01140724215656519, "global_step": 10073, "epoch": 84, "lr": 9.55678842671168e-05} +{"train_loss": 0.010611627250909805, "global_step": 10074, "epoch": 84, "lr": 9.556697228468463e-05} +{"train_loss": 0.011338145472109318, "global_step": 10075, "epoch": 84, "lr": 9.556606021278655e-05} +{"train_loss": 0.009946219623088837, "global_step": 10076, "epoch": 84, "lr": 9.556514805142442e-05} +{"train_loss": 0.009394986554980278, "global_step": 10077, "epoch": 84, "lr": 9.556423580059996e-05} +{"train_loss": 0.007923346012830734, "global_step": 10078, "epoch": 84, "lr": 9.5563323460315e-05} +{"train_loss": 0.01225415151566267, "global_step": 10079, "epoch": 84, "lr": 9.556241103057132e-05} +{"train_loss": 0.013626890257000923, "global_step": 10080, "epoch": 84, "lr": 9.556149851137071e-05} +{"train_loss": 0.012131957337260246, "global_step": 10081, "epoch": 84, "lr": 9.556058590271498e-05} +{"train_loss": 0.007726443000137806, "global_step": 10082, "epoch": 84, "lr": 9.555967320460588e-05} +{"train_loss": 0.0074261389672756195, "global_step": 10083, "epoch": 84, "lr": 9.555876041704526e-05} +{"train_loss": 0.009633654728531837, "global_step": 10084, "epoch": 84, "lr": 9.555784754003486e-05} +{"train_loss": 0.005217294674366713, "global_step": 10085, "epoch": 84, "lr": 9.55569345735765e-05} +{"train_loss": 0.007397618144750595, "global_step": 10086, "epoch": 84, "lr": 9.555602151767195e-05} +{"train_loss": 0.012412747368216515, "global_step": 10087, "epoch": 84, "lr": 9.555510837232304e-05} +{"train_loss": 0.009339837357401848, "global_step": 10088, "epoch": 84, "lr": 9.555419513753154e-05} +{"train_loss": 0.005974320694804192, "global_step": 10089, "epoch": 84, "lr": 9.555328181329924e-05} +{"train_loss": 0.009285913780331612, "global_step": 10090, "epoch": 84, "lr": 9.555236839962795e-05} +{"train_loss": 0.01130661740899086, "global_step": 10091, "epoch": 84, "lr": 9.555145489651943e-05} +{"train_loss": 0.007880213670432568, "global_step": 10092, "epoch": 84, "lr": 9.555054130397551e-05} +{"train_loss": 0.009912674315273762, "global_step": 10093, "epoch": 84, "lr": 9.554962762199795e-05} +{"train_loss": 0.010418330319225788, "global_step": 10094, "epoch": 84, "lr": 9.554871385058859e-05} +{"train_loss": 0.006738883443176746, "global_step": 10095, "epoch": 84, "lr": 9.554779998974918e-05} +{"train_loss": 0.013308431021869183, "global_step": 10096, "epoch": 84, "lr": 9.554688603948153e-05} +{"train_loss": 0.012621202506124973, "global_step": 10097, "epoch": 84, "lr": 9.554597199978744e-05} +{"train_loss": 0.012130169197916985, "global_step": 10098, "epoch": 84, "lr": 9.55450578706687e-05} +{"train_loss": 0.00541825732216239, "global_step": 10099, "epoch": 84, "lr": 9.554414365212709e-05} +{"train_loss": 0.008987468667328358, "global_step": 10100, "epoch": 84, "lr": 9.554322934416444e-05} +{"train_loss": 0.01100018061697483, "global_step": 10101, "epoch": 84, "lr": 9.554231494678252e-05} +{"train_loss": 0.005910994950681925, "global_step": 10102, "epoch": 84, "lr": 9.554140045998313e-05} +{"train_loss": 0.008997081778943539, "global_step": 10103, "epoch": 84, "lr": 9.554048588376806e-05} +{"train_loss": 0.008363466709852219, "global_step": 10104, "epoch": 84, "lr": 9.553957121813911e-05} +{"train_loss": 0.0110431844368577, "global_step": 10105, "epoch": 84, "lr": 9.553865646309808e-05} +{"train_loss": 0.00884025264531374, "global_step": 10106, "epoch": 84, "lr": 9.553774161864677e-05} +{"train_loss": 0.0082806795835495, "global_step": 10107, "epoch": 84, "lr": 9.553682668478697e-05} +{"train_loss": 0.007942034862935543, "global_step": 10108, "epoch": 84, "lr": 9.553591166152044e-05} +{"train_loss": 0.008027927950024605, "global_step": 10109, "epoch": 84, "lr": 9.553499654884905e-05} +{"train_loss": 0.008634014055132866, "global_step": 10110, "epoch": 84, "lr": 9.553408134677456e-05} +{"train_loss": 0.010071626864373684, "global_step": 10111, "epoch": 84, "lr": 9.553316605529877e-05} +{"train_loss": 0.008321551606059074, "global_step": 10112, "epoch": 84, "lr": 9.553225067442345e-05} +{"train_loss": 0.00940086878836155, "global_step": 10113, "epoch": 84, "lr": 9.553133520415042e-05} +{"train_loss": 0.009498321869950584, "global_step": 10114, "epoch": 84, "lr": 9.553041964448148e-05, "val_loss": 0.0167283583432436} +{"train_loss": 0.008001593872904778, "global_step": 10115, "epoch": 85, "lr": 9.552950399541845e-05} +{"train_loss": 0.01013899128884077, "global_step": 10116, "epoch": 85, "lr": 9.552858825696308e-05} +{"train_loss": 0.00863704551011324, "global_step": 10117, "epoch": 85, "lr": 9.55276724291172e-05} +{"train_loss": 0.008305144496262074, "global_step": 10118, "epoch": 85, "lr": 9.552675651188259e-05} +{"train_loss": 0.005767571274191141, "global_step": 10119, "epoch": 85, "lr": 9.552584050526106e-05} +{"train_loss": 0.009503260254859924, "global_step": 10120, "epoch": 85, "lr": 9.55249244092544e-05} +{"train_loss": 0.010949448682367802, "global_step": 10121, "epoch": 85, "lr": 9.552400822386442e-05} +{"train_loss": 0.008464391343295574, "global_step": 10122, "epoch": 85, "lr": 9.552309194909293e-05} +{"train_loss": 0.006508936174213886, "global_step": 10123, "epoch": 85, "lr": 9.55221755849417e-05} +{"train_loss": 0.010861525312066078, "global_step": 10124, "epoch": 85, "lr": 9.552125913141254e-05} +{"train_loss": 0.012281445786356926, "global_step": 10125, "epoch": 85, "lr": 9.552034258850725e-05} +{"train_loss": 0.012052563950419426, "global_step": 10126, "epoch": 85, "lr": 9.551942595622762e-05} +{"train_loss": 0.00853019393980503, "global_step": 10127, "epoch": 85, "lr": 9.551850923457548e-05} +{"train_loss": 0.008238079957664013, "global_step": 10128, "epoch": 85, "lr": 9.55175924235526e-05} +{"train_loss": 0.013810987584292889, "global_step": 10129, "epoch": 85, "lr": 9.551667552316079e-05} +{"train_loss": 0.01132580079138279, "global_step": 10130, "epoch": 85, "lr": 9.551575853340187e-05} +{"train_loss": 0.005933065433055162, "global_step": 10131, "epoch": 85, "lr": 9.551484145427759e-05} +{"train_loss": 0.015834370627999306, "global_step": 10132, "epoch": 85, "lr": 9.55139242857898e-05} +{"train_loss": 0.014608437195420265, "global_step": 10133, "epoch": 85, "lr": 9.551300702794027e-05} +{"train_loss": 0.006653165910393, "global_step": 10134, "epoch": 85, "lr": 9.551208968073082e-05} +{"train_loss": 0.011131024919450283, "global_step": 10135, "epoch": 85, "lr": 9.551117224416326e-05} +{"train_loss": 0.009668986313045025, "global_step": 10136, "epoch": 85, "lr": 9.551025471823934e-05} +{"train_loss": 0.008582960814237595, "global_step": 10137, "epoch": 85, "lr": 9.550933710296093e-05} +{"train_loss": 0.0068960171192884445, "global_step": 10138, "epoch": 85, "lr": 9.550841939832978e-05} +{"train_loss": 0.013041931204497814, "global_step": 10139, "epoch": 85, "lr": 9.550750160434772e-05} +{"train_loss": 0.009898409247398376, "global_step": 10140, "epoch": 85, "lr": 9.550658372101653e-05} +{"train_loss": 0.01270188856869936, "global_step": 10141, "epoch": 85, "lr": 9.550566574833804e-05} +{"train_loss": 0.010964603163301945, "global_step": 10142, "epoch": 85, "lr": 9.550474768631402e-05} +{"train_loss": 0.007530533708631992, "global_step": 10143, "epoch": 85, "lr": 9.55038295349463e-05} +{"train_loss": 0.011710218153893948, "global_step": 10144, "epoch": 85, "lr": 9.550291129423668e-05} +{"train_loss": 0.015184549614787102, "global_step": 10145, "epoch": 85, "lr": 9.550199296418694e-05} +{"train_loss": 0.007357409223914146, "global_step": 10146, "epoch": 85, "lr": 9.55010745447989e-05} +{"train_loss": 0.00696775084361434, "global_step": 10147, "epoch": 85, "lr": 9.550015603607436e-05} +{"train_loss": 0.014231165871024132, "global_step": 10148, "epoch": 85, "lr": 9.549923743801513e-05} +{"train_loss": 0.01031134556978941, "global_step": 10149, "epoch": 85, "lr": 9.549831875062301e-05} +{"train_loss": 0.013621104881167412, "global_step": 10150, "epoch": 85, "lr": 9.54973999738998e-05} +{"train_loss": 0.009035888127982616, "global_step": 10151, "epoch": 85, "lr": 9.549648110784731e-05} +{"train_loss": 0.00964404921978712, "global_step": 10152, "epoch": 85, "lr": 9.549556215246734e-05} +{"train_loss": 0.006605194415897131, "global_step": 10153, "epoch": 85, "lr": 9.549464310776168e-05} +{"train_loss": 0.011516915634274483, "global_step": 10154, "epoch": 85, "lr": 9.549372397373215e-05} +{"train_loss": 0.012344422750175, "global_step": 10155, "epoch": 85, "lr": 9.549280475038056e-05} +{"train_loss": 0.01096239872276783, "global_step": 10156, "epoch": 85, "lr": 9.549188543770872e-05} +{"train_loss": 0.013729956932365894, "global_step": 10157, "epoch": 85, "lr": 9.549096603571842e-05} +{"train_loss": 0.013209294527769089, "global_step": 10158, "epoch": 85, "lr": 9.549004654441145e-05} +{"train_loss": 0.008927087299525738, "global_step": 10159, "epoch": 85, "lr": 9.548912696378964e-05} +{"train_loss": 0.011867223307490349, "global_step": 10160, "epoch": 85, "lr": 9.548820729385479e-05} +{"train_loss": 0.009765852242708206, "global_step": 10161, "epoch": 85, "lr": 9.548728753460871e-05} +{"train_loss": 0.01145209465175867, "global_step": 10162, "epoch": 85, "lr": 9.548636768605321e-05} +{"train_loss": 0.00959270354360342, "global_step": 10163, "epoch": 85, "lr": 9.548544774819006e-05} +{"train_loss": 0.01556213479489088, "global_step": 10164, "epoch": 85, "lr": 9.548452772102111e-05} +{"train_loss": 0.01041001733392477, "global_step": 10165, "epoch": 85, "lr": 9.548360760454816e-05} +{"train_loss": 0.010582076385617256, "global_step": 10166, "epoch": 85, "lr": 9.548268739877297e-05} +{"train_loss": 0.00783414114266634, "global_step": 10167, "epoch": 85, "lr": 9.548176710369742e-05} +{"train_loss": 0.011915943585336208, "global_step": 10168, "epoch": 85, "lr": 9.548084671932326e-05} +{"train_loss": 0.010918017476797104, "global_step": 10169, "epoch": 85, "lr": 9.547992624565232e-05} +{"train_loss": 0.00872519426047802, "global_step": 10170, "epoch": 85, "lr": 9.547900568268639e-05} +{"train_loss": 0.009582312777638435, "global_step": 10171, "epoch": 85, "lr": 9.547808503042732e-05} +{"train_loss": 0.009983265772461891, "global_step": 10172, "epoch": 85, "lr": 9.547716428887688e-05} +{"train_loss": 0.008511300198733807, "global_step": 10173, "epoch": 85, "lr": 9.547624345803687e-05} +{"train_loss": 0.010751147754490376, "global_step": 10174, "epoch": 85, "lr": 9.547532253790912e-05} +{"train_loss": 0.008763805031776428, "global_step": 10175, "epoch": 85, "lr": 9.547440152849544e-05} +{"train_loss": 0.008425227366387844, "global_step": 10176, "epoch": 85, "lr": 9.547348042979763e-05} +{"train_loss": 0.009488269686698914, "global_step": 10177, "epoch": 85, "lr": 9.54725592418175e-05} +{"train_loss": 0.006790472194552422, "global_step": 10178, "epoch": 85, "lr": 9.547163796455685e-05} +{"train_loss": 0.006509753875434399, "global_step": 10179, "epoch": 85, "lr": 9.54707165980175e-05} +{"train_loss": 0.009305777959525585, "global_step": 10180, "epoch": 85, "lr": 9.546979514220127e-05} +{"train_loss": 0.008803650736808777, "global_step": 10181, "epoch": 85, "lr": 9.546887359710994e-05} +{"train_loss": 0.008676644414663315, "global_step": 10182, "epoch": 85, "lr": 9.546795196274534e-05} +{"train_loss": 0.0080666309222579, "global_step": 10183, "epoch": 85, "lr": 9.546703023910926e-05} +{"train_loss": 0.008885917253792286, "global_step": 10184, "epoch": 85, "lr": 9.546610842620353e-05} +{"train_loss": 0.009963657706975937, "global_step": 10185, "epoch": 85, "lr": 9.546518652402995e-05} +{"train_loss": 0.007819592021405697, "global_step": 10186, "epoch": 85, "lr": 9.546426453259035e-05} +{"train_loss": 0.009472502395510674, "global_step": 10187, "epoch": 85, "lr": 9.546334245188653e-05} +{"train_loss": 0.009424516931176186, "global_step": 10188, "epoch": 85, "lr": 9.546242028192027e-05} +{"train_loss": 0.012483741156756878, "global_step": 10189, "epoch": 85, "lr": 9.546149802269342e-05} +{"train_loss": 0.00574239669367671, "global_step": 10190, "epoch": 85, "lr": 9.546057567420776e-05} +{"train_loss": 0.00858919695019722, "global_step": 10191, "epoch": 85, "lr": 9.545965323646513e-05} +{"train_loss": 0.0065457383170723915, "global_step": 10192, "epoch": 85, "lr": 9.545873070946732e-05} +{"train_loss": 0.010122865438461304, "global_step": 10193, "epoch": 85, "lr": 9.545780809321617e-05} +{"train_loss": 0.008247175253927708, "global_step": 10194, "epoch": 85, "lr": 9.545688538771344e-05} +{"train_loss": 0.007041463162750006, "global_step": 10195, "epoch": 85, "lr": 9.545596259296097e-05} +{"train_loss": 0.006143658421933651, "global_step": 10196, "epoch": 85, "lr": 9.54550397089606e-05} +{"train_loss": 0.009680514223873615, "global_step": 10197, "epoch": 85, "lr": 9.54541167357141e-05} +{"train_loss": 0.007938086055219173, "global_step": 10198, "epoch": 85, "lr": 9.54531936732233e-05} +{"train_loss": 0.010459410957992077, "global_step": 10199, "epoch": 85, "lr": 9.545227052149002e-05} +{"train_loss": 0.007004282437264919, "global_step": 10200, "epoch": 85, "lr": 9.545134728051606e-05} +{"train_loss": 0.00900277029722929, "global_step": 10201, "epoch": 85, "lr": 9.545042395030321e-05} +{"train_loss": 0.01063521858304739, "global_step": 10202, "epoch": 85, "lr": 9.544950053085334e-05} +{"train_loss": 0.007588815875351429, "global_step": 10203, "epoch": 85, "lr": 9.544857702216822e-05} +{"train_loss": 0.008669689297676086, "global_step": 10204, "epoch": 85, "lr": 9.544765342424967e-05} +{"train_loss": 0.011973957531154156, "global_step": 10205, "epoch": 85, "lr": 9.544672973709952e-05} +{"train_loss": 0.008946378715336323, "global_step": 10206, "epoch": 85, "lr": 9.544580596071954e-05} +{"train_loss": 0.008940204977989197, "global_step": 10207, "epoch": 85, "lr": 9.544488209511161e-05} +{"train_loss": 0.007953925989568233, "global_step": 10208, "epoch": 85, "lr": 9.54439581402775e-05} +{"train_loss": 0.006588198710232973, "global_step": 10209, "epoch": 85, "lr": 9.544303409621903e-05} +{"train_loss": 0.01039206888526678, "global_step": 10210, "epoch": 85, "lr": 9.5442109962938e-05} +{"train_loss": 0.009607197716832161, "global_step": 10211, "epoch": 85, "lr": 9.544118574043628e-05} +{"train_loss": 0.0068858168087899685, "global_step": 10212, "epoch": 85, "lr": 9.544026142871562e-05} +{"train_loss": 0.007935316301882267, "global_step": 10213, "epoch": 85, "lr": 9.543933702777787e-05} +{"train_loss": 0.006157314870506525, "global_step": 10214, "epoch": 85, "lr": 9.543841253762483e-05} +{"train_loss": 0.010718939825892448, "global_step": 10215, "epoch": 85, "lr": 9.543748795825833e-05} +{"train_loss": 0.008247148245573044, "global_step": 10216, "epoch": 85, "lr": 9.543656328968017e-05} +{"train_loss": 0.01021659653633833, "global_step": 10217, "epoch": 85, "lr": 9.543563853189217e-05} +{"train_loss": 0.008689992129802704, "global_step": 10218, "epoch": 85, "lr": 9.543471368489616e-05} +{"train_loss": 0.008973045274615288, "global_step": 10219, "epoch": 85, "lr": 9.543378874869393e-05} +{"train_loss": 0.0054850284941494465, "global_step": 10220, "epoch": 85, "lr": 9.543286372328731e-05} +{"train_loss": 0.009549779817461967, "global_step": 10221, "epoch": 85, "lr": 9.543193860867813e-05} +{"train_loss": 0.007917066104710102, "global_step": 10222, "epoch": 85, "lr": 9.543101340486817e-05} +{"train_loss": 0.010959864594042301, "global_step": 10223, "epoch": 85, "lr": 9.543008811185929e-05} +{"train_loss": 0.008368875831365585, "global_step": 10224, "epoch": 85, "lr": 9.542916272965328e-05} +{"train_loss": 0.011733491905033588, "global_step": 10225, "epoch": 85, "lr": 9.542823725825197e-05} +{"train_loss": 0.009694449603557587, "global_step": 10226, "epoch": 85, "lr": 9.542731169765715e-05} +{"train_loss": 0.005563500802963972, "global_step": 10227, "epoch": 85, "lr": 9.542638604787066e-05} +{"train_loss": 0.013993565924465656, "global_step": 10228, "epoch": 85, "lr": 9.542546030889432e-05} +{"train_loss": 0.00888458639383316, "global_step": 10229, "epoch": 85, "lr": 9.542453448072994e-05} +{"train_loss": 0.011334921233355999, "global_step": 10230, "epoch": 85, "lr": 9.542360856337935e-05} +{"train_loss": 0.007783703505992889, "global_step": 10231, "epoch": 85, "lr": 9.542268255684435e-05} +{"train_loss": 0.01211925782263279, "global_step": 10232, "epoch": 85, "lr": 9.542175646112676e-05} +{"train_loss": 0.009597049204303938, "global_step": 10233, "epoch": 85, "lr": 9.542083027622842e-05, "val_loss": 0.015045549720525742, "train_action_mse_error": 0.00027611030964180827} +{"train_loss": 0.008104845881462097, "global_step": 10234, "epoch": 86, "lr": 9.54199040021511e-05} +{"train_loss": 0.00959688425064087, "global_step": 10235, "epoch": 86, "lr": 9.541897763889668e-05} +{"train_loss": 0.009784679859876633, "global_step": 10236, "epoch": 86, "lr": 9.541805118646694e-05} +{"train_loss": 0.01153807993978262, "global_step": 10237, "epoch": 86, "lr": 9.54171246448637e-05} +{"train_loss": 0.009144860319793224, "global_step": 10238, "epoch": 86, "lr": 9.54161980140888e-05} +{"train_loss": 0.007594941183924675, "global_step": 10239, "epoch": 86, "lr": 9.541527129414404e-05} +{"train_loss": 0.011131275445222855, "global_step": 10240, "epoch": 86, "lr": 9.541434448503126e-05} +{"train_loss": 0.010744304396212101, "global_step": 10241, "epoch": 86, "lr": 9.541341758675226e-05} +{"train_loss": 0.009119155816733837, "global_step": 10242, "epoch": 86, "lr": 9.541249059930886e-05} +{"train_loss": 0.008582960814237595, "global_step": 10243, "epoch": 86, "lr": 9.541156352270288e-05} +{"train_loss": 0.013950925320386887, "global_step": 10244, "epoch": 86, "lr": 9.541063635693616e-05} +{"train_loss": 0.010209711268544197, "global_step": 10245, "epoch": 86, "lr": 9.54097091020105e-05} +{"train_loss": 0.009806131012737751, "global_step": 10246, "epoch": 86, "lr": 9.540878175792774e-05} +{"train_loss": 0.011046944186091423, "global_step": 10247, "epoch": 86, "lr": 9.540785432468968e-05} +{"train_loss": 0.014927016571164131, "global_step": 10248, "epoch": 86, "lr": 9.540692680229814e-05} +{"train_loss": 0.014530804939568043, "global_step": 10249, "epoch": 86, "lr": 9.540599919075497e-05} +{"train_loss": 0.008046159520745277, "global_step": 10250, "epoch": 86, "lr": 9.540507149006196e-05} +{"train_loss": 0.006670877803117037, "global_step": 10251, "epoch": 86, "lr": 9.540414370022094e-05} +{"train_loss": 0.013226184993982315, "global_step": 10252, "epoch": 86, "lr": 9.540321582123374e-05} +{"train_loss": 0.009168851189315319, "global_step": 10253, "epoch": 86, "lr": 9.540228785310217e-05} +{"train_loss": 0.008909315802156925, "global_step": 10254, "epoch": 86, "lr": 9.540135979582808e-05} +{"train_loss": 0.009132777340710163, "global_step": 10255, "epoch": 86, "lr": 9.540043164941324e-05} +{"train_loss": 0.00952478963881731, "global_step": 10256, "epoch": 86, "lr": 9.539950341385952e-05} +{"train_loss": 0.007864370942115784, "global_step": 10257, "epoch": 86, "lr": 9.539857508916872e-05} +{"train_loss": 0.009417260065674782, "global_step": 10258, "epoch": 86, "lr": 9.539764667534265e-05} +{"train_loss": 0.008509975858032703, "global_step": 10259, "epoch": 86, "lr": 9.539671817238318e-05} +{"train_loss": 0.008230169303715229, "global_step": 10260, "epoch": 86, "lr": 9.539578958029209e-05} +{"train_loss": 0.008424261584877968, "global_step": 10261, "epoch": 86, "lr": 9.539486089907123e-05} +{"train_loss": 0.009766040369868279, "global_step": 10262, "epoch": 86, "lr": 9.53939321287224e-05} +{"train_loss": 0.01158534549176693, "global_step": 10263, "epoch": 86, "lr": 9.539300326924742e-05} +{"train_loss": 0.0085112564265728, "global_step": 10264, "epoch": 86, "lr": 9.539207432064814e-05} +{"train_loss": 0.009608114138245583, "global_step": 10265, "epoch": 86, "lr": 9.539114528292639e-05} +{"train_loss": 0.010871055535972118, "global_step": 10266, "epoch": 86, "lr": 9.539021615608395e-05} +{"train_loss": 0.010280575603246689, "global_step": 10267, "epoch": 86, "lr": 9.538928694012268e-05} +{"train_loss": 0.010782997123897076, "global_step": 10268, "epoch": 86, "lr": 9.538835763504438e-05} +{"train_loss": 0.010302933864295483, "global_step": 10269, "epoch": 86, "lr": 9.538742824085092e-05} +{"train_loss": 0.01035897247493267, "global_step": 10270, "epoch": 86, "lr": 9.538649875754408e-05} +{"train_loss": 0.006135846953839064, "global_step": 10271, "epoch": 86, "lr": 9.538556918512569e-05} +{"train_loss": 0.009242147207260132, "global_step": 10272, "epoch": 86, "lr": 9.538463952359759e-05} +{"train_loss": 0.010306712239980698, "global_step": 10273, "epoch": 86, "lr": 9.538370977296159e-05} +{"train_loss": 0.007070999592542648, "global_step": 10274, "epoch": 86, "lr": 9.538277993321953e-05} +{"train_loss": 0.007550220936536789, "global_step": 10275, "epoch": 86, "lr": 9.538185000437323e-05} +{"train_loss": 0.010569607838988304, "global_step": 10276, "epoch": 86, "lr": 9.538091998642452e-05} +{"train_loss": 0.0060467952862381935, "global_step": 10277, "epoch": 86, "lr": 9.537998987937521e-05} +{"train_loss": 0.011332998052239418, "global_step": 10278, "epoch": 86, "lr": 9.537905968322716e-05} +{"train_loss": 0.011206227354705334, "global_step": 10279, "epoch": 86, "lr": 9.537812939798216e-05} +{"train_loss": 0.011880893260240555, "global_step": 10280, "epoch": 86, "lr": 9.537719902364205e-05} +{"train_loss": 0.007111355662345886, "global_step": 10281, "epoch": 86, "lr": 9.537626856020867e-05} +{"train_loss": 0.008108030073344707, "global_step": 10282, "epoch": 86, "lr": 9.537533800768381e-05} +{"train_loss": 0.006849480327218771, "global_step": 10283, "epoch": 86, "lr": 9.537440736606934e-05} +{"train_loss": 0.011005546897649765, "global_step": 10284, "epoch": 86, "lr": 9.537347663536706e-05} +{"train_loss": 0.00558732682839036, "global_step": 10285, "epoch": 86, "lr": 9.537254581557882e-05} +{"train_loss": 0.008656419813632965, "global_step": 10286, "epoch": 86, "lr": 9.537161490670642e-05} +{"train_loss": 0.013495628722012043, "global_step": 10287, "epoch": 86, "lr": 9.53706839087517e-05} +{"train_loss": 0.00941880326718092, "global_step": 10288, "epoch": 86, "lr": 9.536975282171649e-05} +{"train_loss": 0.008787678554654121, "global_step": 10289, "epoch": 86, "lr": 9.536882164560263e-05} +{"train_loss": 0.008067290298640728, "global_step": 10290, "epoch": 86, "lr": 9.536789038041193e-05} +{"train_loss": 0.012349910102784634, "global_step": 10291, "epoch": 86, "lr": 9.536695902614622e-05} +{"train_loss": 0.011124556884169579, "global_step": 10292, "epoch": 86, "lr": 9.536602758280733e-05} +{"train_loss": 0.006105375941842794, "global_step": 10293, "epoch": 86, "lr": 9.53650960503971e-05} +{"train_loss": 0.007144308649003506, "global_step": 10294, "epoch": 86, "lr": 9.536416442891734e-05} +{"train_loss": 0.011121616698801517, "global_step": 10295, "epoch": 86, "lr": 9.536323271836991e-05} +{"train_loss": 0.01041836105287075, "global_step": 10296, "epoch": 86, "lr": 9.53623009187566e-05} +{"train_loss": 0.006707571446895599, "global_step": 10297, "epoch": 86, "lr": 9.536136903007926e-05} +{"train_loss": 0.0092572420835495, "global_step": 10298, "epoch": 86, "lr": 9.536043705233972e-05} +{"train_loss": 0.009471586905419827, "global_step": 10299, "epoch": 86, "lr": 9.53595049855398e-05} +{"train_loss": 0.014458740130066872, "global_step": 10300, "epoch": 86, "lr": 9.535857282968136e-05} +{"train_loss": 0.008558741770684719, "global_step": 10301, "epoch": 86, "lr": 9.53576405847662e-05} +{"train_loss": 0.007591879926621914, "global_step": 10302, "epoch": 86, "lr": 9.535670825079615e-05} +{"train_loss": 0.011289292946457863, "global_step": 10303, "epoch": 86, "lr": 9.535577582777305e-05} +{"train_loss": 0.011866315267980099, "global_step": 10304, "epoch": 86, "lr": 9.535484331569872e-05} +{"train_loss": 0.0071839941665530205, "global_step": 10305, "epoch": 86, "lr": 9.535391071457502e-05} +{"train_loss": 0.006585612427443266, "global_step": 10306, "epoch": 86, "lr": 9.535297802440376e-05} +{"train_loss": 0.008299439214169979, "global_step": 10307, "epoch": 86, "lr": 9.535204524518677e-05} +{"train_loss": 0.0063046785071492195, "global_step": 10308, "epoch": 86, "lr": 9.535111237692588e-05} +{"train_loss": 0.007069181650876999, "global_step": 10309, "epoch": 86, "lr": 9.535017941962292e-05} +{"train_loss": 0.00768665038049221, "global_step": 10310, "epoch": 86, "lr": 9.534924637327974e-05} +{"train_loss": 0.008434242568910122, "global_step": 10311, "epoch": 86, "lr": 9.534831323789815e-05} +{"train_loss": 0.008302649483084679, "global_step": 10312, "epoch": 86, "lr": 9.534738001348e-05} +{"train_loss": 0.006448482163250446, "global_step": 10313, "epoch": 86, "lr": 9.534644670002711e-05} +{"train_loss": 0.008525402285158634, "global_step": 10314, "epoch": 86, "lr": 9.534551329754133e-05} +{"train_loss": 0.011236361227929592, "global_step": 10315, "epoch": 86, "lr": 9.534457980602445e-05} +{"train_loss": 0.013304052874445915, "global_step": 10316, "epoch": 86, "lr": 9.534364622547836e-05} +{"train_loss": 0.008662618696689606, "global_step": 10317, "epoch": 86, "lr": 9.534271255590486e-05} +{"train_loss": 0.008812583051621914, "global_step": 10318, "epoch": 86, "lr": 9.534177879730577e-05} +{"train_loss": 0.007609276566654444, "global_step": 10319, "epoch": 86, "lr": 9.534084494968297e-05} +{"train_loss": 0.008398155681788921, "global_step": 10320, "epoch": 86, "lr": 9.533991101303823e-05} +{"train_loss": 0.006541960407048464, "global_step": 10321, "epoch": 86, "lr": 9.533897698737344e-05} +{"train_loss": 0.009522657841444016, "global_step": 10322, "epoch": 86, "lr": 9.53380428726904e-05} +{"train_loss": 0.011111714877188206, "global_step": 10323, "epoch": 86, "lr": 9.533710866899097e-05} +{"train_loss": 0.008182268589735031, "global_step": 10324, "epoch": 86, "lr": 9.533617437627696e-05} +{"train_loss": 0.010111088864505291, "global_step": 10325, "epoch": 86, "lr": 9.533523999455023e-05} +{"train_loss": 0.009098025038838387, "global_step": 10326, "epoch": 86, "lr": 9.533430552381258e-05} +{"train_loss": 0.014917255379259586, "global_step": 10327, "epoch": 86, "lr": 9.533337096406587e-05} +{"train_loss": 0.009559033438563347, "global_step": 10328, "epoch": 86, "lr": 9.533243631531195e-05} +{"train_loss": 0.007141719106584787, "global_step": 10329, "epoch": 86, "lr": 9.533150157755262e-05} +{"train_loss": 0.007818219251930714, "global_step": 10330, "epoch": 86, "lr": 9.533056675078971e-05} +{"train_loss": 0.009366091340780258, "global_step": 10331, "epoch": 86, "lr": 9.53296318350251e-05} +{"train_loss": 0.008761119097471237, "global_step": 10332, "epoch": 86, "lr": 9.53286968302606e-05} +{"train_loss": 0.007382493931800127, "global_step": 10333, "epoch": 86, "lr": 9.532776173649805e-05} +{"train_loss": 0.014293809421360493, "global_step": 10334, "epoch": 86, "lr": 9.532682655373926e-05} +{"train_loss": 0.008282492868602276, "global_step": 10335, "epoch": 86, "lr": 9.532589128198611e-05} +{"train_loss": 0.010454492643475533, "global_step": 10336, "epoch": 86, "lr": 9.53249559212404e-05} +{"train_loss": 0.011576330289244652, "global_step": 10337, "epoch": 86, "lr": 9.532402047150398e-05} +{"train_loss": 0.0086373807862401, "global_step": 10338, "epoch": 86, "lr": 9.53230849327787e-05} +{"train_loss": 0.007301836274564266, "global_step": 10339, "epoch": 86, "lr": 9.532214930506638e-05} +{"train_loss": 0.013979906216263771, "global_step": 10340, "epoch": 86, "lr": 9.532121358836885e-05} +{"train_loss": 0.009310356341302395, "global_step": 10341, "epoch": 86, "lr": 9.532027778268797e-05} +{"train_loss": 0.006968361791223288, "global_step": 10342, "epoch": 86, "lr": 9.531934188802558e-05} +{"train_loss": 0.008342662826180458, "global_step": 10343, "epoch": 86, "lr": 9.531840590438348e-05} +{"train_loss": 0.006793235428631306, "global_step": 10344, "epoch": 86, "lr": 9.531746983176355e-05} +{"train_loss": 0.006979198660701513, "global_step": 10345, "epoch": 86, "lr": 9.53165336701676e-05} +{"train_loss": 0.012050884775817394, "global_step": 10346, "epoch": 86, "lr": 9.531559741959748e-05} +{"train_loss": 0.009855899028480053, "global_step": 10347, "epoch": 86, "lr": 9.531466108005503e-05} +{"train_loss": 0.010738309472799301, "global_step": 10348, "epoch": 86, "lr": 9.531372465154207e-05} +{"train_loss": 0.006919358856976032, "global_step": 10349, "epoch": 86, "lr": 9.531278813406045e-05} +{"train_loss": 0.007950013503432274, "global_step": 10350, "epoch": 86, "lr": 9.531185152761204e-05} +{"train_loss": 0.005693987477570772, "global_step": 10351, "epoch": 86, "lr": 9.531091483219862e-05} +{"train_loss": 0.009380979576938543, "global_step": 10352, "epoch": 86, "lr": 9.530997804782208e-05, "val_loss": 0.01885736919939518} +{"train_loss": 0.01190000120550394, "global_step": 10353, "epoch": 87, "lr": 9.530904117448424e-05} +{"train_loss": 0.008310697041451931, "global_step": 10354, "epoch": 87, "lr": 9.530810421218692e-05} +{"train_loss": 0.009000043384730816, "global_step": 10355, "epoch": 87, "lr": 9.5307167160932e-05} +{"train_loss": 0.008219875395298004, "global_step": 10356, "epoch": 87, "lr": 9.530623002072127e-05} +{"train_loss": 0.01046360470354557, "global_step": 10357, "epoch": 87, "lr": 9.530529279155662e-05} +{"train_loss": 0.005831817630678415, "global_step": 10358, "epoch": 87, "lr": 9.530435547343986e-05} +{"train_loss": 0.008586851879954338, "global_step": 10359, "epoch": 87, "lr": 9.530341806637284e-05} +{"train_loss": 0.009527558460831642, "global_step": 10360, "epoch": 87, "lr": 9.53024805703574e-05} +{"train_loss": 0.007776553276926279, "global_step": 10361, "epoch": 87, "lr": 9.530154298539538e-05} +{"train_loss": 0.010457415133714676, "global_step": 10362, "epoch": 87, "lr": 9.530060531148861e-05} +{"train_loss": 0.008681226521730423, "global_step": 10363, "epoch": 87, "lr": 9.529966754863895e-05} +{"train_loss": 0.00878528505563736, "global_step": 10364, "epoch": 87, "lr": 9.529872969684823e-05} +{"train_loss": 0.00825019832700491, "global_step": 10365, "epoch": 87, "lr": 9.52977917561183e-05} +{"train_loss": 0.007942330092191696, "global_step": 10366, "epoch": 87, "lr": 9.529685372645099e-05} +{"train_loss": 0.008762739598751068, "global_step": 10367, "epoch": 87, "lr": 9.529591560784814e-05} +{"train_loss": 0.013233420439064503, "global_step": 10368, "epoch": 87, "lr": 9.529497740031162e-05} +{"train_loss": 0.00772120850160718, "global_step": 10369, "epoch": 87, "lr": 9.529403910384322e-05} +{"train_loss": 0.008236887864768505, "global_step": 10370, "epoch": 87, "lr": 9.529310071844484e-05} +{"train_loss": 0.008332774043083191, "global_step": 10371, "epoch": 87, "lr": 9.529216224411828e-05} +{"train_loss": 0.00785315502434969, "global_step": 10372, "epoch": 87, "lr": 9.529122368086541e-05} +{"train_loss": 0.012976001016795635, "global_step": 10373, "epoch": 87, "lr": 9.529028502868805e-05} +{"train_loss": 0.00905616581439972, "global_step": 10374, "epoch": 87, "lr": 9.528934628758806e-05} +{"train_loss": 0.010423588566482067, "global_step": 10375, "epoch": 87, "lr": 9.528840745756727e-05} +{"train_loss": 0.0073633273132145405, "global_step": 10376, "epoch": 87, "lr": 9.528746853862753e-05} +{"train_loss": 0.009431568905711174, "global_step": 10377, "epoch": 87, "lr": 9.528652953077068e-05} +{"train_loss": 0.008245156146585941, "global_step": 10378, "epoch": 87, "lr": 9.528559043399859e-05} +{"train_loss": 0.005115768872201443, "global_step": 10379, "epoch": 87, "lr": 9.528465124831307e-05} +{"train_loss": 0.0057630413211882114, "global_step": 10380, "epoch": 87, "lr": 9.528371197371597e-05} +{"train_loss": 0.01174890622496605, "global_step": 10381, "epoch": 87, "lr": 9.528277261020915e-05} +{"train_loss": 0.00891105830669403, "global_step": 10382, "epoch": 87, "lr": 9.528183315779444e-05} +{"train_loss": 0.007442701607942581, "global_step": 10383, "epoch": 87, "lr": 9.528089361647367e-05} +{"train_loss": 0.008322315290570259, "global_step": 10384, "epoch": 87, "lr": 9.527995398624871e-05} +{"train_loss": 0.009592458605766296, "global_step": 10385, "epoch": 87, "lr": 9.527901426712141e-05} +{"train_loss": 0.011592630296945572, "global_step": 10386, "epoch": 87, "lr": 9.52780744590936e-05} +{"train_loss": 0.006960602477192879, "global_step": 10387, "epoch": 87, "lr": 9.527713456216713e-05} +{"train_loss": 0.011347083374857903, "global_step": 10388, "epoch": 87, "lr": 9.527619457634385e-05} +{"train_loss": 0.006182153709232807, "global_step": 10389, "epoch": 87, "lr": 9.527525450162558e-05} +{"train_loss": 0.00953584536910057, "global_step": 10390, "epoch": 87, "lr": 9.527431433801419e-05} +{"train_loss": 0.011275647208094597, "global_step": 10391, "epoch": 87, "lr": 9.527337408551153e-05} +{"train_loss": 0.011671368032693863, "global_step": 10392, "epoch": 87, "lr": 9.527243374411943e-05} +{"train_loss": 0.008655420504510403, "global_step": 10393, "epoch": 87, "lr": 9.527149331383973e-05} +{"train_loss": 0.008342656306922436, "global_step": 10394, "epoch": 87, "lr": 9.527055279467432e-05} +{"train_loss": 0.012441867962479591, "global_step": 10395, "epoch": 87, "lr": 9.526961218662499e-05} +{"train_loss": 0.011027897708117962, "global_step": 10396, "epoch": 87, "lr": 9.526867148969361e-05} +{"train_loss": 0.008853644132614136, "global_step": 10397, "epoch": 87, "lr": 9.526773070388205e-05} +{"train_loss": 0.007071599829941988, "global_step": 10398, "epoch": 87, "lr": 9.526678982919213e-05} +{"train_loss": 0.016744310036301613, "global_step": 10399, "epoch": 87, "lr": 9.52658488656257e-05} +{"train_loss": 0.007573270238935947, "global_step": 10400, "epoch": 87, "lr": 9.526490781318463e-05} +{"train_loss": 0.013368695043027401, "global_step": 10401, "epoch": 87, "lr": 9.526396667187072e-05} +{"train_loss": 0.008766015991568565, "global_step": 10402, "epoch": 87, "lr": 9.526302544168587e-05} +{"train_loss": 0.012011999264359474, "global_step": 10403, "epoch": 87, "lr": 9.526208412263189e-05} +{"train_loss": 0.012972420081496239, "global_step": 10404, "epoch": 87, "lr": 9.526114271471065e-05} +{"train_loss": 0.008785792626440525, "global_step": 10405, "epoch": 87, "lr": 9.526020121792399e-05} +{"train_loss": 0.00700937956571579, "global_step": 10406, "epoch": 87, "lr": 9.525925963227376e-05} +{"train_loss": 0.008692285045981407, "global_step": 10407, "epoch": 87, "lr": 9.52583179577618e-05} +{"train_loss": 0.010015677660703659, "global_step": 10408, "epoch": 87, "lr": 9.525737619439e-05} +{"train_loss": 0.00701351510360837, "global_step": 10409, "epoch": 87, "lr": 9.525643434216014e-05} +{"train_loss": 0.007947225123643875, "global_step": 10410, "epoch": 87, "lr": 9.525549240107412e-05} +{"train_loss": 0.00896395742893219, "global_step": 10411, "epoch": 87, "lr": 9.525455037113378e-05} +{"train_loss": 0.011191288009285927, "global_step": 10412, "epoch": 87, "lr": 9.525360825234097e-05} +{"train_loss": 0.009990173391997814, "global_step": 10413, "epoch": 87, "lr": 9.525266604469752e-05} +{"train_loss": 0.008507261984050274, "global_step": 10414, "epoch": 87, "lr": 9.52517237482053e-05} +{"train_loss": 0.008548540063202381, "global_step": 10415, "epoch": 87, "lr": 9.525078136286616e-05} +{"train_loss": 0.010277727618813515, "global_step": 10416, "epoch": 87, "lr": 9.524983888868193e-05} +{"train_loss": 0.007994798943400383, "global_step": 10417, "epoch": 87, "lr": 9.52488963256545e-05} +{"train_loss": 0.012282412499189377, "global_step": 10418, "epoch": 87, "lr": 9.524795367378567e-05} +{"train_loss": 0.0069939070381224155, "global_step": 10419, "epoch": 87, "lr": 9.524701093307734e-05} +{"train_loss": 0.009612519294023514, "global_step": 10420, "epoch": 87, "lr": 9.524606810353132e-05} +{"train_loss": 0.007541922852396965, "global_step": 10421, "epoch": 87, "lr": 9.524512518514949e-05} +{"train_loss": 0.005095082800835371, "global_step": 10422, "epoch": 87, "lr": 9.524418217793369e-05} +{"train_loss": 0.009369623847305775, "global_step": 10423, "epoch": 87, "lr": 9.524323908188577e-05} +{"train_loss": 0.010724411346018314, "global_step": 10424, "epoch": 87, "lr": 9.524229589700759e-05} +{"train_loss": 0.005941221956163645, "global_step": 10425, "epoch": 87, "lr": 9.524135262330098e-05} +{"train_loss": 0.015416482463479042, "global_step": 10426, "epoch": 87, "lr": 9.524040926076782e-05} +{"train_loss": 0.010388885624706745, "global_step": 10427, "epoch": 87, "lr": 9.523946580940994e-05} +{"train_loss": 0.00585016468539834, "global_step": 10428, "epoch": 87, "lr": 9.52385222692292e-05} +{"train_loss": 0.008311981335282326, "global_step": 10429, "epoch": 87, "lr": 9.523757864022746e-05} +{"train_loss": 0.008326354436576366, "global_step": 10430, "epoch": 87, "lr": 9.523663492240657e-05} +{"train_loss": 0.009509557858109474, "global_step": 10431, "epoch": 87, "lr": 9.523569111576839e-05} +{"train_loss": 0.013975310139358044, "global_step": 10432, "epoch": 87, "lr": 9.523474722031476e-05} +{"train_loss": 0.01061050221323967, "global_step": 10433, "epoch": 87, "lr": 9.523380323604753e-05} +{"train_loss": 0.015034760348498821, "global_step": 10434, "epoch": 87, "lr": 9.523285916296855e-05} +{"train_loss": 0.007256072945892811, "global_step": 10435, "epoch": 87, "lr": 9.52319150010797e-05} +{"train_loss": 0.013570331037044525, "global_step": 10436, "epoch": 87, "lr": 9.523097075038281e-05} +{"train_loss": 0.007059497758746147, "global_step": 10437, "epoch": 87, "lr": 9.523002641087973e-05} +{"train_loss": 0.006989260204136372, "global_step": 10438, "epoch": 87, "lr": 9.522908198257235e-05} +{"train_loss": 0.014122959226369858, "global_step": 10439, "epoch": 87, "lr": 9.522813746546249e-05} +{"train_loss": 0.005864883307367563, "global_step": 10440, "epoch": 87, "lr": 9.522719285955199e-05} +{"train_loss": 0.008572757244110107, "global_step": 10441, "epoch": 87, "lr": 9.522624816484276e-05} +{"train_loss": 0.010686910711228848, "global_step": 10442, "epoch": 87, "lr": 9.522530338133661e-05} +{"train_loss": 0.008219740353524685, "global_step": 10443, "epoch": 87, "lr": 9.52243585090354e-05} +{"train_loss": 0.00789912324398756, "global_step": 10444, "epoch": 87, "lr": 9.522341354794102e-05} +{"train_loss": 0.01443654764443636, "global_step": 10445, "epoch": 87, "lr": 9.522246849805527e-05} +{"train_loss": 0.0158843956887722, "global_step": 10446, "epoch": 87, "lr": 9.522152335938005e-05} +{"train_loss": 0.01169415470212698, "global_step": 10447, "epoch": 87, "lr": 9.52205781319172e-05} +{"train_loss": 0.009938433766365051, "global_step": 10448, "epoch": 87, "lr": 9.521963281566857e-05} +{"train_loss": 0.01367627177387476, "global_step": 10449, "epoch": 87, "lr": 9.521868741063602e-05} +{"train_loss": 0.010135170072317123, "global_step": 10450, "epoch": 87, "lr": 9.521774191682143e-05} +{"train_loss": 0.00765852490440011, "global_step": 10451, "epoch": 87, "lr": 9.52167963342266e-05} +{"train_loss": 0.013023314997553825, "global_step": 10452, "epoch": 87, "lr": 9.521585066285345e-05} +{"train_loss": 0.009272699244320393, "global_step": 10453, "epoch": 87, "lr": 9.52149049027038e-05} +{"train_loss": 0.00979333370923996, "global_step": 10454, "epoch": 87, "lr": 9.52139590537795e-05} +{"train_loss": 0.009194908663630486, "global_step": 10455, "epoch": 87, "lr": 9.521301311608244e-05} +{"train_loss": 0.012267551384866238, "global_step": 10456, "epoch": 87, "lr": 9.521206708961446e-05} +{"train_loss": 0.008834918960928917, "global_step": 10457, "epoch": 87, "lr": 9.52111209743774e-05} +{"train_loss": 0.007629323750734329, "global_step": 10458, "epoch": 87, "lr": 9.521017477037315e-05} +{"train_loss": 0.011322187259793282, "global_step": 10459, "epoch": 87, "lr": 9.520922847760354e-05} +{"train_loss": 0.00727094616740942, "global_step": 10460, "epoch": 87, "lr": 9.520828209607045e-05} +{"train_loss": 0.007561800070106983, "global_step": 10461, "epoch": 87, "lr": 9.52073356257757e-05} +{"train_loss": 0.006710023153573275, "global_step": 10462, "epoch": 87, "lr": 9.520638906672122e-05} +{"train_loss": 0.010462906211614609, "global_step": 10463, "epoch": 87, "lr": 9.52054424189088e-05} +{"train_loss": 0.010115260258316994, "global_step": 10464, "epoch": 87, "lr": 9.520449568234033e-05} +{"train_loss": 0.00762367807328701, "global_step": 10465, "epoch": 87, "lr": 9.520354885701766e-05} +{"train_loss": 0.008679931983351707, "global_step": 10466, "epoch": 87, "lr": 9.520260194294264e-05} +{"train_loss": 0.011073696427047253, "global_step": 10467, "epoch": 87, "lr": 9.520165494011715e-05} +{"train_loss": 0.008481676690280437, "global_step": 10468, "epoch": 87, "lr": 9.520070784854304e-05} +{"train_loss": 0.006873604841530323, "global_step": 10469, "epoch": 87, "lr": 9.519976066822217e-05} +{"train_loss": 0.009874878451228142, "global_step": 10470, "epoch": 87, "lr": 9.51988133991564e-05} +{"train_loss": 0.009450417630249211, "global_step": 10471, "epoch": 87, "lr": 9.519786604134758e-05, "val_loss": 0.018628908321261406} +{"train_loss": 0.00640258751809597, "global_step": 10472, "epoch": 88, "lr": 9.519691859479757e-05} +{"train_loss": 0.013836192898452282, "global_step": 10473, "epoch": 88, "lr": 9.519597105950827e-05} +{"train_loss": 0.012438478879630566, "global_step": 10474, "epoch": 88, "lr": 9.51950234354815e-05} +{"train_loss": 0.009498871862888336, "global_step": 10475, "epoch": 88, "lr": 9.519407572271912e-05} +{"train_loss": 0.006835402455180883, "global_step": 10476, "epoch": 88, "lr": 9.519312792122301e-05} +{"train_loss": 0.0050186458975076675, "global_step": 10477, "epoch": 88, "lr": 9.519218003099501e-05} +{"train_loss": 0.012173129245638847, "global_step": 10478, "epoch": 88, "lr": 9.5191232052037e-05} +{"train_loss": 0.01110679842531681, "global_step": 10479, "epoch": 88, "lr": 9.519028398435082e-05} +{"train_loss": 0.011694056913256645, "global_step": 10480, "epoch": 88, "lr": 9.518933582793836e-05} +{"train_loss": 0.010560736991465092, "global_step": 10481, "epoch": 88, "lr": 9.518838758280146e-05} +{"train_loss": 0.011144713498651981, "global_step": 10482, "epoch": 88, "lr": 9.5187439248942e-05} +{"train_loss": 0.008603803813457489, "global_step": 10483, "epoch": 88, "lr": 9.518649082636182e-05} +{"train_loss": 0.007639455143362284, "global_step": 10484, "epoch": 88, "lr": 9.51855423150628e-05} +{"train_loss": 0.006751521490514278, "global_step": 10485, "epoch": 88, "lr": 9.518459371504679e-05} +{"train_loss": 0.00836342852562666, "global_step": 10486, "epoch": 88, "lr": 9.518364502631564e-05} +{"train_loss": 0.01220310665667057, "global_step": 10487, "epoch": 88, "lr": 9.518269624887126e-05} +{"train_loss": 0.0095093147829175, "global_step": 10488, "epoch": 88, "lr": 9.518174738271549e-05} +{"train_loss": 0.009915901347994804, "global_step": 10489, "epoch": 88, "lr": 9.518079842785015e-05} +{"train_loss": 0.006902774330228567, "global_step": 10490, "epoch": 88, "lr": 9.517984938427715e-05} +{"train_loss": 0.010560659691691399, "global_step": 10491, "epoch": 88, "lr": 9.517890025199836e-05} +{"train_loss": 0.011182008311152458, "global_step": 10492, "epoch": 88, "lr": 9.517795103101562e-05} +{"train_loss": 0.010621505789458752, "global_step": 10493, "epoch": 88, "lr": 9.517700172133079e-05} +{"train_loss": 0.008085078559815884, "global_step": 10494, "epoch": 88, "lr": 9.517605232294575e-05} +{"train_loss": 0.00773311173543334, "global_step": 10495, "epoch": 88, "lr": 9.517510283586235e-05} +{"train_loss": 0.010749218054115772, "global_step": 10496, "epoch": 88, "lr": 9.517415326008248e-05} +{"train_loss": 0.008912581019103527, "global_step": 10497, "epoch": 88, "lr": 9.517320359560796e-05} +{"train_loss": 0.010004321113228798, "global_step": 10498, "epoch": 88, "lr": 9.517225384244071e-05} +{"train_loss": 0.008436049334704876, "global_step": 10499, "epoch": 88, "lr": 9.517130400058253e-05} +{"train_loss": 0.008532221429049969, "global_step": 10500, "epoch": 88, "lr": 9.517035407003535e-05} +{"train_loss": 0.012080756947398186, "global_step": 10501, "epoch": 88, "lr": 9.516940405080099e-05} +{"train_loss": 0.007325794547796249, "global_step": 10502, "epoch": 88, "lr": 9.516845394288134e-05} +{"train_loss": 0.00950663723051548, "global_step": 10503, "epoch": 88, "lr": 9.516750374627826e-05} +{"train_loss": 0.008910740725696087, "global_step": 10504, "epoch": 88, "lr": 9.51665534609936e-05} +{"train_loss": 0.012283279560506344, "global_step": 10505, "epoch": 88, "lr": 9.516560308702924e-05} +{"train_loss": 0.008504016324877739, "global_step": 10506, "epoch": 88, "lr": 9.516465262438705e-05} +{"train_loss": 0.00929418858140707, "global_step": 10507, "epoch": 88, "lr": 9.516370207306888e-05} +{"train_loss": 0.00898038037121296, "global_step": 10508, "epoch": 88, "lr": 9.516275143307662e-05} +{"train_loss": 0.009824422188103199, "global_step": 10509, "epoch": 88, "lr": 9.516180070441212e-05} +{"train_loss": 0.009775320068001747, "global_step": 10510, "epoch": 88, "lr": 9.516084988707724e-05} +{"train_loss": 0.006534108892083168, "global_step": 10511, "epoch": 88, "lr": 9.515989898107384e-05} +{"train_loss": 0.00783170759677887, "global_step": 10512, "epoch": 88, "lr": 9.515894798640384e-05} +{"train_loss": 0.011192353442311287, "global_step": 10513, "epoch": 88, "lr": 9.515799690306906e-05} +{"train_loss": 0.005383426323533058, "global_step": 10514, "epoch": 88, "lr": 9.515704573107137e-05} +{"train_loss": 0.009220478124916553, "global_step": 10515, "epoch": 88, "lr": 9.515609447041262e-05} +{"train_loss": 0.009813395328819752, "global_step": 10516, "epoch": 88, "lr": 9.515514312109475e-05} +{"train_loss": 0.006241178140044212, "global_step": 10517, "epoch": 88, "lr": 9.515419168311955e-05} +{"train_loss": 0.011485601775348186, "global_step": 10518, "epoch": 88, "lr": 9.515324015648892e-05} +{"train_loss": 0.00815097987651825, "global_step": 10519, "epoch": 88, "lr": 9.515228854120475e-05} +{"train_loss": 0.014153662137687206, "global_step": 10520, "epoch": 88, "lr": 9.515133683726886e-05} +{"train_loss": 0.010665363632142544, "global_step": 10521, "epoch": 88, "lr": 9.515038504468316e-05} +{"train_loss": 0.008396010845899582, "global_step": 10522, "epoch": 88, "lr": 9.514943316344949e-05} +{"train_loss": 0.010655502788722515, "global_step": 10523, "epoch": 88, "lr": 9.514848119356974e-05} +{"train_loss": 0.010475289076566696, "global_step": 10524, "epoch": 88, "lr": 9.514752913504576e-05} +{"train_loss": 0.006072813645005226, "global_step": 10525, "epoch": 88, "lr": 9.514657698787944e-05} +{"train_loss": 0.006633649114519358, "global_step": 10526, "epoch": 88, "lr": 9.514562475207265e-05} +{"train_loss": 0.006958091165870428, "global_step": 10527, "epoch": 88, "lr": 9.514467242762722e-05} +{"train_loss": 0.012479033321142197, "global_step": 10528, "epoch": 88, "lr": 9.514372001454506e-05} +{"train_loss": 0.010039872489869595, "global_step": 10529, "epoch": 88, "lr": 9.514276751282805e-05} +{"train_loss": 0.009094555862247944, "global_step": 10530, "epoch": 88, "lr": 9.514181492247803e-05} +{"train_loss": 0.007308460772037506, "global_step": 10531, "epoch": 88, "lr": 9.514086224349686e-05} +{"train_loss": 0.009948056191205978, "global_step": 10532, "epoch": 88, "lr": 9.513990947588643e-05} +{"train_loss": 0.012215808965265751, "global_step": 10533, "epoch": 88, "lr": 9.513895661964862e-05} +{"train_loss": 0.008625390939414501, "global_step": 10534, "epoch": 88, "lr": 9.51380036747853e-05} +{"train_loss": 0.00834193080663681, "global_step": 10535, "epoch": 88, "lr": 9.513705064129832e-05} +{"train_loss": 0.009093891829252243, "global_step": 10536, "epoch": 88, "lr": 9.513609751918957e-05} +{"train_loss": 0.004320950713008642, "global_step": 10537, "epoch": 88, "lr": 9.513514430846091e-05} +{"train_loss": 0.009678525850176811, "global_step": 10538, "epoch": 88, "lr": 9.513419100911422e-05} +{"train_loss": 0.00945383869111538, "global_step": 10539, "epoch": 88, "lr": 9.513323762115136e-05} +{"train_loss": 0.010901490226387978, "global_step": 10540, "epoch": 88, "lr": 9.513228414457423e-05} +{"train_loss": 0.005921473726630211, "global_step": 10541, "epoch": 88, "lr": 9.513133057938466e-05} +{"train_loss": 0.015001942403614521, "global_step": 10542, "epoch": 88, "lr": 9.513037692558455e-05} +{"train_loss": 0.007163806352764368, "global_step": 10543, "epoch": 88, "lr": 9.512942318317577e-05} +{"train_loss": 0.005715852603316307, "global_step": 10544, "epoch": 88, "lr": 9.512846935216018e-05} +{"train_loss": 0.007629201747477055, "global_step": 10545, "epoch": 88, "lr": 9.512751543253967e-05} +{"train_loss": 0.008127456530928612, "global_step": 10546, "epoch": 88, "lr": 9.51265614243161e-05} +{"train_loss": 0.01057166513055563, "global_step": 10547, "epoch": 88, "lr": 9.512560732749137e-05} +{"train_loss": 0.006959948688745499, "global_step": 10548, "epoch": 88, "lr": 9.512465314206729e-05} +{"train_loss": 0.004858169239014387, "global_step": 10549, "epoch": 88, "lr": 9.51236988680458e-05} +{"train_loss": 0.006980805657804012, "global_step": 10550, "epoch": 88, "lr": 9.512274450542876e-05} +{"train_loss": 0.008601857349276543, "global_step": 10551, "epoch": 88, "lr": 9.5121790054218e-05} +{"train_loss": 0.009232631884515285, "global_step": 10552, "epoch": 88, "lr": 9.512083551441544e-05} +{"train_loss": 0.009980532340705395, "global_step": 10553, "epoch": 88, "lr": 9.511988088602295e-05} +{"train_loss": 0.009325919672846794, "global_step": 10554, "epoch": 88, "lr": 9.511892616904239e-05} +{"train_loss": 0.009998107329010963, "global_step": 10555, "epoch": 88, "lr": 9.511797136347562e-05} +{"train_loss": 0.0067656319588422775, "global_step": 10556, "epoch": 88, "lr": 9.511701646932457e-05} +{"train_loss": 0.009843307547271252, "global_step": 10557, "epoch": 88, "lr": 9.511606148659105e-05} +{"train_loss": 0.006055222358554602, "global_step": 10558, "epoch": 88, "lr": 9.511510641527695e-05} +{"train_loss": 0.010432885959744453, "global_step": 10559, "epoch": 88, "lr": 9.511415125538419e-05} +{"train_loss": 0.006898366380482912, "global_step": 10560, "epoch": 88, "lr": 9.511319600691459e-05} +{"train_loss": 0.009827119298279285, "global_step": 10561, "epoch": 88, "lr": 9.511224066987007e-05} +{"train_loss": 0.009117637760937214, "global_step": 10562, "epoch": 88, "lr": 9.511128524425248e-05} +{"train_loss": 0.009565195068717003, "global_step": 10563, "epoch": 88, "lr": 9.511032973006369e-05} +{"train_loss": 0.008669753558933735, "global_step": 10564, "epoch": 88, "lr": 9.510937412730558e-05} +{"train_loss": 0.013613175600767136, "global_step": 10565, "epoch": 88, "lr": 9.510841843598006e-05} +{"train_loss": 0.009725874289870262, "global_step": 10566, "epoch": 88, "lr": 9.510746265608896e-05} +{"train_loss": 0.011768116615712643, "global_step": 10567, "epoch": 88, "lr": 9.510650678763419e-05} +{"train_loss": 0.007730219513177872, "global_step": 10568, "epoch": 88, "lr": 9.51055508306176e-05} +{"train_loss": 0.007318597286939621, "global_step": 10569, "epoch": 88, "lr": 9.510459478504107e-05} +{"train_loss": 0.007470362354069948, "global_step": 10570, "epoch": 88, "lr": 9.510363865090652e-05} +{"train_loss": 0.010470458306372166, "global_step": 10571, "epoch": 88, "lr": 9.510268242821577e-05} +{"train_loss": 0.00716459471732378, "global_step": 10572, "epoch": 88, "lr": 9.510172611697072e-05} +{"train_loss": 0.0078684501349926, "global_step": 10573, "epoch": 88, "lr": 9.510076971717327e-05} +{"train_loss": 0.006493974942713976, "global_step": 10574, "epoch": 88, "lr": 9.509981322882527e-05} +{"train_loss": 0.01252746395766735, "global_step": 10575, "epoch": 88, "lr": 9.50988566519286e-05} +{"train_loss": 0.010626627132296562, "global_step": 10576, "epoch": 88, "lr": 9.509789998648513e-05} +{"train_loss": 0.007047989871352911, "global_step": 10577, "epoch": 88, "lr": 9.509694323249676e-05} +{"train_loss": 0.00842040404677391, "global_step": 10578, "epoch": 88, "lr": 9.509598638996536e-05} +{"train_loss": 0.006941885221749544, "global_step": 10579, "epoch": 88, "lr": 9.509502945889281e-05} +{"train_loss": 0.013128841295838356, "global_step": 10580, "epoch": 88, "lr": 9.5094072439281e-05} +{"train_loss": 0.009914613328874111, "global_step": 10581, "epoch": 88, "lr": 9.509311533113178e-05} +{"train_loss": 0.007107262499630451, "global_step": 10582, "epoch": 88, "lr": 9.509215813444706e-05} +{"train_loss": 0.011715714819729328, "global_step": 10583, "epoch": 88, "lr": 9.509120084922869e-05} +{"train_loss": 0.006036955397576094, "global_step": 10584, "epoch": 88, "lr": 9.509024347547857e-05} +{"train_loss": 0.011915306560695171, "global_step": 10585, "epoch": 88, "lr": 9.508928601319857e-05} +{"train_loss": 0.012735980562865734, "global_step": 10586, "epoch": 88, "lr": 9.508832846239057e-05} +{"train_loss": 0.006649009417742491, "global_step": 10587, "epoch": 88, "lr": 9.508737082305647e-05} +{"train_loss": 0.010337087325751781, "global_step": 10588, "epoch": 88, "lr": 9.508641309519812e-05} +{"train_loss": 0.013037648983299732, "global_step": 10589, "epoch": 88, "lr": 9.508545527881743e-05} +{"train_loss": 0.009219667040782064, "global_step": 10590, "epoch": 88, "lr": 9.508449737391625e-05, "val_loss": 0.011999481357634068} +{"train_loss": 0.013109478168189526, "global_step": 10591, "epoch": 89, "lr": 9.508353938049648e-05} +{"train_loss": 0.017680762335658073, "global_step": 10592, "epoch": 89, "lr": 9.508258129856001e-05} +{"train_loss": 0.009338012896478176, "global_step": 10593, "epoch": 89, "lr": 9.508162312810869e-05} +{"train_loss": 0.012361941859126091, "global_step": 10594, "epoch": 89, "lr": 9.508066486914442e-05} +{"train_loss": 0.012002185918390751, "global_step": 10595, "epoch": 89, "lr": 9.507970652166909e-05} +{"train_loss": 0.00951459538191557, "global_step": 10596, "epoch": 89, "lr": 9.507874808568457e-05} +{"train_loss": 0.007501138374209404, "global_step": 10597, "epoch": 89, "lr": 9.507778956119274e-05} +{"train_loss": 0.007527139503508806, "global_step": 10598, "epoch": 89, "lr": 9.50768309481955e-05} +{"train_loss": 0.009428901597857475, "global_step": 10599, "epoch": 89, "lr": 9.507587224669469e-05} +{"train_loss": 0.00820083636790514, "global_step": 10600, "epoch": 89, "lr": 9.507491345669225e-05} +{"train_loss": 0.0057197934947907925, "global_step": 10601, "epoch": 89, "lr": 9.507395457819001e-05} +{"train_loss": 0.009132719598710537, "global_step": 10602, "epoch": 89, "lr": 9.50729956111899e-05} +{"train_loss": 0.01467023603618145, "global_step": 10603, "epoch": 89, "lr": 9.507203655569376e-05} +{"train_loss": 0.011857995763421059, "global_step": 10604, "epoch": 89, "lr": 9.50710774117035e-05} +{"train_loss": 0.011077234521508217, "global_step": 10605, "epoch": 89, "lr": 9.507011817922099e-05} +{"train_loss": 0.008768575266003609, "global_step": 10606, "epoch": 89, "lr": 9.506915885824812e-05} +{"train_loss": 0.0058131651021540165, "global_step": 10607, "epoch": 89, "lr": 9.506819944878678e-05} +{"train_loss": 0.009143105708062649, "global_step": 10608, "epoch": 89, "lr": 9.506723995083881e-05} +{"train_loss": 0.010933329351246357, "global_step": 10609, "epoch": 89, "lr": 9.506628036440617e-05} +{"train_loss": 0.00955759733915329, "global_step": 10610, "epoch": 89, "lr": 9.50653206894907e-05} +{"train_loss": 0.01191206369549036, "global_step": 10611, "epoch": 89, "lr": 9.506436092609425e-05} +{"train_loss": 0.013253698125481606, "global_step": 10612, "epoch": 89, "lr": 9.506340107421878e-05} +{"train_loss": 0.010786638595163822, "global_step": 10613, "epoch": 89, "lr": 9.506244113386612e-05} +{"train_loss": 0.008130501955747604, "global_step": 10614, "epoch": 89, "lr": 9.506148110503818e-05} +{"train_loss": 0.011357767507433891, "global_step": 10615, "epoch": 89, "lr": 9.506052098773684e-05} +{"train_loss": 0.013604678213596344, "global_step": 10616, "epoch": 89, "lr": 9.505956078196397e-05} +{"train_loss": 0.0071105025708675385, "global_step": 10617, "epoch": 89, "lr": 9.505860048772146e-05} +{"train_loss": 0.00609353743493557, "global_step": 10618, "epoch": 89, "lr": 9.50576401050112e-05} +{"train_loss": 0.01263527199625969, "global_step": 10619, "epoch": 89, "lr": 9.505667963383508e-05} +{"train_loss": 0.010358601808547974, "global_step": 10620, "epoch": 89, "lr": 9.505571907419501e-05} +{"train_loss": 0.008457643911242485, "global_step": 10621, "epoch": 89, "lr": 9.505475842609282e-05} +{"train_loss": 0.009098978713154793, "global_step": 10622, "epoch": 89, "lr": 9.505379768953044e-05} +{"train_loss": 0.009462663903832436, "global_step": 10623, "epoch": 89, "lr": 9.505283686450973e-05} +{"train_loss": 0.008380348794162273, "global_step": 10624, "epoch": 89, "lr": 9.50518759510326e-05} +{"train_loss": 0.012167045846581459, "global_step": 10625, "epoch": 89, "lr": 9.50509149491009e-05} +{"train_loss": 0.01272099744528532, "global_step": 10626, "epoch": 89, "lr": 9.504995385871657e-05} +{"train_loss": 0.00914907269179821, "global_step": 10627, "epoch": 89, "lr": 9.504899267988145e-05} +{"train_loss": 0.007424337323755026, "global_step": 10628, "epoch": 89, "lr": 9.504803141259746e-05} +{"train_loss": 0.011751226149499416, "global_step": 10629, "epoch": 89, "lr": 9.504707005686648e-05} +{"train_loss": 0.0137330936267972, "global_step": 10630, "epoch": 89, "lr": 9.504610861269036e-05} +{"train_loss": 0.008160920813679695, "global_step": 10631, "epoch": 89, "lr": 9.504514708007105e-05} +{"train_loss": 0.00901777297258377, "global_step": 10632, "epoch": 89, "lr": 9.504418545901039e-05} +{"train_loss": 0.011734348721802235, "global_step": 10633, "epoch": 89, "lr": 9.504322374951028e-05} +{"train_loss": 0.01506062876433134, "global_step": 10634, "epoch": 89, "lr": 9.504226195157262e-05} +{"train_loss": 0.006370130460709333, "global_step": 10635, "epoch": 89, "lr": 9.504130006519929e-05} +{"train_loss": 0.00905685406178236, "global_step": 10636, "epoch": 89, "lr": 9.504033809039217e-05} +{"train_loss": 0.011042026802897453, "global_step": 10637, "epoch": 89, "lr": 9.503937602715318e-05} +{"train_loss": 0.01097621489316225, "global_step": 10638, "epoch": 89, "lr": 9.503841387548417e-05} +{"train_loss": 0.0071611907333135605, "global_step": 10639, "epoch": 89, "lr": 9.503745163538704e-05} +{"train_loss": 0.013331588357686996, "global_step": 10640, "epoch": 89, "lr": 9.50364893068637e-05} +{"train_loss": 0.009122462943196297, "global_step": 10641, "epoch": 89, "lr": 9.503552688991602e-05} +{"train_loss": 0.0080651780590415, "global_step": 10642, "epoch": 89, "lr": 9.50345643845459e-05} +{"train_loss": 0.011270520277321339, "global_step": 10643, "epoch": 89, "lr": 9.50336017907552e-05} +{"train_loss": 0.009009310975670815, "global_step": 10644, "epoch": 89, "lr": 9.503263910854586e-05} +{"train_loss": 0.009229866787791252, "global_step": 10645, "epoch": 89, "lr": 9.503167633791974e-05} +{"train_loss": 0.00829208455979824, "global_step": 10646, "epoch": 89, "lr": 9.503071347887872e-05} +{"train_loss": 0.007020789198577404, "global_step": 10647, "epoch": 89, "lr": 9.502975053142473e-05} +{"train_loss": 0.01018398255109787, "global_step": 10648, "epoch": 89, "lr": 9.50287874955596e-05} +{"train_loss": 0.00934829842299223, "global_step": 10649, "epoch": 89, "lr": 9.502782437128529e-05} +{"train_loss": 0.010737325996160507, "global_step": 10650, "epoch": 89, "lr": 9.502686115860364e-05} +{"train_loss": 0.010700452141463757, "global_step": 10651, "epoch": 89, "lr": 9.502589785751657e-05} +{"train_loss": 0.009418470785021782, "global_step": 10652, "epoch": 89, "lr": 9.502493446802595e-05} +{"train_loss": 0.009011422283947468, "global_step": 10653, "epoch": 89, "lr": 9.502397099013369e-05} +{"train_loss": 0.009459925815463066, "global_step": 10654, "epoch": 89, "lr": 9.502300742384167e-05} +{"train_loss": 0.010045172646641731, "global_step": 10655, "epoch": 89, "lr": 9.502204376915178e-05} +{"train_loss": 0.008302081376314163, "global_step": 10656, "epoch": 89, "lr": 9.502108002606592e-05} +{"train_loss": 0.010938229039311409, "global_step": 10657, "epoch": 89, "lr": 9.502011619458597e-05} +{"train_loss": 0.007796477992087603, "global_step": 10658, "epoch": 89, "lr": 9.501915227471384e-05} +{"train_loss": 0.009624890983104706, "global_step": 10659, "epoch": 89, "lr": 9.501818826645141e-05} +{"train_loss": 0.007815594784915447, "global_step": 10660, "epoch": 89, "lr": 9.501722416980059e-05} +{"train_loss": 0.009890301153063774, "global_step": 10661, "epoch": 89, "lr": 9.501625998476325e-05} +{"train_loss": 0.005775083787739277, "global_step": 10662, "epoch": 89, "lr": 9.501529571134129e-05} +{"train_loss": 0.009081070311367512, "global_step": 10663, "epoch": 89, "lr": 9.501433134953662e-05} +{"train_loss": 0.0057877181097865105, "global_step": 10664, "epoch": 89, "lr": 9.50133668993511e-05} +{"train_loss": 0.00942403543740511, "global_step": 10665, "epoch": 89, "lr": 9.501240236078666e-05} +{"train_loss": 0.009204437024891376, "global_step": 10666, "epoch": 89, "lr": 9.501143773384516e-05} +{"train_loss": 0.007161862216889858, "global_step": 10667, "epoch": 89, "lr": 9.501047301852852e-05} +{"train_loss": 0.014666436240077019, "global_step": 10668, "epoch": 89, "lr": 9.500950821483863e-05} +{"train_loss": 0.007327033206820488, "global_step": 10669, "epoch": 89, "lr": 9.500854332277736e-05} +{"train_loss": 0.006311176810413599, "global_step": 10670, "epoch": 89, "lr": 9.500757834234664e-05} +{"train_loss": 0.007301481906324625, "global_step": 10671, "epoch": 89, "lr": 9.500661327354834e-05} +{"train_loss": 0.008303552865982056, "global_step": 10672, "epoch": 89, "lr": 9.500564811638438e-05} +{"train_loss": 0.010931579396128654, "global_step": 10673, "epoch": 89, "lr": 9.500468287085662e-05} +{"train_loss": 0.00843795109540224, "global_step": 10674, "epoch": 89, "lr": 9.500371753696698e-05} +{"train_loss": 0.008783544413745403, "global_step": 10675, "epoch": 89, "lr": 9.500275211471734e-05} +{"train_loss": 0.005588874686509371, "global_step": 10676, "epoch": 89, "lr": 9.500178660410963e-05} +{"train_loss": 0.010123921558260918, "global_step": 10677, "epoch": 89, "lr": 9.50008210051457e-05} +{"train_loss": 0.007784989662468433, "global_step": 10678, "epoch": 89, "lr": 9.499985531782747e-05} +{"train_loss": 0.011179843917489052, "global_step": 10679, "epoch": 89, "lr": 9.499888954215683e-05} +{"train_loss": 0.008303098380565643, "global_step": 10680, "epoch": 89, "lr": 9.499792367813567e-05} +{"train_loss": 0.0125865014269948, "global_step": 10681, "epoch": 89, "lr": 9.49969577257659e-05} +{"train_loss": 0.008864625357091427, "global_step": 10682, "epoch": 89, "lr": 9.499599168504941e-05} +{"train_loss": 0.008131424896419048, "global_step": 10683, "epoch": 89, "lr": 9.49950255559881e-05} +{"train_loss": 0.01111073698848486, "global_step": 10684, "epoch": 89, "lr": 9.499405933858386e-05} +{"train_loss": 0.012069402262568474, "global_step": 10685, "epoch": 89, "lr": 9.49930930328386e-05} +{"train_loss": 0.009411169216036797, "global_step": 10686, "epoch": 89, "lr": 9.499212663875421e-05} +{"train_loss": 0.008979766629636288, "global_step": 10687, "epoch": 89, "lr": 9.499116015633257e-05} +{"train_loss": 0.012142610736191273, "global_step": 10688, "epoch": 89, "lr": 9.49901935855756e-05} +{"train_loss": 0.008095277473330498, "global_step": 10689, "epoch": 89, "lr": 9.498922692648519e-05} +{"train_loss": 0.00788866076618433, "global_step": 10690, "epoch": 89, "lr": 9.498826017906326e-05} +{"train_loss": 0.00841991975903511, "global_step": 10691, "epoch": 89, "lr": 9.498729334331167e-05} +{"train_loss": 0.009749108925461769, "global_step": 10692, "epoch": 89, "lr": 9.498632641923233e-05} +{"train_loss": 0.0076162489131093025, "global_step": 10693, "epoch": 89, "lr": 9.498535940682716e-05} +{"train_loss": 0.007131011690944433, "global_step": 10694, "epoch": 89, "lr": 9.498439230609803e-05} +{"train_loss": 0.010523787699639797, "global_step": 10695, "epoch": 89, "lr": 9.498342511704685e-05} +{"train_loss": 0.00956272054463625, "global_step": 10696, "epoch": 89, "lr": 9.498245783967553e-05} +{"train_loss": 0.012163978070020676, "global_step": 10697, "epoch": 89, "lr": 9.498149047398596e-05} +{"train_loss": 0.009757010266184807, "global_step": 10698, "epoch": 89, "lr": 9.498052301998004e-05} +{"train_loss": 0.0073427604511380196, "global_step": 10699, "epoch": 89, "lr": 9.497955547765965e-05} +{"train_loss": 0.009153902530670166, "global_step": 10700, "epoch": 89, "lr": 9.497858784702674e-05} +{"train_loss": 0.005889428313821554, "global_step": 10701, "epoch": 89, "lr": 9.497762012808316e-05} +{"train_loss": 0.010089504532516003, "global_step": 10702, "epoch": 89, "lr": 9.497665232083082e-05} +{"train_loss": 0.010178651660680771, "global_step": 10703, "epoch": 89, "lr": 9.497568442527163e-05} +{"train_loss": 0.01254526898264885, "global_step": 10704, "epoch": 89, "lr": 9.497471644140749e-05} +{"train_loss": 0.010861963964998722, "global_step": 10705, "epoch": 89, "lr": 9.497374836924032e-05} +{"train_loss": 0.00985655002295971, "global_step": 10706, "epoch": 89, "lr": 9.497278020877198e-05} +{"train_loss": 0.008885546587407589, "global_step": 10707, "epoch": 89, "lr": 9.497181196000438e-05} +{"train_loss": 0.011125770397484303, "global_step": 10708, "epoch": 89, "lr": 9.497084362293946e-05} +{"train_loss": 0.00965759003566218, "global_step": 10709, "epoch": 89, "lr": 9.496987519757907e-05, "val_loss": 0.018689913675189018} +{"train_loss": 0.011347866617143154, "global_step": 10710, "epoch": 90, "lr": 9.496890668392515e-05} +{"train_loss": 0.009287120774388313, "global_step": 10711, "epoch": 90, "lr": 9.496793808197957e-05} +{"train_loss": 0.00925229862332344, "global_step": 10712, "epoch": 90, "lr": 9.496696939174426e-05} +{"train_loss": 0.010984820313751698, "global_step": 10713, "epoch": 90, "lr": 9.49660006132211e-05} +{"train_loss": 0.007273172028362751, "global_step": 10714, "epoch": 90, "lr": 9.496503174641201e-05} +{"train_loss": 0.00859282910823822, "global_step": 10715, "epoch": 90, "lr": 9.496406279131889e-05} +{"train_loss": 0.010416032746434212, "global_step": 10716, "epoch": 90, "lr": 9.496309374794363e-05} +{"train_loss": 0.009963670745491982, "global_step": 10717, "epoch": 90, "lr": 9.496212461628813e-05} +{"train_loss": 0.00821937620639801, "global_step": 10718, "epoch": 90, "lr": 9.49611553963543e-05} +{"train_loss": 0.008190132677555084, "global_step": 10719, "epoch": 90, "lr": 9.496018608814407e-05} +{"train_loss": 0.00809442438185215, "global_step": 10720, "epoch": 90, "lr": 9.495921669165931e-05} +{"train_loss": 0.007963264361023903, "global_step": 10721, "epoch": 90, "lr": 9.495824720690192e-05} +{"train_loss": 0.011650963686406612, "global_step": 10722, "epoch": 90, "lr": 9.495727763387381e-05} +{"train_loss": 0.010649869218468666, "global_step": 10723, "epoch": 90, "lr": 9.49563079725769e-05} +{"train_loss": 0.012573210522532463, "global_step": 10724, "epoch": 90, "lr": 9.495533822301307e-05} +{"train_loss": 0.007815766148269176, "global_step": 10725, "epoch": 90, "lr": 9.495436838518425e-05} +{"train_loss": 0.009431513957679272, "global_step": 10726, "epoch": 90, "lr": 9.495339845909232e-05} +{"train_loss": 0.008629467338323593, "global_step": 10727, "epoch": 90, "lr": 9.495242844473921e-05} +{"train_loss": 0.00864049419760704, "global_step": 10728, "epoch": 90, "lr": 9.495145834212679e-05} +{"train_loss": 0.0077920155599713326, "global_step": 10729, "epoch": 90, "lr": 9.4950488151257e-05} +{"train_loss": 0.010487886145710945, "global_step": 10730, "epoch": 90, "lr": 9.494951787213172e-05} +{"train_loss": 0.009053601883351803, "global_step": 10731, "epoch": 90, "lr": 9.494854750475287e-05} +{"train_loss": 0.009284282103180885, "global_step": 10732, "epoch": 90, "lr": 9.494757704912234e-05} +{"train_loss": 0.009965001605451107, "global_step": 10733, "epoch": 90, "lr": 9.494660650524205e-05} +{"train_loss": 0.009828750975430012, "global_step": 10734, "epoch": 90, "lr": 9.49456358731139e-05} +{"train_loss": 0.01129122544080019, "global_step": 10735, "epoch": 90, "lr": 9.494466515273979e-05} +{"train_loss": 0.01085243746638298, "global_step": 10736, "epoch": 90, "lr": 9.494369434412163e-05} +{"train_loss": 0.009684452787041664, "global_step": 10737, "epoch": 90, "lr": 9.494272344726134e-05} +{"train_loss": 0.0071708522737026215, "global_step": 10738, "epoch": 90, "lr": 9.494175246216082e-05} +{"train_loss": 0.010458534583449364, "global_step": 10739, "epoch": 90, "lr": 9.494078138882194e-05} +{"train_loss": 0.008085346780717373, "global_step": 10740, "epoch": 90, "lr": 9.493981022724666e-05} +{"train_loss": 0.005828479770570993, "global_step": 10741, "epoch": 90, "lr": 9.493883897743686e-05} +{"train_loss": 0.010713706724345684, "global_step": 10742, "epoch": 90, "lr": 9.493786763939446e-05} +{"train_loss": 0.009463367983698845, "global_step": 10743, "epoch": 90, "lr": 9.493689621312133e-05} +{"train_loss": 0.005770688410848379, "global_step": 10744, "epoch": 90, "lr": 9.493592469861943e-05} +{"train_loss": 0.01121449563652277, "global_step": 10745, "epoch": 90, "lr": 9.493495309589064e-05} +{"train_loss": 0.008509010076522827, "global_step": 10746, "epoch": 90, "lr": 9.493398140493686e-05} +{"train_loss": 0.006836377549916506, "global_step": 10747, "epoch": 90, "lr": 9.493300962576002e-05} +{"train_loss": 0.01048947498202324, "global_step": 10748, "epoch": 90, "lr": 9.493203775836201e-05} +{"train_loss": 0.011254463344812393, "global_step": 10749, "epoch": 90, "lr": 9.493106580274474e-05} +{"train_loss": 0.008500991389155388, "global_step": 10750, "epoch": 90, "lr": 9.493009375891011e-05} +{"train_loss": 0.0062651741318404675, "global_step": 10751, "epoch": 90, "lr": 9.492912162686007e-05} +{"train_loss": 0.006112797651439905, "global_step": 10752, "epoch": 90, "lr": 9.492814940659649e-05} +{"train_loss": 0.00867647398263216, "global_step": 10753, "epoch": 90, "lr": 9.492717709812128e-05} +{"train_loss": 0.01265456061810255, "global_step": 10754, "epoch": 90, "lr": 9.492620470143636e-05} +{"train_loss": 0.00811128318309784, "global_step": 10755, "epoch": 90, "lr": 9.492523221654363e-05} +{"train_loss": 0.009530487470328808, "global_step": 10756, "epoch": 90, "lr": 9.492425964344502e-05} +{"train_loss": 0.007721861824393272, "global_step": 10757, "epoch": 90, "lr": 9.492328698214242e-05} +{"train_loss": 0.008297417312860489, "global_step": 10758, "epoch": 90, "lr": 9.492231423263775e-05} +{"train_loss": 0.011403596960008144, "global_step": 10759, "epoch": 90, "lr": 9.492134139493292e-05} +{"train_loss": 0.008474785834550858, "global_step": 10760, "epoch": 90, "lr": 9.492036846902982e-05} +{"train_loss": 0.008916485123336315, "global_step": 10761, "epoch": 90, "lr": 9.491939545493039e-05} +{"train_loss": 0.009106014855206013, "global_step": 10762, "epoch": 90, "lr": 9.491842235263651e-05} +{"train_loss": 0.006471770349889994, "global_step": 10763, "epoch": 90, "lr": 9.491744916215011e-05} +{"train_loss": 0.008927318267524242, "global_step": 10764, "epoch": 90, "lr": 9.491647588347311e-05} +{"train_loss": 0.00719761848449707, "global_step": 10765, "epoch": 90, "lr": 9.49155025166074e-05} +{"train_loss": 0.00931229442358017, "global_step": 10766, "epoch": 90, "lr": 9.49145290615549e-05} +{"train_loss": 0.012312653474509716, "global_step": 10767, "epoch": 90, "lr": 9.491355551831752e-05} +{"train_loss": 0.009073304943740368, "global_step": 10768, "epoch": 90, "lr": 9.491258188689718e-05} +{"train_loss": 0.0090839434415102, "global_step": 10769, "epoch": 90, "lr": 9.491160816729577e-05} +{"train_loss": 0.009490626864135265, "global_step": 10770, "epoch": 90, "lr": 9.491063435951522e-05} +{"train_loss": 0.004513572435826063, "global_step": 10771, "epoch": 90, "lr": 9.490966046355744e-05} +{"train_loss": 0.011633564718067646, "global_step": 10772, "epoch": 90, "lr": 9.490868647942434e-05} +{"train_loss": 0.010924520902335644, "global_step": 10773, "epoch": 90, "lr": 9.490771240711783e-05} +{"train_loss": 0.015062023885548115, "global_step": 10774, "epoch": 90, "lr": 9.490673824663982e-05} +{"train_loss": 0.007697457447648048, "global_step": 10775, "epoch": 90, "lr": 9.490576399799223e-05} +{"train_loss": 0.010224446654319763, "global_step": 10776, "epoch": 90, "lr": 9.490478966117697e-05} +{"train_loss": 0.010869855992496014, "global_step": 10777, "epoch": 90, "lr": 9.490381523619596e-05} +{"train_loss": 0.008664669468998909, "global_step": 10778, "epoch": 90, "lr": 9.490284072305109e-05} +{"train_loss": 0.00821401085704565, "global_step": 10779, "epoch": 90, "lr": 9.49018661217443e-05} +{"train_loss": 0.009535728953778744, "global_step": 10780, "epoch": 90, "lr": 9.49008914322775e-05} +{"train_loss": 0.006839795038104057, "global_step": 10781, "epoch": 90, "lr": 9.489991665465259e-05} +{"train_loss": 0.009631355293095112, "global_step": 10782, "epoch": 90, "lr": 9.489894178887148e-05} +{"train_loss": 0.013061834499239922, "global_step": 10783, "epoch": 90, "lr": 9.489796683493611e-05} +{"train_loss": 0.011383388191461563, "global_step": 10784, "epoch": 90, "lr": 9.489699179284838e-05} +{"train_loss": 0.008010515943169594, "global_step": 10785, "epoch": 90, "lr": 9.489601666261018e-05} +{"train_loss": 0.006727918051183224, "global_step": 10786, "epoch": 90, "lr": 9.489504144422348e-05} +{"train_loss": 0.007430932484567165, "global_step": 10787, "epoch": 90, "lr": 9.489406613769014e-05} +{"train_loss": 0.009215099737048149, "global_step": 10788, "epoch": 90, "lr": 9.489309074301212e-05} +{"train_loss": 0.007397232577204704, "global_step": 10789, "epoch": 90, "lr": 9.489211526019128e-05} +{"train_loss": 0.010347971692681313, "global_step": 10790, "epoch": 90, "lr": 9.48911396892296e-05} +{"train_loss": 0.009159400127828121, "global_step": 10791, "epoch": 90, "lr": 9.489016403012894e-05} +{"train_loss": 0.008727142587304115, "global_step": 10792, "epoch": 90, "lr": 9.488918828289124e-05} +{"train_loss": 0.008907695300877094, "global_step": 10793, "epoch": 90, "lr": 9.488821244751842e-05} +{"train_loss": 0.007918326184153557, "global_step": 10794, "epoch": 90, "lr": 9.488723652401239e-05} +{"train_loss": 0.00663677416741848, "global_step": 10795, "epoch": 90, "lr": 9.488626051237507e-05} +{"train_loss": 0.00798763521015644, "global_step": 10796, "epoch": 90, "lr": 9.488528441260838e-05} +{"train_loss": 0.012800880707800388, "global_step": 10797, "epoch": 90, "lr": 9.488430822471422e-05} +{"train_loss": 0.013640441000461578, "global_step": 10798, "epoch": 90, "lr": 9.48833319486945e-05} +{"train_loss": 0.008228903636336327, "global_step": 10799, "epoch": 90, "lr": 9.488235558455117e-05} +{"train_loss": 0.010308478958904743, "global_step": 10800, "epoch": 90, "lr": 9.488137913228613e-05} +{"train_loss": 0.008085307665169239, "global_step": 10801, "epoch": 90, "lr": 9.488040259190129e-05} +{"train_loss": 0.006982200313359499, "global_step": 10802, "epoch": 90, "lr": 9.487942596339858e-05} +{"train_loss": 0.011779163032770157, "global_step": 10803, "epoch": 90, "lr": 9.487844924677991e-05} +{"train_loss": 0.011372646316885948, "global_step": 10804, "epoch": 90, "lr": 9.487747244204721e-05} +{"train_loss": 0.006344319321215153, "global_step": 10805, "epoch": 90, "lr": 9.487649554920237e-05} +{"train_loss": 0.008376732468605042, "global_step": 10806, "epoch": 90, "lr": 9.487551856824735e-05} +{"train_loss": 0.006114458665251732, "global_step": 10807, "epoch": 90, "lr": 9.487454149918402e-05} +{"train_loss": 0.011045685969293118, "global_step": 10808, "epoch": 90, "lr": 9.487356434201433e-05} +{"train_loss": 0.01035059243440628, "global_step": 10809, "epoch": 90, "lr": 9.487258709674018e-05} +{"train_loss": 0.006567653734236956, "global_step": 10810, "epoch": 90, "lr": 9.48716097633635e-05} +{"train_loss": 0.00975143350660801, "global_step": 10811, "epoch": 90, "lr": 9.487063234188623e-05} +{"train_loss": 0.006625268142670393, "global_step": 10812, "epoch": 90, "lr": 9.486965483231025e-05} +{"train_loss": 0.00553453154861927, "global_step": 10813, "epoch": 90, "lr": 9.486867723463751e-05} +{"train_loss": 0.007092147134244442, "global_step": 10814, "epoch": 90, "lr": 9.486769954886989e-05} +{"train_loss": 0.00678061880171299, "global_step": 10815, "epoch": 90, "lr": 9.486672177500936e-05} +{"train_loss": 0.00754193589091301, "global_step": 10816, "epoch": 90, "lr": 9.48657439130578e-05} +{"train_loss": 0.008225756697356701, "global_step": 10817, "epoch": 90, "lr": 9.486476596301717e-05} +{"train_loss": 0.0058458950370550156, "global_step": 10818, "epoch": 90, "lr": 9.486378792488933e-05} +{"train_loss": 0.011110070161521435, "global_step": 10819, "epoch": 90, "lr": 9.486280979867625e-05} +{"train_loss": 0.009905672632157803, "global_step": 10820, "epoch": 90, "lr": 9.486183158437985e-05} +{"train_loss": 0.007638384122401476, "global_step": 10821, "epoch": 90, "lr": 9.486085328200202e-05} +{"train_loss": 0.006387902423739433, "global_step": 10822, "epoch": 90, "lr": 9.48598748915447e-05} +{"train_loss": 0.006627154536545277, "global_step": 10823, "epoch": 90, "lr": 9.48588964130098e-05} +{"train_loss": 0.00650051049888134, "global_step": 10824, "epoch": 90, "lr": 9.485791784639926e-05} +{"train_loss": 0.009084032848477364, "global_step": 10825, "epoch": 90, "lr": 9.485693919171499e-05} +{"train_loss": 0.008311234414577484, "global_step": 10826, "epoch": 90, "lr": 9.485596044895892e-05} +{"train_loss": 0.007482857909053564, "global_step": 10827, "epoch": 90, "lr": 9.485498161813295e-05} +{"train_loss": 0.008982115393864508, "global_step": 10828, "epoch": 90, "lr": 9.485400269923904e-05, "val_loss": 0.01791250705718994, "train_action_mse_error": 0.00032033328898251057} +{"train_loss": 0.013164077885448933, "global_step": 10829, "epoch": 91, "lr": 9.485302369227905e-05} +{"train_loss": 0.00692230649292469, "global_step": 10830, "epoch": 91, "lr": 9.485204459725496e-05} +{"train_loss": 0.011690259911119938, "global_step": 10831, "epoch": 91, "lr": 9.485106541416867e-05} +{"train_loss": 0.012811913155019283, "global_step": 10832, "epoch": 91, "lr": 9.48500861430221e-05} +{"train_loss": 0.006847011391073465, "global_step": 10833, "epoch": 91, "lr": 9.48491067838172e-05} +{"train_loss": 0.007790994830429554, "global_step": 10834, "epoch": 91, "lr": 9.484812733655583e-05} +{"train_loss": 0.010125111788511276, "global_step": 10835, "epoch": 91, "lr": 9.484714780123999e-05} +{"train_loss": 0.012022433802485466, "global_step": 10836, "epoch": 91, "lr": 9.484616817787155e-05} +{"train_loss": 0.007579291705042124, "global_step": 10837, "epoch": 91, "lr": 9.484518846645245e-05} +{"train_loss": 0.00656849704682827, "global_step": 10838, "epoch": 91, "lr": 9.484420866698463e-05} +{"train_loss": 0.013948393985629082, "global_step": 10839, "epoch": 91, "lr": 9.484322877946998e-05} +{"train_loss": 0.0099211186170578, "global_step": 10840, "epoch": 91, "lr": 9.484224880391044e-05} +{"train_loss": 0.00989554263651371, "global_step": 10841, "epoch": 91, "lr": 9.484126874030794e-05} +{"train_loss": 0.007655132561922073, "global_step": 10842, "epoch": 91, "lr": 9.48402885886644e-05} +{"train_loss": 0.01364111341536045, "global_step": 10843, "epoch": 91, "lr": 9.483930834898174e-05} +{"train_loss": 0.00991389062255621, "global_step": 10844, "epoch": 91, "lr": 9.483832802126189e-05} +{"train_loss": 0.009089733473956585, "global_step": 10845, "epoch": 91, "lr": 9.483734760550677e-05} +{"train_loss": 0.012456314638257027, "global_step": 10846, "epoch": 91, "lr": 9.483636710171833e-05} +{"train_loss": 0.014456073753535748, "global_step": 10847, "epoch": 91, "lr": 9.483538650989845e-05} +{"train_loss": 0.009495988488197327, "global_step": 10848, "epoch": 91, "lr": 9.483440583004908e-05} +{"train_loss": 0.010647646151483059, "global_step": 10849, "epoch": 91, "lr": 9.483342506217214e-05} +{"train_loss": 0.0093892402946949, "global_step": 10850, "epoch": 91, "lr": 9.483244420626958e-05} +{"train_loss": 0.009692884981632233, "global_step": 10851, "epoch": 91, "lr": 9.48314632623433e-05} +{"train_loss": 0.013818467035889626, "global_step": 10852, "epoch": 91, "lr": 9.483048223039521e-05} +{"train_loss": 0.01738353632390499, "global_step": 10853, "epoch": 91, "lr": 9.482950111042728e-05} +{"train_loss": 0.008382435888051987, "global_step": 10854, "epoch": 91, "lr": 9.482851990244139e-05} +{"train_loss": 0.008104880340397358, "global_step": 10855, "epoch": 91, "lr": 9.482753860643951e-05} +{"train_loss": 0.011014940217137337, "global_step": 10856, "epoch": 91, "lr": 9.482655722242355e-05} +{"train_loss": 0.009072424843907356, "global_step": 10857, "epoch": 91, "lr": 9.482557575039544e-05} +{"train_loss": 0.010171584784984589, "global_step": 10858, "epoch": 91, "lr": 9.482459419035707e-05} +{"train_loss": 0.00903868954628706, "global_step": 10859, "epoch": 91, "lr": 9.482361254231042e-05} +{"train_loss": 0.009345133788883686, "global_step": 10860, "epoch": 91, "lr": 9.482263080625739e-05} +{"train_loss": 0.006539211608469486, "global_step": 10861, "epoch": 91, "lr": 9.482164898219992e-05} +{"train_loss": 0.009738996624946594, "global_step": 10862, "epoch": 91, "lr": 9.482066707013992e-05} +{"train_loss": 0.009688823483884335, "global_step": 10863, "epoch": 91, "lr": 9.481968507007935e-05} +{"train_loss": 0.010517474263906479, "global_step": 10864, "epoch": 91, "lr": 9.481870298202009e-05} +{"train_loss": 0.009919782169163227, "global_step": 10865, "epoch": 91, "lr": 9.481772080596412e-05} +{"train_loss": 0.011442985385656357, "global_step": 10866, "epoch": 91, "lr": 9.481673854191332e-05} +{"train_loss": 0.009597032330930233, "global_step": 10867, "epoch": 91, "lr": 9.481575618986965e-05} +{"train_loss": 0.010832690633833408, "global_step": 10868, "epoch": 91, "lr": 9.481477374983503e-05} +{"train_loss": 0.008856574073433876, "global_step": 10869, "epoch": 91, "lr": 9.48137912218114e-05} +{"train_loss": 0.007131113670766354, "global_step": 10870, "epoch": 91, "lr": 9.481280860580066e-05} +{"train_loss": 0.008394382894039154, "global_step": 10871, "epoch": 91, "lr": 9.481182590180478e-05} +{"train_loss": 0.007890268228948116, "global_step": 10872, "epoch": 91, "lr": 9.481084310982564e-05} +{"train_loss": 0.012901263311505318, "global_step": 10873, "epoch": 91, "lr": 9.480986022986523e-05} +{"train_loss": 0.00787657406181097, "global_step": 10874, "epoch": 91, "lr": 9.480887726192542e-05} +{"train_loss": 0.007045120000839233, "global_step": 10875, "epoch": 91, "lr": 9.480789420600818e-05} +{"train_loss": 0.008607341907918453, "global_step": 10876, "epoch": 91, "lr": 9.480691106211541e-05} +{"train_loss": 0.007802407257258892, "global_step": 10877, "epoch": 91, "lr": 9.480592783024907e-05} +{"train_loss": 0.007292637135833502, "global_step": 10878, "epoch": 91, "lr": 9.480494451041108e-05} +{"train_loss": 0.010571474209427834, "global_step": 10879, "epoch": 91, "lr": 9.480396110260337e-05} +{"train_loss": 0.010544282384216785, "global_step": 10880, "epoch": 91, "lr": 9.480297760682787e-05} +{"train_loss": 0.010455415584146976, "global_step": 10881, "epoch": 91, "lr": 9.480199402308649e-05} +{"train_loss": 0.005634190980345011, "global_step": 10882, "epoch": 91, "lr": 9.48010103513812e-05} +{"train_loss": 0.0076339393854141235, "global_step": 10883, "epoch": 91, "lr": 9.48000265917139e-05} +{"train_loss": 0.00962917786091566, "global_step": 10884, "epoch": 91, "lr": 9.479904274408655e-05} +{"train_loss": 0.006260092370212078, "global_step": 10885, "epoch": 91, "lr": 9.479805880850106e-05} +{"train_loss": 0.00828003603965044, "global_step": 10886, "epoch": 91, "lr": 9.479707478495936e-05} +{"train_loss": 0.010335113853216171, "global_step": 10887, "epoch": 91, "lr": 9.479609067346339e-05} +{"train_loss": 0.009479823522269726, "global_step": 10888, "epoch": 91, "lr": 9.479510647401509e-05} +{"train_loss": 0.008150063455104828, "global_step": 10889, "epoch": 91, "lr": 9.479412218661638e-05} +{"train_loss": 0.008033113554120064, "global_step": 10890, "epoch": 91, "lr": 9.479313781126919e-05} +{"train_loss": 0.009382716380059719, "global_step": 10891, "epoch": 91, "lr": 9.479215334797547e-05} +{"train_loss": 0.01151537336409092, "global_step": 10892, "epoch": 91, "lr": 9.479116879673713e-05} +{"train_loss": 0.010008332319557667, "global_step": 10893, "epoch": 91, "lr": 9.479018415755613e-05} +{"train_loss": 0.006496382411569357, "global_step": 10894, "epoch": 91, "lr": 9.478919943043438e-05} +{"train_loss": 0.008240457624197006, "global_step": 10895, "epoch": 91, "lr": 9.478821461537381e-05} +{"train_loss": 0.009569913148880005, "global_step": 10896, "epoch": 91, "lr": 9.478722971237638e-05} +{"train_loss": 0.008125945925712585, "global_step": 10897, "epoch": 91, "lr": 9.478624472144402e-05} +{"train_loss": 0.009857552126049995, "global_step": 10898, "epoch": 91, "lr": 9.478525964257864e-05} +{"train_loss": 0.007584093138575554, "global_step": 10899, "epoch": 91, "lr": 9.478427447578218e-05} +{"train_loss": 0.007982965558767319, "global_step": 10900, "epoch": 91, "lr": 9.478328922105659e-05} +{"train_loss": 0.01011716853827238, "global_step": 10901, "epoch": 91, "lr": 9.47823038784038e-05} +{"train_loss": 0.00827739853411913, "global_step": 10902, "epoch": 91, "lr": 9.478131844782574e-05} +{"train_loss": 0.010091247037053108, "global_step": 10903, "epoch": 91, "lr": 9.478033292932434e-05} +{"train_loss": 0.008303282782435417, "global_step": 10904, "epoch": 91, "lr": 9.477934732290154e-05} +{"train_loss": 0.012230154126882553, "global_step": 10905, "epoch": 91, "lr": 9.477836162855928e-05} +{"train_loss": 0.009981419891119003, "global_step": 10906, "epoch": 91, "lr": 9.477737584629948e-05} +{"train_loss": 0.008908072486519814, "global_step": 10907, "epoch": 91, "lr": 9.477638997612411e-05} +{"train_loss": 0.009329823777079582, "global_step": 10908, "epoch": 91, "lr": 9.477540401803506e-05} +{"train_loss": 0.010211861692368984, "global_step": 10909, "epoch": 91, "lr": 9.47744179720343e-05} +{"train_loss": 0.01122802309691906, "global_step": 10910, "epoch": 91, "lr": 9.477343183812375e-05} +{"train_loss": 0.012310068123042583, "global_step": 10911, "epoch": 91, "lr": 9.477244561630535e-05} +{"train_loss": 0.007965452037751675, "global_step": 10912, "epoch": 91, "lr": 9.477145930658103e-05} +{"train_loss": 0.011466574855148792, "global_step": 10913, "epoch": 91, "lr": 9.477047290895275e-05} +{"train_loss": 0.00966811366379261, "global_step": 10914, "epoch": 91, "lr": 9.47694864234224e-05} +{"train_loss": 0.013995151966810226, "global_step": 10915, "epoch": 91, "lr": 9.476849984999198e-05} +{"train_loss": 0.010710906237363815, "global_step": 10916, "epoch": 91, "lr": 9.476751318866337e-05} +{"train_loss": 0.011094600893557072, "global_step": 10917, "epoch": 91, "lr": 9.476652643943854e-05} +{"train_loss": 0.006713272538036108, "global_step": 10918, "epoch": 91, "lr": 9.476553960231942e-05} +{"train_loss": 0.009630175307393074, "global_step": 10919, "epoch": 91, "lr": 9.476455267730793e-05} +{"train_loss": 0.013451811857521534, "global_step": 10920, "epoch": 91, "lr": 9.476356566440604e-05} +{"train_loss": 0.00605201767757535, "global_step": 10921, "epoch": 91, "lr": 9.476257856361566e-05} +{"train_loss": 0.00997401587665081, "global_step": 10922, "epoch": 91, "lr": 9.476159137493875e-05} +{"train_loss": 0.01367347314953804, "global_step": 10923, "epoch": 91, "lr": 9.476060409837723e-05} +{"train_loss": 0.007944541051983833, "global_step": 10924, "epoch": 91, "lr": 9.475961673393305e-05} +{"train_loss": 0.011643944308161736, "global_step": 10925, "epoch": 91, "lr": 9.475862928160815e-05} +{"train_loss": 0.012695261277258396, "global_step": 10926, "epoch": 91, "lr": 9.475764174140444e-05} +{"train_loss": 0.013780157081782818, "global_step": 10927, "epoch": 91, "lr": 9.47566541133239e-05} +{"train_loss": 0.012350580655038357, "global_step": 10928, "epoch": 91, "lr": 9.475566639736845e-05} +{"train_loss": 0.009453912265598774, "global_step": 10929, "epoch": 91, "lr": 9.475467859354004e-05} +{"train_loss": 0.011821610853075981, "global_step": 10930, "epoch": 91, "lr": 9.475369070184058e-05} +{"train_loss": 0.009334391914308071, "global_step": 10931, "epoch": 91, "lr": 9.475270272227203e-05} +{"train_loss": 0.00873345136642456, "global_step": 10932, "epoch": 91, "lr": 9.475171465483634e-05} +{"train_loss": 0.009074853733181953, "global_step": 10933, "epoch": 91, "lr": 9.475072649953544e-05} +{"train_loss": 0.013484500348567963, "global_step": 10934, "epoch": 91, "lr": 9.474973825637126e-05} +{"train_loss": 0.0144653944298625, "global_step": 10935, "epoch": 91, "lr": 9.474874992534578e-05} +{"train_loss": 0.010458485223352909, "global_step": 10936, "epoch": 91, "lr": 9.474776150646087e-05} +{"train_loss": 0.01097304280847311, "global_step": 10937, "epoch": 91, "lr": 9.474677299971852e-05} +{"train_loss": 0.008905846625566483, "global_step": 10938, "epoch": 91, "lr": 9.474578440512068e-05} +{"train_loss": 0.010349849238991737, "global_step": 10939, "epoch": 91, "lr": 9.474479572266926e-05} +{"train_loss": 0.013835803605616093, "global_step": 10940, "epoch": 91, "lr": 9.474380695236623e-05} +{"train_loss": 0.007003122474998236, "global_step": 10941, "epoch": 91, "lr": 9.474281809421348e-05} +{"train_loss": 0.011547490023076534, "global_step": 10942, "epoch": 91, "lr": 9.474182914821301e-05} +{"train_loss": 0.009995675645768642, "global_step": 10943, "epoch": 91, "lr": 9.474084011436674e-05} +{"train_loss": 0.010043841786682606, "global_step": 10944, "epoch": 91, "lr": 9.473985099267661e-05} +{"train_loss": 0.0061921533197164536, "global_step": 10945, "epoch": 91, "lr": 9.473886178314455e-05} +{"train_loss": 0.012630244717001915, "global_step": 10946, "epoch": 91, "lr": 9.473787248577252e-05} +{"train_loss": 0.00989743268132961, "global_step": 10947, "epoch": 91, "lr": 9.473688310056245e-05, "val_loss": 0.01704360358417034} +{"train_loss": 0.01119153667241335, "global_step": 10948, "epoch": 92, "lr": 9.473589362751631e-05} +{"train_loss": 0.008515658788383007, "global_step": 10949, "epoch": 92, "lr": 9.473490406663601e-05} +{"train_loss": 0.010999957099556923, "global_step": 10950, "epoch": 92, "lr": 9.473391441792352e-05} +{"train_loss": 0.008645940572023392, "global_step": 10951, "epoch": 92, "lr": 9.473292468138075e-05} +{"train_loss": 0.009003284387290478, "global_step": 10952, "epoch": 92, "lr": 9.473193485700966e-05} +{"train_loss": 0.010737749747931957, "global_step": 10953, "epoch": 92, "lr": 9.47309449448122e-05} +{"train_loss": 0.007271718233823776, "global_step": 10954, "epoch": 92, "lr": 9.472995494479031e-05} +{"train_loss": 0.010536571964621544, "global_step": 10955, "epoch": 92, "lr": 9.472896485694593e-05} +{"train_loss": 0.013784492388367653, "global_step": 10956, "epoch": 92, "lr": 9.4727974681281e-05} +{"train_loss": 0.00694028427824378, "global_step": 10957, "epoch": 92, "lr": 9.47269844177975e-05} +{"train_loss": 0.0073286318220198154, "global_step": 10958, "epoch": 92, "lr": 9.472599406649732e-05} +{"train_loss": 0.011027304455637932, "global_step": 10959, "epoch": 92, "lr": 9.472500362738242e-05} +{"train_loss": 0.010911038145422935, "global_step": 10960, "epoch": 92, "lr": 9.472401310045477e-05} +{"train_loss": 0.013017109595239162, "global_step": 10961, "epoch": 92, "lr": 9.47230224857163e-05} +{"train_loss": 0.006748205050826073, "global_step": 10962, "epoch": 92, "lr": 9.472203178316894e-05} +{"train_loss": 0.006852401420474052, "global_step": 10963, "epoch": 92, "lr": 9.472104099281464e-05} +{"train_loss": 0.01236019004136324, "global_step": 10964, "epoch": 92, "lr": 9.472005011465539e-05} +{"train_loss": 0.014888705685734749, "global_step": 10965, "epoch": 92, "lr": 9.471905914869308e-05} +{"train_loss": 0.008933063596487045, "global_step": 10966, "epoch": 92, "lr": 9.471806809492966e-05} +{"train_loss": 0.009520809166133404, "global_step": 10967, "epoch": 92, "lr": 9.471707695336711e-05} +{"train_loss": 0.00849378015846014, "global_step": 10968, "epoch": 92, "lr": 9.471608572400734e-05} +{"train_loss": 0.005111311562359333, "global_step": 10969, "epoch": 92, "lr": 9.471509440685233e-05} +{"train_loss": 0.009216452948749065, "global_step": 10970, "epoch": 92, "lr": 9.471410300190399e-05} +{"train_loss": 0.008797163143754005, "global_step": 10971, "epoch": 92, "lr": 9.471311150916431e-05} +{"train_loss": 0.010671659372746944, "global_step": 10972, "epoch": 92, "lr": 9.47121199286352e-05} +{"train_loss": 0.008372798562049866, "global_step": 10973, "epoch": 92, "lr": 9.471112826031862e-05} +{"train_loss": 0.011144036427140236, "global_step": 10974, "epoch": 92, "lr": 9.471013650421652e-05} +{"train_loss": 0.007923925295472145, "global_step": 10975, "epoch": 92, "lr": 9.470914466033084e-05} +{"train_loss": 0.00662180595099926, "global_step": 10976, "epoch": 92, "lr": 9.470815272866354e-05} +{"train_loss": 0.011162174865603447, "global_step": 10977, "epoch": 92, "lr": 9.470716070921654e-05} +{"train_loss": 0.0079725943505764, "global_step": 10978, "epoch": 92, "lr": 9.470616860199182e-05} +{"train_loss": 0.013066903688013554, "global_step": 10979, "epoch": 92, "lr": 9.47051764069913e-05} +{"train_loss": 0.007609772030264139, "global_step": 10980, "epoch": 92, "lr": 9.470418412421695e-05} +{"train_loss": 0.012797626666724682, "global_step": 10981, "epoch": 92, "lr": 9.470319175367071e-05} +{"train_loss": 0.01319741178303957, "global_step": 10982, "epoch": 92, "lr": 9.470219929535453e-05} +{"train_loss": 0.009975427761673927, "global_step": 10983, "epoch": 92, "lr": 9.470120674927036e-05} +{"train_loss": 0.007908014580607414, "global_step": 10984, "epoch": 92, "lr": 9.470021411542015e-05} +{"train_loss": 0.012686080299317837, "global_step": 10985, "epoch": 92, "lr": 9.469922139380583e-05} +{"train_loss": 0.006289849057793617, "global_step": 10986, "epoch": 92, "lr": 9.469822858442939e-05} +{"train_loss": 0.006364398170262575, "global_step": 10987, "epoch": 92, "lr": 9.469723568729273e-05} +{"train_loss": 0.012075242586433887, "global_step": 10988, "epoch": 92, "lr": 9.469624270239783e-05} +{"train_loss": 0.007821165025234222, "global_step": 10989, "epoch": 92, "lr": 9.469524962974663e-05} +{"train_loss": 0.014615614898502827, "global_step": 10990, "epoch": 92, "lr": 9.46942564693411e-05} +{"train_loss": 0.008269800804555416, "global_step": 10991, "epoch": 92, "lr": 9.469326322118315e-05} +{"train_loss": 0.006357853300869465, "global_step": 10992, "epoch": 92, "lr": 9.469226988527475e-05} +{"train_loss": 0.009698067791759968, "global_step": 10993, "epoch": 92, "lr": 9.469127646161786e-05} +{"train_loss": 0.012396570295095444, "global_step": 10994, "epoch": 92, "lr": 9.469028295021442e-05} +{"train_loss": 0.00940869003534317, "global_step": 10995, "epoch": 92, "lr": 9.46892893510664e-05} +{"train_loss": 0.008118588477373123, "global_step": 10996, "epoch": 92, "lr": 9.468829566417572e-05} +{"train_loss": 0.009590618312358856, "global_step": 10997, "epoch": 92, "lr": 9.468730188954435e-05} +{"train_loss": 0.005746106151491404, "global_step": 10998, "epoch": 92, "lr": 9.468630802717424e-05} +{"train_loss": 0.007752951234579086, "global_step": 10999, "epoch": 92, "lr": 9.468531407706734e-05} +{"train_loss": 0.01045570895075798, "global_step": 11000, "epoch": 92, "lr": 9.468432003922559e-05} +{"train_loss": 0.01007931586354971, "global_step": 11001, "epoch": 92, "lr": 9.468332591365097e-05} +{"train_loss": 0.009393933229148388, "global_step": 11002, "epoch": 92, "lr": 9.46823317003454e-05} +{"train_loss": 0.012021655216813087, "global_step": 11003, "epoch": 92, "lr": 9.468133739931083e-05} +{"train_loss": 0.009315861389040947, "global_step": 11004, "epoch": 92, "lr": 9.468034301054924e-05} +{"train_loss": 0.009501393884420395, "global_step": 11005, "epoch": 92, "lr": 9.467934853406258e-05} +{"train_loss": 0.005380542483180761, "global_step": 11006, "epoch": 92, "lr": 9.467835396985278e-05} +{"train_loss": 0.0062771388329565525, "global_step": 11007, "epoch": 92, "lr": 9.467735931792181e-05} +{"train_loss": 0.009265981614589691, "global_step": 11008, "epoch": 92, "lr": 9.467636457827162e-05} +{"train_loss": 0.008961326442658901, "global_step": 11009, "epoch": 92, "lr": 9.467536975090417e-05} +{"train_loss": 0.013793284073472023, "global_step": 11010, "epoch": 92, "lr": 9.467437483582138e-05} +{"train_loss": 0.0070478287525475025, "global_step": 11011, "epoch": 92, "lr": 9.467337983302524e-05} +{"train_loss": 0.01257611345499754, "global_step": 11012, "epoch": 92, "lr": 9.467238474251769e-05} +{"train_loss": 0.011674631386995316, "global_step": 11013, "epoch": 92, "lr": 9.467138956430069e-05} +{"train_loss": 0.012704724445939064, "global_step": 11014, "epoch": 92, "lr": 9.467039429837619e-05} +{"train_loss": 0.007138016168028116, "global_step": 11015, "epoch": 92, "lr": 9.466939894474613e-05} +{"train_loss": 0.00878760777413845, "global_step": 11016, "epoch": 92, "lr": 9.46684035034125e-05} +{"train_loss": 0.00824230257421732, "global_step": 11017, "epoch": 92, "lr": 9.466740797437722e-05} +{"train_loss": 0.009776552207767963, "global_step": 11018, "epoch": 92, "lr": 9.466641235764226e-05} +{"train_loss": 0.009731476195156574, "global_step": 11019, "epoch": 92, "lr": 9.466541665320956e-05} +{"train_loss": 0.010864575393497944, "global_step": 11020, "epoch": 92, "lr": 9.466442086108109e-05} +{"train_loss": 0.016932278871536255, "global_step": 11021, "epoch": 92, "lr": 9.466342498125881e-05} +{"train_loss": 0.008143240585923195, "global_step": 11022, "epoch": 92, "lr": 9.466242901374466e-05} +{"train_loss": 0.010737796314060688, "global_step": 11023, "epoch": 92, "lr": 9.46614329585406e-05} +{"train_loss": 0.010660829953849316, "global_step": 11024, "epoch": 92, "lr": 9.466043681564859e-05} +{"train_loss": 0.009830092079937458, "global_step": 11025, "epoch": 92, "lr": 9.465944058507059e-05} +{"train_loss": 0.017390176653862, "global_step": 11026, "epoch": 92, "lr": 9.465844426680855e-05} +{"train_loss": 0.011433950625360012, "global_step": 11027, "epoch": 92, "lr": 9.465744786086441e-05} +{"train_loss": 0.00935235247015953, "global_step": 11028, "epoch": 92, "lr": 9.465645136724016e-05} +{"train_loss": 0.009034229442477226, "global_step": 11029, "epoch": 92, "lr": 9.465545478593772e-05} +{"train_loss": 0.009618472307920456, "global_step": 11030, "epoch": 92, "lr": 9.465445811695907e-05} +{"train_loss": 0.008946646004915237, "global_step": 11031, "epoch": 92, "lr": 9.465346136030618e-05} +{"train_loss": 0.011100607924163342, "global_step": 11032, "epoch": 92, "lr": 9.465246451598097e-05} +{"train_loss": 0.009008612483739853, "global_step": 11033, "epoch": 92, "lr": 9.465146758398542e-05} +{"train_loss": 0.010438070632517338, "global_step": 11034, "epoch": 92, "lr": 9.465047056432149e-05} +{"train_loss": 0.010366044007241726, "global_step": 11035, "epoch": 92, "lr": 9.464947345699114e-05} +{"train_loss": 0.009523570537567139, "global_step": 11036, "epoch": 92, "lr": 9.464847626199629e-05} +{"train_loss": 0.0107507836073637, "global_step": 11037, "epoch": 92, "lr": 9.464747897933894e-05} +{"train_loss": 0.010103359818458557, "global_step": 11038, "epoch": 92, "lr": 9.464648160902106e-05} +{"train_loss": 0.013260583393275738, "global_step": 11039, "epoch": 92, "lr": 9.464548415104454e-05} +{"train_loss": 0.014544193632900715, "global_step": 11040, "epoch": 92, "lr": 9.464448660541141e-05} +{"train_loss": 0.009201965294778347, "global_step": 11041, "epoch": 92, "lr": 9.46434889721236e-05} +{"train_loss": 0.007313952315598726, "global_step": 11042, "epoch": 92, "lr": 9.464249125118305e-05} +{"train_loss": 0.01139811985194683, "global_step": 11043, "epoch": 92, "lr": 9.464149344259175e-05} +{"train_loss": 0.005944783333688974, "global_step": 11044, "epoch": 92, "lr": 9.464049554635166e-05} +{"train_loss": 0.009902196004986763, "global_step": 11045, "epoch": 92, "lr": 9.463949756246471e-05} +{"train_loss": 0.014136267825961113, "global_step": 11046, "epoch": 92, "lr": 9.463849949093288e-05} +{"train_loss": 0.00891309417784214, "global_step": 11047, "epoch": 92, "lr": 9.463750133175813e-05} +{"train_loss": 0.009301957674324512, "global_step": 11048, "epoch": 92, "lr": 9.463650308494239e-05} +{"train_loss": 0.011839030310511589, "global_step": 11049, "epoch": 92, "lr": 9.463550475048768e-05} +{"train_loss": 0.009296666830778122, "global_step": 11050, "epoch": 92, "lr": 9.46345063283959e-05} +{"train_loss": 0.008731406182050705, "global_step": 11051, "epoch": 92, "lr": 9.463350781866905e-05} +{"train_loss": 0.009504457004368305, "global_step": 11052, "epoch": 92, "lr": 9.463250922130907e-05} +{"train_loss": 0.011411977931857109, "global_step": 11053, "epoch": 92, "lr": 9.463151053631792e-05} +{"train_loss": 0.010339147411286831, "global_step": 11054, "epoch": 92, "lr": 9.463051176369757e-05} +{"train_loss": 0.009868098422884941, "global_step": 11055, "epoch": 92, "lr": 9.462951290345e-05} +{"train_loss": 0.006786888465285301, "global_step": 11056, "epoch": 92, "lr": 9.462851395557713e-05} +{"train_loss": 0.010533086024224758, "global_step": 11057, "epoch": 92, "lr": 9.462751492008093e-05} +{"train_loss": 0.007309446111321449, "global_step": 11058, "epoch": 92, "lr": 9.462651579696338e-05} +{"train_loss": 0.012429563328623772, "global_step": 11059, "epoch": 92, "lr": 9.462551658622644e-05} +{"train_loss": 0.010420398786664009, "global_step": 11060, "epoch": 92, "lr": 9.462451728787206e-05} +{"train_loss": 0.007356161717325449, "global_step": 11061, "epoch": 92, "lr": 9.462351790190221e-05} +{"train_loss": 0.006550424266606569, "global_step": 11062, "epoch": 92, "lr": 9.462251842831886e-05} +{"train_loss": 0.012916556559503078, "global_step": 11063, "epoch": 92, "lr": 9.462151886712395e-05} +{"train_loss": 0.00935015082359314, "global_step": 11064, "epoch": 92, "lr": 9.462051921831946e-05} +{"train_loss": 0.00996455829590559, "global_step": 11065, "epoch": 92, "lr": 9.461951948190734e-05} +{"train_loss": 0.009804159528067131, "global_step": 11066, "epoch": 92, "lr": 9.461851965788958e-05, "val_loss": 0.015877095982432365} +{"train_loss": 0.010973313823342323, "global_step": 11067, "epoch": 93, "lr": 9.46175197462681e-05} +{"train_loss": 0.014918583445250988, "global_step": 11068, "epoch": 93, "lr": 9.46165197470449e-05} +{"train_loss": 0.007171935401856899, "global_step": 11069, "epoch": 93, "lr": 9.461551966022193e-05} +{"train_loss": 0.009598423726856709, "global_step": 11070, "epoch": 93, "lr": 9.461451948580114e-05} +{"train_loss": 0.00941872876137495, "global_step": 11071, "epoch": 93, "lr": 9.461351922378452e-05} +{"train_loss": 0.008232985623180866, "global_step": 11072, "epoch": 93, "lr": 9.461251887417402e-05} +{"train_loss": 0.009276628494262695, "global_step": 11073, "epoch": 93, "lr": 9.461151843697161e-05} +{"train_loss": 0.007723677903413773, "global_step": 11074, "epoch": 93, "lr": 9.461051791217923e-05} +{"train_loss": 0.007965263910591602, "global_step": 11075, "epoch": 93, "lr": 9.460951729979888e-05} +{"train_loss": 0.012082627974450588, "global_step": 11076, "epoch": 93, "lr": 9.46085165998325e-05} +{"train_loss": 0.010477734729647636, "global_step": 11077, "epoch": 93, "lr": 9.460751581228209e-05} +{"train_loss": 0.009948615916073322, "global_step": 11078, "epoch": 93, "lr": 9.460651493714956e-05} +{"train_loss": 0.006558730732649565, "global_step": 11079, "epoch": 93, "lr": 9.460551397443691e-05} +{"train_loss": 0.008091684430837631, "global_step": 11080, "epoch": 93, "lr": 9.46045129241461e-05} +{"train_loss": 0.007894793525338173, "global_step": 11081, "epoch": 93, "lr": 9.460351178627909e-05} +{"train_loss": 0.010987278074026108, "global_step": 11082, "epoch": 93, "lr": 9.460251056083786e-05} +{"train_loss": 0.010099450126290321, "global_step": 11083, "epoch": 93, "lr": 9.460150924782435e-05} +{"train_loss": 0.009443563409149647, "global_step": 11084, "epoch": 93, "lr": 9.460050784724055e-05} +{"train_loss": 0.009476600214838982, "global_step": 11085, "epoch": 93, "lr": 9.459950635908843e-05} +{"train_loss": 0.00711845001205802, "global_step": 11086, "epoch": 93, "lr": 9.459850478336993e-05} +{"train_loss": 0.011231927201151848, "global_step": 11087, "epoch": 93, "lr": 9.459750312008704e-05} +{"train_loss": 0.007964848540723324, "global_step": 11088, "epoch": 93, "lr": 9.45965013692417e-05} +{"train_loss": 0.010788374580442905, "global_step": 11089, "epoch": 93, "lr": 9.459549953083591e-05} +{"train_loss": 0.006742928177118301, "global_step": 11090, "epoch": 93, "lr": 9.459449760487161e-05} +{"train_loss": 0.009252450428903103, "global_step": 11091, "epoch": 93, "lr": 9.459349559135077e-05} +{"train_loss": 0.010304654948413372, "global_step": 11092, "epoch": 93, "lr": 9.45924934902754e-05} +{"train_loss": 0.007126336917281151, "global_step": 11093, "epoch": 93, "lr": 9.459149130164741e-05} +{"train_loss": 0.007080612704157829, "global_step": 11094, "epoch": 93, "lr": 9.459048902546879e-05} +{"train_loss": 0.005764944013208151, "global_step": 11095, "epoch": 93, "lr": 9.458948666174152e-05} +{"train_loss": 0.007141474634408951, "global_step": 11096, "epoch": 93, "lr": 9.458848421046754e-05} +{"train_loss": 0.008432071655988693, "global_step": 11097, "epoch": 93, "lr": 9.458748167164884e-05} +{"train_loss": 0.00841308943927288, "global_step": 11098, "epoch": 93, "lr": 9.458647904528738e-05} +{"train_loss": 0.010521580465137959, "global_step": 11099, "epoch": 93, "lr": 9.458547633138515e-05} +{"train_loss": 0.009620062075555325, "global_step": 11100, "epoch": 93, "lr": 9.458447352994408e-05} +{"train_loss": 0.006113116629421711, "global_step": 11101, "epoch": 93, "lr": 9.458347064096618e-05} +{"train_loss": 0.008620630949735641, "global_step": 11102, "epoch": 93, "lr": 9.458246766445338e-05} +{"train_loss": 0.011454949155449867, "global_step": 11103, "epoch": 93, "lr": 9.458146460040766e-05} +{"train_loss": 0.009742873720824718, "global_step": 11104, "epoch": 93, "lr": 9.458046144883103e-05} +{"train_loss": 0.00810165423899889, "global_step": 11105, "epoch": 93, "lr": 9.45794582097254e-05} +{"train_loss": 0.007664069999009371, "global_step": 11106, "epoch": 93, "lr": 9.457845488309278e-05} +{"train_loss": 0.010197456926107407, "global_step": 11107, "epoch": 93, "lr": 9.457745146893511e-05} +{"train_loss": 0.010571477934718132, "global_step": 11108, "epoch": 93, "lr": 9.457644796725441e-05} +{"train_loss": 0.00857614167034626, "global_step": 11109, "epoch": 93, "lr": 9.457544437805257e-05} +{"train_loss": 0.008361214771866798, "global_step": 11110, "epoch": 93, "lr": 9.457444070133164e-05} +{"train_loss": 0.009810782968997955, "global_step": 11111, "epoch": 93, "lr": 9.457343693709355e-05} +{"train_loss": 0.008150539360940456, "global_step": 11112, "epoch": 93, "lr": 9.457243308534027e-05} +{"train_loss": 0.007826524786651134, "global_step": 11113, "epoch": 93, "lr": 9.457142914607379e-05} +{"train_loss": 0.007751488592475653, "global_step": 11114, "epoch": 93, "lr": 9.457042511929606e-05} +{"train_loss": 0.010038629174232483, "global_step": 11115, "epoch": 93, "lr": 9.456942100500908e-05} +{"train_loss": 0.005562593694776297, "global_step": 11116, "epoch": 93, "lr": 9.456841680321479e-05} +{"train_loss": 0.01948029361665249, "global_step": 11117, "epoch": 93, "lr": 9.456741251391518e-05} +{"train_loss": 0.007826880551874638, "global_step": 11118, "epoch": 93, "lr": 9.456640813711222e-05} +{"train_loss": 0.012264920398592949, "global_step": 11119, "epoch": 93, "lr": 9.456540367280787e-05} +{"train_loss": 0.007375686429440975, "global_step": 11120, "epoch": 93, "lr": 9.45643991210041e-05} +{"train_loss": 0.011223811656236649, "global_step": 11121, "epoch": 93, "lr": 9.456339448170291e-05} +{"train_loss": 0.008685787208378315, "global_step": 11122, "epoch": 93, "lr": 9.456238975490625e-05} +{"train_loss": 0.012473721988499165, "global_step": 11123, "epoch": 93, "lr": 9.45613849406161e-05} +{"train_loss": 0.008434469811618328, "global_step": 11124, "epoch": 93, "lr": 9.456038003883446e-05} +{"train_loss": 0.010005106218159199, "global_step": 11125, "epoch": 93, "lr": 9.455937504956322e-05} +{"train_loss": 0.010638829320669174, "global_step": 11126, "epoch": 93, "lr": 9.455836997280445e-05} +{"train_loss": 0.006859597750008106, "global_step": 11127, "epoch": 93, "lr": 9.455736480856005e-05} +{"train_loss": 0.008539493195712566, "global_step": 11128, "epoch": 93, "lr": 9.455635955683206e-05} +{"train_loss": 0.009302685037255287, "global_step": 11129, "epoch": 93, "lr": 9.455535421762239e-05} +{"train_loss": 0.011112784035503864, "global_step": 11130, "epoch": 93, "lr": 9.455434879093306e-05} +{"train_loss": 0.011666057631373405, "global_step": 11131, "epoch": 93, "lr": 9.455334327676601e-05} +{"train_loss": 0.007737084291875362, "global_step": 11132, "epoch": 93, "lr": 9.455233767512324e-05} +{"train_loss": 0.008795066736638546, "global_step": 11133, "epoch": 93, "lr": 9.45513319860067e-05} +{"train_loss": 0.008686698041856289, "global_step": 11134, "epoch": 93, "lr": 9.45503262094184e-05} +{"train_loss": 0.007244442123919725, "global_step": 11135, "epoch": 93, "lr": 9.454932034536028e-05} +{"train_loss": 0.00724207516759634, "global_step": 11136, "epoch": 93, "lr": 9.454831439383433e-05} +{"train_loss": 0.009662602096796036, "global_step": 11137, "epoch": 93, "lr": 9.454730835484253e-05} +{"train_loss": 0.0082511305809021, "global_step": 11138, "epoch": 93, "lr": 9.454630222838685e-05} +{"train_loss": 0.008776147849857807, "global_step": 11139, "epoch": 93, "lr": 9.454529601446927e-05} +{"train_loss": 0.007625729311257601, "global_step": 11140, "epoch": 93, "lr": 9.454428971309175e-05} +{"train_loss": 0.009955322369933128, "global_step": 11141, "epoch": 93, "lr": 9.454328332425629e-05} +{"train_loss": 0.009125631302595139, "global_step": 11142, "epoch": 93, "lr": 9.454227684796482e-05} +{"train_loss": 0.006816646549850702, "global_step": 11143, "epoch": 93, "lr": 9.454127028421938e-05} +{"train_loss": 0.010524032637476921, "global_step": 11144, "epoch": 93, "lr": 9.454026363302188e-05} +{"train_loss": 0.004721964243799448, "global_step": 11145, "epoch": 93, "lr": 9.453925689437437e-05} +{"train_loss": 0.009138127788901329, "global_step": 11146, "epoch": 93, "lr": 9.453825006827877e-05} +{"train_loss": 0.011326088570058346, "global_step": 11147, "epoch": 93, "lr": 9.453724315473706e-05} +{"train_loss": 0.00994220282882452, "global_step": 11148, "epoch": 93, "lr": 9.453623615375126e-05} +{"train_loss": 0.008121658116579056, "global_step": 11149, "epoch": 93, "lr": 9.453522906532331e-05} +{"train_loss": 0.008868894539773464, "global_step": 11150, "epoch": 93, "lr": 9.453422188945517e-05} +{"train_loss": 0.006177703849971294, "global_step": 11151, "epoch": 93, "lr": 9.453321462614888e-05} +{"train_loss": 0.0062474701553583145, "global_step": 11152, "epoch": 93, "lr": 9.453220727540636e-05} +{"train_loss": 0.01012130081653595, "global_step": 11153, "epoch": 93, "lr": 9.453119983722962e-05} +{"train_loss": 0.008624473586678505, "global_step": 11154, "epoch": 93, "lr": 9.453019231162061e-05} +{"train_loss": 0.010841676965355873, "global_step": 11155, "epoch": 93, "lr": 9.452918469858134e-05} +{"train_loss": 0.01285551581531763, "global_step": 11156, "epoch": 93, "lr": 9.452817699811376e-05} +{"train_loss": 0.009741226211190224, "global_step": 11157, "epoch": 93, "lr": 9.452716921021986e-05} +{"train_loss": 0.007265668362379074, "global_step": 11158, "epoch": 93, "lr": 9.452616133490164e-05} +{"train_loss": 0.009439194574952126, "global_step": 11159, "epoch": 93, "lr": 9.452515337216105e-05} +{"train_loss": 0.008523387834429741, "global_step": 11160, "epoch": 93, "lr": 9.452414532200007e-05} +{"train_loss": 0.00787360966205597, "global_step": 11161, "epoch": 93, "lr": 9.45231371844207e-05} +{"train_loss": 0.009903574362397194, "global_step": 11162, "epoch": 93, "lr": 9.45221289594249e-05} +{"train_loss": 0.006955932825803757, "global_step": 11163, "epoch": 93, "lr": 9.452112064701465e-05} +{"train_loss": 0.007754175923764706, "global_step": 11164, "epoch": 93, "lr": 9.452011224719194e-05} +{"train_loss": 0.006833734456449747, "global_step": 11165, "epoch": 93, "lr": 9.451910375995875e-05} +{"train_loss": 0.011669116094708443, "global_step": 11166, "epoch": 93, "lr": 9.451809518531704e-05} +{"train_loss": 0.009693989530205727, "global_step": 11167, "epoch": 93, "lr": 9.451708652326883e-05} +{"train_loss": 0.00819924846291542, "global_step": 11168, "epoch": 93, "lr": 9.451607777381607e-05} +{"train_loss": 0.00899851880967617, "global_step": 11169, "epoch": 93, "lr": 9.451506893696074e-05} +{"train_loss": 0.007737305015325546, "global_step": 11170, "epoch": 93, "lr": 9.451406001270484e-05} +{"train_loss": 0.009215069934725761, "global_step": 11171, "epoch": 93, "lr": 9.451305100105033e-05} +{"train_loss": 0.006835702806711197, "global_step": 11172, "epoch": 93, "lr": 9.451204190199921e-05} +{"train_loss": 0.010986763052642345, "global_step": 11173, "epoch": 93, "lr": 9.451103271555343e-05} +{"train_loss": 0.008076200261712074, "global_step": 11174, "epoch": 93, "lr": 9.4510023441715e-05} +{"train_loss": 0.009948622435331345, "global_step": 11175, "epoch": 93, "lr": 9.450901408048591e-05} +{"train_loss": 0.008573046885430813, "global_step": 11176, "epoch": 93, "lr": 9.45080046318681e-05} +{"train_loss": 0.011399652808904648, "global_step": 11177, "epoch": 93, "lr": 9.45069950958636e-05} +{"train_loss": 0.010593193583190441, "global_step": 11178, "epoch": 93, "lr": 9.450598547247435e-05} +{"train_loss": 0.010616222396492958, "global_step": 11179, "epoch": 93, "lr": 9.450497576170237e-05} +{"train_loss": 0.01295977272093296, "global_step": 11180, "epoch": 93, "lr": 9.450396596354963e-05} +{"train_loss": 0.01147383637726307, "global_step": 11181, "epoch": 93, "lr": 9.450295607801809e-05} +{"train_loss": 0.007966331206262112, "global_step": 11182, "epoch": 93, "lr": 9.450194610510976e-05} +{"train_loss": 0.005994729232043028, "global_step": 11183, "epoch": 93, "lr": 9.45009360448266e-05} +{"train_loss": 0.009244538843631744, "global_step": 11184, "epoch": 93, "lr": 9.449992589717062e-05} +{"train_loss": 0.009157535925257105, "global_step": 11185, "epoch": 93, "lr": 9.44989156621438e-05, "val_loss": 0.025251377373933792} +{"train_loss": 0.008472536690533161, "global_step": 11186, "epoch": 94, "lr": 9.449790533974809e-05} +{"train_loss": 0.010342225432395935, "global_step": 11187, "epoch": 94, "lr": 9.44968949299855e-05} +{"train_loss": 0.011317766271531582, "global_step": 11188, "epoch": 94, "lr": 9.449588443285801e-05} +{"train_loss": 0.0064123827032744884, "global_step": 11189, "epoch": 94, "lr": 9.449487384836762e-05} +{"train_loss": 0.013158980756998062, "global_step": 11190, "epoch": 94, "lr": 9.44938631765163e-05} +{"train_loss": 0.008882610127329826, "global_step": 11191, "epoch": 94, "lr": 9.449285241730601e-05} +{"train_loss": 0.009694838896393776, "global_step": 11192, "epoch": 94, "lr": 9.449184157073877e-05} +{"train_loss": 0.007714702747762203, "global_step": 11193, "epoch": 94, "lr": 9.449083063681656e-05} +{"train_loss": 0.013439221307635307, "global_step": 11194, "epoch": 94, "lr": 9.448981961554135e-05} +{"train_loss": 0.011447099037468433, "global_step": 11195, "epoch": 94, "lr": 9.448880850691513e-05} +{"train_loss": 0.009686683304607868, "global_step": 11196, "epoch": 94, "lr": 9.448779731093989e-05} +{"train_loss": 0.006577802821993828, "global_step": 11197, "epoch": 94, "lr": 9.44867860276176e-05} +{"train_loss": 0.009098141454160213, "global_step": 11198, "epoch": 94, "lr": 9.448577465695028e-05} +{"train_loss": 0.006897012237459421, "global_step": 11199, "epoch": 94, "lr": 9.448476319893989e-05} +{"train_loss": 0.006208874750882387, "global_step": 11200, "epoch": 94, "lr": 9.448375165358841e-05} +{"train_loss": 0.011418458074331284, "global_step": 11201, "epoch": 94, "lr": 9.448274002089783e-05} +{"train_loss": 0.007559751160442829, "global_step": 11202, "epoch": 94, "lr": 9.448172830087017e-05} +{"train_loss": 0.006838472094386816, "global_step": 11203, "epoch": 94, "lr": 9.448071649350736e-05} +{"train_loss": 0.006185399834066629, "global_step": 11204, "epoch": 94, "lr": 9.447970459881144e-05} +{"train_loss": 0.00886356458067894, "global_step": 11205, "epoch": 94, "lr": 9.447869261678435e-05} +{"train_loss": 0.007948873564600945, "global_step": 11206, "epoch": 94, "lr": 9.447768054742811e-05} +{"train_loss": 0.008035890758037567, "global_step": 11207, "epoch": 94, "lr": 9.44766683907447e-05} +{"train_loss": 0.006384807173162699, "global_step": 11208, "epoch": 94, "lr": 9.447565614673609e-05} +{"train_loss": 0.006164052989333868, "global_step": 11209, "epoch": 94, "lr": 9.447464381540429e-05} +{"train_loss": 0.008267735131084919, "global_step": 11210, "epoch": 94, "lr": 9.447363139675128e-05} +{"train_loss": 0.011796497739851475, "global_step": 11211, "epoch": 94, "lr": 9.447261889077902e-05} +{"train_loss": 0.008187706582248211, "global_step": 11212, "epoch": 94, "lr": 9.447160629748957e-05} +{"train_loss": 0.008609768003225327, "global_step": 11213, "epoch": 94, "lr": 9.447059361688484e-05} +{"train_loss": 0.007619936019182205, "global_step": 11214, "epoch": 94, "lr": 9.446958084896686e-05} +{"train_loss": 0.012515871785581112, "global_step": 11215, "epoch": 94, "lr": 9.44685679937376e-05} +{"train_loss": 0.010494571179151535, "global_step": 11216, "epoch": 94, "lr": 9.446755505119907e-05} +{"train_loss": 0.012375270947813988, "global_step": 11217, "epoch": 94, "lr": 9.446654202135323e-05} +{"train_loss": 0.010344762355089188, "global_step": 11218, "epoch": 94, "lr": 9.44655289042021e-05} +{"train_loss": 0.009117056615650654, "global_step": 11219, "epoch": 94, "lr": 9.446451569974766e-05} +{"train_loss": 0.008143914863467216, "global_step": 11220, "epoch": 94, "lr": 9.446350240799188e-05} +{"train_loss": 0.01024574413895607, "global_step": 11221, "epoch": 94, "lr": 9.446248902893678e-05} +{"train_loss": 0.01058848388493061, "global_step": 11222, "epoch": 94, "lr": 9.446147556258431e-05} +{"train_loss": 0.012205167673528194, "global_step": 11223, "epoch": 94, "lr": 9.44604620089365e-05} +{"train_loss": 0.010943938046693802, "global_step": 11224, "epoch": 94, "lr": 9.445944836799532e-05} +{"train_loss": 0.010475839488208294, "global_step": 11225, "epoch": 94, "lr": 9.445843463976275e-05} +{"train_loss": 0.010463581420481205, "global_step": 11226, "epoch": 94, "lr": 9.44574208242408e-05} +{"train_loss": 0.009350674226880074, "global_step": 11227, "epoch": 94, "lr": 9.445640692143145e-05} +{"train_loss": 0.008868778124451637, "global_step": 11228, "epoch": 94, "lr": 9.445539293133672e-05} +{"train_loss": 0.011963714845478535, "global_step": 11229, "epoch": 94, "lr": 9.445437885395854e-05} +{"train_loss": 0.00949823297560215, "global_step": 11230, "epoch": 94, "lr": 9.445336468929895e-05} +{"train_loss": 0.005315128248184919, "global_step": 11231, "epoch": 94, "lr": 9.445235043735994e-05} +{"train_loss": 0.005757275503128767, "global_step": 11232, "epoch": 94, "lr": 9.445133609814348e-05} +{"train_loss": 0.00725181307643652, "global_step": 11233, "epoch": 94, "lr": 9.445032167165157e-05} +{"train_loss": 0.006826045922935009, "global_step": 11234, "epoch": 94, "lr": 9.44493071578862e-05} +{"train_loss": 0.007079609204083681, "global_step": 11235, "epoch": 94, "lr": 9.444829255684937e-05} +{"train_loss": 0.009187350049614906, "global_step": 11236, "epoch": 94, "lr": 9.444727786854306e-05} +{"train_loss": 0.01063583418726921, "global_step": 11237, "epoch": 94, "lr": 9.444626309296927e-05} +{"train_loss": 0.007429668214172125, "global_step": 11238, "epoch": 94, "lr": 9.444524823013e-05} +{"train_loss": 0.009449692443013191, "global_step": 11239, "epoch": 94, "lr": 9.44442332800272e-05} +{"train_loss": 0.014720008708536625, "global_step": 11240, "epoch": 94, "lr": 9.444321824266293e-05} +{"train_loss": 0.006437482312321663, "global_step": 11241, "epoch": 94, "lr": 9.444220311803915e-05} +{"train_loss": 0.0067260549403727055, "global_step": 11242, "epoch": 94, "lr": 9.444118790615784e-05} +{"train_loss": 0.008754401467740536, "global_step": 11243, "epoch": 94, "lr": 9.4440172607021e-05} +{"train_loss": 0.010076656937599182, "global_step": 11244, "epoch": 94, "lr": 9.443915722063063e-05} +{"train_loss": 0.008569181896746159, "global_step": 11245, "epoch": 94, "lr": 9.443814174698875e-05} +{"train_loss": 0.006735015660524368, "global_step": 11246, "epoch": 94, "lr": 9.44371261860973e-05} +{"train_loss": 0.009455202147364616, "global_step": 11247, "epoch": 94, "lr": 9.44361105379583e-05} +{"train_loss": 0.006956123746931553, "global_step": 11248, "epoch": 94, "lr": 9.443509480257375e-05} +{"train_loss": 0.009982888586819172, "global_step": 11249, "epoch": 94, "lr": 9.443407897994563e-05} +{"train_loss": 0.012815717607736588, "global_step": 11250, "epoch": 94, "lr": 9.443306307007596e-05} +{"train_loss": 0.007508785929530859, "global_step": 11251, "epoch": 94, "lr": 9.44320470729667e-05} +{"train_loss": 0.011970414780080318, "global_step": 11252, "epoch": 94, "lr": 9.443103098861988e-05} +{"train_loss": 0.009640078991651535, "global_step": 11253, "epoch": 94, "lr": 9.443001481703746e-05} +{"train_loss": 0.005485962610691786, "global_step": 11254, "epoch": 94, "lr": 9.442899855822147e-05} +{"train_loss": 0.008799511007964611, "global_step": 11255, "epoch": 94, "lr": 9.442798221217387e-05} +{"train_loss": 0.014645430259406567, "global_step": 11256, "epoch": 94, "lr": 9.44269657788967e-05} +{"train_loss": 0.0055817789398133755, "global_step": 11257, "epoch": 94, "lr": 9.44259492583919e-05} +{"train_loss": 0.006907702423632145, "global_step": 11258, "epoch": 94, "lr": 9.44249326506615e-05} +{"train_loss": 0.01063777320086956, "global_step": 11259, "epoch": 94, "lr": 9.44239159557075e-05} +{"train_loss": 0.007439331151545048, "global_step": 11260, "epoch": 94, "lr": 9.442289917353188e-05} +{"train_loss": 0.013555405661463737, "global_step": 11261, "epoch": 94, "lr": 9.442188230413665e-05} +{"train_loss": 0.007409267593175173, "global_step": 11262, "epoch": 94, "lr": 9.442086534752379e-05} +{"train_loss": 0.008131089620292187, "global_step": 11263, "epoch": 94, "lr": 9.441984830369532e-05} +{"train_loss": 0.011581385508179665, "global_step": 11264, "epoch": 94, "lr": 9.441883117265322e-05} +{"train_loss": 0.01155538484454155, "global_step": 11265, "epoch": 94, "lr": 9.441781395439949e-05} +{"train_loss": 0.00748464185744524, "global_step": 11266, "epoch": 94, "lr": 9.441679664893612e-05} +{"train_loss": 0.00943372119218111, "global_step": 11267, "epoch": 94, "lr": 9.441577925626513e-05} +{"train_loss": 0.011258045211434364, "global_step": 11268, "epoch": 94, "lr": 9.441476177638848e-05} +{"train_loss": 0.010384014807641506, "global_step": 11269, "epoch": 94, "lr": 9.44137442093082e-05} +{"train_loss": 0.01037132740020752, "global_step": 11270, "epoch": 94, "lr": 9.441272655502628e-05} +{"train_loss": 0.01002086978405714, "global_step": 11271, "epoch": 94, "lr": 9.441170881354473e-05} +{"train_loss": 0.009815514087677002, "global_step": 11272, "epoch": 94, "lr": 9.441069098486552e-05} +{"train_loss": 0.007890804670751095, "global_step": 11273, "epoch": 94, "lr": 9.440967306899066e-05} +{"train_loss": 0.005991703364998102, "global_step": 11274, "epoch": 94, "lr": 9.440865506592215e-05} +{"train_loss": 0.007973539642989635, "global_step": 11275, "epoch": 94, "lr": 9.4407636975662e-05} +{"train_loss": 0.011192373000085354, "global_step": 11276, "epoch": 94, "lr": 9.44066187982122e-05} +{"train_loss": 0.009356859140098095, "global_step": 11277, "epoch": 94, "lr": 9.440560053357473e-05} +{"train_loss": 0.011136654764413834, "global_step": 11278, "epoch": 94, "lr": 9.440458218175163e-05} +{"train_loss": 0.011937384493649006, "global_step": 11279, "epoch": 94, "lr": 9.440356374274487e-05} +{"train_loss": 0.008222031407058239, "global_step": 11280, "epoch": 94, "lr": 9.440254521655645e-05} +{"train_loss": 0.007566260639578104, "global_step": 11281, "epoch": 94, "lr": 9.440152660318838e-05} +{"train_loss": 0.007923168130218983, "global_step": 11282, "epoch": 94, "lr": 9.440050790264265e-05} +{"train_loss": 0.013467755168676376, "global_step": 11283, "epoch": 94, "lr": 9.439948911492127e-05} +{"train_loss": 0.0069926162250339985, "global_step": 11284, "epoch": 94, "lr": 9.439847024002625e-05} +{"train_loss": 0.009895294904708862, "global_step": 11285, "epoch": 94, "lr": 9.439745127795957e-05} +{"train_loss": 0.008327987976372242, "global_step": 11286, "epoch": 94, "lr": 9.439643222872323e-05} +{"train_loss": 0.015148142352700233, "global_step": 11287, "epoch": 94, "lr": 9.439541309231924e-05} +{"train_loss": 0.00885116308927536, "global_step": 11288, "epoch": 94, "lr": 9.43943938687496e-05} +{"train_loss": 0.013559114187955856, "global_step": 11289, "epoch": 94, "lr": 9.43933745580163e-05} +{"train_loss": 0.007088244426995516, "global_step": 11290, "epoch": 94, "lr": 9.439235516012136e-05} +{"train_loss": 0.00995259452611208, "global_step": 11291, "epoch": 94, "lr": 9.439133567506679e-05} +{"train_loss": 0.006221582647413015, "global_step": 11292, "epoch": 94, "lr": 9.439031610285455e-05} +{"train_loss": 0.00639951741322875, "global_step": 11293, "epoch": 94, "lr": 9.438929644348668e-05} +{"train_loss": 0.008174138143658638, "global_step": 11294, "epoch": 94, "lr": 9.438827669696518e-05} +{"train_loss": 0.007815206423401833, "global_step": 11295, "epoch": 94, "lr": 9.438725686329202e-05} +{"train_loss": 0.009674306958913803, "global_step": 11296, "epoch": 94, "lr": 9.438623694246924e-05} +{"train_loss": 0.01078168023377657, "global_step": 11297, "epoch": 94, "lr": 9.438521693449882e-05} +{"train_loss": 0.005991336889564991, "global_step": 11298, "epoch": 94, "lr": 9.438419683938275e-05} +{"train_loss": 0.00880727730691433, "global_step": 11299, "epoch": 94, "lr": 9.438317665712307e-05} +{"train_loss": 0.006743303034454584, "global_step": 11300, "epoch": 94, "lr": 9.438215638772176e-05} +{"train_loss": 0.007253015413880348, "global_step": 11301, "epoch": 94, "lr": 9.438113603118084e-05} +{"train_loss": 0.009564925916492939, "global_step": 11302, "epoch": 94, "lr": 9.438011558750228e-05} +{"train_loss": 0.00879182480275631, "global_step": 11303, "epoch": 94, "lr": 9.437909505668812e-05} +{"train_loss": 0.009141258711480544, "global_step": 11304, "epoch": 94, "lr": 9.437807443874034e-05, "val_loss": 0.02038136124610901} +{"train_loss": 0.008091554045677185, "global_step": 11305, "epoch": 95, "lr": 9.437705373366095e-05} +{"train_loss": 0.00937293004244566, "global_step": 11306, "epoch": 95, "lr": 9.437603294145197e-05} +{"train_loss": 0.008476673625409603, "global_step": 11307, "epoch": 95, "lr": 9.437501206211536e-05} +{"train_loss": 0.008925311267375946, "global_step": 11308, "epoch": 95, "lr": 9.437399109565319e-05} +{"train_loss": 0.010759826749563217, "global_step": 11309, "epoch": 95, "lr": 9.437297004206741e-05} +{"train_loss": 0.010750558227300644, "global_step": 11310, "epoch": 95, "lr": 9.437194890136006e-05} +{"train_loss": 0.012160423211753368, "global_step": 11311, "epoch": 95, "lr": 9.43709276735331e-05} +{"train_loss": 0.009825755842030048, "global_step": 11312, "epoch": 95, "lr": 9.436990635858858e-05} +{"train_loss": 0.010861504822969437, "global_step": 11313, "epoch": 95, "lr": 9.43688849565285e-05} +{"train_loss": 0.008037138730287552, "global_step": 11314, "epoch": 95, "lr": 9.436786346735483e-05} +{"train_loss": 0.006581733003258705, "global_step": 11315, "epoch": 95, "lr": 9.436684189106962e-05} +{"train_loss": 0.011139520443975925, "global_step": 11316, "epoch": 95, "lr": 9.436582022767484e-05} +{"train_loss": 0.012299305759370327, "global_step": 11317, "epoch": 95, "lr": 9.436479847717252e-05} +{"train_loss": 0.008422105573117733, "global_step": 11318, "epoch": 95, "lr": 9.436377663956468e-05} +{"train_loss": 0.008036565035581589, "global_step": 11319, "epoch": 95, "lr": 9.436275471485328e-05} +{"train_loss": 0.007181402295827866, "global_step": 11320, "epoch": 95, "lr": 9.436173270304034e-05} +{"train_loss": 0.0106546925380826, "global_step": 11321, "epoch": 95, "lr": 9.43607106041279e-05} +{"train_loss": 0.008611327968537807, "global_step": 11322, "epoch": 95, "lr": 9.435968841811793e-05} +{"train_loss": 0.007691127248108387, "global_step": 11323, "epoch": 95, "lr": 9.435866614501245e-05} +{"train_loss": 0.00877902191132307, "global_step": 11324, "epoch": 95, "lr": 9.435764378481348e-05} +{"train_loss": 0.013675265945494175, "global_step": 11325, "epoch": 95, "lr": 9.4356621337523e-05} +{"train_loss": 0.010333058424293995, "global_step": 11326, "epoch": 95, "lr": 9.435559880314306e-05} +{"train_loss": 0.00768829183652997, "global_step": 11327, "epoch": 95, "lr": 9.435457618167561e-05} +{"train_loss": 0.00789455883204937, "global_step": 11328, "epoch": 95, "lr": 9.435355347312272e-05} +{"train_loss": 0.009766723960638046, "global_step": 11329, "epoch": 95, "lr": 9.435253067748632e-05} +{"train_loss": 0.010763094760477543, "global_step": 11330, "epoch": 95, "lr": 9.43515077947685e-05} +{"train_loss": 0.008495774120092392, "global_step": 11331, "epoch": 95, "lr": 9.435048482497123e-05} +{"train_loss": 0.007554680574685335, "global_step": 11332, "epoch": 95, "lr": 9.434946176809651e-05} +{"train_loss": 0.00893651507794857, "global_step": 11333, "epoch": 95, "lr": 9.434843862414637e-05} +{"train_loss": 0.006069141905754805, "global_step": 11334, "epoch": 95, "lr": 9.43474153931228e-05} +{"train_loss": 0.007823344320058823, "global_step": 11335, "epoch": 95, "lr": 9.434639207502782e-05} +{"train_loss": 0.008906823582947254, "global_step": 11336, "epoch": 95, "lr": 9.434536866986344e-05} +{"train_loss": 0.008130226284265518, "global_step": 11337, "epoch": 95, "lr": 9.434434517763167e-05} +{"train_loss": 0.011156980879604816, "global_step": 11338, "epoch": 95, "lr": 9.434332159833451e-05} +{"train_loss": 0.014391258358955383, "global_step": 11339, "epoch": 95, "lr": 9.434229793197397e-05} +{"train_loss": 0.01070998515933752, "global_step": 11340, "epoch": 95, "lr": 9.434127417855208e-05} +{"train_loss": 0.01048197690397501, "global_step": 11341, "epoch": 95, "lr": 9.434025033807082e-05} +{"train_loss": 0.011597861535847187, "global_step": 11342, "epoch": 95, "lr": 9.433922641053223e-05} +{"train_loss": 0.011490407399833202, "global_step": 11343, "epoch": 95, "lr": 9.43382023959383e-05} +{"train_loss": 0.009072156623005867, "global_step": 11344, "epoch": 95, "lr": 9.433717829429104e-05} +{"train_loss": 0.011760878376662731, "global_step": 11345, "epoch": 95, "lr": 9.433615410559246e-05} +{"train_loss": 0.004884479567408562, "global_step": 11346, "epoch": 95, "lr": 9.43351298298446e-05} +{"train_loss": 0.00765087828040123, "global_step": 11347, "epoch": 95, "lr": 9.433410546704944e-05} +{"train_loss": 0.0087893670424819, "global_step": 11348, "epoch": 95, "lr": 9.4333081017209e-05} +{"train_loss": 0.01155620627105236, "global_step": 11349, "epoch": 95, "lr": 9.433205648032528e-05} +{"train_loss": 0.008676123805344105, "global_step": 11350, "epoch": 95, "lr": 9.433103185640032e-05} +{"train_loss": 0.006270159501582384, "global_step": 11351, "epoch": 95, "lr": 9.433000714543611e-05} +{"train_loss": 0.009846319444477558, "global_step": 11352, "epoch": 95, "lr": 9.432898234743466e-05} +{"train_loss": 0.005887516774237156, "global_step": 11353, "epoch": 95, "lr": 9.4327957462398e-05} +{"train_loss": 0.009949753060936928, "global_step": 11354, "epoch": 95, "lr": 9.432693249032812e-05} +{"train_loss": 0.008438954129815102, "global_step": 11355, "epoch": 95, "lr": 9.432590743122705e-05} +{"train_loss": 0.00926282536238432, "global_step": 11356, "epoch": 95, "lr": 9.432488228509679e-05} +{"train_loss": 0.008675153367221355, "global_step": 11357, "epoch": 95, "lr": 9.432385705193939e-05} +{"train_loss": 0.01399616152048111, "global_step": 11358, "epoch": 95, "lr": 9.432283173175679e-05} +{"train_loss": 0.008891071192920208, "global_step": 11359, "epoch": 95, "lr": 9.432180632455107e-05} +{"train_loss": 0.008590789511799812, "global_step": 11360, "epoch": 95, "lr": 9.43207808303242e-05} +{"train_loss": 0.008363097906112671, "global_step": 11361, "epoch": 95, "lr": 9.431975524907823e-05} +{"train_loss": 0.006602896377444267, "global_step": 11362, "epoch": 95, "lr": 9.431872958081514e-05} +{"train_loss": 0.007627230137586594, "global_step": 11363, "epoch": 95, "lr": 9.431770382553698e-05} +{"train_loss": 0.007796944584697485, "global_step": 11364, "epoch": 95, "lr": 9.431667798324573e-05} +{"train_loss": 0.006385129876434803, "global_step": 11365, "epoch": 95, "lr": 9.431565205394341e-05} +{"train_loss": 0.009559519588947296, "global_step": 11366, "epoch": 95, "lr": 9.431462603763205e-05} +{"train_loss": 0.0062568774446845055, "global_step": 11367, "epoch": 95, "lr": 9.431359993431366e-05} +{"train_loss": 0.007189527153968811, "global_step": 11368, "epoch": 95, "lr": 9.431257374399024e-05} +{"train_loss": 0.006543993018567562, "global_step": 11369, "epoch": 95, "lr": 9.431154746666383e-05} +{"train_loss": 0.007642163895070553, "global_step": 11370, "epoch": 95, "lr": 9.431052110233641e-05} +{"train_loss": 0.007971329614520073, "global_step": 11371, "epoch": 95, "lr": 9.430949465101003e-05} +{"train_loss": 0.00843915157020092, "global_step": 11372, "epoch": 95, "lr": 9.43084681126867e-05} +{"train_loss": 0.008672846481204033, "global_step": 11373, "epoch": 95, "lr": 9.430744148736841e-05} +{"train_loss": 0.007399349007755518, "global_step": 11374, "epoch": 95, "lr": 9.43064147750572e-05} +{"train_loss": 0.005006512627005577, "global_step": 11375, "epoch": 95, "lr": 9.430538797575508e-05} +{"train_loss": 0.006915573962032795, "global_step": 11376, "epoch": 95, "lr": 9.430436108946406e-05} +{"train_loss": 0.007269921246916056, "global_step": 11377, "epoch": 95, "lr": 9.430333411618614e-05} +{"train_loss": 0.008867194876074791, "global_step": 11378, "epoch": 95, "lr": 9.430230705592339e-05} +{"train_loss": 0.008638249710202217, "global_step": 11379, "epoch": 95, "lr": 9.430127990867777e-05} +{"train_loss": 0.00960068590939045, "global_step": 11380, "epoch": 95, "lr": 9.430025267445132e-05} +{"train_loss": 0.009026122279465199, "global_step": 11381, "epoch": 95, "lr": 9.429922535324607e-05} +{"train_loss": 0.008198975585401058, "global_step": 11382, "epoch": 95, "lr": 9.429819794506402e-05} +{"train_loss": 0.006140575278550386, "global_step": 11383, "epoch": 95, "lr": 9.429717044990721e-05} +{"train_loss": 0.009835345670580864, "global_step": 11384, "epoch": 95, "lr": 9.429614286777762e-05} +{"train_loss": 0.009494291618466377, "global_step": 11385, "epoch": 95, "lr": 9.429511519867728e-05} +{"train_loss": 0.010688422247767448, "global_step": 11386, "epoch": 95, "lr": 9.429408744260821e-05} +{"train_loss": 0.008837264962494373, "global_step": 11387, "epoch": 95, "lr": 9.429305959957244e-05} +{"train_loss": 0.007058882620185614, "global_step": 11388, "epoch": 95, "lr": 9.429203166957199e-05} +{"train_loss": 0.010827808640897274, "global_step": 11389, "epoch": 95, "lr": 9.429100365260885e-05} +{"train_loss": 0.00812163483351469, "global_step": 11390, "epoch": 95, "lr": 9.428997554868506e-05} +{"train_loss": 0.007704177405685186, "global_step": 11391, "epoch": 95, "lr": 9.428894735780264e-05} +{"train_loss": 0.011149239726364613, "global_step": 11392, "epoch": 95, "lr": 9.42879190799636e-05} +{"train_loss": 0.003851983230561018, "global_step": 11393, "epoch": 95, "lr": 9.428689071516997e-05} +{"train_loss": 0.014230526983737946, "global_step": 11394, "epoch": 95, "lr": 9.428586226342376e-05} +{"train_loss": 0.007631728891283274, "global_step": 11395, "epoch": 95, "lr": 9.428483372472697e-05} +{"train_loss": 0.00811344850808382, "global_step": 11396, "epoch": 95, "lr": 9.428380509908166e-05} +{"train_loss": 0.008338353596627712, "global_step": 11397, "epoch": 95, "lr": 9.428277638648984e-05} +{"train_loss": 0.0077524492517113686, "global_step": 11398, "epoch": 95, "lr": 9.42817475869535e-05} +{"train_loss": 0.007377697620540857, "global_step": 11399, "epoch": 95, "lr": 9.428071870047467e-05} +{"train_loss": 0.010230707004666328, "global_step": 11400, "epoch": 95, "lr": 9.42796897270554e-05} +{"train_loss": 0.009907186031341553, "global_step": 11401, "epoch": 95, "lr": 9.427866066669768e-05} +{"train_loss": 0.007395570166409016, "global_step": 11402, "epoch": 95, "lr": 9.427763151940354e-05} +{"train_loss": 0.011774841696023941, "global_step": 11403, "epoch": 95, "lr": 9.427660228517501e-05} +{"train_loss": 0.007973838597536087, "global_step": 11404, "epoch": 95, "lr": 9.42755729640141e-05} +{"train_loss": 0.0066438959911465645, "global_step": 11405, "epoch": 95, "lr": 9.427454355592282e-05} +{"train_loss": 0.009318520314991474, "global_step": 11406, "epoch": 95, "lr": 9.427351406090322e-05} +{"train_loss": 0.004548258148133755, "global_step": 11407, "epoch": 95, "lr": 9.427248447895729e-05} +{"train_loss": 0.007838635705411434, "global_step": 11408, "epoch": 95, "lr": 9.427145481008707e-05} +{"train_loss": 0.008440511301159859, "global_step": 11409, "epoch": 95, "lr": 9.42704250542946e-05} +{"train_loss": 0.009258009493350983, "global_step": 11410, "epoch": 95, "lr": 9.426939521158186e-05} +{"train_loss": 0.005998942069709301, "global_step": 11411, "epoch": 95, "lr": 9.426836528195089e-05} +{"train_loss": 0.013866801746189594, "global_step": 11412, "epoch": 95, "lr": 9.426733526540372e-05} +{"train_loss": 0.005676943343132734, "global_step": 11413, "epoch": 95, "lr": 9.426630516194237e-05} +{"train_loss": 0.00846098829060793, "global_step": 11414, "epoch": 95, "lr": 9.426527497156885e-05} +{"train_loss": 0.010767532512545586, "global_step": 11415, "epoch": 95, "lr": 9.42642446942852e-05} +{"train_loss": 0.010545680299401283, "global_step": 11416, "epoch": 95, "lr": 9.426321433009343e-05} +{"train_loss": 0.006168821826577187, "global_step": 11417, "epoch": 95, "lr": 9.426218387899557e-05} +{"train_loss": 0.006621931679546833, "global_step": 11418, "epoch": 95, "lr": 9.426115334099364e-05} +{"train_loss": 0.01007629930973053, "global_step": 11419, "epoch": 95, "lr": 9.426012271608966e-05} +{"train_loss": 0.008583871647715569, "global_step": 11420, "epoch": 95, "lr": 9.425909200428565e-05} +{"train_loss": 0.005891666281968355, "global_step": 11421, "epoch": 95, "lr": 9.425806120558366e-05} +{"train_loss": 0.010628217831254005, "global_step": 11422, "epoch": 95, "lr": 9.425703031998569e-05} +{"train_loss": 0.008808243147121007, "global_step": 11423, "epoch": 95, "lr": 9.425599934749377e-05, "val_loss": 0.014634950086474419, "train_action_mse_error": 0.0003478563448879868} +{"train_loss": 0.008105977438390255, "global_step": 11424, "epoch": 96, "lr": 9.425496828810991e-05} +{"train_loss": 0.010023696348071098, "global_step": 11425, "epoch": 96, "lr": 9.425393714183616e-05} +{"train_loss": 0.005686366464942694, "global_step": 11426, "epoch": 96, "lr": 9.425290590867452e-05} +{"train_loss": 0.010711449198424816, "global_step": 11427, "epoch": 96, "lr": 9.425187458862704e-05} +{"train_loss": 0.009381084702908993, "global_step": 11428, "epoch": 96, "lr": 9.425084318169573e-05} +{"train_loss": 0.0071750907227396965, "global_step": 11429, "epoch": 96, "lr": 9.424981168788261e-05} +{"train_loss": 0.00931398943066597, "global_step": 11430, "epoch": 96, "lr": 9.424878010718971e-05} +{"train_loss": 0.011400526389479637, "global_step": 11431, "epoch": 96, "lr": 9.424774843961907e-05} +{"train_loss": 0.008282748982310295, "global_step": 11432, "epoch": 96, "lr": 9.424671668517271e-05} +{"train_loss": 0.0073761409148573875, "global_step": 11433, "epoch": 96, "lr": 9.424568484385264e-05} +{"train_loss": 0.006742639467120171, "global_step": 11434, "epoch": 96, "lr": 9.424465291566088e-05} +{"train_loss": 0.008687256835401058, "global_step": 11435, "epoch": 96, "lr": 9.424362090059949e-05} +{"train_loss": 0.012667057104408741, "global_step": 11436, "epoch": 96, "lr": 9.424258879867046e-05} +{"train_loss": 0.006172840483486652, "global_step": 11437, "epoch": 96, "lr": 9.424155660987583e-05} +{"train_loss": 0.008640115149319172, "global_step": 11438, "epoch": 96, "lr": 9.424052433421767e-05} +{"train_loss": 0.008768915198743343, "global_step": 11439, "epoch": 96, "lr": 9.423949197169792e-05} +{"train_loss": 0.00803481787443161, "global_step": 11440, "epoch": 96, "lr": 9.423845952231868e-05} +{"train_loss": 0.00892692431807518, "global_step": 11441, "epoch": 96, "lr": 9.423742698608195e-05} +{"train_loss": 0.00488618016242981, "global_step": 11442, "epoch": 96, "lr": 9.423639436298974e-05} +{"train_loss": 0.010343324393033981, "global_step": 11443, "epoch": 96, "lr": 9.423536165304412e-05} +{"train_loss": 0.005569291301071644, "global_step": 11444, "epoch": 96, "lr": 9.423432885624708e-05} +{"train_loss": 0.007185892667621374, "global_step": 11445, "epoch": 96, "lr": 9.423329597260065e-05} +{"train_loss": 0.012553286738693714, "global_step": 11446, "epoch": 96, "lr": 9.42322630021069e-05} +{"train_loss": 0.006340092979371548, "global_step": 11447, "epoch": 96, "lr": 9.42312299447678e-05} +{"train_loss": 0.005616867449134588, "global_step": 11448, "epoch": 96, "lr": 9.423019680058541e-05} +{"train_loss": 0.00917036272585392, "global_step": 11449, "epoch": 96, "lr": 9.422916356956175e-05} +{"train_loss": 0.013853086158633232, "global_step": 11450, "epoch": 96, "lr": 9.422813025169888e-05} +{"train_loss": 0.006985208950936794, "global_step": 11451, "epoch": 96, "lr": 9.422709684699877e-05} +{"train_loss": 0.006481615826487541, "global_step": 11452, "epoch": 96, "lr": 9.42260633554635e-05} +{"train_loss": 0.009474290534853935, "global_step": 11453, "epoch": 96, "lr": 9.422502977709507e-05} +{"train_loss": 0.00963735394179821, "global_step": 11454, "epoch": 96, "lr": 9.422399611189552e-05} +{"train_loss": 0.007323599420487881, "global_step": 11455, "epoch": 96, "lr": 9.422296235986688e-05} +{"train_loss": 0.005877105053514242, "global_step": 11456, "epoch": 96, "lr": 9.422192852101117e-05} +{"train_loss": 0.007971125654876232, "global_step": 11457, "epoch": 96, "lr": 9.422089459533043e-05} +{"train_loss": 0.009716170839965343, "global_step": 11458, "epoch": 96, "lr": 9.421986058282671e-05} +{"train_loss": 0.010298546403646469, "global_step": 11459, "epoch": 96, "lr": 9.421882648350198e-05} +{"train_loss": 0.012977579608559608, "global_step": 11460, "epoch": 96, "lr": 9.421779229735833e-05} +{"train_loss": 0.008230654522776604, "global_step": 11461, "epoch": 96, "lr": 9.421675802439778e-05} +{"train_loss": 0.004735609050840139, "global_step": 11462, "epoch": 96, "lr": 9.421572366462232e-05} +{"train_loss": 0.013541707769036293, "global_step": 11463, "epoch": 96, "lr": 9.421468921803403e-05} +{"train_loss": 0.006729679647833109, "global_step": 11464, "epoch": 96, "lr": 9.421365468463493e-05} +{"train_loss": 0.011340988799929619, "global_step": 11465, "epoch": 96, "lr": 9.421262006442702e-05} +{"train_loss": 0.007480669766664505, "global_step": 11466, "epoch": 96, "lr": 9.421158535741237e-05} +{"train_loss": 0.006870304234325886, "global_step": 11467, "epoch": 96, "lr": 9.421055056359299e-05} +{"train_loss": 0.007226103451102972, "global_step": 11468, "epoch": 96, "lr": 9.420951568297091e-05} +{"train_loss": 0.005254613701254129, "global_step": 11469, "epoch": 96, "lr": 9.420848071554818e-05} +{"train_loss": 0.008519403636455536, "global_step": 11470, "epoch": 96, "lr": 9.420744566132683e-05} +{"train_loss": 0.006800075992941856, "global_step": 11471, "epoch": 96, "lr": 9.420641052030885e-05} +{"train_loss": 0.007709472440183163, "global_step": 11472, "epoch": 96, "lr": 9.420537529249634e-05} +{"train_loss": 0.008168306201696396, "global_step": 11473, "epoch": 96, "lr": 9.420433997789129e-05} +{"train_loss": 0.007721858099102974, "global_step": 11474, "epoch": 96, "lr": 9.420330457649573e-05} +{"train_loss": 0.009044786915183067, "global_step": 11475, "epoch": 96, "lr": 9.420226908831171e-05} +{"train_loss": 0.011669463478028774, "global_step": 11476, "epoch": 96, "lr": 9.420123351334125e-05} +{"train_loss": 0.006136368494480848, "global_step": 11477, "epoch": 96, "lr": 9.42001978515864e-05} +{"train_loss": 0.010070154443383217, "global_step": 11478, "epoch": 96, "lr": 9.419916210304917e-05} +{"train_loss": 0.00454860320314765, "global_step": 11479, "epoch": 96, "lr": 9.419812626773163e-05} +{"train_loss": 0.009686559438705444, "global_step": 11480, "epoch": 96, "lr": 9.419709034563578e-05} +{"train_loss": 0.007250199094414711, "global_step": 11481, "epoch": 96, "lr": 9.419605433676366e-05} +{"train_loss": 0.010149813257157803, "global_step": 11482, "epoch": 96, "lr": 9.419501824111732e-05} +{"train_loss": 0.006612979806959629, "global_step": 11483, "epoch": 96, "lr": 9.419398205869876e-05} +{"train_loss": 0.00908423401415348, "global_step": 11484, "epoch": 96, "lr": 9.419294578951006e-05} +{"train_loss": 0.008526215329766273, "global_step": 11485, "epoch": 96, "lr": 9.419190943355322e-05} +{"train_loss": 0.0055245039984583855, "global_step": 11486, "epoch": 96, "lr": 9.419087299083029e-05} +{"train_loss": 0.007363402750343084, "global_step": 11487, "epoch": 96, "lr": 9.418983646134332e-05} +{"train_loss": 0.006396145094186068, "global_step": 11488, "epoch": 96, "lr": 9.41887998450943e-05} +{"train_loss": 0.004703880753368139, "global_step": 11489, "epoch": 96, "lr": 9.41877631420853e-05} +{"train_loss": 0.008012760430574417, "global_step": 11490, "epoch": 96, "lr": 9.418672635231835e-05} +{"train_loss": 0.009730661287903786, "global_step": 11491, "epoch": 96, "lr": 9.418568947579549e-05} +{"train_loss": 0.0065176342613995075, "global_step": 11492, "epoch": 96, "lr": 9.418465251251875e-05} +{"train_loss": 0.008489388972520828, "global_step": 11493, "epoch": 96, "lr": 9.418361546249017e-05} +{"train_loss": 0.00825645960867405, "global_step": 11494, "epoch": 96, "lr": 9.418257832571176e-05} +{"train_loss": 0.006608275230973959, "global_step": 11495, "epoch": 96, "lr": 9.418154110218559e-05} +{"train_loss": 0.005007399246096611, "global_step": 11496, "epoch": 96, "lr": 9.418050379191367e-05} +{"train_loss": 0.007975421845912933, "global_step": 11497, "epoch": 96, "lr": 9.417946639489808e-05} +{"train_loss": 0.006308624055236578, "global_step": 11498, "epoch": 96, "lr": 9.417842891114081e-05} +{"train_loss": 0.010499972850084305, "global_step": 11499, "epoch": 96, "lr": 9.417739134064392e-05} +{"train_loss": 0.006876668892800808, "global_step": 11500, "epoch": 96, "lr": 9.417635368340942e-05} +{"train_loss": 0.00887182354927063, "global_step": 11501, "epoch": 96, "lr": 9.41753159394394e-05} +{"train_loss": 0.006981214974075556, "global_step": 11502, "epoch": 96, "lr": 9.417427810873585e-05} +{"train_loss": 0.006919119507074356, "global_step": 11503, "epoch": 96, "lr": 9.417324019130083e-05} +{"train_loss": 0.0065613361075520515, "global_step": 11504, "epoch": 96, "lr": 9.417220218713636e-05} +{"train_loss": 0.007328697945922613, "global_step": 11505, "epoch": 96, "lr": 9.417116409624452e-05} +{"train_loss": 0.0066769784316420555, "global_step": 11506, "epoch": 96, "lr": 9.417012591862728e-05} +{"train_loss": 0.006439424119889736, "global_step": 11507, "epoch": 96, "lr": 9.416908765428674e-05} +{"train_loss": 0.007165574934333563, "global_step": 11508, "epoch": 96, "lr": 9.416804930322491e-05} +{"train_loss": 0.00823195930570364, "global_step": 11509, "epoch": 96, "lr": 9.416701086544383e-05} +{"train_loss": 0.007379155606031418, "global_step": 11510, "epoch": 96, "lr": 9.416597234094556e-05} +{"train_loss": 0.007067161146551371, "global_step": 11511, "epoch": 96, "lr": 9.41649337297321e-05} +{"train_loss": 0.006648375652730465, "global_step": 11512, "epoch": 96, "lr": 9.416389503180552e-05} +{"train_loss": 0.005329147446900606, "global_step": 11513, "epoch": 96, "lr": 9.416285624716785e-05} +{"train_loss": 0.006423157174140215, "global_step": 11514, "epoch": 96, "lr": 9.416181737582113e-05} +{"train_loss": 0.009910741820931435, "global_step": 11515, "epoch": 96, "lr": 9.41607784177674e-05} +{"train_loss": 0.008562578819692135, "global_step": 11516, "epoch": 96, "lr": 9.415973937300869e-05} +{"train_loss": 0.008423371240496635, "global_step": 11517, "epoch": 96, "lr": 9.415870024154705e-05} +{"train_loss": 0.007813653908669949, "global_step": 11518, "epoch": 96, "lr": 9.415766102338453e-05} +{"train_loss": 0.00836566835641861, "global_step": 11519, "epoch": 96, "lr": 9.415662171852318e-05} +{"train_loss": 0.006395888514816761, "global_step": 11520, "epoch": 96, "lr": 9.415558232696499e-05} +{"train_loss": 0.00867263600230217, "global_step": 11521, "epoch": 96, "lr": 9.415454284871203e-05} +{"train_loss": 0.00766063341870904, "global_step": 11522, "epoch": 96, "lr": 9.415350328376635e-05} +{"train_loss": 0.005236638709902763, "global_step": 11523, "epoch": 96, "lr": 9.415246363212999e-05} +{"train_loss": 0.008013946004211903, "global_step": 11524, "epoch": 96, "lr": 9.415142389380499e-05} +{"train_loss": 0.01220409944653511, "global_step": 11525, "epoch": 96, "lr": 9.415038406879337e-05} +{"train_loss": 0.008609343320131302, "global_step": 11526, "epoch": 96, "lr": 9.41493441570972e-05} +{"train_loss": 0.014566445723176003, "global_step": 11527, "epoch": 96, "lr": 9.41483041587185e-05} +{"train_loss": 0.012120658531785011, "global_step": 11528, "epoch": 96, "lr": 9.414726407365932e-05} +{"train_loss": 0.00779235502704978, "global_step": 11529, "epoch": 96, "lr": 9.414622390192172e-05} +{"train_loss": 0.009051205590367317, "global_step": 11530, "epoch": 96, "lr": 9.414518364350771e-05} +{"train_loss": 0.011002886109054089, "global_step": 11531, "epoch": 96, "lr": 9.414414329841934e-05} +{"train_loss": 0.012920870445668697, "global_step": 11532, "epoch": 96, "lr": 9.414310286665868e-05} +{"train_loss": 0.009968834929168224, "global_step": 11533, "epoch": 96, "lr": 9.414206234822774e-05} +{"train_loss": 0.007718220818787813, "global_step": 11534, "epoch": 96, "lr": 9.414102174312858e-05} +{"train_loss": 0.01055964920669794, "global_step": 11535, "epoch": 96, "lr": 9.413998105136326e-05} +{"train_loss": 0.008916561491787434, "global_step": 11536, "epoch": 96, "lr": 9.413894027293377e-05} +{"train_loss": 0.011792700737714767, "global_step": 11537, "epoch": 96, "lr": 9.413789940784221e-05} +{"train_loss": 0.008679894730448723, "global_step": 11538, "epoch": 96, "lr": 9.413685845609059e-05} +{"train_loss": 0.01111591700464487, "global_step": 11539, "epoch": 96, "lr": 9.413581741768097e-05} +{"train_loss": 0.008587113581597805, "global_step": 11540, "epoch": 96, "lr": 9.413477629261539e-05} +{"train_loss": 0.010178196243941784, "global_step": 11541, "epoch": 96, "lr": 9.413373508089587e-05} +{"train_loss": 0.00831635800745933, "global_step": 11542, "epoch": 96, "lr": 9.41326937825245e-05, "val_loss": 0.028564367443323135} +{"train_loss": 0.0107416408136487, "global_step": 11543, "epoch": 97, "lr": 9.413165239750327e-05} +{"train_loss": 0.006780931260436773, "global_step": 11544, "epoch": 97, "lr": 9.413061092583429e-05} +{"train_loss": 0.0066537028178572655, "global_step": 11545, "epoch": 97, "lr": 9.412956936751956e-05} +{"train_loss": 0.01082419790327549, "global_step": 11546, "epoch": 97, "lr": 9.412852772256113e-05} +{"train_loss": 0.009327654726803303, "global_step": 11547, "epoch": 97, "lr": 9.412748599096106e-05} +{"train_loss": 0.007659049239009619, "global_step": 11548, "epoch": 97, "lr": 9.412644417272138e-05} +{"train_loss": 0.008779129013419151, "global_step": 11549, "epoch": 97, "lr": 9.412540226784413e-05} +{"train_loss": 0.01045834831893444, "global_step": 11550, "epoch": 97, "lr": 9.412436027633137e-05} +{"train_loss": 0.009207090362906456, "global_step": 11551, "epoch": 97, "lr": 9.412331819818516e-05} +{"train_loss": 0.009055112488567829, "global_step": 11552, "epoch": 97, "lr": 9.412227603340751e-05} +{"train_loss": 0.011213007383048534, "global_step": 11553, "epoch": 97, "lr": 9.41212337820005e-05} +{"train_loss": 0.010252025909721851, "global_step": 11554, "epoch": 97, "lr": 9.412019144396615e-05} +{"train_loss": 0.007113699335604906, "global_step": 11555, "epoch": 97, "lr": 9.411914901930652e-05} +{"train_loss": 0.010708979330956936, "global_step": 11556, "epoch": 97, "lr": 9.411810650802366e-05} +{"train_loss": 0.008811911568045616, "global_step": 11557, "epoch": 97, "lr": 9.411706391011961e-05} +{"train_loss": 0.012580903246998787, "global_step": 11558, "epoch": 97, "lr": 9.41160212255964e-05} +{"train_loss": 0.007893706671893597, "global_step": 11559, "epoch": 97, "lr": 9.411497845445612e-05} +{"train_loss": 0.009504827670753002, "global_step": 11560, "epoch": 97, "lr": 9.411393559670078e-05} +{"train_loss": 0.012041633017361164, "global_step": 11561, "epoch": 97, "lr": 9.411289265233245e-05} +{"train_loss": 0.006147589068859816, "global_step": 11562, "epoch": 97, "lr": 9.411184962135315e-05} +{"train_loss": 0.007645890116691589, "global_step": 11563, "epoch": 97, "lr": 9.411080650376495e-05} +{"train_loss": 0.01044215727597475, "global_step": 11564, "epoch": 97, "lr": 9.41097632995699e-05} +{"train_loss": 0.01076455693691969, "global_step": 11565, "epoch": 97, "lr": 9.410872000877004e-05} +{"train_loss": 0.009733140468597412, "global_step": 11566, "epoch": 97, "lr": 9.410767663136743e-05} +{"train_loss": 0.011074322275817394, "global_step": 11567, "epoch": 97, "lr": 9.41066331673641e-05} +{"train_loss": 0.007801441475749016, "global_step": 11568, "epoch": 97, "lr": 9.410558961676212e-05} +{"train_loss": 0.009244900196790695, "global_step": 11569, "epoch": 97, "lr": 9.410454597956351e-05} +{"train_loss": 0.006794771179556847, "global_step": 11570, "epoch": 97, "lr": 9.410350225577034e-05} +{"train_loss": 0.007675345987081528, "global_step": 11571, "epoch": 97, "lr": 9.410245844538467e-05} +{"train_loss": 0.007478579878807068, "global_step": 11572, "epoch": 97, "lr": 9.410141454840851e-05} +{"train_loss": 0.00888143852353096, "global_step": 11573, "epoch": 97, "lr": 9.410037056484396e-05} +{"train_loss": 0.006326434202492237, "global_step": 11574, "epoch": 97, "lr": 9.409932649469302e-05} +{"train_loss": 0.008269595913589, "global_step": 11575, "epoch": 97, "lr": 9.409828233795779e-05} +{"train_loss": 0.013805575668811798, "global_step": 11576, "epoch": 97, "lr": 9.409723809464027e-05} +{"train_loss": 0.013403450138866901, "global_step": 11577, "epoch": 97, "lr": 9.409619376474255e-05} +{"train_loss": 0.010206318460404873, "global_step": 11578, "epoch": 97, "lr": 9.409514934826664e-05} +{"train_loss": 0.012114034034311771, "global_step": 11579, "epoch": 97, "lr": 9.409410484521463e-05} +{"train_loss": 0.007819971069693565, "global_step": 11580, "epoch": 97, "lr": 9.409306025558857e-05} +{"train_loss": 0.010395212098956108, "global_step": 11581, "epoch": 97, "lr": 9.409201557939049e-05} +{"train_loss": 0.009194868616759777, "global_step": 11582, "epoch": 97, "lr": 9.409097081662243e-05} +{"train_loss": 0.0073798950761556625, "global_step": 11583, "epoch": 97, "lr": 9.408992596728648e-05} +{"train_loss": 0.009737719781696796, "global_step": 11584, "epoch": 97, "lr": 9.408888103138467e-05} +{"train_loss": 0.008552000857889652, "global_step": 11585, "epoch": 97, "lr": 9.408783600891904e-05} +{"train_loss": 0.00837081577628851, "global_step": 11586, "epoch": 97, "lr": 9.408679089989165e-05} +{"train_loss": 0.012345215305685997, "global_step": 11587, "epoch": 97, "lr": 9.408574570430457e-05} +{"train_loss": 0.007045005448162556, "global_step": 11588, "epoch": 97, "lr": 9.408470042215984e-05} +{"train_loss": 0.007696120999753475, "global_step": 11589, "epoch": 97, "lr": 9.40836550534595e-05} +{"train_loss": 0.008199174888432026, "global_step": 11590, "epoch": 97, "lr": 9.408260959820561e-05} +{"train_loss": 0.0069031259045004845, "global_step": 11591, "epoch": 97, "lr": 9.408156405640023e-05} +{"train_loss": 0.007970888167619705, "global_step": 11592, "epoch": 97, "lr": 9.408051842804541e-05} +{"train_loss": 0.010577174834907055, "global_step": 11593, "epoch": 97, "lr": 9.407947271314321e-05} +{"train_loss": 0.010611498728394508, "global_step": 11594, "epoch": 97, "lr": 9.407842691169565e-05} +{"train_loss": 0.009043551050126553, "global_step": 11595, "epoch": 97, "lr": 9.407738102370484e-05} +{"train_loss": 0.010666634887456894, "global_step": 11596, "epoch": 97, "lr": 9.40763350491728e-05} +{"train_loss": 0.00809515081346035, "global_step": 11597, "epoch": 97, "lr": 9.407528898810157e-05} +{"train_loss": 0.006639515049755573, "global_step": 11598, "epoch": 97, "lr": 9.40742428404932e-05} +{"train_loss": 0.008700110018253326, "global_step": 11599, "epoch": 97, "lr": 9.407319660634979e-05} +{"train_loss": 0.010759217664599419, "global_step": 11600, "epoch": 97, "lr": 9.407215028567335e-05} +{"train_loss": 0.008504378609359264, "global_step": 11601, "epoch": 97, "lr": 9.407110387846596e-05} +{"train_loss": 0.008054936304688454, "global_step": 11602, "epoch": 97, "lr": 9.407005738472967e-05} +{"train_loss": 0.012838339433073997, "global_step": 11603, "epoch": 97, "lr": 9.406901080446653e-05} +{"train_loss": 0.011576859280467033, "global_step": 11604, "epoch": 97, "lr": 9.40679641376786e-05} +{"train_loss": 0.013079999014735222, "global_step": 11605, "epoch": 97, "lr": 9.406691738436791e-05} +{"train_loss": 0.0060333991423249245, "global_step": 11606, "epoch": 97, "lr": 9.406587054453655e-05} +{"train_loss": 0.007854091003537178, "global_step": 11607, "epoch": 97, "lr": 9.406482361818656e-05} +{"train_loss": 0.007515995763242245, "global_step": 11608, "epoch": 97, "lr": 9.406377660532e-05} +{"train_loss": 0.008620135486125946, "global_step": 11609, "epoch": 97, "lr": 9.406272950593891e-05} +{"train_loss": 0.0061471303924918175, "global_step": 11610, "epoch": 97, "lr": 9.406168232004537e-05} +{"train_loss": 0.007536770310252905, "global_step": 11611, "epoch": 97, "lr": 9.406063504764142e-05} +{"train_loss": 0.010160546749830246, "global_step": 11612, "epoch": 97, "lr": 9.405958768872912e-05} +{"train_loss": 0.00886159110814333, "global_step": 11613, "epoch": 97, "lr": 9.405854024331054e-05} +{"train_loss": 0.008756312541663647, "global_step": 11614, "epoch": 97, "lr": 9.40574927113877e-05} +{"train_loss": 0.011049470864236355, "global_step": 11615, "epoch": 97, "lr": 9.40564450929627e-05} +{"train_loss": 0.008882850408554077, "global_step": 11616, "epoch": 97, "lr": 9.405539738803756e-05} +{"train_loss": 0.01526225358247757, "global_step": 11617, "epoch": 97, "lr": 9.405434959661437e-05} +{"train_loss": 0.009645586833357811, "global_step": 11618, "epoch": 97, "lr": 9.405330171869516e-05} +{"train_loss": 0.0068845683708786964, "global_step": 11619, "epoch": 97, "lr": 9.405225375428199e-05} +{"train_loss": 0.009392520412802696, "global_step": 11620, "epoch": 97, "lr": 9.405120570337694e-05} +{"train_loss": 0.007891318760812283, "global_step": 11621, "epoch": 97, "lr": 9.405015756598204e-05} +{"train_loss": 0.007500466890633106, "global_step": 11622, "epoch": 97, "lr": 9.404910934209939e-05} +{"train_loss": 0.00938627403229475, "global_step": 11623, "epoch": 97, "lr": 9.4048061031731e-05} +{"train_loss": 0.00991684477776289, "global_step": 11624, "epoch": 97, "lr": 9.404701263487894e-05} +{"train_loss": 0.009914519265294075, "global_step": 11625, "epoch": 97, "lr": 9.404596415154529e-05} +{"train_loss": 0.009691878221929073, "global_step": 11626, "epoch": 97, "lr": 9.404491558173209e-05} +{"train_loss": 0.007301690522581339, "global_step": 11627, "epoch": 97, "lr": 9.404386692544141e-05} +{"train_loss": 0.008481464348733425, "global_step": 11628, "epoch": 97, "lr": 9.404281818267529e-05} +{"train_loss": 0.013137605041265488, "global_step": 11629, "epoch": 97, "lr": 9.40417693534358e-05} +{"train_loss": 0.00875262264162302, "global_step": 11630, "epoch": 97, "lr": 9.404072043772502e-05} +{"train_loss": 0.005250126589089632, "global_step": 11631, "epoch": 97, "lr": 9.403967143554498e-05} +{"train_loss": 0.004833207931369543, "global_step": 11632, "epoch": 97, "lr": 9.403862234689775e-05} +{"train_loss": 0.007989213801920414, "global_step": 11633, "epoch": 97, "lr": 9.403757317178539e-05} +{"train_loss": 0.006213081069290638, "global_step": 11634, "epoch": 97, "lr": 9.403652391020997e-05} +{"train_loss": 0.010174226015806198, "global_step": 11635, "epoch": 97, "lr": 9.403547456217352e-05} +{"train_loss": 0.006815474946051836, "global_step": 11636, "epoch": 97, "lr": 9.403442512767813e-05} +{"train_loss": 0.009927964769303799, "global_step": 11637, "epoch": 97, "lr": 9.403337560672584e-05} +{"train_loss": 0.00785170029848814, "global_step": 11638, "epoch": 97, "lr": 9.403232599931875e-05} +{"train_loss": 0.006976917386054993, "global_step": 11639, "epoch": 97, "lr": 9.403127630545887e-05} +{"train_loss": 0.01114135142415762, "global_step": 11640, "epoch": 97, "lr": 9.40302265251483e-05} +{"train_loss": 0.008698387071490288, "global_step": 11641, "epoch": 97, "lr": 9.402917665838907e-05} +{"train_loss": 0.004867983981966972, "global_step": 11642, "epoch": 97, "lr": 9.402812670518324e-05} +{"train_loss": 0.012863506563007832, "global_step": 11643, "epoch": 97, "lr": 9.40270766655329e-05} +{"train_loss": 0.011534925550222397, "global_step": 11644, "epoch": 97, "lr": 9.402602653944012e-05} +{"train_loss": 0.009337017312645912, "global_step": 11645, "epoch": 97, "lr": 9.402497632690693e-05} +{"train_loss": 0.012757806107401848, "global_step": 11646, "epoch": 97, "lr": 9.402392602793538e-05} +{"train_loss": 0.008800247684121132, "global_step": 11647, "epoch": 97, "lr": 9.402287564252758e-05} +{"train_loss": 0.007702928502112627, "global_step": 11648, "epoch": 97, "lr": 9.402182517068555e-05} +{"train_loss": 0.007537794765084982, "global_step": 11649, "epoch": 97, "lr": 9.402077461241138e-05} +{"train_loss": 0.005634305067360401, "global_step": 11650, "epoch": 97, "lr": 9.401972396770711e-05} +{"train_loss": 0.0071181380189955235, "global_step": 11651, "epoch": 97, "lr": 9.401867323657483e-05} +{"train_loss": 0.008385789580643177, "global_step": 11652, "epoch": 97, "lr": 9.401762241901657e-05} +{"train_loss": 0.010078750550746918, "global_step": 11653, "epoch": 97, "lr": 9.401657151503442e-05} +{"train_loss": 0.007320437580347061, "global_step": 11654, "epoch": 97, "lr": 9.401552052463045e-05} +{"train_loss": 0.007736620958894491, "global_step": 11655, "epoch": 97, "lr": 9.401446944780669e-05} +{"train_loss": 0.00798220094293356, "global_step": 11656, "epoch": 97, "lr": 9.401341828456522e-05} +{"train_loss": 0.009061254560947418, "global_step": 11657, "epoch": 97, "lr": 9.401236703490812e-05} +{"train_loss": 0.008281726390123367, "global_step": 11658, "epoch": 97, "lr": 9.401131569883742e-05} +{"train_loss": 0.012749911285936832, "global_step": 11659, "epoch": 97, "lr": 9.401026427635522e-05} +{"train_loss": 0.006150045897811651, "global_step": 11660, "epoch": 97, "lr": 9.400921276746356e-05} +{"train_loss": 0.009019918755448166, "global_step": 11661, "epoch": 97, "lr": 9.400816117216451e-05, "val_loss": 0.022390983998775482} +{"train_loss": 0.0088890315964818, "global_step": 11662, "epoch": 98, "lr": 9.400710949046014e-05} +{"train_loss": 0.008682620711624622, "global_step": 11663, "epoch": 98, "lr": 9.400605772235251e-05} +{"train_loss": 0.01406986266374588, "global_step": 11664, "epoch": 98, "lr": 9.400500586784369e-05} +{"train_loss": 0.008142984472215176, "global_step": 11665, "epoch": 98, "lr": 9.400395392693575e-05} +{"train_loss": 0.006191066931933165, "global_step": 11666, "epoch": 98, "lr": 9.400290189963073e-05} +{"train_loss": 0.011093897745013237, "global_step": 11667, "epoch": 98, "lr": 9.400184978593073e-05} +{"train_loss": 0.008905294351279736, "global_step": 11668, "epoch": 98, "lr": 9.40007975858378e-05} +{"train_loss": 0.007458691019564867, "global_step": 11669, "epoch": 98, "lr": 9.399974529935399e-05} +{"train_loss": 0.010604257695376873, "global_step": 11670, "epoch": 98, "lr": 9.399869292648137e-05} +{"train_loss": 0.01173464860767126, "global_step": 11671, "epoch": 98, "lr": 9.399764046722205e-05} +{"train_loss": 0.007717333734035492, "global_step": 11672, "epoch": 98, "lr": 9.399658792157805e-05} +{"train_loss": 0.00653783930465579, "global_step": 11673, "epoch": 98, "lr": 9.399553528955145e-05} +{"train_loss": 0.010819030925631523, "global_step": 11674, "epoch": 98, "lr": 9.399448257114432e-05} +{"train_loss": 0.012685819528996944, "global_step": 11675, "epoch": 98, "lr": 9.39934297663587e-05} +{"train_loss": 0.006621200125664473, "global_step": 11676, "epoch": 98, "lr": 9.39923768751967e-05} +{"train_loss": 0.01095294114202261, "global_step": 11677, "epoch": 98, "lr": 9.399132389766036e-05} +{"train_loss": 0.007419832516461611, "global_step": 11678, "epoch": 98, "lr": 9.399027083375179e-05} +{"train_loss": 0.010195184499025345, "global_step": 11679, "epoch": 98, "lr": 9.398921768347297e-05} +{"train_loss": 0.010747617110610008, "global_step": 11680, "epoch": 98, "lr": 9.398816444682605e-05} +{"train_loss": 0.00906143244355917, "global_step": 11681, "epoch": 98, "lr": 9.398711112381307e-05} +{"train_loss": 0.012487957254052162, "global_step": 11682, "epoch": 98, "lr": 9.39860577144361e-05} +{"train_loss": 0.009679792448878288, "global_step": 11683, "epoch": 98, "lr": 9.398500421869718e-05} +{"train_loss": 0.011826535686850548, "global_step": 11684, "epoch": 98, "lr": 9.398395063659842e-05} +{"train_loss": 0.0061509557999670506, "global_step": 11685, "epoch": 98, "lr": 9.398289696814187e-05} +{"train_loss": 0.007090780884027481, "global_step": 11686, "epoch": 98, "lr": 9.398184321332961e-05} +{"train_loss": 0.00812862254679203, "global_step": 11687, "epoch": 98, "lr": 9.398078937216368e-05} +{"train_loss": 0.00789237953722477, "global_step": 11688, "epoch": 98, "lr": 9.397973544464617e-05} +{"train_loss": 0.006210606079548597, "global_step": 11689, "epoch": 98, "lr": 9.397868143077917e-05} +{"train_loss": 0.006815725471824408, "global_step": 11690, "epoch": 98, "lr": 9.397762733056472e-05} +{"train_loss": 0.015041489154100418, "global_step": 11691, "epoch": 98, "lr": 9.397657314400488e-05} +{"train_loss": 0.010178878903388977, "global_step": 11692, "epoch": 98, "lr": 9.397551887110176e-05} +{"train_loss": 0.009707502089440823, "global_step": 11693, "epoch": 98, "lr": 9.397446451185738e-05} +{"train_loss": 0.009094630368053913, "global_step": 11694, "epoch": 98, "lr": 9.397341006627387e-05} +{"train_loss": 0.007634047418832779, "global_step": 11695, "epoch": 98, "lr": 9.397235553435323e-05} +{"train_loss": 0.010169485583901405, "global_step": 11696, "epoch": 98, "lr": 9.397130091609761e-05} +{"train_loss": 0.010649513453245163, "global_step": 11697, "epoch": 98, "lr": 9.397024621150901e-05} +{"train_loss": 0.010079937987029552, "global_step": 11698, "epoch": 98, "lr": 9.396919142058952e-05} +{"train_loss": 0.008474557660520077, "global_step": 11699, "epoch": 98, "lr": 9.396813654334124e-05} +{"train_loss": 0.010051456280052662, "global_step": 11700, "epoch": 98, "lr": 9.396708157976622e-05} +{"train_loss": 0.008168069645762444, "global_step": 11701, "epoch": 98, "lr": 9.396602652986653e-05} +{"train_loss": 0.007636765483766794, "global_step": 11702, "epoch": 98, "lr": 9.396497139364424e-05} +{"train_loss": 0.0107331657782197, "global_step": 11703, "epoch": 98, "lr": 9.396391617110144e-05} +{"train_loss": 0.011803348548710346, "global_step": 11704, "epoch": 98, "lr": 9.396286086224018e-05} +{"train_loss": 0.005046656355261803, "global_step": 11705, "epoch": 98, "lr": 9.396180546706253e-05} +{"train_loss": 0.0075789038091897964, "global_step": 11706, "epoch": 98, "lr": 9.396074998557057e-05} +{"train_loss": 0.0069855256006121635, "global_step": 11707, "epoch": 98, "lr": 9.395969441776637e-05} +{"train_loss": 0.012926328927278519, "global_step": 11708, "epoch": 98, "lr": 9.395863876365202e-05} +{"train_loss": 0.006478294264525175, "global_step": 11709, "epoch": 98, "lr": 9.395758302322958e-05} +{"train_loss": 0.009210710413753986, "global_step": 11710, "epoch": 98, "lr": 9.395652719650111e-05} +{"train_loss": 0.00573516683652997, "global_step": 11711, "epoch": 98, "lr": 9.395547128346872e-05} +{"train_loss": 0.011297790333628654, "global_step": 11712, "epoch": 98, "lr": 9.395441528413445e-05} +{"train_loss": 0.009176265448331833, "global_step": 11713, "epoch": 98, "lr": 9.395335919850037e-05} +{"train_loss": 0.011209869757294655, "global_step": 11714, "epoch": 98, "lr": 9.395230302656856e-05} +{"train_loss": 0.011044549755752087, "global_step": 11715, "epoch": 98, "lr": 9.395124676834111e-05} +{"train_loss": 0.009585685096681118, "global_step": 11716, "epoch": 98, "lr": 9.395019042382007e-05} +{"train_loss": 0.00932164303958416, "global_step": 11717, "epoch": 98, "lr": 9.394913399300753e-05} +{"train_loss": 0.007567239925265312, "global_step": 11718, "epoch": 98, "lr": 9.394807747590558e-05} +{"train_loss": 0.007516194600611925, "global_step": 11719, "epoch": 98, "lr": 9.394702087251625e-05} +{"train_loss": 0.009217165410518646, "global_step": 11720, "epoch": 98, "lr": 9.394596418284165e-05} +{"train_loss": 0.014284689910709858, "global_step": 11721, "epoch": 98, "lr": 9.394490740688384e-05} +{"train_loss": 0.010952910408377647, "global_step": 11722, "epoch": 98, "lr": 9.394385054464492e-05} +{"train_loss": 0.011736595071852207, "global_step": 11723, "epoch": 98, "lr": 9.394279359612693e-05} +{"train_loss": 0.006547410506755114, "global_step": 11724, "epoch": 98, "lr": 9.394173656133193e-05} +{"train_loss": 0.009091883897781372, "global_step": 11725, "epoch": 98, "lr": 9.394067944026207e-05} +{"train_loss": 0.008790571242570877, "global_step": 11726, "epoch": 98, "lr": 9.393962223291936e-05} +{"train_loss": 0.00580904446542263, "global_step": 11727, "epoch": 98, "lr": 9.39385649393059e-05} +{"train_loss": 0.00941169448196888, "global_step": 11728, "epoch": 98, "lr": 9.393750755942376e-05} +{"train_loss": 0.012627781368792057, "global_step": 11729, "epoch": 98, "lr": 9.393645009327502e-05} +{"train_loss": 0.009388785809278488, "global_step": 11730, "epoch": 98, "lr": 9.393539254086174e-05} +{"train_loss": 0.007184809073805809, "global_step": 11731, "epoch": 98, "lr": 9.393433490218603e-05} +{"train_loss": 0.011498553678393364, "global_step": 11732, "epoch": 98, "lr": 9.393327717724994e-05} +{"train_loss": 0.007327960338443518, "global_step": 11733, "epoch": 98, "lr": 9.393221936605556e-05} +{"train_loss": 0.009332505986094475, "global_step": 11734, "epoch": 98, "lr": 9.393116146860494e-05} +{"train_loss": 0.010805980302393436, "global_step": 11735, "epoch": 98, "lr": 9.393010348490022e-05} +{"train_loss": 0.008456621319055557, "global_step": 11736, "epoch": 98, "lr": 9.392904541494339e-05} +{"train_loss": 0.006927134469151497, "global_step": 11737, "epoch": 98, "lr": 9.392798725873659e-05} +{"train_loss": 0.008918941020965576, "global_step": 11738, "epoch": 98, "lr": 9.392692901628188e-05} +{"train_loss": 0.00824805535376072, "global_step": 11739, "epoch": 98, "lr": 9.392587068758134e-05} +{"train_loss": 0.006209736689925194, "global_step": 11740, "epoch": 98, "lr": 9.392481227263704e-05} +{"train_loss": 0.012729517184197903, "global_step": 11741, "epoch": 98, "lr": 9.392375377145106e-05} +{"train_loss": 0.006953692529350519, "global_step": 11742, "epoch": 98, "lr": 9.39226951840255e-05} +{"train_loss": 0.007541140541434288, "global_step": 11743, "epoch": 98, "lr": 9.392163651036241e-05} +{"train_loss": 0.01216689869761467, "global_step": 11744, "epoch": 98, "lr": 9.392057775046388e-05} +{"train_loss": 0.009992263279855251, "global_step": 11745, "epoch": 98, "lr": 9.391951890433199e-05} +{"train_loss": 0.006119086407124996, "global_step": 11746, "epoch": 98, "lr": 9.39184599719688e-05} +{"train_loss": 0.007161386776715517, "global_step": 11747, "epoch": 98, "lr": 9.391740095337642e-05} +{"train_loss": 0.008752233348786831, "global_step": 11748, "epoch": 98, "lr": 9.391634184855691e-05} +{"train_loss": 0.008355557918548584, "global_step": 11749, "epoch": 98, "lr": 9.391528265751237e-05} +{"train_loss": 0.009334652684628963, "global_step": 11750, "epoch": 98, "lr": 9.391422338024485e-05} +{"train_loss": 0.01210729405283928, "global_step": 11751, "epoch": 98, "lr": 9.391316401675646e-05} +{"train_loss": 0.009797899052500725, "global_step": 11752, "epoch": 98, "lr": 9.391210456704924e-05} +{"train_loss": 0.011518174782395363, "global_step": 11753, "epoch": 98, "lr": 9.39110450311253e-05} +{"train_loss": 0.00831611268222332, "global_step": 11754, "epoch": 98, "lr": 9.390998540898672e-05} +{"train_loss": 0.010675440542399883, "global_step": 11755, "epoch": 98, "lr": 9.390892570063558e-05} +{"train_loss": 0.005130648612976074, "global_step": 11756, "epoch": 98, "lr": 9.390786590607394e-05} +{"train_loss": 0.011613872833549976, "global_step": 11757, "epoch": 98, "lr": 9.39068060253039e-05} +{"train_loss": 0.00817391462624073, "global_step": 11758, "epoch": 98, "lr": 9.390574605832755e-05} +{"train_loss": 0.006513682194054127, "global_step": 11759, "epoch": 98, "lr": 9.390468600514695e-05} +{"train_loss": 0.009706291370093822, "global_step": 11760, "epoch": 98, "lr": 9.39036258657642e-05} +{"train_loss": 0.011552756652235985, "global_step": 11761, "epoch": 98, "lr": 9.390256564018135e-05} +{"train_loss": 0.008257947862148285, "global_step": 11762, "epoch": 98, "lr": 9.390150532840052e-05} +{"train_loss": 0.010075954720377922, "global_step": 11763, "epoch": 98, "lr": 9.390044493042375e-05} +{"train_loss": 0.007359763607382774, "global_step": 11764, "epoch": 98, "lr": 9.389938444625318e-05} +{"train_loss": 0.008819019421935081, "global_step": 11765, "epoch": 98, "lr": 9.389832387589084e-05} +{"train_loss": 0.015587856061756611, "global_step": 11766, "epoch": 98, "lr": 9.389726321933883e-05} +{"train_loss": 0.009916151873767376, "global_step": 11767, "epoch": 98, "lr": 9.389620247659925e-05} +{"train_loss": 0.009192146360874176, "global_step": 11768, "epoch": 98, "lr": 9.389514164767415e-05} +{"train_loss": 0.006546837743371725, "global_step": 11769, "epoch": 98, "lr": 9.389408073256563e-05} +{"train_loss": 0.007843557745218277, "global_step": 11770, "epoch": 98, "lr": 9.389301973127578e-05} +{"train_loss": 0.010095660574734211, "global_step": 11771, "epoch": 98, "lr": 9.389195864380667e-05} +{"train_loss": 0.008832952938973904, "global_step": 11772, "epoch": 98, "lr": 9.389089747016037e-05} +{"train_loss": 0.008036710321903229, "global_step": 11773, "epoch": 98, "lr": 9.3889836210339e-05} +{"train_loss": 0.011050776578485966, "global_step": 11774, "epoch": 98, "lr": 9.388877486434464e-05} +{"train_loss": 0.008465850725769997, "global_step": 11775, "epoch": 98, "lr": 9.388771343217935e-05} +{"train_loss": 0.007532801479101181, "global_step": 11776, "epoch": 98, "lr": 9.38866519138452e-05} +{"train_loss": 0.007973091676831245, "global_step": 11777, "epoch": 98, "lr": 9.388559030934432e-05} +{"train_loss": 0.011405057273805141, "global_step": 11778, "epoch": 98, "lr": 9.388452861867876e-05} +{"train_loss": 0.009985966607928276, "global_step": 11779, "epoch": 98, "lr": 9.388346684185063e-05} +{"train_loss": 0.0092065502779887, "global_step": 11780, "epoch": 98, "lr": 9.3882404978862e-05, "val_loss": 0.012708557769656181} +{"train_loss": 0.010828808881342411, "global_step": 11781, "epoch": 99, "lr": 9.388134302971495e-05} +{"train_loss": 0.008729551918804646, "global_step": 11782, "epoch": 99, "lr": 9.388028099441158e-05} +{"train_loss": 0.007606100756675005, "global_step": 11783, "epoch": 99, "lr": 9.387921887295394e-05} +{"train_loss": 0.006680003367364407, "global_step": 11784, "epoch": 99, "lr": 9.387815666534416e-05} +{"train_loss": 0.004931194707751274, "global_step": 11785, "epoch": 99, "lr": 9.387709437158431e-05} +{"train_loss": 0.007674266118556261, "global_step": 11786, "epoch": 99, "lr": 9.387603199167647e-05} +{"train_loss": 0.00893374066799879, "global_step": 11787, "epoch": 99, "lr": 9.387496952562274e-05} +{"train_loss": 0.007715015206485987, "global_step": 11788, "epoch": 99, "lr": 9.387390697342517e-05} +{"train_loss": 0.009579341858625412, "global_step": 11789, "epoch": 99, "lr": 9.38728443350859e-05} +{"train_loss": 0.007620485965162516, "global_step": 11790, "epoch": 99, "lr": 9.387178161060696e-05} +{"train_loss": 0.0047354199923574924, "global_step": 11791, "epoch": 99, "lr": 9.387071879999047e-05} +{"train_loss": 0.006614362820982933, "global_step": 11792, "epoch": 99, "lr": 9.386965590323853e-05} +{"train_loss": 0.006011635530740023, "global_step": 11793, "epoch": 99, "lr": 9.38685929203532e-05} +{"train_loss": 0.008627485483884811, "global_step": 11794, "epoch": 99, "lr": 9.386752985133655e-05} +{"train_loss": 0.009531861171126366, "global_step": 11795, "epoch": 99, "lr": 9.386646669619071e-05} +{"train_loss": 0.009859144687652588, "global_step": 11796, "epoch": 99, "lr": 9.386540345491775e-05} +{"train_loss": 0.01002228632569313, "global_step": 11797, "epoch": 99, "lr": 9.386434012751976e-05} +{"train_loss": 0.007758373394608498, "global_step": 11798, "epoch": 99, "lr": 9.386327671399882e-05} +{"train_loss": 0.007101519964635372, "global_step": 11799, "epoch": 99, "lr": 9.386221321435702e-05} +{"train_loss": 0.0061920988373458385, "global_step": 11800, "epoch": 99, "lr": 9.386114962859645e-05} +{"train_loss": 0.012457545846700668, "global_step": 11801, "epoch": 99, "lr": 9.38600859567192e-05} +{"train_loss": 0.009767821989953518, "global_step": 11802, "epoch": 99, "lr": 9.385902219872735e-05} +{"train_loss": 0.008126482367515564, "global_step": 11803, "epoch": 99, "lr": 9.385795835462301e-05} +{"train_loss": 0.01075535174459219, "global_step": 11804, "epoch": 99, "lr": 9.385689442440825e-05} +{"train_loss": 0.008603550493717194, "global_step": 11805, "epoch": 99, "lr": 9.385583040808515e-05} +{"train_loss": 0.006926859263330698, "global_step": 11806, "epoch": 99, "lr": 9.385476630565583e-05} +{"train_loss": 0.009114685468375683, "global_step": 11807, "epoch": 99, "lr": 9.385370211712236e-05} +{"train_loss": 0.007088103797286749, "global_step": 11808, "epoch": 99, "lr": 9.385263784248682e-05} +{"train_loss": 0.008725475519895554, "global_step": 11809, "epoch": 99, "lr": 9.385157348175131e-05} +{"train_loss": 0.009050247259438038, "global_step": 11810, "epoch": 99, "lr": 9.385050903491793e-05} +{"train_loss": 0.007845270447432995, "global_step": 11811, "epoch": 99, "lr": 9.384944450198875e-05} +{"train_loss": 0.00964702945202589, "global_step": 11812, "epoch": 99, "lr": 9.384837988296589e-05} +{"train_loss": 0.008513013832271099, "global_step": 11813, "epoch": 99, "lr": 9.38473151778514e-05} +{"train_loss": 0.00944194570183754, "global_step": 11814, "epoch": 99, "lr": 9.38462503866474e-05} +{"train_loss": 0.0066267275251448154, "global_step": 11815, "epoch": 99, "lr": 9.384518550935597e-05} +{"train_loss": 0.006913994438946247, "global_step": 11816, "epoch": 99, "lr": 9.38441205459792e-05} +{"train_loss": 0.00789460726082325, "global_step": 11817, "epoch": 99, "lr": 9.384305549651918e-05} +{"train_loss": 0.008109981194138527, "global_step": 11818, "epoch": 99, "lr": 9.384199036097801e-05} +{"train_loss": 0.006815249565988779, "global_step": 11819, "epoch": 99, "lr": 9.384092513935778e-05} +{"train_loss": 0.007514480501413345, "global_step": 11820, "epoch": 99, "lr": 9.383985983166058e-05} +{"train_loss": 0.009224209934473038, "global_step": 11821, "epoch": 99, "lr": 9.383879443788849e-05} +{"train_loss": 0.00990801490843296, "global_step": 11822, "epoch": 99, "lr": 9.383772895804362e-05} +{"train_loss": 0.008507473394274712, "global_step": 11823, "epoch": 99, "lr": 9.383666339212804e-05} +{"train_loss": 0.007961263880133629, "global_step": 11824, "epoch": 99, "lr": 9.383559774014385e-05} +{"train_loss": 0.0094308378174901, "global_step": 11825, "epoch": 99, "lr": 9.383453200209316e-05} +{"train_loss": 0.008863983675837517, "global_step": 11826, "epoch": 99, "lr": 9.383346617797805e-05} +{"train_loss": 0.006909030023962259, "global_step": 11827, "epoch": 99, "lr": 9.38324002678006e-05} +{"train_loss": 0.007558948360383511, "global_step": 11828, "epoch": 99, "lr": 9.383133427156292e-05} +{"train_loss": 0.010045981965959072, "global_step": 11829, "epoch": 99, "lr": 9.383026818926711e-05} +{"train_loss": 0.011040379293262959, "global_step": 11830, "epoch": 99, "lr": 9.382920202091524e-05} +{"train_loss": 0.007494928780943155, "global_step": 11831, "epoch": 99, "lr": 9.382813576650941e-05} +{"train_loss": 0.013586793094873428, "global_step": 11832, "epoch": 99, "lr": 9.382706942605172e-05} +{"train_loss": 0.005989209283143282, "global_step": 11833, "epoch": 99, "lr": 9.382600299954428e-05} +{"train_loss": 0.009609369561076164, "global_step": 11834, "epoch": 99, "lr": 9.382493648698914e-05} +{"train_loss": 0.008454634808003902, "global_step": 11835, "epoch": 99, "lr": 9.382386988838844e-05} +{"train_loss": 0.010268520563840866, "global_step": 11836, "epoch": 99, "lr": 9.382280320374423e-05} +{"train_loss": 0.010784360580146313, "global_step": 11837, "epoch": 99, "lr": 9.382173643305865e-05} +{"train_loss": 0.0062081459909677505, "global_step": 11838, "epoch": 99, "lr": 9.382066957633377e-05} +{"train_loss": 0.00838361494243145, "global_step": 11839, "epoch": 99, "lr": 9.381960263357168e-05} +{"train_loss": 0.009031053632497787, "global_step": 11840, "epoch": 99, "lr": 9.381853560477447e-05} +{"train_loss": 0.00765477167442441, "global_step": 11841, "epoch": 99, "lr": 9.381746848994427e-05} +{"train_loss": 0.006775119807571173, "global_step": 11842, "epoch": 99, "lr": 9.381640128908314e-05} +{"train_loss": 0.013625452294945717, "global_step": 11843, "epoch": 99, "lr": 9.381533400219318e-05} +{"train_loss": 0.011294678784906864, "global_step": 11844, "epoch": 99, "lr": 9.38142666292765e-05} +{"train_loss": 0.010453427210450172, "global_step": 11845, "epoch": 99, "lr": 9.38131991703352e-05} +{"train_loss": 0.008779305964708328, "global_step": 11846, "epoch": 99, "lr": 9.381213162537134e-05} +{"train_loss": 0.007913472130894661, "global_step": 11847, "epoch": 99, "lr": 9.381106399438706e-05} +{"train_loss": 0.006608875934034586, "global_step": 11848, "epoch": 99, "lr": 9.380999627738443e-05} +{"train_loss": 0.008829353377223015, "global_step": 11849, "epoch": 99, "lr": 9.380892847436555e-05} +{"train_loss": 0.009906741790473461, "global_step": 11850, "epoch": 99, "lr": 9.380786058533252e-05} +{"train_loss": 0.010760328732430935, "global_step": 11851, "epoch": 99, "lr": 9.380679261028744e-05} +{"train_loss": 0.009941129945218563, "global_step": 11852, "epoch": 99, "lr": 9.38057245492324e-05} +{"train_loss": 0.010092425160109997, "global_step": 11853, "epoch": 99, "lr": 9.380465640216949e-05} +{"train_loss": 0.00963317509740591, "global_step": 11854, "epoch": 99, "lr": 9.380358816910084e-05} +{"train_loss": 0.01286519505083561, "global_step": 11855, "epoch": 99, "lr": 9.38025198500285e-05} +{"train_loss": 0.008082769811153412, "global_step": 11856, "epoch": 99, "lr": 9.38014514449546e-05} +{"train_loss": 0.010466763749718666, "global_step": 11857, "epoch": 99, "lr": 9.380038295388124e-05} +{"train_loss": 0.006836016196757555, "global_step": 11858, "epoch": 99, "lr": 9.37993143768105e-05} +{"train_loss": 0.009774777106940746, "global_step": 11859, "epoch": 99, "lr": 9.379824571374448e-05} +{"train_loss": 0.006817806512117386, "global_step": 11860, "epoch": 99, "lr": 9.379717696468528e-05} +{"train_loss": 0.007526194676756859, "global_step": 11861, "epoch": 99, "lr": 9.379610812963501e-05} +{"train_loss": 0.0047617461532354355, "global_step": 11862, "epoch": 99, "lr": 9.379503920859578e-05} +{"train_loss": 0.016614487394690514, "global_step": 11863, "epoch": 99, "lr": 9.379397020156965e-05} +{"train_loss": 0.008876721374690533, "global_step": 11864, "epoch": 99, "lr": 9.379290110855874e-05} +{"train_loss": 0.008617664687335491, "global_step": 11865, "epoch": 99, "lr": 9.379183192956514e-05} +{"train_loss": 0.008875170722603798, "global_step": 11866, "epoch": 99, "lr": 9.379076266459097e-05} +{"train_loss": 0.007622522301971912, "global_step": 11867, "epoch": 99, "lr": 9.37896933136383e-05} +{"train_loss": 0.009497100487351418, "global_step": 11868, "epoch": 99, "lr": 9.378862387670926e-05} +{"train_loss": 0.009751115925610065, "global_step": 11869, "epoch": 99, "lr": 9.378755435380593e-05} +{"train_loss": 0.006949700880795717, "global_step": 11870, "epoch": 99, "lr": 9.378648474493042e-05} +{"train_loss": 0.01159131620079279, "global_step": 11871, "epoch": 99, "lr": 9.37854150500848e-05} +{"train_loss": 0.011080584488809109, "global_step": 11872, "epoch": 99, "lr": 9.378434526927122e-05} +{"train_loss": 0.007985315285623074, "global_step": 11873, "epoch": 99, "lr": 9.378327540249175e-05} +{"train_loss": 0.006510888691991568, "global_step": 11874, "epoch": 99, "lr": 9.37822054497485e-05} +{"train_loss": 0.013261403888463974, "global_step": 11875, "epoch": 99, "lr": 9.378113541104356e-05} +{"train_loss": 0.014040373265743256, "global_step": 11876, "epoch": 99, "lr": 9.378006528637905e-05} +{"train_loss": 0.009742498397827148, "global_step": 11877, "epoch": 99, "lr": 9.377899507575705e-05} +{"train_loss": 0.012455468066036701, "global_step": 11878, "epoch": 99, "lr": 9.377792477917967e-05} +{"train_loss": 0.010508488863706589, "global_step": 11879, "epoch": 99, "lr": 9.377685439664902e-05} +{"train_loss": 0.010798614472150803, "global_step": 11880, "epoch": 99, "lr": 9.377578392816719e-05} +{"train_loss": 0.0064687649719417095, "global_step": 11881, "epoch": 99, "lr": 9.377471337373626e-05} +{"train_loss": 0.010223179124295712, "global_step": 11882, "epoch": 99, "lr": 9.377364273335838e-05} +{"train_loss": 0.009439453482627869, "global_step": 11883, "epoch": 99, "lr": 9.377257200703565e-05} +{"train_loss": 0.009588080458343029, "global_step": 11884, "epoch": 99, "lr": 9.377150119477011e-05} +{"train_loss": 0.013044340535998344, "global_step": 11885, "epoch": 99, "lr": 9.377043029656393e-05} +{"train_loss": 0.008191372267901897, "global_step": 11886, "epoch": 99, "lr": 9.376935931241916e-05} +{"train_loss": 0.009822525084018707, "global_step": 11887, "epoch": 99, "lr": 9.376828824233797e-05} +{"train_loss": 0.006629714276641607, "global_step": 11888, "epoch": 99, "lr": 9.376721708632239e-05} +{"train_loss": 0.00843197014182806, "global_step": 11889, "epoch": 99, "lr": 9.376614584437456e-05} +{"train_loss": 0.008696074597537518, "global_step": 11890, "epoch": 99, "lr": 9.376507451649659e-05} +{"train_loss": 0.011560863815248013, "global_step": 11891, "epoch": 99, "lr": 9.376400310269055e-05} +{"train_loss": 0.012582293711602688, "global_step": 11892, "epoch": 99, "lr": 9.37629316029586e-05} +{"train_loss": 0.009924954734742641, "global_step": 11893, "epoch": 99, "lr": 9.376186001730279e-05} +{"train_loss": 0.008820224553346634, "global_step": 11894, "epoch": 99, "lr": 9.376078834572523e-05} +{"train_loss": 0.008859529159963131, "global_step": 11895, "epoch": 99, "lr": 9.375971658822805e-05} +{"train_loss": 0.011896362528204918, "global_step": 11896, "epoch": 99, "lr": 9.375864474481336e-05} +{"train_loss": 0.008944688364863396, "global_step": 11897, "epoch": 99, "lr": 9.37575728154832e-05} +{"train_loss": 0.00816259067505598, "global_step": 11898, "epoch": 99, "lr": 9.375650080023977e-05} +{"train_loss": 0.008989296626581364, "global_step": 11899, "epoch": 99, "lr": 9.375542869908509e-05, "val_loss": 0.017420824617147446} +{"train_loss": 0.010880948044359684, "global_step": 11900, "epoch": 100, "lr": 9.375435651202132e-05} +{"train_loss": 0.008877696469426155, "global_step": 11901, "epoch": 100, "lr": 9.375328423905053e-05} +{"train_loss": 0.007991190999746323, "global_step": 11902, "epoch": 100, "lr": 9.375221188017484e-05} +{"train_loss": 0.009505105204880238, "global_step": 11903, "epoch": 100, "lr": 9.375113943539638e-05} +{"train_loss": 0.010388887487351894, "global_step": 11904, "epoch": 100, "lr": 9.375006690471721e-05} +{"train_loss": 0.007738668471574783, "global_step": 11905, "epoch": 100, "lr": 9.374899428813948e-05} +{"train_loss": 0.010380717925727367, "global_step": 11906, "epoch": 100, "lr": 9.374792158566525e-05} +{"train_loss": 0.011599253863096237, "global_step": 11907, "epoch": 100, "lr": 9.374684879729666e-05} +{"train_loss": 0.008483164943754673, "global_step": 11908, "epoch": 100, "lr": 9.374577592303579e-05} +{"train_loss": 0.007423324976116419, "global_step": 11909, "epoch": 100, "lr": 9.374470296288479e-05} +{"train_loss": 0.007997545413672924, "global_step": 11910, "epoch": 100, "lr": 9.374362991684574e-05} +{"train_loss": 0.007535035256296396, "global_step": 11911, "epoch": 100, "lr": 9.374255678492072e-05} +{"train_loss": 0.009551716968417168, "global_step": 11912, "epoch": 100, "lr": 9.374148356711187e-05} +{"train_loss": 0.008063409477472305, "global_step": 11913, "epoch": 100, "lr": 9.374041026342129e-05} +{"train_loss": 0.00784565880894661, "global_step": 11914, "epoch": 100, "lr": 9.37393368738511e-05} +{"train_loss": 0.0075047817081213, "global_step": 11915, "epoch": 100, "lr": 9.373826339840339e-05} +{"train_loss": 0.00616243714466691, "global_step": 11916, "epoch": 100, "lr": 9.373718983708026e-05} +{"train_loss": 0.009879359975457191, "global_step": 11917, "epoch": 100, "lr": 9.373611618988384e-05} +{"train_loss": 0.006746172904968262, "global_step": 11918, "epoch": 100, "lr": 9.373504245681623e-05} +{"train_loss": 0.008337367326021194, "global_step": 11919, "epoch": 100, "lr": 9.373396863787955e-05} +{"train_loss": 0.008009694516658783, "global_step": 11920, "epoch": 100, "lr": 9.373289473307587e-05} +{"train_loss": 0.014171228744089603, "global_step": 11921, "epoch": 100, "lr": 9.373182074240733e-05} +{"train_loss": 0.008267974480986595, "global_step": 11922, "epoch": 100, "lr": 9.373074666587605e-05} +{"train_loss": 0.00532871950417757, "global_step": 11923, "epoch": 100, "lr": 9.37296725034841e-05} +{"train_loss": 0.006794381886720657, "global_step": 11924, "epoch": 100, "lr": 9.372859825523361e-05} +{"train_loss": 0.006309778895229101, "global_step": 11925, "epoch": 100, "lr": 9.37275239211267e-05} +{"train_loss": 0.008622520603239536, "global_step": 11926, "epoch": 100, "lr": 9.372644950116547e-05} +{"train_loss": 0.01136555802077055, "global_step": 11927, "epoch": 100, "lr": 9.3725374995352e-05} +{"train_loss": 0.006874100770801306, "global_step": 11928, "epoch": 100, "lr": 9.372430040368847e-05} +{"train_loss": 0.005231371149420738, "global_step": 11929, "epoch": 100, "lr": 9.372322572617694e-05} +{"train_loss": 0.008221948519349098, "global_step": 11930, "epoch": 100, "lr": 9.37221509628195e-05} +{"train_loss": 0.008248472586274147, "global_step": 11931, "epoch": 100, "lr": 9.37210761136183e-05} +{"train_loss": 0.008592462167143822, "global_step": 11932, "epoch": 100, "lr": 9.372000117857544e-05} +{"train_loss": 0.009686163626611233, "global_step": 11933, "epoch": 100, "lr": 9.371892615769302e-05} +{"train_loss": 0.0064436523243784904, "global_step": 11934, "epoch": 100, "lr": 9.371785105097317e-05} +{"train_loss": 0.0078263645991683, "global_step": 11935, "epoch": 100, "lr": 9.3716775858418e-05} +{"train_loss": 0.007405412849038839, "global_step": 11936, "epoch": 100, "lr": 9.371570058002958e-05} +{"train_loss": 0.009658437222242355, "global_step": 11937, "epoch": 100, "lr": 9.371462521581008e-05} +{"train_loss": 0.011007171124219894, "global_step": 11938, "epoch": 100, "lr": 9.371354976576158e-05} +{"train_loss": 0.00863555446267128, "global_step": 11939, "epoch": 100, "lr": 9.371247422988618e-05} +{"train_loss": 0.006928311660885811, "global_step": 11940, "epoch": 100, "lr": 9.371139860818603e-05} +{"train_loss": 0.009338664822280407, "global_step": 11941, "epoch": 100, "lr": 9.37103229006632e-05} +{"train_loss": 0.011282983236014843, "global_step": 11942, "epoch": 100, "lr": 9.370924710731982e-05} +{"train_loss": 0.011920825578272343, "global_step": 11943, "epoch": 100, "lr": 9.3708171228158e-05} +{"train_loss": 0.007849571295082569, "global_step": 11944, "epoch": 100, "lr": 9.370709526317986e-05} +{"train_loss": 0.011554209515452385, "global_step": 11945, "epoch": 100, "lr": 9.370601921238753e-05} +{"train_loss": 0.007912282831966877, "global_step": 11946, "epoch": 100, "lr": 9.370494307578308e-05} +{"train_loss": 0.009793996810913086, "global_step": 11947, "epoch": 100, "lr": 9.370386685336865e-05} +{"train_loss": 0.010742543265223503, "global_step": 11948, "epoch": 100, "lr": 9.370279054514633e-05} +{"train_loss": 0.009075159206986427, "global_step": 11949, "epoch": 100, "lr": 9.370171415111826e-05} +{"train_loss": 0.008406921289861202, "global_step": 11950, "epoch": 100, "lr": 9.370063767128656e-05} +{"train_loss": 0.011717889457941055, "global_step": 11951, "epoch": 100, "lr": 9.36995611056533e-05} +{"train_loss": 0.005976016167551279, "global_step": 11952, "epoch": 100, "lr": 9.369848445422063e-05} +{"train_loss": 0.007038240320980549, "global_step": 11953, "epoch": 100, "lr": 9.369740771699067e-05} +{"train_loss": 0.009574877098202705, "global_step": 11954, "epoch": 100, "lr": 9.36963308939655e-05} +{"train_loss": 0.005876060109585524, "global_step": 11955, "epoch": 100, "lr": 9.369525398514726e-05} +{"train_loss": 0.007608754560351372, "global_step": 11956, "epoch": 100, "lr": 9.369417699053806e-05} +{"train_loss": 0.00970920454710722, "global_step": 11957, "epoch": 100, "lr": 9.369309991013999e-05} +{"train_loss": 0.006781361065804958, "global_step": 11958, "epoch": 100, "lr": 9.369202274395521e-05} +{"train_loss": 0.005472404882311821, "global_step": 11959, "epoch": 100, "lr": 9.36909454919858e-05} +{"train_loss": 0.008429745212197304, "global_step": 11960, "epoch": 100, "lr": 9.368986815423389e-05} +{"train_loss": 0.009146901778876781, "global_step": 11961, "epoch": 100, "lr": 9.36887907307016e-05} +{"train_loss": 0.010426436550915241, "global_step": 11962, "epoch": 100, "lr": 9.368771322139103e-05} +{"train_loss": 0.007216639816761017, "global_step": 11963, "epoch": 100, "lr": 9.368663562630429e-05} +{"train_loss": 0.00787908211350441, "global_step": 11964, "epoch": 100, "lr": 9.368555794544352e-05} +{"train_loss": 0.009213405661284924, "global_step": 11965, "epoch": 100, "lr": 9.368448017881082e-05} +{"train_loss": 0.009274902753531933, "global_step": 11966, "epoch": 100, "lr": 9.36834023264083e-05} +{"train_loss": 0.008253100328147411, "global_step": 11967, "epoch": 100, "lr": 9.368232438823812e-05} +{"train_loss": 0.008442468009889126, "global_step": 11968, "epoch": 100, "lr": 9.368124636430233e-05} +{"train_loss": 0.008622984401881695, "global_step": 11969, "epoch": 100, "lr": 9.368016825460309e-05} +{"train_loss": 0.008488801307976246, "global_step": 11970, "epoch": 100, "lr": 9.367909005914251e-05} +{"train_loss": 0.00832226499915123, "global_step": 11971, "epoch": 100, "lr": 9.36780117779227e-05} +{"train_loss": 0.008590570650994778, "global_step": 11972, "epoch": 100, "lr": 9.367693341094579e-05} +{"train_loss": 0.007194464560598135, "global_step": 11973, "epoch": 100, "lr": 9.367585495821387e-05} +{"train_loss": 0.008275289088487625, "global_step": 11974, "epoch": 100, "lr": 9.367477641972909e-05} +{"train_loss": 0.010189501568675041, "global_step": 11975, "epoch": 100, "lr": 9.367369779549354e-05} +{"train_loss": 0.010276436805725098, "global_step": 11976, "epoch": 100, "lr": 9.367261908550936e-05} +{"train_loss": 0.0069613950327038765, "global_step": 11977, "epoch": 100, "lr": 9.367154028977865e-05} +{"train_loss": 0.0071477219462394714, "global_step": 11978, "epoch": 100, "lr": 9.367046140830355e-05} +{"train_loss": 0.012513888068497181, "global_step": 11979, "epoch": 100, "lr": 9.366938244108615e-05} +{"train_loss": 0.006029317155480385, "global_step": 11980, "epoch": 100, "lr": 9.366830338812858e-05} +{"train_loss": 0.006691641174256802, "global_step": 11981, "epoch": 100, "lr": 9.366722424943297e-05} +{"train_loss": 0.0058088647201657295, "global_step": 11982, "epoch": 100, "lr": 9.366614502500144e-05} +{"train_loss": 0.003572282148525119, "global_step": 11983, "epoch": 100, "lr": 9.366506571483608e-05} +{"train_loss": 0.007264568470418453, "global_step": 11984, "epoch": 100, "lr": 9.366398631893904e-05} +{"train_loss": 0.007975202985107899, "global_step": 11985, "epoch": 100, "lr": 9.366290683731242e-05} +{"train_loss": 0.005346393678337336, "global_step": 11986, "epoch": 100, "lr": 9.366182726995836e-05} +{"train_loss": 0.011290653608739376, "global_step": 11987, "epoch": 100, "lr": 9.366074761687895e-05} +{"train_loss": 0.007464869413524866, "global_step": 11988, "epoch": 100, "lr": 9.365966787807634e-05} +{"train_loss": 0.0075926766730844975, "global_step": 11989, "epoch": 100, "lr": 9.365858805355263e-05} +{"train_loss": 0.006605817470699549, "global_step": 11990, "epoch": 100, "lr": 9.365750814330996e-05} +{"train_loss": 0.011254635639488697, "global_step": 11991, "epoch": 100, "lr": 9.365642814735042e-05} +{"train_loss": 0.010205245576798916, "global_step": 11992, "epoch": 100, "lr": 9.365534806567615e-05} +{"train_loss": 0.008437985554337502, "global_step": 11993, "epoch": 100, "lr": 9.365426789828927e-05} +{"train_loss": 0.007161045912653208, "global_step": 11994, "epoch": 100, "lr": 9.36531876451919e-05} +{"train_loss": 0.0038897099439054728, "global_step": 11995, "epoch": 100, "lr": 9.365210730638617e-05} +{"train_loss": 0.009505472145974636, "global_step": 11996, "epoch": 100, "lr": 9.365102688187417e-05} +{"train_loss": 0.010514085181057453, "global_step": 11997, "epoch": 100, "lr": 9.364994637165805e-05} +{"train_loss": 0.009515817277133465, "global_step": 11998, "epoch": 100, "lr": 9.364886577573993e-05} +{"train_loss": 0.010192740708589554, "global_step": 11999, "epoch": 100, "lr": 9.364778509412191e-05} +{"train_loss": 0.007203106302767992, "global_step": 12000, "epoch": 100, "lr": 9.364670432680615e-05} +{"train_loss": 0.006641203071922064, "global_step": 12001, "epoch": 100, "lr": 9.364562347379473e-05} +{"train_loss": 0.004869495518505573, "global_step": 12002, "epoch": 100, "lr": 9.364454253508981e-05} +{"train_loss": 0.008257423527538776, "global_step": 12003, "epoch": 100, "lr": 9.364346151069347e-05} +{"train_loss": 0.007068099919706583, "global_step": 12004, "epoch": 100, "lr": 9.364238040060786e-05} +{"train_loss": 0.008803065866231918, "global_step": 12005, "epoch": 100, "lr": 9.364129920483511e-05} +{"train_loss": 0.006819093134254217, "global_step": 12006, "epoch": 100, "lr": 9.364021792337733e-05} +{"train_loss": 0.008885040879249573, "global_step": 12007, "epoch": 100, "lr": 9.363913655623664e-05} +{"train_loss": 0.006562570575624704, "global_step": 12008, "epoch": 100, "lr": 9.363805510341517e-05} +{"train_loss": 0.008910308592021465, "global_step": 12009, "epoch": 100, "lr": 9.363697356491504e-05} +{"train_loss": 0.006318078842014074, "global_step": 12010, "epoch": 100, "lr": 9.363589194073838e-05} +{"train_loss": 0.010128509253263474, "global_step": 12011, "epoch": 100, "lr": 9.36348102308873e-05} +{"train_loss": 0.006270323880016804, "global_step": 12012, "epoch": 100, "lr": 9.363372843536394e-05} +{"train_loss": 0.009557058103382587, "global_step": 12013, "epoch": 100, "lr": 9.36326465541704e-05} +{"train_loss": 0.008655935525894165, "global_step": 12014, "epoch": 100, "lr": 9.363156458730884e-05} +{"train_loss": 0.006066512782126665, "global_step": 12015, "epoch": 100, "lr": 9.363048253478135e-05} +{"train_loss": 0.00806244183331728, "global_step": 12016, "epoch": 100, "lr": 9.362940039659008e-05} +{"train_loss": 0.007978486828505993, "global_step": 12017, "epoch": 100, "lr": 9.362831817273713e-05} +{"train_loss": 0.0083059363161065, "global_step": 12018, "epoch": 100, "lr": 9.362723586322464e-05, "val_loss": 0.013764174655079842, "train_action_mse_error": 0.0002841046079993248} +{"train_loss": 0.007781689986586571, "global_step": 12019, "epoch": 101, "lr": 9.362615346805474e-05} +{"train_loss": 0.0067909108474850655, "global_step": 12020, "epoch": 101, "lr": 9.362507098722955e-05} +{"train_loss": 0.0052222334779798985, "global_step": 12021, "epoch": 101, "lr": 9.362398842075119e-05} +{"train_loss": 0.009236683137714863, "global_step": 12022, "epoch": 101, "lr": 9.362290576862179e-05} +{"train_loss": 0.005784324835985899, "global_step": 12023, "epoch": 101, "lr": 9.362182303084349e-05} +{"train_loss": 0.006145216058939695, "global_step": 12024, "epoch": 101, "lr": 9.362074020741836e-05} +{"train_loss": 0.007517803926020861, "global_step": 12025, "epoch": 101, "lr": 9.36196572983486e-05} +{"train_loss": 0.006779830902814865, "global_step": 12026, "epoch": 101, "lr": 9.36185743036363e-05} +{"train_loss": 0.0066205658949911594, "global_step": 12027, "epoch": 101, "lr": 9.361749122328359e-05} +{"train_loss": 0.009640703909099102, "global_step": 12028, "epoch": 101, "lr": 9.361640805729258e-05} +{"train_loss": 0.010320570319890976, "global_step": 12029, "epoch": 101, "lr": 9.361532480566541e-05} +{"train_loss": 0.008831271901726723, "global_step": 12030, "epoch": 101, "lr": 9.361424146840423e-05} +{"train_loss": 0.006420730613172054, "global_step": 12031, "epoch": 101, "lr": 9.361315804551114e-05} +{"train_loss": 0.004954556934535503, "global_step": 12032, "epoch": 101, "lr": 9.361207453698829e-05} +{"train_loss": 0.008576950989663601, "global_step": 12033, "epoch": 101, "lr": 9.361099094283776e-05} +{"train_loss": 0.007216485217213631, "global_step": 12034, "epoch": 101, "lr": 9.360990726306172e-05} +{"train_loss": 0.008678756654262543, "global_step": 12035, "epoch": 101, "lr": 9.360882349766229e-05} +{"train_loss": 0.006613908335566521, "global_step": 12036, "epoch": 101, "lr": 9.36077396466416e-05} +{"train_loss": 0.009647167287766933, "global_step": 12037, "epoch": 101, "lr": 9.360665571000176e-05} +{"train_loss": 0.009137360379099846, "global_step": 12038, "epoch": 101, "lr": 9.360557168774491e-05} +{"train_loss": 0.01085477415472269, "global_step": 12039, "epoch": 101, "lr": 9.360448757987318e-05} +{"train_loss": 0.010634041391313076, "global_step": 12040, "epoch": 101, "lr": 9.360340338638868e-05} +{"train_loss": 0.00601131422445178, "global_step": 12041, "epoch": 101, "lr": 9.360231910729358e-05} +{"train_loss": 0.006934520322829485, "global_step": 12042, "epoch": 101, "lr": 9.360123474258999e-05} +{"train_loss": 0.012961635366082191, "global_step": 12043, "epoch": 101, "lr": 9.360015029228002e-05} +{"train_loss": 0.01158842071890831, "global_step": 12044, "epoch": 101, "lr": 9.359906575636582e-05} +{"train_loss": 0.008298988454043865, "global_step": 12045, "epoch": 101, "lr": 9.35979811348495e-05} +{"train_loss": 0.012492661364376545, "global_step": 12046, "epoch": 101, "lr": 9.359689642773322e-05} +{"train_loss": 0.006999878212809563, "global_step": 12047, "epoch": 101, "lr": 9.359581163501908e-05} +{"train_loss": 0.008314373902976513, "global_step": 12048, "epoch": 101, "lr": 9.359472675670923e-05} +{"train_loss": 0.008373922668397427, "global_step": 12049, "epoch": 101, "lr": 9.359364179280579e-05} +{"train_loss": 0.014401163905858994, "global_step": 12050, "epoch": 101, "lr": 9.359255674331087e-05} +{"train_loss": 0.009140918962657452, "global_step": 12051, "epoch": 101, "lr": 9.359147160822664e-05} +{"train_loss": 0.009721262380480766, "global_step": 12052, "epoch": 101, "lr": 9.359038638755521e-05} +{"train_loss": 0.009202806279063225, "global_step": 12053, "epoch": 101, "lr": 9.358930108129871e-05} +{"train_loss": 0.006040969397872686, "global_step": 12054, "epoch": 101, "lr": 9.35882156894593e-05} +{"train_loss": 0.01120831724256277, "global_step": 12055, "epoch": 101, "lr": 9.358713021203905e-05} +{"train_loss": 0.010652485303580761, "global_step": 12056, "epoch": 101, "lr": 9.358604464904014e-05} +{"train_loss": 0.013947810977697372, "global_step": 12057, "epoch": 101, "lr": 9.358495900046468e-05} +{"train_loss": 0.008623930625617504, "global_step": 12058, "epoch": 101, "lr": 9.358387326631483e-05} +{"train_loss": 0.009175109677016735, "global_step": 12059, "epoch": 101, "lr": 9.358278744659267e-05} +{"train_loss": 0.0068940394558012486, "global_step": 12060, "epoch": 101, "lr": 9.358170154130039e-05} +{"train_loss": 0.012122880667448044, "global_step": 12061, "epoch": 101, "lr": 9.358061555044008e-05} +{"train_loss": 0.007157320622354746, "global_step": 12062, "epoch": 101, "lr": 9.35795294740139e-05} +{"train_loss": 0.011918876320123672, "global_step": 12063, "epoch": 101, "lr": 9.357844331202396e-05} +{"train_loss": 0.0075022815726697445, "global_step": 12064, "epoch": 101, "lr": 9.357735706447242e-05} +{"train_loss": 0.009037557058036327, "global_step": 12065, "epoch": 101, "lr": 9.357627073136137e-05} +{"train_loss": 0.009443116374313831, "global_step": 12066, "epoch": 101, "lr": 9.357518431269298e-05} +{"train_loss": 0.011317187920212746, "global_step": 12067, "epoch": 101, "lr": 9.357409780846937e-05} +{"train_loss": 0.007427281700074673, "global_step": 12068, "epoch": 101, "lr": 9.357301121869268e-05} +{"train_loss": 0.009910198859870434, "global_step": 12069, "epoch": 101, "lr": 9.357192454336503e-05} +{"train_loss": 0.010384726338088512, "global_step": 12070, "epoch": 101, "lr": 9.357083778248857e-05} +{"train_loss": 0.007358960807323456, "global_step": 12071, "epoch": 101, "lr": 9.356975093606542e-05} +{"train_loss": 0.009173846803605556, "global_step": 12072, "epoch": 101, "lr": 9.35686640040977e-05} +{"train_loss": 0.008726421743631363, "global_step": 12073, "epoch": 101, "lr": 9.356757698658758e-05} +{"train_loss": 0.007976378314197063, "global_step": 12074, "epoch": 101, "lr": 9.356648988353718e-05} +{"train_loss": 0.008388347923755646, "global_step": 12075, "epoch": 101, "lr": 9.356540269494862e-05} +{"train_loss": 0.007048805709928274, "global_step": 12076, "epoch": 101, "lr": 9.356431542082405e-05} +{"train_loss": 0.010352488607168198, "global_step": 12077, "epoch": 101, "lr": 9.356322806116561e-05} +{"train_loss": 0.007512343116104603, "global_step": 12078, "epoch": 101, "lr": 9.356214061597542e-05} +{"train_loss": 0.00810122862458229, "global_step": 12079, "epoch": 101, "lr": 9.356105308525563e-05} +{"train_loss": 0.006087176967412233, "global_step": 12080, "epoch": 101, "lr": 9.355996546900835e-05} +{"train_loss": 0.009999683126807213, "global_step": 12081, "epoch": 101, "lr": 9.355887776723573e-05} +{"train_loss": 0.008253457024693489, "global_step": 12082, "epoch": 101, "lr": 9.355778997993992e-05} +{"train_loss": 0.008671597577631474, "global_step": 12083, "epoch": 101, "lr": 9.355670210712303e-05} +{"train_loss": 0.0081555200740695, "global_step": 12084, "epoch": 101, "lr": 9.355561414878721e-05} +{"train_loss": 0.005995059385895729, "global_step": 12085, "epoch": 101, "lr": 9.355452610493462e-05} +{"train_loss": 0.008259475231170654, "global_step": 12086, "epoch": 101, "lr": 9.355343797556734e-05} +{"train_loss": 0.0069370330311357975, "global_step": 12087, "epoch": 101, "lr": 9.355234976068756e-05} +{"train_loss": 0.010814153589308262, "global_step": 12088, "epoch": 101, "lr": 9.355126146029738e-05} +{"train_loss": 0.010438356548547745, "global_step": 12089, "epoch": 101, "lr": 9.355017307439897e-05} +{"train_loss": 0.006461849436163902, "global_step": 12090, "epoch": 101, "lr": 9.354908460299443e-05} +{"train_loss": 0.00751187140122056, "global_step": 12091, "epoch": 101, "lr": 9.35479960460859e-05} +{"train_loss": 0.007373647298663855, "global_step": 12092, "epoch": 101, "lr": 9.354690740367557e-05} +{"train_loss": 0.006116871722042561, "global_step": 12093, "epoch": 101, "lr": 9.354581867576551e-05} +{"train_loss": 0.00609636539593339, "global_step": 12094, "epoch": 101, "lr": 9.35447298623579e-05} +{"train_loss": 0.007946196012198925, "global_step": 12095, "epoch": 101, "lr": 9.354364096345487e-05} +{"train_loss": 0.010118929669260979, "global_step": 12096, "epoch": 101, "lr": 9.354255197905855e-05} +{"train_loss": 0.010155169293284416, "global_step": 12097, "epoch": 101, "lr": 9.354146290917107e-05} +{"train_loss": 0.008892144076526165, "global_step": 12098, "epoch": 101, "lr": 9.354037375379459e-05} +{"train_loss": 0.009816951118409634, "global_step": 12099, "epoch": 101, "lr": 9.353928451293121e-05} +{"train_loss": 0.007693133316934109, "global_step": 12100, "epoch": 101, "lr": 9.353819518658313e-05} +{"train_loss": 0.007814919576048851, "global_step": 12101, "epoch": 101, "lr": 9.353710577475244e-05} +{"train_loss": 0.008339369669556618, "global_step": 12102, "epoch": 101, "lr": 9.35360162774413e-05} +{"train_loss": 0.0071760197170078754, "global_step": 12103, "epoch": 101, "lr": 9.353492669465184e-05} +{"train_loss": 0.008419403806328773, "global_step": 12104, "epoch": 101, "lr": 9.35338370263862e-05} +{"train_loss": 0.00848254095762968, "global_step": 12105, "epoch": 101, "lr": 9.353274727264654e-05} +{"train_loss": 0.004244986921548843, "global_step": 12106, "epoch": 101, "lr": 9.353165743343496e-05} +{"train_loss": 0.0071821920573711395, "global_step": 12107, "epoch": 101, "lr": 9.353056750875363e-05} +{"train_loss": 0.009077074006199837, "global_step": 12108, "epoch": 101, "lr": 9.352947749860468e-05} +{"train_loss": 0.005806146189570427, "global_step": 12109, "epoch": 101, "lr": 9.352838740299026e-05} +{"train_loss": 0.008175050839781761, "global_step": 12110, "epoch": 101, "lr": 9.352729722191249e-05} +{"train_loss": 0.007473126519471407, "global_step": 12111, "epoch": 101, "lr": 9.352620695537353e-05} +{"train_loss": 0.00661150086671114, "global_step": 12112, "epoch": 101, "lr": 9.352511660337551e-05} +{"train_loss": 0.007607028353959322, "global_step": 12113, "epoch": 101, "lr": 9.352402616592057e-05} +{"train_loss": 0.007433885708451271, "global_step": 12114, "epoch": 101, "lr": 9.352293564301084e-05} +{"train_loss": 0.008292263373732567, "global_step": 12115, "epoch": 101, "lr": 9.35218450346485e-05} +{"train_loss": 0.006131237838417292, "global_step": 12116, "epoch": 101, "lr": 9.352075434083566e-05} +{"train_loss": 0.00817984901368618, "global_step": 12117, "epoch": 101, "lr": 9.351966356157447e-05} +{"train_loss": 0.010052679106593132, "global_step": 12118, "epoch": 101, "lr": 9.351857269686706e-05} +{"train_loss": 0.00944259762763977, "global_step": 12119, "epoch": 101, "lr": 9.351748174671559e-05} +{"train_loss": 0.006155182607471943, "global_step": 12120, "epoch": 101, "lr": 9.351639071112219e-05} +{"train_loss": 0.009207240305840969, "global_step": 12121, "epoch": 101, "lr": 9.351529959008901e-05} +{"train_loss": 0.010007143020629883, "global_step": 12122, "epoch": 101, "lr": 9.35142083836182e-05} +{"train_loss": 0.00586834317073226, "global_step": 12123, "epoch": 101, "lr": 9.351311709171187e-05} +{"train_loss": 0.010430104099214077, "global_step": 12124, "epoch": 101, "lr": 9.351202571437218e-05} +{"train_loss": 0.006663287524133921, "global_step": 12125, "epoch": 101, "lr": 9.351093425160128e-05} +{"train_loss": 0.00919341016560793, "global_step": 12126, "epoch": 101, "lr": 9.350984270340133e-05} +{"train_loss": 0.006900136359035969, "global_step": 12127, "epoch": 101, "lr": 9.350875106977443e-05} +{"train_loss": 0.011784356087446213, "global_step": 12128, "epoch": 101, "lr": 9.350765935072277e-05} +{"train_loss": 0.006835597567260265, "global_step": 12129, "epoch": 101, "lr": 9.350656754624845e-05} +{"train_loss": 0.008069354109466076, "global_step": 12130, "epoch": 101, "lr": 9.350547565635363e-05} +{"train_loss": 0.00822991319000721, "global_step": 12131, "epoch": 101, "lr": 9.350438368104046e-05} +{"train_loss": 0.006621779408305883, "global_step": 12132, "epoch": 101, "lr": 9.350329162031109e-05} +{"train_loss": 0.00715927267447114, "global_step": 12133, "epoch": 101, "lr": 9.350219947416764e-05} +{"train_loss": 0.004876861814409494, "global_step": 12134, "epoch": 101, "lr": 9.350110724261228e-05} +{"train_loss": 0.00900547206401825, "global_step": 12135, "epoch": 101, "lr": 9.350001492564713e-05} +{"train_loss": 0.005636562593281269, "global_step": 12136, "epoch": 101, "lr": 9.349892252327436e-05} +{"train_loss": 0.008333383057610829, "global_step": 12137, "epoch": 101, "lr": 9.349783003549611e-05, "val_loss": 0.015593649819493294} +{"train_loss": 0.006386494264006615, "global_step": 12138, "epoch": 102, "lr": 9.349673746231448e-05} +{"train_loss": 0.006632461212575436, "global_step": 12139, "epoch": 102, "lr": 9.34956448037317e-05} +{"train_loss": 0.010999788530170918, "global_step": 12140, "epoch": 102, "lr": 9.349455205974984e-05} +{"train_loss": 0.006611058954149485, "global_step": 12141, "epoch": 102, "lr": 9.349345923037108e-05} +{"train_loss": 0.010129678063094616, "global_step": 12142, "epoch": 102, "lr": 9.349236631559757e-05} +{"train_loss": 0.006318599916994572, "global_step": 12143, "epoch": 102, "lr": 9.349127331543143e-05} +{"train_loss": 0.006277950014919043, "global_step": 12144, "epoch": 102, "lr": 9.349018022987484e-05} +{"train_loss": 0.005488111637532711, "global_step": 12145, "epoch": 102, "lr": 9.348908705892992e-05} +{"train_loss": 0.007294303737580776, "global_step": 12146, "epoch": 102, "lr": 9.34879938025988e-05} +{"train_loss": 0.010705730877816677, "global_step": 12147, "epoch": 102, "lr": 9.348690046088367e-05} +{"train_loss": 0.009400201961398125, "global_step": 12148, "epoch": 102, "lr": 9.348580703378666e-05} +{"train_loss": 0.011210291646420956, "global_step": 12149, "epoch": 102, "lr": 9.348471352130991e-05} +{"train_loss": 0.007154760416597128, "global_step": 12150, "epoch": 102, "lr": 9.348361992345557e-05} +{"train_loss": 0.005415888968855143, "global_step": 12151, "epoch": 102, "lr": 9.348252624022579e-05} +{"train_loss": 0.007579806260764599, "global_step": 12152, "epoch": 102, "lr": 9.34814324716227e-05} +{"train_loss": 0.008174230344593525, "global_step": 12153, "epoch": 102, "lr": 9.34803386176485e-05} +{"train_loss": 0.009448385797441006, "global_step": 12154, "epoch": 102, "lr": 9.347924467830526e-05} +{"train_loss": 0.0061773741617798805, "global_step": 12155, "epoch": 102, "lr": 9.347815065359519e-05} +{"train_loss": 0.008671930059790611, "global_step": 12156, "epoch": 102, "lr": 9.347705654352041e-05} +{"train_loss": 0.007973924279212952, "global_step": 12157, "epoch": 102, "lr": 9.347596234808307e-05} +{"train_loss": 0.0071814521215856075, "global_step": 12158, "epoch": 102, "lr": 9.347486806728532e-05} +{"train_loss": 0.005040072835981846, "global_step": 12159, "epoch": 102, "lr": 9.347377370112933e-05} +{"train_loss": 0.00756329670548439, "global_step": 12160, "epoch": 102, "lr": 9.347267924961721e-05} +{"train_loss": 0.01013975776731968, "global_step": 12161, "epoch": 102, "lr": 9.347158471275114e-05} +{"train_loss": 0.00834638997912407, "global_step": 12162, "epoch": 102, "lr": 9.347049009053326e-05} +{"train_loss": 0.006532339379191399, "global_step": 12163, "epoch": 102, "lr": 9.34693953829657e-05} +{"train_loss": 0.010354649275541306, "global_step": 12164, "epoch": 102, "lr": 9.346830059005065e-05} +{"train_loss": 0.008634654805064201, "global_step": 12165, "epoch": 102, "lr": 9.346720571179022e-05} +{"train_loss": 0.010065286420285702, "global_step": 12166, "epoch": 102, "lr": 9.346611074818657e-05} +{"train_loss": 0.006454567424952984, "global_step": 12167, "epoch": 102, "lr": 9.346501569924186e-05} +{"train_loss": 0.008163278922438622, "global_step": 12168, "epoch": 102, "lr": 9.346392056495826e-05} +{"train_loss": 0.008029980584979057, "global_step": 12169, "epoch": 102, "lr": 9.346282534533787e-05} +{"train_loss": 0.009723919443786144, "global_step": 12170, "epoch": 102, "lr": 9.346173004038286e-05} +{"train_loss": 0.00785645842552185, "global_step": 12171, "epoch": 102, "lr": 9.34606346500954e-05} +{"train_loss": 0.009479207918047905, "global_step": 12172, "epoch": 102, "lr": 9.345953917447762e-05} +{"train_loss": 0.007166377268731594, "global_step": 12173, "epoch": 102, "lr": 9.345844361353169e-05} +{"train_loss": 0.009047186002135277, "global_step": 12174, "epoch": 102, "lr": 9.345734796725974e-05} +{"train_loss": 0.007227146532386541, "global_step": 12175, "epoch": 102, "lr": 9.345625223566392e-05} +{"train_loss": 0.006791365798562765, "global_step": 12176, "epoch": 102, "lr": 9.345515641874641e-05} +{"train_loss": 0.007878725416958332, "global_step": 12177, "epoch": 102, "lr": 9.345406051650933e-05} +{"train_loss": 0.008046140894293785, "global_step": 12178, "epoch": 102, "lr": 9.345296452895486e-05} +{"train_loss": 0.00931534729897976, "global_step": 12179, "epoch": 102, "lr": 9.345186845608512e-05} +{"train_loss": 0.008806108497083187, "global_step": 12180, "epoch": 102, "lr": 9.345077229790229e-05} +{"train_loss": 0.005910276900976896, "global_step": 12181, "epoch": 102, "lr": 9.344967605440849e-05} +{"train_loss": 0.010808323509991169, "global_step": 12182, "epoch": 102, "lr": 9.344857972560592e-05} +{"train_loss": 0.006611279211938381, "global_step": 12183, "epoch": 102, "lr": 9.344748331149669e-05} +{"train_loss": 0.00693358713760972, "global_step": 12184, "epoch": 102, "lr": 9.344638681208297e-05} +{"train_loss": 0.007398655638098717, "global_step": 12185, "epoch": 102, "lr": 9.344529022736692e-05} +{"train_loss": 0.0067522646859288216, "global_step": 12186, "epoch": 102, "lr": 9.344419355735067e-05} +{"train_loss": 0.006292418111115694, "global_step": 12187, "epoch": 102, "lr": 9.344309680203639e-05} +{"train_loss": 0.008697371929883957, "global_step": 12188, "epoch": 102, "lr": 9.344199996142625e-05} +{"train_loss": 0.007744662929326296, "global_step": 12189, "epoch": 102, "lr": 9.344090303552235e-05} +{"train_loss": 0.008767012506723404, "global_step": 12190, "epoch": 102, "lr": 9.34398060243269e-05} +{"train_loss": 0.009642571210861206, "global_step": 12191, "epoch": 102, "lr": 9.343870892784203e-05} +{"train_loss": 0.00656708050519228, "global_step": 12192, "epoch": 102, "lr": 9.343761174606989e-05} +{"train_loss": 0.010244985111057758, "global_step": 12193, "epoch": 102, "lr": 9.343651447901265e-05} +{"train_loss": 0.007630792446434498, "global_step": 12194, "epoch": 102, "lr": 9.343541712667244e-05} +{"train_loss": 0.006103988271206617, "global_step": 12195, "epoch": 102, "lr": 9.343431968905144e-05} +{"train_loss": 0.007474357727915049, "global_step": 12196, "epoch": 102, "lr": 9.343322216615179e-05} +{"train_loss": 0.00804232433438301, "global_step": 12197, "epoch": 102, "lr": 9.343212455797565e-05} +{"train_loss": 0.006378831807523966, "global_step": 12198, "epoch": 102, "lr": 9.343102686452517e-05} +{"train_loss": 0.00981102418154478, "global_step": 12199, "epoch": 102, "lr": 9.342992908580252e-05} +{"train_loss": 0.008267012424767017, "global_step": 12200, "epoch": 102, "lr": 9.342883122180983e-05} +{"train_loss": 0.00962742604315281, "global_step": 12201, "epoch": 102, "lr": 9.342773327254927e-05} +{"train_loss": 0.004272044636309147, "global_step": 12202, "epoch": 102, "lr": 9.3426635238023e-05} +{"train_loss": 0.008428008295595646, "global_step": 12203, "epoch": 102, "lr": 9.342553711823317e-05} +{"train_loss": 0.007978682406246662, "global_step": 12204, "epoch": 102, "lr": 9.342443891318194e-05} +{"train_loss": 0.005087102763354778, "global_step": 12205, "epoch": 102, "lr": 9.342334062287146e-05} +{"train_loss": 0.011427456513047218, "global_step": 12206, "epoch": 102, "lr": 9.34222422473039e-05} +{"train_loss": 0.007439026143401861, "global_step": 12207, "epoch": 102, "lr": 9.342114378648139e-05} +{"train_loss": 0.006121732760220766, "global_step": 12208, "epoch": 102, "lr": 9.34200452404061e-05} +{"train_loss": 0.006624704226851463, "global_step": 12209, "epoch": 102, "lr": 9.341894660908022e-05} +{"train_loss": 0.013878141529858112, "global_step": 12210, "epoch": 102, "lr": 9.341784789250584e-05} +{"train_loss": 0.010395071469247341, "global_step": 12211, "epoch": 102, "lr": 9.341674909068518e-05} +{"train_loss": 0.01143520139157772, "global_step": 12212, "epoch": 102, "lr": 9.341565020362037e-05} +{"train_loss": 0.012827279977500439, "global_step": 12213, "epoch": 102, "lr": 9.341455123131355e-05} +{"train_loss": 0.006772743072360754, "global_step": 12214, "epoch": 102, "lr": 9.341345217376692e-05} +{"train_loss": 0.004806225188076496, "global_step": 12215, "epoch": 102, "lr": 9.34123530309826e-05} +{"train_loss": 0.006577140185981989, "global_step": 12216, "epoch": 102, "lr": 9.341125380296277e-05} +{"train_loss": 0.010245513170957565, "global_step": 12217, "epoch": 102, "lr": 9.341015448970957e-05} +{"train_loss": 0.011794189922511578, "global_step": 12218, "epoch": 102, "lr": 9.340905509122519e-05} +{"train_loss": 0.005994140636175871, "global_step": 12219, "epoch": 102, "lr": 9.340795560751175e-05} +{"train_loss": 0.008416394703090191, "global_step": 12220, "epoch": 102, "lr": 9.340685603857143e-05} +{"train_loss": 0.010835660621523857, "global_step": 12221, "epoch": 102, "lr": 9.340575638440638e-05} +{"train_loss": 0.005352589767426252, "global_step": 12222, "epoch": 102, "lr": 9.340465664501878e-05} +{"train_loss": 0.004569810815155506, "global_step": 12223, "epoch": 102, "lr": 9.340355682041077e-05} +{"train_loss": 0.007981940172612667, "global_step": 12224, "epoch": 102, "lr": 9.34024569105845e-05} +{"train_loss": 0.010980053804814816, "global_step": 12225, "epoch": 102, "lr": 9.340135691554215e-05} +{"train_loss": 0.01080751046538353, "global_step": 12226, "epoch": 102, "lr": 9.340025683528589e-05} +{"train_loss": 0.007633148692548275, "global_step": 12227, "epoch": 102, "lr": 9.339915666981784e-05} +{"train_loss": 0.006823085714131594, "global_step": 12228, "epoch": 102, "lr": 9.33980564191402e-05} +{"train_loss": 0.012531491927802563, "global_step": 12229, "epoch": 102, "lr": 9.33969560832551e-05} +{"train_loss": 0.007583401165902615, "global_step": 12230, "epoch": 102, "lr": 9.33958556621647e-05} +{"train_loss": 0.01053343340754509, "global_step": 12231, "epoch": 102, "lr": 9.339475515587119e-05} +{"train_loss": 0.007991541177034378, "global_step": 12232, "epoch": 102, "lr": 9.33936545643767e-05} +{"train_loss": 0.007172272074967623, "global_step": 12233, "epoch": 102, "lr": 9.339255388768343e-05} +{"train_loss": 0.016897091642022133, "global_step": 12234, "epoch": 102, "lr": 9.33914531257935e-05} +{"train_loss": 0.010748467408120632, "global_step": 12235, "epoch": 102, "lr": 9.339035227870909e-05} +{"train_loss": 0.00568387983366847, "global_step": 12236, "epoch": 102, "lr": 9.338925134643237e-05} +{"train_loss": 0.015133686363697052, "global_step": 12237, "epoch": 102, "lr": 9.338815032896547e-05} +{"train_loss": 0.009125316515564919, "global_step": 12238, "epoch": 102, "lr": 9.338704922631059e-05} +{"train_loss": 0.009366382844746113, "global_step": 12239, "epoch": 102, "lr": 9.338594803846986e-05} +{"train_loss": 0.006853469181805849, "global_step": 12240, "epoch": 102, "lr": 9.338484676544547e-05} +{"train_loss": 0.008546167984604836, "global_step": 12241, "epoch": 102, "lr": 9.338374540723955e-05} +{"train_loss": 0.007003473583608866, "global_step": 12242, "epoch": 102, "lr": 9.33826439638543e-05} +{"train_loss": 0.014682970941066742, "global_step": 12243, "epoch": 102, "lr": 9.338154243529185e-05} +{"train_loss": 0.008792825043201447, "global_step": 12244, "epoch": 102, "lr": 9.33804408215544e-05} +{"train_loss": 0.010302137583494186, "global_step": 12245, "epoch": 102, "lr": 9.337933912264404e-05} +{"train_loss": 0.008582847192883492, "global_step": 12246, "epoch": 102, "lr": 9.337823733856304e-05} +{"train_loss": 0.010281870141625404, "global_step": 12247, "epoch": 102, "lr": 9.337713546931346e-05} +{"train_loss": 0.005401642993092537, "global_step": 12248, "epoch": 102, "lr": 9.337603351489753e-05} +{"train_loss": 0.009150807745754719, "global_step": 12249, "epoch": 102, "lr": 9.33749314753174e-05} +{"train_loss": 0.007059056311845779, "global_step": 12250, "epoch": 102, "lr": 9.337382935057521e-05} +{"train_loss": 0.013859483413398266, "global_step": 12251, "epoch": 102, "lr": 9.337272714067313e-05} +{"train_loss": 0.009770325385034084, "global_step": 12252, "epoch": 102, "lr": 9.337162484561336e-05} +{"train_loss": 0.008522833697497845, "global_step": 12253, "epoch": 102, "lr": 9.337052246539802e-05} +{"train_loss": 0.00907975435256958, "global_step": 12254, "epoch": 102, "lr": 9.336942000002931e-05} +{"train_loss": 0.012442921288311481, "global_step": 12255, "epoch": 102, "lr": 9.336831744950935e-05} +{"train_loss": 0.008514827113410756, "global_step": 12256, "epoch": 102, "lr": 9.336721481384036e-05, "val_loss": 0.021039549261331558} +{"train_loss": 0.008145501837134361, "global_step": 12257, "epoch": 103, "lr": 9.336611209302446e-05} +{"train_loss": 0.011911790817975998, "global_step": 12258, "epoch": 103, "lr": 9.336500928706385e-05} +{"train_loss": 0.009726356714963913, "global_step": 12259, "epoch": 103, "lr": 9.336390639596065e-05} +{"train_loss": 0.007938135415315628, "global_step": 12260, "epoch": 103, "lr": 9.336280341971707e-05} +{"train_loss": 0.008377531543374062, "global_step": 12261, "epoch": 103, "lr": 9.336170035833525e-05} +{"train_loss": 0.01461094617843628, "global_step": 12262, "epoch": 103, "lr": 9.336059721181737e-05} +{"train_loss": 0.007851166650652885, "global_step": 12263, "epoch": 103, "lr": 9.33594939801656e-05} +{"train_loss": 0.00855737179517746, "global_step": 12264, "epoch": 103, "lr": 9.335839066338208e-05} +{"train_loss": 0.008482567965984344, "global_step": 12265, "epoch": 103, "lr": 9.3357287261469e-05} +{"train_loss": 0.007678675465285778, "global_step": 12266, "epoch": 103, "lr": 9.33561837744285e-05} +{"train_loss": 0.008300898596644402, "global_step": 12267, "epoch": 103, "lr": 9.335508020226278e-05} +{"train_loss": 0.004959662910550833, "global_step": 12268, "epoch": 103, "lr": 9.3353976544974e-05} +{"train_loss": 0.008151243440806866, "global_step": 12269, "epoch": 103, "lr": 9.335287280256431e-05} +{"train_loss": 0.00836312398314476, "global_step": 12270, "epoch": 103, "lr": 9.335176897503588e-05} +{"train_loss": 0.011571154929697514, "global_step": 12271, "epoch": 103, "lr": 9.335066506239089e-05} +{"train_loss": 0.008438235148787498, "global_step": 12272, "epoch": 103, "lr": 9.334956106463151e-05} +{"train_loss": 0.006557709537446499, "global_step": 12273, "epoch": 103, "lr": 9.334845698175988e-05} +{"train_loss": 0.008835533633828163, "global_step": 12274, "epoch": 103, "lr": 9.33473528137782e-05} +{"train_loss": 0.009500490501523018, "global_step": 12275, "epoch": 103, "lr": 9.33462485606886e-05} +{"train_loss": 0.005639129318296909, "global_step": 12276, "epoch": 103, "lr": 9.334514422249329e-05} +{"train_loss": 0.01072442252188921, "global_step": 12277, "epoch": 103, "lr": 9.334403979919444e-05} +{"train_loss": 0.009132714942097664, "global_step": 12278, "epoch": 103, "lr": 9.334293529079417e-05} +{"train_loss": 0.009777268394827843, "global_step": 12279, "epoch": 103, "lr": 9.334183069729468e-05} +{"train_loss": 0.00981859676539898, "global_step": 12280, "epoch": 103, "lr": 9.334072601869815e-05} +{"train_loss": 0.012489104643464088, "global_step": 12281, "epoch": 103, "lr": 9.333962125500673e-05} +{"train_loss": 0.011280045844614506, "global_step": 12282, "epoch": 103, "lr": 9.333851640622257e-05} +{"train_loss": 0.010626176372170448, "global_step": 12283, "epoch": 103, "lr": 9.333741147234788e-05} +{"train_loss": 0.007548218593001366, "global_step": 12284, "epoch": 103, "lr": 9.333630645338482e-05} +{"train_loss": 0.007467110641300678, "global_step": 12285, "epoch": 103, "lr": 9.333520134933556e-05} +{"train_loss": 0.007473982870578766, "global_step": 12286, "epoch": 103, "lr": 9.333409616020224e-05} +{"train_loss": 0.009204168803989887, "global_step": 12287, "epoch": 103, "lr": 9.333299088598707e-05} +{"train_loss": 0.006177361588925123, "global_step": 12288, "epoch": 103, "lr": 9.333188552669218e-05} +{"train_loss": 0.00486418092623353, "global_step": 12289, "epoch": 103, "lr": 9.333078008231977e-05} +{"train_loss": 0.007755866274237633, "global_step": 12290, "epoch": 103, "lr": 9.332967455287202e-05} +{"train_loss": 0.006176332477480173, "global_step": 12291, "epoch": 103, "lr": 9.332856893835107e-05} +{"train_loss": 0.009625335223972797, "global_step": 12292, "epoch": 103, "lr": 9.332746323875909e-05} +{"train_loss": 0.008247362449765205, "global_step": 12293, "epoch": 103, "lr": 9.332635745409828e-05} +{"train_loss": 0.006359527353197336, "global_step": 12294, "epoch": 103, "lr": 9.33252515843708e-05} +{"train_loss": 0.012155357748270035, "global_step": 12295, "epoch": 103, "lr": 9.33241456295788e-05} +{"train_loss": 0.004693516995757818, "global_step": 12296, "epoch": 103, "lr": 9.33230395897245e-05} +{"train_loss": 0.006796861067414284, "global_step": 12297, "epoch": 103, "lr": 9.332193346481002e-05} +{"train_loss": 0.008608179166913033, "global_step": 12298, "epoch": 103, "lr": 9.332082725483756e-05} +{"train_loss": 0.007264418061822653, "global_step": 12299, "epoch": 103, "lr": 9.331972095980926e-05} +{"train_loss": 0.005395522806793451, "global_step": 12300, "epoch": 103, "lr": 9.331861457972732e-05} +{"train_loss": 0.014403644017875195, "global_step": 12301, "epoch": 103, "lr": 9.331750811459393e-05} +{"train_loss": 0.006894493009895086, "global_step": 12302, "epoch": 103, "lr": 9.331640156441124e-05} +{"train_loss": 0.00728512043133378, "global_step": 12303, "epoch": 103, "lr": 9.33152949291814e-05} +{"train_loss": 0.008089736104011536, "global_step": 12304, "epoch": 103, "lr": 9.331418820890662e-05} +{"train_loss": 0.012936842627823353, "global_step": 12305, "epoch": 103, "lr": 9.331308140358908e-05} +{"train_loss": 0.008513427339494228, "global_step": 12306, "epoch": 103, "lr": 9.331197451323091e-05} +{"train_loss": 0.01459653303027153, "global_step": 12307, "epoch": 103, "lr": 9.33108675378343e-05} +{"train_loss": 0.006117667071521282, "global_step": 12308, "epoch": 103, "lr": 9.330976047740143e-05} +{"train_loss": 0.00894157774746418, "global_step": 12309, "epoch": 103, "lr": 9.330865333193449e-05} +{"train_loss": 0.0063362750224769115, "global_step": 12310, "epoch": 103, "lr": 9.330754610143562e-05} +{"train_loss": 0.0069178324192762375, "global_step": 12311, "epoch": 103, "lr": 9.3306438785907e-05} +{"train_loss": 0.006616001948714256, "global_step": 12312, "epoch": 103, "lr": 9.330533138535083e-05} +{"train_loss": 0.007238257676362991, "global_step": 12313, "epoch": 103, "lr": 9.330422389976928e-05} +{"train_loss": 0.006681227125227451, "global_step": 12314, "epoch": 103, "lr": 9.330311632916449e-05} +{"train_loss": 0.010546188801527023, "global_step": 12315, "epoch": 103, "lr": 9.330200867353866e-05} +{"train_loss": 0.008352480828762054, "global_step": 12316, "epoch": 103, "lr": 9.330090093289397e-05} +{"train_loss": 0.009582025930285454, "global_step": 12317, "epoch": 103, "lr": 9.329979310723257e-05} +{"train_loss": 0.015199696645140648, "global_step": 12318, "epoch": 103, "lr": 9.329868519655668e-05} +{"train_loss": 0.007894579321146011, "global_step": 12319, "epoch": 103, "lr": 9.329757720086844e-05} +{"train_loss": 0.01027613878250122, "global_step": 12320, "epoch": 103, "lr": 9.329646912017003e-05} +{"train_loss": 0.007224442902952433, "global_step": 12321, "epoch": 103, "lr": 9.32953609544636e-05} +{"train_loss": 0.006614602170884609, "global_step": 12322, "epoch": 103, "lr": 9.329425270375139e-05} +{"train_loss": 0.011123517528176308, "global_step": 12323, "epoch": 103, "lr": 9.329314436803554e-05} +{"train_loss": 0.00891901459544897, "global_step": 12324, "epoch": 103, "lr": 9.329203594731822e-05} +{"train_loss": 0.0057921381667256355, "global_step": 12325, "epoch": 103, "lr": 9.32909274416016e-05} +{"train_loss": 0.011246285401284695, "global_step": 12326, "epoch": 103, "lr": 9.328981885088787e-05} +{"train_loss": 0.005384551361203194, "global_step": 12327, "epoch": 103, "lr": 9.328871017517922e-05} +{"train_loss": 0.00861378014087677, "global_step": 12328, "epoch": 103, "lr": 9.32876014144778e-05} +{"train_loss": 0.009563571773469448, "global_step": 12329, "epoch": 103, "lr": 9.328649256878581e-05} +{"train_loss": 0.006542779039591551, "global_step": 12330, "epoch": 103, "lr": 9.328538363810541e-05} +{"train_loss": 0.006723033729940653, "global_step": 12331, "epoch": 103, "lr": 9.328427462243879e-05} +{"train_loss": 0.012774697504937649, "global_step": 12332, "epoch": 103, "lr": 9.328316552178811e-05} +{"train_loss": 0.007230513263493776, "global_step": 12333, "epoch": 103, "lr": 9.328205633615557e-05} +{"train_loss": 0.007456906605511904, "global_step": 12334, "epoch": 103, "lr": 9.328094706554333e-05} +{"train_loss": 0.010731572285294533, "global_step": 12335, "epoch": 103, "lr": 9.327983770995357e-05} +{"train_loss": 0.00809949915856123, "global_step": 12336, "epoch": 103, "lr": 9.327872826938848e-05} +{"train_loss": 0.00824509933590889, "global_step": 12337, "epoch": 103, "lr": 9.327761874385022e-05} +{"train_loss": 0.009309728629887104, "global_step": 12338, "epoch": 103, "lr": 9.327650913334099e-05} +{"train_loss": 0.008171919733285904, "global_step": 12339, "epoch": 103, "lr": 9.327539943786296e-05} +{"train_loss": 0.008129823952913284, "global_step": 12340, "epoch": 103, "lr": 9.327428965741829e-05} +{"train_loss": 0.006537492852658033, "global_step": 12341, "epoch": 103, "lr": 9.327317979200919e-05} +{"train_loss": 0.00948903989046812, "global_step": 12342, "epoch": 103, "lr": 9.327206984163783e-05} +{"train_loss": 0.008935515768826008, "global_step": 12343, "epoch": 103, "lr": 9.327095980630637e-05} +{"train_loss": 0.007867797277867794, "global_step": 12344, "epoch": 103, "lr": 9.326984968601701e-05} +{"train_loss": 0.0065567372366786, "global_step": 12345, "epoch": 103, "lr": 9.326873948077192e-05} +{"train_loss": 0.009593593887984753, "global_step": 12346, "epoch": 103, "lr": 9.326762919057329e-05} +{"train_loss": 0.0067876186221838, "global_step": 12347, "epoch": 103, "lr": 9.326651881542328e-05} +{"train_loss": 0.00537718553096056, "global_step": 12348, "epoch": 103, "lr": 9.326540835532409e-05} +{"train_loss": 0.00507039949297905, "global_step": 12349, "epoch": 103, "lr": 9.326429781027788e-05} +{"train_loss": 0.007104916498064995, "global_step": 12350, "epoch": 103, "lr": 9.326318718028686e-05} +{"train_loss": 0.005782150663435459, "global_step": 12351, "epoch": 103, "lr": 9.326207646535319e-05} +{"train_loss": 0.006061769090592861, "global_step": 12352, "epoch": 103, "lr": 9.326096566547906e-05} +{"train_loss": 0.007342594210058451, "global_step": 12353, "epoch": 103, "lr": 9.325985478066663e-05} +{"train_loss": 0.007638292387127876, "global_step": 12354, "epoch": 103, "lr": 9.32587438109181e-05} +{"train_loss": 0.007105697877705097, "global_step": 12355, "epoch": 103, "lr": 9.325763275623566e-05} +{"train_loss": 0.007808055728673935, "global_step": 12356, "epoch": 103, "lr": 9.325652161662148e-05} +{"train_loss": 0.010826501064002514, "global_step": 12357, "epoch": 103, "lr": 9.325541039207773e-05} +{"train_loss": 0.006358325947076082, "global_step": 12358, "epoch": 103, "lr": 9.325429908260661e-05} +{"train_loss": 0.004801446571946144, "global_step": 12359, "epoch": 103, "lr": 9.32531876882103e-05} +{"train_loss": 0.009128137491643429, "global_step": 12360, "epoch": 103, "lr": 9.325207620889096e-05} +{"train_loss": 0.009287645108997822, "global_step": 12361, "epoch": 103, "lr": 9.325096464465081e-05} +{"train_loss": 0.007974823005497456, "global_step": 12362, "epoch": 103, "lr": 9.324985299549199e-05} +{"train_loss": 0.007233431562781334, "global_step": 12363, "epoch": 103, "lr": 9.324874126141672e-05} +{"train_loss": 0.010141855105757713, "global_step": 12364, "epoch": 103, "lr": 9.324762944242716e-05} +{"train_loss": 0.0053077032789587975, "global_step": 12365, "epoch": 103, "lr": 9.32465175385255e-05} +{"train_loss": 0.007487935945391655, "global_step": 12366, "epoch": 103, "lr": 9.324540554971392e-05} +{"train_loss": 0.0128275565803051, "global_step": 12367, "epoch": 103, "lr": 9.324429347599461e-05} +{"train_loss": 0.012402879074215889, "global_step": 12368, "epoch": 103, "lr": 9.324318131736976e-05} +{"train_loss": 0.005039808340370655, "global_step": 12369, "epoch": 103, "lr": 9.324206907384154e-05} +{"train_loss": 0.009960918687283993, "global_step": 12370, "epoch": 103, "lr": 9.324095674541211e-05} +{"train_loss": 0.010823193937540054, "global_step": 12371, "epoch": 103, "lr": 9.323984433208372e-05} +{"train_loss": 0.007096646353602409, "global_step": 12372, "epoch": 103, "lr": 9.323873183385849e-05} +{"train_loss": 0.007231791969388723, "global_step": 12373, "epoch": 103, "lr": 9.323761925073863e-05} +{"train_loss": 0.010081215761601925, "global_step": 12374, "epoch": 103, "lr": 9.323650658272633e-05} +{"train_loss": 0.008447282376284358, "global_step": 12375, "epoch": 103, "lr": 9.323539382982378e-05, "val_loss": 0.01747852936387062} +{"train_loss": 0.008865006268024445, "global_step": 12376, "epoch": 104, "lr": 9.323428099203314e-05} +{"train_loss": 0.008703015744686127, "global_step": 12377, "epoch": 104, "lr": 9.32331680693566e-05} +{"train_loss": 0.01042219903320074, "global_step": 12378, "epoch": 104, "lr": 9.323205506179638e-05} +{"train_loss": 0.007240707986056805, "global_step": 12379, "epoch": 104, "lr": 9.323094196935461e-05} +{"train_loss": 0.014169702306389809, "global_step": 12380, "epoch": 104, "lr": 9.322982879203352e-05} +{"train_loss": 0.007320580538362265, "global_step": 12381, "epoch": 104, "lr": 9.322871552983528e-05} +{"train_loss": 0.007258723024278879, "global_step": 12382, "epoch": 104, "lr": 9.322760218276206e-05} +{"train_loss": 0.01248256303369999, "global_step": 12383, "epoch": 104, "lr": 9.322648875081608e-05} +{"train_loss": 0.007388237863779068, "global_step": 12384, "epoch": 104, "lr": 9.32253752339995e-05} +{"train_loss": 0.007661648094654083, "global_step": 12385, "epoch": 104, "lr": 9.322426163231451e-05} +{"train_loss": 0.011926773004233837, "global_step": 12386, "epoch": 104, "lr": 9.32231479457633e-05} +{"train_loss": 0.00851207971572876, "global_step": 12387, "epoch": 104, "lr": 9.322203417434807e-05} +{"train_loss": 0.008742978796362877, "global_step": 12388, "epoch": 104, "lr": 9.322092031807097e-05} +{"train_loss": 0.009821389801800251, "global_step": 12389, "epoch": 104, "lr": 9.321980637693424e-05} +{"train_loss": 0.007210229057818651, "global_step": 12390, "epoch": 104, "lr": 9.321869235094002e-05} +{"train_loss": 0.008722796104848385, "global_step": 12391, "epoch": 104, "lr": 9.32175782400905e-05} +{"train_loss": 0.007861781865358353, "global_step": 12392, "epoch": 104, "lr": 9.321646404438791e-05} +{"train_loss": 0.010643444024026394, "global_step": 12393, "epoch": 104, "lr": 9.321534976383439e-05} +{"train_loss": 0.007211462594568729, "global_step": 12394, "epoch": 104, "lr": 9.321423539843217e-05} +{"train_loss": 0.011809277348220348, "global_step": 12395, "epoch": 104, "lr": 9.32131209481834e-05} +{"train_loss": 0.006406152155250311, "global_step": 12396, "epoch": 104, "lr": 9.321200641309028e-05} +{"train_loss": 0.009101325646042824, "global_step": 12397, "epoch": 104, "lr": 9.321089179315501e-05} +{"train_loss": 0.010974501259624958, "global_step": 12398, "epoch": 104, "lr": 9.320977708837976e-05} +{"train_loss": 0.00850602425634861, "global_step": 12399, "epoch": 104, "lr": 9.320866229876675e-05} +{"train_loss": 0.008625682443380356, "global_step": 12400, "epoch": 104, "lr": 9.320754742431812e-05} +{"train_loss": 0.010046052746474743, "global_step": 12401, "epoch": 104, "lr": 9.320643246503611e-05} +{"train_loss": 0.008185056038200855, "global_step": 12402, "epoch": 104, "lr": 9.320531742092288e-05} +{"train_loss": 0.01199257466942072, "global_step": 12403, "epoch": 104, "lr": 9.320420229198061e-05} +{"train_loss": 0.0062419818714261055, "global_step": 12404, "epoch": 104, "lr": 9.320308707821153e-05} +{"train_loss": 0.004991823807358742, "global_step": 12405, "epoch": 104, "lr": 9.320197177961779e-05} +{"train_loss": 0.008874556981027126, "global_step": 12406, "epoch": 104, "lr": 9.32008563962016e-05} +{"train_loss": 0.011738922446966171, "global_step": 12407, "epoch": 104, "lr": 9.319974092796513e-05} +{"train_loss": 0.012133079580962658, "global_step": 12408, "epoch": 104, "lr": 9.319862537491059e-05} +{"train_loss": 0.007638887967914343, "global_step": 12409, "epoch": 104, "lr": 9.319750973704017e-05} +{"train_loss": 0.008311004377901554, "global_step": 12410, "epoch": 104, "lr": 9.319639401435605e-05} +{"train_loss": 0.007483270950615406, "global_step": 12411, "epoch": 104, "lr": 9.319527820686043e-05} +{"train_loss": 0.009851181879639626, "global_step": 12412, "epoch": 104, "lr": 9.319416231455549e-05} +{"train_loss": 0.008785981684923172, "global_step": 12413, "epoch": 104, "lr": 9.319304633744342e-05} +{"train_loss": 0.007054822985082865, "global_step": 12414, "epoch": 104, "lr": 9.319193027552643e-05} +{"train_loss": 0.011103485710918903, "global_step": 12415, "epoch": 104, "lr": 9.319081412880671e-05} +{"train_loss": 0.007454965263605118, "global_step": 12416, "epoch": 104, "lr": 9.318969789728642e-05} +{"train_loss": 0.013428461737930775, "global_step": 12417, "epoch": 104, "lr": 9.318858158096777e-05} +{"train_loss": 0.005877423565834761, "global_step": 12418, "epoch": 104, "lr": 9.318746517985297e-05} +{"train_loss": 0.009998541325330734, "global_step": 12419, "epoch": 104, "lr": 9.318634869394419e-05} +{"train_loss": 0.0051452093757689, "global_step": 12420, "epoch": 104, "lr": 9.318523212324361e-05} +{"train_loss": 0.005901414435356855, "global_step": 12421, "epoch": 104, "lr": 9.318411546775348e-05} +{"train_loss": 0.011593290604650974, "global_step": 12422, "epoch": 104, "lr": 9.318299872747591e-05} +{"train_loss": 0.010969149880111217, "global_step": 12423, "epoch": 104, "lr": 9.318188190241317e-05} +{"train_loss": 0.005720717832446098, "global_step": 12424, "epoch": 104, "lr": 9.31807649925674e-05} +{"train_loss": 0.00911376066505909, "global_step": 12425, "epoch": 104, "lr": 9.317964799794081e-05} +{"train_loss": 0.008379671722650528, "global_step": 12426, "epoch": 104, "lr": 9.317853091853561e-05} +{"train_loss": 0.009334946982562542, "global_step": 12427, "epoch": 104, "lr": 9.317741375435396e-05} +{"train_loss": 0.009348297491669655, "global_step": 12428, "epoch": 104, "lr": 9.317629650539808e-05} +{"train_loss": 0.008742495439946651, "global_step": 12429, "epoch": 104, "lr": 9.317517917167015e-05} +{"train_loss": 0.006439611781388521, "global_step": 12430, "epoch": 104, "lr": 9.317406175317237e-05} +{"train_loss": 0.009193423204123974, "global_step": 12431, "epoch": 104, "lr": 9.317294424990695e-05} +{"train_loss": 0.008669081144034863, "global_step": 12432, "epoch": 104, "lr": 9.317182666187604e-05} +{"train_loss": 0.0068300762213766575, "global_step": 12433, "epoch": 104, "lr": 9.317070898908187e-05} +{"train_loss": 0.013028819113969803, "global_step": 12434, "epoch": 104, "lr": 9.316959123152662e-05} +{"train_loss": 0.008931847289204597, "global_step": 12435, "epoch": 104, "lr": 9.31684733892125e-05} +{"train_loss": 0.01046566478908062, "global_step": 12436, "epoch": 104, "lr": 9.316735546214168e-05} +{"train_loss": 0.006946547422558069, "global_step": 12437, "epoch": 104, "lr": 9.316623745031639e-05} +{"train_loss": 0.008632942102849483, "global_step": 12438, "epoch": 104, "lr": 9.316511935373879e-05} +{"train_loss": 0.008699789643287659, "global_step": 12439, "epoch": 104, "lr": 9.316400117241109e-05} +{"train_loss": 0.007774239405989647, "global_step": 12440, "epoch": 104, "lr": 9.316288290633549e-05} +{"train_loss": 0.012128511443734169, "global_step": 12441, "epoch": 104, "lr": 9.316176455551418e-05} +{"train_loss": 0.008504855446517467, "global_step": 12442, "epoch": 104, "lr": 9.316064611994934e-05} +{"train_loss": 0.00856849830597639, "global_step": 12443, "epoch": 104, "lr": 9.315952759964321e-05} +{"train_loss": 0.006772784516215324, "global_step": 12444, "epoch": 104, "lr": 9.315840899459793e-05} +{"train_loss": 0.013001578859984875, "global_step": 12445, "epoch": 104, "lr": 9.315729030481575e-05} +{"train_loss": 0.009039921686053276, "global_step": 12446, "epoch": 104, "lr": 9.315617153029884e-05} +{"train_loss": 0.008364493027329445, "global_step": 12447, "epoch": 104, "lr": 9.315505267104938e-05} +{"train_loss": 0.01045483723282814, "global_step": 12448, "epoch": 104, "lr": 9.31539337270696e-05} +{"train_loss": 0.008179137483239174, "global_step": 12449, "epoch": 104, "lr": 9.315281469836168e-05} +{"train_loss": 0.011786776594817638, "global_step": 12450, "epoch": 104, "lr": 9.31516955849278e-05} +{"train_loss": 0.00842597521841526, "global_step": 12451, "epoch": 104, "lr": 9.31505763867702e-05} +{"train_loss": 0.009496403858065605, "global_step": 12452, "epoch": 104, "lr": 9.314945710389103e-05} +{"train_loss": 0.007751318626105785, "global_step": 12453, "epoch": 104, "lr": 9.314833773629253e-05} +{"train_loss": 0.01315560657531023, "global_step": 12454, "epoch": 104, "lr": 9.314721828397687e-05} +{"train_loss": 0.010588503442704678, "global_step": 12455, "epoch": 104, "lr": 9.314609874694627e-05} +{"train_loss": 0.010949420742690563, "global_step": 12456, "epoch": 104, "lr": 9.314497912520289e-05} +{"train_loss": 0.005625125952064991, "global_step": 12457, "epoch": 104, "lr": 9.314385941874897e-05} +{"train_loss": 0.007786512840539217, "global_step": 12458, "epoch": 104, "lr": 9.314273962758669e-05} +{"train_loss": 0.008982069790363312, "global_step": 12459, "epoch": 104, "lr": 9.314161975171824e-05} +{"train_loss": 0.010568346828222275, "global_step": 12460, "epoch": 104, "lr": 9.314049979114584e-05} +{"train_loss": 0.005217854864895344, "global_step": 12461, "epoch": 104, "lr": 9.313937974587167e-05} +{"train_loss": 0.008956607431173325, "global_step": 12462, "epoch": 104, "lr": 9.313825961589795e-05} +{"train_loss": 0.015115019865334034, "global_step": 12463, "epoch": 104, "lr": 9.313713940122685e-05} +{"train_loss": 0.005219362210482359, "global_step": 12464, "epoch": 104, "lr": 9.313601910186058e-05} +{"train_loss": 0.008160339668393135, "global_step": 12465, "epoch": 104, "lr": 9.313489871780137e-05} +{"train_loss": 0.008785500191152096, "global_step": 12466, "epoch": 104, "lr": 9.313377824905138e-05} +{"train_loss": 0.004761907737702131, "global_step": 12467, "epoch": 104, "lr": 9.313265769561282e-05} +{"train_loss": 0.007782195694744587, "global_step": 12468, "epoch": 104, "lr": 9.313153705748789e-05} +{"train_loss": 0.009013960137963295, "global_step": 12469, "epoch": 104, "lr": 9.31304163346788e-05} +{"train_loss": 0.00885193981230259, "global_step": 12470, "epoch": 104, "lr": 9.312929552718776e-05} +{"train_loss": 0.008376240730285645, "global_step": 12471, "epoch": 104, "lr": 9.312817463501696e-05} +{"train_loss": 0.00761326402425766, "global_step": 12472, "epoch": 104, "lr": 9.312705365816857e-05} +{"train_loss": 0.010813551023602486, "global_step": 12473, "epoch": 104, "lr": 9.312593259664483e-05} +{"train_loss": 0.008700943551957607, "global_step": 12474, "epoch": 104, "lr": 9.312481145044793e-05} +{"train_loss": 0.008589409291744232, "global_step": 12475, "epoch": 104, "lr": 9.312369021958007e-05} +{"train_loss": 0.007043106015771627, "global_step": 12476, "epoch": 104, "lr": 9.312256890404346e-05} +{"train_loss": 0.005424924660474062, "global_step": 12477, "epoch": 104, "lr": 9.312144750384028e-05} +{"train_loss": 0.008381597697734833, "global_step": 12478, "epoch": 104, "lr": 9.312032601897274e-05} +{"train_loss": 0.010332610458135605, "global_step": 12479, "epoch": 104, "lr": 9.311920444944305e-05} +{"train_loss": 0.005328322760760784, "global_step": 12480, "epoch": 104, "lr": 9.311808279525343e-05} +{"train_loss": 0.009632453322410583, "global_step": 12481, "epoch": 104, "lr": 9.311696105640604e-05} +{"train_loss": 0.009866408072412014, "global_step": 12482, "epoch": 104, "lr": 9.311583923290311e-05} +{"train_loss": 0.011899071745574474, "global_step": 12483, "epoch": 104, "lr": 9.311471732474682e-05} +{"train_loss": 0.013718755915760994, "global_step": 12484, "epoch": 104, "lr": 9.311359533193941e-05} +{"train_loss": 0.007900024764239788, "global_step": 12485, "epoch": 104, "lr": 9.311247325448305e-05} +{"train_loss": 0.009220730513334274, "global_step": 12486, "epoch": 104, "lr": 9.311135109237996e-05} +{"train_loss": 0.008192638866603374, "global_step": 12487, "epoch": 104, "lr": 9.311022884563234e-05} +{"train_loss": 0.01057050283998251, "global_step": 12488, "epoch": 104, "lr": 9.310910651424238e-05} +{"train_loss": 0.005931043531745672, "global_step": 12489, "epoch": 104, "lr": 9.31079840982123e-05} +{"train_loss": 0.00831578578799963, "global_step": 12490, "epoch": 104, "lr": 9.31068615975443e-05} +{"train_loss": 0.0069298832677304745, "global_step": 12491, "epoch": 104, "lr": 9.310573901224059e-05} +{"train_loss": 0.00855318084359169, "global_step": 12492, "epoch": 104, "lr": 9.310461634230336e-05} +{"train_loss": 0.007892441935837269, "global_step": 12493, "epoch": 104, "lr": 9.310349358773482e-05} +{"train_loss": 0.008912831368785696, "global_step": 12494, "epoch": 104, "lr": 9.310237074853717e-05, "val_loss": 0.013702543452382088} +{"train_loss": 0.008594559505581856, "global_step": 12495, "epoch": 105, "lr": 9.310124782471263e-05} +{"train_loss": 0.010804381221532822, "global_step": 12496, "epoch": 105, "lr": 9.310012481626339e-05} +{"train_loss": 0.012795635499060154, "global_step": 12497, "epoch": 105, "lr": 9.309900172319166e-05} +{"train_loss": 0.008604428730905056, "global_step": 12498, "epoch": 105, "lr": 9.309787854549965e-05} +{"train_loss": 0.009104840457439423, "global_step": 12499, "epoch": 105, "lr": 9.309675528318955e-05} +{"train_loss": 0.00960462260991335, "global_step": 12500, "epoch": 105, "lr": 9.309563193626359e-05} +{"train_loss": 0.011059088632464409, "global_step": 12501, "epoch": 105, "lr": 9.309450850472394e-05} +{"train_loss": 0.009387552738189697, "global_step": 12502, "epoch": 105, "lr": 9.309338498857283e-05} +{"train_loss": 0.005444428883492947, "global_step": 12503, "epoch": 105, "lr": 9.309226138781247e-05} +{"train_loss": 0.007727629505097866, "global_step": 12504, "epoch": 105, "lr": 9.309113770244506e-05} +{"train_loss": 0.01587597467005253, "global_step": 12505, "epoch": 105, "lr": 9.30900139324728e-05} +{"train_loss": 0.009326075203716755, "global_step": 12506, "epoch": 105, "lr": 9.308889007789792e-05} +{"train_loss": 0.0057465797290205956, "global_step": 12507, "epoch": 105, "lr": 9.308776613872258e-05} +{"train_loss": 0.00793579500168562, "global_step": 12508, "epoch": 105, "lr": 9.308664211494903e-05} +{"train_loss": 0.008298858068883419, "global_step": 12509, "epoch": 105, "lr": 9.308551800657945e-05} +{"train_loss": 0.007427888456732035, "global_step": 12510, "epoch": 105, "lr": 9.308439381361607e-05} +{"train_loss": 0.007103756535798311, "global_step": 12511, "epoch": 105, "lr": 9.308326953606108e-05} +{"train_loss": 0.00476488471031189, "global_step": 12512, "epoch": 105, "lr": 9.308214517391669e-05} +{"train_loss": 0.014522038400173187, "global_step": 12513, "epoch": 105, "lr": 9.308102072718512e-05} +{"train_loss": 0.007075830362737179, "global_step": 12514, "epoch": 105, "lr": 9.307989619586857e-05} +{"train_loss": 0.007623595185577869, "global_step": 12515, "epoch": 105, "lr": 9.307877157996923e-05} +{"train_loss": 0.013289776630699635, "global_step": 12516, "epoch": 105, "lr": 9.307764687948935e-05} +{"train_loss": 0.006658199708908796, "global_step": 12517, "epoch": 105, "lr": 9.307652209443108e-05} +{"train_loss": 0.005860186647623777, "global_step": 12518, "epoch": 105, "lr": 9.307539722479667e-05} +{"train_loss": 0.00946139357984066, "global_step": 12519, "epoch": 105, "lr": 9.307427227058834e-05} +{"train_loss": 0.01042302418500185, "global_step": 12520, "epoch": 105, "lr": 9.307314723180827e-05} +{"train_loss": 0.008474815636873245, "global_step": 12521, "epoch": 105, "lr": 9.307202210845867e-05} +{"train_loss": 0.006152445450425148, "global_step": 12522, "epoch": 105, "lr": 9.307089690054177e-05} +{"train_loss": 0.010505090467631817, "global_step": 12523, "epoch": 105, "lr": 9.306977160805974e-05} +{"train_loss": 0.00419418653473258, "global_step": 12524, "epoch": 105, "lr": 9.306864623101484e-05} +{"train_loss": 0.007310693617910147, "global_step": 12525, "epoch": 105, "lr": 9.306752076940924e-05} +{"train_loss": 0.009225037880241871, "global_step": 12526, "epoch": 105, "lr": 9.306639522324516e-05} +{"train_loss": 0.007343224249780178, "global_step": 12527, "epoch": 105, "lr": 9.306526959252482e-05} +{"train_loss": 0.006806142628192902, "global_step": 12528, "epoch": 105, "lr": 9.306414387725042e-05} +{"train_loss": 0.007326668594032526, "global_step": 12529, "epoch": 105, "lr": 9.306301807742417e-05} +{"train_loss": 0.008302641101181507, "global_step": 12530, "epoch": 105, "lr": 9.30618921930483e-05} +{"train_loss": 0.00740174762904644, "global_step": 12531, "epoch": 105, "lr": 9.306076622412501e-05} +{"train_loss": 0.008918249048292637, "global_step": 12532, "epoch": 105, "lr": 9.305964017065648e-05} +{"train_loss": 0.00695814611390233, "global_step": 12533, "epoch": 105, "lr": 9.305851403264496e-05} +{"train_loss": 0.015876425430178642, "global_step": 12534, "epoch": 105, "lr": 9.305738781009266e-05} +{"train_loss": 0.012817504815757275, "global_step": 12535, "epoch": 105, "lr": 9.305626150300176e-05} +{"train_loss": 0.010620197281241417, "global_step": 12536, "epoch": 105, "lr": 9.305513511137449e-05} +{"train_loss": 0.008675467222929, "global_step": 12537, "epoch": 105, "lr": 9.305400863521308e-05} +{"train_loss": 0.008454646915197372, "global_step": 12538, "epoch": 105, "lr": 9.305288207451972e-05} +{"train_loss": 0.005571895278990269, "global_step": 12539, "epoch": 105, "lr": 9.305175542929662e-05} +{"train_loss": 0.014058968052268028, "global_step": 12540, "epoch": 105, "lr": 9.3050628699546e-05} +{"train_loss": 0.010618998669087887, "global_step": 12541, "epoch": 105, "lr": 9.304950188527006e-05} +{"train_loss": 0.013615702278912067, "global_step": 12542, "epoch": 105, "lr": 9.304837498647103e-05} +{"train_loss": 0.005801067221909761, "global_step": 12543, "epoch": 105, "lr": 9.304724800315112e-05} +{"train_loss": 0.006114177871495485, "global_step": 12544, "epoch": 105, "lr": 9.304612093531254e-05} +{"train_loss": 0.007648589555174112, "global_step": 12545, "epoch": 105, "lr": 9.304499378295748e-05} +{"train_loss": 0.008973469026386738, "global_step": 12546, "epoch": 105, "lr": 9.304386654608819e-05} +{"train_loss": 0.006287253461778164, "global_step": 12547, "epoch": 105, "lr": 9.304273922470686e-05} +{"train_loss": 0.011753451079130173, "global_step": 12548, "epoch": 105, "lr": 9.30416118188157e-05} +{"train_loss": 0.011193404905498028, "global_step": 12549, "epoch": 105, "lr": 9.304048432841695e-05} +{"train_loss": 0.008832884021103382, "global_step": 12550, "epoch": 105, "lr": 9.303935675351281e-05} +{"train_loss": 0.012119264341890812, "global_step": 12551, "epoch": 105, "lr": 9.303822909410547e-05} +{"train_loss": 0.0068291714414954185, "global_step": 12552, "epoch": 105, "lr": 9.30371013501972e-05} +{"train_loss": 0.005768533330410719, "global_step": 12553, "epoch": 105, "lr": 9.303597352179014e-05} +{"train_loss": 0.006117462180554867, "global_step": 12554, "epoch": 105, "lr": 9.303484560888657e-05} +{"train_loss": 0.011310846544802189, "global_step": 12555, "epoch": 105, "lr": 9.303371761148867e-05} +{"train_loss": 0.008087526075541973, "global_step": 12556, "epoch": 105, "lr": 9.303258952959865e-05} +{"train_loss": 0.006459646392613649, "global_step": 12557, "epoch": 105, "lr": 9.303146136321876e-05} +{"train_loss": 0.009503607638180256, "global_step": 12558, "epoch": 105, "lr": 9.303033311235119e-05} +{"train_loss": 0.013057160191237926, "global_step": 12559, "epoch": 105, "lr": 9.302920477699814e-05} +{"train_loss": 0.011858812533318996, "global_step": 12560, "epoch": 105, "lr": 9.302807635716186e-05} +{"train_loss": 0.008650293573737144, "global_step": 12561, "epoch": 105, "lr": 9.302694785284454e-05} +{"train_loss": 0.011771494522690773, "global_step": 12562, "epoch": 105, "lr": 9.30258192640484e-05} +{"train_loss": 0.008958234451711178, "global_step": 12563, "epoch": 105, "lr": 9.302469059077568e-05} +{"train_loss": 0.0061460924334824085, "global_step": 12564, "epoch": 105, "lr": 9.302356183302857e-05} +{"train_loss": 0.011823452077805996, "global_step": 12565, "epoch": 105, "lr": 9.302243299080928e-05} +{"train_loss": 0.009307144209742546, "global_step": 12566, "epoch": 105, "lr": 9.302130406412006e-05} +{"train_loss": 0.007316396106034517, "global_step": 12567, "epoch": 105, "lr": 9.302017505296309e-05} +{"train_loss": 0.013030139729380608, "global_step": 12568, "epoch": 105, "lr": 9.30190459573406e-05} +{"train_loss": 0.008889516815543175, "global_step": 12569, "epoch": 105, "lr": 9.301791677725483e-05} +{"train_loss": 0.007383449003100395, "global_step": 12570, "epoch": 105, "lr": 9.301678751270795e-05} +{"train_loss": 0.00823839008808136, "global_step": 12571, "epoch": 105, "lr": 9.301565816370221e-05} +{"train_loss": 0.009817364625632763, "global_step": 12572, "epoch": 105, "lr": 9.301452873023983e-05} +{"train_loss": 0.009135870262980461, "global_step": 12573, "epoch": 105, "lr": 9.301339921232301e-05} +{"train_loss": 0.01250612922012806, "global_step": 12574, "epoch": 105, "lr": 9.301226960995399e-05} +{"train_loss": 0.0076517448760569096, "global_step": 12575, "epoch": 105, "lr": 9.301113992313496e-05} +{"train_loss": 0.008455552160739899, "global_step": 12576, "epoch": 105, "lr": 9.301001015186815e-05} +{"train_loss": 0.007802790030837059, "global_step": 12577, "epoch": 105, "lr": 9.300888029615578e-05} +{"train_loss": 0.011188406497240067, "global_step": 12578, "epoch": 105, "lr": 9.300775035600008e-05} +{"train_loss": 0.009268803521990776, "global_step": 12579, "epoch": 105, "lr": 9.300662033140325e-05} +{"train_loss": 0.012262089177966118, "global_step": 12580, "epoch": 105, "lr": 9.300549022236751e-05} +{"train_loss": 0.00989228393882513, "global_step": 12581, "epoch": 105, "lr": 9.30043600288951e-05} +{"train_loss": 0.011014704592525959, "global_step": 12582, "epoch": 105, "lr": 9.30032297509882e-05} +{"train_loss": 0.00917909201234579, "global_step": 12583, "epoch": 105, "lr": 9.300209938864907e-05} +{"train_loss": 0.008646789006888866, "global_step": 12584, "epoch": 105, "lr": 9.300096894187991e-05} +{"train_loss": 0.008551442995667458, "global_step": 12585, "epoch": 105, "lr": 9.299983841068294e-05} +{"train_loss": 0.01150574255734682, "global_step": 12586, "epoch": 105, "lr": 9.299870779506039e-05} +{"train_loss": 0.006037720013409853, "global_step": 12587, "epoch": 105, "lr": 9.299757709501447e-05} +{"train_loss": 0.011805307120084763, "global_step": 12588, "epoch": 105, "lr": 9.299644631054739e-05} +{"train_loss": 0.009477967396378517, "global_step": 12589, "epoch": 105, "lr": 9.299531544166138e-05} +{"train_loss": 0.006450703367590904, "global_step": 12590, "epoch": 105, "lr": 9.299418448835866e-05} +{"train_loss": 0.010983980260789394, "global_step": 12591, "epoch": 105, "lr": 9.299305345064146e-05} +{"train_loss": 0.010089341551065445, "global_step": 12592, "epoch": 105, "lr": 9.299192232851199e-05} +{"train_loss": 0.01026749424636364, "global_step": 12593, "epoch": 105, "lr": 9.299079112197246e-05} +{"train_loss": 0.007497862912714481, "global_step": 12594, "epoch": 105, "lr": 9.298965983102512e-05} +{"train_loss": 0.009454729966819286, "global_step": 12595, "epoch": 105, "lr": 9.298852845567219e-05} +{"train_loss": 0.009240595623850822, "global_step": 12596, "epoch": 105, "lr": 9.298739699591586e-05} +{"train_loss": 0.013397504575550556, "global_step": 12597, "epoch": 105, "lr": 9.298626545175837e-05} +{"train_loss": 0.007886948063969612, "global_step": 12598, "epoch": 105, "lr": 9.298513382320193e-05} +{"train_loss": 0.006119265221059322, "global_step": 12599, "epoch": 105, "lr": 9.298400211024879e-05} +{"train_loss": 0.007086949422955513, "global_step": 12600, "epoch": 105, "lr": 9.298287031290113e-05} +{"train_loss": 0.010401730425655842, "global_step": 12601, "epoch": 105, "lr": 9.298173843116123e-05} +{"train_loss": 0.009439743123948574, "global_step": 12602, "epoch": 105, "lr": 9.298060646503125e-05} +{"train_loss": 0.007831393741071224, "global_step": 12603, "epoch": 105, "lr": 9.297947441451344e-05} +{"train_loss": 0.005551240406930447, "global_step": 12604, "epoch": 105, "lr": 9.297834227961004e-05} +{"train_loss": 0.0075661842711269855, "global_step": 12605, "epoch": 105, "lr": 9.297721006032325e-05} +{"train_loss": 0.006994991563260555, "global_step": 12606, "epoch": 105, "lr": 9.297607775665531e-05} +{"train_loss": 0.009409147314727306, "global_step": 12607, "epoch": 105, "lr": 9.297494536860842e-05} +{"train_loss": 0.007858379743993282, "global_step": 12608, "epoch": 105, "lr": 9.297381289618482e-05} +{"train_loss": 0.007808265276253223, "global_step": 12609, "epoch": 105, "lr": 9.297268033938673e-05} +{"train_loss": 0.0074637760408222675, "global_step": 12610, "epoch": 105, "lr": 9.297154769821637e-05} +{"train_loss": 0.007637580391019583, "global_step": 12611, "epoch": 105, "lr": 9.297041497267599e-05} +{"train_loss": 0.007391751278191805, "global_step": 12612, "epoch": 105, "lr": 9.296928216276774e-05} +{"train_loss": 0.008969739349480687, "global_step": 12613, "epoch": 105, "lr": 9.296814926849394e-05, "val_loss": 0.01906626671552658, "train_action_mse_error": 0.00020112883066758513} +{"train_loss": 0.012270941399037838, "global_step": 12614, "epoch": 106, "lr": 9.296701628985676e-05} +{"train_loss": 0.004309145733714104, "global_step": 12615, "epoch": 106, "lr": 9.296588322685842e-05} +{"train_loss": 0.00779440114274621, "global_step": 12616, "epoch": 106, "lr": 9.296475007950116e-05} +{"train_loss": 0.00622639199718833, "global_step": 12617, "epoch": 106, "lr": 9.296361684778722e-05} +{"train_loss": 0.01022512000054121, "global_step": 12618, "epoch": 106, "lr": 9.29624835317188e-05} +{"train_loss": 0.012034310027956963, "global_step": 12619, "epoch": 106, "lr": 9.296135013129812e-05} +{"train_loss": 0.006462334655225277, "global_step": 12620, "epoch": 106, "lr": 9.296021664652744e-05} +{"train_loss": 0.0077017517760396, "global_step": 12621, "epoch": 106, "lr": 9.295908307740895e-05} +{"train_loss": 0.007652821484953165, "global_step": 12622, "epoch": 106, "lr": 9.29579494239449e-05} +{"train_loss": 0.007789266295731068, "global_step": 12623, "epoch": 106, "lr": 9.29568156861375e-05} +{"train_loss": 0.008402283303439617, "global_step": 12624, "epoch": 106, "lr": 9.295568186398897e-05} +{"train_loss": 0.007775891572237015, "global_step": 12625, "epoch": 106, "lr": 9.295454795750158e-05} +{"train_loss": 0.009871510788798332, "global_step": 12626, "epoch": 106, "lr": 9.29534139666775e-05} +{"train_loss": 0.011701295152306557, "global_step": 12627, "epoch": 106, "lr": 9.295227989151898e-05} +{"train_loss": 0.006407924462109804, "global_step": 12628, "epoch": 106, "lr": 9.295114573202825e-05} +{"train_loss": 0.008404216729104519, "global_step": 12629, "epoch": 106, "lr": 9.295001148820753e-05} +{"train_loss": 0.009999092668294907, "global_step": 12630, "epoch": 106, "lr": 9.294887716005907e-05} +{"train_loss": 0.004990745335817337, "global_step": 12631, "epoch": 106, "lr": 9.294774274758506e-05} +{"train_loss": 0.007278273347765207, "global_step": 12632, "epoch": 106, "lr": 9.294660825078775e-05} +{"train_loss": 0.008837010711431503, "global_step": 12633, "epoch": 106, "lr": 9.294547366966936e-05} +{"train_loss": 0.011175439693033695, "global_step": 12634, "epoch": 106, "lr": 9.294433900423211e-05} +{"train_loss": 0.005445750895887613, "global_step": 12635, "epoch": 106, "lr": 9.294320425447826e-05} +{"train_loss": 0.010295700281858444, "global_step": 12636, "epoch": 106, "lr": 9.294206942041002e-05} +{"train_loss": 0.009382701478898525, "global_step": 12637, "epoch": 106, "lr": 9.29409345020296e-05} +{"train_loss": 0.007271663285791874, "global_step": 12638, "epoch": 106, "lr": 9.293979949933924e-05} +{"train_loss": 0.005927892401814461, "global_step": 12639, "epoch": 106, "lr": 9.293866441234118e-05} +{"train_loss": 0.010171052068471909, "global_step": 12640, "epoch": 106, "lr": 9.293752924103764e-05} +{"train_loss": 0.007151774130761623, "global_step": 12641, "epoch": 106, "lr": 9.293639398543083e-05} +{"train_loss": 0.009861940518021584, "global_step": 12642, "epoch": 106, "lr": 9.293525864552301e-05} +{"train_loss": 0.006056510377675295, "global_step": 12643, "epoch": 106, "lr": 9.29341232213164e-05} +{"train_loss": 0.006242642179131508, "global_step": 12644, "epoch": 106, "lr": 9.293298771281324e-05} +{"train_loss": 0.006280849222093821, "global_step": 12645, "epoch": 106, "lr": 9.293185212001571e-05} +{"train_loss": 0.010327090509235859, "global_step": 12646, "epoch": 106, "lr": 9.29307164429261e-05} +{"train_loss": 0.0066897994838654995, "global_step": 12647, "epoch": 106, "lr": 9.292958068154662e-05} +{"train_loss": 0.006583547219634056, "global_step": 12648, "epoch": 106, "lr": 9.292844483587948e-05} +{"train_loss": 0.011545096524059772, "global_step": 12649, "epoch": 106, "lr": 9.292730890592693e-05} +{"train_loss": 0.009021207690238953, "global_step": 12650, "epoch": 106, "lr": 9.29261728916912e-05} +{"train_loss": 0.005181103013455868, "global_step": 12651, "epoch": 106, "lr": 9.29250367931745e-05} +{"train_loss": 0.007646655663847923, "global_step": 12652, "epoch": 106, "lr": 9.292390061037908e-05} +{"train_loss": 0.006686854641884565, "global_step": 12653, "epoch": 106, "lr": 9.292276434330718e-05} +{"train_loss": 0.007686927914619446, "global_step": 12654, "epoch": 106, "lr": 9.292162799196102e-05} +{"train_loss": 0.005165329203009605, "global_step": 12655, "epoch": 106, "lr": 9.292049155634281e-05} +{"train_loss": 0.005686548072844744, "global_step": 12656, "epoch": 106, "lr": 9.291935503645481e-05} +{"train_loss": 0.011120353825390339, "global_step": 12657, "epoch": 106, "lr": 9.291821843229925e-05} +{"train_loss": 0.006418545264750719, "global_step": 12658, "epoch": 106, "lr": 9.291708174387834e-05} +{"train_loss": 0.008980452083051205, "global_step": 12659, "epoch": 106, "lr": 9.291594497119434e-05} +{"train_loss": 0.005154794547706842, "global_step": 12660, "epoch": 106, "lr": 9.291480811424944e-05} +{"train_loss": 0.010563484393060207, "global_step": 12661, "epoch": 106, "lr": 9.291367117304593e-05} +{"train_loss": 0.007591282017529011, "global_step": 12662, "epoch": 106, "lr": 9.291253414758598e-05} +{"train_loss": 0.010884283110499382, "global_step": 12663, "epoch": 106, "lr": 9.291139703787188e-05} +{"train_loss": 0.008936445228755474, "global_step": 12664, "epoch": 106, "lr": 9.291025984390582e-05} +{"train_loss": 0.0076454756781458855, "global_step": 12665, "epoch": 106, "lr": 9.290912256569006e-05} +{"train_loss": 0.007216049358248711, "global_step": 12666, "epoch": 106, "lr": 9.290798520322682e-05} +{"train_loss": 0.008848080411553383, "global_step": 12667, "epoch": 106, "lr": 9.290684775651833e-05} +{"train_loss": 0.007955833338201046, "global_step": 12668, "epoch": 106, "lr": 9.290571022556683e-05} +{"train_loss": 0.008087458088994026, "global_step": 12669, "epoch": 106, "lr": 9.290457261037455e-05} +{"train_loss": 0.007244941312819719, "global_step": 12670, "epoch": 106, "lr": 9.290343491094373e-05} +{"train_loss": 0.009355375543236732, "global_step": 12671, "epoch": 106, "lr": 9.29022971272766e-05} +{"train_loss": 0.009361613541841507, "global_step": 12672, "epoch": 106, "lr": 9.290115925937539e-05} +{"train_loss": 0.007506661582738161, "global_step": 12673, "epoch": 106, "lr": 9.290002130724234e-05} +{"train_loss": 0.005170287564396858, "global_step": 12674, "epoch": 106, "lr": 9.289888327087967e-05} +{"train_loss": 0.0054951924830675125, "global_step": 12675, "epoch": 106, "lr": 9.289774515028965e-05} +{"train_loss": 0.007872093468904495, "global_step": 12676, "epoch": 106, "lr": 9.289660694547447e-05} +{"train_loss": 0.008720699697732925, "global_step": 12677, "epoch": 106, "lr": 9.28954686564364e-05} +{"train_loss": 0.013748757541179657, "global_step": 12678, "epoch": 106, "lr": 9.289433028317765e-05} +{"train_loss": 0.00968883465975523, "global_step": 12679, "epoch": 106, "lr": 9.289319182570046e-05} +{"train_loss": 0.008529165759682655, "global_step": 12680, "epoch": 106, "lr": 9.289205328400708e-05} +{"train_loss": 0.010046509094536304, "global_step": 12681, "epoch": 106, "lr": 9.289091465809973e-05} +{"train_loss": 0.008778367191553116, "global_step": 12682, "epoch": 106, "lr": 9.288977594798064e-05} +{"train_loss": 0.006523973774164915, "global_step": 12683, "epoch": 106, "lr": 9.288863715365209e-05} +{"train_loss": 0.009033378213644028, "global_step": 12684, "epoch": 106, "lr": 9.288749827511624e-05} +{"train_loss": 0.007156480569392443, "global_step": 12685, "epoch": 106, "lr": 9.28863593123754e-05} +{"train_loss": 0.009738411754369736, "global_step": 12686, "epoch": 106, "lr": 9.288522026543178e-05} +{"train_loss": 0.00780331389978528, "global_step": 12687, "epoch": 106, "lr": 9.288408113428759e-05} +{"train_loss": 0.0070515782572329044, "global_step": 12688, "epoch": 106, "lr": 9.28829419189451e-05} +{"train_loss": 0.0086748031899333, "global_step": 12689, "epoch": 106, "lr": 9.288180261940653e-05} +{"train_loss": 0.009301269426941872, "global_step": 12690, "epoch": 106, "lr": 9.288066323567412e-05} +{"train_loss": 0.012948820367455482, "global_step": 12691, "epoch": 106, "lr": 9.287952376775011e-05} +{"train_loss": 0.01047271303832531, "global_step": 12692, "epoch": 106, "lr": 9.287838421563674e-05} +{"train_loss": 0.012015107087790966, "global_step": 12693, "epoch": 106, "lr": 9.287724457933625e-05} +{"train_loss": 0.009263204410672188, "global_step": 12694, "epoch": 106, "lr": 9.287610485885086e-05} +{"train_loss": 0.009431513026356697, "global_step": 12695, "epoch": 106, "lr": 9.287496505418281e-05} +{"train_loss": 0.010265539400279522, "global_step": 12696, "epoch": 106, "lr": 9.287382516533437e-05} +{"train_loss": 0.007518486585468054, "global_step": 12697, "epoch": 106, "lr": 9.287268519230775e-05} +{"train_loss": 0.012996540404856205, "global_step": 12698, "epoch": 106, "lr": 9.287154513510517e-05} +{"train_loss": 0.008076999336481094, "global_step": 12699, "epoch": 106, "lr": 9.287040499372893e-05} +{"train_loss": 0.00576024642214179, "global_step": 12700, "epoch": 106, "lr": 9.286926476818118e-05} +{"train_loss": 0.011083987541496754, "global_step": 12701, "epoch": 106, "lr": 9.286812445846425e-05} +{"train_loss": 0.011338978074491024, "global_step": 12702, "epoch": 106, "lr": 9.286698406458033e-05} +{"train_loss": 0.00797357689589262, "global_step": 12703, "epoch": 106, "lr": 9.286584358653166e-05} +{"train_loss": 0.005858549382537603, "global_step": 12704, "epoch": 106, "lr": 9.286470302432046e-05} +{"train_loss": 0.012963549233973026, "global_step": 12705, "epoch": 106, "lr": 9.286356237794903e-05} +{"train_loss": 0.008113650605082512, "global_step": 12706, "epoch": 106, "lr": 9.286242164741957e-05} +{"train_loss": 0.011587531305849552, "global_step": 12707, "epoch": 106, "lr": 9.286128083273431e-05} +{"train_loss": 0.00721721863374114, "global_step": 12708, "epoch": 106, "lr": 9.286013993389551e-05} +{"train_loss": 0.008785880170762539, "global_step": 12709, "epoch": 106, "lr": 9.285899895090542e-05} +{"train_loss": 0.009478701278567314, "global_step": 12710, "epoch": 106, "lr": 9.285785788376625e-05} +{"train_loss": 0.010580231435596943, "global_step": 12711, "epoch": 106, "lr": 9.285671673248026e-05} +{"train_loss": 0.009777260944247246, "global_step": 12712, "epoch": 106, "lr": 9.285557549704969e-05} +{"train_loss": 0.012072879821062088, "global_step": 12713, "epoch": 106, "lr": 9.285443417747676e-05} +{"train_loss": 0.0077667697332799435, "global_step": 12714, "epoch": 106, "lr": 9.285329277376373e-05} +{"train_loss": 0.00974244810640812, "global_step": 12715, "epoch": 106, "lr": 9.285215128591285e-05} +{"train_loss": 0.010401632636785507, "global_step": 12716, "epoch": 106, "lr": 9.285100971392633e-05} +{"train_loss": 0.007463735528290272, "global_step": 12717, "epoch": 106, "lr": 9.284986805780644e-05} +{"train_loss": 0.010010617785155773, "global_step": 12718, "epoch": 106, "lr": 9.284872631755542e-05} +{"train_loss": 0.007822642102837563, "global_step": 12719, "epoch": 106, "lr": 9.28475844931755e-05} +{"train_loss": 0.010422581806778908, "global_step": 12720, "epoch": 106, "lr": 9.284644258466892e-05} +{"train_loss": 0.006115684285759926, "global_step": 12721, "epoch": 106, "lr": 9.284530059203794e-05} +{"train_loss": 0.0097245704382658, "global_step": 12722, "epoch": 106, "lr": 9.284415851528477e-05} +{"train_loss": 0.009464127011597157, "global_step": 12723, "epoch": 106, "lr": 9.284301635441169e-05} +{"train_loss": 0.004577175714075565, "global_step": 12724, "epoch": 106, "lr": 9.28418741094209e-05} +{"train_loss": 0.005377655848860741, "global_step": 12725, "epoch": 106, "lr": 9.284073178031469e-05} +{"train_loss": 0.006733184214681387, "global_step": 12726, "epoch": 106, "lr": 9.283958936709527e-05} +{"train_loss": 0.007830495946109295, "global_step": 12727, "epoch": 106, "lr": 9.28384468697649e-05} +{"train_loss": 0.01296058390289545, "global_step": 12728, "epoch": 106, "lr": 9.283730428832581e-05} +{"train_loss": 0.008786824531853199, "global_step": 12729, "epoch": 106, "lr": 9.283616162278025e-05} +{"train_loss": 0.0076385801658034325, "global_step": 12730, "epoch": 106, "lr": 9.283501887313046e-05} +{"train_loss": 0.006773342378437519, "global_step": 12731, "epoch": 106, "lr": 9.28338760393787e-05} +{"train_loss": 0.008504866035420354, "global_step": 12732, "epoch": 106, "lr": 9.283273312152718e-05, "val_loss": 0.01868065819144249} +{"train_loss": 0.0077911377884447575, "global_step": 12733, "epoch": 107, "lr": 9.283159011957818e-05} +{"train_loss": 0.00731536652892828, "global_step": 12734, "epoch": 107, "lr": 9.283044703353393e-05} +{"train_loss": 0.008970912545919418, "global_step": 12735, "epoch": 107, "lr": 9.282930386339667e-05} +{"train_loss": 0.007629381958395243, "global_step": 12736, "epoch": 107, "lr": 9.282816060916865e-05} +{"train_loss": 0.01059369184076786, "global_step": 12737, "epoch": 107, "lr": 9.28270172708521e-05} +{"train_loss": 0.007149725221097469, "global_step": 12738, "epoch": 107, "lr": 9.28258738484493e-05} +{"train_loss": 0.008171589113771915, "global_step": 12739, "epoch": 107, "lr": 9.282473034196244e-05} +{"train_loss": 0.009129662998020649, "global_step": 12740, "epoch": 107, "lr": 9.282358675139383e-05} +{"train_loss": 0.01016236376017332, "global_step": 12741, "epoch": 107, "lr": 9.282244307674566e-05} +{"train_loss": 0.009056124836206436, "global_step": 12742, "epoch": 107, "lr": 9.28212993180202e-05} +{"train_loss": 0.009547505527734756, "global_step": 12743, "epoch": 107, "lr": 9.282015547521969e-05} +{"train_loss": 0.005937066860496998, "global_step": 12744, "epoch": 107, "lr": 9.28190115483464e-05} +{"train_loss": 0.008483869954943657, "global_step": 12745, "epoch": 107, "lr": 9.281786753740254e-05} +{"train_loss": 0.0082489512860775, "global_step": 12746, "epoch": 107, "lr": 9.281672344239037e-05} +{"train_loss": 0.00699445977807045, "global_step": 12747, "epoch": 107, "lr": 9.281557926331215e-05} +{"train_loss": 0.007111841347068548, "global_step": 12748, "epoch": 107, "lr": 9.28144350001701e-05} +{"train_loss": 0.006799656897783279, "global_step": 12749, "epoch": 107, "lr": 9.281329065296649e-05} +{"train_loss": 0.008698311634361744, "global_step": 12750, "epoch": 107, "lr": 9.281214622170356e-05} +{"train_loss": 0.006792036816477776, "global_step": 12751, "epoch": 107, "lr": 9.281100170638355e-05} +{"train_loss": 0.005457785911858082, "global_step": 12752, "epoch": 107, "lr": 9.28098571070087e-05} +{"train_loss": 0.006087662186473608, "global_step": 12753, "epoch": 107, "lr": 9.280871242358129e-05} +{"train_loss": 0.009356743656098843, "global_step": 12754, "epoch": 107, "lr": 9.280756765610353e-05} +{"train_loss": 0.006536825560033321, "global_step": 12755, "epoch": 107, "lr": 9.280642280457769e-05} +{"train_loss": 0.0059169684536755085, "global_step": 12756, "epoch": 107, "lr": 9.280527786900602e-05} +{"train_loss": 0.00598300714045763, "global_step": 12757, "epoch": 107, "lr": 9.280413284939075e-05} +{"train_loss": 0.005705217830836773, "global_step": 12758, "epoch": 107, "lr": 9.280298774573415e-05} +{"train_loss": 0.007221676409244537, "global_step": 12759, "epoch": 107, "lr": 9.280184255803844e-05} +{"train_loss": 0.007346693892031908, "global_step": 12760, "epoch": 107, "lr": 9.280069728630589e-05} +{"train_loss": 0.008775434456765652, "global_step": 12761, "epoch": 107, "lr": 9.279955193053875e-05} +{"train_loss": 0.006597933359444141, "global_step": 12762, "epoch": 107, "lr": 9.279840649073925e-05} +{"train_loss": 0.0074440063908696175, "global_step": 12763, "epoch": 107, "lr": 9.279726096690968e-05} +{"train_loss": 0.00805831141769886, "global_step": 12764, "epoch": 107, "lr": 9.279611535905224e-05} +{"train_loss": 0.006758199539035559, "global_step": 12765, "epoch": 107, "lr": 9.279496966716918e-05} +{"train_loss": 0.00983927957713604, "global_step": 12766, "epoch": 107, "lr": 9.27938238912628e-05} +{"train_loss": 0.004558016546070576, "global_step": 12767, "epoch": 107, "lr": 9.279267803133532e-05} +{"train_loss": 0.003271349472925067, "global_step": 12768, "epoch": 107, "lr": 9.279153208738896e-05} +{"train_loss": 0.005674309097230434, "global_step": 12769, "epoch": 107, "lr": 9.279038605942602e-05} +{"train_loss": 0.00647819833829999, "global_step": 12770, "epoch": 107, "lr": 9.278923994744872e-05} +{"train_loss": 0.005932671017944813, "global_step": 12771, "epoch": 107, "lr": 9.278809375145932e-05} +{"train_loss": 0.010657289065420628, "global_step": 12772, "epoch": 107, "lr": 9.278694747146007e-05} +{"train_loss": 0.005647966638207436, "global_step": 12773, "epoch": 107, "lr": 9.278580110745322e-05} +{"train_loss": 0.005674298387020826, "global_step": 12774, "epoch": 107, "lr": 9.278465465944102e-05} +{"train_loss": 0.004866695497184992, "global_step": 12775, "epoch": 107, "lr": 9.278350812742572e-05} +{"train_loss": 0.008143603801727295, "global_step": 12776, "epoch": 107, "lr": 9.278236151140957e-05} +{"train_loss": 0.0068246107548475266, "global_step": 12777, "epoch": 107, "lr": 9.278121481139483e-05} +{"train_loss": 0.005879717413336039, "global_step": 12778, "epoch": 107, "lr": 9.278006802738375e-05} +{"train_loss": 0.005702781956642866, "global_step": 12779, "epoch": 107, "lr": 9.277892115937856e-05} +{"train_loss": 0.009019752033054829, "global_step": 12780, "epoch": 107, "lr": 9.277777420738154e-05} +{"train_loss": 0.007660963106900454, "global_step": 12781, "epoch": 107, "lr": 9.277662717139494e-05} +{"train_loss": 0.010171081870794296, "global_step": 12782, "epoch": 107, "lr": 9.277548005142098e-05} +{"train_loss": 0.003319324692711234, "global_step": 12783, "epoch": 107, "lr": 9.277433284746196e-05} +{"train_loss": 0.006243147887289524, "global_step": 12784, "epoch": 107, "lr": 9.277318555952008e-05} +{"train_loss": 0.007248864043504, "global_step": 12785, "epoch": 107, "lr": 9.277203818759764e-05} +{"train_loss": 0.011037727817893028, "global_step": 12786, "epoch": 107, "lr": 9.277089073169686e-05} +{"train_loss": 0.005776621866971254, "global_step": 12787, "epoch": 107, "lr": 9.276974319182001e-05} +{"train_loss": 0.0066025136038661, "global_step": 12788, "epoch": 107, "lr": 9.276859556796935e-05} +{"train_loss": 0.010101044550538063, "global_step": 12789, "epoch": 107, "lr": 9.276744786014712e-05} +{"train_loss": 0.006724114529788494, "global_step": 12790, "epoch": 107, "lr": 9.276630006835557e-05} +{"train_loss": 0.005621077958494425, "global_step": 12791, "epoch": 107, "lr": 9.276515219259696e-05} +{"train_loss": 0.006169226951897144, "global_step": 12792, "epoch": 107, "lr": 9.276400423287353e-05} +{"train_loss": 0.007387679535895586, "global_step": 12793, "epoch": 107, "lr": 9.276285618918756e-05} +{"train_loss": 0.006665962282568216, "global_step": 12794, "epoch": 107, "lr": 9.276170806154127e-05} +{"train_loss": 0.009423492476344109, "global_step": 12795, "epoch": 107, "lr": 9.276055984993696e-05} +{"train_loss": 0.006179385352879763, "global_step": 12796, "epoch": 107, "lr": 9.275941155437684e-05} +{"train_loss": 0.009287072345614433, "global_step": 12797, "epoch": 107, "lr": 9.27582631748632e-05} +{"train_loss": 0.009229532442986965, "global_step": 12798, "epoch": 107, "lr": 9.275711471139828e-05} +{"train_loss": 0.007719387300312519, "global_step": 12799, "epoch": 107, "lr": 9.275596616398431e-05} +{"train_loss": 0.007894898764789104, "global_step": 12800, "epoch": 107, "lr": 9.275481753262359e-05} +{"train_loss": 0.00451500341296196, "global_step": 12801, "epoch": 107, "lr": 9.275366881731834e-05} +{"train_loss": 0.006144858431071043, "global_step": 12802, "epoch": 107, "lr": 9.275252001807084e-05} +{"train_loss": 0.009776716120541096, "global_step": 12803, "epoch": 107, "lr": 9.275137113488333e-05} +{"train_loss": 0.007177190389484167, "global_step": 12804, "epoch": 107, "lr": 9.275022216775806e-05} +{"train_loss": 0.007781656924635172, "global_step": 12805, "epoch": 107, "lr": 9.274907311669731e-05} +{"train_loss": 0.013838602229952812, "global_step": 12806, "epoch": 107, "lr": 9.274792398170331e-05} +{"train_loss": 0.005287563428282738, "global_step": 12807, "epoch": 107, "lr": 9.274677476277833e-05} +{"train_loss": 0.005084655247628689, "global_step": 12808, "epoch": 107, "lr": 9.274562545992465e-05} +{"train_loss": 0.007609604857861996, "global_step": 12809, "epoch": 107, "lr": 9.274447607314447e-05} +{"train_loss": 0.010204367339611053, "global_step": 12810, "epoch": 107, "lr": 9.27433266024401e-05} +{"train_loss": 0.01003243587911129, "global_step": 12811, "epoch": 107, "lr": 9.274217704781375e-05} +{"train_loss": 0.006600084714591503, "global_step": 12812, "epoch": 107, "lr": 9.274102740926771e-05} +{"train_loss": 0.010167819447815418, "global_step": 12813, "epoch": 107, "lr": 9.273987768680424e-05} +{"train_loss": 0.008893854916095734, "global_step": 12814, "epoch": 107, "lr": 9.273872788042558e-05} +{"train_loss": 0.0064680809155106544, "global_step": 12815, "epoch": 107, "lr": 9.273757799013399e-05} +{"train_loss": 0.010338830761611462, "global_step": 12816, "epoch": 107, "lr": 9.273642801593174e-05} +{"train_loss": 0.010957552120089531, "global_step": 12817, "epoch": 107, "lr": 9.273527795782108e-05} +{"train_loss": 0.010359169915318489, "global_step": 12818, "epoch": 107, "lr": 9.273412781580426e-05} +{"train_loss": 0.010569197125732899, "global_step": 12819, "epoch": 107, "lr": 9.273297758988355e-05} +{"train_loss": 0.009621410630643368, "global_step": 12820, "epoch": 107, "lr": 9.27318272800612e-05} +{"train_loss": 0.007689842954277992, "global_step": 12821, "epoch": 107, "lr": 9.273067688633947e-05} +{"train_loss": 0.010993621312081814, "global_step": 12822, "epoch": 107, "lr": 9.272952640872062e-05} +{"train_loss": 0.005064812488853931, "global_step": 12823, "epoch": 107, "lr": 9.272837584720692e-05} +{"train_loss": 0.0068986183032393456, "global_step": 12824, "epoch": 107, "lr": 9.272722520180062e-05} +{"train_loss": 0.008883319795131683, "global_step": 12825, "epoch": 107, "lr": 9.272607447250396e-05} +{"train_loss": 0.006709726992994547, "global_step": 12826, "epoch": 107, "lr": 9.272492365931922e-05} +{"train_loss": 0.009852061048150063, "global_step": 12827, "epoch": 107, "lr": 9.272377276224868e-05} +{"train_loss": 0.005500858649611473, "global_step": 12828, "epoch": 107, "lr": 9.272262178129457e-05} +{"train_loss": 0.008558896370232105, "global_step": 12829, "epoch": 107, "lr": 9.272147071645913e-05} +{"train_loss": 0.013855119235813618, "global_step": 12830, "epoch": 107, "lr": 9.272031956774467e-05} +{"train_loss": 0.007253085728734732, "global_step": 12831, "epoch": 107, "lr": 9.271916833515341e-05} +{"train_loss": 0.007402745075523853, "global_step": 12832, "epoch": 107, "lr": 9.271801701868765e-05} +{"train_loss": 0.008044714108109474, "global_step": 12833, "epoch": 107, "lr": 9.271686561834962e-05} +{"train_loss": 0.011130995117127895, "global_step": 12834, "epoch": 107, "lr": 9.271571413414157e-05} +{"train_loss": 0.006002573296427727, "global_step": 12835, "epoch": 107, "lr": 9.271456256606581e-05} +{"train_loss": 0.006213176529854536, "global_step": 12836, "epoch": 107, "lr": 9.271341091412455e-05} +{"train_loss": 0.008314257487654686, "global_step": 12837, "epoch": 107, "lr": 9.271225917832007e-05} +{"train_loss": 0.005958771798759699, "global_step": 12838, "epoch": 107, "lr": 9.271110735865464e-05} +{"train_loss": 0.009517921134829521, "global_step": 12839, "epoch": 107, "lr": 9.270995545513051e-05} +{"train_loss": 0.00678025558590889, "global_step": 12840, "epoch": 107, "lr": 9.270880346774994e-05} +{"train_loss": 0.006456826813519001, "global_step": 12841, "epoch": 107, "lr": 9.270765139651521e-05} +{"train_loss": 0.00614811759442091, "global_step": 12842, "epoch": 107, "lr": 9.270649924142856e-05} +{"train_loss": 0.007866926491260529, "global_step": 12843, "epoch": 107, "lr": 9.270534700249225e-05} +{"train_loss": 0.008146453648805618, "global_step": 12844, "epoch": 107, "lr": 9.270419467970856e-05} +{"train_loss": 0.00947139598429203, "global_step": 12845, "epoch": 107, "lr": 9.270304227307975e-05} +{"train_loss": 0.0112947141751647, "global_step": 12846, "epoch": 107, "lr": 9.27018897826081e-05} +{"train_loss": 0.00915270671248436, "global_step": 12847, "epoch": 107, "lr": 9.270073720829582e-05} +{"train_loss": 0.010241356678307056, "global_step": 12848, "epoch": 107, "lr": 9.269958455014523e-05} +{"train_loss": 0.008614818565547466, "global_step": 12849, "epoch": 107, "lr": 9.269843180815854e-05} +{"train_loss": 0.009319600649178028, "global_step": 12850, "epoch": 107, "lr": 9.269727898233807e-05} +{"train_loss": 0.007777603065297634, "global_step": 12851, "epoch": 107, "lr": 9.269612607268603e-05, "val_loss": 0.017819130793213844} +{"train_loss": 0.007890917360782623, "global_step": 12852, "epoch": 108, "lr": 9.269497307920471e-05} +{"train_loss": 0.013407571241259575, "global_step": 12853, "epoch": 108, "lr": 9.269382000189638e-05} +{"train_loss": 0.00612229248508811, "global_step": 12854, "epoch": 108, "lr": 9.26926668407633e-05} +{"train_loss": 0.007938719354569912, "global_step": 12855, "epoch": 108, "lr": 9.269151359580773e-05} +{"train_loss": 0.008110602386295795, "global_step": 12856, "epoch": 108, "lr": 9.269036026703191e-05} +{"train_loss": 0.007757630664855242, "global_step": 12857, "epoch": 108, "lr": 9.268920685443815e-05} +{"train_loss": 0.007053495850414038, "global_step": 12858, "epoch": 108, "lr": 9.268805335802868e-05} +{"train_loss": 0.007586326450109482, "global_step": 12859, "epoch": 108, "lr": 9.26868997778058e-05} +{"train_loss": 0.009564921259880066, "global_step": 12860, "epoch": 108, "lr": 9.268574611377174e-05} +{"train_loss": 0.0059014903381466866, "global_step": 12861, "epoch": 108, "lr": 9.268459236592877e-05} +{"train_loss": 0.01013832539319992, "global_step": 12862, "epoch": 108, "lr": 9.268343853427917e-05} +{"train_loss": 0.007851338014006615, "global_step": 12863, "epoch": 108, "lr": 9.26822846188252e-05} +{"train_loss": 0.008023224771022797, "global_step": 12864, "epoch": 108, "lr": 9.268113061956913e-05} +{"train_loss": 0.00889318622648716, "global_step": 12865, "epoch": 108, "lr": 9.267997653651322e-05} +{"train_loss": 0.0070296721532940865, "global_step": 12866, "epoch": 108, "lr": 9.267882236965972e-05} +{"train_loss": 0.009043482132256031, "global_step": 12867, "epoch": 108, "lr": 9.26776681190109e-05} +{"train_loss": 0.010481292381882668, "global_step": 12868, "epoch": 108, "lr": 9.267651378456908e-05} +{"train_loss": 0.007557575590908527, "global_step": 12869, "epoch": 108, "lr": 9.267535936633646e-05} +{"train_loss": 0.0066852448508143425, "global_step": 12870, "epoch": 108, "lr": 9.267420486431533e-05} +{"train_loss": 0.0038843315560370684, "global_step": 12871, "epoch": 108, "lr": 9.267305027850797e-05} +{"train_loss": 0.007342172786593437, "global_step": 12872, "epoch": 108, "lr": 9.267189560891663e-05} +{"train_loss": 0.00714921485632658, "global_step": 12873, "epoch": 108, "lr": 9.267074085554357e-05} +{"train_loss": 0.0076196216978132725, "global_step": 12874, "epoch": 108, "lr": 9.266958601839107e-05} +{"train_loss": 0.007723168935626745, "global_step": 12875, "epoch": 108, "lr": 9.266843109746141e-05} +{"train_loss": 0.0056114355102181435, "global_step": 12876, "epoch": 108, "lr": 9.266727609275684e-05} +{"train_loss": 0.007874153554439545, "global_step": 12877, "epoch": 108, "lr": 9.266612100427963e-05} +{"train_loss": 0.008053208701312542, "global_step": 12878, "epoch": 108, "lr": 9.266496583203205e-05} +{"train_loss": 0.005374449770897627, "global_step": 12879, "epoch": 108, "lr": 9.266381057601636e-05} +{"train_loss": 0.007983560673892498, "global_step": 12880, "epoch": 108, "lr": 9.266265523623485e-05} +{"train_loss": 0.008758395910263062, "global_step": 12881, "epoch": 108, "lr": 9.266149981268977e-05} +{"train_loss": 0.00825907289981842, "global_step": 12882, "epoch": 108, "lr": 9.266034430538337e-05} +{"train_loss": 0.008292767219245434, "global_step": 12883, "epoch": 108, "lr": 9.265918871431797e-05} +{"train_loss": 0.005497257690876722, "global_step": 12884, "epoch": 108, "lr": 9.26580330394958e-05} +{"train_loss": 0.006373521871864796, "global_step": 12885, "epoch": 108, "lr": 9.265687728091914e-05} +{"train_loss": 0.0062728566117584705, "global_step": 12886, "epoch": 108, "lr": 9.265572143859026e-05} +{"train_loss": 0.007953009568154812, "global_step": 12887, "epoch": 108, "lr": 9.265456551251144e-05} +{"train_loss": 0.009091045707464218, "global_step": 12888, "epoch": 108, "lr": 9.265340950268492e-05} +{"train_loss": 0.008176886476576328, "global_step": 12889, "epoch": 108, "lr": 9.265225340911298e-05} +{"train_loss": 0.00922703742980957, "global_step": 12890, "epoch": 108, "lr": 9.265109723179792e-05} +{"train_loss": 0.005268947221338749, "global_step": 12891, "epoch": 108, "lr": 9.264994097074197e-05} +{"train_loss": 0.006605548318475485, "global_step": 12892, "epoch": 108, "lr": 9.264878462594744e-05} +{"train_loss": 0.010226810351014137, "global_step": 12893, "epoch": 108, "lr": 9.264762819741655e-05} +{"train_loss": 0.008561093360185623, "global_step": 12894, "epoch": 108, "lr": 9.264647168515161e-05} +{"train_loss": 0.0042105200700461864, "global_step": 12895, "epoch": 108, "lr": 9.264531508915489e-05} +{"train_loss": 0.00635677482932806, "global_step": 12896, "epoch": 108, "lr": 9.264415840942864e-05} +{"train_loss": 0.008772585541009903, "global_step": 12897, "epoch": 108, "lr": 9.264300164597512e-05} +{"train_loss": 0.008669308386743069, "global_step": 12898, "epoch": 108, "lr": 9.264184479879666e-05} +{"train_loss": 0.0063604386523365974, "global_step": 12899, "epoch": 108, "lr": 9.264068786789546e-05} +{"train_loss": 0.00797573383897543, "global_step": 12900, "epoch": 108, "lr": 9.263953085327385e-05} +{"train_loss": 0.007969949394464493, "global_step": 12901, "epoch": 108, "lr": 9.263837375493407e-05} +{"train_loss": 0.006013468373566866, "global_step": 12902, "epoch": 108, "lr": 9.263721657287838e-05} +{"train_loss": 0.006865854375064373, "global_step": 12903, "epoch": 108, "lr": 9.263605930710911e-05} +{"train_loss": 0.007765915244817734, "global_step": 12904, "epoch": 108, "lr": 9.263490195762845e-05} +{"train_loss": 0.010882744565606117, "global_step": 12905, "epoch": 108, "lr": 9.263374452443874e-05} +{"train_loss": 0.007732418365776539, "global_step": 12906, "epoch": 108, "lr": 9.263258700754221e-05} +{"train_loss": 0.006492623593658209, "global_step": 12907, "epoch": 108, "lr": 9.263142940694116e-05} +{"train_loss": 0.008340119384229183, "global_step": 12908, "epoch": 108, "lr": 9.263027172263785e-05} +{"train_loss": 0.009313779883086681, "global_step": 12909, "epoch": 108, "lr": 9.262911395463456e-05} +{"train_loss": 0.004966801032423973, "global_step": 12910, "epoch": 108, "lr": 9.262795610293357e-05} +{"train_loss": 0.010085088200867176, "global_step": 12911, "epoch": 108, "lr": 9.262679816753713e-05} +{"train_loss": 0.009584089741110802, "global_step": 12912, "epoch": 108, "lr": 9.262564014844752e-05} +{"train_loss": 0.006343496032059193, "global_step": 12913, "epoch": 108, "lr": 9.262448204566703e-05} +{"train_loss": 0.0051887729205191135, "global_step": 12914, "epoch": 108, "lr": 9.262332385919792e-05} +{"train_loss": 0.0060095274820923805, "global_step": 12915, "epoch": 108, "lr": 9.262216558904246e-05} +{"train_loss": 0.006162482313811779, "global_step": 12916, "epoch": 108, "lr": 9.262100723520294e-05} +{"train_loss": 0.0073959194123744965, "global_step": 12917, "epoch": 108, "lr": 9.261984879768162e-05} +{"train_loss": 0.007403048686683178, "global_step": 12918, "epoch": 108, "lr": 9.261869027648078e-05} +{"train_loss": 0.010080069303512573, "global_step": 12919, "epoch": 108, "lr": 9.261753167160271e-05} +{"train_loss": 0.009379113093018532, "global_step": 12920, "epoch": 108, "lr": 9.261637298304966e-05} +{"train_loss": 0.006977160461246967, "global_step": 12921, "epoch": 108, "lr": 9.26152142108239e-05} +{"train_loss": 0.003831523470580578, "global_step": 12922, "epoch": 108, "lr": 9.261405535492773e-05} +{"train_loss": 0.010494477115571499, "global_step": 12923, "epoch": 108, "lr": 9.261289641536342e-05} +{"train_loss": 0.00847575068473816, "global_step": 12924, "epoch": 108, "lr": 9.261173739213325e-05} +{"train_loss": 0.007368811871856451, "global_step": 12925, "epoch": 108, "lr": 9.261057828523947e-05} +{"train_loss": 0.004863780923187733, "global_step": 12926, "epoch": 108, "lr": 9.260941909468437e-05} +{"train_loss": 0.008631289005279541, "global_step": 12927, "epoch": 108, "lr": 9.260825982047024e-05} +{"train_loss": 0.00456143356859684, "global_step": 12928, "epoch": 108, "lr": 9.260710046259933e-05} +{"train_loss": 0.008040538057684898, "global_step": 12929, "epoch": 108, "lr": 9.260594102107394e-05} +{"train_loss": 0.007821409963071346, "global_step": 12930, "epoch": 108, "lr": 9.260478149589633e-05} +{"train_loss": 0.009370128624141216, "global_step": 12931, "epoch": 108, "lr": 9.260362188706879e-05} +{"train_loss": 0.007325177080929279, "global_step": 12932, "epoch": 108, "lr": 9.260246219459358e-05} +{"train_loss": 0.007828895002603531, "global_step": 12933, "epoch": 108, "lr": 9.260130241847298e-05} +{"train_loss": 0.007789443247020245, "global_step": 12934, "epoch": 108, "lr": 9.26001425587093e-05} +{"train_loss": 0.0072715976275503635, "global_step": 12935, "epoch": 108, "lr": 9.259898261530478e-05} +{"train_loss": 0.009683105163276196, "global_step": 12936, "epoch": 108, "lr": 9.25978225882617e-05} +{"train_loss": 0.007464731577783823, "global_step": 12937, "epoch": 108, "lr": 9.259666247758236e-05} +{"train_loss": 0.008032109588384628, "global_step": 12938, "epoch": 108, "lr": 9.259550228326902e-05} +{"train_loss": 0.012363645248115063, "global_step": 12939, "epoch": 108, "lr": 9.259434200532395e-05} +{"train_loss": 0.007232496049255133, "global_step": 12940, "epoch": 108, "lr": 9.259318164374947e-05} +{"train_loss": 0.006379056256264448, "global_step": 12941, "epoch": 108, "lr": 9.25920211985478e-05} +{"train_loss": 0.005437552463263273, "global_step": 12942, "epoch": 108, "lr": 9.259086066972125e-05} +{"train_loss": 0.005783468950539827, "global_step": 12943, "epoch": 108, "lr": 9.25897000572721e-05} +{"train_loss": 0.007483256049454212, "global_step": 12944, "epoch": 108, "lr": 9.258853936120262e-05} +{"train_loss": 0.006400565151125193, "global_step": 12945, "epoch": 108, "lr": 9.25873785815151e-05} +{"train_loss": 0.006570881698280573, "global_step": 12946, "epoch": 108, "lr": 9.258621771821181e-05} +{"train_loss": 0.011777038685977459, "global_step": 12947, "epoch": 108, "lr": 9.258505677129503e-05} +{"train_loss": 0.007132349070161581, "global_step": 12948, "epoch": 108, "lr": 9.258389574076703e-05} +{"train_loss": 0.007028727326542139, "global_step": 12949, "epoch": 108, "lr": 9.258273462663012e-05} +{"train_loss": 0.009150448255240917, "global_step": 12950, "epoch": 108, "lr": 9.258157342888654e-05} +{"train_loss": 0.00887919869273901, "global_step": 12951, "epoch": 108, "lr": 9.25804121475386e-05} +{"train_loss": 0.005252600181847811, "global_step": 12952, "epoch": 108, "lr": 9.257925078258858e-05} +{"train_loss": 0.007771284785121679, "global_step": 12953, "epoch": 108, "lr": 9.257808933403874e-05} +{"train_loss": 0.007997134700417519, "global_step": 12954, "epoch": 108, "lr": 9.257692780189136e-05} +{"train_loss": 0.008439603261649609, "global_step": 12955, "epoch": 108, "lr": 9.257576618614875e-05} +{"train_loss": 0.004201756324619055, "global_step": 12956, "epoch": 108, "lr": 9.257460448681316e-05} +{"train_loss": 0.00922825001180172, "global_step": 12957, "epoch": 108, "lr": 9.257344270388688e-05} +{"train_loss": 0.006754573434591293, "global_step": 12958, "epoch": 108, "lr": 9.257228083737219e-05} +{"train_loss": 0.0075384178198874, "global_step": 12959, "epoch": 108, "lr": 9.257111888727138e-05} +{"train_loss": 0.009586228989064693, "global_step": 12960, "epoch": 108, "lr": 9.256995685358675e-05} +{"train_loss": 0.009859347715973854, "global_step": 12961, "epoch": 108, "lr": 9.256879473632055e-05} +{"train_loss": 0.006640540435910225, "global_step": 12962, "epoch": 108, "lr": 9.256763253547504e-05} +{"train_loss": 0.0064326124265789986, "global_step": 12963, "epoch": 108, "lr": 9.256647025105254e-05} +{"train_loss": 0.005301120225340128, "global_step": 12964, "epoch": 108, "lr": 9.256530788305533e-05} +{"train_loss": 0.003879135474562645, "global_step": 12965, "epoch": 108, "lr": 9.256414543148569e-05} +{"train_loss": 0.008566920645534992, "global_step": 12966, "epoch": 108, "lr": 9.256298289634591e-05} +{"train_loss": 0.0065711443312466145, "global_step": 12967, "epoch": 108, "lr": 9.256182027763824e-05} +{"train_loss": 0.008100243285298347, "global_step": 12968, "epoch": 108, "lr": 9.256065757536499e-05} +{"train_loss": 0.005058556795120239, "global_step": 12969, "epoch": 108, "lr": 9.255949478952842e-05} +{"train_loss": 0.007573336642626829, "global_step": 12970, "epoch": 108, "lr": 9.255833192013084e-05, "val_loss": 0.021099936217069626} +{"train_loss": 0.008623254485428333, "global_step": 12971, "epoch": 109, "lr": 9.255716896717452e-05} +{"train_loss": 0.009024632163345814, "global_step": 12972, "epoch": 109, "lr": 9.255600593066176e-05} +{"train_loss": 0.008075174875557423, "global_step": 12973, "epoch": 109, "lr": 9.255484281059481e-05} +{"train_loss": 0.007059227675199509, "global_step": 12974, "epoch": 109, "lr": 9.255367960697598e-05} +{"train_loss": 0.006538087967783213, "global_step": 12975, "epoch": 109, "lr": 9.255251631980755e-05} +{"train_loss": 0.006787004414945841, "global_step": 12976, "epoch": 109, "lr": 9.25513529490918e-05} +{"train_loss": 0.004613752476871014, "global_step": 12977, "epoch": 109, "lr": 9.255018949483101e-05} +{"train_loss": 0.012538821436464787, "global_step": 12978, "epoch": 109, "lr": 9.254902595702747e-05} +{"train_loss": 0.009224451147019863, "global_step": 12979, "epoch": 109, "lr": 9.254786233568347e-05} +{"train_loss": 0.007253990042954683, "global_step": 12980, "epoch": 109, "lr": 9.254669863080127e-05} +{"train_loss": 0.008543243631720543, "global_step": 12981, "epoch": 109, "lr": 9.254553484238318e-05} +{"train_loss": 0.009052074514329433, "global_step": 12982, "epoch": 109, "lr": 9.25443709704315e-05} +{"train_loss": 0.005375484470278025, "global_step": 12983, "epoch": 109, "lr": 9.254320701494846e-05} +{"train_loss": 0.006874594837427139, "global_step": 12984, "epoch": 109, "lr": 9.25420429759364e-05} +{"train_loss": 0.006967509631067514, "global_step": 12985, "epoch": 109, "lr": 9.254087885339757e-05} +{"train_loss": 0.004858748521655798, "global_step": 12986, "epoch": 109, "lr": 9.253971464733429e-05} +{"train_loss": 0.010726405307650566, "global_step": 12987, "epoch": 109, "lr": 9.25385503577488e-05} +{"train_loss": 0.01123883482068777, "global_step": 12988, "epoch": 109, "lr": 9.253738598464342e-05} +{"train_loss": 0.006054945755749941, "global_step": 12989, "epoch": 109, "lr": 9.253622152802042e-05} +{"train_loss": 0.0060698846355080605, "global_step": 12990, "epoch": 109, "lr": 9.253505698788211e-05} +{"train_loss": 0.007337130606174469, "global_step": 12991, "epoch": 109, "lr": 9.253389236423076e-05} +{"train_loss": 0.011610204353928566, "global_step": 12992, "epoch": 109, "lr": 9.253272765706863e-05} +{"train_loss": 0.008759330958127975, "global_step": 12993, "epoch": 109, "lr": 9.253156286639806e-05} +{"train_loss": 0.008773363195359707, "global_step": 12994, "epoch": 109, "lr": 9.25303979922213e-05} +{"train_loss": 0.006953722797334194, "global_step": 12995, "epoch": 109, "lr": 9.252923303454065e-05} +{"train_loss": 0.006475542671978474, "global_step": 12996, "epoch": 109, "lr": 9.25280679933584e-05} +{"train_loss": 0.008478865027427673, "global_step": 12997, "epoch": 109, "lr": 9.252690286867682e-05} +{"train_loss": 0.007869970984756947, "global_step": 12998, "epoch": 109, "lr": 9.252573766049821e-05} +{"train_loss": 0.0060039362870156765, "global_step": 12999, "epoch": 109, "lr": 9.252457236882486e-05} +{"train_loss": 0.007010126952081919, "global_step": 13000, "epoch": 109, "lr": 9.252340699365907e-05} +{"train_loss": 0.011556633748114109, "global_step": 13001, "epoch": 109, "lr": 9.252224153500309e-05} +{"train_loss": 0.006408468820154667, "global_step": 13002, "epoch": 109, "lr": 9.252107599285924e-05} +{"train_loss": 0.0086141899228096, "global_step": 13003, "epoch": 109, "lr": 9.25199103672298e-05} +{"train_loss": 0.005834808573126793, "global_step": 13004, "epoch": 109, "lr": 9.251874465811707e-05} +{"train_loss": 0.005977058317512274, "global_step": 13005, "epoch": 109, "lr": 9.251757886552331e-05} +{"train_loss": 0.008269603364169598, "global_step": 13006, "epoch": 109, "lr": 9.251641298945084e-05} +{"train_loss": 0.010316974483430386, "global_step": 13007, "epoch": 109, "lr": 9.251524702990194e-05} +{"train_loss": 0.00483778677880764, "global_step": 13008, "epoch": 109, "lr": 9.251408098687887e-05} +{"train_loss": 0.009656486101448536, "global_step": 13009, "epoch": 109, "lr": 9.251291486038395e-05} +{"train_loss": 0.00742611289024353, "global_step": 13010, "epoch": 109, "lr": 9.251174865041949e-05} +{"train_loss": 0.006600638385862112, "global_step": 13011, "epoch": 109, "lr": 9.251058235698773e-05} +{"train_loss": 0.007562311831861734, "global_step": 13012, "epoch": 109, "lr": 9.250941598009097e-05} +{"train_loss": 0.007750235497951508, "global_step": 13013, "epoch": 109, "lr": 9.250824951973154e-05} +{"train_loss": 0.006007781717926264, "global_step": 13014, "epoch": 109, "lr": 9.250708297591169e-05} +{"train_loss": 0.00902688130736351, "global_step": 13015, "epoch": 109, "lr": 9.250591634863374e-05} +{"train_loss": 0.006636567879468203, "global_step": 13016, "epoch": 109, "lr": 9.250474963789994e-05} +{"train_loss": 0.007122001610696316, "global_step": 13017, "epoch": 109, "lr": 9.250358284371263e-05} +{"train_loss": 0.006619835738092661, "global_step": 13018, "epoch": 109, "lr": 9.250241596607405e-05} +{"train_loss": 0.007035570684820414, "global_step": 13019, "epoch": 109, "lr": 9.250124900498654e-05} +{"train_loss": 0.010780534707009792, "global_step": 13020, "epoch": 109, "lr": 9.250008196045235e-05} +{"train_loss": 0.014039082452654839, "global_step": 13021, "epoch": 109, "lr": 9.249891483247381e-05} +{"train_loss": 0.006619705352932215, "global_step": 13022, "epoch": 109, "lr": 9.249774762105318e-05} +{"train_loss": 0.004832352511584759, "global_step": 13023, "epoch": 109, "lr": 9.249658032619274e-05} +{"train_loss": 0.009543085470795631, "global_step": 13024, "epoch": 109, "lr": 9.249541294789485e-05} +{"train_loss": 0.013660441152751446, "global_step": 13025, "epoch": 109, "lr": 9.249424548616173e-05} +{"train_loss": 0.007216482423245907, "global_step": 13026, "epoch": 109, "lr": 9.24930779409957e-05} +{"train_loss": 0.008153458125889301, "global_step": 13027, "epoch": 109, "lr": 9.249191031239906e-05} +{"train_loss": 0.00794182624667883, "global_step": 13028, "epoch": 109, "lr": 9.249074260037407e-05} +{"train_loss": 0.011538582853972912, "global_step": 13029, "epoch": 109, "lr": 9.248957480492306e-05} +{"train_loss": 0.007558208890259266, "global_step": 13030, "epoch": 109, "lr": 9.248840692604832e-05} +{"train_loss": 0.009635498747229576, "global_step": 13031, "epoch": 109, "lr": 9.248723896375213e-05} +{"train_loss": 0.010296217165887356, "global_step": 13032, "epoch": 109, "lr": 9.248607091803678e-05} +{"train_loss": 0.00668833963572979, "global_step": 13033, "epoch": 109, "lr": 9.248490278890456e-05} +{"train_loss": 0.00801666546612978, "global_step": 13034, "epoch": 109, "lr": 9.248373457635779e-05} +{"train_loss": 0.0053121899254620075, "global_step": 13035, "epoch": 109, "lr": 9.248256628039873e-05} +{"train_loss": 0.009737329557538033, "global_step": 13036, "epoch": 109, "lr": 9.24813979010297e-05} +{"train_loss": 0.01061607338488102, "global_step": 13037, "epoch": 109, "lr": 9.248022943825299e-05} +{"train_loss": 0.00893553625792265, "global_step": 13038, "epoch": 109, "lr": 9.247906089207087e-05} +{"train_loss": 0.00786731205880642, "global_step": 13039, "epoch": 109, "lr": 9.247789226248566e-05} +{"train_loss": 0.007885696366429329, "global_step": 13040, "epoch": 109, "lr": 9.247672354949964e-05} +{"train_loss": 0.011927386745810509, "global_step": 13041, "epoch": 109, "lr": 9.247555475311512e-05} +{"train_loss": 0.009962761774659157, "global_step": 13042, "epoch": 109, "lr": 9.24743858733344e-05} +{"train_loss": 0.00782221183180809, "global_step": 13043, "epoch": 109, "lr": 9.247321691015974e-05} +{"train_loss": 0.009873039089143276, "global_step": 13044, "epoch": 109, "lr": 9.247204786359345e-05} +{"train_loss": 0.0062491800636053085, "global_step": 13045, "epoch": 109, "lr": 9.247087873363784e-05} +{"train_loss": 0.01010111439973116, "global_step": 13046, "epoch": 109, "lr": 9.246970952029522e-05} +{"train_loss": 0.007549865171313286, "global_step": 13047, "epoch": 109, "lr": 9.246854022356783e-05} +{"train_loss": 0.006900501903146505, "global_step": 13048, "epoch": 109, "lr": 9.246737084345801e-05} +{"train_loss": 0.008066516369581223, "global_step": 13049, "epoch": 109, "lr": 9.246620137996805e-05} +{"train_loss": 0.007224107626825571, "global_step": 13050, "epoch": 109, "lr": 9.246503183310022e-05} +{"train_loss": 0.007513395510613918, "global_step": 13051, "epoch": 109, "lr": 9.246386220285687e-05} +{"train_loss": 0.00827657338231802, "global_step": 13052, "epoch": 109, "lr": 9.246269248924025e-05} +{"train_loss": 0.007362105417996645, "global_step": 13053, "epoch": 109, "lr": 9.246152269225266e-05} +{"train_loss": 0.0039038737304508686, "global_step": 13054, "epoch": 109, "lr": 9.24603528118964e-05} +{"train_loss": 0.008321687579154968, "global_step": 13055, "epoch": 109, "lr": 9.245918284817378e-05} +{"train_loss": 0.006252995226532221, "global_step": 13056, "epoch": 109, "lr": 9.24580128010871e-05} +{"train_loss": 0.008722107857465744, "global_step": 13057, "epoch": 109, "lr": 9.245684267063865e-05} +{"train_loss": 0.012453971430659294, "global_step": 13058, "epoch": 109, "lr": 9.245567245683072e-05} +{"train_loss": 0.008759929798543453, "global_step": 13059, "epoch": 109, "lr": 9.245450215966561e-05} +{"train_loss": 0.007828343659639359, "global_step": 13060, "epoch": 109, "lr": 9.245333177914562e-05} +{"train_loss": 0.012825756333768368, "global_step": 13061, "epoch": 109, "lr": 9.245216131527306e-05} +{"train_loss": 0.007794633973389864, "global_step": 13062, "epoch": 109, "lr": 9.24509907680502e-05} +{"train_loss": 0.005711081903427839, "global_step": 13063, "epoch": 109, "lr": 9.244982013747935e-05} +{"train_loss": 0.007613473106175661, "global_step": 13064, "epoch": 109, "lr": 9.244864942356284e-05} +{"train_loss": 0.008893359452486038, "global_step": 13065, "epoch": 109, "lr": 9.244747862630292e-05} +{"train_loss": 0.006776393391191959, "global_step": 13066, "epoch": 109, "lr": 9.244630774570193e-05} +{"train_loss": 0.011389466933906078, "global_step": 13067, "epoch": 109, "lr": 9.244513678176213e-05} +{"train_loss": 0.008162295445799828, "global_step": 13068, "epoch": 109, "lr": 9.244396573448585e-05} +{"train_loss": 0.004258693661540747, "global_step": 13069, "epoch": 109, "lr": 9.244279460387537e-05} +{"train_loss": 0.005723054055124521, "global_step": 13070, "epoch": 109, "lr": 9.244162338993301e-05} +{"train_loss": 0.011292384937405586, "global_step": 13071, "epoch": 109, "lr": 9.244045209266104e-05} +{"train_loss": 0.005846245680004358, "global_step": 13072, "epoch": 109, "lr": 9.243928071206178e-05} +{"train_loss": 0.0068677933886647224, "global_step": 13073, "epoch": 109, "lr": 9.243810924813754e-05} +{"train_loss": 0.009359074756503105, "global_step": 13074, "epoch": 109, "lr": 9.243693770089059e-05} +{"train_loss": 0.010130580514669418, "global_step": 13075, "epoch": 109, "lr": 9.243576607032324e-05} +{"train_loss": 0.007802003528922796, "global_step": 13076, "epoch": 109, "lr": 9.243459435643782e-05} +{"train_loss": 0.010343304835259914, "global_step": 13077, "epoch": 109, "lr": 9.24334225592366e-05} +{"train_loss": 0.006471117027103901, "global_step": 13078, "epoch": 109, "lr": 9.243225067872189e-05} +{"train_loss": 0.010929401963949203, "global_step": 13079, "epoch": 109, "lr": 9.243107871489598e-05} +{"train_loss": 0.006720265839248896, "global_step": 13080, "epoch": 109, "lr": 9.242990666776119e-05} +{"train_loss": 0.010409523732960224, "global_step": 13081, "epoch": 109, "lr": 9.242873453731979e-05} +{"train_loss": 0.010451207868754864, "global_step": 13082, "epoch": 109, "lr": 9.242756232357414e-05} +{"train_loss": 0.009585953317582607, "global_step": 13083, "epoch": 109, "lr": 9.242639002652648e-05} +{"train_loss": 0.0073821027763187885, "global_step": 13084, "epoch": 109, "lr": 9.242521764617913e-05} +{"train_loss": 0.006394029129296541, "global_step": 13085, "epoch": 109, "lr": 9.242404518253441e-05} +{"train_loss": 0.011296539567410946, "global_step": 13086, "epoch": 109, "lr": 9.24228726355946e-05} +{"train_loss": 0.006334017496556044, "global_step": 13087, "epoch": 109, "lr": 9.242170000536203e-05} +{"train_loss": 0.009558130986988544, "global_step": 13088, "epoch": 109, "lr": 9.242052729183896e-05} +{"train_loss": 0.008195586432115872, "global_step": 13089, "epoch": 109, "lr": 9.241935449502773e-05, "val_loss": 0.013937912881374359} +{"train_loss": 0.007046805229038, "global_step": 13090, "epoch": 110, "lr": 9.241818161493064e-05} +{"train_loss": 0.009441908448934555, "global_step": 13091, "epoch": 110, "lr": 9.241700865154997e-05} +{"train_loss": 0.007944022305309772, "global_step": 13092, "epoch": 110, "lr": 9.241583560488802e-05} +{"train_loss": 0.013978642411530018, "global_step": 13093, "epoch": 110, "lr": 9.241466247494712e-05} +{"train_loss": 0.0051923589780926704, "global_step": 13094, "epoch": 110, "lr": 9.241348926172957e-05} +{"train_loss": 0.011020505800843239, "global_step": 13095, "epoch": 110, "lr": 9.241231596523767e-05} +{"train_loss": 0.006506563629955053, "global_step": 13096, "epoch": 110, "lr": 9.24111425854737e-05} +{"train_loss": 0.009081212803721428, "global_step": 13097, "epoch": 110, "lr": 9.240996912243999e-05} +{"train_loss": 0.00672042416408658, "global_step": 13098, "epoch": 110, "lr": 9.240879557613884e-05} +{"train_loss": 0.01093955896794796, "global_step": 13099, "epoch": 110, "lr": 9.240762194657254e-05} +{"train_loss": 0.0097657460719347, "global_step": 13100, "epoch": 110, "lr": 9.240644823374341e-05} +{"train_loss": 0.006727874744683504, "global_step": 13101, "epoch": 110, "lr": 9.240527443765376e-05} +{"train_loss": 0.006194966845214367, "global_step": 13102, "epoch": 110, "lr": 9.240410055830588e-05} +{"train_loss": 0.01307604182511568, "global_step": 13103, "epoch": 110, "lr": 9.240292659570206e-05} +{"train_loss": 0.005728499963879585, "global_step": 13104, "epoch": 110, "lr": 9.240175254984465e-05} +{"train_loss": 0.009761868044734001, "global_step": 13105, "epoch": 110, "lr": 9.240057842073592e-05} +{"train_loss": 0.00888805277645588, "global_step": 13106, "epoch": 110, "lr": 9.239940420837819e-05} +{"train_loss": 0.00833362527191639, "global_step": 13107, "epoch": 110, "lr": 9.239822991277373e-05} +{"train_loss": 0.010123372077941895, "global_step": 13108, "epoch": 110, "lr": 9.23970555339249e-05} +{"train_loss": 0.007543143816292286, "global_step": 13109, "epoch": 110, "lr": 9.2395881071834e-05} +{"train_loss": 0.007039754651486874, "global_step": 13110, "epoch": 110, "lr": 9.239470652650329e-05} +{"train_loss": 0.006899448111653328, "global_step": 13111, "epoch": 110, "lr": 9.239353189793509e-05} +{"train_loss": 0.007748724427074194, "global_step": 13112, "epoch": 110, "lr": 9.239235718613174e-05} +{"train_loss": 0.010542563162744045, "global_step": 13113, "epoch": 110, "lr": 9.239118239109552e-05} +{"train_loss": 0.006751593202352524, "global_step": 13114, "epoch": 110, "lr": 9.239000751282874e-05} +{"train_loss": 0.007357539143413305, "global_step": 13115, "epoch": 110, "lr": 9.238883255133371e-05} +{"train_loss": 0.004947548266500235, "global_step": 13116, "epoch": 110, "lr": 9.238765750661275e-05} +{"train_loss": 0.010135761462152004, "global_step": 13117, "epoch": 110, "lr": 9.238648237866814e-05} +{"train_loss": 0.012734215706586838, "global_step": 13118, "epoch": 110, "lr": 9.23853071675022e-05} +{"train_loss": 0.005369931925088167, "global_step": 13119, "epoch": 110, "lr": 9.238413187311723e-05} +{"train_loss": 0.009572689421474934, "global_step": 13120, "epoch": 110, "lr": 9.238295649551556e-05} +{"train_loss": 0.0090006273239851, "global_step": 13121, "epoch": 110, "lr": 9.238178103469948e-05} +{"train_loss": 0.004431487992405891, "global_step": 13122, "epoch": 110, "lr": 9.23806054906713e-05} +{"train_loss": 0.00685140723362565, "global_step": 13123, "epoch": 110, "lr": 9.237942986343333e-05} +{"train_loss": 0.00625096820294857, "global_step": 13124, "epoch": 110, "lr": 9.237825415298787e-05} +{"train_loss": 0.011932756751775742, "global_step": 13125, "epoch": 110, "lr": 9.237707835933725e-05} +{"train_loss": 0.0071362643502652645, "global_step": 13126, "epoch": 110, "lr": 9.237590248248375e-05} +{"train_loss": 0.008308714255690575, "global_step": 13127, "epoch": 110, "lr": 9.23747265224297e-05} +{"train_loss": 0.007009514607489109, "global_step": 13128, "epoch": 110, "lr": 9.237355047917738e-05} +{"train_loss": 0.007725374307483435, "global_step": 13129, "epoch": 110, "lr": 9.237237435272914e-05} +{"train_loss": 0.005121259484440088, "global_step": 13130, "epoch": 110, "lr": 9.237119814308728e-05} +{"train_loss": 0.0068697016686201096, "global_step": 13131, "epoch": 110, "lr": 9.237002185025408e-05} +{"train_loss": 0.0059294318780303, "global_step": 13132, "epoch": 110, "lr": 9.236884547423188e-05} +{"train_loss": 0.006827938370406628, "global_step": 13133, "epoch": 110, "lr": 9.236766901502296e-05} +{"train_loss": 0.006822001654654741, "global_step": 13134, "epoch": 110, "lr": 9.236649247262967e-05} +{"train_loss": 0.008433755487203598, "global_step": 13135, "epoch": 110, "lr": 9.23653158470543e-05} +{"train_loss": 0.00822688639163971, "global_step": 13136, "epoch": 110, "lr": 9.236413913829915e-05} +{"train_loss": 0.007065426558256149, "global_step": 13137, "epoch": 110, "lr": 9.236296234636652e-05} +{"train_loss": 0.007128759287297726, "global_step": 13138, "epoch": 110, "lr": 9.236178547125876e-05} +{"train_loss": 0.00937474425882101, "global_step": 13139, "epoch": 110, "lr": 9.236060851297817e-05} +{"train_loss": 0.005657433066517115, "global_step": 13140, "epoch": 110, "lr": 9.235943147152703e-05} +{"train_loss": 0.005606463644653559, "global_step": 13141, "epoch": 110, "lr": 9.235825434690768e-05} +{"train_loss": 0.008423623628914356, "global_step": 13142, "epoch": 110, "lr": 9.235707713912242e-05} +{"train_loss": 0.009180794470012188, "global_step": 13143, "epoch": 110, "lr": 9.235589984817356e-05} +{"train_loss": 0.009713051840662956, "global_step": 13144, "epoch": 110, "lr": 9.235472247406342e-05} +{"train_loss": 0.008535233326256275, "global_step": 13145, "epoch": 110, "lr": 9.235354501679432e-05} +{"train_loss": 0.006107524503022432, "global_step": 13146, "epoch": 110, "lr": 9.235236747636855e-05} +{"train_loss": 0.006256821099668741, "global_step": 13147, "epoch": 110, "lr": 9.235118985278844e-05} +{"train_loss": 0.008267493918538094, "global_step": 13148, "epoch": 110, "lr": 9.235001214605628e-05} +{"train_loss": 0.007384755183011293, "global_step": 13149, "epoch": 110, "lr": 9.234883435617439e-05} +{"train_loss": 0.008277123793959618, "global_step": 13150, "epoch": 110, "lr": 9.23476564831451e-05} +{"train_loss": 0.0106795160099864, "global_step": 13151, "epoch": 110, "lr": 9.234647852697072e-05} +{"train_loss": 0.007528258487582207, "global_step": 13152, "epoch": 110, "lr": 9.234530048765353e-05} +{"train_loss": 0.004054371267557144, "global_step": 13153, "epoch": 110, "lr": 9.234412236519588e-05} +{"train_loss": 0.007236284203827381, "global_step": 13154, "epoch": 110, "lr": 9.234294415960005e-05} +{"train_loss": 0.007574447430670261, "global_step": 13155, "epoch": 110, "lr": 9.234176587086841e-05} +{"train_loss": 0.00990189891308546, "global_step": 13156, "epoch": 110, "lr": 9.234058749900321e-05} +{"train_loss": 0.00760158896446228, "global_step": 13157, "epoch": 110, "lr": 9.23394090440068e-05} +{"train_loss": 0.004734896123409271, "global_step": 13158, "epoch": 110, "lr": 9.233823050588147e-05} +{"train_loss": 0.014137816615402699, "global_step": 13159, "epoch": 110, "lr": 9.233705188462956e-05} +{"train_loss": 0.006450791843235493, "global_step": 13160, "epoch": 110, "lr": 9.233587318025337e-05} +{"train_loss": 0.0061031002551317215, "global_step": 13161, "epoch": 110, "lr": 9.233469439275521e-05} +{"train_loss": 0.005769217386841774, "global_step": 13162, "epoch": 110, "lr": 9.23335155221374e-05} +{"train_loss": 0.009311826899647713, "global_step": 13163, "epoch": 110, "lr": 9.233233656840227e-05} +{"train_loss": 0.004209461156278849, "global_step": 13164, "epoch": 110, "lr": 9.23311575315521e-05} +{"train_loss": 0.009022138081490993, "global_step": 13165, "epoch": 110, "lr": 9.232997841158923e-05} +{"train_loss": 0.009087367914617062, "global_step": 13166, "epoch": 110, "lr": 9.232879920851598e-05} +{"train_loss": 0.013654019683599472, "global_step": 13167, "epoch": 110, "lr": 9.232761992233466e-05} +{"train_loss": 0.006379591301083565, "global_step": 13168, "epoch": 110, "lr": 9.232644055304757e-05} +{"train_loss": 0.010380241088569164, "global_step": 13169, "epoch": 110, "lr": 9.232526110065703e-05} +{"train_loss": 0.007151205092668533, "global_step": 13170, "epoch": 110, "lr": 9.232408156516537e-05} +{"train_loss": 0.00884511973708868, "global_step": 13171, "epoch": 110, "lr": 9.23229019465749e-05} +{"train_loss": 0.005813518073409796, "global_step": 13172, "epoch": 110, "lr": 9.23217222448879e-05} +{"train_loss": 0.0076362621039152145, "global_step": 13173, "epoch": 110, "lr": 9.232054246010677e-05} +{"train_loss": 0.01095613930374384, "global_step": 13174, "epoch": 110, "lr": 9.231936259223375e-05} +{"train_loss": 0.006506763864308596, "global_step": 13175, "epoch": 110, "lr": 9.231818264127119e-05} +{"train_loss": 0.006507981102913618, "global_step": 13176, "epoch": 110, "lr": 9.23170026072214e-05} +{"train_loss": 0.005945064593106508, "global_step": 13177, "epoch": 110, "lr": 9.231582249008669e-05} +{"train_loss": 0.010902907699346542, "global_step": 13178, "epoch": 110, "lr": 9.231464228986939e-05} +{"train_loss": 0.011127782985568047, "global_step": 13179, "epoch": 110, "lr": 9.231346200657179e-05} +{"train_loss": 0.0077097718603909016, "global_step": 13180, "epoch": 110, "lr": 9.231228164019625e-05} +{"train_loss": 0.005361758638173342, "global_step": 13181, "epoch": 110, "lr": 9.231110119074506e-05} +{"train_loss": 0.006783876568078995, "global_step": 13182, "epoch": 110, "lr": 9.230992065822054e-05} +{"train_loss": 0.008081778883934021, "global_step": 13183, "epoch": 110, "lr": 9.230874004262502e-05} +{"train_loss": 0.007659123744815588, "global_step": 13184, "epoch": 110, "lr": 9.23075593439608e-05} +{"train_loss": 0.007513455115258694, "global_step": 13185, "epoch": 110, "lr": 9.230637856223021e-05} +{"train_loss": 0.0072113703936338425, "global_step": 13186, "epoch": 110, "lr": 9.230519769743555e-05} +{"train_loss": 0.00867233332246542, "global_step": 13187, "epoch": 110, "lr": 9.230401674957918e-05} +{"train_loss": 0.013797540217638016, "global_step": 13188, "epoch": 110, "lr": 9.230283571866338e-05} +{"train_loss": 0.008235694840550423, "global_step": 13189, "epoch": 110, "lr": 9.230165460469048e-05} +{"train_loss": 0.00688163423910737, "global_step": 13190, "epoch": 110, "lr": 9.230047340766281e-05} +{"train_loss": 0.005584953352808952, "global_step": 13191, "epoch": 110, "lr": 9.229929212758265e-05} +{"train_loss": 0.0075348298996686935, "global_step": 13192, "epoch": 110, "lr": 9.229811076445238e-05} +{"train_loss": 0.0060209548100829124, "global_step": 13193, "epoch": 110, "lr": 9.22969293182743e-05} +{"train_loss": 0.007927830331027508, "global_step": 13194, "epoch": 110, "lr": 9.229574778905069e-05} +{"train_loss": 0.005518958438187838, "global_step": 13195, "epoch": 110, "lr": 9.22945661767839e-05} +{"train_loss": 0.008600924164056778, "global_step": 13196, "epoch": 110, "lr": 9.229338448147626e-05} +{"train_loss": 0.00712231919169426, "global_step": 13197, "epoch": 110, "lr": 9.229220270313007e-05} +{"train_loss": 0.0067770592868328094, "global_step": 13198, "epoch": 110, "lr": 9.229102084174765e-05} +{"train_loss": 0.010723312385380268, "global_step": 13199, "epoch": 110, "lr": 9.228983889733135e-05} +{"train_loss": 0.007787814363837242, "global_step": 13200, "epoch": 110, "lr": 9.228865686988346e-05} +{"train_loss": 0.010175416246056557, "global_step": 13201, "epoch": 110, "lr": 9.228747475940631e-05} +{"train_loss": 0.006577393971383572, "global_step": 13202, "epoch": 110, "lr": 9.228629256590223e-05} +{"train_loss": 0.005163421854376793, "global_step": 13203, "epoch": 110, "lr": 9.22851102893735e-05} +{"train_loss": 0.010644355788826942, "global_step": 13204, "epoch": 110, "lr": 9.22839279298225e-05} +{"train_loss": 0.010128363035619259, "global_step": 13205, "epoch": 110, "lr": 9.228274548725151e-05} +{"train_loss": 0.013554682023823261, "global_step": 13206, "epoch": 110, "lr": 9.228156296166288e-05} +{"train_loss": 0.010488857515156269, "global_step": 13207, "epoch": 110, "lr": 9.228038035305892e-05} +{"train_loss": 0.008054575272405348, "global_step": 13208, "epoch": 110, "lr": 9.227919766144196e-05, "val_loss": 0.016546057537198067, "train_action_mse_error": 0.00026669210637919605} +{"train_loss": 0.005478455685079098, "global_step": 13209, "epoch": 111, "lr": 9.227801488681429e-05} +{"train_loss": 0.011862797662615776, "global_step": 13210, "epoch": 111, "lr": 9.227683202917826e-05} +{"train_loss": 0.004699320998042822, "global_step": 13211, "epoch": 111, "lr": 9.227564908853618e-05} +{"train_loss": 0.005666361656039953, "global_step": 13212, "epoch": 111, "lr": 9.227446606489038e-05} +{"train_loss": 0.005536483135074377, "global_step": 13213, "epoch": 111, "lr": 9.22732829582432e-05} +{"train_loss": 0.011033055372536182, "global_step": 13214, "epoch": 111, "lr": 9.227209976859695e-05} +{"train_loss": 0.008338614366948605, "global_step": 13215, "epoch": 111, "lr": 9.227091649595391e-05} +{"train_loss": 0.011088241823017597, "global_step": 13216, "epoch": 111, "lr": 9.226973314031649e-05} +{"train_loss": 0.010851590894162655, "global_step": 13217, "epoch": 111, "lr": 9.226854970168692e-05} +{"train_loss": 0.005184462293982506, "global_step": 13218, "epoch": 111, "lr": 9.22673661800676e-05} +{"train_loss": 0.00964927114546299, "global_step": 13219, "epoch": 111, "lr": 9.22661825754608e-05} +{"train_loss": 0.008242921903729439, "global_step": 13220, "epoch": 111, "lr": 9.226499888786889e-05} +{"train_loss": 0.01154943834990263, "global_step": 13221, "epoch": 111, "lr": 9.226381511729414e-05} +{"train_loss": 0.007573016453534365, "global_step": 13222, "epoch": 111, "lr": 9.226263126373893e-05} +{"train_loss": 0.005163001362234354, "global_step": 13223, "epoch": 111, "lr": 9.226144732720554e-05} +{"train_loss": 0.005993695463985205, "global_step": 13224, "epoch": 111, "lr": 9.226026330769633e-05} +{"train_loss": 0.007218054495751858, "global_step": 13225, "epoch": 111, "lr": 9.22590792052136e-05} +{"train_loss": 0.007841043174266815, "global_step": 13226, "epoch": 111, "lr": 9.225789501975969e-05} +{"train_loss": 0.00799480639398098, "global_step": 13227, "epoch": 111, "lr": 9.22567107513369e-05} +{"train_loss": 0.009643386118113995, "global_step": 13228, "epoch": 111, "lr": 9.225552639994759e-05} +{"train_loss": 0.0063512627966701984, "global_step": 13229, "epoch": 111, "lr": 9.225434196559405e-05} +{"train_loss": 0.008209927938878536, "global_step": 13230, "epoch": 111, "lr": 9.225315744827864e-05} +{"train_loss": 0.011487876996397972, "global_step": 13231, "epoch": 111, "lr": 9.225197284800366e-05} +{"train_loss": 0.00567282410338521, "global_step": 13232, "epoch": 111, "lr": 9.225078816477146e-05} +{"train_loss": 0.007832087576389313, "global_step": 13233, "epoch": 111, "lr": 9.224960339858434e-05} +{"train_loss": 0.005861309822648764, "global_step": 13234, "epoch": 111, "lr": 9.224841854944464e-05} +{"train_loss": 0.007704326417297125, "global_step": 13235, "epoch": 111, "lr": 9.224723361735468e-05} +{"train_loss": 0.01013833750039339, "global_step": 13236, "epoch": 111, "lr": 9.224604860231679e-05} +{"train_loss": 0.006993867922574282, "global_step": 13237, "epoch": 111, "lr": 9.22448635043333e-05} +{"train_loss": 0.007776458747684956, "global_step": 13238, "epoch": 111, "lr": 9.224367832340654e-05} +{"train_loss": 0.007612728048115969, "global_step": 13239, "epoch": 111, "lr": 9.224249305953882e-05} +{"train_loss": 0.006429701112210751, "global_step": 13240, "epoch": 111, "lr": 9.224130771273248e-05} +{"train_loss": 0.009746162220835686, "global_step": 13241, "epoch": 111, "lr": 9.224012228298984e-05} +{"train_loss": 0.007662641815841198, "global_step": 13242, "epoch": 111, "lr": 9.223893677031325e-05} +{"train_loss": 0.0049721961840987206, "global_step": 13243, "epoch": 111, "lr": 9.223775117470502e-05} +{"train_loss": 0.007685343734920025, "global_step": 13244, "epoch": 111, "lr": 9.223656549616746e-05} +{"train_loss": 0.005029179155826569, "global_step": 13245, "epoch": 111, "lr": 9.223537973470292e-05} +{"train_loss": 0.006637905724346638, "global_step": 13246, "epoch": 111, "lr": 9.223419389031374e-05} +{"train_loss": 0.012047174386680126, "global_step": 13247, "epoch": 111, "lr": 9.22330079630022e-05} +{"train_loss": 0.00657610734924674, "global_step": 13248, "epoch": 111, "lr": 9.223182195277069e-05} +{"train_loss": 0.011428426951169968, "global_step": 13249, "epoch": 111, "lr": 9.223063585962151e-05} +{"train_loss": 0.005293717607855797, "global_step": 13250, "epoch": 111, "lr": 9.222944968355698e-05} +{"train_loss": 0.0053557055070996284, "global_step": 13251, "epoch": 111, "lr": 9.222826342457943e-05} +{"train_loss": 0.005659850314259529, "global_step": 13252, "epoch": 111, "lr": 9.22270770826912e-05} +{"train_loss": 0.010430474765598774, "global_step": 13253, "epoch": 111, "lr": 9.222589065789462e-05} +{"train_loss": 0.011272839270532131, "global_step": 13254, "epoch": 111, "lr": 9.222470415019202e-05} +{"train_loss": 0.010782348923385143, "global_step": 13255, "epoch": 111, "lr": 9.222351755958571e-05} +{"train_loss": 0.006880620960146189, "global_step": 13256, "epoch": 111, "lr": 9.222233088607803e-05} +{"train_loss": 0.009313728660345078, "global_step": 13257, "epoch": 111, "lr": 9.222114412967133e-05} +{"train_loss": 0.005915690679103136, "global_step": 13258, "epoch": 111, "lr": 9.221995729036793e-05} +{"train_loss": 0.008392909541726112, "global_step": 13259, "epoch": 111, "lr": 9.221877036817014e-05} +{"train_loss": 0.009173552505671978, "global_step": 13260, "epoch": 111, "lr": 9.221758336308031e-05} +{"train_loss": 0.004584187641739845, "global_step": 13261, "epoch": 111, "lr": 9.221639627510076e-05} +{"train_loss": 0.006460963748395443, "global_step": 13262, "epoch": 111, "lr": 9.221520910423383e-05} +{"train_loss": 0.006450363900512457, "global_step": 13263, "epoch": 111, "lr": 9.221402185048184e-05} +{"train_loss": 0.010150347836315632, "global_step": 13264, "epoch": 111, "lr": 9.221283451384715e-05} +{"train_loss": 0.007789784576743841, "global_step": 13265, "epoch": 111, "lr": 9.221164709433205e-05} +{"train_loss": 0.00870148278772831, "global_step": 13266, "epoch": 111, "lr": 9.221045959193887e-05} +{"train_loss": 0.009186780080199242, "global_step": 13267, "epoch": 111, "lr": 9.220927200667e-05} +{"train_loss": 0.005661968607455492, "global_step": 13268, "epoch": 111, "lr": 9.220808433852772e-05} +{"train_loss": 0.006896571721881628, "global_step": 13269, "epoch": 111, "lr": 9.220689658751437e-05} +{"train_loss": 0.006286099087446928, "global_step": 13270, "epoch": 111, "lr": 9.22057087536323e-05} +{"train_loss": 0.007095239125192165, "global_step": 13271, "epoch": 111, "lr": 9.220452083688382e-05} +{"train_loss": 0.004714742302894592, "global_step": 13272, "epoch": 111, "lr": 9.220333283727128e-05} +{"train_loss": 0.008488153107464314, "global_step": 13273, "epoch": 111, "lr": 9.2202144754797e-05} +{"train_loss": 0.008533600717782974, "global_step": 13274, "epoch": 111, "lr": 9.220095658946333e-05} +{"train_loss": 0.007086616475135088, "global_step": 13275, "epoch": 111, "lr": 9.219976834127258e-05} +{"train_loss": 0.008043123409152031, "global_step": 13276, "epoch": 111, "lr": 9.219858001022709e-05} +{"train_loss": 0.005607747007161379, "global_step": 13277, "epoch": 111, "lr": 9.219739159632919e-05} +{"train_loss": 0.007609900552779436, "global_step": 13278, "epoch": 111, "lr": 9.219620309958123e-05} +{"train_loss": 0.0063372086733579636, "global_step": 13279, "epoch": 111, "lr": 9.219501451998554e-05} +{"train_loss": 0.010383103974163532, "global_step": 13280, "epoch": 111, "lr": 9.219382585754444e-05} +{"train_loss": 0.007192517630755901, "global_step": 13281, "epoch": 111, "lr": 9.219263711226025e-05} +{"train_loss": 0.005305948667228222, "global_step": 13282, "epoch": 111, "lr": 9.219144828413536e-05} +{"train_loss": 0.004670911934226751, "global_step": 13283, "epoch": 111, "lr": 9.219025937317205e-05} +{"train_loss": 0.008698079735040665, "global_step": 13284, "epoch": 111, "lr": 9.218907037937268e-05} +{"train_loss": 0.005207995884120464, "global_step": 13285, "epoch": 111, "lr": 9.218788130273957e-05} +{"train_loss": 0.00801078975200653, "global_step": 13286, "epoch": 111, "lr": 9.218669214327505e-05} +{"train_loss": 0.007775482255965471, "global_step": 13287, "epoch": 111, "lr": 9.218550290098149e-05} +{"train_loss": 0.008100214414298534, "global_step": 13288, "epoch": 111, "lr": 9.21843135758612e-05} +{"train_loss": 0.007657007779926062, "global_step": 13289, "epoch": 111, "lr": 9.21831241679165e-05} +{"train_loss": 0.006326011382043362, "global_step": 13290, "epoch": 111, "lr": 9.218193467714975e-05} +{"train_loss": 0.007819948717951775, "global_step": 13291, "epoch": 111, "lr": 9.21807451035633e-05} +{"train_loss": 0.009839019738137722, "global_step": 13292, "epoch": 111, "lr": 9.217955544715944e-05} +{"train_loss": 0.006006811745464802, "global_step": 13293, "epoch": 111, "lr": 9.217836570794052e-05} +{"train_loss": 0.008111035451292992, "global_step": 13294, "epoch": 111, "lr": 9.21771758859089e-05} +{"train_loss": 0.008661975152790546, "global_step": 13295, "epoch": 111, "lr": 9.21759859810669e-05} +{"train_loss": 0.008892308920621872, "global_step": 13296, "epoch": 111, "lr": 9.217479599341685e-05} +{"train_loss": 0.010295514948666096, "global_step": 13297, "epoch": 111, "lr": 9.21736059229611e-05} +{"train_loss": 0.005979405250400305, "global_step": 13298, "epoch": 111, "lr": 9.217241576970199e-05} +{"train_loss": 0.004408066626638174, "global_step": 13299, "epoch": 111, "lr": 9.217122553364183e-05} +{"train_loss": 0.005116544663906097, "global_step": 13300, "epoch": 111, "lr": 9.217003521478297e-05} +{"train_loss": 0.007480571512132883, "global_step": 13301, "epoch": 111, "lr": 9.216884481312778e-05} +{"train_loss": 0.010068734176456928, "global_step": 13302, "epoch": 111, "lr": 9.216765432867855e-05} +{"train_loss": 0.010176188312470913, "global_step": 13303, "epoch": 111, "lr": 9.216646376143764e-05} +{"train_loss": 0.01087085623294115, "global_step": 13304, "epoch": 111, "lr": 9.216527311140737e-05} +{"train_loss": 0.007951575331389904, "global_step": 13305, "epoch": 111, "lr": 9.216408237859011e-05} +{"train_loss": 0.007516816724091768, "global_step": 13306, "epoch": 111, "lr": 9.216289156298817e-05} +{"train_loss": 0.007461589761078358, "global_step": 13307, "epoch": 111, "lr": 9.21617006646039e-05} +{"train_loss": 0.009806463494896889, "global_step": 13308, "epoch": 111, "lr": 9.216050968343963e-05} +{"train_loss": 0.008003037422895432, "global_step": 13309, "epoch": 111, "lr": 9.21593186194977e-05} +{"train_loss": 0.008053403347730637, "global_step": 13310, "epoch": 111, "lr": 9.215812747278045e-05} +{"train_loss": 0.006769747473299503, "global_step": 13311, "epoch": 111, "lr": 9.215693624329024e-05} +{"train_loss": 0.006531575229018927, "global_step": 13312, "epoch": 111, "lr": 9.215574493102938e-05} +{"train_loss": 0.010470799170434475, "global_step": 13313, "epoch": 111, "lr": 9.215455353600021e-05} +{"train_loss": 0.010145332664251328, "global_step": 13314, "epoch": 111, "lr": 9.215336205820508e-05} +{"train_loss": 0.00801792647689581, "global_step": 13315, "epoch": 111, "lr": 9.215217049764632e-05} +{"train_loss": 0.008471714332699776, "global_step": 13316, "epoch": 111, "lr": 9.21509788543263e-05} +{"train_loss": 0.008924668654799461, "global_step": 13317, "epoch": 111, "lr": 9.214978712824734e-05} +{"train_loss": 0.006165215279906988, "global_step": 13318, "epoch": 111, "lr": 9.214859531941174e-05} +{"train_loss": 0.00579123105853796, "global_step": 13319, "epoch": 111, "lr": 9.21474034278219e-05} +{"train_loss": 0.006978989113122225, "global_step": 13320, "epoch": 111, "lr": 9.214621145348013e-05} +{"train_loss": 0.010026548057794571, "global_step": 13321, "epoch": 111, "lr": 9.214501939638877e-05} +{"train_loss": 0.008346403017640114, "global_step": 13322, "epoch": 111, "lr": 9.214382725655018e-05} +{"train_loss": 0.004400511272251606, "global_step": 13323, "epoch": 111, "lr": 9.21426350339667e-05} +{"train_loss": 0.007532095070928335, "global_step": 13324, "epoch": 111, "lr": 9.214144272864062e-05} +{"train_loss": 0.008547505363821983, "global_step": 13325, "epoch": 111, "lr": 9.214025034057434e-05} +{"train_loss": 0.004621995612978935, "global_step": 13326, "epoch": 111, "lr": 9.21390578697702e-05} +{"train_loss": 0.007723629517684213, "global_step": 13327, "epoch": 111, "lr": 9.213786531623048e-05, "val_loss": 0.010870442725718021} +{"train_loss": 0.006217661313712597, "global_step": 13328, "epoch": 112, "lr": 9.21366726799576e-05} +{"train_loss": 0.006126566790044308, "global_step": 13329, "epoch": 112, "lr": 9.213547996095385e-05} +{"train_loss": 0.006522748153656721, "global_step": 13330, "epoch": 112, "lr": 9.21342871592216e-05} +{"train_loss": 0.006266457028687, "global_step": 13331, "epoch": 112, "lr": 9.213309427476316e-05} +{"train_loss": 0.003792614210397005, "global_step": 13332, "epoch": 112, "lr": 9.213190130758089e-05} +{"train_loss": 0.006971265189349651, "global_step": 13333, "epoch": 112, "lr": 9.213070825767713e-05} +{"train_loss": 0.009771868586540222, "global_step": 13334, "epoch": 112, "lr": 9.212951512505424e-05} +{"train_loss": 0.008141806349158287, "global_step": 13335, "epoch": 112, "lr": 9.212832190971454e-05} +{"train_loss": 0.005821047350764275, "global_step": 13336, "epoch": 112, "lr": 9.212712861166039e-05} +{"train_loss": 0.009996555745601654, "global_step": 13337, "epoch": 112, "lr": 9.212593523089411e-05} +{"train_loss": 0.00693947309628129, "global_step": 13338, "epoch": 112, "lr": 9.212474176741807e-05} +{"train_loss": 0.007262222934514284, "global_step": 13339, "epoch": 112, "lr": 9.212354822123459e-05} +{"train_loss": 0.0073600341565907, "global_step": 13340, "epoch": 112, "lr": 9.212235459234603e-05} +{"train_loss": 0.008737277239561081, "global_step": 13341, "epoch": 112, "lr": 9.212116088075472e-05} +{"train_loss": 0.005544033832848072, "global_step": 13342, "epoch": 112, "lr": 9.211996708646302e-05} +{"train_loss": 0.005874943919479847, "global_step": 13343, "epoch": 112, "lr": 9.211877320947324e-05} +{"train_loss": 0.010837935842573643, "global_step": 13344, "epoch": 112, "lr": 9.211757924978778e-05} +{"train_loss": 0.008900563232600689, "global_step": 13345, "epoch": 112, "lr": 9.211638520740894e-05} +{"train_loss": 0.004949244204908609, "global_step": 13346, "epoch": 112, "lr": 9.211519108233907e-05} +{"train_loss": 0.005069468170404434, "global_step": 13347, "epoch": 112, "lr": 9.211399687458053e-05} +{"train_loss": 0.008697567507624626, "global_step": 13348, "epoch": 112, "lr": 9.211280258413565e-05} +{"train_loss": 0.005884782876819372, "global_step": 13349, "epoch": 112, "lr": 9.21116082110068e-05} +{"train_loss": 0.010865564458072186, "global_step": 13350, "epoch": 112, "lr": 9.21104137551963e-05} +{"train_loss": 0.008378907106816769, "global_step": 13351, "epoch": 112, "lr": 9.210921921670648e-05} +{"train_loss": 0.009550357237458229, "global_step": 13352, "epoch": 112, "lr": 9.210802459553972e-05} +{"train_loss": 0.006879216991364956, "global_step": 13353, "epoch": 112, "lr": 9.210682989169836e-05} +{"train_loss": 0.005147615913301706, "global_step": 13354, "epoch": 112, "lr": 9.210563510518472e-05} +{"train_loss": 0.005184638313949108, "global_step": 13355, "epoch": 112, "lr": 9.210444023600117e-05} +{"train_loss": 0.00884375348687172, "global_step": 13356, "epoch": 112, "lr": 9.210324528415007e-05} +{"train_loss": 0.007111233659088612, "global_step": 13357, "epoch": 112, "lr": 9.210205024963373e-05} +{"train_loss": 0.005242533516138792, "global_step": 13358, "epoch": 112, "lr": 9.21008551324545e-05} +{"train_loss": 0.008676561526954174, "global_step": 13359, "epoch": 112, "lr": 9.209965993261475e-05} +{"train_loss": 0.0077328672632575035, "global_step": 13360, "epoch": 112, "lr": 9.209846465011683e-05} +{"train_loss": 0.006751681212335825, "global_step": 13361, "epoch": 112, "lr": 9.209726928496304e-05} +{"train_loss": 0.007522791624069214, "global_step": 13362, "epoch": 112, "lr": 9.20960738371558e-05} +{"train_loss": 0.005471932236105204, "global_step": 13363, "epoch": 112, "lr": 9.209487830669738e-05} +{"train_loss": 0.007283478043973446, "global_step": 13364, "epoch": 112, "lr": 9.209368269359018e-05} +{"train_loss": 0.006754037458449602, "global_step": 13365, "epoch": 112, "lr": 9.209248699783653e-05} +{"train_loss": 0.006292594596743584, "global_step": 13366, "epoch": 112, "lr": 9.209129121943878e-05} +{"train_loss": 0.006559931673109531, "global_step": 13367, "epoch": 112, "lr": 9.209009535839927e-05} +{"train_loss": 0.009334277361631393, "global_step": 13368, "epoch": 112, "lr": 9.208889941472037e-05} +{"train_loss": 0.00940086878836155, "global_step": 13369, "epoch": 112, "lr": 9.20877033884044e-05} +{"train_loss": 0.005377635825425386, "global_step": 13370, "epoch": 112, "lr": 9.208650727945371e-05} +{"train_loss": 0.005404471419751644, "global_step": 13371, "epoch": 112, "lr": 9.208531108787068e-05} +{"train_loss": 0.007828990928828716, "global_step": 13372, "epoch": 112, "lr": 9.208411481365763e-05} +{"train_loss": 0.008778335526585579, "global_step": 13373, "epoch": 112, "lr": 9.208291845681691e-05} +{"train_loss": 0.004830980207771063, "global_step": 13374, "epoch": 112, "lr": 9.208172201735088e-05} +{"train_loss": 0.007865047082304955, "global_step": 13375, "epoch": 112, "lr": 9.208052549526189e-05} +{"train_loss": 0.008843155577778816, "global_step": 13376, "epoch": 112, "lr": 9.207932889055228e-05} +{"train_loss": 0.008895458653569221, "global_step": 13377, "epoch": 112, "lr": 9.207813220322441e-05} +{"train_loss": 0.008273663930594921, "global_step": 13378, "epoch": 112, "lr": 9.20769354332806e-05} +{"train_loss": 0.007900352589786053, "global_step": 13379, "epoch": 112, "lr": 9.207573858072325e-05} +{"train_loss": 0.004052848555147648, "global_step": 13380, "epoch": 112, "lr": 9.207454164555467e-05} +{"train_loss": 0.006769292522221804, "global_step": 13381, "epoch": 112, "lr": 9.207334462777723e-05} +{"train_loss": 0.012280400842428207, "global_step": 13382, "epoch": 112, "lr": 9.207214752739326e-05} +{"train_loss": 0.006723788566887379, "global_step": 13383, "epoch": 112, "lr": 9.207095034440514e-05} +{"train_loss": 0.006329261232167482, "global_step": 13384, "epoch": 112, "lr": 9.206975307881518e-05} +{"train_loss": 0.010484251193702221, "global_step": 13385, "epoch": 112, "lr": 9.206855573062576e-05} +{"train_loss": 0.004052344243973494, "global_step": 13386, "epoch": 112, "lr": 9.206735829983923e-05} +{"train_loss": 0.007312027737498283, "global_step": 13387, "epoch": 112, "lr": 9.206616078645796e-05} +{"train_loss": 0.009251803159713745, "global_step": 13388, "epoch": 112, "lr": 9.206496319048424e-05} +{"train_loss": 0.007594125345349312, "global_step": 13389, "epoch": 112, "lr": 9.206376551192048e-05} +{"train_loss": 0.009098618291318417, "global_step": 13390, "epoch": 112, "lr": 9.2062567750769e-05} +{"train_loss": 0.007826047018170357, "global_step": 13391, "epoch": 112, "lr": 9.206136990703217e-05} +{"train_loss": 0.007999585941433907, "global_step": 13392, "epoch": 112, "lr": 9.206017198071233e-05} +{"train_loss": 0.009983460418879986, "global_step": 13393, "epoch": 112, "lr": 9.205897397181183e-05} +{"train_loss": 0.0044479710049927235, "global_step": 13394, "epoch": 112, "lr": 9.205777588033305e-05} +{"train_loss": 0.007835484109818935, "global_step": 13395, "epoch": 112, "lr": 9.20565777062783e-05} +{"train_loss": 0.009030178189277649, "global_step": 13396, "epoch": 112, "lr": 9.205537944964995e-05} +{"train_loss": 0.005909427534788847, "global_step": 13397, "epoch": 112, "lr": 9.205418111045036e-05} +{"train_loss": 0.0039716437458992004, "global_step": 13398, "epoch": 112, "lr": 9.205298268868188e-05} +{"train_loss": 0.003880928736180067, "global_step": 13399, "epoch": 112, "lr": 9.205178418434687e-05} +{"train_loss": 0.009333130903542042, "global_step": 13400, "epoch": 112, "lr": 9.205058559744766e-05} +{"train_loss": 0.009569200687110424, "global_step": 13401, "epoch": 112, "lr": 9.204938692798664e-05} +{"train_loss": 0.009551707655191422, "global_step": 13402, "epoch": 112, "lr": 9.204818817596613e-05} +{"train_loss": 0.006971609778702259, "global_step": 13403, "epoch": 112, "lr": 9.204698934138847e-05} +{"train_loss": 0.00700283283367753, "global_step": 13404, "epoch": 112, "lr": 9.204579042425607e-05} +{"train_loss": 0.008639328181743622, "global_step": 13405, "epoch": 112, "lr": 9.204459142457124e-05} +{"train_loss": 0.009271974675357342, "global_step": 13406, "epoch": 112, "lr": 9.204339234233634e-05} +{"train_loss": 0.00546931941062212, "global_step": 13407, "epoch": 112, "lr": 9.204219317755373e-05} +{"train_loss": 0.007233594078570604, "global_step": 13408, "epoch": 112, "lr": 9.204099393022578e-05} +{"train_loss": 0.00640899920836091, "global_step": 13409, "epoch": 112, "lr": 9.203979460035484e-05} +{"train_loss": 0.008413190953433514, "global_step": 13410, "epoch": 112, "lr": 9.203859518794322e-05} +{"train_loss": 0.007648547179996967, "global_step": 13411, "epoch": 112, "lr": 9.203739569299332e-05} +{"train_loss": 0.007633978966623545, "global_step": 13412, "epoch": 112, "lr": 9.20361961155075e-05} +{"train_loss": 0.008189458400011063, "global_step": 13413, "epoch": 112, "lr": 9.20349964554881e-05} +{"train_loss": 0.009224489331245422, "global_step": 13414, "epoch": 112, "lr": 9.203379671293746e-05} +{"train_loss": 0.006137503311038017, "global_step": 13415, "epoch": 112, "lr": 9.203259688785796e-05} +{"train_loss": 0.004732855595648289, "global_step": 13416, "epoch": 112, "lr": 9.203139698025193e-05} +{"train_loss": 0.011686605401337147, "global_step": 13417, "epoch": 112, "lr": 9.203019699012176e-05} +{"train_loss": 0.006249462254345417, "global_step": 13418, "epoch": 112, "lr": 9.20289969174698e-05} +{"train_loss": 0.008253313601016998, "global_step": 13419, "epoch": 112, "lr": 9.202779676229838e-05} +{"train_loss": 0.005912936292588711, "global_step": 13420, "epoch": 112, "lr": 9.202659652460986e-05} +{"train_loss": 0.007010561879724264, "global_step": 13421, "epoch": 112, "lr": 9.202539620440662e-05} +{"train_loss": 0.007311498746275902, "global_step": 13422, "epoch": 112, "lr": 9.202419580169101e-05} +{"train_loss": 0.007919755764305592, "global_step": 13423, "epoch": 112, "lr": 9.202299531646536e-05} +{"train_loss": 0.006575176026672125, "global_step": 13424, "epoch": 112, "lr": 9.202179474873207e-05} +{"train_loss": 0.005738282576203346, "global_step": 13425, "epoch": 112, "lr": 9.202059409849347e-05} +{"train_loss": 0.006937254220247269, "global_step": 13426, "epoch": 112, "lr": 9.201939336575192e-05} +{"train_loss": 0.005531700793653727, "global_step": 13427, "epoch": 112, "lr": 9.201819255050978e-05} +{"train_loss": 0.006652918644249439, "global_step": 13428, "epoch": 112, "lr": 9.20169916527694e-05} +{"train_loss": 0.008882240392267704, "global_step": 13429, "epoch": 112, "lr": 9.201579067253316e-05} +{"train_loss": 0.008722756989300251, "global_step": 13430, "epoch": 112, "lr": 9.201458960980341e-05} +{"train_loss": 0.009219336323440075, "global_step": 13431, "epoch": 112, "lr": 9.201338846458248e-05} +{"train_loss": 0.008136369287967682, "global_step": 13432, "epoch": 112, "lr": 9.201218723687276e-05} +{"train_loss": 0.006774876266717911, "global_step": 13433, "epoch": 112, "lr": 9.201098592667661e-05} +{"train_loss": 0.006407833658158779, "global_step": 13434, "epoch": 112, "lr": 9.200978453399635e-05} +{"train_loss": 0.006445972714573145, "global_step": 13435, "epoch": 112, "lr": 9.200858305883439e-05} +{"train_loss": 0.007855999283492565, "global_step": 13436, "epoch": 112, "lr": 9.200738150119305e-05} +{"train_loss": 0.007671216037124395, "global_step": 13437, "epoch": 112, "lr": 9.200617986107471e-05} +{"train_loss": 0.006300652865320444, "global_step": 13438, "epoch": 112, "lr": 9.200497813848173e-05} +{"train_loss": 0.009152519516646862, "global_step": 13439, "epoch": 112, "lr": 9.200377633341646e-05} +{"train_loss": 0.007294772192835808, "global_step": 13440, "epoch": 112, "lr": 9.200257444588126e-05} +{"train_loss": 0.006853977683931589, "global_step": 13441, "epoch": 112, "lr": 9.20013724758785e-05} +{"train_loss": 0.00549825094640255, "global_step": 13442, "epoch": 112, "lr": 9.200017042341052e-05} +{"train_loss": 0.00881228968501091, "global_step": 13443, "epoch": 112, "lr": 9.199896828847969e-05} +{"train_loss": 0.005330271553248167, "global_step": 13444, "epoch": 112, "lr": 9.199776607108838e-05} +{"train_loss": 0.005681205075234175, "global_step": 13445, "epoch": 112, "lr": 9.199656377123895e-05} +{"train_loss": 0.0073269053338831215, "global_step": 13446, "epoch": 112, "lr": 9.199536138893374e-05, "val_loss": 0.021675996482372284} +{"train_loss": 0.005533752031624317, "global_step": 13447, "epoch": 113, "lr": 9.199415892417514e-05} +{"train_loss": 0.00629819743335247, "global_step": 13448, "epoch": 113, "lr": 9.199295637696549e-05} +{"train_loss": 0.008664794266223907, "global_step": 13449, "epoch": 113, "lr": 9.199175374730716e-05} +{"train_loss": 0.006040002219378948, "global_step": 13450, "epoch": 113, "lr": 9.199055103520249e-05} +{"train_loss": 0.005147836171090603, "global_step": 13451, "epoch": 113, "lr": 9.198934824065389e-05} +{"train_loss": 0.005974249914288521, "global_step": 13452, "epoch": 113, "lr": 9.198814536366365e-05} +{"train_loss": 0.0050787958316504955, "global_step": 13453, "epoch": 113, "lr": 9.19869424042342e-05} +{"train_loss": 0.010168718174099922, "global_step": 13454, "epoch": 113, "lr": 9.198573936236787e-05} +{"train_loss": 0.005636623594909906, "global_step": 13455, "epoch": 113, "lr": 9.198453623806702e-05} +{"train_loss": 0.00706814881414175, "global_step": 13456, "epoch": 113, "lr": 9.198333303133401e-05} +{"train_loss": 0.006617098115384579, "global_step": 13457, "epoch": 113, "lr": 9.198212974217124e-05} +{"train_loss": 0.007647589780390263, "global_step": 13458, "epoch": 113, "lr": 9.198092637058102e-05} +{"train_loss": 0.005861766170710325, "global_step": 13459, "epoch": 113, "lr": 9.197972291656574e-05} +{"train_loss": 0.007578031159937382, "global_step": 13460, "epoch": 113, "lr": 9.197851938012777e-05} +{"train_loss": 0.009027006104588509, "global_step": 13461, "epoch": 113, "lr": 9.197731576126944e-05} +{"train_loss": 0.004766336642205715, "global_step": 13462, "epoch": 113, "lr": 9.197611205999316e-05} +{"train_loss": 0.005917471833527088, "global_step": 13463, "epoch": 113, "lr": 9.197490827630127e-05} +{"train_loss": 0.006665251683443785, "global_step": 13464, "epoch": 113, "lr": 9.19737044101961e-05} +{"train_loss": 0.007107149809598923, "global_step": 13465, "epoch": 113, "lr": 9.197250046168007e-05} +{"train_loss": 0.007547522429376841, "global_step": 13466, "epoch": 113, "lr": 9.197129643075552e-05} +{"train_loss": 0.0061555104330182076, "global_step": 13467, "epoch": 113, "lr": 9.197009231742481e-05} +{"train_loss": 0.006712362635880709, "global_step": 13468, "epoch": 113, "lr": 9.19688881216903e-05} +{"train_loss": 0.0054359761998057365, "global_step": 13469, "epoch": 113, "lr": 9.196768384355437e-05} +{"train_loss": 0.0066329361870884895, "global_step": 13470, "epoch": 113, "lr": 9.196647948301938e-05} +{"train_loss": 0.0064330692403018475, "global_step": 13471, "epoch": 113, "lr": 9.196527504008767e-05} +{"train_loss": 0.004682127386331558, "global_step": 13472, "epoch": 113, "lr": 9.196407051476163e-05} +{"train_loss": 0.007614816073328257, "global_step": 13473, "epoch": 113, "lr": 9.196286590704364e-05} +{"train_loss": 0.00770963029935956, "global_step": 13474, "epoch": 113, "lr": 9.196166121693603e-05} +{"train_loss": 0.005985623691231012, "global_step": 13475, "epoch": 113, "lr": 9.19604564444412e-05} +{"train_loss": 0.005838366691023111, "global_step": 13476, "epoch": 113, "lr": 9.195925158956149e-05} +{"train_loss": 0.010533890686929226, "global_step": 13477, "epoch": 113, "lr": 9.195804665229925e-05} +{"train_loss": 0.005760990548878908, "global_step": 13478, "epoch": 113, "lr": 9.19568416326569e-05} +{"train_loss": 0.002970793517306447, "global_step": 13479, "epoch": 113, "lr": 9.195563653063675e-05} +{"train_loss": 0.007044164463877678, "global_step": 13480, "epoch": 113, "lr": 9.19544313462412e-05} +{"train_loss": 0.006411127280443907, "global_step": 13481, "epoch": 113, "lr": 9.195322607947261e-05} +{"train_loss": 0.008697872050106525, "global_step": 13482, "epoch": 113, "lr": 9.195202073033333e-05} +{"train_loss": 0.0064440504647791386, "global_step": 13483, "epoch": 113, "lr": 9.195081529882574e-05} +{"train_loss": 0.007463613525032997, "global_step": 13484, "epoch": 113, "lr": 9.194960978495221e-05} +{"train_loss": 0.008936471305787563, "global_step": 13485, "epoch": 113, "lr": 9.194840418871511e-05} +{"train_loss": 0.006301846820861101, "global_step": 13486, "epoch": 113, "lr": 9.194719851011681e-05} +{"train_loss": 0.007778363302350044, "global_step": 13487, "epoch": 113, "lr": 9.194599274915965e-05} +{"train_loss": 0.00727618345990777, "global_step": 13488, "epoch": 113, "lr": 9.194478690584601e-05} +{"train_loss": 0.007161058951169252, "global_step": 13489, "epoch": 113, "lr": 9.194358098017828e-05} +{"train_loss": 0.0054036835208535194, "global_step": 13490, "epoch": 113, "lr": 9.19423749721588e-05} +{"train_loss": 0.004557549953460693, "global_step": 13491, "epoch": 113, "lr": 9.194116888178995e-05} +{"train_loss": 0.00681493803858757, "global_step": 13492, "epoch": 113, "lr": 9.193996270907408e-05} +{"train_loss": 0.0054435827769339085, "global_step": 13493, "epoch": 113, "lr": 9.193875645401359e-05} +{"train_loss": 0.00450048316270113, "global_step": 13494, "epoch": 113, "lr": 9.193755011661083e-05} +{"train_loss": 0.006803293712437153, "global_step": 13495, "epoch": 113, "lr": 9.193634369686816e-05} +{"train_loss": 0.008361619897186756, "global_step": 13496, "epoch": 113, "lr": 9.193513719478797e-05} +{"train_loss": 0.006016404367983341, "global_step": 13497, "epoch": 113, "lr": 9.19339306103726e-05} +{"train_loss": 0.006520268507301807, "global_step": 13498, "epoch": 113, "lr": 9.193272394362446e-05} +{"train_loss": 0.006309146992862225, "global_step": 13499, "epoch": 113, "lr": 9.19315171945459e-05} +{"train_loss": 0.007729307282716036, "global_step": 13500, "epoch": 113, "lr": 9.193031036313928e-05} +{"train_loss": 0.006723565049469471, "global_step": 13501, "epoch": 113, "lr": 9.192910344940697e-05} +{"train_loss": 0.004774502478539944, "global_step": 13502, "epoch": 113, "lr": 9.192789645335133e-05} +{"train_loss": 0.007000137586146593, "global_step": 13503, "epoch": 113, "lr": 9.192668937497478e-05} +{"train_loss": 0.008125461637973785, "global_step": 13504, "epoch": 113, "lr": 9.192548221427964e-05} +{"train_loss": 0.007718964479863644, "global_step": 13505, "epoch": 113, "lr": 9.192427497126827e-05} +{"train_loss": 0.008867236785590649, "global_step": 13506, "epoch": 113, "lr": 9.19230676459431e-05} +{"train_loss": 0.008649639785289764, "global_step": 13507, "epoch": 113, "lr": 9.192186023830644e-05} +{"train_loss": 0.005263855680823326, "global_step": 13508, "epoch": 113, "lr": 9.192065274836071e-05} +{"train_loss": 0.006900448352098465, "global_step": 13509, "epoch": 113, "lr": 9.191944517610823e-05} +{"train_loss": 0.006843099370598793, "global_step": 13510, "epoch": 113, "lr": 9.191823752155141e-05} +{"train_loss": 0.009332135319709778, "global_step": 13511, "epoch": 113, "lr": 9.191702978469261e-05} +{"train_loss": 0.006331840995699167, "global_step": 13512, "epoch": 113, "lr": 9.191582196553421e-05} +{"train_loss": 0.007282995153218508, "global_step": 13513, "epoch": 113, "lr": 9.191461406407856e-05} +{"train_loss": 0.008957264944911003, "global_step": 13514, "epoch": 113, "lr": 9.191340608032804e-05} +{"train_loss": 0.0075323437340557575, "global_step": 13515, "epoch": 113, "lr": 9.191219801428503e-05} +{"train_loss": 0.006042886059731245, "global_step": 13516, "epoch": 113, "lr": 9.191098986595191e-05} +{"train_loss": 0.008890294469892979, "global_step": 13517, "epoch": 113, "lr": 9.190978163533102e-05} +{"train_loss": 0.00481572886928916, "global_step": 13518, "epoch": 113, "lr": 9.190857332242475e-05} +{"train_loss": 0.005963121075183153, "global_step": 13519, "epoch": 113, "lr": 9.190736492723548e-05} +{"train_loss": 0.008717181161046028, "global_step": 13520, "epoch": 113, "lr": 9.190615644976557e-05} +{"train_loss": 0.009678802452981472, "global_step": 13521, "epoch": 113, "lr": 9.190494789001742e-05} +{"train_loss": 0.007453871425241232, "global_step": 13522, "epoch": 113, "lr": 9.190373924799336e-05} +{"train_loss": 0.006307176314294338, "global_step": 13523, "epoch": 113, "lr": 9.190253052369579e-05} +{"train_loss": 0.008054163306951523, "global_step": 13524, "epoch": 113, "lr": 9.190132171712709e-05} +{"train_loss": 0.004742729011923075, "global_step": 13525, "epoch": 113, "lr": 9.190011282828961e-05} +{"train_loss": 0.01345842331647873, "global_step": 13526, "epoch": 113, "lr": 9.189890385718573e-05} +{"train_loss": 0.007034998387098312, "global_step": 13527, "epoch": 113, "lr": 9.189769480381784e-05} +{"train_loss": 0.007785119581967592, "global_step": 13528, "epoch": 113, "lr": 9.18964856681883e-05} +{"train_loss": 0.007650439161807299, "global_step": 13529, "epoch": 113, "lr": 9.189527645029947e-05} +{"train_loss": 0.00667199632152915, "global_step": 13530, "epoch": 113, "lr": 9.189406715015376e-05} +{"train_loss": 0.006241034250706434, "global_step": 13531, "epoch": 113, "lr": 9.189285776775352e-05} +{"train_loss": 0.007284574210643768, "global_step": 13532, "epoch": 113, "lr": 9.189164830310114e-05} +{"train_loss": 0.011028270237147808, "global_step": 13533, "epoch": 113, "lr": 9.189043875619896e-05} +{"train_loss": 0.009973179548978806, "global_step": 13534, "epoch": 113, "lr": 9.188922912704938e-05} +{"train_loss": 0.007355985697358847, "global_step": 13535, "epoch": 113, "lr": 9.188801941565479e-05} +{"train_loss": 0.008328845724463463, "global_step": 13536, "epoch": 113, "lr": 9.188680962201755e-05} +{"train_loss": 0.008924061432480812, "global_step": 13537, "epoch": 113, "lr": 9.188559974614003e-05} +{"train_loss": 0.008054257370531559, "global_step": 13538, "epoch": 113, "lr": 9.18843897880246e-05} +{"train_loss": 0.00832604244351387, "global_step": 13539, "epoch": 113, "lr": 9.188317974767367e-05} +{"train_loss": 0.013369884341955185, "global_step": 13540, "epoch": 113, "lr": 9.188196962508957e-05} +{"train_loss": 0.005493528209626675, "global_step": 13541, "epoch": 113, "lr": 9.188075942027469e-05} +{"train_loss": 0.007892880588769913, "global_step": 13542, "epoch": 113, "lr": 9.187954913323142e-05} +{"train_loss": 0.008883188478648663, "global_step": 13543, "epoch": 113, "lr": 9.187833876396214e-05} +{"train_loss": 0.013013242743909359, "global_step": 13544, "epoch": 113, "lr": 9.187712831246921e-05} +{"train_loss": 0.0052025048062205315, "global_step": 13545, "epoch": 113, "lr": 9.187591777875502e-05} +{"train_loss": 0.009719336405396461, "global_step": 13546, "epoch": 113, "lr": 9.187470716282192e-05} +{"train_loss": 0.004669103305786848, "global_step": 13547, "epoch": 113, "lr": 9.187349646467232e-05} +{"train_loss": 0.007639114744961262, "global_step": 13548, "epoch": 113, "lr": 9.187228568430858e-05} +{"train_loss": 0.0070234849117696285, "global_step": 13549, "epoch": 113, "lr": 9.187107482173308e-05} +{"train_loss": 0.0075348978862166405, "global_step": 13550, "epoch": 113, "lr": 9.18698638769482e-05} +{"train_loss": 0.00867488607764244, "global_step": 13551, "epoch": 113, "lr": 9.186865284995631e-05} +{"train_loss": 0.006271848920732737, "global_step": 13552, "epoch": 113, "lr": 9.186744174075981e-05} +{"train_loss": 0.008452033624053001, "global_step": 13553, "epoch": 113, "lr": 9.186623054936105e-05} +{"train_loss": 0.007529435213655233, "global_step": 13554, "epoch": 113, "lr": 9.186501927576241e-05} +{"train_loss": 0.00816943496465683, "global_step": 13555, "epoch": 113, "lr": 9.186380791996629e-05} +{"train_loss": 0.010251044295728207, "global_step": 13556, "epoch": 113, "lr": 9.186259648197504e-05} +{"train_loss": 0.005776035599410534, "global_step": 13557, "epoch": 113, "lr": 9.186138496179106e-05} +{"train_loss": 0.010664568282663822, "global_step": 13558, "epoch": 113, "lr": 9.186017335941674e-05} +{"train_loss": 0.008041534572839737, "global_step": 13559, "epoch": 113, "lr": 9.185896167485443e-05} +{"train_loss": 0.007978374138474464, "global_step": 13560, "epoch": 113, "lr": 9.185774990810652e-05} +{"train_loss": 0.008865047246217728, "global_step": 13561, "epoch": 113, "lr": 9.185653805917539e-05} +{"train_loss": 0.009912884794175625, "global_step": 13562, "epoch": 113, "lr": 9.185532612806342e-05} +{"train_loss": 0.00669636158272624, "global_step": 13563, "epoch": 113, "lr": 9.185411411477299e-05} +{"train_loss": 0.007245218846946955, "global_step": 13564, "epoch": 113, "lr": 9.185290201930647e-05} +{"train_loss": 0.007297041984431508, "global_step": 13565, "epoch": 113, "lr": 9.185168984166625e-05, "val_loss": 0.01095745898783207} +{"train_loss": 0.010710272006690502, "global_step": 13566, "epoch": 114, "lr": 9.185047758185472e-05} +{"train_loss": 0.005979942623525858, "global_step": 13567, "epoch": 114, "lr": 9.184926523987423e-05} +{"train_loss": 0.00829117652028799, "global_step": 13568, "epoch": 114, "lr": 9.18480528157272e-05} +{"train_loss": 0.012671091593801975, "global_step": 13569, "epoch": 114, "lr": 9.184684030941598e-05} +{"train_loss": 0.007095531094819307, "global_step": 13570, "epoch": 114, "lr": 9.184562772094296e-05} +{"train_loss": 0.007829083129763603, "global_step": 13571, "epoch": 114, "lr": 9.184441505031052e-05} +{"train_loss": 0.0049636485055089, "global_step": 13572, "epoch": 114, "lr": 9.184320229752104e-05} +{"train_loss": 0.009296148084104061, "global_step": 13573, "epoch": 114, "lr": 9.18419894625769e-05} +{"train_loss": 0.006291472353041172, "global_step": 13574, "epoch": 114, "lr": 9.18407765454805e-05} +{"train_loss": 0.008906293660402298, "global_step": 13575, "epoch": 114, "lr": 9.183956354623417e-05} +{"train_loss": 0.009408664889633656, "global_step": 13576, "epoch": 114, "lr": 9.183835046484035e-05} +{"train_loss": 0.009784871712327003, "global_step": 13577, "epoch": 114, "lr": 9.18371373013014e-05} +{"train_loss": 0.006636689882725477, "global_step": 13578, "epoch": 114, "lr": 9.183592405561969e-05} +{"train_loss": 0.006609659176319838, "global_step": 13579, "epoch": 114, "lr": 9.183471072779763e-05} +{"train_loss": 0.008910538628697395, "global_step": 13580, "epoch": 114, "lr": 9.183349731783759e-05} +{"train_loss": 0.005628481041640043, "global_step": 13581, "epoch": 114, "lr": 9.183228382574192e-05} +{"train_loss": 0.009366623125970364, "global_step": 13582, "epoch": 114, "lr": 9.183107025151306e-05} +{"train_loss": 0.011499356478452682, "global_step": 13583, "epoch": 114, "lr": 9.182985659515333e-05} +{"train_loss": 0.007875656709074974, "global_step": 13584, "epoch": 114, "lr": 9.182864285666516e-05} +{"train_loss": 0.006256630644202232, "global_step": 13585, "epoch": 114, "lr": 9.182742903605092e-05} +{"train_loss": 0.011479837819933891, "global_step": 13586, "epoch": 114, "lr": 9.1826215133313e-05} +{"train_loss": 0.006964430678635836, "global_step": 13587, "epoch": 114, "lr": 9.182500114845376e-05} +{"train_loss": 0.006663308944553137, "global_step": 13588, "epoch": 114, "lr": 9.18237870814756e-05} +{"train_loss": 0.0070175654254853725, "global_step": 13589, "epoch": 114, "lr": 9.18225729323809e-05} +{"train_loss": 0.008560583926737309, "global_step": 13590, "epoch": 114, "lr": 9.182135870117205e-05} +{"train_loss": 0.008564237505197525, "global_step": 13591, "epoch": 114, "lr": 9.182014438785145e-05} +{"train_loss": 0.009600983932614326, "global_step": 13592, "epoch": 114, "lr": 9.181892999242143e-05} +{"train_loss": 0.0058647762052714825, "global_step": 13593, "epoch": 114, "lr": 9.181771551488443e-05} +{"train_loss": 0.007386738900095224, "global_step": 13594, "epoch": 114, "lr": 9.181650095524281e-05} +{"train_loss": 0.005699885077774525, "global_step": 13595, "epoch": 114, "lr": 9.181528631349897e-05} +{"train_loss": 0.005222730804234743, "global_step": 13596, "epoch": 114, "lr": 9.181407158965526e-05} +{"train_loss": 0.008218187838792801, "global_step": 13597, "epoch": 114, "lr": 9.181285678371409e-05} +{"train_loss": 0.011747139506042004, "global_step": 13598, "epoch": 114, "lr": 9.181164189567785e-05} +{"train_loss": 0.008564886637032032, "global_step": 13599, "epoch": 114, "lr": 9.181042692554893e-05} +{"train_loss": 0.008827446028590202, "global_step": 13600, "epoch": 114, "lr": 9.180921187332969e-05} +{"train_loss": 0.006003911141306162, "global_step": 13601, "epoch": 114, "lr": 9.180799673902253e-05} +{"train_loss": 0.004483863711357117, "global_step": 13602, "epoch": 114, "lr": 9.180678152262984e-05} +{"train_loss": 0.01027039997279644, "global_step": 13603, "epoch": 114, "lr": 9.1805566224154e-05} +{"train_loss": 0.004578045569360256, "global_step": 13604, "epoch": 114, "lr": 9.180435084359738e-05} +{"train_loss": 0.00706583634018898, "global_step": 13605, "epoch": 114, "lr": 9.180313538096241e-05} +{"train_loss": 0.009334481321275234, "global_step": 13606, "epoch": 114, "lr": 9.180191983625144e-05} +{"train_loss": 0.008429963141679764, "global_step": 13607, "epoch": 114, "lr": 9.180070420946684e-05} +{"train_loss": 0.008670899085700512, "global_step": 13608, "epoch": 114, "lr": 9.179948850061106e-05} +{"train_loss": 0.00798320583999157, "global_step": 13609, "epoch": 114, "lr": 9.179827270968643e-05} +{"train_loss": 0.012446180917322636, "global_step": 13610, "epoch": 114, "lr": 9.179705683669537e-05} +{"train_loss": 0.00469836313277483, "global_step": 13611, "epoch": 114, "lr": 9.179584088164024e-05} +{"train_loss": 0.008387461304664612, "global_step": 13612, "epoch": 114, "lr": 9.179462484452346e-05} +{"train_loss": 0.010651431046426296, "global_step": 13613, "epoch": 114, "lr": 9.179340872534738e-05} +{"train_loss": 0.010003356263041496, "global_step": 13614, "epoch": 114, "lr": 9.179219252411441e-05} +{"train_loss": 0.004618869628757238, "global_step": 13615, "epoch": 114, "lr": 9.179097624082695e-05} +{"train_loss": 0.005419684108346701, "global_step": 13616, "epoch": 114, "lr": 9.178975987548736e-05} +{"train_loss": 0.00606816541403532, "global_step": 13617, "epoch": 114, "lr": 9.178854342809804e-05} +{"train_loss": 0.006521440111100674, "global_step": 13618, "epoch": 114, "lr": 9.178732689866139e-05} +{"train_loss": 0.007492023054510355, "global_step": 13619, "epoch": 114, "lr": 9.178611028717978e-05} +{"train_loss": 0.005660956725478172, "global_step": 13620, "epoch": 114, "lr": 9.17848935936556e-05} +{"train_loss": 0.01040976494550705, "global_step": 13621, "epoch": 114, "lr": 9.178367681809126e-05} +{"train_loss": 0.00982726737856865, "global_step": 13622, "epoch": 114, "lr": 9.178245996048913e-05} +{"train_loss": 0.006439540069550276, "global_step": 13623, "epoch": 114, "lr": 9.17812430208516e-05} +{"train_loss": 0.008110537193715572, "global_step": 13624, "epoch": 114, "lr": 9.178002599918106e-05} +{"train_loss": 0.0068884058855473995, "global_step": 13625, "epoch": 114, "lr": 9.177880889547991e-05} +{"train_loss": 0.0066195325925946236, "global_step": 13626, "epoch": 114, "lr": 9.177759170975053e-05} +{"train_loss": 0.008454650640487671, "global_step": 13627, "epoch": 114, "lr": 9.177637444199531e-05} +{"train_loss": 0.008735585026443005, "global_step": 13628, "epoch": 114, "lr": 9.177515709221664e-05} +{"train_loss": 0.01062134001404047, "global_step": 13629, "epoch": 114, "lr": 9.177393966041692e-05} +{"train_loss": 0.004452123306691647, "global_step": 13630, "epoch": 114, "lr": 9.177272214659852e-05} +{"train_loss": 0.008938832208514214, "global_step": 13631, "epoch": 114, "lr": 9.177150455076385e-05} +{"train_loss": 0.009672238491475582, "global_step": 13632, "epoch": 114, "lr": 9.177028687291529e-05} +{"train_loss": 0.007396087050437927, "global_step": 13633, "epoch": 114, "lr": 9.176906911305525e-05} +{"train_loss": 0.008166607469320297, "global_step": 13634, "epoch": 114, "lr": 9.176785127118607e-05} +{"train_loss": 0.0057604750618338585, "global_step": 13635, "epoch": 114, "lr": 9.176663334731021e-05} +{"train_loss": 0.006050016265362501, "global_step": 13636, "epoch": 114, "lr": 9.176541534143002e-05} +{"train_loss": 0.008189293555915356, "global_step": 13637, "epoch": 114, "lr": 9.17641972535479e-05} +{"train_loss": 0.0069313873536884785, "global_step": 13638, "epoch": 114, "lr": 9.176297908366624e-05} +{"train_loss": 0.007559890393167734, "global_step": 13639, "epoch": 114, "lr": 9.176176083178743e-05} +{"train_loss": 0.004367384128272533, "global_step": 13640, "epoch": 114, "lr": 9.176054249791386e-05} +{"train_loss": 0.0046713948249816895, "global_step": 13641, "epoch": 114, "lr": 9.175932408204793e-05} +{"train_loss": 0.006262705661356449, "global_step": 13642, "epoch": 114, "lr": 9.175810558419202e-05} +{"train_loss": 0.006997902411967516, "global_step": 13643, "epoch": 114, "lr": 9.175688700434855e-05} +{"train_loss": 0.008086226880550385, "global_step": 13644, "epoch": 114, "lr": 9.175566834251987e-05} +{"train_loss": 0.005657263565808535, "global_step": 13645, "epoch": 114, "lr": 9.17544495987084e-05} +{"train_loss": 0.006995081901550293, "global_step": 13646, "epoch": 114, "lr": 9.175323077291655e-05} +{"train_loss": 0.007182011380791664, "global_step": 13647, "epoch": 114, "lr": 9.175201186514668e-05} +{"train_loss": 0.007159008644521236, "global_step": 13648, "epoch": 114, "lr": 9.175079287540118e-05} +{"train_loss": 0.00840233825147152, "global_step": 13649, "epoch": 114, "lr": 9.174957380368247e-05} +{"train_loss": 0.009051111526787281, "global_step": 13650, "epoch": 114, "lr": 9.174835464999294e-05} +{"train_loss": 0.008222325704991817, "global_step": 13651, "epoch": 114, "lr": 9.174713541433498e-05} +{"train_loss": 0.005867369938641787, "global_step": 13652, "epoch": 114, "lr": 9.174591609671096e-05} +{"train_loss": 0.008633268065750599, "global_step": 13653, "epoch": 114, "lr": 9.174469669712331e-05} +{"train_loss": 0.007067174185067415, "global_step": 13654, "epoch": 114, "lr": 9.174347721557441e-05} +{"train_loss": 0.0061186389066278934, "global_step": 13655, "epoch": 114, "lr": 9.174225765206664e-05} +{"train_loss": 0.00988946296274662, "global_step": 13656, "epoch": 114, "lr": 9.174103800660241e-05} +{"train_loss": 0.007127421908080578, "global_step": 13657, "epoch": 114, "lr": 9.173981827918411e-05} +{"train_loss": 0.004904272500425577, "global_step": 13658, "epoch": 114, "lr": 9.173859846981415e-05} +{"train_loss": 0.0063041155226528645, "global_step": 13659, "epoch": 114, "lr": 9.17373785784949e-05} +{"train_loss": 0.006507920566946268, "global_step": 13660, "epoch": 114, "lr": 9.173615860522875e-05} +{"train_loss": 0.006899897009134293, "global_step": 13661, "epoch": 114, "lr": 9.173493855001814e-05} +{"train_loss": 0.005431027617305517, "global_step": 13662, "epoch": 114, "lr": 9.173371841286541e-05} +{"train_loss": 0.006147449836134911, "global_step": 13663, "epoch": 114, "lr": 9.1732498193773e-05} +{"train_loss": 0.008169800974428654, "global_step": 13664, "epoch": 114, "lr": 9.173127789274329e-05} +{"train_loss": 0.005638453643769026, "global_step": 13665, "epoch": 114, "lr": 9.173005750977865e-05} +{"train_loss": 0.008492718450725079, "global_step": 13666, "epoch": 114, "lr": 9.172883704488153e-05} +{"train_loss": 0.005752069875597954, "global_step": 13667, "epoch": 114, "lr": 9.172761649805428e-05} +{"train_loss": 0.007420394569635391, "global_step": 13668, "epoch": 114, "lr": 9.172639586929932e-05} +{"train_loss": 0.007967066951096058, "global_step": 13669, "epoch": 114, "lr": 9.172517515861903e-05} +{"train_loss": 0.009507367387413979, "global_step": 13670, "epoch": 114, "lr": 9.172395436601582e-05} +{"train_loss": 0.006769957952201366, "global_step": 13671, "epoch": 114, "lr": 9.17227334914921e-05} +{"train_loss": 0.005458606872707605, "global_step": 13672, "epoch": 114, "lr": 9.172151253505023e-05} +{"train_loss": 0.008309721946716309, "global_step": 13673, "epoch": 114, "lr": 9.172029149669264e-05} +{"train_loss": 0.008190600201487541, "global_step": 13674, "epoch": 114, "lr": 9.171907037642171e-05} +{"train_loss": 0.006633219309151173, "global_step": 13675, "epoch": 114, "lr": 9.171784917423984e-05} +{"train_loss": 0.0074204495176672935, "global_step": 13676, "epoch": 114, "lr": 9.171662789014943e-05} +{"train_loss": 0.006448924075812101, "global_step": 13677, "epoch": 114, "lr": 9.17154065241529e-05} +{"train_loss": 0.005151764955371618, "global_step": 13678, "epoch": 114, "lr": 9.171418507625259e-05} +{"train_loss": 0.005939506459981203, "global_step": 13679, "epoch": 114, "lr": 9.171296354645095e-05} +{"train_loss": 0.007252473849803209, "global_step": 13680, "epoch": 114, "lr": 9.171174193475036e-05} +{"train_loss": 0.006638550665229559, "global_step": 13681, "epoch": 114, "lr": 9.171052024115323e-05} +{"train_loss": 0.005628389772027731, "global_step": 13682, "epoch": 114, "lr": 9.170929846566195e-05} +{"train_loss": 0.011219063773751259, "global_step": 13683, "epoch": 114, "lr": 9.17080766082789e-05} +{"train_loss": 0.007522322847938337, "global_step": 13684, "epoch": 114, "lr": 9.17068546690065e-05, "val_loss": 0.014730164781212807} +{"train_loss": 0.007557186298072338, "global_step": 13685, "epoch": 115, "lr": 9.170563264784716e-05} +{"train_loss": 0.00786003191024065, "global_step": 13686, "epoch": 115, "lr": 9.170441054480326e-05} +{"train_loss": 0.011591453105211258, "global_step": 13687, "epoch": 115, "lr": 9.170318835987721e-05} +{"train_loss": 0.013519414700567722, "global_step": 13688, "epoch": 115, "lr": 9.17019660930714e-05} +{"train_loss": 0.004405982792377472, "global_step": 13689, "epoch": 115, "lr": 9.170074374438824e-05} +{"train_loss": 0.007059973664581776, "global_step": 13690, "epoch": 115, "lr": 9.169952131383012e-05} +{"train_loss": 0.0073338462971150875, "global_step": 13691, "epoch": 115, "lr": 9.169829880139944e-05} +{"train_loss": 0.006226350553333759, "global_step": 13692, "epoch": 115, "lr": 9.169707620709861e-05} +{"train_loss": 0.006154340226203203, "global_step": 13693, "epoch": 115, "lr": 9.169585353093002e-05} +{"train_loss": 0.00811843853443861, "global_step": 13694, "epoch": 115, "lr": 9.169463077289608e-05} +{"train_loss": 0.008332016877830029, "global_step": 13695, "epoch": 115, "lr": 9.169340793299919e-05} +{"train_loss": 0.0065409536473453045, "global_step": 13696, "epoch": 115, "lr": 9.169218501124176e-05} +{"train_loss": 0.0057810707949101925, "global_step": 13697, "epoch": 115, "lr": 9.169096200762617e-05} +{"train_loss": 0.006904405541718006, "global_step": 13698, "epoch": 115, "lr": 9.168973892215482e-05} +{"train_loss": 0.012469283305108547, "global_step": 13699, "epoch": 115, "lr": 9.168851575483013e-05} +{"train_loss": 0.009201433509588242, "global_step": 13700, "epoch": 115, "lr": 9.168729250565448e-05} +{"train_loss": 0.007183625362813473, "global_step": 13701, "epoch": 115, "lr": 9.16860691746303e-05} +{"train_loss": 0.009989466518163681, "global_step": 13702, "epoch": 115, "lr": 9.168484576175997e-05} +{"train_loss": 0.00989128090441227, "global_step": 13703, "epoch": 115, "lr": 9.168362226704591e-05} +{"train_loss": 0.006182086654007435, "global_step": 13704, "epoch": 115, "lr": 9.16823986904905e-05} +{"train_loss": 0.00417538546025753, "global_step": 13705, "epoch": 115, "lr": 9.168117503209616e-05} +{"train_loss": 0.010199004784226418, "global_step": 13706, "epoch": 115, "lr": 9.167995129186527e-05} +{"train_loss": 0.006530777085572481, "global_step": 13707, "epoch": 115, "lr": 9.167872746980026e-05} +{"train_loss": 0.011313652619719505, "global_step": 13708, "epoch": 115, "lr": 9.167750356590352e-05} +{"train_loss": 0.006795520428568125, "global_step": 13709, "epoch": 115, "lr": 9.167627958017746e-05} +{"train_loss": 0.008741103112697601, "global_step": 13710, "epoch": 115, "lr": 9.167505551262448e-05} +{"train_loss": 0.007126572076231241, "global_step": 13711, "epoch": 115, "lr": 9.167383136324696e-05} +{"train_loss": 0.00757265742868185, "global_step": 13712, "epoch": 115, "lr": 9.167260713204735e-05} +{"train_loss": 0.005832655820995569, "global_step": 13713, "epoch": 115, "lr": 9.167138281902801e-05} +{"train_loss": 0.009655630216002464, "global_step": 13714, "epoch": 115, "lr": 9.167015842419136e-05} +{"train_loss": 0.007320774719119072, "global_step": 13715, "epoch": 115, "lr": 9.166893394753982e-05} +{"train_loss": 0.012177848257124424, "global_step": 13716, "epoch": 115, "lr": 9.166770938907578e-05} +{"train_loss": 0.00839180126786232, "global_step": 13717, "epoch": 115, "lr": 9.166648474880163e-05} +{"train_loss": 0.006142825353890657, "global_step": 13718, "epoch": 115, "lr": 9.16652600267198e-05} +{"train_loss": 0.00948421098291874, "global_step": 13719, "epoch": 115, "lr": 9.166403522283268e-05} +{"train_loss": 0.004235687665641308, "global_step": 13720, "epoch": 115, "lr": 9.166281033714267e-05} +{"train_loss": 0.01160554401576519, "global_step": 13721, "epoch": 115, "lr": 9.16615853696522e-05} +{"train_loss": 0.005591068882495165, "global_step": 13722, "epoch": 115, "lr": 9.166036032036365e-05} +{"train_loss": 0.00851783249527216, "global_step": 13723, "epoch": 115, "lr": 9.165913518927942e-05} +{"train_loss": 0.008932316675782204, "global_step": 13724, "epoch": 115, "lr": 9.165790997640194e-05} +{"train_loss": 0.006413010414689779, "global_step": 13725, "epoch": 115, "lr": 9.165668468173361e-05} +{"train_loss": 0.006847696844488382, "global_step": 13726, "epoch": 115, "lr": 9.165545930527681e-05} +{"train_loss": 0.00986996479332447, "global_step": 13727, "epoch": 115, "lr": 9.1654233847034e-05} +{"train_loss": 0.006697273813188076, "global_step": 13728, "epoch": 115, "lr": 9.165300830700753e-05} +{"train_loss": 0.008922024630010128, "global_step": 13729, "epoch": 115, "lr": 9.165178268519982e-05} +{"train_loss": 0.006857177242636681, "global_step": 13730, "epoch": 115, "lr": 9.165055698161329e-05} +{"train_loss": 0.009359261952340603, "global_step": 13731, "epoch": 115, "lr": 9.164933119625036e-05} +{"train_loss": 0.006947188172489405, "global_step": 13732, "epoch": 115, "lr": 9.164810532911339e-05} +{"train_loss": 0.009188045747578144, "global_step": 13733, "epoch": 115, "lr": 9.164687938020483e-05} +{"train_loss": 0.010241519659757614, "global_step": 13734, "epoch": 115, "lr": 9.164565334952709e-05} +{"train_loss": 0.007213585544377565, "global_step": 13735, "epoch": 115, "lr": 9.164442723708254e-05} +{"train_loss": 0.007371187675744295, "global_step": 13736, "epoch": 115, "lr": 9.164320104287358e-05} +{"train_loss": 0.009059276431798935, "global_step": 13737, "epoch": 115, "lr": 9.164197476690268e-05} +{"train_loss": 0.006617083679884672, "global_step": 13738, "epoch": 115, "lr": 9.16407484091722e-05} +{"train_loss": 0.008051758632063866, "global_step": 13739, "epoch": 115, "lr": 9.163952196968455e-05} +{"train_loss": 0.005637721624225378, "global_step": 13740, "epoch": 115, "lr": 9.163829544844215e-05} +{"train_loss": 0.008066149428486824, "global_step": 13741, "epoch": 115, "lr": 9.163706884544743e-05} +{"train_loss": 0.007916374132037163, "global_step": 13742, "epoch": 115, "lr": 9.163584216070275e-05} +{"train_loss": 0.007786291651427746, "global_step": 13743, "epoch": 115, "lr": 9.163461539421055e-05} +{"train_loss": 0.005071911029517651, "global_step": 13744, "epoch": 115, "lr": 9.163338854597324e-05} +{"train_loss": 0.007215702440589666, "global_step": 13745, "epoch": 115, "lr": 9.163216161599319e-05} +{"train_loss": 0.010888774879276752, "global_step": 13746, "epoch": 115, "lr": 9.163093460427285e-05} +{"train_loss": 0.007477725390344858, "global_step": 13747, "epoch": 115, "lr": 9.162970751081464e-05} +{"train_loss": 0.008868569508194923, "global_step": 13748, "epoch": 115, "lr": 9.162848033562091e-05} +{"train_loss": 0.011324076913297176, "global_step": 13749, "epoch": 115, "lr": 9.162725307869413e-05} +{"train_loss": 0.00766673544421792, "global_step": 13750, "epoch": 115, "lr": 9.16260257400367e-05} +{"train_loss": 0.00807286985218525, "global_step": 13751, "epoch": 115, "lr": 9.162479831965099e-05} +{"train_loss": 0.007290683686733246, "global_step": 13752, "epoch": 115, "lr": 9.162357081753942e-05} +{"train_loss": 0.0073357536457479, "global_step": 13753, "epoch": 115, "lr": 9.162234323370445e-05} +{"train_loss": 0.007365432567894459, "global_step": 13754, "epoch": 115, "lr": 9.162111556814846e-05} +{"train_loss": 0.008484583348035812, "global_step": 13755, "epoch": 115, "lr": 9.161988782087383e-05} +{"train_loss": 0.006753379013389349, "global_step": 13756, "epoch": 115, "lr": 9.1618659991883e-05} +{"train_loss": 0.005795163102447987, "global_step": 13757, "epoch": 115, "lr": 9.161743208117839e-05} +{"train_loss": 0.008545615710318089, "global_step": 13758, "epoch": 115, "lr": 9.16162040887624e-05} +{"train_loss": 0.00891890749335289, "global_step": 13759, "epoch": 115, "lr": 9.161497601463742e-05} +{"train_loss": 0.007835721597075462, "global_step": 13760, "epoch": 115, "lr": 9.16137478588059e-05} +{"train_loss": 0.006229585036635399, "global_step": 13761, "epoch": 115, "lr": 9.161251962127022e-05} +{"train_loss": 0.007261105813086033, "global_step": 13762, "epoch": 115, "lr": 9.16112913020328e-05} +{"train_loss": 0.013181256130337715, "global_step": 13763, "epoch": 115, "lr": 9.161006290109607e-05} +{"train_loss": 0.0048278933390975, "global_step": 13764, "epoch": 115, "lr": 9.160883441846242e-05} +{"train_loss": 0.0064324685372412205, "global_step": 13765, "epoch": 115, "lr": 9.160760585413427e-05} +{"train_loss": 0.00838707759976387, "global_step": 13766, "epoch": 115, "lr": 9.160637720811403e-05} +{"train_loss": 0.007462328299880028, "global_step": 13767, "epoch": 115, "lr": 9.160514848040411e-05} +{"train_loss": 0.006430462468415499, "global_step": 13768, "epoch": 115, "lr": 9.160391967100694e-05} +{"train_loss": 0.01039398368448019, "global_step": 13769, "epoch": 115, "lr": 9.160269077992489e-05} +{"train_loss": 0.007871124893426895, "global_step": 13770, "epoch": 115, "lr": 9.160146180716043e-05} +{"train_loss": 0.004287106450647116, "global_step": 13771, "epoch": 115, "lr": 9.160023275271594e-05} +{"train_loss": 0.007117814384400845, "global_step": 13772, "epoch": 115, "lr": 9.159900361659382e-05} +{"train_loss": 0.008764315396547318, "global_step": 13773, "epoch": 115, "lr": 9.159777439879651e-05} +{"train_loss": 0.006130652967840433, "global_step": 13774, "epoch": 115, "lr": 9.159654509932642e-05} +{"train_loss": 0.009000981226563454, "global_step": 13775, "epoch": 115, "lr": 9.159531571818595e-05} +{"train_loss": 0.005089703481644392, "global_step": 13776, "epoch": 115, "lr": 9.159408625537752e-05} +{"train_loss": 0.00474696047604084, "global_step": 13777, "epoch": 115, "lr": 9.159285671090354e-05} +{"train_loss": 0.005545722786337137, "global_step": 13778, "epoch": 115, "lr": 9.159162708476645e-05} +{"train_loss": 0.005580542609095573, "global_step": 13779, "epoch": 115, "lr": 9.159039737696863e-05} +{"train_loss": 0.005967522505670786, "global_step": 13780, "epoch": 115, "lr": 9.15891675875125e-05} +{"train_loss": 0.007065734826028347, "global_step": 13781, "epoch": 115, "lr": 9.15879377164005e-05} +{"train_loss": 0.006452594418078661, "global_step": 13782, "epoch": 115, "lr": 9.158670776363503e-05} +{"train_loss": 0.007440181914716959, "global_step": 13783, "epoch": 115, "lr": 9.158547772921849e-05} +{"train_loss": 0.007633741945028305, "global_step": 13784, "epoch": 115, "lr": 9.15842476131533e-05} +{"train_loss": 0.005624871235340834, "global_step": 13785, "epoch": 115, "lr": 9.15830174154419e-05} +{"train_loss": 0.007677455432713032, "global_step": 13786, "epoch": 115, "lr": 9.158178713608667e-05} +{"train_loss": 0.005017010495066643, "global_step": 13787, "epoch": 115, "lr": 9.158055677509005e-05} +{"train_loss": 0.006755535956472158, "global_step": 13788, "epoch": 115, "lr": 9.157932633245445e-05} +{"train_loss": 0.0033360286615788937, "global_step": 13789, "epoch": 115, "lr": 9.15780958081823e-05} +{"train_loss": 0.005962835159152746, "global_step": 13790, "epoch": 115, "lr": 9.157686520227597e-05} +{"train_loss": 0.007568798027932644, "global_step": 13791, "epoch": 115, "lr": 9.157563451473794e-05} +{"train_loss": 0.004862781148403883, "global_step": 13792, "epoch": 115, "lr": 9.157440374557057e-05} +{"train_loss": 0.005295508075505495, "global_step": 13793, "epoch": 115, "lr": 9.157317289477632e-05} +{"train_loss": 0.00828618835657835, "global_step": 13794, "epoch": 115, "lr": 9.157194196235757e-05} +{"train_loss": 0.006027583964169025, "global_step": 13795, "epoch": 115, "lr": 9.157071094831676e-05} +{"train_loss": 0.006203389726579189, "global_step": 13796, "epoch": 115, "lr": 9.15694798526563e-05} +{"train_loss": 0.006250280421227217, "global_step": 13797, "epoch": 115, "lr": 9.156824867537859e-05} +{"train_loss": 0.005379030015319586, "global_step": 13798, "epoch": 115, "lr": 9.156701741648607e-05} +{"train_loss": 0.004650485701858997, "global_step": 13799, "epoch": 115, "lr": 9.156578607598117e-05} +{"train_loss": 0.008446215651929379, "global_step": 13800, "epoch": 115, "lr": 9.156455465386629e-05} +{"train_loss": 0.00515957735478878, "global_step": 13801, "epoch": 115, "lr": 9.156332315014384e-05} +{"train_loss": 0.01046459935605526, "global_step": 13802, "epoch": 115, "lr": 9.156209156481624e-05} +{"train_loss": 0.007509067517650478, "global_step": 13803, "epoch": 115, "lr": 9.156085989788593e-05, "val_loss": 0.015030918642878532, "train_action_mse_error": 0.00024774414487183094} +{"train_loss": 0.008714307099580765, "global_step": 13804, "epoch": 116, "lr": 9.155962814935528e-05} +{"train_loss": 0.010815282352268696, "global_step": 13805, "epoch": 116, "lr": 9.155839631922676e-05} +{"train_loss": 0.005415152292698622, "global_step": 13806, "epoch": 116, "lr": 9.155716440750277e-05} +{"train_loss": 0.007771859411150217, "global_step": 13807, "epoch": 116, "lr": 9.155593241418572e-05} +{"train_loss": 0.009596260264515877, "global_step": 13808, "epoch": 116, "lr": 9.155470033927804e-05} +{"train_loss": 0.009647812694311142, "global_step": 13809, "epoch": 116, "lr": 9.155346818278217e-05} +{"train_loss": 0.0049767764285206795, "global_step": 13810, "epoch": 116, "lr": 9.155223594470047e-05} +{"train_loss": 0.00635855458676815, "global_step": 13811, "epoch": 116, "lr": 9.155100362503542e-05} +{"train_loss": 0.006894736550748348, "global_step": 13812, "epoch": 116, "lr": 9.154977122378938e-05} +{"train_loss": 0.007924849167466164, "global_step": 13813, "epoch": 116, "lr": 9.154853874096483e-05} +{"train_loss": 0.007709406781941652, "global_step": 13814, "epoch": 116, "lr": 9.154730617656415e-05} +{"train_loss": 0.007833950221538544, "global_step": 13815, "epoch": 116, "lr": 9.154607353058979e-05} +{"train_loss": 0.0071591599844396114, "global_step": 13816, "epoch": 116, "lr": 9.154484080304414e-05} +{"train_loss": 0.006913565564900637, "global_step": 13817, "epoch": 116, "lr": 9.154360799392963e-05} +{"train_loss": 0.008373063057661057, "global_step": 13818, "epoch": 116, "lr": 9.154237510324869e-05} +{"train_loss": 0.006780822761356831, "global_step": 13819, "epoch": 116, "lr": 9.154114213100373e-05} +{"train_loss": 0.0059295776300132275, "global_step": 13820, "epoch": 116, "lr": 9.153990907719718e-05} +{"train_loss": 0.006300750654190779, "global_step": 13821, "epoch": 116, "lr": 9.153867594183145e-05} +{"train_loss": 0.007640701252967119, "global_step": 13822, "epoch": 116, "lr": 9.153744272490898e-05} +{"train_loss": 0.00536005012691021, "global_step": 13823, "epoch": 116, "lr": 9.153620942643217e-05} +{"train_loss": 0.004942054394632578, "global_step": 13824, "epoch": 116, "lr": 9.153497604640344e-05} +{"train_loss": 0.005852710921317339, "global_step": 13825, "epoch": 116, "lr": 9.153374258482526e-05} +{"train_loss": 0.004963675979524851, "global_step": 13826, "epoch": 116, "lr": 9.153250904169998e-05} +{"train_loss": 0.006650377996265888, "global_step": 13827, "epoch": 116, "lr": 9.153127541703006e-05} +{"train_loss": 0.007502769120037556, "global_step": 13828, "epoch": 116, "lr": 9.153004171081792e-05} +{"train_loss": 0.0057452889159321785, "global_step": 13829, "epoch": 116, "lr": 9.152880792306597e-05} +{"train_loss": 0.005882796831429005, "global_step": 13830, "epoch": 116, "lr": 9.152757405377665e-05} +{"train_loss": 0.009175335057079792, "global_step": 13831, "epoch": 116, "lr": 9.15263401029524e-05} +{"train_loss": 0.005414315965026617, "global_step": 13832, "epoch": 116, "lr": 9.152510607059559e-05} +{"train_loss": 0.005895728711038828, "global_step": 13833, "epoch": 116, "lr": 9.152387195670867e-05} +{"train_loss": 0.006498717702925205, "global_step": 13834, "epoch": 116, "lr": 9.152263776129407e-05} +{"train_loss": 0.011348792351782322, "global_step": 13835, "epoch": 116, "lr": 9.152140348435421e-05} +{"train_loss": 0.00813690759241581, "global_step": 13836, "epoch": 116, "lr": 9.152016912589149e-05} +{"train_loss": 0.0037325622979551554, "global_step": 13837, "epoch": 116, "lr": 9.151893468590838e-05} +{"train_loss": 0.0074830930680036545, "global_step": 13838, "epoch": 116, "lr": 9.151770016440729e-05} +{"train_loss": 0.0043589165434241295, "global_step": 13839, "epoch": 116, "lr": 9.15164655613906e-05} +{"train_loss": 0.007894891314208508, "global_step": 13840, "epoch": 116, "lr": 9.151523087686077e-05} +{"train_loss": 0.00606208760291338, "global_step": 13841, "epoch": 116, "lr": 9.151399611082023e-05} +{"train_loss": 0.006205917336046696, "global_step": 13842, "epoch": 116, "lr": 9.151276126327137e-05} +{"train_loss": 0.00824084784835577, "global_step": 13843, "epoch": 116, "lr": 9.151152633421667e-05} +{"train_loss": 0.004792119842022657, "global_step": 13844, "epoch": 116, "lr": 9.15102913236585e-05} +{"train_loss": 0.006968209054321051, "global_step": 13845, "epoch": 116, "lr": 9.150905623159933e-05} +{"train_loss": 0.00821119174361229, "global_step": 13846, "epoch": 116, "lr": 9.150782105804155e-05} +{"train_loss": 0.007194031961262226, "global_step": 13847, "epoch": 116, "lr": 9.15065858029876e-05} +{"train_loss": 0.006371240597218275, "global_step": 13848, "epoch": 116, "lr": 9.150535046643988e-05} +{"train_loss": 0.0064169433899223804, "global_step": 13849, "epoch": 116, "lr": 9.150411504840086e-05} +{"train_loss": 0.006873188074678183, "global_step": 13850, "epoch": 116, "lr": 9.150287954887295e-05} +{"train_loss": 0.009997762739658356, "global_step": 13851, "epoch": 116, "lr": 9.150164396785856e-05} +{"train_loss": 0.008943366818130016, "global_step": 13852, "epoch": 116, "lr": 9.150040830536013e-05} +{"train_loss": 0.004651613533496857, "global_step": 13853, "epoch": 116, "lr": 9.149917256138007e-05} +{"train_loss": 0.009237219579517841, "global_step": 13854, "epoch": 116, "lr": 9.149793673592084e-05} +{"train_loss": 0.00840589590370655, "global_step": 13855, "epoch": 116, "lr": 9.149670082898483e-05} +{"train_loss": 0.005474886391311884, "global_step": 13856, "epoch": 116, "lr": 9.149546484057448e-05} +{"train_loss": 0.006414999254047871, "global_step": 13857, "epoch": 116, "lr": 9.149422877069222e-05} +{"train_loss": 0.009094229899346828, "global_step": 13858, "epoch": 116, "lr": 9.149299261934048e-05} +{"train_loss": 0.00604975875467062, "global_step": 13859, "epoch": 116, "lr": 9.149175638652169e-05} +{"train_loss": 0.005561499856412411, "global_step": 13860, "epoch": 116, "lr": 9.149052007223825e-05} +{"train_loss": 0.00922462623566389, "global_step": 13861, "epoch": 116, "lr": 9.14892836764926e-05} +{"train_loss": 0.007366890553385019, "global_step": 13862, "epoch": 116, "lr": 9.14880471992872e-05} +{"train_loss": 0.010637537576258183, "global_step": 13863, "epoch": 116, "lr": 9.148681064062445e-05} +{"train_loss": 0.00907018594443798, "global_step": 13864, "epoch": 116, "lr": 9.148557400050676e-05} +{"train_loss": 0.005386227276176214, "global_step": 13865, "epoch": 116, "lr": 9.14843372789366e-05} +{"train_loss": 0.008009975776076317, "global_step": 13866, "epoch": 116, "lr": 9.148310047591636e-05} +{"train_loss": 0.007781181950122118, "global_step": 13867, "epoch": 116, "lr": 9.148186359144847e-05} +{"train_loss": 0.007801422383636236, "global_step": 13868, "epoch": 116, "lr": 9.148062662553541e-05} +{"train_loss": 0.006531313993036747, "global_step": 13869, "epoch": 116, "lr": 9.147938957817954e-05} +{"train_loss": 0.006468160077929497, "global_step": 13870, "epoch": 116, "lr": 9.147815244938334e-05} +{"train_loss": 0.005997075699269772, "global_step": 13871, "epoch": 116, "lr": 9.14769152391492e-05} +{"train_loss": 0.008215508423745632, "global_step": 13872, "epoch": 116, "lr": 9.147567794747958e-05} +{"train_loss": 0.006795641966164112, "global_step": 13873, "epoch": 116, "lr": 9.147444057437689e-05} +{"train_loss": 0.006613429170101881, "global_step": 13874, "epoch": 116, "lr": 9.147320311984357e-05} +{"train_loss": 0.006277330685406923, "global_step": 13875, "epoch": 116, "lr": 9.147196558388206e-05} +{"train_loss": 0.009855653159320354, "global_step": 13876, "epoch": 116, "lr": 9.147072796649476e-05} +{"train_loss": 0.005331030115485191, "global_step": 13877, "epoch": 116, "lr": 9.146949026768412e-05} +{"train_loss": 0.007469947449862957, "global_step": 13878, "epoch": 116, "lr": 9.146825248745256e-05} +{"train_loss": 0.007734646555036306, "global_step": 13879, "epoch": 116, "lr": 9.146701462580253e-05} +{"train_loss": 0.004287221934646368, "global_step": 13880, "epoch": 116, "lr": 9.146577668273644e-05} +{"train_loss": 0.006184224970638752, "global_step": 13881, "epoch": 116, "lr": 9.146453865825673e-05} +{"train_loss": 0.004696215037256479, "global_step": 13882, "epoch": 116, "lr": 9.146330055236583e-05} +{"train_loss": 0.0053001451306045055, "global_step": 13883, "epoch": 116, "lr": 9.146206236506615e-05} +{"train_loss": 0.004898216109722853, "global_step": 13884, "epoch": 116, "lr": 9.146082409636017e-05} +{"train_loss": 0.006720343139022589, "global_step": 13885, "epoch": 116, "lr": 9.145958574625027e-05} +{"train_loss": 0.006215386558324099, "global_step": 13886, "epoch": 116, "lr": 9.145834731473892e-05} +{"train_loss": 0.003629526821896434, "global_step": 13887, "epoch": 116, "lr": 9.145710880182851e-05} +{"train_loss": 0.005687023047357798, "global_step": 13888, "epoch": 116, "lr": 9.14558702075215e-05} +{"train_loss": 0.006101527251303196, "global_step": 13889, "epoch": 116, "lr": 9.145463153182035e-05} +{"train_loss": 0.004201066680252552, "global_step": 13890, "epoch": 116, "lr": 9.145339277472744e-05} +{"train_loss": 0.005171085242182016, "global_step": 13891, "epoch": 116, "lr": 9.14521539362452e-05} +{"train_loss": 0.007611505687236786, "global_step": 13892, "epoch": 116, "lr": 9.14509150163761e-05} +{"train_loss": 0.0035472337622195482, "global_step": 13893, "epoch": 116, "lr": 9.144967601512258e-05} +{"train_loss": 0.0077075837180018425, "global_step": 13894, "epoch": 116, "lr": 9.144843693248701e-05} +{"train_loss": 0.005040138028562069, "global_step": 13895, "epoch": 116, "lr": 9.14471977684719e-05} +{"train_loss": 0.009445805102586746, "global_step": 13896, "epoch": 116, "lr": 9.144595852307962e-05} +{"train_loss": 0.008684579282999039, "global_step": 13897, "epoch": 116, "lr": 9.144471919631264e-05} +{"train_loss": 0.005057002883404493, "global_step": 13898, "epoch": 116, "lr": 9.144347978817337e-05} +{"train_loss": 0.003758873324841261, "global_step": 13899, "epoch": 116, "lr": 9.144224029866426e-05} +{"train_loss": 0.007497916463762522, "global_step": 13900, "epoch": 116, "lr": 9.144100072778774e-05} +{"train_loss": 0.00516080018132925, "global_step": 13901, "epoch": 116, "lr": 9.143976107554624e-05} +{"train_loss": 0.005526166874915361, "global_step": 13902, "epoch": 116, "lr": 9.143852134194219e-05} +{"train_loss": 0.006703088525682688, "global_step": 13903, "epoch": 116, "lr": 9.143728152697805e-05} +{"train_loss": 0.006561290938407183, "global_step": 13904, "epoch": 116, "lr": 9.143604163065622e-05} +{"train_loss": 0.006111564114689827, "global_step": 13905, "epoch": 116, "lr": 9.143480165297915e-05} +{"train_loss": 0.00422446895390749, "global_step": 13906, "epoch": 116, "lr": 9.143356159394929e-05} +{"train_loss": 0.006227521225810051, "global_step": 13907, "epoch": 116, "lr": 9.143232145356903e-05} +{"train_loss": 0.005589346867054701, "global_step": 13908, "epoch": 116, "lr": 9.143108123184086e-05} +{"train_loss": 0.007513043936342001, "global_step": 13909, "epoch": 116, "lr": 9.142984092876718e-05} +{"train_loss": 0.006403549574315548, "global_step": 13910, "epoch": 116, "lr": 9.142860054435043e-05} +{"train_loss": 0.010167721658945084, "global_step": 13911, "epoch": 116, "lr": 9.142736007859305e-05} +{"train_loss": 0.006035367958247662, "global_step": 13912, "epoch": 116, "lr": 9.142611953149747e-05} +{"train_loss": 0.0055015855468809605, "global_step": 13913, "epoch": 116, "lr": 9.142487890306613e-05} +{"train_loss": 0.00788805540651083, "global_step": 13914, "epoch": 116, "lr": 9.142363819330146e-05} +{"train_loss": 0.006570971105247736, "global_step": 13915, "epoch": 116, "lr": 9.142239740220592e-05} +{"train_loss": 0.007006040774285793, "global_step": 13916, "epoch": 116, "lr": 9.142115652978191e-05} +{"train_loss": 0.006312842946499586, "global_step": 13917, "epoch": 116, "lr": 9.141991557603189e-05} +{"train_loss": 0.01023523323237896, "global_step": 13918, "epoch": 116, "lr": 9.14186745409583e-05} +{"train_loss": 0.0049824099987745285, "global_step": 13919, "epoch": 116, "lr": 9.141743342456357e-05} +{"train_loss": 0.010327566415071487, "global_step": 13920, "epoch": 116, "lr": 9.141619222685011e-05} +{"train_loss": 0.007222680374979973, "global_step": 13921, "epoch": 116, "lr": 9.14149509478204e-05} +{"train_loss": 0.006856802402909438, "global_step": 13922, "epoch": 116, "lr": 9.141370958747686e-05, "val_loss": 0.02382788434624672} +{"train_loss": 0.006760288495570421, "global_step": 13923, "epoch": 117, "lr": 9.141246814582191e-05} +{"train_loss": 0.004701223224401474, "global_step": 13924, "epoch": 117, "lr": 9.141122662285802e-05} +{"train_loss": 0.009065907448530197, "global_step": 13925, "epoch": 117, "lr": 9.14099850185876e-05} +{"train_loss": 0.005886911414563656, "global_step": 13926, "epoch": 117, "lr": 9.14087433330131e-05} +{"train_loss": 0.0032194831874221563, "global_step": 13927, "epoch": 117, "lr": 9.140750156613697e-05} +{"train_loss": 0.006920911837369204, "global_step": 13928, "epoch": 117, "lr": 9.140625971796161e-05} +{"train_loss": 0.008515764959156513, "global_step": 13929, "epoch": 117, "lr": 9.140501778848951e-05} +{"train_loss": 0.007099617272615433, "global_step": 13930, "epoch": 117, "lr": 9.140377577772307e-05} +{"train_loss": 0.006611557211726904, "global_step": 13931, "epoch": 117, "lr": 9.140253368566474e-05} +{"train_loss": 0.008505125530064106, "global_step": 13932, "epoch": 117, "lr": 9.140129151231696e-05} +{"train_loss": 0.0058019524440169334, "global_step": 13933, "epoch": 117, "lr": 9.140004925768215e-05} +{"train_loss": 0.010381072759628296, "global_step": 13934, "epoch": 117, "lr": 9.139880692176277e-05} +{"train_loss": 0.007848196662962437, "global_step": 13935, "epoch": 117, "lr": 9.139756450456128e-05} +{"train_loss": 0.007212198339402676, "global_step": 13936, "epoch": 117, "lr": 9.139632200608007e-05} +{"train_loss": 0.005595637951046228, "global_step": 13937, "epoch": 117, "lr": 9.139507942632161e-05} +{"train_loss": 0.00876682996749878, "global_step": 13938, "epoch": 117, "lr": 9.139383676528835e-05} +{"train_loss": 0.007554222829639912, "global_step": 13939, "epoch": 117, "lr": 9.13925940229827e-05} +{"train_loss": 0.00682356720790267, "global_step": 13940, "epoch": 117, "lr": 9.139135119940711e-05} +{"train_loss": 0.005508371163159609, "global_step": 13941, "epoch": 117, "lr": 9.139010829456402e-05} +{"train_loss": 0.008121798746287823, "global_step": 13942, "epoch": 117, "lr": 9.13888653084559e-05} +{"train_loss": 0.005311067681759596, "global_step": 13943, "epoch": 117, "lr": 9.138762224108514e-05} +{"train_loss": 0.007891400717198849, "global_step": 13944, "epoch": 117, "lr": 9.138637909245421e-05} +{"train_loss": 0.008716875687241554, "global_step": 13945, "epoch": 117, "lr": 9.138513586256555e-05} +{"train_loss": 0.00534626143053174, "global_step": 13946, "epoch": 117, "lr": 9.13838925514216e-05} +{"train_loss": 0.007276774849742651, "global_step": 13947, "epoch": 117, "lr": 9.13826491590248e-05} +{"train_loss": 0.008890480734407902, "global_step": 13948, "epoch": 117, "lr": 9.138140568537757e-05} +{"train_loss": 0.0049241455271840096, "global_step": 13949, "epoch": 117, "lr": 9.138016213048239e-05} +{"train_loss": 0.006215096917003393, "global_step": 13950, "epoch": 117, "lr": 9.137891849434168e-05} +{"train_loss": 0.0060705034993588924, "global_step": 13951, "epoch": 117, "lr": 9.137767477695788e-05} +{"train_loss": 0.010291693732142448, "global_step": 13952, "epoch": 117, "lr": 9.137643097833344e-05} +{"train_loss": 0.011093365959823132, "global_step": 13953, "epoch": 117, "lr": 9.137518709847079e-05} +{"train_loss": 0.006203073542565107, "global_step": 13954, "epoch": 117, "lr": 9.137394313737238e-05} +{"train_loss": 0.009410685859620571, "global_step": 13955, "epoch": 117, "lr": 9.137269909504067e-05} +{"train_loss": 0.008951662108302116, "global_step": 13956, "epoch": 117, "lr": 9.137145497147807e-05} +{"train_loss": 0.009949743747711182, "global_step": 13957, "epoch": 117, "lr": 9.137021076668704e-05} +{"train_loss": 0.0049123638309538364, "global_step": 13958, "epoch": 117, "lr": 9.136896648067003e-05} +{"train_loss": 0.009901866316795349, "global_step": 13959, "epoch": 117, "lr": 9.136772211342947e-05} +{"train_loss": 0.007404187228530645, "global_step": 13960, "epoch": 117, "lr": 9.136647766496779e-05} +{"train_loss": 0.009476634673774242, "global_step": 13961, "epoch": 117, "lr": 9.136523313528746e-05} +{"train_loss": 0.00847511924803257, "global_step": 13962, "epoch": 117, "lr": 9.136398852439094e-05} +{"train_loss": 0.008455458097159863, "global_step": 13963, "epoch": 117, "lr": 9.136274383228061e-05} +{"train_loss": 0.005723470356315374, "global_step": 13964, "epoch": 117, "lr": 9.136149905895896e-05} +{"train_loss": 0.006067735143005848, "global_step": 13965, "epoch": 117, "lr": 9.136025420442844e-05} +{"train_loss": 0.007374891545623541, "global_step": 13966, "epoch": 117, "lr": 9.135900926869148e-05} +{"train_loss": 0.007552857045084238, "global_step": 13967, "epoch": 117, "lr": 9.135776425175051e-05} +{"train_loss": 0.006404618266969919, "global_step": 13968, "epoch": 117, "lr": 9.1356519153608e-05} +{"train_loss": 0.008046540431678295, "global_step": 13969, "epoch": 117, "lr": 9.135527397426638e-05} +{"train_loss": 0.004208737052977085, "global_step": 13970, "epoch": 117, "lr": 9.135402871372808e-05} +{"train_loss": 0.007900653406977654, "global_step": 13971, "epoch": 117, "lr": 9.13527833719956e-05} +{"train_loss": 0.007439360488206148, "global_step": 13972, "epoch": 117, "lr": 9.135153794907132e-05} +{"train_loss": 0.007564068306237459, "global_step": 13973, "epoch": 117, "lr": 9.135029244495772e-05} +{"train_loss": 0.0038496635388582945, "global_step": 13974, "epoch": 117, "lr": 9.134904685965724e-05} +{"train_loss": 0.006425983272492886, "global_step": 13975, "epoch": 117, "lr": 9.134780119317232e-05} +{"train_loss": 0.013045287691056728, "global_step": 13976, "epoch": 117, "lr": 9.134655544550542e-05} +{"train_loss": 0.005958459805697203, "global_step": 13977, "epoch": 117, "lr": 9.134530961665896e-05} +{"train_loss": 0.008522666059434414, "global_step": 13978, "epoch": 117, "lr": 9.13440637066354e-05} +{"train_loss": 0.009158861823379993, "global_step": 13979, "epoch": 117, "lr": 9.13428177154372e-05} +{"train_loss": 0.007181838620454073, "global_step": 13980, "epoch": 117, "lr": 9.134157164306679e-05} +{"train_loss": 0.004714882001280785, "global_step": 13981, "epoch": 117, "lr": 9.134032548952662e-05} +{"train_loss": 0.0096368920058012, "global_step": 13982, "epoch": 117, "lr": 9.133907925481915e-05} +{"train_loss": 0.006801230367273092, "global_step": 13983, "epoch": 117, "lr": 9.13378329389468e-05} +{"train_loss": 0.006908867508172989, "global_step": 13984, "epoch": 117, "lr": 9.133658654191204e-05} +{"train_loss": 0.007537800818681717, "global_step": 13985, "epoch": 117, "lr": 9.133534006371729e-05} +{"train_loss": 0.007807549089193344, "global_step": 13986, "epoch": 117, "lr": 9.133409350436503e-05} +{"train_loss": 0.005686177872121334, "global_step": 13987, "epoch": 117, "lr": 9.133284686385768e-05} +{"train_loss": 0.00621026661247015, "global_step": 13988, "epoch": 117, "lr": 9.133160014219772e-05} +{"train_loss": 0.008425010368227959, "global_step": 13989, "epoch": 117, "lr": 9.133035333938757e-05} +{"train_loss": 0.008596210740506649, "global_step": 13990, "epoch": 117, "lr": 9.13291064554297e-05} +{"train_loss": 0.006311899516731501, "global_step": 13991, "epoch": 117, "lr": 9.132785949032653e-05} +{"train_loss": 0.006708662956953049, "global_step": 13992, "epoch": 117, "lr": 9.132661244408053e-05} +{"train_loss": 0.006593739148229361, "global_step": 13993, "epoch": 117, "lr": 9.132536531669413e-05} +{"train_loss": 0.006831037346273661, "global_step": 13994, "epoch": 117, "lr": 9.13241181081698e-05} +{"train_loss": 0.006986713502556086, "global_step": 13995, "epoch": 117, "lr": 9.132287081850998e-05} +{"train_loss": 0.004819619935005903, "global_step": 13996, "epoch": 117, "lr": 9.13216234477171e-05} +{"train_loss": 0.007202901877462864, "global_step": 13997, "epoch": 117, "lr": 9.132037599579366e-05} +{"train_loss": 0.006201072596013546, "global_step": 13998, "epoch": 117, "lr": 9.131912846274206e-05} +{"train_loss": 0.008326348848640919, "global_step": 13999, "epoch": 117, "lr": 9.131788084856476e-05} +{"train_loss": 0.008415548130869865, "global_step": 14000, "epoch": 117, "lr": 9.131663315326422e-05} +{"train_loss": 0.006462522782385349, "global_step": 14001, "epoch": 117, "lr": 9.131538537684288e-05} +{"train_loss": 0.007876750081777573, "global_step": 14002, "epoch": 117, "lr": 9.13141375193032e-05} +{"train_loss": 0.005976764485239983, "global_step": 14003, "epoch": 117, "lr": 9.131288958064763e-05} +{"train_loss": 0.006967492867261171, "global_step": 14004, "epoch": 117, "lr": 9.13116415608786e-05} +{"train_loss": 0.005767684895545244, "global_step": 14005, "epoch": 117, "lr": 9.131039345999858e-05} +{"train_loss": 0.004149074200540781, "global_step": 14006, "epoch": 117, "lr": 9.130914527801002e-05} +{"train_loss": 0.006350467447191477, "global_step": 14007, "epoch": 117, "lr": 9.130789701491536e-05} +{"train_loss": 0.009464847855269909, "global_step": 14008, "epoch": 117, "lr": 9.130664867071707e-05} +{"train_loss": 0.008452131412923336, "global_step": 14009, "epoch": 117, "lr": 9.130540024541759e-05} +{"train_loss": 0.010396214202046394, "global_step": 14010, "epoch": 117, "lr": 9.130415173901934e-05} +{"train_loss": 0.0064768013544380665, "global_step": 14011, "epoch": 117, "lr": 9.130290315152483e-05} +{"train_loss": 0.007012993097305298, "global_step": 14012, "epoch": 117, "lr": 9.130165448293649e-05} +{"train_loss": 0.0032133597414940596, "global_step": 14013, "epoch": 117, "lr": 9.130040573325674e-05} +{"train_loss": 0.003328507300466299, "global_step": 14014, "epoch": 117, "lr": 9.129915690248805e-05} +{"train_loss": 0.008664925582706928, "global_step": 14015, "epoch": 117, "lr": 9.12979079906329e-05} +{"train_loss": 0.005896862130612135, "global_step": 14016, "epoch": 117, "lr": 9.129665899769371e-05} +{"train_loss": 0.007215013727545738, "global_step": 14017, "epoch": 117, "lr": 9.129540992367294e-05} +{"train_loss": 0.008101244457066059, "global_step": 14018, "epoch": 117, "lr": 9.129416076857304e-05} +{"train_loss": 0.004832969047129154, "global_step": 14019, "epoch": 117, "lr": 9.129291153239647e-05} +{"train_loss": 0.009315882809460163, "global_step": 14020, "epoch": 117, "lr": 9.129166221514569e-05} +{"train_loss": 0.005274910945445299, "global_step": 14021, "epoch": 117, "lr": 9.129041281682314e-05} +{"train_loss": 0.006244358606636524, "global_step": 14022, "epoch": 117, "lr": 9.128916333743127e-05} +{"train_loss": 0.006861002650111914, "global_step": 14023, "epoch": 117, "lr": 9.128791377697254e-05} +{"train_loss": 0.009179333224892616, "global_step": 14024, "epoch": 117, "lr": 9.12866641354494e-05} +{"train_loss": 0.005056628957390785, "global_step": 14025, "epoch": 117, "lr": 9.128541441286431e-05} +{"train_loss": 0.005909148138016462, "global_step": 14026, "epoch": 117, "lr": 9.128416460921972e-05} +{"train_loss": 0.005355788394808769, "global_step": 14027, "epoch": 117, "lr": 9.128291472451809e-05} +{"train_loss": 0.0057359966449439526, "global_step": 14028, "epoch": 117, "lr": 9.128166475876185e-05} +{"train_loss": 0.011625356040894985, "global_step": 14029, "epoch": 117, "lr": 9.128041471195348e-05} +{"train_loss": 0.01134070847183466, "global_step": 14030, "epoch": 117, "lr": 9.127916458409542e-05} +{"train_loss": 0.007065949961543083, "global_step": 14031, "epoch": 117, "lr": 9.127791437519015e-05} +{"train_loss": 0.008951413445174694, "global_step": 14032, "epoch": 117, "lr": 9.127666408524008e-05} +{"train_loss": 0.00499129481613636, "global_step": 14033, "epoch": 117, "lr": 9.12754137142477e-05} +{"train_loss": 0.0037822930607944727, "global_step": 14034, "epoch": 117, "lr": 9.127416326221547e-05} +{"train_loss": 0.006154985632747412, "global_step": 14035, "epoch": 117, "lr": 9.12729127291458e-05} +{"train_loss": 0.01232120767235756, "global_step": 14036, "epoch": 117, "lr": 9.12716621150412e-05} +{"train_loss": 0.011342083103954792, "global_step": 14037, "epoch": 117, "lr": 9.127041141990408e-05} +{"train_loss": 0.008541323244571686, "global_step": 14038, "epoch": 117, "lr": 9.126916064373694e-05} +{"train_loss": 0.007001911755651236, "global_step": 14039, "epoch": 117, "lr": 9.126790978654221e-05} +{"train_loss": 0.011792032048106194, "global_step": 14040, "epoch": 117, "lr": 9.126665884832232e-05} +{"train_loss": 0.0072930014512243395, "global_step": 14041, "epoch": 117, "lr": 9.126540782907978e-05, "val_loss": 0.01396652776747942} +{"train_loss": 0.006816138047724962, "global_step": 14042, "epoch": 118, "lr": 9.1264156728817e-05} +{"train_loss": 0.009346703067421913, "global_step": 14043, "epoch": 118, "lr": 9.126290554753649e-05} +{"train_loss": 0.008073562756180763, "global_step": 14044, "epoch": 118, "lr": 9.126165428524064e-05} +{"train_loss": 0.012383108027279377, "global_step": 14045, "epoch": 118, "lr": 9.126040294193195e-05} +{"train_loss": 0.006043335888534784, "global_step": 14046, "epoch": 118, "lr": 9.125915151761287e-05} +{"train_loss": 0.009956108406186104, "global_step": 14047, "epoch": 118, "lr": 9.125790001228586e-05} +{"train_loss": 0.007059136871248484, "global_step": 14048, "epoch": 118, "lr": 9.125664842595336e-05} +{"train_loss": 0.0076394593343138695, "global_step": 14049, "epoch": 118, "lr": 9.125539675861786e-05} +{"train_loss": 0.0058671762235462666, "global_step": 14050, "epoch": 118, "lr": 9.125414501028177e-05} +{"train_loss": 0.0072595300152897835, "global_step": 14051, "epoch": 118, "lr": 9.125289318094758e-05} +{"train_loss": 0.01084363367408514, "global_step": 14052, "epoch": 118, "lr": 9.125164127061774e-05} +{"train_loss": 0.006263847928494215, "global_step": 14053, "epoch": 118, "lr": 9.125038927929471e-05} +{"train_loss": 0.009174274280667305, "global_step": 14054, "epoch": 118, "lr": 9.124913720698096e-05} +{"train_loss": 0.0056397938169538975, "global_step": 14055, "epoch": 118, "lr": 9.124788505367892e-05} +{"train_loss": 0.006086899898946285, "global_step": 14056, "epoch": 118, "lr": 9.124663281939107e-05} +{"train_loss": 0.009306807070970535, "global_step": 14057, "epoch": 118, "lr": 9.124538050411986e-05} +{"train_loss": 0.009197223000228405, "global_step": 14058, "epoch": 118, "lr": 9.124412810786775e-05} +{"train_loss": 0.006090512499213219, "global_step": 14059, "epoch": 118, "lr": 9.124287563063723e-05} +{"train_loss": 0.007767908740788698, "global_step": 14060, "epoch": 118, "lr": 9.124162307243069e-05} +{"train_loss": 0.006280671339482069, "global_step": 14061, "epoch": 118, "lr": 9.124037043325066e-05} +{"train_loss": 0.006800622679293156, "global_step": 14062, "epoch": 118, "lr": 9.123911771309955e-05} +{"train_loss": 0.008895153179764748, "global_step": 14063, "epoch": 118, "lr": 9.123786491197983e-05} +{"train_loss": 0.009110953658819199, "global_step": 14064, "epoch": 118, "lr": 9.123661202989399e-05} +{"train_loss": 0.008108647540211678, "global_step": 14065, "epoch": 118, "lr": 9.123535906684446e-05} +{"train_loss": 0.007418977562338114, "global_step": 14066, "epoch": 118, "lr": 9.123410602283372e-05} +{"train_loss": 0.008222401142120361, "global_step": 14067, "epoch": 118, "lr": 9.123285289786419e-05} +{"train_loss": 0.007590129040181637, "global_step": 14068, "epoch": 118, "lr": 9.123159969193837e-05} +{"train_loss": 0.006191525142639875, "global_step": 14069, "epoch": 118, "lr": 9.123034640505871e-05} +{"train_loss": 0.006720838136970997, "global_step": 14070, "epoch": 118, "lr": 9.122909303722767e-05} +{"train_loss": 0.005256214644759893, "global_step": 14071, "epoch": 118, "lr": 9.122783958844771e-05} +{"train_loss": 0.0071634165942668915, "global_step": 14072, "epoch": 118, "lr": 9.12265860587213e-05} +{"train_loss": 0.00854827743023634, "global_step": 14073, "epoch": 118, "lr": 9.122533244805087e-05} +{"train_loss": 0.009213000535964966, "global_step": 14074, "epoch": 118, "lr": 9.122407875643893e-05} +{"train_loss": 0.005722750909626484, "global_step": 14075, "epoch": 118, "lr": 9.12228249838879e-05} +{"train_loss": 0.008755582384765148, "global_step": 14076, "epoch": 118, "lr": 9.122157113040026e-05} +{"train_loss": 0.007040566299110651, "global_step": 14077, "epoch": 118, "lr": 9.122031719597848e-05} +{"train_loss": 0.007191440090537071, "global_step": 14078, "epoch": 118, "lr": 9.121906318062499e-05} +{"train_loss": 0.00604975875467062, "global_step": 14079, "epoch": 118, "lr": 9.12178090843423e-05} +{"train_loss": 0.007433614693582058, "global_step": 14080, "epoch": 118, "lr": 9.121655490713282e-05} +{"train_loss": 0.005368912126868963, "global_step": 14081, "epoch": 118, "lr": 9.121530064899906e-05} +{"train_loss": 0.005235144402831793, "global_step": 14082, "epoch": 118, "lr": 9.121404630994344e-05} +{"train_loss": 0.008357895538210869, "global_step": 14083, "epoch": 118, "lr": 9.121279188996846e-05} +{"train_loss": 0.006276936735957861, "global_step": 14084, "epoch": 118, "lr": 9.121153738907655e-05} +{"train_loss": 0.007271400652825832, "global_step": 14085, "epoch": 118, "lr": 9.12102828072702e-05} +{"train_loss": 0.007442580070346594, "global_step": 14086, "epoch": 118, "lr": 9.120902814455186e-05} +{"train_loss": 0.009828457608819008, "global_step": 14087, "epoch": 118, "lr": 9.120777340092399e-05} +{"train_loss": 0.006768600549548864, "global_step": 14088, "epoch": 118, "lr": 9.120651857638907e-05} +{"train_loss": 0.0077333091758191586, "global_step": 14089, "epoch": 118, "lr": 9.120526367094955e-05} +{"train_loss": 0.006418141070753336, "global_step": 14090, "epoch": 118, "lr": 9.120400868460789e-05} +{"train_loss": 0.012310805730521679, "global_step": 14091, "epoch": 118, "lr": 9.120275361736656e-05} +{"train_loss": 0.007969209924340248, "global_step": 14092, "epoch": 118, "lr": 9.120149846922804e-05} +{"train_loss": 0.006076042540371418, "global_step": 14093, "epoch": 118, "lr": 9.120024324019476e-05} +{"train_loss": 0.006845859345048666, "global_step": 14094, "epoch": 118, "lr": 9.119898793026922e-05} +{"train_loss": 0.007776737213134766, "global_step": 14095, "epoch": 118, "lr": 9.119773253945386e-05} +{"train_loss": 0.006343601271510124, "global_step": 14096, "epoch": 118, "lr": 9.119647706775116e-05} +{"train_loss": 0.008202520199120045, "global_step": 14097, "epoch": 118, "lr": 9.119522151516358e-05} +{"train_loss": 0.0069986190646886826, "global_step": 14098, "epoch": 118, "lr": 9.119396588169358e-05} +{"train_loss": 0.008962217718362808, "global_step": 14099, "epoch": 118, "lr": 9.119271016734361e-05} +{"train_loss": 0.006911971140652895, "global_step": 14100, "epoch": 118, "lr": 9.119145437211619e-05} +{"train_loss": 0.007520618848502636, "global_step": 14101, "epoch": 118, "lr": 9.119019849601372e-05} +{"train_loss": 0.009327737614512444, "global_step": 14102, "epoch": 118, "lr": 9.118894253903872e-05} +{"train_loss": 0.007846202701330185, "global_step": 14103, "epoch": 118, "lr": 9.11876865011936e-05} +{"train_loss": 0.007542154286056757, "global_step": 14104, "epoch": 118, "lr": 9.118643038248088e-05} +{"train_loss": 0.0080526452511549, "global_step": 14105, "epoch": 118, "lr": 9.1185174182903e-05} +{"train_loss": 0.008102646097540855, "global_step": 14106, "epoch": 118, "lr": 9.118391790246244e-05} +{"train_loss": 0.005243625026196241, "global_step": 14107, "epoch": 118, "lr": 9.118266154116164e-05} +{"train_loss": 0.0047175283543765545, "global_step": 14108, "epoch": 118, "lr": 9.118140509900311e-05} +{"train_loss": 0.0055578420870006084, "global_step": 14109, "epoch": 118, "lr": 9.118014857598927e-05} +{"train_loss": 0.008839610032737255, "global_step": 14110, "epoch": 118, "lr": 9.11788919721226e-05} +{"train_loss": 0.006805680692195892, "global_step": 14111, "epoch": 118, "lr": 9.117763528740558e-05} +{"train_loss": 0.006640053354203701, "global_step": 14112, "epoch": 118, "lr": 9.117637852184068e-05} +{"train_loss": 0.009943981654942036, "global_step": 14113, "epoch": 118, "lr": 9.117512167543036e-05} +{"train_loss": 0.00673469016328454, "global_step": 14114, "epoch": 118, "lr": 9.117386474817708e-05} +{"train_loss": 0.007324861828237772, "global_step": 14115, "epoch": 118, "lr": 9.117260774008333e-05} +{"train_loss": 0.004951538983732462, "global_step": 14116, "epoch": 118, "lr": 9.117135065115156e-05} +{"train_loss": 0.008581819012761116, "global_step": 14117, "epoch": 118, "lr": 9.117009348138424e-05} +{"train_loss": 0.0076222773641347885, "global_step": 14118, "epoch": 118, "lr": 9.116883623078383e-05} +{"train_loss": 0.006743472069501877, "global_step": 14119, "epoch": 118, "lr": 9.116757889935281e-05} +{"train_loss": 0.006549314130097628, "global_step": 14120, "epoch": 118, "lr": 9.116632148709365e-05} +{"train_loss": 0.006245697848498821, "global_step": 14121, "epoch": 118, "lr": 9.116506399400882e-05} +{"train_loss": 0.006961027625948191, "global_step": 14122, "epoch": 118, "lr": 9.116380642010078e-05} +{"train_loss": 0.005210025701671839, "global_step": 14123, "epoch": 118, "lr": 9.1162548765372e-05} +{"train_loss": 0.006721866317093372, "global_step": 14124, "epoch": 118, "lr": 9.116129102982496e-05} +{"train_loss": 0.007742833346128464, "global_step": 14125, "epoch": 118, "lr": 9.116003321346212e-05} +{"train_loss": 0.010115590877830982, "global_step": 14126, "epoch": 118, "lr": 9.115877531628596e-05} +{"train_loss": 0.00864703394472599, "global_step": 14127, "epoch": 118, "lr": 9.115751733829892e-05} +{"train_loss": 0.007657310925424099, "global_step": 14128, "epoch": 118, "lr": 9.115625927950351e-05} +{"train_loss": 0.004781952127814293, "global_step": 14129, "epoch": 118, "lr": 9.115500113990217e-05} +{"train_loss": 0.007988253608345985, "global_step": 14130, "epoch": 118, "lr": 9.115374291949739e-05} +{"train_loss": 0.006633122451603413, "global_step": 14131, "epoch": 118, "lr": 9.115248461829163e-05} +{"train_loss": 0.006285309325903654, "global_step": 14132, "epoch": 118, "lr": 9.115122623628738e-05} +{"train_loss": 0.007130492478609085, "global_step": 14133, "epoch": 118, "lr": 9.114996777348707e-05} +{"train_loss": 0.007757915649563074, "global_step": 14134, "epoch": 118, "lr": 9.11487092298932e-05} +{"train_loss": 0.006456885952502489, "global_step": 14135, "epoch": 118, "lr": 9.114745060550824e-05} +{"train_loss": 0.006570516154170036, "global_step": 14136, "epoch": 118, "lr": 9.114619190033465e-05} +{"train_loss": 0.005715810228139162, "global_step": 14137, "epoch": 118, "lr": 9.114493311437492e-05} +{"train_loss": 0.007415091153234243, "global_step": 14138, "epoch": 118, "lr": 9.11436742476315e-05} +{"train_loss": 0.005332873668521643, "global_step": 14139, "epoch": 118, "lr": 9.114241530010687e-05} +{"train_loss": 0.008563514798879623, "global_step": 14140, "epoch": 118, "lr": 9.114115627180351e-05} +{"train_loss": 0.008942178450524807, "global_step": 14141, "epoch": 118, "lr": 9.113989716272388e-05} +{"train_loss": 0.0056413826532661915, "global_step": 14142, "epoch": 118, "lr": 9.113863797287046e-05} +{"train_loss": 0.008957705460488796, "global_step": 14143, "epoch": 118, "lr": 9.113737870224573e-05} +{"train_loss": 0.0049390774220228195, "global_step": 14144, "epoch": 118, "lr": 9.113611935085213e-05} +{"train_loss": 0.0071733915247023106, "global_step": 14145, "epoch": 118, "lr": 9.113485991869217e-05} +{"train_loss": 0.00745071517303586, "global_step": 14146, "epoch": 118, "lr": 9.11336004057683e-05} +{"train_loss": 0.006203899625688791, "global_step": 14147, "epoch": 118, "lr": 9.1132340812083e-05} +{"train_loss": 0.005560498218983412, "global_step": 14148, "epoch": 118, "lr": 9.113108113763875e-05} +{"train_loss": 0.006360708735883236, "global_step": 14149, "epoch": 118, "lr": 9.1129821382438e-05} +{"train_loss": 0.009615100920200348, "global_step": 14150, "epoch": 118, "lr": 9.112856154648326e-05} +{"train_loss": 0.007056122180074453, "global_step": 14151, "epoch": 118, "lr": 9.112730162977698e-05} +{"train_loss": 0.004709823057055473, "global_step": 14152, "epoch": 118, "lr": 9.112604163232164e-05} +{"train_loss": 0.007269155699759722, "global_step": 14153, "epoch": 118, "lr": 9.112478155411968e-05} +{"train_loss": 0.006980263162404299, "global_step": 14154, "epoch": 118, "lr": 9.112352139517363e-05} +{"train_loss": 0.007754568010568619, "global_step": 14155, "epoch": 118, "lr": 9.112226115548595e-05} +{"train_loss": 0.006081381347030401, "global_step": 14156, "epoch": 118, "lr": 9.112100083505908e-05} +{"train_loss": 0.009372573345899582, "global_step": 14157, "epoch": 118, "lr": 9.111974043389553e-05} +{"train_loss": 0.0074487244710326195, "global_step": 14158, "epoch": 118, "lr": 9.111847995199776e-05} +{"train_loss": 0.005660033319145441, "global_step": 14159, "epoch": 118, "lr": 9.111721938936826e-05} +{"train_loss": 0.0073151465881021085, "global_step": 14160, "epoch": 118, "lr": 9.111595874600946e-05, "val_loss": 0.014942271634936333} +{"train_loss": 0.006607115734368563, "global_step": 14161, "epoch": 119, "lr": 9.11146980219239e-05} +{"train_loss": 0.005012190900743008, "global_step": 14162, "epoch": 119, "lr": 9.1113437217114e-05} +{"train_loss": 0.006919868290424347, "global_step": 14163, "epoch": 119, "lr": 9.111217633158229e-05} +{"train_loss": 0.007643850985914469, "global_step": 14164, "epoch": 119, "lr": 9.111091536533118e-05} +{"train_loss": 0.005036661867052317, "global_step": 14165, "epoch": 119, "lr": 9.11096543183632e-05} +{"train_loss": 0.007654719520360231, "global_step": 14166, "epoch": 119, "lr": 9.11083931906808e-05} +{"train_loss": 0.004305127542465925, "global_step": 14167, "epoch": 119, "lr": 9.110713198228646e-05} +{"train_loss": 0.008668321184813976, "global_step": 14168, "epoch": 119, "lr": 9.110587069318266e-05} +{"train_loss": 0.0075612603686749935, "global_step": 14169, "epoch": 119, "lr": 9.110460932337187e-05} +{"train_loss": 0.005038470029830933, "global_step": 14170, "epoch": 119, "lr": 9.110334787285656e-05} +{"train_loss": 0.007404207251966, "global_step": 14171, "epoch": 119, "lr": 9.110208634163924e-05} +{"train_loss": 0.00501398928463459, "global_step": 14172, "epoch": 119, "lr": 9.110082472972237e-05} +{"train_loss": 0.009466026909649372, "global_step": 14173, "epoch": 119, "lr": 9.109956303710841e-05} +{"train_loss": 0.006835405249148607, "global_step": 14174, "epoch": 119, "lr": 9.109830126379984e-05} +{"train_loss": 0.008856547065079212, "global_step": 14175, "epoch": 119, "lr": 9.109703940979914e-05} +{"train_loss": 0.006697122007608414, "global_step": 14176, "epoch": 119, "lr": 9.109577747510882e-05} +{"train_loss": 0.008805698715150356, "global_step": 14177, "epoch": 119, "lr": 9.109451545973131e-05} +{"train_loss": 0.004827695433050394, "global_step": 14178, "epoch": 119, "lr": 9.109325336366912e-05} +{"train_loss": 0.005518049467355013, "global_step": 14179, "epoch": 119, "lr": 9.109199118692472e-05} +{"train_loss": 0.007503717206418514, "global_step": 14180, "epoch": 119, "lr": 9.109072892950056e-05} +{"train_loss": 0.005340973846614361, "global_step": 14181, "epoch": 119, "lr": 9.108946659139919e-05} +{"train_loss": 0.008766948245465755, "global_step": 14182, "epoch": 119, "lr": 9.1088204172623e-05} +{"train_loss": 0.004543856717646122, "global_step": 14183, "epoch": 119, "lr": 9.108694167317452e-05} +{"train_loss": 0.005090939346700907, "global_step": 14184, "epoch": 119, "lr": 9.108567909305623e-05} +{"train_loss": 0.008978555910289288, "global_step": 14185, "epoch": 119, "lr": 9.108441643227061e-05} +{"train_loss": 0.005362180061638355, "global_step": 14186, "epoch": 119, "lr": 9.10831536908201e-05} +{"train_loss": 0.007806976325809956, "global_step": 14187, "epoch": 119, "lr": 9.108189086870722e-05} +{"train_loss": 0.007317989133298397, "global_step": 14188, "epoch": 119, "lr": 9.108062796593444e-05} +{"train_loss": 0.00772311445325613, "global_step": 14189, "epoch": 119, "lr": 9.107936498250422e-05} +{"train_loss": 0.0056668794713914394, "global_step": 14190, "epoch": 119, "lr": 9.107810191841908e-05} +{"train_loss": 0.0076993112452328205, "global_step": 14191, "epoch": 119, "lr": 9.107683877368144e-05} +{"train_loss": 0.007130651269108057, "global_step": 14192, "epoch": 119, "lr": 9.107557554829384e-05} +{"train_loss": 0.005884918849915266, "global_step": 14193, "epoch": 119, "lr": 9.107431224225876e-05} +{"train_loss": 0.006328970659524202, "global_step": 14194, "epoch": 119, "lr": 9.107304885557861e-05} +{"train_loss": 0.008651099167764187, "global_step": 14195, "epoch": 119, "lr": 9.107178538825593e-05} +{"train_loss": 0.004877639934420586, "global_step": 14196, "epoch": 119, "lr": 9.107052184029319e-05} +{"train_loss": 0.006640148349106312, "global_step": 14197, "epoch": 119, "lr": 9.106925821169288e-05} +{"train_loss": 0.005761885549873114, "global_step": 14198, "epoch": 119, "lr": 9.106799450245746e-05} +{"train_loss": 0.006132795941084623, "global_step": 14199, "epoch": 119, "lr": 9.106673071258942e-05} +{"train_loss": 0.008431951515376568, "global_step": 14200, "epoch": 119, "lr": 9.106546684209125e-05} +{"train_loss": 0.00537846190854907, "global_step": 14201, "epoch": 119, "lr": 9.10642028909654e-05} +{"train_loss": 0.004369753412902355, "global_step": 14202, "epoch": 119, "lr": 9.10629388592144e-05} +{"train_loss": 0.005921697244048119, "global_step": 14203, "epoch": 119, "lr": 9.106167474684069e-05} +{"train_loss": 0.011189774610102177, "global_step": 14204, "epoch": 119, "lr": 9.106041055384678e-05} +{"train_loss": 0.004942489787936211, "global_step": 14205, "epoch": 119, "lr": 9.105914628023513e-05} +{"train_loss": 0.006001274101436138, "global_step": 14206, "epoch": 119, "lr": 9.105788192600823e-05} +{"train_loss": 0.009111936204135418, "global_step": 14207, "epoch": 119, "lr": 9.105661749116858e-05} +{"train_loss": 0.007114320062100887, "global_step": 14208, "epoch": 119, "lr": 9.105535297571864e-05} +{"train_loss": 0.009553930722177029, "global_step": 14209, "epoch": 119, "lr": 9.10540883796609e-05} +{"train_loss": 0.005219008307904005, "global_step": 14210, "epoch": 119, "lr": 9.105282370299785e-05} +{"train_loss": 0.005615015514194965, "global_step": 14211, "epoch": 119, "lr": 9.105155894573196e-05} +{"train_loss": 0.006367759313434362, "global_step": 14212, "epoch": 119, "lr": 9.105029410786572e-05} +{"train_loss": 0.005336702335625887, "global_step": 14213, "epoch": 119, "lr": 9.104902918940162e-05} +{"train_loss": 0.005968002136796713, "global_step": 14214, "epoch": 119, "lr": 9.104776419034213e-05} +{"train_loss": 0.005772097501903772, "global_step": 14215, "epoch": 119, "lr": 9.104649911068974e-05} +{"train_loss": 0.006054637022316456, "global_step": 14216, "epoch": 119, "lr": 9.104523395044693e-05} +{"train_loss": 0.00625983951613307, "global_step": 14217, "epoch": 119, "lr": 9.10439687096162e-05} +{"train_loss": 0.0050661214627325535, "global_step": 14218, "epoch": 119, "lr": 9.104270338820001e-05} +{"train_loss": 0.0046868594363331795, "global_step": 14219, "epoch": 119, "lr": 9.104143798620087e-05} +{"train_loss": 0.006729820277541876, "global_step": 14220, "epoch": 119, "lr": 9.104017250362125e-05} +{"train_loss": 0.004312961827963591, "global_step": 14221, "epoch": 119, "lr": 9.103890694046363e-05} +{"train_loss": 0.006349650211632252, "global_step": 14222, "epoch": 119, "lr": 9.10376412967305e-05} +{"train_loss": 0.007862656377255917, "global_step": 14223, "epoch": 119, "lr": 9.103637557242434e-05} +{"train_loss": 0.006724210921674967, "global_step": 14224, "epoch": 119, "lr": 9.103510976754763e-05} +{"train_loss": 0.00483236787840724, "global_step": 14225, "epoch": 119, "lr": 9.10338438821029e-05} +{"train_loss": 0.007872878573834896, "global_step": 14226, "epoch": 119, "lr": 9.103257791609258e-05} +{"train_loss": 0.007005439605563879, "global_step": 14227, "epoch": 119, "lr": 9.103131186951917e-05} +{"train_loss": 0.003182534594088793, "global_step": 14228, "epoch": 119, "lr": 9.103004574238518e-05} +{"train_loss": 0.008587993681430817, "global_step": 14229, "epoch": 119, "lr": 9.102877953469306e-05} +{"train_loss": 0.009674015454947948, "global_step": 14230, "epoch": 119, "lr": 9.102751324644534e-05} +{"train_loss": 0.004910875111818314, "global_step": 14231, "epoch": 119, "lr": 9.102624687764446e-05} +{"train_loss": 0.005668098572641611, "global_step": 14232, "epoch": 119, "lr": 9.102498042829294e-05} +{"train_loss": 0.008165898732841015, "global_step": 14233, "epoch": 119, "lr": 9.102371389839325e-05} +{"train_loss": 0.006136691197752953, "global_step": 14234, "epoch": 119, "lr": 9.102244728794787e-05} +{"train_loss": 0.006243925075978041, "global_step": 14235, "epoch": 119, "lr": 9.102118059695931e-05} +{"train_loss": 0.006356501951813698, "global_step": 14236, "epoch": 119, "lr": 9.101991382543004e-05} +{"train_loss": 0.011483414098620415, "global_step": 14237, "epoch": 119, "lr": 9.101864697336255e-05} +{"train_loss": 0.00624213507398963, "global_step": 14238, "epoch": 119, "lr": 9.101738004075933e-05} +{"train_loss": 0.00927949883043766, "global_step": 14239, "epoch": 119, "lr": 9.101611302762288e-05} +{"train_loss": 0.007918789982795715, "global_step": 14240, "epoch": 119, "lr": 9.101484593395565e-05} +{"train_loss": 0.009254911914467812, "global_step": 14241, "epoch": 119, "lr": 9.101357875976017e-05} +{"train_loss": 0.006803987547755241, "global_step": 14242, "epoch": 119, "lr": 9.10123115050389e-05} +{"train_loss": 0.006588844582438469, "global_step": 14243, "epoch": 119, "lr": 9.101104416979434e-05} +{"train_loss": 0.004949263762682676, "global_step": 14244, "epoch": 119, "lr": 9.100977675402897e-05} +{"train_loss": 0.0072603123262524605, "global_step": 14245, "epoch": 119, "lr": 9.100850925774529e-05} +{"train_loss": 0.009887566789984703, "global_step": 14246, "epoch": 119, "lr": 9.100724168094578e-05} +{"train_loss": 0.007943026721477509, "global_step": 14247, "epoch": 119, "lr": 9.100597402363296e-05} +{"train_loss": 0.008677096106112003, "global_step": 14248, "epoch": 119, "lr": 9.100470628580925e-05} +{"train_loss": 0.005740855820477009, "global_step": 14249, "epoch": 119, "lr": 9.10034384674772e-05} +{"train_loss": 0.008555054664611816, "global_step": 14250, "epoch": 119, "lr": 9.100217056863927e-05} +{"train_loss": 0.005381760653108358, "global_step": 14251, "epoch": 119, "lr": 9.100090258929798e-05} +{"train_loss": 0.010666229762136936, "global_step": 14252, "epoch": 119, "lr": 9.099963452945577e-05} +{"train_loss": 0.007124921772629023, "global_step": 14253, "epoch": 119, "lr": 9.099836638911517e-05} +{"train_loss": 0.009120823815464973, "global_step": 14254, "epoch": 119, "lr": 9.099709816827866e-05} +{"train_loss": 0.00692512933164835, "global_step": 14255, "epoch": 119, "lr": 9.099582986694874e-05} +{"train_loss": 0.008446421474218369, "global_step": 14256, "epoch": 119, "lr": 9.099456148512786e-05} +{"train_loss": 0.007501471787691116, "global_step": 14257, "epoch": 119, "lr": 9.099329302281856e-05} +{"train_loss": 0.010230153799057007, "global_step": 14258, "epoch": 119, "lr": 9.099202448002331e-05} +{"train_loss": 0.007741724606603384, "global_step": 14259, "epoch": 119, "lr": 9.099075585674458e-05} +{"train_loss": 0.00526417838409543, "global_step": 14260, "epoch": 119, "lr": 9.098948715298488e-05} +{"train_loss": 0.007857328280806541, "global_step": 14261, "epoch": 119, "lr": 9.098821836874671e-05} +{"train_loss": 0.006443137302994728, "global_step": 14262, "epoch": 119, "lr": 9.098694950403257e-05} +{"train_loss": 0.005644240882247686, "global_step": 14263, "epoch": 119, "lr": 9.098568055884491e-05} +{"train_loss": 0.009511272422969341, "global_step": 14264, "epoch": 119, "lr": 9.098441153318625e-05} +{"train_loss": 0.0047446428798139095, "global_step": 14265, "epoch": 119, "lr": 9.098314242705907e-05} +{"train_loss": 0.006678951904177666, "global_step": 14266, "epoch": 119, "lr": 9.098187324046589e-05} +{"train_loss": 0.012284642085433006, "global_step": 14267, "epoch": 119, "lr": 9.098060397340917e-05} +{"train_loss": 0.009781340137124062, "global_step": 14268, "epoch": 119, "lr": 9.097933462589139e-05} +{"train_loss": 0.009860276244580746, "global_step": 14269, "epoch": 119, "lr": 9.09780651979151e-05} +{"train_loss": 0.007779004517942667, "global_step": 14270, "epoch": 119, "lr": 9.097679568948274e-05} +{"train_loss": 0.005964041221886873, "global_step": 14271, "epoch": 119, "lr": 9.09755261005968e-05} +{"train_loss": 0.006459442898631096, "global_step": 14272, "epoch": 119, "lr": 9.097425643125983e-05} +{"train_loss": 0.007942628115415573, "global_step": 14273, "epoch": 119, "lr": 9.097298668147427e-05} +{"train_loss": 0.009923933073878288, "global_step": 14274, "epoch": 119, "lr": 9.097171685124261e-05} +{"train_loss": 0.009029608219861984, "global_step": 14275, "epoch": 119, "lr": 9.097044694056738e-05} +{"train_loss": 0.005037066992372274, "global_step": 14276, "epoch": 119, "lr": 9.096917694945105e-05} +{"train_loss": 0.008234510198235512, "global_step": 14277, "epoch": 119, "lr": 9.096790687789611e-05} +{"train_loss": 0.009061750024557114, "global_step": 14278, "epoch": 119, "lr": 9.096663672590508e-05} +{"train_loss": 0.007039601969368318, "global_step": 14279, "epoch": 119, "lr": 9.096536649348041e-05, "val_loss": 0.01401166245341301} +{"train_loss": 0.009507263079285622, "global_step": 14280, "epoch": 120, "lr": 9.096409618062464e-05} +{"train_loss": 0.009506583213806152, "global_step": 14281, "epoch": 120, "lr": 9.096282578734024e-05} +{"train_loss": 0.00801858026534319, "global_step": 14282, "epoch": 120, "lr": 9.096155531362971e-05} +{"train_loss": 0.006426061503589153, "global_step": 14283, "epoch": 120, "lr": 9.096028475949553e-05} +{"train_loss": 0.0086718974635005, "global_step": 14284, "epoch": 120, "lr": 9.095901412494024e-05} +{"train_loss": 0.0068636490032076836, "global_step": 14285, "epoch": 120, "lr": 9.095774340996625e-05} +{"train_loss": 0.007553928066045046, "global_step": 14286, "epoch": 120, "lr": 9.095647261457614e-05} +{"train_loss": 0.006654457189142704, "global_step": 14287, "epoch": 120, "lr": 9.095520173877236e-05} +{"train_loss": 0.006655312143266201, "global_step": 14288, "epoch": 120, "lr": 9.095393078255743e-05} +{"train_loss": 0.00800180621445179, "global_step": 14289, "epoch": 120, "lr": 9.095265974593383e-05} +{"train_loss": 0.006142118014395237, "global_step": 14290, "epoch": 120, "lr": 9.095138862890405e-05} +{"train_loss": 0.00821658130735159, "global_step": 14291, "epoch": 120, "lr": 9.09501174314706e-05} +{"train_loss": 0.005246608983725309, "global_step": 14292, "epoch": 120, "lr": 9.094884615363595e-05} +{"train_loss": 0.0063257114961743355, "global_step": 14293, "epoch": 120, "lr": 9.094757479540264e-05} +{"train_loss": 0.009208550676703453, "global_step": 14294, "epoch": 120, "lr": 9.094630335677313e-05} +{"train_loss": 0.006682972423732281, "global_step": 14295, "epoch": 120, "lr": 9.094503183774992e-05} +{"train_loss": 0.008113935589790344, "global_step": 14296, "epoch": 120, "lr": 9.094376023833553e-05} +{"train_loss": 0.008589227683842182, "global_step": 14297, "epoch": 120, "lr": 9.094248855853243e-05} +{"train_loss": 0.010579933412373066, "global_step": 14298, "epoch": 120, "lr": 9.094121679834314e-05} +{"train_loss": 0.00783228687942028, "global_step": 14299, "epoch": 120, "lr": 9.093994495777013e-05} +{"train_loss": 0.005917471367865801, "global_step": 14300, "epoch": 120, "lr": 9.093867303681591e-05} +{"train_loss": 0.005021698772907257, "global_step": 14301, "epoch": 120, "lr": 9.0937401035483e-05} +{"train_loss": 0.00803445652127266, "global_step": 14302, "epoch": 120, "lr": 9.093612895377386e-05} +{"train_loss": 0.0063971965573728085, "global_step": 14303, "epoch": 120, "lr": 9.0934856791691e-05} +{"train_loss": 0.008691365830600262, "global_step": 14304, "epoch": 120, "lr": 9.093358454923694e-05} +{"train_loss": 0.005244086496531963, "global_step": 14305, "epoch": 120, "lr": 9.093231222641415e-05} +{"train_loss": 0.010036645457148552, "global_step": 14306, "epoch": 120, "lr": 9.093103982322512e-05} +{"train_loss": 0.005968052428215742, "global_step": 14307, "epoch": 120, "lr": 9.09297673396724e-05} +{"train_loss": 0.005942074581980705, "global_step": 14308, "epoch": 120, "lr": 9.092849477575844e-05} +{"train_loss": 0.006054589059203863, "global_step": 14309, "epoch": 120, "lr": 9.092722213148575e-05} +{"train_loss": 0.00585932144895196, "global_step": 14310, "epoch": 120, "lr": 9.092594940685683e-05} +{"train_loss": 0.01000417023897171, "global_step": 14311, "epoch": 120, "lr": 9.092467660187418e-05} +{"train_loss": 0.006483760662376881, "global_step": 14312, "epoch": 120, "lr": 9.092340371654031e-05} +{"train_loss": 0.007916014641523361, "global_step": 14313, "epoch": 120, "lr": 9.09221307508577e-05} +{"train_loss": 0.007321970537304878, "global_step": 14314, "epoch": 120, "lr": 9.092085770482886e-05} +{"train_loss": 0.006336255930364132, "global_step": 14315, "epoch": 120, "lr": 9.091958457845628e-05} +{"train_loss": 0.006915566511452198, "global_step": 14316, "epoch": 120, "lr": 9.091831137174249e-05} +{"train_loss": 0.005549784284085035, "global_step": 14317, "epoch": 120, "lr": 9.091703808468994e-05} +{"train_loss": 0.008360788226127625, "global_step": 14318, "epoch": 120, "lr": 9.091576471730118e-05} +{"train_loss": 0.006760928779840469, "global_step": 14319, "epoch": 120, "lr": 9.091449126957868e-05} +{"train_loss": 0.005485559348016977, "global_step": 14320, "epoch": 120, "lr": 9.091321774152495e-05} +{"train_loss": 0.006430535111576319, "global_step": 14321, "epoch": 120, "lr": 9.091194413314247e-05} +{"train_loss": 0.008882234804332256, "global_step": 14322, "epoch": 120, "lr": 9.091067044443377e-05} +{"train_loss": 0.007463307585567236, "global_step": 14323, "epoch": 120, "lr": 9.090939667540135e-05} +{"train_loss": 0.006281169131398201, "global_step": 14324, "epoch": 120, "lr": 9.090812282604768e-05} +{"train_loss": 0.005554933566600084, "global_step": 14325, "epoch": 120, "lr": 9.09068488963753e-05} +{"train_loss": 0.0069536129012703896, "global_step": 14326, "epoch": 120, "lr": 9.090557488638668e-05} +{"train_loss": 0.00692699896171689, "global_step": 14327, "epoch": 120, "lr": 9.090430079608434e-05} +{"train_loss": 0.0068288445472717285, "global_step": 14328, "epoch": 120, "lr": 9.090302662547077e-05} +{"train_loss": 0.006781017407774925, "global_step": 14329, "epoch": 120, "lr": 9.090175237454848e-05} +{"train_loss": 0.010677825659513474, "global_step": 14330, "epoch": 120, "lr": 9.090047804331996e-05} +{"train_loss": 0.005424877628684044, "global_step": 14331, "epoch": 120, "lr": 9.089920363178774e-05} +{"train_loss": 0.010332413017749786, "global_step": 14332, "epoch": 120, "lr": 9.08979291399543e-05} +{"train_loss": 0.0109612587839365, "global_step": 14333, "epoch": 120, "lr": 9.089665456782214e-05} +{"train_loss": 0.0033854686189442873, "global_step": 14334, "epoch": 120, "lr": 9.089537991539376e-05} +{"train_loss": 0.011569637805223465, "global_step": 14335, "epoch": 120, "lr": 9.089410518267167e-05} +{"train_loss": 0.00620060320943594, "global_step": 14336, "epoch": 120, "lr": 9.089283036965839e-05} +{"train_loss": 0.005093812942504883, "global_step": 14337, "epoch": 120, "lr": 9.08915554763564e-05} +{"train_loss": 0.008574584499001503, "global_step": 14338, "epoch": 120, "lr": 9.08902805027682e-05} +{"train_loss": 0.008973795920610428, "global_step": 14339, "epoch": 120, "lr": 9.088900544889632e-05} +{"train_loss": 0.006738861091434956, "global_step": 14340, "epoch": 120, "lr": 9.088773031474322e-05} +{"train_loss": 0.006040052976459265, "global_step": 14341, "epoch": 120, "lr": 9.088645510031144e-05} +{"train_loss": 0.01180869247764349, "global_step": 14342, "epoch": 120, "lr": 9.088517980560349e-05} +{"train_loss": 0.009351551532745361, "global_step": 14343, "epoch": 120, "lr": 9.088390443062184e-05} +{"train_loss": 0.0038282382301986217, "global_step": 14344, "epoch": 120, "lr": 9.088262897536901e-05} +{"train_loss": 0.008646378293633461, "global_step": 14345, "epoch": 120, "lr": 9.088135343984751e-05} +{"train_loss": 0.007406070828437805, "global_step": 14346, "epoch": 120, "lr": 9.088007782405986e-05} +{"train_loss": 0.006900027859956026, "global_step": 14347, "epoch": 120, "lr": 9.087880212800853e-05} +{"train_loss": 0.008729781955480576, "global_step": 14348, "epoch": 120, "lr": 9.087752635169602e-05} +{"train_loss": 0.008472859859466553, "global_step": 14349, "epoch": 120, "lr": 9.087625049512488e-05} +{"train_loss": 0.006135755684226751, "global_step": 14350, "epoch": 120, "lr": 9.087497455829758e-05} +{"train_loss": 0.006167855579406023, "global_step": 14351, "epoch": 120, "lr": 9.087369854121663e-05} +{"train_loss": 0.00920841470360756, "global_step": 14352, "epoch": 120, "lr": 9.087242244388454e-05} +{"train_loss": 0.006504429504275322, "global_step": 14353, "epoch": 120, "lr": 9.087114626630382e-05} +{"train_loss": 0.006881433539092541, "global_step": 14354, "epoch": 120, "lr": 9.086987000847698e-05} +{"train_loss": 0.004351811483502388, "global_step": 14355, "epoch": 120, "lr": 9.086859367040649e-05} +{"train_loss": 0.014631688594818115, "global_step": 14356, "epoch": 120, "lr": 9.086731725209492e-05} +{"train_loss": 0.006320339627563953, "global_step": 14357, "epoch": 120, "lr": 9.086604075354471e-05} +{"train_loss": 0.0052046640776097775, "global_step": 14358, "epoch": 120, "lr": 9.08647641747584e-05} +{"train_loss": 0.00783742405474186, "global_step": 14359, "epoch": 120, "lr": 9.08634875157385e-05} +{"train_loss": 0.00897417962551117, "global_step": 14360, "epoch": 120, "lr": 9.08622107764875e-05} +{"train_loss": 0.008629417978227139, "global_step": 14361, "epoch": 120, "lr": 9.086093395700792e-05} +{"train_loss": 0.007705341093242168, "global_step": 14362, "epoch": 120, "lr": 9.085965705730225e-05} +{"train_loss": 0.0070744287222623825, "global_step": 14363, "epoch": 120, "lr": 9.085838007737302e-05} +{"train_loss": 0.004999249242246151, "global_step": 14364, "epoch": 120, "lr": 9.085710301722272e-05} +{"train_loss": 0.005995089653879404, "global_step": 14365, "epoch": 120, "lr": 9.085582587685387e-05} +{"train_loss": 0.0064765578135848045, "global_step": 14366, "epoch": 120, "lr": 9.085454865626897e-05} +{"train_loss": 0.004220400005578995, "global_step": 14367, "epoch": 120, "lr": 9.085327135547052e-05} +{"train_loss": 0.009544750675559044, "global_step": 14368, "epoch": 120, "lr": 9.085199397446104e-05} +{"train_loss": 0.006520326714962721, "global_step": 14369, "epoch": 120, "lr": 9.085071651324302e-05} +{"train_loss": 0.006935576442629099, "global_step": 14370, "epoch": 120, "lr": 9.084943897181902e-05} +{"train_loss": 0.006111965514719486, "global_step": 14371, "epoch": 120, "lr": 9.084816135019148e-05} +{"train_loss": 0.006158430594950914, "global_step": 14372, "epoch": 120, "lr": 9.084688364836294e-05} +{"train_loss": 0.010977673344314098, "global_step": 14373, "epoch": 120, "lr": 9.084560586633593e-05} +{"train_loss": 0.004832891281694174, "global_step": 14374, "epoch": 120, "lr": 9.084432800411291e-05} +{"train_loss": 0.008394359610974789, "global_step": 14375, "epoch": 120, "lr": 9.084305006169642e-05} +{"train_loss": 0.005733133293688297, "global_step": 14376, "epoch": 120, "lr": 9.084177203908897e-05} +{"train_loss": 0.009034893475472927, "global_step": 14377, "epoch": 120, "lr": 9.084049393629308e-05} +{"train_loss": 0.009268274530768394, "global_step": 14378, "epoch": 120, "lr": 9.083921575331123e-05} +{"train_loss": 0.008173624984920025, "global_step": 14379, "epoch": 120, "lr": 9.083793749014594e-05} +{"train_loss": 0.008669383823871613, "global_step": 14380, "epoch": 120, "lr": 9.08366591467997e-05} +{"train_loss": 0.007435349281877279, "global_step": 14381, "epoch": 120, "lr": 9.083538072327508e-05} +{"train_loss": 0.006206853780895472, "global_step": 14382, "epoch": 120, "lr": 9.083410221957455e-05} +{"train_loss": 0.007172965444624424, "global_step": 14383, "epoch": 120, "lr": 9.08328236357006e-05} +{"train_loss": 0.00791134126484394, "global_step": 14384, "epoch": 120, "lr": 9.083154497165579e-05} +{"train_loss": 0.007632930763065815, "global_step": 14385, "epoch": 120, "lr": 9.083026622744257e-05} +{"train_loss": 0.007021795958280563, "global_step": 14386, "epoch": 120, "lr": 9.082898740306352e-05} +{"train_loss": 0.007315078750252724, "global_step": 14387, "epoch": 120, "lr": 9.082770849852108e-05} +{"train_loss": 0.006697384640574455, "global_step": 14388, "epoch": 120, "lr": 9.082642951381782e-05} +{"train_loss": 0.007514298427850008, "global_step": 14389, "epoch": 120, "lr": 9.082515044895623e-05} +{"train_loss": 0.008362935855984688, "global_step": 14390, "epoch": 120, "lr": 9.082387130393881e-05} +{"train_loss": 0.011802548542618752, "global_step": 14391, "epoch": 120, "lr": 9.082259207876807e-05} +{"train_loss": 0.0042156800627708435, "global_step": 14392, "epoch": 120, "lr": 9.082131277344654e-05} +{"train_loss": 0.004819369874894619, "global_step": 14393, "epoch": 120, "lr": 9.082003338797674e-05} +{"train_loss": 0.006522899493575096, "global_step": 14394, "epoch": 120, "lr": 9.081875392236114e-05} +{"train_loss": 0.007284573279321194, "global_step": 14395, "epoch": 120, "lr": 9.08174743766023e-05} +{"train_loss": 0.004652892239391804, "global_step": 14396, "epoch": 120, "lr": 9.081619475070269e-05} +{"train_loss": 0.0098373182117939, "global_step": 14397, "epoch": 120, "lr": 9.081491504466485e-05} +{"train_loss": 0.007371977854034856, "global_step": 14398, "epoch": 120, "lr": 9.081363525849129e-05, "val_loss": 0.014596923254430294, "train_action_mse_error": 0.00021379507961682975} +{"train_loss": 0.008540894836187363, "global_step": 14399, "epoch": 121, "lr": 9.081235539218451e-05} +{"train_loss": 0.009831300005316734, "global_step": 14400, "epoch": 121, "lr": 9.081107544574703e-05} +{"train_loss": 0.006159386597573757, "global_step": 14401, "epoch": 121, "lr": 9.080979541918137e-05} +{"train_loss": 0.008165424689650536, "global_step": 14402, "epoch": 121, "lr": 9.080851531249004e-05} +{"train_loss": 0.007413110695779324, "global_step": 14403, "epoch": 121, "lr": 9.080723512567553e-05} +{"train_loss": 0.0046334778890013695, "global_step": 14404, "epoch": 121, "lr": 9.08059548587404e-05} +{"train_loss": 0.006946998182684183, "global_step": 14405, "epoch": 121, "lr": 9.080467451168711e-05} +{"train_loss": 0.00901851337403059, "global_step": 14406, "epoch": 121, "lr": 9.080339408451822e-05} +{"train_loss": 0.00851946510374546, "global_step": 14407, "epoch": 121, "lr": 9.080211357723623e-05} +{"train_loss": 0.008829236030578613, "global_step": 14408, "epoch": 121, "lr": 9.080083298984363e-05} +{"train_loss": 0.008347010239958763, "global_step": 14409, "epoch": 121, "lr": 9.079955232234297e-05} +{"train_loss": 0.006713866256177425, "global_step": 14410, "epoch": 121, "lr": 9.079827157473673e-05} +{"train_loss": 0.007044801022857428, "global_step": 14411, "epoch": 121, "lr": 9.079699074702746e-05} +{"train_loss": 0.006222504656761885, "global_step": 14412, "epoch": 121, "lr": 9.079570983921764e-05} +{"train_loss": 0.00785846821963787, "global_step": 14413, "epoch": 121, "lr": 9.079442885130982e-05} +{"train_loss": 0.0076208277605473995, "global_step": 14414, "epoch": 121, "lr": 9.079314778330648e-05} +{"train_loss": 0.006081364117562771, "global_step": 14415, "epoch": 121, "lr": 9.079186663521016e-05} +{"train_loss": 0.005153072532266378, "global_step": 14416, "epoch": 121, "lr": 9.079058540702337e-05} +{"train_loss": 0.006438515614718199, "global_step": 14417, "epoch": 121, "lr": 9.078930409874861e-05} +{"train_loss": 0.006051527336239815, "global_step": 14418, "epoch": 121, "lr": 9.078802271038845e-05} +{"train_loss": 0.006923665292561054, "global_step": 14419, "epoch": 121, "lr": 9.078674124194533e-05} +{"train_loss": 0.008397789672017097, "global_step": 14420, "epoch": 121, "lr": 9.07854596934218e-05} +{"train_loss": 0.0072975619696080685, "global_step": 14421, "epoch": 121, "lr": 9.078417806482038e-05} +{"train_loss": 0.005381763447076082, "global_step": 14422, "epoch": 121, "lr": 9.078289635614359e-05} +{"train_loss": 0.007101556286215782, "global_step": 14423, "epoch": 121, "lr": 9.078161456739393e-05} +{"train_loss": 0.006699227262288332, "global_step": 14424, "epoch": 121, "lr": 9.078033269857394e-05} +{"train_loss": 0.005149466916918755, "global_step": 14425, "epoch": 121, "lr": 9.077905074968612e-05} +{"train_loss": 0.009375374764204025, "global_step": 14426, "epoch": 121, "lr": 9.077776872073299e-05} +{"train_loss": 0.012482982128858566, "global_step": 14427, "epoch": 121, "lr": 9.077648661171707e-05} +{"train_loss": 0.00746069336310029, "global_step": 14428, "epoch": 121, "lr": 9.077520442264087e-05} +{"train_loss": 0.006601931992918253, "global_step": 14429, "epoch": 121, "lr": 9.077392215350691e-05} +{"train_loss": 0.005897692870348692, "global_step": 14430, "epoch": 121, "lr": 9.077263980431771e-05} +{"train_loss": 0.005862551275640726, "global_step": 14431, "epoch": 121, "lr": 9.07713573750758e-05} +{"train_loss": 0.008332861587405205, "global_step": 14432, "epoch": 121, "lr": 9.077007486578367e-05} +{"train_loss": 0.005113614723086357, "global_step": 14433, "epoch": 121, "lr": 9.076879227644385e-05} +{"train_loss": 0.006741761229932308, "global_step": 14434, "epoch": 121, "lr": 9.076750960705888e-05} +{"train_loss": 0.005646154750138521, "global_step": 14435, "epoch": 121, "lr": 9.076622685763125e-05} +{"train_loss": 0.005277582444250584, "global_step": 14436, "epoch": 121, "lr": 9.076494402816349e-05} +{"train_loss": 0.007022468373179436, "global_step": 14437, "epoch": 121, "lr": 9.076366111865812e-05} +{"train_loss": 0.00913195125758648, "global_step": 14438, "epoch": 121, "lr": 9.076237812911765e-05} +{"train_loss": 0.008762633427977562, "global_step": 14439, "epoch": 121, "lr": 9.076109505954462e-05} +{"train_loss": 0.003759626531973481, "global_step": 14440, "epoch": 121, "lr": 9.075981190994153e-05} +{"train_loss": 0.008041609078645706, "global_step": 14441, "epoch": 121, "lr": 9.075852868031089e-05} +{"train_loss": 0.009021144360303879, "global_step": 14442, "epoch": 121, "lr": 9.075724537065524e-05} +{"train_loss": 0.007686587981879711, "global_step": 14443, "epoch": 121, "lr": 9.07559619809771e-05} +{"train_loss": 0.011401415802538395, "global_step": 14444, "epoch": 121, "lr": 9.075467851127897e-05} +{"train_loss": 0.010934827849268913, "global_step": 14445, "epoch": 121, "lr": 9.07533949615634e-05} +{"train_loss": 0.006205956917256117, "global_step": 14446, "epoch": 121, "lr": 9.075211133183287e-05} +{"train_loss": 0.006093490403145552, "global_step": 14447, "epoch": 121, "lr": 9.075082762208996e-05} +{"train_loss": 0.006519373971968889, "global_step": 14448, "epoch": 121, "lr": 9.074954383233711e-05} +{"train_loss": 0.006890189368277788, "global_step": 14449, "epoch": 121, "lr": 9.074825996257692e-05} +{"train_loss": 0.007951853796839714, "global_step": 14450, "epoch": 121, "lr": 9.074697601281186e-05} +{"train_loss": 0.005497824866324663, "global_step": 14451, "epoch": 121, "lr": 9.074569198304446e-05} +{"train_loss": 0.00810418650507927, "global_step": 14452, "epoch": 121, "lr": 9.074440787327725e-05} +{"train_loss": 0.007088550832122564, "global_step": 14453, "epoch": 121, "lr": 9.074312368351274e-05} +{"train_loss": 0.008460268378257751, "global_step": 14454, "epoch": 121, "lr": 9.074183941375348e-05} +{"train_loss": 0.005696759093552828, "global_step": 14455, "epoch": 121, "lr": 9.074055506400197e-05} +{"train_loss": 0.005755542777478695, "global_step": 14456, "epoch": 121, "lr": 9.073927063426072e-05} +{"train_loss": 0.009840033948421478, "global_step": 14457, "epoch": 121, "lr": 9.073798612453226e-05} +{"train_loss": 0.008113480173051357, "global_step": 14458, "epoch": 121, "lr": 9.073670153481912e-05} +{"train_loss": 0.006639434490352869, "global_step": 14459, "epoch": 121, "lr": 9.073541686512382e-05} +{"train_loss": 0.00852870475500822, "global_step": 14460, "epoch": 121, "lr": 9.073413211544887e-05} +{"train_loss": 0.006286384537816048, "global_step": 14461, "epoch": 121, "lr": 9.073284728579683e-05} +{"train_loss": 0.007869861088693142, "global_step": 14462, "epoch": 121, "lr": 9.073156237617019e-05} +{"train_loss": 0.00942162610590458, "global_step": 14463, "epoch": 121, "lr": 9.073027738657147e-05} +{"train_loss": 0.008351072669029236, "global_step": 14464, "epoch": 121, "lr": 9.07289923170032e-05} +{"train_loss": 0.00691539840772748, "global_step": 14465, "epoch": 121, "lr": 9.07277071674679e-05} +{"train_loss": 0.0066245486959815025, "global_step": 14466, "epoch": 121, "lr": 9.072642193796811e-05} +{"train_loss": 0.004810751415789127, "global_step": 14467, "epoch": 121, "lr": 9.072513662850634e-05} +{"train_loss": 0.006415588781237602, "global_step": 14468, "epoch": 121, "lr": 9.072385123908511e-05} +{"train_loss": 0.006992486771196127, "global_step": 14469, "epoch": 121, "lr": 9.072256576970695e-05} +{"train_loss": 0.00696702441200614, "global_step": 14470, "epoch": 121, "lr": 9.072128022037438e-05} +{"train_loss": 0.005989959929138422, "global_step": 14471, "epoch": 121, "lr": 9.071999459108994e-05} +{"train_loss": 0.010119568556547165, "global_step": 14472, "epoch": 121, "lr": 9.071870888185612e-05} +{"train_loss": 0.007748464588075876, "global_step": 14473, "epoch": 121, "lr": 9.071742309267548e-05} +{"train_loss": 0.0059216939844191074, "global_step": 14474, "epoch": 121, "lr": 9.071613722355053e-05} +{"train_loss": 0.008394798263907433, "global_step": 14475, "epoch": 121, "lr": 9.071485127448379e-05} +{"train_loss": 0.006925825960934162, "global_step": 14476, "epoch": 121, "lr": 9.07135652454778e-05} +{"train_loss": 0.008280006237328053, "global_step": 14477, "epoch": 121, "lr": 9.071227913653506e-05} +{"train_loss": 0.006405482534319162, "global_step": 14478, "epoch": 121, "lr": 9.071099294765811e-05} +{"train_loss": 0.004918839316815138, "global_step": 14479, "epoch": 121, "lr": 9.070970667884949e-05} +{"train_loss": 0.009436055086553097, "global_step": 14480, "epoch": 121, "lr": 9.070842033011169e-05} +{"train_loss": 0.008712902665138245, "global_step": 14481, "epoch": 121, "lr": 9.070713390144727e-05} +{"train_loss": 0.011643050238490105, "global_step": 14482, "epoch": 121, "lr": 9.070584739285873e-05} +{"train_loss": 0.011652274057269096, "global_step": 14483, "epoch": 121, "lr": 9.070456080434862e-05} +{"train_loss": 0.005524650681763887, "global_step": 14484, "epoch": 121, "lr": 9.070327413591944e-05} +{"train_loss": 0.005470959469676018, "global_step": 14485, "epoch": 121, "lr": 9.070198738757373e-05} +{"train_loss": 0.007437561638653278, "global_step": 14486, "epoch": 121, "lr": 9.070070055931403e-05} +{"train_loss": 0.008691903203725815, "global_step": 14487, "epoch": 121, "lr": 9.069941365114285e-05} +{"train_loss": 0.00857782643288374, "global_step": 14488, "epoch": 121, "lr": 9.06981266630627e-05} +{"train_loss": 0.006244507618248463, "global_step": 14489, "epoch": 121, "lr": 9.069683959507615e-05} +{"train_loss": 0.006973935291171074, "global_step": 14490, "epoch": 121, "lr": 9.06955524471857e-05} +{"train_loss": 0.012150327675044537, "global_step": 14491, "epoch": 121, "lr": 9.069426521939387e-05} +{"train_loss": 0.006518927402794361, "global_step": 14492, "epoch": 121, "lr": 9.06929779117032e-05} +{"train_loss": 0.012669982388615608, "global_step": 14493, "epoch": 121, "lr": 9.069169052411623e-05} +{"train_loss": 0.006140352226793766, "global_step": 14494, "epoch": 121, "lr": 9.069040305663546e-05} +{"train_loss": 0.006354385055601597, "global_step": 14495, "epoch": 121, "lr": 9.068911550926342e-05} +{"train_loss": 0.0059736985713243484, "global_step": 14496, "epoch": 121, "lr": 9.068782788200268e-05} +{"train_loss": 0.008871559053659439, "global_step": 14497, "epoch": 121, "lr": 9.068654017485571e-05} +{"train_loss": 0.011637968942523003, "global_step": 14498, "epoch": 121, "lr": 9.068525238782507e-05} +{"train_loss": 0.0049437265843153, "global_step": 14499, "epoch": 121, "lr": 9.068396452091328e-05} +{"train_loss": 0.008302973583340645, "global_step": 14500, "epoch": 121, "lr": 9.068267657412288e-05} +{"train_loss": 0.007317895535379648, "global_step": 14501, "epoch": 121, "lr": 9.068138854745638e-05} +{"train_loss": 0.009209897369146347, "global_step": 14502, "epoch": 121, "lr": 9.068010044091633e-05} +{"train_loss": 0.010046765208244324, "global_step": 14503, "epoch": 121, "lr": 9.067881225450525e-05} +{"train_loss": 0.008444796316325665, "global_step": 14504, "epoch": 121, "lr": 9.067752398822567e-05} +{"train_loss": 0.005446579772979021, "global_step": 14505, "epoch": 121, "lr": 9.06762356420801e-05} +{"train_loss": 0.0083867646753788, "global_step": 14506, "epoch": 121, "lr": 9.06749472160711e-05} +{"train_loss": 0.0074942163191735744, "global_step": 14507, "epoch": 121, "lr": 9.067365871020119e-05} +{"train_loss": 0.005804621148854494, "global_step": 14508, "epoch": 121, "lr": 9.067237012447289e-05} +{"train_loss": 0.007893568836152554, "global_step": 14509, "epoch": 121, "lr": 9.067108145888875e-05} +{"train_loss": 0.010777630843222141, "global_step": 14510, "epoch": 121, "lr": 9.066979271345127e-05} +{"train_loss": 0.008572803810238838, "global_step": 14511, "epoch": 121, "lr": 9.066850388816301e-05} +{"train_loss": 0.008410348556935787, "global_step": 14512, "epoch": 121, "lr": 9.066721498302649e-05} +{"train_loss": 0.005317600443959236, "global_step": 14513, "epoch": 121, "lr": 9.066592599804422e-05} +{"train_loss": 0.007214399520307779, "global_step": 14514, "epoch": 121, "lr": 9.066463693321876e-05} +{"train_loss": 0.006901035085320473, "global_step": 14515, "epoch": 121, "lr": 9.06633477885526e-05} +{"train_loss": 0.010397407226264477, "global_step": 14516, "epoch": 121, "lr": 9.066205856404835e-05} +{"train_loss": 0.007559173734576888, "global_step": 14517, "epoch": 121, "lr": 9.066076925970847e-05, "val_loss": 0.012519975192844868} +{"train_loss": 0.006940687540918589, "global_step": 14518, "epoch": 122, "lr": 9.065947987553551e-05} +{"train_loss": 0.008270464837551117, "global_step": 14519, "epoch": 122, "lr": 9.065819041153201e-05} +{"train_loss": 0.00871297437697649, "global_step": 14520, "epoch": 122, "lr": 9.065690086770049e-05} +{"train_loss": 0.008006269112229347, "global_step": 14521, "epoch": 122, "lr": 9.065561124404349e-05} +{"train_loss": 0.008011355064809322, "global_step": 14522, "epoch": 122, "lr": 9.065432154056355e-05} +{"train_loss": 0.0065550548024475574, "global_step": 14523, "epoch": 122, "lr": 9.065303175726319e-05} +{"train_loss": 0.012133303098380566, "global_step": 14524, "epoch": 122, "lr": 9.065174189414494e-05} +{"train_loss": 0.007562961429357529, "global_step": 14525, "epoch": 122, "lr": 9.065045195121134e-05} +{"train_loss": 0.008921962231397629, "global_step": 14526, "epoch": 122, "lr": 9.064916192846492e-05} +{"train_loss": 0.008641974069178104, "global_step": 14527, "epoch": 122, "lr": 9.064787182590822e-05} +{"train_loss": 0.009452692233026028, "global_step": 14528, "epoch": 122, "lr": 9.064658164354377e-05} +{"train_loss": 0.009710537269711494, "global_step": 14529, "epoch": 122, "lr": 9.064529138137408e-05} +{"train_loss": 0.007963677868247032, "global_step": 14530, "epoch": 122, "lr": 9.064400103940171e-05} +{"train_loss": 0.0059807091020047665, "global_step": 14531, "epoch": 122, "lr": 9.064271061762918e-05} +{"train_loss": 0.007243060972541571, "global_step": 14532, "epoch": 122, "lr": 9.064142011605905e-05} +{"train_loss": 0.006203954108059406, "global_step": 14533, "epoch": 122, "lr": 9.064012953469382e-05} +{"train_loss": 0.00807077158242464, "global_step": 14534, "epoch": 122, "lr": 9.063883887353603e-05} +{"train_loss": 0.005962105002254248, "global_step": 14535, "epoch": 122, "lr": 9.063754813258823e-05} +{"train_loss": 0.01046411506831646, "global_step": 14536, "epoch": 122, "lr": 9.063625731185295e-05} +{"train_loss": 0.006326337810605764, "global_step": 14537, "epoch": 122, "lr": 9.063496641133273e-05} +{"train_loss": 0.005845650564879179, "global_step": 14538, "epoch": 122, "lr": 9.063367543103007e-05} +{"train_loss": 0.005954362917691469, "global_step": 14539, "epoch": 122, "lr": 9.063238437094754e-05} +{"train_loss": 0.010165718384087086, "global_step": 14540, "epoch": 122, "lr": 9.063109323108767e-05} +{"train_loss": 0.007188660092651844, "global_step": 14541, "epoch": 122, "lr": 9.062980201145298e-05} +{"train_loss": 0.0069251880049705505, "global_step": 14542, "epoch": 122, "lr": 9.062851071204602e-05} +{"train_loss": 0.007255390752106905, "global_step": 14543, "epoch": 122, "lr": 9.062721933286932e-05} +{"train_loss": 0.007759834639728069, "global_step": 14544, "epoch": 122, "lr": 9.06259278739254e-05} +{"train_loss": 0.008274812251329422, "global_step": 14545, "epoch": 122, "lr": 9.062463633521684e-05} +{"train_loss": 0.004606619477272034, "global_step": 14546, "epoch": 122, "lr": 9.062334471674613e-05} +{"train_loss": 0.010391084477305412, "global_step": 14547, "epoch": 122, "lr": 9.062205301851582e-05} +{"train_loss": 0.012570757418870926, "global_step": 14548, "epoch": 122, "lr": 9.062076124052845e-05} +{"train_loss": 0.008638341911137104, "global_step": 14549, "epoch": 122, "lr": 9.061946938278655e-05} +{"train_loss": 0.007137425243854523, "global_step": 14550, "epoch": 122, "lr": 9.061817744529269e-05} +{"train_loss": 0.007891972549259663, "global_step": 14551, "epoch": 122, "lr": 9.061688542804935e-05} +{"train_loss": 0.011671499349176884, "global_step": 14552, "epoch": 122, "lr": 9.061559333105909e-05} +{"train_loss": 0.00533507252112031, "global_step": 14553, "epoch": 122, "lr": 9.061430115432448e-05} +{"train_loss": 0.005743131507188082, "global_step": 14554, "epoch": 122, "lr": 9.0613008897848e-05} +{"train_loss": 0.010708119720220566, "global_step": 14555, "epoch": 122, "lr": 9.061171656163223e-05} +{"train_loss": 0.006719239987432957, "global_step": 14556, "epoch": 122, "lr": 9.061042414567968e-05} +{"train_loss": 0.005417981185019016, "global_step": 14557, "epoch": 122, "lr": 9.060913164999292e-05} +{"train_loss": 0.007273706141859293, "global_step": 14558, "epoch": 122, "lr": 9.060783907457446e-05} +{"train_loss": 0.008816915564239025, "global_step": 14559, "epoch": 122, "lr": 9.060654641942686e-05} +{"train_loss": 0.006561591289937496, "global_step": 14560, "epoch": 122, "lr": 9.060525368455262e-05} +{"train_loss": 0.006478950846940279, "global_step": 14561, "epoch": 122, "lr": 9.060396086995431e-05} +{"train_loss": 0.008512563072144985, "global_step": 14562, "epoch": 122, "lr": 9.060266797563447e-05} +{"train_loss": 0.008562302216887474, "global_step": 14563, "epoch": 122, "lr": 9.060137500159562e-05} +{"train_loss": 0.006488686427474022, "global_step": 14564, "epoch": 122, "lr": 9.060008194784031e-05} +{"train_loss": 0.005844722967594862, "global_step": 14565, "epoch": 122, "lr": 9.059878881437107e-05} +{"train_loss": 0.010362225584685802, "global_step": 14566, "epoch": 122, "lr": 9.059749560119046e-05} +{"train_loss": 0.008977602235972881, "global_step": 14567, "epoch": 122, "lr": 9.0596202308301e-05} +{"train_loss": 0.008450742810964584, "global_step": 14568, "epoch": 122, "lr": 9.059490893570523e-05} +{"train_loss": 0.007901451550424099, "global_step": 14569, "epoch": 122, "lr": 9.059361548340569e-05} +{"train_loss": 0.007363911718130112, "global_step": 14570, "epoch": 122, "lr": 9.059232195140494e-05} +{"train_loss": 0.008717826567590237, "global_step": 14571, "epoch": 122, "lr": 9.059102833970547e-05} +{"train_loss": 0.005468479357659817, "global_step": 14572, "epoch": 122, "lr": 9.058973464830989e-05} +{"train_loss": 0.01264207623898983, "global_step": 14573, "epoch": 122, "lr": 9.058844087722067e-05} +{"train_loss": 0.00837584026157856, "global_step": 14574, "epoch": 122, "lr": 9.05871470264404e-05} +{"train_loss": 0.007954882457852364, "global_step": 14575, "epoch": 122, "lr": 9.05858530959716e-05} +{"train_loss": 0.006236211396753788, "global_step": 14576, "epoch": 122, "lr": 9.058455908581683e-05} +{"train_loss": 0.0067057739943265915, "global_step": 14577, "epoch": 122, "lr": 9.05832649959786e-05} +{"train_loss": 0.007614976726472378, "global_step": 14578, "epoch": 122, "lr": 9.058197082645944e-05} +{"train_loss": 0.016563668847084045, "global_step": 14579, "epoch": 122, "lr": 9.058067657726195e-05} +{"train_loss": 0.009164949879050255, "global_step": 14580, "epoch": 122, "lr": 9.057938224838862e-05} +{"train_loss": 0.009888608008623123, "global_step": 14581, "epoch": 122, "lr": 9.057808783984202e-05} +{"train_loss": 0.006386608351022005, "global_step": 14582, "epoch": 122, "lr": 9.057679335162466e-05} +{"train_loss": 0.007466454524546862, "global_step": 14583, "epoch": 122, "lr": 9.057549878373912e-05} +{"train_loss": 0.006665798369795084, "global_step": 14584, "epoch": 122, "lr": 9.057420413618791e-05} +{"train_loss": 0.006619976367801428, "global_step": 14585, "epoch": 122, "lr": 9.057290940897361e-05} +{"train_loss": 0.00654996233060956, "global_step": 14586, "epoch": 122, "lr": 9.05716146020987e-05} +{"train_loss": 0.011726947501301765, "global_step": 14587, "epoch": 122, "lr": 9.05703197155658e-05} +{"train_loss": 0.009296837262809277, "global_step": 14588, "epoch": 122, "lr": 9.056902474937739e-05} +{"train_loss": 0.009069537743926048, "global_step": 14589, "epoch": 122, "lr": 9.056772970353601e-05} +{"train_loss": 0.007638839539140463, "global_step": 14590, "epoch": 122, "lr": 9.056643457804426e-05} +{"train_loss": 0.0062017240561544895, "global_step": 14591, "epoch": 122, "lr": 9.056513937290465e-05} +{"train_loss": 0.010397356003522873, "global_step": 14592, "epoch": 122, "lr": 9.05638440881197e-05} +{"train_loss": 0.0057400972582399845, "global_step": 14593, "epoch": 122, "lr": 9.0562548723692e-05} +{"train_loss": 0.008621814660727978, "global_step": 14594, "epoch": 122, "lr": 9.056125327962406e-05} +{"train_loss": 0.006499723065644503, "global_step": 14595, "epoch": 122, "lr": 9.055995775591844e-05} +{"train_loss": 0.0065297638066112995, "global_step": 14596, "epoch": 122, "lr": 9.055866215257765e-05} +{"train_loss": 0.008675339631736279, "global_step": 14597, "epoch": 122, "lr": 9.055736646960428e-05} +{"train_loss": 0.01230678427964449, "global_step": 14598, "epoch": 122, "lr": 9.055607070700085e-05} +{"train_loss": 0.008158445358276367, "global_step": 14599, "epoch": 122, "lr": 9.055477486476991e-05} +{"train_loss": 0.005442979745566845, "global_step": 14600, "epoch": 122, "lr": 9.0553478942914e-05} +{"train_loss": 0.0056718760170042515, "global_step": 14601, "epoch": 122, "lr": 9.055218294143566e-05} +{"train_loss": 0.012088092975318432, "global_step": 14602, "epoch": 122, "lr": 9.055088686033745e-05} +{"train_loss": 0.008303302340209484, "global_step": 14603, "epoch": 122, "lr": 9.05495906996219e-05} +{"train_loss": 0.006513578817248344, "global_step": 14604, "epoch": 122, "lr": 9.054829445929156e-05} +{"train_loss": 0.0077619184739887714, "global_step": 14605, "epoch": 122, "lr": 9.054699813934899e-05} +{"train_loss": 0.0075426651164889336, "global_step": 14606, "epoch": 122, "lr": 9.05457017397967e-05} +{"train_loss": 0.00570638058707118, "global_step": 14607, "epoch": 122, "lr": 9.054440526063728e-05} +{"train_loss": 0.006493979133665562, "global_step": 14608, "epoch": 122, "lr": 9.054310870187323e-05} +{"train_loss": 0.00905052199959755, "global_step": 14609, "epoch": 122, "lr": 9.054181206350714e-05} +{"train_loss": 0.00425654835999012, "global_step": 14610, "epoch": 122, "lr": 9.05405153455415e-05} +{"train_loss": 0.00809687189757824, "global_step": 14611, "epoch": 122, "lr": 9.053921854797893e-05} +{"train_loss": 0.010334226302802563, "global_step": 14612, "epoch": 122, "lr": 9.053792167082192e-05} +{"train_loss": 0.009381209500133991, "global_step": 14613, "epoch": 122, "lr": 9.053662471407301e-05} +{"train_loss": 0.008427917957305908, "global_step": 14614, "epoch": 122, "lr": 9.053532767773479e-05} +{"train_loss": 0.007113655097782612, "global_step": 14615, "epoch": 122, "lr": 9.053403056180978e-05} +{"train_loss": 0.00627027777954936, "global_step": 14616, "epoch": 122, "lr": 9.053273336630053e-05} +{"train_loss": 0.00762599240988493, "global_step": 14617, "epoch": 122, "lr": 9.053143609120959e-05} +{"train_loss": 0.006196167785674334, "global_step": 14618, "epoch": 122, "lr": 9.053013873653951e-05} +{"train_loss": 0.007261332124471664, "global_step": 14619, "epoch": 122, "lr": 9.052884130229282e-05} +{"train_loss": 0.00915395375341177, "global_step": 14620, "epoch": 122, "lr": 9.052754378847209e-05} +{"train_loss": 0.009074856527149677, "global_step": 14621, "epoch": 122, "lr": 9.052624619507986e-05} +{"train_loss": 0.007062449119985104, "global_step": 14622, "epoch": 122, "lr": 9.052494852211865e-05} +{"train_loss": 0.009547962807118893, "global_step": 14623, "epoch": 122, "lr": 9.052365076959106e-05} +{"train_loss": 0.009852058254182339, "global_step": 14624, "epoch": 122, "lr": 9.05223529374996e-05} +{"train_loss": 0.004038090817630291, "global_step": 14625, "epoch": 122, "lr": 9.052105502584684e-05} +{"train_loss": 0.006477561313658953, "global_step": 14626, "epoch": 122, "lr": 9.051975703463532e-05} +{"train_loss": 0.007868676446378231, "global_step": 14627, "epoch": 122, "lr": 9.051845896386757e-05} +{"train_loss": 0.008584106341004372, "global_step": 14628, "epoch": 122, "lr": 9.051716081354616e-05} +{"train_loss": 0.009141734801232815, "global_step": 14629, "epoch": 122, "lr": 9.051586258367363e-05} +{"train_loss": 0.006907073315232992, "global_step": 14630, "epoch": 122, "lr": 9.051456427425253e-05} +{"train_loss": 0.008507746271789074, "global_step": 14631, "epoch": 122, "lr": 9.051326588528542e-05} +{"train_loss": 0.007571429945528507, "global_step": 14632, "epoch": 122, "lr": 9.051196741677484e-05} +{"train_loss": 0.005908533465117216, "global_step": 14633, "epoch": 122, "lr": 9.051066886872335e-05} +{"train_loss": 0.0072548650205135345, "global_step": 14634, "epoch": 122, "lr": 9.050937024113346e-05} +{"train_loss": 0.006352994125336409, "global_step": 14635, "epoch": 122, "lr": 9.050807153400777e-05} +{"train_loss": 0.007906787113106552, "global_step": 14636, "epoch": 122, "lr": 9.050677274734882e-05, "val_loss": 0.014105905778706074} +{"train_loss": 0.006947237998247147, "global_step": 14637, "epoch": 123, "lr": 9.050547388115913e-05} +{"train_loss": 0.008818690665066242, "global_step": 14638, "epoch": 123, "lr": 9.050417493544128e-05} +{"train_loss": 0.007730349898338318, "global_step": 14639, "epoch": 123, "lr": 9.050287591019779e-05} +{"train_loss": 0.003928031772375107, "global_step": 14640, "epoch": 123, "lr": 9.050157680543125e-05} +{"train_loss": 0.006063179578632116, "global_step": 14641, "epoch": 123, "lr": 9.050027762114419e-05} +{"train_loss": 0.007925505749881268, "global_step": 14642, "epoch": 123, "lr": 9.049897835733915e-05} +{"train_loss": 0.006774993613362312, "global_step": 14643, "epoch": 123, "lr": 9.049767901401872e-05} +{"train_loss": 0.007092584855854511, "global_step": 14644, "epoch": 123, "lr": 9.04963795911854e-05} +{"train_loss": 0.007358151488006115, "global_step": 14645, "epoch": 123, "lr": 9.049508008884176e-05} +{"train_loss": 0.009741436690092087, "global_step": 14646, "epoch": 123, "lr": 9.049378050699038e-05} +{"train_loss": 0.004200839903205633, "global_step": 14647, "epoch": 123, "lr": 9.049248084563376e-05} +{"train_loss": 0.008454665541648865, "global_step": 14648, "epoch": 123, "lr": 9.04911811047745e-05} +{"train_loss": 0.005021645221859217, "global_step": 14649, "epoch": 123, "lr": 9.048988128441512e-05} +{"train_loss": 0.006116739474236965, "global_step": 14650, "epoch": 123, "lr": 9.048858138455819e-05} +{"train_loss": 0.0055845510214567184, "global_step": 14651, "epoch": 123, "lr": 9.048728140520626e-05} +{"train_loss": 0.009907637722790241, "global_step": 14652, "epoch": 123, "lr": 9.048598134636188e-05} +{"train_loss": 0.00515183387324214, "global_step": 14653, "epoch": 123, "lr": 9.048468120802759e-05} +{"train_loss": 0.005475784186273813, "global_step": 14654, "epoch": 123, "lr": 9.048338099020596e-05} +{"train_loss": 0.009590360336005688, "global_step": 14655, "epoch": 123, "lr": 9.048208069289952e-05} +{"train_loss": 0.008133690804243088, "global_step": 14656, "epoch": 123, "lr": 9.048078031611087e-05} +{"train_loss": 0.008759280666708946, "global_step": 14657, "epoch": 123, "lr": 9.047947985984251e-05} +{"train_loss": 0.006447363179177046, "global_step": 14658, "epoch": 123, "lr": 9.047817932409702e-05} +{"train_loss": 0.004961775150150061, "global_step": 14659, "epoch": 123, "lr": 9.047687870887696e-05} +{"train_loss": 0.007659358903765678, "global_step": 14660, "epoch": 123, "lr": 9.047557801418486e-05} +{"train_loss": 0.010669373907148838, "global_step": 14661, "epoch": 123, "lr": 9.04742772400233e-05} +{"train_loss": 0.005327015183866024, "global_step": 14662, "epoch": 123, "lr": 9.04729763863948e-05} +{"train_loss": 0.007122189272195101, "global_step": 14663, "epoch": 123, "lr": 9.047167545330195e-05} +{"train_loss": 0.00614760909229517, "global_step": 14664, "epoch": 123, "lr": 9.047037444074728e-05} +{"train_loss": 0.009348243474960327, "global_step": 14665, "epoch": 123, "lr": 9.046907334873337e-05} +{"train_loss": 0.0066411783918738365, "global_step": 14666, "epoch": 123, "lr": 9.046777217726275e-05} +{"train_loss": 0.007822578772902489, "global_step": 14667, "epoch": 123, "lr": 9.046647092633798e-05} +{"train_loss": 0.012345529161393642, "global_step": 14668, "epoch": 123, "lr": 9.04651695959616e-05} +{"train_loss": 0.010115886107087135, "global_step": 14669, "epoch": 123, "lr": 9.046386818613621e-05} +{"train_loss": 0.006600494962185621, "global_step": 14670, "epoch": 123, "lr": 9.046256669686434e-05} +{"train_loss": 0.005906790029257536, "global_step": 14671, "epoch": 123, "lr": 9.046126512814852e-05} +{"train_loss": 0.007962527684867382, "global_step": 14672, "epoch": 123, "lr": 9.045996347999136e-05} +{"train_loss": 0.006234422791749239, "global_step": 14673, "epoch": 123, "lr": 9.045866175239535e-05} +{"train_loss": 0.008195403032004833, "global_step": 14674, "epoch": 123, "lr": 9.045735994536308e-05} +{"train_loss": 0.005007744766771793, "global_step": 14675, "epoch": 123, "lr": 9.045605805889713e-05} +{"train_loss": 0.010289234109222889, "global_step": 14676, "epoch": 123, "lr": 9.045475609300003e-05} +{"train_loss": 0.003968458157032728, "global_step": 14677, "epoch": 123, "lr": 9.045345404767432e-05} +{"train_loss": 0.006677411962300539, "global_step": 14678, "epoch": 123, "lr": 9.045215192292259e-05} +{"train_loss": 0.007078906055539846, "global_step": 14679, "epoch": 123, "lr": 9.045084971874738e-05} +{"train_loss": 0.009813632816076279, "global_step": 14680, "epoch": 123, "lr": 9.044954743515123e-05} +{"train_loss": 0.00553156016394496, "global_step": 14681, "epoch": 123, "lr": 9.044824507213674e-05} +{"train_loss": 0.0072395093739032745, "global_step": 14682, "epoch": 123, "lr": 9.044694262970644e-05} +{"train_loss": 0.008391106501221657, "global_step": 14683, "epoch": 123, "lr": 9.044564010786287e-05} +{"train_loss": 0.004739541094750166, "global_step": 14684, "epoch": 123, "lr": 9.044433750660863e-05} +{"train_loss": 0.010989845730364323, "global_step": 14685, "epoch": 123, "lr": 9.044303482594623e-05} +{"train_loss": 0.007649809587746859, "global_step": 14686, "epoch": 123, "lr": 9.044173206587826e-05} +{"train_loss": 0.008027820847928524, "global_step": 14687, "epoch": 123, "lr": 9.044042922640727e-05} +{"train_loss": 0.005615513306111097, "global_step": 14688, "epoch": 123, "lr": 9.043912630753583e-05} +{"train_loss": 0.00745152123272419, "global_step": 14689, "epoch": 123, "lr": 9.043782330926648e-05} +{"train_loss": 0.007925044745206833, "global_step": 14690, "epoch": 123, "lr": 9.043652023160179e-05} +{"train_loss": 0.007305996026843786, "global_step": 14691, "epoch": 123, "lr": 9.04352170745443e-05} +{"train_loss": 0.007845018059015274, "global_step": 14692, "epoch": 123, "lr": 9.043391383809659e-05} +{"train_loss": 0.010556862689554691, "global_step": 14693, "epoch": 123, "lr": 9.04326105222612e-05} +{"train_loss": 0.009246117435395718, "global_step": 14694, "epoch": 123, "lr": 9.04313071270407e-05} +{"train_loss": 0.007693807128816843, "global_step": 14695, "epoch": 123, "lr": 9.043000365243766e-05} +{"train_loss": 0.007538512349128723, "global_step": 14696, "epoch": 123, "lr": 9.042870009845461e-05} +{"train_loss": 0.01260949857532978, "global_step": 14697, "epoch": 123, "lr": 9.042739646509413e-05} +{"train_loss": 0.008311161771416664, "global_step": 14698, "epoch": 123, "lr": 9.042609275235878e-05} +{"train_loss": 0.008586322888731956, "global_step": 14699, "epoch": 123, "lr": 9.042478896025112e-05} +{"train_loss": 0.006844236049801111, "global_step": 14700, "epoch": 123, "lr": 9.04234850887737e-05} +{"train_loss": 0.007011879701167345, "global_step": 14701, "epoch": 123, "lr": 9.042218113792909e-05} +{"train_loss": 0.004688830114901066, "global_step": 14702, "epoch": 123, "lr": 9.042087710771985e-05} +{"train_loss": 0.005686050280928612, "global_step": 14703, "epoch": 123, "lr": 9.041957299814851e-05} +{"train_loss": 0.006658508442342281, "global_step": 14704, "epoch": 123, "lr": 9.041826880921768e-05} +{"train_loss": 0.011256030760705471, "global_step": 14705, "epoch": 123, "lr": 9.04169645409299e-05} +{"train_loss": 0.007148209027945995, "global_step": 14706, "epoch": 123, "lr": 9.041566019328773e-05} +{"train_loss": 0.0075738742016255856, "global_step": 14707, "epoch": 123, "lr": 9.041435576629371e-05} +{"train_loss": 0.0077471002005040646, "global_step": 14708, "epoch": 123, "lr": 9.041305125995043e-05} +{"train_loss": 0.010240940377116203, "global_step": 14709, "epoch": 123, "lr": 9.041174667426044e-05} +{"train_loss": 0.013644922524690628, "global_step": 14710, "epoch": 123, "lr": 9.041044200922631e-05} +{"train_loss": 0.010777431540191174, "global_step": 14711, "epoch": 123, "lr": 9.040913726485059e-05} +{"train_loss": 0.006518172100186348, "global_step": 14712, "epoch": 123, "lr": 9.040783244113584e-05} +{"train_loss": 0.007311646826565266, "global_step": 14713, "epoch": 123, "lr": 9.040652753808464e-05} +{"train_loss": 0.009712799452245235, "global_step": 14714, "epoch": 123, "lr": 9.040522255569954e-05} +{"train_loss": 0.0065881493501365185, "global_step": 14715, "epoch": 123, "lr": 9.040391749398309e-05} +{"train_loss": 0.008111853152513504, "global_step": 14716, "epoch": 123, "lr": 9.040261235293787e-05} +{"train_loss": 0.006531980354338884, "global_step": 14717, "epoch": 123, "lr": 9.040130713256644e-05} +{"train_loss": 0.007184807676821947, "global_step": 14718, "epoch": 123, "lr": 9.040000183287135e-05} +{"train_loss": 0.006521749775856733, "global_step": 14719, "epoch": 123, "lr": 9.039869645385518e-05} +{"train_loss": 0.006812421139329672, "global_step": 14720, "epoch": 123, "lr": 9.039739099552047e-05} +{"train_loss": 0.006813243497163057, "global_step": 14721, "epoch": 123, "lr": 9.039608545786983e-05} +{"train_loss": 0.007183513604104519, "global_step": 14722, "epoch": 123, "lr": 9.039477984090576e-05} +{"train_loss": 0.008497918024659157, "global_step": 14723, "epoch": 123, "lr": 9.039347414463088e-05} +{"train_loss": 0.005790918134152889, "global_step": 14724, "epoch": 123, "lr": 9.039216836904772e-05} +{"train_loss": 0.0070080505684018135, "global_step": 14725, "epoch": 123, "lr": 9.039086251415884e-05} +{"train_loss": 0.005736551247537136, "global_step": 14726, "epoch": 123, "lr": 9.038955657996684e-05} +{"train_loss": 0.006772198248654604, "global_step": 14727, "epoch": 123, "lr": 9.038825056647426e-05} +{"train_loss": 0.006202029064297676, "global_step": 14728, "epoch": 123, "lr": 9.038694447368365e-05} +{"train_loss": 0.007997358217835426, "global_step": 14729, "epoch": 123, "lr": 9.038563830159758e-05} +{"train_loss": 0.010531211271882057, "global_step": 14730, "epoch": 123, "lr": 9.038433205021864e-05} +{"train_loss": 0.007173443678766489, "global_step": 14731, "epoch": 123, "lr": 9.038302571954938e-05} +{"train_loss": 0.006973023060709238, "global_step": 14732, "epoch": 123, "lr": 9.038171930959236e-05} +{"train_loss": 0.008486544713377953, "global_step": 14733, "epoch": 123, "lr": 9.038041282035014e-05} +{"train_loss": 0.007046157494187355, "global_step": 14734, "epoch": 123, "lr": 9.03791062518253e-05} +{"train_loss": 0.008442729711532593, "global_step": 14735, "epoch": 123, "lr": 9.037779960402041e-05} +{"train_loss": 0.007437925785779953, "global_step": 14736, "epoch": 123, "lr": 9.037649287693801e-05} +{"train_loss": 0.008084243163466454, "global_step": 14737, "epoch": 123, "lr": 9.037518607058068e-05} +{"train_loss": 0.006234830245375633, "global_step": 14738, "epoch": 123, "lr": 9.0373879184951e-05} +{"train_loss": 0.00868547335267067, "global_step": 14739, "epoch": 123, "lr": 9.037257222005152e-05} +{"train_loss": 0.009103270247578621, "global_step": 14740, "epoch": 123, "lr": 9.037126517588478e-05} +{"train_loss": 0.004525481723248959, "global_step": 14741, "epoch": 123, "lr": 9.03699580524534e-05} +{"train_loss": 0.007659957744181156, "global_step": 14742, "epoch": 123, "lr": 9.036865084975992e-05} +{"train_loss": 0.007750567048788071, "global_step": 14743, "epoch": 123, "lr": 9.036734356780689e-05} +{"train_loss": 0.008021863177418709, "global_step": 14744, "epoch": 123, "lr": 9.036603620659689e-05} +{"train_loss": 0.007194818463176489, "global_step": 14745, "epoch": 123, "lr": 9.036472876613251e-05} +{"train_loss": 0.006306761410087347, "global_step": 14746, "epoch": 123, "lr": 9.036342124641629e-05} +{"train_loss": 0.010897123254835606, "global_step": 14747, "epoch": 123, "lr": 9.036211364745081e-05} +{"train_loss": 0.008117574267089367, "global_step": 14748, "epoch": 123, "lr": 9.036080596923861e-05} +{"train_loss": 0.007757899351418018, "global_step": 14749, "epoch": 123, "lr": 9.035949821178232e-05} +{"train_loss": 0.009523647837340832, "global_step": 14750, "epoch": 123, "lr": 9.035819037508444e-05} +{"train_loss": 0.0049986811354756355, "global_step": 14751, "epoch": 123, "lr": 9.035688245914756e-05} +{"train_loss": 0.006804157048463821, "global_step": 14752, "epoch": 123, "lr": 9.035557446397427e-05} +{"train_loss": 0.007584043312817812, "global_step": 14753, "epoch": 123, "lr": 9.03542663895671e-05} +{"train_loss": 0.0063944365829229355, "global_step": 14754, "epoch": 123, "lr": 9.035295823592867e-05} +{"train_loss": 0.007550706132119443, "global_step": 14755, "epoch": 123, "lr": 9.035165000306148e-05, "val_loss": 0.018847564235329628} +{"train_loss": 0.006424921099096537, "global_step": 14756, "epoch": 124, "lr": 9.035034169096816e-05} +{"train_loss": 0.009281100705265999, "global_step": 14757, "epoch": 124, "lr": 9.034903329965126e-05} +{"train_loss": 0.008094941265881062, "global_step": 14758, "epoch": 124, "lr": 9.034772482911332e-05} +{"train_loss": 0.004342278931289911, "global_step": 14759, "epoch": 124, "lr": 9.034641627935695e-05} +{"train_loss": 0.011194851249456406, "global_step": 14760, "epoch": 124, "lr": 9.03451076503847e-05} +{"train_loss": 0.0072559514082968235, "global_step": 14761, "epoch": 124, "lr": 9.034379894219913e-05} +{"train_loss": 0.010506699793040752, "global_step": 14762, "epoch": 124, "lr": 9.034249015480284e-05} +{"train_loss": 0.007439172826707363, "global_step": 14763, "epoch": 124, "lr": 9.034118128819837e-05} +{"train_loss": 0.006337443832308054, "global_step": 14764, "epoch": 124, "lr": 9.03398723423883e-05} +{"train_loss": 0.00695898849517107, "global_step": 14765, "epoch": 124, "lr": 9.03385633173752e-05} +{"train_loss": 0.008232825435698032, "global_step": 14766, "epoch": 124, "lr": 9.033725421316164e-05} +{"train_loss": 0.005467782262712717, "global_step": 14767, "epoch": 124, "lr": 9.03359450297502e-05} +{"train_loss": 0.009562830440700054, "global_step": 14768, "epoch": 124, "lr": 9.033463576714343e-05} +{"train_loss": 0.009087201207876205, "global_step": 14769, "epoch": 124, "lr": 9.033332642534391e-05} +{"train_loss": 0.0048174867406487465, "global_step": 14770, "epoch": 124, "lr": 9.033201700435423e-05} +{"train_loss": 0.005182832479476929, "global_step": 14771, "epoch": 124, "lr": 9.033070750417693e-05} +{"train_loss": 0.0061481427401304245, "global_step": 14772, "epoch": 124, "lr": 9.032939792481458e-05} +{"train_loss": 0.010267636738717556, "global_step": 14773, "epoch": 124, "lr": 9.032808826626979e-05} +{"train_loss": 0.00825497880578041, "global_step": 14774, "epoch": 124, "lr": 9.03267785285451e-05} +{"train_loss": 0.008071424439549446, "global_step": 14775, "epoch": 124, "lr": 9.032546871164309e-05} +{"train_loss": 0.00746742682531476, "global_step": 14776, "epoch": 124, "lr": 9.032415881556633e-05} +{"train_loss": 0.0061184619553387165, "global_step": 14777, "epoch": 124, "lr": 9.032284884031739e-05} +{"train_loss": 0.009845681488513947, "global_step": 14778, "epoch": 124, "lr": 9.032153878589884e-05} +{"train_loss": 0.007990431971848011, "global_step": 14779, "epoch": 124, "lr": 9.032022865231327e-05} +{"train_loss": 0.007786790374666452, "global_step": 14780, "epoch": 124, "lr": 9.031891843956322e-05} +{"train_loss": 0.010050063021481037, "global_step": 14781, "epoch": 124, "lr": 9.031760814765129e-05} +{"train_loss": 0.010907531715929508, "global_step": 14782, "epoch": 124, "lr": 9.031629777658005e-05} +{"train_loss": 0.008254896849393845, "global_step": 14783, "epoch": 124, "lr": 9.031498732635207e-05} +{"train_loss": 0.00844215415418148, "global_step": 14784, "epoch": 124, "lr": 9.031367679696991e-05} +{"train_loss": 0.006445916835218668, "global_step": 14785, "epoch": 124, "lr": 9.031236618843615e-05} +{"train_loss": 0.007565625477582216, "global_step": 14786, "epoch": 124, "lr": 9.031105550075336e-05} +{"train_loss": 0.009566444903612137, "global_step": 14787, "epoch": 124, "lr": 9.030974473392413e-05} +{"train_loss": 0.006859155371785164, "global_step": 14788, "epoch": 124, "lr": 9.030843388795103e-05} +{"train_loss": 0.006947477348148823, "global_step": 14789, "epoch": 124, "lr": 9.030712296283661e-05} +{"train_loss": 0.012825940735638142, "global_step": 14790, "epoch": 124, "lr": 9.030581195858347e-05} +{"train_loss": 0.004907743539661169, "global_step": 14791, "epoch": 124, "lr": 9.030450087519417e-05} +{"train_loss": 0.007331999950110912, "global_step": 14792, "epoch": 124, "lr": 9.030318971267129e-05} +{"train_loss": 0.0067188977263867855, "global_step": 14793, "epoch": 124, "lr": 9.03018784710174e-05} +{"train_loss": 0.005460480693727732, "global_step": 14794, "epoch": 124, "lr": 9.030056715023507e-05} +{"train_loss": 0.006826301105320454, "global_step": 14795, "epoch": 124, "lr": 9.029925575032689e-05} +{"train_loss": 0.007595743052661419, "global_step": 14796, "epoch": 124, "lr": 9.029794427129543e-05} +{"train_loss": 0.006197573151439428, "global_step": 14797, "epoch": 124, "lr": 9.029663271314326e-05} +{"train_loss": 0.008325628936290741, "global_step": 14798, "epoch": 124, "lr": 9.029532107587296e-05} +{"train_loss": 0.007692212704569101, "global_step": 14799, "epoch": 124, "lr": 9.02940093594871e-05} +{"train_loss": 0.004818572662770748, "global_step": 14800, "epoch": 124, "lr": 9.029269756398826e-05} +{"train_loss": 0.005792082753032446, "global_step": 14801, "epoch": 124, "lr": 9.0291385689379e-05} +{"train_loss": 0.006872129626572132, "global_step": 14802, "epoch": 124, "lr": 9.029007373566192e-05} +{"train_loss": 0.0051812115125358105, "global_step": 14803, "epoch": 124, "lr": 9.028876170283958e-05} +{"train_loss": 0.006068552378565073, "global_step": 14804, "epoch": 124, "lr": 9.028744959091457e-05} +{"train_loss": 0.006486342288553715, "global_step": 14805, "epoch": 124, "lr": 9.028613739988945e-05} +{"train_loss": 0.0067353262566030025, "global_step": 14806, "epoch": 124, "lr": 9.028482512976679e-05} +{"train_loss": 0.006070992443710566, "global_step": 14807, "epoch": 124, "lr": 9.028351278054921e-05} +{"train_loss": 0.005952127743512392, "global_step": 14808, "epoch": 124, "lr": 9.028220035223923e-05} +{"train_loss": 0.0074417851865291595, "global_step": 14809, "epoch": 124, "lr": 9.028088784483946e-05} +{"train_loss": 0.005606294143944979, "global_step": 14810, "epoch": 124, "lr": 9.027957525835248e-05} +{"train_loss": 0.0064398618414998055, "global_step": 14811, "epoch": 124, "lr": 9.027826259278084e-05} +{"train_loss": 0.008293477818369865, "global_step": 14812, "epoch": 124, "lr": 9.027694984812714e-05} +{"train_loss": 0.004616597201675177, "global_step": 14813, "epoch": 124, "lr": 9.027563702439397e-05} +{"train_loss": 0.00623220345005393, "global_step": 14814, "epoch": 124, "lr": 9.027432412158386e-05} +{"train_loss": 0.008064765483140945, "global_step": 14815, "epoch": 124, "lr": 9.027301113969944e-05} +{"train_loss": 0.004954868927598, "global_step": 14816, "epoch": 124, "lr": 9.027169807874327e-05} +{"train_loss": 0.007568548433482647, "global_step": 14817, "epoch": 124, "lr": 9.02703849387179e-05} +{"train_loss": 0.006609785370528698, "global_step": 14818, "epoch": 124, "lr": 9.026907171962594e-05} +{"train_loss": 0.006507159676402807, "global_step": 14819, "epoch": 124, "lr": 9.026775842146998e-05} +{"train_loss": 0.005269220098853111, "global_step": 14820, "epoch": 124, "lr": 9.026644504425254e-05} +{"train_loss": 0.008704619482159615, "global_step": 14821, "epoch": 124, "lr": 9.026513158797626e-05} +{"train_loss": 0.007953732274472713, "global_step": 14822, "epoch": 124, "lr": 9.02638180526437e-05} +{"train_loss": 0.008372828364372253, "global_step": 14823, "epoch": 124, "lr": 9.026250443825742e-05} +{"train_loss": 0.009009336121380329, "global_step": 14824, "epoch": 124, "lr": 9.026119074482003e-05} +{"train_loss": 0.005302800796926022, "global_step": 14825, "epoch": 124, "lr": 9.025987697233408e-05} +{"train_loss": 0.0074051483534276485, "global_step": 14826, "epoch": 124, "lr": 9.025856312080216e-05} +{"train_loss": 0.009439338929951191, "global_step": 14827, "epoch": 124, "lr": 9.025724919022687e-05} +{"train_loss": 0.01093271654099226, "global_step": 14828, "epoch": 124, "lr": 9.025593518061076e-05} +{"train_loss": 0.007074602413922548, "global_step": 14829, "epoch": 124, "lr": 9.025462109195641e-05} +{"train_loss": 0.009691938757896423, "global_step": 14830, "epoch": 124, "lr": 9.025330692426643e-05} +{"train_loss": 0.009859642945230007, "global_step": 14831, "epoch": 124, "lr": 9.025199267754338e-05} +{"train_loss": 0.006289866752922535, "global_step": 14832, "epoch": 124, "lr": 9.025067835178985e-05} +{"train_loss": 0.007033664733171463, "global_step": 14833, "epoch": 124, "lr": 9.02493639470084e-05} +{"train_loss": 0.0063699642196297646, "global_step": 14834, "epoch": 124, "lr": 9.024804946320164e-05} +{"train_loss": 0.005800218321382999, "global_step": 14835, "epoch": 124, "lr": 9.024673490037213e-05} +{"train_loss": 0.006044976878911257, "global_step": 14836, "epoch": 124, "lr": 9.024542025852243e-05} +{"train_loss": 0.012191126123070717, "global_step": 14837, "epoch": 124, "lr": 9.024410553765517e-05} +{"train_loss": 0.007131007965654135, "global_step": 14838, "epoch": 124, "lr": 9.02427907377729e-05} +{"train_loss": 0.008439302444458008, "global_step": 14839, "epoch": 124, "lr": 9.024147585887821e-05} +{"train_loss": 0.007702637929469347, "global_step": 14840, "epoch": 124, "lr": 9.024016090097369e-05} +{"train_loss": 0.003899872535839677, "global_step": 14841, "epoch": 124, "lr": 9.023884586406191e-05} +{"train_loss": 0.008619911037385464, "global_step": 14842, "epoch": 124, "lr": 9.023753074814545e-05} +{"train_loss": 0.01089825201779604, "global_step": 14843, "epoch": 124, "lr": 9.02362155532269e-05} +{"train_loss": 0.004526039585471153, "global_step": 14844, "epoch": 124, "lr": 9.023490027930884e-05} +{"train_loss": 0.00821350421756506, "global_step": 14845, "epoch": 124, "lr": 9.023358492639385e-05} +{"train_loss": 0.00573586905375123, "global_step": 14846, "epoch": 124, "lr": 9.023226949448451e-05} +{"train_loss": 0.00829398911446333, "global_step": 14847, "epoch": 124, "lr": 9.023095398358342e-05} +{"train_loss": 0.00784190371632576, "global_step": 14848, "epoch": 124, "lr": 9.022963839369314e-05} +{"train_loss": 0.005583173595368862, "global_step": 14849, "epoch": 124, "lr": 9.022832272481628e-05} +{"train_loss": 0.005162273533642292, "global_step": 14850, "epoch": 124, "lr": 9.022700697695539e-05} +{"train_loss": 0.011129333637654781, "global_step": 14851, "epoch": 124, "lr": 9.022569115011305e-05} +{"train_loss": 0.00943315401673317, "global_step": 14852, "epoch": 124, "lr": 9.02243752442919e-05} +{"train_loss": 0.0074120634235441685, "global_step": 14853, "epoch": 124, "lr": 9.022305925949447e-05} +{"train_loss": 0.007332885172218084, "global_step": 14854, "epoch": 124, "lr": 9.022174319572336e-05} +{"train_loss": 0.00660830270498991, "global_step": 14855, "epoch": 124, "lr": 9.022042705298115e-05} +{"train_loss": 0.0103942034766078, "global_step": 14856, "epoch": 124, "lr": 9.021911083127044e-05} +{"train_loss": 0.007518472615629435, "global_step": 14857, "epoch": 124, "lr": 9.021779453059379e-05} +{"train_loss": 0.009517192840576172, "global_step": 14858, "epoch": 124, "lr": 9.021647815095381e-05} +{"train_loss": 0.005639538634568453, "global_step": 14859, "epoch": 124, "lr": 9.021516169235307e-05} +{"train_loss": 0.005048909690231085, "global_step": 14860, "epoch": 124, "lr": 9.021384515479414e-05} +{"train_loss": 0.00918804481625557, "global_step": 14861, "epoch": 124, "lr": 9.021252853827964e-05} +{"train_loss": 0.009406011551618576, "global_step": 14862, "epoch": 124, "lr": 9.021121184281211e-05} +{"train_loss": 0.008430711925029755, "global_step": 14863, "epoch": 124, "lr": 9.020989506839419e-05} +{"train_loss": 0.006491458043456078, "global_step": 14864, "epoch": 124, "lr": 9.020857821502843e-05} +{"train_loss": 0.005812739487737417, "global_step": 14865, "epoch": 124, "lr": 9.020726128271741e-05} +{"train_loss": 0.008154485374689102, "global_step": 14866, "epoch": 124, "lr": 9.020594427146374e-05} +{"train_loss": 0.0038366729859262705, "global_step": 14867, "epoch": 124, "lr": 9.020462718126999e-05} +{"train_loss": 0.008781167678534985, "global_step": 14868, "epoch": 124, "lr": 9.020331001213875e-05} +{"train_loss": 0.008457125164568424, "global_step": 14869, "epoch": 124, "lr": 9.020199276407262e-05} +{"train_loss": 0.006155651994049549, "global_step": 14870, "epoch": 124, "lr": 9.020067543707416e-05} +{"train_loss": 0.0067016007378697395, "global_step": 14871, "epoch": 124, "lr": 9.019935803114596e-05} +{"train_loss": 0.006598643027245998, "global_step": 14872, "epoch": 124, "lr": 9.019804054629062e-05} +{"train_loss": 0.007215165998786688, "global_step": 14873, "epoch": 124, "lr": 9.019672298251073e-05} +{"train_loss": 0.007426974418408731, "global_step": 14874, "epoch": 124, "lr": 9.019540533980886e-05, "val_loss": 0.012580415233969688} +{"train_loss": 0.006765390280634165, "global_step": 14875, "epoch": 125, "lr": 9.019408761818762e-05} +{"train_loss": 0.007356191053986549, "global_step": 14876, "epoch": 125, "lr": 9.019276981764957e-05} +{"train_loss": 0.0064976876601576805, "global_step": 14877, "epoch": 125, "lr": 9.019145193819732e-05} +{"train_loss": 0.007180043030530214, "global_step": 14878, "epoch": 125, "lr": 9.019013397983343e-05} +{"train_loss": 0.00742255337536335, "global_step": 14879, "epoch": 125, "lr": 9.018881594256052e-05} +{"train_loss": 0.010558951646089554, "global_step": 14880, "epoch": 125, "lr": 9.018749782638116e-05} +{"train_loss": 0.004690555855631828, "global_step": 14881, "epoch": 125, "lr": 9.018617963129793e-05} +{"train_loss": 0.004376304801553488, "global_step": 14882, "epoch": 125, "lr": 9.018486135731344e-05} +{"train_loss": 0.008595882914960384, "global_step": 14883, "epoch": 125, "lr": 9.018354300443028e-05} +{"train_loss": 0.006617845967411995, "global_step": 14884, "epoch": 125, "lr": 9.018222457265101e-05} +{"train_loss": 0.007566237356513739, "global_step": 14885, "epoch": 125, "lr": 9.018090606197825e-05} +{"train_loss": 0.00862607080489397, "global_step": 14886, "epoch": 125, "lr": 9.017958747241455e-05} +{"train_loss": 0.007209495175629854, "global_step": 14887, "epoch": 125, "lr": 9.017826880396254e-05} +{"train_loss": 0.004263118840754032, "global_step": 14888, "epoch": 125, "lr": 9.017695005662479e-05} +{"train_loss": 0.006565037649124861, "global_step": 14889, "epoch": 125, "lr": 9.01756312304039e-05} +{"train_loss": 0.004318518564105034, "global_step": 14890, "epoch": 125, "lr": 9.017431232530243e-05} +{"train_loss": 0.0068934401497244835, "global_step": 14891, "epoch": 125, "lr": 9.017299334132299e-05} +{"train_loss": 0.00584820844233036, "global_step": 14892, "epoch": 125, "lr": 9.017167427846817e-05} +{"train_loss": 0.006338864099234343, "global_step": 14893, "epoch": 125, "lr": 9.017035513674058e-05} +{"train_loss": 0.006697174161672592, "global_step": 14894, "epoch": 125, "lr": 9.016903591614278e-05} +{"train_loss": 0.007411287631839514, "global_step": 14895, "epoch": 125, "lr": 9.016771661667735e-05} +{"train_loss": 0.007660543546080589, "global_step": 14896, "epoch": 125, "lr": 9.016639723834692e-05} +{"train_loss": 0.008726654574275017, "global_step": 14897, "epoch": 125, "lr": 9.016507778115406e-05} +{"train_loss": 0.006601825822144747, "global_step": 14898, "epoch": 125, "lr": 9.016375824510135e-05} +{"train_loss": 0.009087975136935711, "global_step": 14899, "epoch": 125, "lr": 9.016243863019141e-05} +{"train_loss": 0.007133350241929293, "global_step": 14900, "epoch": 125, "lr": 9.016111893642681e-05} +{"train_loss": 0.0063855345360934734, "global_step": 14901, "epoch": 125, "lr": 9.015979916381012e-05} +{"train_loss": 0.0040555126033723354, "global_step": 14902, "epoch": 125, "lr": 9.015847931234397e-05} +{"train_loss": 0.007541994098573923, "global_step": 14903, "epoch": 125, "lr": 9.015715938203093e-05} +{"train_loss": 0.00676368735730648, "global_step": 14904, "epoch": 125, "lr": 9.015583937287361e-05} +{"train_loss": 0.008813838474452496, "global_step": 14905, "epoch": 125, "lr": 9.015451928487457e-05} +{"train_loss": 0.005706821568310261, "global_step": 14906, "epoch": 125, "lr": 9.015319911803643e-05} +{"train_loss": 0.006150627508759499, "global_step": 14907, "epoch": 125, "lr": 9.015187887236178e-05} +{"train_loss": 0.009214639663696289, "global_step": 14908, "epoch": 125, "lr": 9.015055854785321e-05} +{"train_loss": 0.0062614185735583305, "global_step": 14909, "epoch": 125, "lr": 9.01492381445133e-05} +{"train_loss": 0.004188832826912403, "global_step": 14910, "epoch": 125, "lr": 9.014791766234465e-05} +{"train_loss": 0.007373749278485775, "global_step": 14911, "epoch": 125, "lr": 9.014659710134985e-05} +{"train_loss": 0.005909709259867668, "global_step": 14912, "epoch": 125, "lr": 9.014527646153151e-05} +{"train_loss": 0.007372313644737005, "global_step": 14913, "epoch": 125, "lr": 9.014395574289218e-05} +{"train_loss": 0.0056263478472828865, "global_step": 14914, "epoch": 125, "lr": 9.01426349454345e-05} +{"train_loss": 0.006254664622247219, "global_step": 14915, "epoch": 125, "lr": 9.014131406916105e-05} +{"train_loss": 0.005590646527707577, "global_step": 14916, "epoch": 125, "lr": 9.013999311407441e-05} +{"train_loss": 0.00694793276488781, "global_step": 14917, "epoch": 125, "lr": 9.013867208017719e-05} +{"train_loss": 0.010671298019587994, "global_step": 14918, "epoch": 125, "lr": 9.013735096747197e-05} +{"train_loss": 0.004357649013400078, "global_step": 14919, "epoch": 125, "lr": 9.013602977596134e-05} +{"train_loss": 0.008267935365438461, "global_step": 14920, "epoch": 125, "lr": 9.013470850564791e-05} +{"train_loss": 0.005031144246459007, "global_step": 14921, "epoch": 125, "lr": 9.013338715653427e-05} +{"train_loss": 0.004600703250616789, "global_step": 14922, "epoch": 125, "lr": 9.013206572862302e-05} +{"train_loss": 0.004059923812747002, "global_step": 14923, "epoch": 125, "lr": 9.013074422191674e-05} +{"train_loss": 0.00919062364846468, "global_step": 14924, "epoch": 125, "lr": 9.012942263641803e-05} +{"train_loss": 0.006510052364319563, "global_step": 14925, "epoch": 125, "lr": 9.012810097212948e-05} +{"train_loss": 0.006926541682332754, "global_step": 14926, "epoch": 125, "lr": 9.01267792290537e-05} +{"train_loss": 0.004351935349404812, "global_step": 14927, "epoch": 125, "lr": 9.012545740719327e-05} +{"train_loss": 0.00957014225423336, "global_step": 14928, "epoch": 125, "lr": 9.012413550655078e-05} +{"train_loss": 0.006788966245949268, "global_step": 14929, "epoch": 125, "lr": 9.012281352712886e-05} +{"train_loss": 0.0061294459737837315, "global_step": 14930, "epoch": 125, "lr": 9.012149146893007e-05} +{"train_loss": 0.004679566714912653, "global_step": 14931, "epoch": 125, "lr": 9.012016933195701e-05} +{"train_loss": 0.005638630595058203, "global_step": 14932, "epoch": 125, "lr": 9.011884711621231e-05} +{"train_loss": 0.005973835475742817, "global_step": 14933, "epoch": 125, "lr": 9.011752482169852e-05} +{"train_loss": 0.006801479961723089, "global_step": 14934, "epoch": 125, "lr": 9.011620244841825e-05} +{"train_loss": 0.007308992091566324, "global_step": 14935, "epoch": 125, "lr": 9.011487999637411e-05} +{"train_loss": 0.006649890448898077, "global_step": 14936, "epoch": 125, "lr": 9.01135574655687e-05} +{"train_loss": 0.006788474507629871, "global_step": 14937, "epoch": 125, "lr": 9.011223485600459e-05} +{"train_loss": 0.007653312291949987, "global_step": 14938, "epoch": 125, "lr": 9.01109121676844e-05} +{"train_loss": 0.00708272447809577, "global_step": 14939, "epoch": 125, "lr": 9.010958940061072e-05} +{"train_loss": 0.009097829461097717, "global_step": 14940, "epoch": 125, "lr": 9.010826655478615e-05} +{"train_loss": 0.007346415892243385, "global_step": 14941, "epoch": 125, "lr": 9.010694363021327e-05} +{"train_loss": 0.007514669559895992, "global_step": 14942, "epoch": 125, "lr": 9.010562062689469e-05} +{"train_loss": 0.005057857371866703, "global_step": 14943, "epoch": 125, "lr": 9.010429754483303e-05} +{"train_loss": 0.00509978411719203, "global_step": 14944, "epoch": 125, "lr": 9.010297438403083e-05} +{"train_loss": 0.006024384405463934, "global_step": 14945, "epoch": 125, "lr": 9.010165114449077e-05} +{"train_loss": 0.006661033723503351, "global_step": 14946, "epoch": 125, "lr": 9.010032782621537e-05} +{"train_loss": 0.004770663566887379, "global_step": 14947, "epoch": 125, "lr": 9.009900442920726e-05} +{"train_loss": 0.004845259245485067, "global_step": 14948, "epoch": 125, "lr": 9.009768095346906e-05} +{"train_loss": 0.0049803839065134525, "global_step": 14949, "epoch": 125, "lr": 9.009635739900332e-05} +{"train_loss": 0.005168923642486334, "global_step": 14950, "epoch": 125, "lr": 9.00950337658127e-05} +{"train_loss": 0.005422197747975588, "global_step": 14951, "epoch": 125, "lr": 9.009371005389974e-05} +{"train_loss": 0.010855894535779953, "global_step": 14952, "epoch": 125, "lr": 9.009238626326708e-05} +{"train_loss": 0.005308279301971197, "global_step": 14953, "epoch": 125, "lr": 9.009106239391728e-05} +{"train_loss": 0.003782369429245591, "global_step": 14954, "epoch": 125, "lr": 9.008973844585298e-05} +{"train_loss": 0.006273223087191582, "global_step": 14955, "epoch": 125, "lr": 9.008841441907676e-05} +{"train_loss": 0.00581711670383811, "global_step": 14956, "epoch": 125, "lr": 9.008709031359122e-05} +{"train_loss": 0.005835932679474354, "global_step": 14957, "epoch": 125, "lr": 9.008576612939894e-05} +{"train_loss": 0.006748459301888943, "global_step": 14958, "epoch": 125, "lr": 9.008444186650256e-05} +{"train_loss": 0.007138852495700121, "global_step": 14959, "epoch": 125, "lr": 9.008311752490466e-05} +{"train_loss": 0.0050286781042814255, "global_step": 14960, "epoch": 125, "lr": 9.008179310460785e-05} +{"train_loss": 0.007190175820142031, "global_step": 14961, "epoch": 125, "lr": 9.008046860561471e-05} +{"train_loss": 0.005752177443355322, "global_step": 14962, "epoch": 125, "lr": 9.007914402792785e-05} +{"train_loss": 0.006804306525737047, "global_step": 14963, "epoch": 125, "lr": 9.007781937154988e-05} +{"train_loss": 0.007393122185021639, "global_step": 14964, "epoch": 125, "lr": 9.007649463648338e-05} +{"train_loss": 0.007715234998613596, "global_step": 14965, "epoch": 125, "lr": 9.007516982273099e-05} +{"train_loss": 0.005992541089653969, "global_step": 14966, "epoch": 125, "lr": 9.007384493029526e-05} +{"train_loss": 0.0069099171087145805, "global_step": 14967, "epoch": 125, "lr": 9.007251995917882e-05} +{"train_loss": 0.006977207027375698, "global_step": 14968, "epoch": 125, "lr": 9.007119490938429e-05} +{"train_loss": 0.007050179410725832, "global_step": 14969, "epoch": 125, "lr": 9.006986978091422e-05} +{"train_loss": 0.008405070751905441, "global_step": 14970, "epoch": 125, "lr": 9.006854457377126e-05} +{"train_loss": 0.006011896301060915, "global_step": 14971, "epoch": 125, "lr": 9.006721928795798e-05} +{"train_loss": 0.005278976168483496, "global_step": 14972, "epoch": 125, "lr": 9.006589392347702e-05} +{"train_loss": 0.006541205570101738, "global_step": 14973, "epoch": 125, "lr": 9.006456848033093e-05} +{"train_loss": 0.009516922757029533, "global_step": 14974, "epoch": 125, "lr": 9.006324295852235e-05} +{"train_loss": 0.004681198392063379, "global_step": 14975, "epoch": 125, "lr": 9.006191735805388e-05} +{"train_loss": 0.005599348805844784, "global_step": 14976, "epoch": 125, "lr": 9.00605916789281e-05} +{"train_loss": 0.006141714286059141, "global_step": 14977, "epoch": 125, "lr": 9.005926592114765e-05} +{"train_loss": 0.00764850527048111, "global_step": 14978, "epoch": 125, "lr": 9.005794008471509e-05} +{"train_loss": 0.00831839069724083, "global_step": 14979, "epoch": 125, "lr": 9.005661416963306e-05} +{"train_loss": 0.004704072140157223, "global_step": 14980, "epoch": 125, "lr": 9.005528817590414e-05} +{"train_loss": 0.01001838780939579, "global_step": 14981, "epoch": 125, "lr": 9.005396210353094e-05} +{"train_loss": 0.00801206473261118, "global_step": 14982, "epoch": 125, "lr": 9.005263595251607e-05} +{"train_loss": 0.005798084661364555, "global_step": 14983, "epoch": 125, "lr": 9.005130972286213e-05} +{"train_loss": 0.0058901021257042885, "global_step": 14984, "epoch": 125, "lr": 9.004998341457172e-05} +{"train_loss": 0.009010255336761475, "global_step": 14985, "epoch": 125, "lr": 9.004865702764745e-05} +{"train_loss": 0.006594442296773195, "global_step": 14986, "epoch": 125, "lr": 9.004733056209189e-05} +{"train_loss": 0.009889401495456696, "global_step": 14987, "epoch": 125, "lr": 9.004600401790771e-05} +{"train_loss": 0.008152407594025135, "global_step": 14988, "epoch": 125, "lr": 9.004467739509746e-05} +{"train_loss": 0.00815032608807087, "global_step": 14989, "epoch": 125, "lr": 9.004335069366377e-05} +{"train_loss": 0.0057538715191185474, "global_step": 14990, "epoch": 125, "lr": 9.004202391360925e-05} +{"train_loss": 0.006374200340360403, "global_step": 14991, "epoch": 125, "lr": 9.004069705493649e-05} +{"train_loss": 0.007385767996311188, "global_step": 14992, "epoch": 125, "lr": 9.003937011764809e-05} +{"train_loss": 0.006721469700852988, "global_step": 14993, "epoch": 125, "lr": 9.003804310174667e-05, "val_loss": 0.01261937152594328, "train_action_mse_error": 0.00023101631086319685} +{"train_loss": 0.005429996643215418, "global_step": 14994, "epoch": 126, "lr": 9.003671600723483e-05} +{"train_loss": 0.0060751973651349545, "global_step": 14995, "epoch": 126, "lr": 9.003538883411516e-05} +{"train_loss": 0.0061228470876812935, "global_step": 14996, "epoch": 126, "lr": 9.00340615823903e-05} +{"train_loss": 0.00592826958745718, "global_step": 14997, "epoch": 126, "lr": 9.003273425206283e-05} +{"train_loss": 0.00643859151750803, "global_step": 14998, "epoch": 126, "lr": 9.003140684313536e-05} +{"train_loss": 0.005652246065437794, "global_step": 14999, "epoch": 126, "lr": 9.003007935561052e-05} +{"train_loss": 0.007748295087367296, "global_step": 15000, "epoch": 126, "lr": 9.002875178949088e-05} +{"train_loss": 0.007277355063706636, "global_step": 15001, "epoch": 126, "lr": 9.002742414477904e-05} +{"train_loss": 0.005796889774501324, "global_step": 15002, "epoch": 126, "lr": 9.002609642147766e-05} +{"train_loss": 0.008805294521152973, "global_step": 15003, "epoch": 126, "lr": 9.002476861958931e-05} +{"train_loss": 0.004954561125487089, "global_step": 15004, "epoch": 126, "lr": 9.002344073911659e-05} +{"train_loss": 0.005223240237683058, "global_step": 15005, "epoch": 126, "lr": 9.002211278006214e-05} +{"train_loss": 0.006519305054098368, "global_step": 15006, "epoch": 126, "lr": 9.002078474242855e-05} +{"train_loss": 0.0069193607196211815, "global_step": 15007, "epoch": 126, "lr": 9.00194566262184e-05} +{"train_loss": 0.007261923514306545, "global_step": 15008, "epoch": 126, "lr": 9.001812843143433e-05} +{"train_loss": 0.006943280342966318, "global_step": 15009, "epoch": 126, "lr": 9.001680015807896e-05} +{"train_loss": 0.011823782697319984, "global_step": 15010, "epoch": 126, "lr": 9.001547180615485e-05} +{"train_loss": 0.005399591289460659, "global_step": 15011, "epoch": 126, "lr": 9.001414337566465e-05} +{"train_loss": 0.00518165435642004, "global_step": 15012, "epoch": 126, "lr": 9.001281486661095e-05} +{"train_loss": 0.007668105885386467, "global_step": 15013, "epoch": 126, "lr": 9.001148627899636e-05} +{"train_loss": 0.006491281557828188, "global_step": 15014, "epoch": 126, "lr": 9.00101576128235e-05} +{"train_loss": 0.009840039536356926, "global_step": 15015, "epoch": 126, "lr": 9.000882886809498e-05} +{"train_loss": 0.004628247581422329, "global_step": 15016, "epoch": 126, "lr": 9.000750004481337e-05} +{"train_loss": 0.00740327313542366, "global_step": 15017, "epoch": 126, "lr": 9.000617114298133e-05} +{"train_loss": 0.00951759796589613, "global_step": 15018, "epoch": 126, "lr": 9.000484216260144e-05} +{"train_loss": 0.00789585430175066, "global_step": 15019, "epoch": 126, "lr": 9.000351310367631e-05} +{"train_loss": 0.006463537458330393, "global_step": 15020, "epoch": 126, "lr": 9.000218396620857e-05} +{"train_loss": 0.007625466212630272, "global_step": 15021, "epoch": 126, "lr": 9.000085475020081e-05} +{"train_loss": 0.0038177580572664738, "global_step": 15022, "epoch": 126, "lr": 8.999952545565565e-05} +{"train_loss": 0.006039198022335768, "global_step": 15023, "epoch": 126, "lr": 8.999819608257569e-05} +{"train_loss": 0.005929076578468084, "global_step": 15024, "epoch": 126, "lr": 8.999686663096354e-05} +{"train_loss": 0.010296136140823364, "global_step": 15025, "epoch": 126, "lr": 8.999553710082182e-05} +{"train_loss": 0.006550977937877178, "global_step": 15026, "epoch": 126, "lr": 8.999420749215313e-05} +{"train_loss": 0.006941611412912607, "global_step": 15027, "epoch": 126, "lr": 8.999287780496008e-05} +{"train_loss": 0.004445556551218033, "global_step": 15028, "epoch": 126, "lr": 8.99915480392453e-05} +{"train_loss": 0.007964061573147774, "global_step": 15029, "epoch": 126, "lr": 8.999021819501139e-05} +{"train_loss": 0.004827633034437895, "global_step": 15030, "epoch": 126, "lr": 8.998888827226096e-05} +{"train_loss": 0.008251802995800972, "global_step": 15031, "epoch": 126, "lr": 8.998755827099661e-05} +{"train_loss": 0.008138955570757389, "global_step": 15032, "epoch": 126, "lr": 8.998622819122098e-05} +{"train_loss": 0.008946163579821587, "global_step": 15033, "epoch": 126, "lr": 8.998489803293664e-05} +{"train_loss": 0.008465485647320747, "global_step": 15034, "epoch": 126, "lr": 8.998356779614622e-05} +{"train_loss": 0.007666256278753281, "global_step": 15035, "epoch": 126, "lr": 8.998223748085236e-05} +{"train_loss": 0.00805186852812767, "global_step": 15036, "epoch": 126, "lr": 8.998090708705764e-05} +{"train_loss": 0.008520270697772503, "global_step": 15037, "epoch": 126, "lr": 8.997957661476468e-05} +{"train_loss": 0.005817319732159376, "global_step": 15038, "epoch": 126, "lr": 8.997824606397609e-05} +{"train_loss": 0.008258875459432602, "global_step": 15039, "epoch": 126, "lr": 8.997691543469449e-05} +{"train_loss": 0.008635258302092552, "global_step": 15040, "epoch": 126, "lr": 8.997558472692249e-05} +{"train_loss": 0.00630901288241148, "global_step": 15041, "epoch": 126, "lr": 8.997425394066268e-05} +{"train_loss": 0.007676102686673403, "global_step": 15042, "epoch": 126, "lr": 8.997292307591772e-05} +{"train_loss": 0.006917214952409267, "global_step": 15043, "epoch": 126, "lr": 8.997159213269018e-05} +{"train_loss": 0.006117487791925669, "global_step": 15044, "epoch": 126, "lr": 8.997026111098268e-05} +{"train_loss": 0.006594050209969282, "global_step": 15045, "epoch": 126, "lr": 8.996893001079784e-05} +{"train_loss": 0.007713560946285725, "global_step": 15046, "epoch": 126, "lr": 8.99675988321383e-05} +{"train_loss": 0.007495449855923653, "global_step": 15047, "epoch": 126, "lr": 8.996626757500665e-05} +{"train_loss": 0.0048439158126711845, "global_step": 15048, "epoch": 126, "lr": 8.99649362394055e-05} +{"train_loss": 0.003580491989850998, "global_step": 15049, "epoch": 126, "lr": 8.996360482533746e-05} +{"train_loss": 0.008177796378731728, "global_step": 15050, "epoch": 126, "lr": 8.996227333280514e-05} +{"train_loss": 0.006918218918144703, "global_step": 15051, "epoch": 126, "lr": 8.996094176181118e-05} +{"train_loss": 0.004335098899900913, "global_step": 15052, "epoch": 126, "lr": 8.995961011235817e-05} +{"train_loss": 0.008106060326099396, "global_step": 15053, "epoch": 126, "lr": 8.995827838444875e-05} +{"train_loss": 0.005793713498860598, "global_step": 15054, "epoch": 126, "lr": 8.99569465780855e-05} +{"train_loss": 0.005580300465226173, "global_step": 15055, "epoch": 126, "lr": 8.995561469327107e-05} +{"train_loss": 0.004883210640400648, "global_step": 15056, "epoch": 126, "lr": 8.995428273000805e-05} +{"train_loss": 0.007673034910112619, "global_step": 15057, "epoch": 126, "lr": 8.995295068829908e-05} +{"train_loss": 0.006258021574467421, "global_step": 15058, "epoch": 126, "lr": 8.995161856814674e-05} +{"train_loss": 0.008833246305584908, "global_step": 15059, "epoch": 126, "lr": 8.995028636955369e-05} +{"train_loss": 0.0057896580547094345, "global_step": 15060, "epoch": 126, "lr": 8.994895409252249e-05} +{"train_loss": 0.0072964951395988464, "global_step": 15061, "epoch": 126, "lr": 8.99476217370558e-05} +{"train_loss": 0.007909046486020088, "global_step": 15062, "epoch": 126, "lr": 8.994628930315623e-05} +{"train_loss": 0.0070681022480130196, "global_step": 15063, "epoch": 126, "lr": 8.994495679082638e-05} +{"train_loss": 0.007331558503210545, "global_step": 15064, "epoch": 126, "lr": 8.994362420006887e-05} +{"train_loss": 0.004900793079286814, "global_step": 15065, "epoch": 126, "lr": 8.994229153088633e-05} +{"train_loss": 0.008088041096925735, "global_step": 15066, "epoch": 126, "lr": 8.994095878328138e-05} +{"train_loss": 0.005790993105620146, "global_step": 15067, "epoch": 126, "lr": 8.99396259572566e-05} +{"train_loss": 0.004512525629252195, "global_step": 15068, "epoch": 126, "lr": 8.993829305281465e-05} +{"train_loss": 0.005021922290325165, "global_step": 15069, "epoch": 126, "lr": 8.99369600699581e-05} +{"train_loss": 0.006125321611762047, "global_step": 15070, "epoch": 126, "lr": 8.993562700868962e-05} +{"train_loss": 0.005849981214851141, "global_step": 15071, "epoch": 126, "lr": 8.993429386901182e-05} +{"train_loss": 0.006577646359801292, "global_step": 15072, "epoch": 126, "lr": 8.993296065092726e-05} +{"train_loss": 0.008329559117555618, "global_step": 15073, "epoch": 126, "lr": 8.993162735443862e-05} +{"train_loss": 0.006618870422244072, "global_step": 15074, "epoch": 126, "lr": 8.993029397954851e-05} +{"train_loss": 0.006557339336723089, "global_step": 15075, "epoch": 126, "lr": 8.99289605262595e-05} +{"train_loss": 0.004514691419899464, "global_step": 15076, "epoch": 126, "lr": 8.992762699457427e-05} +{"train_loss": 0.010268311947584152, "global_step": 15077, "epoch": 126, "lr": 8.992629338449539e-05} +{"train_loss": 0.007098993752151728, "global_step": 15078, "epoch": 126, "lr": 8.992495969602552e-05} +{"train_loss": 0.006943041924387217, "global_step": 15079, "epoch": 126, "lr": 8.992362592916723e-05} +{"train_loss": 0.005818914156407118, "global_step": 15080, "epoch": 126, "lr": 8.992229208392318e-05} +{"train_loss": 0.007099183741956949, "global_step": 15081, "epoch": 126, "lr": 8.992095816029597e-05} +{"train_loss": 0.006289518438279629, "global_step": 15082, "epoch": 126, "lr": 8.991962415828822e-05} +{"train_loss": 0.004326925612986088, "global_step": 15083, "epoch": 126, "lr": 8.991829007790258e-05} +{"train_loss": 0.0062694791704416275, "global_step": 15084, "epoch": 126, "lr": 8.991695591914162e-05} +{"train_loss": 0.0060487049631774426, "global_step": 15085, "epoch": 126, "lr": 8.991562168200798e-05} +{"train_loss": 0.00832018256187439, "global_step": 15086, "epoch": 126, "lr": 8.99142873665043e-05} +{"train_loss": 0.0069621866568923, "global_step": 15087, "epoch": 126, "lr": 8.991295297263315e-05} +{"train_loss": 0.00732151884585619, "global_step": 15088, "epoch": 126, "lr": 8.991161850039719e-05} +{"train_loss": 0.005094176158308983, "global_step": 15089, "epoch": 126, "lr": 8.991028394979904e-05} +{"train_loss": 0.005588687025010586, "global_step": 15090, "epoch": 126, "lr": 8.990894932084132e-05} +{"train_loss": 0.005305266939103603, "global_step": 15091, "epoch": 126, "lr": 8.990761461352664e-05} +{"train_loss": 0.005662194453179836, "global_step": 15092, "epoch": 126, "lr": 8.99062798278576e-05} +{"train_loss": 0.006455053575336933, "global_step": 15093, "epoch": 126, "lr": 8.990494496383686e-05} +{"train_loss": 0.005171490833163261, "global_step": 15094, "epoch": 126, "lr": 8.990361002146701e-05} +{"train_loss": 0.008286308497190475, "global_step": 15095, "epoch": 126, "lr": 8.990227500075071e-05} +{"train_loss": 0.008744843304157257, "global_step": 15096, "epoch": 126, "lr": 8.990093990169052e-05} +{"train_loss": 0.007729731500148773, "global_step": 15097, "epoch": 126, "lr": 8.989960472428913e-05} +{"train_loss": 0.005039909854531288, "global_step": 15098, "epoch": 126, "lr": 8.989826946854912e-05} +{"train_loss": 0.007227536756545305, "global_step": 15099, "epoch": 126, "lr": 8.989693413447311e-05} +{"train_loss": 0.004682318773120642, "global_step": 15100, "epoch": 126, "lr": 8.989559872206374e-05} +{"train_loss": 0.008114811033010483, "global_step": 15101, "epoch": 126, "lr": 8.989426323132361e-05} +{"train_loss": 0.00322991656139493, "global_step": 15102, "epoch": 126, "lr": 8.989292766225539e-05} +{"train_loss": 0.005101291928440332, "global_step": 15103, "epoch": 126, "lr": 8.989159201486164e-05} +{"train_loss": 0.007172927726060152, "global_step": 15104, "epoch": 126, "lr": 8.989025628914503e-05} +{"train_loss": 0.00503695011138916, "global_step": 15105, "epoch": 126, "lr": 8.988892048510814e-05} +{"train_loss": 0.006249213591217995, "global_step": 15106, "epoch": 126, "lr": 8.988758460275363e-05} +{"train_loss": 0.008828987367451191, "global_step": 15107, "epoch": 126, "lr": 8.988624864208411e-05} +{"train_loss": 0.00742453895509243, "global_step": 15108, "epoch": 126, "lr": 8.98849126031022e-05} +{"train_loss": 0.005853989627212286, "global_step": 15109, "epoch": 126, "lr": 8.988357648581051e-05} +{"train_loss": 0.006487550679594278, "global_step": 15110, "epoch": 126, "lr": 8.988224029021171e-05} +{"train_loss": 0.007910127751529217, "global_step": 15111, "epoch": 126, "lr": 8.988090401630837e-05} +{"train_loss": 0.006692323051079982, "global_step": 15112, "epoch": 126, "lr": 8.987956766410315e-05, "val_loss": 0.01177135482430458} +{"train_loss": 0.011830913834273815, "global_step": 15113, "epoch": 127, "lr": 8.987823123359864e-05} +{"train_loss": 0.007608817424625158, "global_step": 15114, "epoch": 127, "lr": 8.98768947247975e-05} +{"train_loss": 0.006536906119436026, "global_step": 15115, "epoch": 127, "lr": 8.987555813770233e-05} +{"train_loss": 0.01025943923741579, "global_step": 15116, "epoch": 127, "lr": 8.987422147231576e-05} +{"train_loss": 0.005949003621935844, "global_step": 15117, "epoch": 127, "lr": 8.987288472864042e-05} +{"train_loss": 0.008829544298350811, "global_step": 15118, "epoch": 127, "lr": 8.987154790667894e-05} +{"train_loss": 0.005994149949401617, "global_step": 15119, "epoch": 127, "lr": 8.987021100643392e-05} +{"train_loss": 0.008913540281355381, "global_step": 15120, "epoch": 127, "lr": 8.9868874027908e-05} +{"train_loss": 0.007876455783843994, "global_step": 15121, "epoch": 127, "lr": 8.986753697110381e-05} +{"train_loss": 0.0044958461076021194, "global_step": 15122, "epoch": 127, "lr": 8.986619983602397e-05} +{"train_loss": 0.007482356391847134, "global_step": 15123, "epoch": 127, "lr": 8.986486262267111e-05} +{"train_loss": 0.008974440395832062, "global_step": 15124, "epoch": 127, "lr": 8.986352533104784e-05} +{"train_loss": 0.007183023262768984, "global_step": 15125, "epoch": 127, "lr": 8.986218796115681e-05} +{"train_loss": 0.005440332926809788, "global_step": 15126, "epoch": 127, "lr": 8.986085051300061e-05} +{"train_loss": 0.006323272828012705, "global_step": 15127, "epoch": 127, "lr": 8.98595129865819e-05} +{"train_loss": 0.006251405458897352, "global_step": 15128, "epoch": 127, "lr": 8.985817538190331e-05} +{"train_loss": 0.004745314363390207, "global_step": 15129, "epoch": 127, "lr": 8.985683769896745e-05} +{"train_loss": 0.006284089293330908, "global_step": 15130, "epoch": 127, "lr": 8.985549993777693e-05} +{"train_loss": 0.0057157669216394424, "global_step": 15131, "epoch": 127, "lr": 8.985416209833441e-05} +{"train_loss": 0.006263092625886202, "global_step": 15132, "epoch": 127, "lr": 8.98528241806425e-05} +{"train_loss": 0.007619858719408512, "global_step": 15133, "epoch": 127, "lr": 8.98514861847038e-05} +{"train_loss": 0.0050871288403868675, "global_step": 15134, "epoch": 127, "lr": 8.985014811052099e-05} +{"train_loss": 0.005835163872689009, "global_step": 15135, "epoch": 127, "lr": 8.984880995809667e-05} +{"train_loss": 0.007521284278482199, "global_step": 15136, "epoch": 127, "lr": 8.984747172743346e-05} +{"train_loss": 0.008554408326745033, "global_step": 15137, "epoch": 127, "lr": 8.984613341853401e-05} +{"train_loss": 0.009418437257409096, "global_step": 15138, "epoch": 127, "lr": 8.984479503140092e-05} +{"train_loss": 0.009214174933731556, "global_step": 15139, "epoch": 127, "lr": 8.984345656603684e-05} +{"train_loss": 0.00508596608415246, "global_step": 15140, "epoch": 127, "lr": 8.984211802244438e-05} +{"train_loss": 0.005813837517052889, "global_step": 15141, "epoch": 127, "lr": 8.984077940062619e-05} +{"train_loss": 0.004310301039367914, "global_step": 15142, "epoch": 127, "lr": 8.983944070058488e-05} +{"train_loss": 0.006209838204085827, "global_step": 15143, "epoch": 127, "lr": 8.983810192232307e-05} +{"train_loss": 0.008244108408689499, "global_step": 15144, "epoch": 127, "lr": 8.983676306584343e-05} +{"train_loss": 0.0055467053316533566, "global_step": 15145, "epoch": 127, "lr": 8.983542413114853e-05} +{"train_loss": 0.006055756472051144, "global_step": 15146, "epoch": 127, "lr": 8.983408511824106e-05} +{"train_loss": 0.005640750750899315, "global_step": 15147, "epoch": 127, "lr": 8.983274602712361e-05} +{"train_loss": 0.005057153757661581, "global_step": 15148, "epoch": 127, "lr": 8.983140685779882e-05} +{"train_loss": 0.008528594858944416, "global_step": 15149, "epoch": 127, "lr": 8.983006761026931e-05} +{"train_loss": 0.006611612159758806, "global_step": 15150, "epoch": 127, "lr": 8.982872828453772e-05} +{"train_loss": 0.007921192795038223, "global_step": 15151, "epoch": 127, "lr": 8.982738888060669e-05} +{"train_loss": 0.004237163811922073, "global_step": 15152, "epoch": 127, "lr": 8.982604939847883e-05} +{"train_loss": 0.006271301303058863, "global_step": 15153, "epoch": 127, "lr": 8.982470983815676e-05} +{"train_loss": 0.008547781966626644, "global_step": 15154, "epoch": 127, "lr": 8.982337019964315e-05} +{"train_loss": 0.005432776175439358, "global_step": 15155, "epoch": 127, "lr": 8.98220304829406e-05} +{"train_loss": 0.007432359270751476, "global_step": 15156, "epoch": 127, "lr": 8.982069068805175e-05} +{"train_loss": 0.007372998632490635, "global_step": 15157, "epoch": 127, "lr": 8.981935081497921e-05} +{"train_loss": 0.008579416200518608, "global_step": 15158, "epoch": 127, "lr": 8.981801086372565e-05} +{"train_loss": 0.005388795398175716, "global_step": 15159, "epoch": 127, "lr": 8.981667083429367e-05} +{"train_loss": 0.007013456430286169, "global_step": 15160, "epoch": 127, "lr": 8.981533072668591e-05} +{"train_loss": 0.0075479247607290745, "global_step": 15161, "epoch": 127, "lr": 8.9813990540905e-05} +{"train_loss": 0.006808108650147915, "global_step": 15162, "epoch": 127, "lr": 8.981265027695358e-05} +{"train_loss": 0.006452708039432764, "global_step": 15163, "epoch": 127, "lr": 8.981130993483428e-05} +{"train_loss": 0.007717700209468603, "global_step": 15164, "epoch": 127, "lr": 8.980996951454972e-05} +{"train_loss": 0.005598882678896189, "global_step": 15165, "epoch": 127, "lr": 8.980862901610253e-05} +{"train_loss": 0.006399114616215229, "global_step": 15166, "epoch": 127, "lr": 8.980728843949535e-05} +{"train_loss": 0.007205592002719641, "global_step": 15167, "epoch": 127, "lr": 8.980594778473081e-05} +{"train_loss": 0.004224543925374746, "global_step": 15168, "epoch": 127, "lr": 8.980460705181155e-05} +{"train_loss": 0.007986967451870441, "global_step": 15169, "epoch": 127, "lr": 8.980326624074021e-05} +{"train_loss": 0.007897162809967995, "global_step": 15170, "epoch": 127, "lr": 8.980192535151938e-05} +{"train_loss": 0.01228010281920433, "global_step": 15171, "epoch": 127, "lr": 8.980058438415175e-05} +{"train_loss": 0.005543618928641081, "global_step": 15172, "epoch": 127, "lr": 8.979924333863991e-05} +{"train_loss": 0.008204965852200985, "global_step": 15173, "epoch": 127, "lr": 8.979790221498651e-05} +{"train_loss": 0.006960841361433268, "global_step": 15174, "epoch": 127, "lr": 8.979656101319418e-05} +{"train_loss": 0.007763837464153767, "global_step": 15175, "epoch": 127, "lr": 8.979521973326556e-05} +{"train_loss": 0.00964881107211113, "global_step": 15176, "epoch": 127, "lr": 8.979387837520327e-05} +{"train_loss": 0.0076245879754424095, "global_step": 15177, "epoch": 127, "lr": 8.979253693900996e-05} +{"train_loss": 0.006795097608119249, "global_step": 15178, "epoch": 127, "lr": 8.979119542468825e-05} +{"train_loss": 0.00841079093515873, "global_step": 15179, "epoch": 127, "lr": 8.97898538322408e-05} +{"train_loss": 0.010135617107152939, "global_step": 15180, "epoch": 127, "lr": 8.978851216167019e-05} +{"train_loss": 0.007316636852920055, "global_step": 15181, "epoch": 127, "lr": 8.978717041297911e-05} +{"train_loss": 0.008720316924154758, "global_step": 15182, "epoch": 127, "lr": 8.978582858617016e-05} +{"train_loss": 0.007903854362666607, "global_step": 15183, "epoch": 127, "lr": 8.978448668124597e-05} +{"train_loss": 0.007853090763092041, "global_step": 15184, "epoch": 127, "lr": 8.978314469820922e-05} +{"train_loss": 0.006503840908408165, "global_step": 15185, "epoch": 127, "lr": 8.978180263706249e-05} +{"train_loss": 0.005512543488293886, "global_step": 15186, "epoch": 127, "lr": 8.978046049780846e-05} +{"train_loss": 0.00867028720676899, "global_step": 15187, "epoch": 127, "lr": 8.977911828044973e-05} +{"train_loss": 0.00809023529291153, "global_step": 15188, "epoch": 127, "lr": 8.977777598498897e-05} +{"train_loss": 0.008621646091341972, "global_step": 15189, "epoch": 127, "lr": 8.977643361142877e-05} +{"train_loss": 0.010731345042586327, "global_step": 15190, "epoch": 127, "lr": 8.977509115977183e-05} +{"train_loss": 0.005998322740197182, "global_step": 15191, "epoch": 127, "lr": 8.977374863002071e-05} +{"train_loss": 0.00765692675486207, "global_step": 15192, "epoch": 127, "lr": 8.97724060221781e-05} +{"train_loss": 0.007482060231268406, "global_step": 15193, "epoch": 127, "lr": 8.977106333624663e-05} +{"train_loss": 0.01070153247565031, "global_step": 15194, "epoch": 127, "lr": 8.97697205722289e-05} +{"train_loss": 0.008101584389805794, "global_step": 15195, "epoch": 127, "lr": 8.976837773012761e-05} +{"train_loss": 0.008729993365705013, "global_step": 15196, "epoch": 127, "lr": 8.976703480994533e-05} +{"train_loss": 0.008100136183202267, "global_step": 15197, "epoch": 127, "lr": 8.976569181168473e-05} +{"train_loss": 0.009671688079833984, "global_step": 15198, "epoch": 127, "lr": 8.976434873534845e-05} +{"train_loss": 0.008665081113576889, "global_step": 15199, "epoch": 127, "lr": 8.976300558093911e-05} +{"train_loss": 0.006379168014973402, "global_step": 15200, "epoch": 127, "lr": 8.976166234845936e-05} +{"train_loss": 0.00804360955953598, "global_step": 15201, "epoch": 127, "lr": 8.976031903791185e-05} +{"train_loss": 0.0054998197592794895, "global_step": 15202, "epoch": 127, "lr": 8.975897564929917e-05} +{"train_loss": 0.010033868253231049, "global_step": 15203, "epoch": 127, "lr": 8.975763218262401e-05} +{"train_loss": 0.008436045609414577, "global_step": 15204, "epoch": 127, "lr": 8.975628863788898e-05} +{"train_loss": 0.00865692924708128, "global_step": 15205, "epoch": 127, "lr": 8.975494501509674e-05} +{"train_loss": 0.007060815580189228, "global_step": 15206, "epoch": 127, "lr": 8.975360131424989e-05} +{"train_loss": 0.008524170145392418, "global_step": 15207, "epoch": 127, "lr": 8.975225753535111e-05} +{"train_loss": 0.007351638749241829, "global_step": 15208, "epoch": 127, "lr": 8.975091367840301e-05} +{"train_loss": 0.010766887106001377, "global_step": 15209, "epoch": 127, "lr": 8.974956974340822e-05} +{"train_loss": 0.006464442238211632, "global_step": 15210, "epoch": 127, "lr": 8.974822573036942e-05} +{"train_loss": 0.007073547691106796, "global_step": 15211, "epoch": 127, "lr": 8.974688163928922e-05} +{"train_loss": 0.007002608850598335, "global_step": 15212, "epoch": 127, "lr": 8.974553747017027e-05} +{"train_loss": 0.005110570695251226, "global_step": 15213, "epoch": 127, "lr": 8.97441932230152e-05} +{"train_loss": 0.007959899492561817, "global_step": 15214, "epoch": 127, "lr": 8.974284889782665e-05} +{"train_loss": 0.006631735246628523, "global_step": 15215, "epoch": 127, "lr": 8.974150449460726e-05} +{"train_loss": 0.011169034987688065, "global_step": 15216, "epoch": 127, "lr": 8.974016001335966e-05} +{"train_loss": 0.004668215289711952, "global_step": 15217, "epoch": 127, "lr": 8.973881545408651e-05} +{"train_loss": 0.00704410532489419, "global_step": 15218, "epoch": 127, "lr": 8.973747081679045e-05} +{"train_loss": 0.007503144908696413, "global_step": 15219, "epoch": 127, "lr": 8.973612610147411e-05} +{"train_loss": 0.007464607246220112, "global_step": 15220, "epoch": 127, "lr": 8.973478130814013e-05} +{"train_loss": 0.009402362629771233, "global_step": 15221, "epoch": 127, "lr": 8.973343643679116e-05} +{"train_loss": 0.007603751961141825, "global_step": 15222, "epoch": 127, "lr": 8.973209148742982e-05} +{"train_loss": 0.006041919346898794, "global_step": 15223, "epoch": 127, "lr": 8.973074646005877e-05} +{"train_loss": 0.008385341614484787, "global_step": 15224, "epoch": 127, "lr": 8.972940135468063e-05} +{"train_loss": 0.007728519383817911, "global_step": 15225, "epoch": 127, "lr": 8.972805617129807e-05} +{"train_loss": 0.007826020009815693, "global_step": 15226, "epoch": 127, "lr": 8.972671090991372e-05} +{"train_loss": 0.005220444407314062, "global_step": 15227, "epoch": 127, "lr": 8.97253655705302e-05} +{"train_loss": 0.0113550815731287, "global_step": 15228, "epoch": 127, "lr": 8.972402015315018e-05} +{"train_loss": 0.007158588618040085, "global_step": 15229, "epoch": 127, "lr": 8.972267465777628e-05} +{"train_loss": 0.008811975829303265, "global_step": 15230, "epoch": 127, "lr": 8.972132908441116e-05} +{"train_loss": 0.007426758735057186, "global_step": 15231, "epoch": 127, "lr": 8.971998343305745e-05, "val_loss": 0.02130655013024807} +{"train_loss": 0.005498027894645929, "global_step": 15232, "epoch": 128, "lr": 8.97186377037178e-05} +{"train_loss": 0.004990497138351202, "global_step": 15233, "epoch": 128, "lr": 8.971729189639485e-05} +{"train_loss": 0.009767085313796997, "global_step": 15234, "epoch": 128, "lr": 8.971594601109123e-05} +{"train_loss": 0.005174120422452688, "global_step": 15235, "epoch": 128, "lr": 8.97146000478096e-05} +{"train_loss": 0.00972312968224287, "global_step": 15236, "epoch": 128, "lr": 8.971325400655261e-05} +{"train_loss": 0.00728315394371748, "global_step": 15237, "epoch": 128, "lr": 8.971190788732288e-05} +{"train_loss": 0.009833362884819508, "global_step": 15238, "epoch": 128, "lr": 8.971056169012305e-05} +{"train_loss": 0.006640114355832338, "global_step": 15239, "epoch": 128, "lr": 8.970921541495579e-05} +{"train_loss": 0.008373932912945747, "global_step": 15240, "epoch": 128, "lr": 8.970786906182371e-05} +{"train_loss": 0.006554754916578531, "global_step": 15241, "epoch": 128, "lr": 8.970652263072949e-05} +{"train_loss": 0.007617427501827478, "global_step": 15242, "epoch": 128, "lr": 8.970517612167574e-05} +{"train_loss": 0.0055636572651565075, "global_step": 15243, "epoch": 128, "lr": 8.970382953466511e-05} +{"train_loss": 0.00694179255515337, "global_step": 15244, "epoch": 128, "lr": 8.970248286970028e-05} +{"train_loss": 0.007975654676556587, "global_step": 15245, "epoch": 128, "lr": 8.970113612678386e-05} +{"train_loss": 0.007206938229501247, "global_step": 15246, "epoch": 128, "lr": 8.969978930591849e-05} +{"train_loss": 0.004646401386708021, "global_step": 15247, "epoch": 128, "lr": 8.969844240710683e-05} +{"train_loss": 0.007880764082074165, "global_step": 15248, "epoch": 128, "lr": 8.969709543035152e-05} +{"train_loss": 0.008547760546207428, "global_step": 15249, "epoch": 128, "lr": 8.96957483756552e-05} +{"train_loss": 0.006548566278070211, "global_step": 15250, "epoch": 128, "lr": 8.969440124302051e-05} +{"train_loss": 0.0069890134036540985, "global_step": 15251, "epoch": 128, "lr": 8.969305403245011e-05} +{"train_loss": 0.008049827069044113, "global_step": 15252, "epoch": 128, "lr": 8.969170674394664e-05} +{"train_loss": 0.006700893398374319, "global_step": 15253, "epoch": 128, "lr": 8.969035937751275e-05} +{"train_loss": 0.007188112009316683, "global_step": 15254, "epoch": 128, "lr": 8.96890119331511e-05} +{"train_loss": 0.006598492152988911, "global_step": 15255, "epoch": 128, "lr": 8.968766441086428e-05} +{"train_loss": 0.008212503045797348, "global_step": 15256, "epoch": 128, "lr": 8.968631681065499e-05} +{"train_loss": 0.008922796696424484, "global_step": 15257, "epoch": 128, "lr": 8.968496913252585e-05} +{"train_loss": 0.009532731026411057, "global_step": 15258, "epoch": 128, "lr": 8.968362137647951e-05} +{"train_loss": 0.004415011499077082, "global_step": 15259, "epoch": 128, "lr": 8.968227354251862e-05} +{"train_loss": 0.01071514654904604, "global_step": 15260, "epoch": 128, "lr": 8.968092563064583e-05} +{"train_loss": 0.007179462816566229, "global_step": 15261, "epoch": 128, "lr": 8.967957764086379e-05} +{"train_loss": 0.008819658309221268, "global_step": 15262, "epoch": 128, "lr": 8.96782295731751e-05} +{"train_loss": 0.004522956907749176, "global_step": 15263, "epoch": 128, "lr": 8.967688142758249e-05} +{"train_loss": 0.01065948698669672, "global_step": 15264, "epoch": 128, "lr": 8.967553320408855e-05} +{"train_loss": 0.010448423214256763, "global_step": 15265, "epoch": 128, "lr": 8.967418490269593e-05} +{"train_loss": 0.006743880454450846, "global_step": 15266, "epoch": 128, "lr": 8.96728365234073e-05} +{"train_loss": 0.006470875348895788, "global_step": 15267, "epoch": 128, "lr": 8.967148806622527e-05} +{"train_loss": 0.008580036461353302, "global_step": 15268, "epoch": 128, "lr": 8.967013953115253e-05} +{"train_loss": 0.007807084824889898, "global_step": 15269, "epoch": 128, "lr": 8.966879091819171e-05} +{"train_loss": 0.010283753275871277, "global_step": 15270, "epoch": 128, "lr": 8.966744222734545e-05} +{"train_loss": 0.009046854451298714, "global_step": 15271, "epoch": 128, "lr": 8.966609345861641e-05} +{"train_loss": 0.009486299008131027, "global_step": 15272, "epoch": 128, "lr": 8.966474461200724e-05} +{"train_loss": 0.004789062775671482, "global_step": 15273, "epoch": 128, "lr": 8.966339568752056e-05} +{"train_loss": 0.009614897891879082, "global_step": 15274, "epoch": 128, "lr": 8.966204668515906e-05} +{"train_loss": 0.008866974152624607, "global_step": 15275, "epoch": 128, "lr": 8.966069760492536e-05} +{"train_loss": 0.006141982041299343, "global_step": 15276, "epoch": 128, "lr": 8.965934844682211e-05} +{"train_loss": 0.0064816540107131, "global_step": 15277, "epoch": 128, "lr": 8.965799921085198e-05} +{"train_loss": 0.010625452734529972, "global_step": 15278, "epoch": 128, "lr": 8.965664989701761e-05} +{"train_loss": 0.005298907402902842, "global_step": 15279, "epoch": 128, "lr": 8.965530050532163e-05} +{"train_loss": 0.007579827215522528, "global_step": 15280, "epoch": 128, "lr": 8.96539510357667e-05} +{"train_loss": 0.006887797731906176, "global_step": 15281, "epoch": 128, "lr": 8.965260148835549e-05} +{"train_loss": 0.0062165879644453526, "global_step": 15282, "epoch": 128, "lr": 8.965125186309062e-05} +{"train_loss": 0.006335539743304253, "global_step": 15283, "epoch": 128, "lr": 8.964990215997476e-05} +{"train_loss": 0.007923750206828117, "global_step": 15284, "epoch": 128, "lr": 8.964855237901055e-05} +{"train_loss": 0.006290498189628124, "global_step": 15285, "epoch": 128, "lr": 8.964720252020065e-05} +{"train_loss": 0.007317283656448126, "global_step": 15286, "epoch": 128, "lr": 8.964585258354769e-05} +{"train_loss": 0.010194316506385803, "global_step": 15287, "epoch": 128, "lr": 8.964450256905435e-05} +{"train_loss": 0.0060145496390759945, "global_step": 15288, "epoch": 128, "lr": 8.964315247672326e-05} +{"train_loss": 0.005163712427020073, "global_step": 15289, "epoch": 128, "lr": 8.964180230655708e-05} +{"train_loss": 0.006011513527482748, "global_step": 15290, "epoch": 128, "lr": 8.964045205855845e-05} +{"train_loss": 0.00801900215446949, "global_step": 15291, "epoch": 128, "lr": 8.963910173273003e-05} +{"train_loss": 0.007900020107626915, "global_step": 15292, "epoch": 128, "lr": 8.963775132907444e-05} +{"train_loss": 0.00505181634798646, "global_step": 15293, "epoch": 128, "lr": 8.96364008475944e-05} +{"train_loss": 0.00884301494807005, "global_step": 15294, "epoch": 128, "lr": 8.963505028829251e-05} +{"train_loss": 0.004759429022669792, "global_step": 15295, "epoch": 128, "lr": 8.963369965117142e-05} +{"train_loss": 0.007993756793439388, "global_step": 15296, "epoch": 128, "lr": 8.96323489362338e-05} +{"train_loss": 0.011137166060507298, "global_step": 15297, "epoch": 128, "lr": 8.96309981434823e-05} +{"train_loss": 0.00845871027559042, "global_step": 15298, "epoch": 128, "lr": 8.962964727291958e-05} +{"train_loss": 0.008741424418985844, "global_step": 15299, "epoch": 128, "lr": 8.962829632454828e-05} +{"train_loss": 0.004626489244401455, "global_step": 15300, "epoch": 128, "lr": 8.962694529837103e-05} +{"train_loss": 0.006388990208506584, "global_step": 15301, "epoch": 128, "lr": 8.962559419439053e-05} +{"train_loss": 0.004301175475120544, "global_step": 15302, "epoch": 128, "lr": 8.962424301260939e-05} +{"train_loss": 0.006406782194972038, "global_step": 15303, "epoch": 128, "lr": 8.962289175303031e-05} +{"train_loss": 0.005742404144257307, "global_step": 15304, "epoch": 128, "lr": 8.96215404156559e-05} +{"train_loss": 0.006538651417940855, "global_step": 15305, "epoch": 128, "lr": 8.96201890004888e-05} +{"train_loss": 0.005255596246570349, "global_step": 15306, "epoch": 128, "lr": 8.961883750753174e-05} +{"train_loss": 0.0051859356462955475, "global_step": 15307, "epoch": 128, "lr": 8.961748593678729e-05} +{"train_loss": 0.006061469204723835, "global_step": 15308, "epoch": 128, "lr": 8.961613428825816e-05} +{"train_loss": 0.005875505972653627, "global_step": 15309, "epoch": 128, "lr": 8.961478256194698e-05} +{"train_loss": 0.006620559375733137, "global_step": 15310, "epoch": 128, "lr": 8.96134307578564e-05} +{"train_loss": 0.009262831881642342, "global_step": 15311, "epoch": 128, "lr": 8.961207887598908e-05} +{"train_loss": 0.009842951782047749, "global_step": 15312, "epoch": 128, "lr": 8.961072691634768e-05} +{"train_loss": 0.007534781005233526, "global_step": 15313, "epoch": 128, "lr": 8.960937487893484e-05} +{"train_loss": 0.006767261773347855, "global_step": 15314, "epoch": 128, "lr": 8.960802276375324e-05} +{"train_loss": 0.008705212734639645, "global_step": 15315, "epoch": 128, "lr": 8.96066705708055e-05} +{"train_loss": 0.005538784433156252, "global_step": 15316, "epoch": 128, "lr": 8.960531830009431e-05} +{"train_loss": 0.005535826552659273, "global_step": 15317, "epoch": 128, "lr": 8.960396595162231e-05} +{"train_loss": 0.0058380854316055775, "global_step": 15318, "epoch": 128, "lr": 8.960261352539213e-05} +{"train_loss": 0.006509328261017799, "global_step": 15319, "epoch": 128, "lr": 8.960126102140647e-05} +{"train_loss": 0.0060947369784116745, "global_step": 15320, "epoch": 128, "lr": 8.959990843966797e-05} +{"train_loss": 0.006204984150826931, "global_step": 15321, "epoch": 128, "lr": 8.959855578017926e-05} +{"train_loss": 0.011225858703255653, "global_step": 15322, "epoch": 128, "lr": 8.959720304294303e-05} +{"train_loss": 0.007842163555324078, "global_step": 15323, "epoch": 128, "lr": 8.959585022796191e-05} +{"train_loss": 0.00786827877163887, "global_step": 15324, "epoch": 128, "lr": 8.959449733523858e-05} +{"train_loss": 0.008468023501336575, "global_step": 15325, "epoch": 128, "lr": 8.959314436477569e-05} +{"train_loss": 0.007286901120096445, "global_step": 15326, "epoch": 128, "lr": 8.959179131657588e-05} +{"train_loss": 0.00889643281698227, "global_step": 15327, "epoch": 128, "lr": 8.959043819064181e-05} +{"train_loss": 0.006742299068719149, "global_step": 15328, "epoch": 128, "lr": 8.958908498697617e-05} +{"train_loss": 0.007693406194448471, "global_step": 15329, "epoch": 128, "lr": 8.958773170558156e-05} +{"train_loss": 0.008979340083897114, "global_step": 15330, "epoch": 128, "lr": 8.958637834646068e-05} +{"train_loss": 0.006494377739727497, "global_step": 15331, "epoch": 128, "lr": 8.95850249096162e-05} +{"train_loss": 0.006368877831846476, "global_step": 15332, "epoch": 128, "lr": 8.958367139505073e-05} +{"train_loss": 0.008225679397583008, "global_step": 15333, "epoch": 128, "lr": 8.958231780276694e-05} +{"train_loss": 0.005723923910409212, "global_step": 15334, "epoch": 128, "lr": 8.958096413276751e-05} +{"train_loss": 0.00656494963914156, "global_step": 15335, "epoch": 128, "lr": 8.957961038505509e-05} +{"train_loss": 0.00714110815897584, "global_step": 15336, "epoch": 128, "lr": 8.957825655963232e-05} +{"train_loss": 0.0056728096678853035, "global_step": 15337, "epoch": 128, "lr": 8.95769026565019e-05} +{"train_loss": 0.006261793896555901, "global_step": 15338, "epoch": 128, "lr": 8.957554867566643e-05} +{"train_loss": 0.005275722127407789, "global_step": 15339, "epoch": 128, "lr": 8.957419461712861e-05} +{"train_loss": 0.007083880715072155, "global_step": 15340, "epoch": 128, "lr": 8.957284048089108e-05} +{"train_loss": 0.005534063093364239, "global_step": 15341, "epoch": 128, "lr": 8.957148626695651e-05} +{"train_loss": 0.007193480618298054, "global_step": 15342, "epoch": 128, "lr": 8.957013197532756e-05} +{"train_loss": 0.008383258245885372, "global_step": 15343, "epoch": 128, "lr": 8.956877760600687e-05} +{"train_loss": 0.006924180313944817, "global_step": 15344, "epoch": 128, "lr": 8.956742315899713e-05} +{"train_loss": 0.007534930016845465, "global_step": 15345, "epoch": 128, "lr": 8.956606863430098e-05} +{"train_loss": 0.007573109585791826, "global_step": 15346, "epoch": 128, "lr": 8.956471403192106e-05} +{"train_loss": 0.004969524685293436, "global_step": 15347, "epoch": 128, "lr": 8.956335935186006e-05} +{"train_loss": 0.007256964221596718, "global_step": 15348, "epoch": 128, "lr": 8.956200459412064e-05} +{"train_loss": 0.010298985056579113, "global_step": 15349, "epoch": 128, "lr": 8.956064975870543e-05} +{"train_loss": 0.007265958903717394, "global_step": 15350, "epoch": 128, "lr": 8.955929484561713e-05, "val_loss": 0.014723161235451698} +{"train_loss": 0.007481418550014496, "global_step": 15351, "epoch": 129, "lr": 8.955793985485839e-05} +{"train_loss": 0.0051793623715639114, "global_step": 15352, "epoch": 129, "lr": 8.955658478643185e-05} +{"train_loss": 0.005452747922390699, "global_step": 15353, "epoch": 129, "lr": 8.955522964034018e-05} +{"train_loss": 0.0065515777096152306, "global_step": 15354, "epoch": 129, "lr": 8.955387441658604e-05} +{"train_loss": 0.006429681554436684, "global_step": 15355, "epoch": 129, "lr": 8.95525191151721e-05} +{"train_loss": 0.004320734646171331, "global_step": 15356, "epoch": 129, "lr": 8.9551163736101e-05} +{"train_loss": 0.004764236509799957, "global_step": 15357, "epoch": 129, "lr": 8.954980827937543e-05} +{"train_loss": 0.005224613938480616, "global_step": 15358, "epoch": 129, "lr": 8.954845274499803e-05} +{"train_loss": 0.006350222509354353, "global_step": 15359, "epoch": 129, "lr": 8.954709713297147e-05} +{"train_loss": 0.007648272439837456, "global_step": 15360, "epoch": 129, "lr": 8.954574144329841e-05} +{"train_loss": 0.005343867465853691, "global_step": 15361, "epoch": 129, "lr": 8.954438567598152e-05} +{"train_loss": 0.003851199522614479, "global_step": 15362, "epoch": 129, "lr": 8.954302983102343e-05} +{"train_loss": 0.0072931814938783646, "global_step": 15363, "epoch": 129, "lr": 8.954167390842685e-05} +{"train_loss": 0.009234360419213772, "global_step": 15364, "epoch": 129, "lr": 8.95403179081944e-05} +{"train_loss": 0.007280188146978617, "global_step": 15365, "epoch": 129, "lr": 8.953896183032877e-05} +{"train_loss": 0.008487481623888016, "global_step": 15366, "epoch": 129, "lr": 8.953760567483261e-05} +{"train_loss": 0.0055061099119484425, "global_step": 15367, "epoch": 129, "lr": 8.95362494417086e-05} +{"train_loss": 0.0069876303896307945, "global_step": 15368, "epoch": 129, "lr": 8.953489313095937e-05} +{"train_loss": 0.0067785633727908134, "global_step": 15369, "epoch": 129, "lr": 8.95335367425876e-05} +{"train_loss": 0.012544835917651653, "global_step": 15370, "epoch": 129, "lr": 8.953218027659596e-05} +{"train_loss": 0.003631288418546319, "global_step": 15371, "epoch": 129, "lr": 8.953082373298711e-05} +{"train_loss": 0.005836846772581339, "global_step": 15372, "epoch": 129, "lr": 8.952946711176371e-05} +{"train_loss": 0.0064325216226279736, "global_step": 15373, "epoch": 129, "lr": 8.952811041292841e-05} +{"train_loss": 0.007760205771774054, "global_step": 15374, "epoch": 129, "lr": 8.95267536364839e-05} +{"train_loss": 0.008350846357643604, "global_step": 15375, "epoch": 129, "lr": 8.952539678243283e-05} +{"train_loss": 0.007362652570009232, "global_step": 15376, "epoch": 129, "lr": 8.952403985077788e-05} +{"train_loss": 0.00701654190197587, "global_step": 15377, "epoch": 129, "lr": 8.952268284152168e-05} +{"train_loss": 0.0077154310420155525, "global_step": 15378, "epoch": 129, "lr": 8.952132575466693e-05} +{"train_loss": 0.0061298999935388565, "global_step": 15379, "epoch": 129, "lr": 8.951996859021627e-05} +{"train_loss": 0.008471335284411907, "global_step": 15380, "epoch": 129, "lr": 8.951861134817238e-05} +{"train_loss": 0.009594714269042015, "global_step": 15381, "epoch": 129, "lr": 8.95172540285379e-05} +{"train_loss": 0.004170962609350681, "global_step": 15382, "epoch": 129, "lr": 8.951589663131553e-05} +{"train_loss": 0.00518567580729723, "global_step": 15383, "epoch": 129, "lr": 8.951453915650792e-05} +{"train_loss": 0.008391238749027252, "global_step": 15384, "epoch": 129, "lr": 8.951318160411773e-05} +{"train_loss": 0.007742198649793863, "global_step": 15385, "epoch": 129, "lr": 8.951182397414764e-05} +{"train_loss": 0.008084814064204693, "global_step": 15386, "epoch": 129, "lr": 8.95104662666003e-05} +{"train_loss": 0.009003860875964165, "global_step": 15387, "epoch": 129, "lr": 8.950910848147836e-05} +{"train_loss": 0.006198407616466284, "global_step": 15388, "epoch": 129, "lr": 8.950775061878453e-05} +{"train_loss": 0.007808987982571125, "global_step": 15389, "epoch": 129, "lr": 8.950639267852143e-05} +{"train_loss": 0.006298580672591925, "global_step": 15390, "epoch": 129, "lr": 8.950503466069177e-05} +{"train_loss": 0.005275125615298748, "global_step": 15391, "epoch": 129, "lr": 8.950367656529818e-05} +{"train_loss": 0.008171822875738144, "global_step": 15392, "epoch": 129, "lr": 8.950231839234336e-05} +{"train_loss": 0.003807217115536332, "global_step": 15393, "epoch": 129, "lr": 8.950096014182994e-05} +{"train_loss": 0.00818634033203125, "global_step": 15394, "epoch": 129, "lr": 8.949960181376061e-05} +{"train_loss": 0.006002367008477449, "global_step": 15395, "epoch": 129, "lr": 8.949824340813804e-05} +{"train_loss": 0.005997319705784321, "global_step": 15396, "epoch": 129, "lr": 8.949688492496489e-05} +{"train_loss": 0.006389221176505089, "global_step": 15397, "epoch": 129, "lr": 8.949552636424381e-05} +{"train_loss": 0.00917982030659914, "global_step": 15398, "epoch": 129, "lr": 8.94941677259775e-05} +{"train_loss": 0.005858945194631815, "global_step": 15399, "epoch": 129, "lr": 8.949280901016859e-05} +{"train_loss": 0.005986716132611036, "global_step": 15400, "epoch": 129, "lr": 8.94914502168198e-05} +{"train_loss": 0.0054830401204526424, "global_step": 15401, "epoch": 129, "lr": 8.949009134593373e-05} +{"train_loss": 0.010702433064579964, "global_step": 15402, "epoch": 129, "lr": 8.948873239751311e-05} +{"train_loss": 0.0068586780689656734, "global_step": 15403, "epoch": 129, "lr": 8.948737337156056e-05} +{"train_loss": 0.003967172931879759, "global_step": 15404, "epoch": 129, "lr": 8.94860142680788e-05} +{"train_loss": 0.008540208451449871, "global_step": 15405, "epoch": 129, "lr": 8.948465508707046e-05} +{"train_loss": 0.00845768116414547, "global_step": 15406, "epoch": 129, "lr": 8.94832958285382e-05} +{"train_loss": 0.005597160197794437, "global_step": 15407, "epoch": 129, "lr": 8.948193649248474e-05} +{"train_loss": 0.004864965565502644, "global_step": 15408, "epoch": 129, "lr": 8.948057707891268e-05} +{"train_loss": 0.007381686009466648, "global_step": 15409, "epoch": 129, "lr": 8.947921758782474e-05} +{"train_loss": 0.00938236340880394, "global_step": 15410, "epoch": 129, "lr": 8.947785801922358e-05} +{"train_loss": 0.0067810844630002975, "global_step": 15411, "epoch": 129, "lr": 8.947649837311186e-05} +{"train_loss": 0.00900272186845541, "global_step": 15412, "epoch": 129, "lr": 8.947513864949226e-05} +{"train_loss": 0.0069228000938892365, "global_step": 15413, "epoch": 129, "lr": 8.947377884836743e-05} +{"train_loss": 0.005947520956397057, "global_step": 15414, "epoch": 129, "lr": 8.947241896974006e-05} +{"train_loss": 0.0069707240909338, "global_step": 15415, "epoch": 129, "lr": 8.947105901361279e-05} +{"train_loss": 0.003946436103433371, "global_step": 15416, "epoch": 129, "lr": 8.946969897998833e-05} +{"train_loss": 0.0076445164158940315, "global_step": 15417, "epoch": 129, "lr": 8.946833886886934e-05} +{"train_loss": 0.008937378413975239, "global_step": 15418, "epoch": 129, "lr": 8.946697868025848e-05} +{"train_loss": 0.006302898749709129, "global_step": 15419, "epoch": 129, "lr": 8.946561841415842e-05} +{"train_loss": 0.0052256276831030846, "global_step": 15420, "epoch": 129, "lr": 8.946425807057184e-05} +{"train_loss": 0.0037395439576357603, "global_step": 15421, "epoch": 129, "lr": 8.946289764950139e-05} +{"train_loss": 0.005117654800415039, "global_step": 15422, "epoch": 129, "lr": 8.946153715094978e-05} +{"train_loss": 0.005090859718620777, "global_step": 15423, "epoch": 129, "lr": 8.946017657491964e-05} +{"train_loss": 0.009936060756444931, "global_step": 15424, "epoch": 129, "lr": 8.945881592141367e-05} +{"train_loss": 0.006357002537697554, "global_step": 15425, "epoch": 129, "lr": 8.945745519043452e-05} +{"train_loss": 0.006856376770883799, "global_step": 15426, "epoch": 129, "lr": 8.945609438198487e-05} +{"train_loss": 0.006246317643672228, "global_step": 15427, "epoch": 129, "lr": 8.94547334960674e-05} +{"train_loss": 0.004431516397744417, "global_step": 15428, "epoch": 129, "lr": 8.945337253268478e-05} +{"train_loss": 0.008678710088133812, "global_step": 15429, "epoch": 129, "lr": 8.945201149183968e-05} +{"train_loss": 0.005146903917193413, "global_step": 15430, "epoch": 129, "lr": 8.945065037353478e-05} +{"train_loss": 0.004696575924754143, "global_step": 15431, "epoch": 129, "lr": 8.944928917777271e-05} +{"train_loss": 0.0070884996093809605, "global_step": 15432, "epoch": 129, "lr": 8.94479279045562e-05} +{"train_loss": 0.0061991894617676735, "global_step": 15433, "epoch": 129, "lr": 8.944656655388788e-05} +{"train_loss": 0.006118339486420155, "global_step": 15434, "epoch": 129, "lr": 8.944520512577046e-05} +{"train_loss": 0.010416579432785511, "global_step": 15435, "epoch": 129, "lr": 8.944384362020657e-05} +{"train_loss": 0.005298076197504997, "global_step": 15436, "epoch": 129, "lr": 8.944248203719894e-05} +{"train_loss": 0.008012990467250347, "global_step": 15437, "epoch": 129, "lr": 8.94411203767502e-05} +{"train_loss": 0.007305925711989403, "global_step": 15438, "epoch": 129, "lr": 8.943975863886302e-05} +{"train_loss": 0.005975254811346531, "global_step": 15439, "epoch": 129, "lr": 8.943839682354009e-05} +{"train_loss": 0.008354030549526215, "global_step": 15440, "epoch": 129, "lr": 8.943703493078409e-05} +{"train_loss": 0.005262367893010378, "global_step": 15441, "epoch": 129, "lr": 8.943567296059767e-05} +{"train_loss": 0.005752261262387037, "global_step": 15442, "epoch": 129, "lr": 8.943431091298353e-05} +{"train_loss": 0.00811532512307167, "global_step": 15443, "epoch": 129, "lr": 8.943294878794432e-05} +{"train_loss": 0.008469881489872932, "global_step": 15444, "epoch": 129, "lr": 8.943158658548276e-05} +{"train_loss": 0.004359304439276457, "global_step": 15445, "epoch": 129, "lr": 8.943022430560147e-05} +{"train_loss": 0.006015338469296694, "global_step": 15446, "epoch": 129, "lr": 8.942886194830315e-05} +{"train_loss": 0.005245075561106205, "global_step": 15447, "epoch": 129, "lr": 8.942749951359047e-05} +{"train_loss": 0.008705807849764824, "global_step": 15448, "epoch": 129, "lr": 8.942613700146611e-05} +{"train_loss": 0.005292725749313831, "global_step": 15449, "epoch": 129, "lr": 8.942477441193274e-05} +{"train_loss": 0.00655435211956501, "global_step": 15450, "epoch": 129, "lr": 8.942341174499304e-05} +{"train_loss": 0.005347947124391794, "global_step": 15451, "epoch": 129, "lr": 8.942204900064967e-05} +{"train_loss": 0.006743320729583502, "global_step": 15452, "epoch": 129, "lr": 8.942068617890533e-05} +{"train_loss": 0.00749087193980813, "global_step": 15453, "epoch": 129, "lr": 8.941932327976269e-05} +{"train_loss": 0.0062985350377857685, "global_step": 15454, "epoch": 129, "lr": 8.941796030322442e-05} +{"train_loss": 0.009542154148221016, "global_step": 15455, "epoch": 129, "lr": 8.941659724929319e-05} +{"train_loss": 0.004947248380631208, "global_step": 15456, "epoch": 129, "lr": 8.941523411797168e-05} +{"train_loss": 0.007538239471614361, "global_step": 15457, "epoch": 129, "lr": 8.941387090926256e-05} +{"train_loss": 0.007024711929261684, "global_step": 15458, "epoch": 129, "lr": 8.941250762316853e-05} +{"train_loss": 0.008622974157333374, "global_step": 15459, "epoch": 129, "lr": 8.941114425969226e-05} +{"train_loss": 0.006714486982673407, "global_step": 15460, "epoch": 129, "lr": 8.94097808188364e-05} +{"train_loss": 0.007076126988977194, "global_step": 15461, "epoch": 129, "lr": 8.940841730060365e-05} +{"train_loss": 0.007027085870504379, "global_step": 15462, "epoch": 129, "lr": 8.940705370499669e-05} +{"train_loss": 0.004356585443019867, "global_step": 15463, "epoch": 129, "lr": 8.940569003201818e-05} +{"train_loss": 0.00836043618619442, "global_step": 15464, "epoch": 129, "lr": 8.940432628167082e-05} +{"train_loss": 0.006080541294068098, "global_step": 15465, "epoch": 129, "lr": 8.940296245395727e-05} +{"train_loss": 0.00634064432233572, "global_step": 15466, "epoch": 129, "lr": 8.940159854888021e-05} +{"train_loss": 0.004851959180086851, "global_step": 15467, "epoch": 129, "lr": 8.940023456644231e-05} +{"train_loss": 0.005685216281563044, "global_step": 15468, "epoch": 129, "lr": 8.939887050664629e-05} +{"train_loss": 0.006712173575441502, "global_step": 15469, "epoch": 129, "lr": 8.939750636949477e-05, "val_loss": 0.013184087350964546} +{"train_loss": 0.0057706525549292564, "global_step": 15470, "epoch": 130, "lr": 8.939614215499045e-05} +{"train_loss": 0.0057145156897604465, "global_step": 15471, "epoch": 130, "lr": 8.939477786313604e-05} +{"train_loss": 0.005590463522821665, "global_step": 15472, "epoch": 130, "lr": 8.939341349393418e-05} +{"train_loss": 0.004322490189224482, "global_step": 15473, "epoch": 130, "lr": 8.939204904738754e-05} +{"train_loss": 0.005404881201684475, "global_step": 15474, "epoch": 130, "lr": 8.939068452349885e-05} +{"train_loss": 0.005313052795827389, "global_step": 15475, "epoch": 130, "lr": 8.938931992227076e-05} +{"train_loss": 0.004624181427061558, "global_step": 15476, "epoch": 130, "lr": 8.938795524370593e-05} +{"train_loss": 0.009404201991856098, "global_step": 15477, "epoch": 130, "lr": 8.938659048780706e-05} +{"train_loss": 0.005854032468050718, "global_step": 15478, "epoch": 130, "lr": 8.938522565457684e-05} +{"train_loss": 0.0056481207720935345, "global_step": 15479, "epoch": 130, "lr": 8.938386074401793e-05} +{"train_loss": 0.005286459811031818, "global_step": 15480, "epoch": 130, "lr": 8.938249575613301e-05} +{"train_loss": 0.004176710266619921, "global_step": 15481, "epoch": 130, "lr": 8.938113069092477e-05} +{"train_loss": 0.006384310778230429, "global_step": 15482, "epoch": 130, "lr": 8.937976554839589e-05} +{"train_loss": 0.008635340258479118, "global_step": 15483, "epoch": 130, "lr": 8.937840032854905e-05} +{"train_loss": 0.0060608116909861565, "global_step": 15484, "epoch": 130, "lr": 8.937703503138693e-05} +{"train_loss": 0.007382966578006744, "global_step": 15485, "epoch": 130, "lr": 8.937566965691222e-05} +{"train_loss": 0.005202143453061581, "global_step": 15486, "epoch": 130, "lr": 8.937430420512756e-05} +{"train_loss": 0.0102193932980299, "global_step": 15487, "epoch": 130, "lr": 8.937293867603566e-05} +{"train_loss": 0.005765972658991814, "global_step": 15488, "epoch": 130, "lr": 8.937157306963924e-05} +{"train_loss": 0.004646870773285627, "global_step": 15489, "epoch": 130, "lr": 8.93702073859409e-05} +{"train_loss": 0.006979239173233509, "global_step": 15490, "epoch": 130, "lr": 8.936884162494339e-05} +{"train_loss": 0.0065849251113832, "global_step": 15491, "epoch": 130, "lr": 8.936747578664936e-05} +{"train_loss": 0.0072212968952953815, "global_step": 15492, "epoch": 130, "lr": 8.936610987106149e-05} +{"train_loss": 0.005368782207369804, "global_step": 15493, "epoch": 130, "lr": 8.936474387818247e-05} +{"train_loss": 0.005916212685406208, "global_step": 15494, "epoch": 130, "lr": 8.9363377808015e-05} +{"train_loss": 0.005046755075454712, "global_step": 15495, "epoch": 130, "lr": 8.936201166056172e-05} +{"train_loss": 0.007728846278041601, "global_step": 15496, "epoch": 130, "lr": 8.936064543582534e-05} +{"train_loss": 0.007919163443148136, "global_step": 15497, "epoch": 130, "lr": 8.935927913380854e-05} +{"train_loss": 0.008750833570957184, "global_step": 15498, "epoch": 130, "lr": 8.9357912754514e-05} +{"train_loss": 0.005483700893819332, "global_step": 15499, "epoch": 130, "lr": 8.935654629794441e-05} +{"train_loss": 0.007761090993881226, "global_step": 15500, "epoch": 130, "lr": 8.935517976410244e-05} +{"train_loss": 0.0068987770937383175, "global_step": 15501, "epoch": 130, "lr": 8.935381315299078e-05} +{"train_loss": 0.006006679963320494, "global_step": 15502, "epoch": 130, "lr": 8.93524464646121e-05} +{"train_loss": 0.009905720129609108, "global_step": 15503, "epoch": 130, "lr": 8.935107969896911e-05} +{"train_loss": 0.005975236184895039, "global_step": 15504, "epoch": 130, "lr": 8.934971285606449e-05} +{"train_loss": 0.01040397398173809, "global_step": 15505, "epoch": 130, "lr": 8.93483459359009e-05} +{"train_loss": 0.005435055121779442, "global_step": 15506, "epoch": 130, "lr": 8.934697893848101e-05} +{"train_loss": 0.004376289434731007, "global_step": 15507, "epoch": 130, "lr": 8.934561186380756e-05} +{"train_loss": 0.00825443770736456, "global_step": 15508, "epoch": 130, "lr": 8.934424471188321e-05} +{"train_loss": 0.006081209983676672, "global_step": 15509, "epoch": 130, "lr": 8.934287748271062e-05} +{"train_loss": 0.005170004442334175, "global_step": 15510, "epoch": 130, "lr": 8.934151017629251e-05} +{"train_loss": 0.008167430758476257, "global_step": 15511, "epoch": 130, "lr": 8.934014279263154e-05} +{"train_loss": 0.0037470615934580564, "global_step": 15512, "epoch": 130, "lr": 8.93387753317304e-05} +{"train_loss": 0.007218723185360432, "global_step": 15513, "epoch": 130, "lr": 8.933740779359177e-05} +{"train_loss": 0.00531921349465847, "global_step": 15514, "epoch": 130, "lr": 8.933604017821835e-05} +{"train_loss": 0.005528745241463184, "global_step": 15515, "epoch": 130, "lr": 8.933467248561282e-05} +{"train_loss": 0.006211170461028814, "global_step": 15516, "epoch": 130, "lr": 8.933330471577787e-05} +{"train_loss": 0.009026086889207363, "global_step": 15517, "epoch": 130, "lr": 8.933193686871617e-05} +{"train_loss": 0.012054177932441235, "global_step": 15518, "epoch": 130, "lr": 8.933056894443041e-05} +{"train_loss": 0.005898327101022005, "global_step": 15519, "epoch": 130, "lr": 8.93292009429233e-05} +{"train_loss": 0.0041213259100914, "global_step": 15520, "epoch": 130, "lr": 8.932783286419748e-05} +{"train_loss": 0.0072036185301840305, "global_step": 15521, "epoch": 130, "lr": 8.932646470825567e-05} +{"train_loss": 0.004550531506538391, "global_step": 15522, "epoch": 130, "lr": 8.932509647510055e-05} +{"train_loss": 0.005011053755879402, "global_step": 15523, "epoch": 130, "lr": 8.932372816473479e-05} +{"train_loss": 0.0038640464190393686, "global_step": 15524, "epoch": 130, "lr": 8.932235977716113e-05} +{"train_loss": 0.006464510224759579, "global_step": 15525, "epoch": 130, "lr": 8.932099131238219e-05} +{"train_loss": 0.008328026160597801, "global_step": 15526, "epoch": 130, "lr": 8.93196227704007e-05} +{"train_loss": 0.007758434861898422, "global_step": 15527, "epoch": 130, "lr": 8.93182541512193e-05} +{"train_loss": 0.0056543778628110886, "global_step": 15528, "epoch": 130, "lr": 8.931688545484073e-05} +{"train_loss": 0.009475133381783962, "global_step": 15529, "epoch": 130, "lr": 8.931551668126766e-05} +{"train_loss": 0.007472829427570105, "global_step": 15530, "epoch": 130, "lr": 8.931414783050275e-05} +{"train_loss": 0.006259026471525431, "global_step": 15531, "epoch": 130, "lr": 8.931277890254872e-05} +{"train_loss": 0.007453475147485733, "global_step": 15532, "epoch": 130, "lr": 8.931140989740826e-05} +{"train_loss": 0.00513256061822176, "global_step": 15533, "epoch": 130, "lr": 8.931004081508406e-05} +{"train_loss": 0.006229119841009378, "global_step": 15534, "epoch": 130, "lr": 8.930867165557876e-05} +{"train_loss": 0.006667724344879389, "global_step": 15535, "epoch": 130, "lr": 8.93073024188951e-05} +{"train_loss": 0.007477837149053812, "global_step": 15536, "epoch": 130, "lr": 8.930593310503576e-05} +{"train_loss": 0.0074702417477965355, "global_step": 15537, "epoch": 130, "lr": 8.93045637140034e-05} +{"train_loss": 0.0051534282974898815, "global_step": 15538, "epoch": 130, "lr": 8.930319424580074e-05} +{"train_loss": 0.004799466114491224, "global_step": 15539, "epoch": 130, "lr": 8.930182470043044e-05} +{"train_loss": 0.010065967217087746, "global_step": 15540, "epoch": 130, "lr": 8.930045507789524e-05} +{"train_loss": 0.005246591754257679, "global_step": 15541, "epoch": 130, "lr": 8.929908537819778e-05} +{"train_loss": 0.0067609017714858055, "global_step": 15542, "epoch": 130, "lr": 8.929771560134075e-05} +{"train_loss": 0.008359003812074661, "global_step": 15543, "epoch": 130, "lr": 8.929634574732685e-05} +{"train_loss": 0.006562072318047285, "global_step": 15544, "epoch": 130, "lr": 8.92949758161588e-05} +{"train_loss": 0.004356280900537968, "global_step": 15545, "epoch": 130, "lr": 8.929360580783925e-05} +{"train_loss": 0.009946306236088276, "global_step": 15546, "epoch": 130, "lr": 8.929223572237092e-05} +{"train_loss": 0.0059313466772437096, "global_step": 15547, "epoch": 130, "lr": 8.929086555975646e-05} +{"train_loss": 0.0071503049694001675, "global_step": 15548, "epoch": 130, "lr": 8.928949531999858e-05} +{"train_loss": 0.007839420810341835, "global_step": 15549, "epoch": 130, "lr": 8.928812500309998e-05} +{"train_loss": 0.004294409416615963, "global_step": 15550, "epoch": 130, "lr": 8.928675460906334e-05} +{"train_loss": 0.005180861335247755, "global_step": 15551, "epoch": 130, "lr": 8.928538413789139e-05} +{"train_loss": 0.004210393410176039, "global_step": 15552, "epoch": 130, "lr": 8.928401358958674e-05} +{"train_loss": 0.0051408801227808, "global_step": 15553, "epoch": 130, "lr": 8.928264296415214e-05} +{"train_loss": 0.00592739786952734, "global_step": 15554, "epoch": 130, "lr": 8.928127226159028e-05} +{"train_loss": 0.006504680495709181, "global_step": 15555, "epoch": 130, "lr": 8.927990148190381e-05} +{"train_loss": 0.006658603902906179, "global_step": 15556, "epoch": 130, "lr": 8.927853062509548e-05} +{"train_loss": 0.006852757651358843, "global_step": 15557, "epoch": 130, "lr": 8.927715969116794e-05} +{"train_loss": 0.005811239592730999, "global_step": 15558, "epoch": 130, "lr": 8.92757886801239e-05} +{"train_loss": 0.005800523329526186, "global_step": 15559, "epoch": 130, "lr": 8.927441759196602e-05} +{"train_loss": 0.006006764713674784, "global_step": 15560, "epoch": 130, "lr": 8.927304642669705e-05} +{"train_loss": 0.005652694962918758, "global_step": 15561, "epoch": 130, "lr": 8.927167518431962e-05} +{"train_loss": 0.005385919474065304, "global_step": 15562, "epoch": 130, "lr": 8.927030386483648e-05} +{"train_loss": 0.00553217763081193, "global_step": 15563, "epoch": 130, "lr": 8.926893246825028e-05} +{"train_loss": 0.006491841748356819, "global_step": 15564, "epoch": 130, "lr": 8.926756099456372e-05} +{"train_loss": 0.00540741253644228, "global_step": 15565, "epoch": 130, "lr": 8.926618944377949e-05} +{"train_loss": 0.003741383785381913, "global_step": 15566, "epoch": 130, "lr": 8.926481781590032e-05} +{"train_loss": 0.005256774835288525, "global_step": 15567, "epoch": 130, "lr": 8.926344611092885e-05} +{"train_loss": 0.006652007345110178, "global_step": 15568, "epoch": 130, "lr": 8.926207432886782e-05} +{"train_loss": 0.004078587982803583, "global_step": 15569, "epoch": 130, "lr": 8.92607024697199e-05} +{"train_loss": 0.007084221113473177, "global_step": 15570, "epoch": 130, "lr": 8.925933053348777e-05} +{"train_loss": 0.007391705177724361, "global_step": 15571, "epoch": 130, "lr": 8.925795852017414e-05} +{"train_loss": 0.005775687284767628, "global_step": 15572, "epoch": 130, "lr": 8.92565864297817e-05} +{"train_loss": 0.004369663540273905, "global_step": 15573, "epoch": 130, "lr": 8.925521426231316e-05} +{"train_loss": 0.007929029874503613, "global_step": 15574, "epoch": 130, "lr": 8.925384201777119e-05} +{"train_loss": 0.006055580917745829, "global_step": 15575, "epoch": 130, "lr": 8.92524696961585e-05} +{"train_loss": 0.010190647095441818, "global_step": 15576, "epoch": 130, "lr": 8.925109729747778e-05} +{"train_loss": 0.007339905947446823, "global_step": 15577, "epoch": 130, "lr": 8.924972482173173e-05} +{"train_loss": 0.008226800709962845, "global_step": 15578, "epoch": 130, "lr": 8.924835226892303e-05} +{"train_loss": 0.009310740046203136, "global_step": 15579, "epoch": 130, "lr": 8.924697963905437e-05} +{"train_loss": 0.010247363708913326, "global_step": 15580, "epoch": 130, "lr": 8.924560693212847e-05} +{"train_loss": 0.009013417176902294, "global_step": 15581, "epoch": 130, "lr": 8.924423414814802e-05} +{"train_loss": 0.0058383699506521225, "global_step": 15582, "epoch": 130, "lr": 8.924286128711572e-05} +{"train_loss": 0.005300321616232395, "global_step": 15583, "epoch": 130, "lr": 8.924148834903423e-05} +{"train_loss": 0.007462829817086458, "global_step": 15584, "epoch": 130, "lr": 8.924011533390628e-05} +{"train_loss": 0.007396265864372253, "global_step": 15585, "epoch": 130, "lr": 8.923874224173456e-05} +{"train_loss": 0.004371060058474541, "global_step": 15586, "epoch": 130, "lr": 8.923736907252176e-05} +{"train_loss": 0.004396115429699421, "global_step": 15587, "epoch": 130, "lr": 8.923599582627057e-05} +{"train_loss": 0.006489127946767111, "global_step": 15588, "epoch": 130, "lr": 8.92346225029837e-05, "val_loss": 0.02176274172961712, "train_action_mse_error": 0.0002485671720933169} +{"train_loss": 0.0067697023041546345, "global_step": 15589, "epoch": 131, "lr": 8.923324910266383e-05} +{"train_loss": 0.008182215504348278, "global_step": 15590, "epoch": 131, "lr": 8.923187562531367e-05} +{"train_loss": 0.009767858311533928, "global_step": 15591, "epoch": 131, "lr": 8.923050207093593e-05} +{"train_loss": 0.00703364796936512, "global_step": 15592, "epoch": 131, "lr": 8.922912843953328e-05} +{"train_loss": 0.006175418384373188, "global_step": 15593, "epoch": 131, "lr": 8.922775473110843e-05} +{"train_loss": 0.008949455805122852, "global_step": 15594, "epoch": 131, "lr": 8.922638094566407e-05} +{"train_loss": 0.00693917740136385, "global_step": 15595, "epoch": 131, "lr": 8.922500708320291e-05} +{"train_loss": 0.009625356644392014, "global_step": 15596, "epoch": 131, "lr": 8.922363314372763e-05} +{"train_loss": 0.006776720751076937, "global_step": 15597, "epoch": 131, "lr": 8.922225912724094e-05} +{"train_loss": 0.008211526088416576, "global_step": 15598, "epoch": 131, "lr": 8.922088503374553e-05} +{"train_loss": 0.0038647567853331566, "global_step": 15599, "epoch": 131, "lr": 8.921951086324411e-05} +{"train_loss": 0.006269602105021477, "global_step": 15600, "epoch": 131, "lr": 8.921813661573935e-05} +{"train_loss": 0.007483745459467173, "global_step": 15601, "epoch": 131, "lr": 8.9216762291234e-05} +{"train_loss": 0.005648663267493248, "global_step": 15602, "epoch": 131, "lr": 8.92153878897307e-05} +{"train_loss": 0.004997322801500559, "global_step": 15603, "epoch": 131, "lr": 8.921401341123218e-05} +{"train_loss": 0.004638948943465948, "global_step": 15604, "epoch": 131, "lr": 8.921263885574116e-05} +{"train_loss": 0.011496545746922493, "global_step": 15605, "epoch": 131, "lr": 8.921126422326029e-05} +{"train_loss": 0.004505057819187641, "global_step": 15606, "epoch": 131, "lr": 8.92098895137923e-05} +{"train_loss": 0.004750060848891735, "global_step": 15607, "epoch": 131, "lr": 8.920851472733987e-05} +{"train_loss": 0.009394926019012928, "global_step": 15608, "epoch": 131, "lr": 8.920713986390572e-05} +{"train_loss": 0.008771074935793877, "global_step": 15609, "epoch": 131, "lr": 8.920576492349253e-05} +{"train_loss": 0.009467804804444313, "global_step": 15610, "epoch": 131, "lr": 8.920438990610303e-05} +{"train_loss": 0.00820070505142212, "global_step": 15611, "epoch": 131, "lr": 8.920301481173987e-05} +{"train_loss": 0.007220374885946512, "global_step": 15612, "epoch": 131, "lr": 8.92016396404058e-05} +{"train_loss": 0.005303180310875177, "global_step": 15613, "epoch": 131, "lr": 8.920026439210349e-05} +{"train_loss": 0.010898175649344921, "global_step": 15614, "epoch": 131, "lr": 8.919888906683565e-05} +{"train_loss": 0.013862048275768757, "global_step": 15615, "epoch": 131, "lr": 8.919751366460498e-05} +{"train_loss": 0.004126927349716425, "global_step": 15616, "epoch": 131, "lr": 8.919613818541417e-05} +{"train_loss": 0.004439351614564657, "global_step": 15617, "epoch": 131, "lr": 8.919476262926594e-05} +{"train_loss": 0.006219112779945135, "global_step": 15618, "epoch": 131, "lr": 8.919338699616299e-05} +{"train_loss": 0.007118167821317911, "global_step": 15619, "epoch": 131, "lr": 8.9192011286108e-05} +{"train_loss": 0.0064091067761182785, "global_step": 15620, "epoch": 131, "lr": 8.919063549910369e-05} +{"train_loss": 0.01099046878516674, "global_step": 15621, "epoch": 131, "lr": 8.918925963515275e-05} +{"train_loss": 0.00988253578543663, "global_step": 15622, "epoch": 131, "lr": 8.918788369425788e-05} +{"train_loss": 0.009101742878556252, "global_step": 15623, "epoch": 131, "lr": 8.918650767642179e-05} +{"train_loss": 0.0063866847194731236, "global_step": 15624, "epoch": 131, "lr": 8.918513158164718e-05} +{"train_loss": 0.009146861732006073, "global_step": 15625, "epoch": 131, "lr": 8.918375540993676e-05} +{"train_loss": 0.006215621717274189, "global_step": 15626, "epoch": 131, "lr": 8.918237916129321e-05} +{"train_loss": 0.005889943800866604, "global_step": 15627, "epoch": 131, "lr": 8.918100283571923e-05} +{"train_loss": 0.005572160240262747, "global_step": 15628, "epoch": 131, "lr": 8.917962643321756e-05} +{"train_loss": 0.005850391928106546, "global_step": 15629, "epoch": 131, "lr": 8.917824995379087e-05} +{"train_loss": 0.007002108730375767, "global_step": 15630, "epoch": 131, "lr": 8.917687339744188e-05} +{"train_loss": 0.003664696589112282, "global_step": 15631, "epoch": 131, "lr": 8.917549676417328e-05} +{"train_loss": 0.006287569645792246, "global_step": 15632, "epoch": 131, "lr": 8.917412005398777e-05} +{"train_loss": 0.0064927046187222, "global_step": 15633, "epoch": 131, "lr": 8.917274326688808e-05} +{"train_loss": 0.006133987568318844, "global_step": 15634, "epoch": 131, "lr": 8.917136640287689e-05} +{"train_loss": 0.005371151491999626, "global_step": 15635, "epoch": 131, "lr": 8.91699894619569e-05} +{"train_loss": 0.005691923666745424, "global_step": 15636, "epoch": 131, "lr": 8.916861244413082e-05} +{"train_loss": 0.007840504869818687, "global_step": 15637, "epoch": 131, "lr": 8.916723534940134e-05} +{"train_loss": 0.00641549052670598, "global_step": 15638, "epoch": 131, "lr": 8.916585817777119e-05} +{"train_loss": 0.006766258738934994, "global_step": 15639, "epoch": 131, "lr": 8.916448092924306e-05} +{"train_loss": 0.0050109014846384525, "global_step": 15640, "epoch": 131, "lr": 8.916310360381966e-05} +{"train_loss": 0.006654439494013786, "global_step": 15641, "epoch": 131, "lr": 8.91617262015037e-05} +{"train_loss": 0.004867671988904476, "global_step": 15642, "epoch": 131, "lr": 8.916034872229786e-05} +{"train_loss": 0.01029475498944521, "global_step": 15643, "epoch": 131, "lr": 8.915897116620486e-05} +{"train_loss": 0.007414692547172308, "global_step": 15644, "epoch": 131, "lr": 8.91575935332274e-05} +{"train_loss": 0.004477574490010738, "global_step": 15645, "epoch": 131, "lr": 8.91562158233682e-05} +{"train_loss": 0.006014012731611729, "global_step": 15646, "epoch": 131, "lr": 8.915483803662994e-05} +{"train_loss": 0.008424290455877781, "global_step": 15647, "epoch": 131, "lr": 8.915346017301534e-05} +{"train_loss": 0.007110158447176218, "global_step": 15648, "epoch": 131, "lr": 8.91520822325271e-05} +{"train_loss": 0.007995477877557278, "global_step": 15649, "epoch": 131, "lr": 8.915070421516796e-05} +{"train_loss": 0.003921135328710079, "global_step": 15650, "epoch": 131, "lr": 8.914932612094055e-05} +{"train_loss": 0.0059694708324968815, "global_step": 15651, "epoch": 131, "lr": 8.914794794984767e-05} +{"train_loss": 0.005878554191440344, "global_step": 15652, "epoch": 131, "lr": 8.914656970189195e-05} +{"train_loss": 0.008980443701148033, "global_step": 15653, "epoch": 131, "lr": 8.914519137707611e-05} +{"train_loss": 0.006201275158673525, "global_step": 15654, "epoch": 131, "lr": 8.914381297540288e-05} +{"train_loss": 0.006456409115344286, "global_step": 15655, "epoch": 131, "lr": 8.914243449687496e-05} +{"train_loss": 0.005542556289583445, "global_step": 15656, "epoch": 131, "lr": 8.914105594149504e-05} +{"train_loss": 0.010812943801283836, "global_step": 15657, "epoch": 131, "lr": 8.913967730926586e-05} +{"train_loss": 0.006407843437045813, "global_step": 15658, "epoch": 131, "lr": 8.913829860019009e-05} +{"train_loss": 0.006842317525297403, "global_step": 15659, "epoch": 131, "lr": 8.913691981427045e-05} +{"train_loss": 0.004796639084815979, "global_step": 15660, "epoch": 131, "lr": 8.913554095150967e-05} +{"train_loss": 0.009326443076133728, "global_step": 15661, "epoch": 131, "lr": 8.91341620119104e-05} +{"train_loss": 0.005212801042944193, "global_step": 15662, "epoch": 131, "lr": 8.913278299547541e-05} +{"train_loss": 0.00991719402372837, "global_step": 15663, "epoch": 131, "lr": 8.913140390220737e-05} +{"train_loss": 0.006839800626039505, "global_step": 15664, "epoch": 131, "lr": 8.9130024732109e-05} +{"train_loss": 0.0037046459037810564, "global_step": 15665, "epoch": 131, "lr": 8.912864548518302e-05} +{"train_loss": 0.0064907618798315525, "global_step": 15666, "epoch": 131, "lr": 8.912726616143212e-05} +{"train_loss": 0.005439859814941883, "global_step": 15667, "epoch": 131, "lr": 8.9125886760859e-05} +{"train_loss": 0.007168666925281286, "global_step": 15668, "epoch": 131, "lr": 8.91245072834664e-05} +{"train_loss": 0.004901308100670576, "global_step": 15669, "epoch": 131, "lr": 8.912312772925699e-05} +{"train_loss": 0.007572049740701914, "global_step": 15670, "epoch": 131, "lr": 8.912174809823351e-05} +{"train_loss": 0.005369200371205807, "global_step": 15671, "epoch": 131, "lr": 8.912036839039866e-05} +{"train_loss": 0.00752406707033515, "global_step": 15672, "epoch": 131, "lr": 8.911898860575514e-05} +{"train_loss": 0.006115238182246685, "global_step": 15673, "epoch": 131, "lr": 8.911760874430566e-05} +{"train_loss": 0.007775437086820602, "global_step": 15674, "epoch": 131, "lr": 8.911622880605295e-05} +{"train_loss": 0.006881623063236475, "global_step": 15675, "epoch": 131, "lr": 8.91148487909997e-05} +{"train_loss": 0.005223354324698448, "global_step": 15676, "epoch": 131, "lr": 8.911346869914861e-05} +{"train_loss": 0.006473163608461618, "global_step": 15677, "epoch": 131, "lr": 8.911208853050241e-05} +{"train_loss": 0.0056190104223787785, "global_step": 15678, "epoch": 131, "lr": 8.91107082850638e-05} +{"train_loss": 0.004449627362191677, "global_step": 15679, "epoch": 131, "lr": 8.91093279628355e-05} +{"train_loss": 0.005460420157760382, "global_step": 15680, "epoch": 131, "lr": 8.91079475638202e-05} +{"train_loss": 0.008095613680779934, "global_step": 15681, "epoch": 131, "lr": 8.910656708802064e-05} +{"train_loss": 0.004543522838503122, "global_step": 15682, "epoch": 131, "lr": 8.91051865354395e-05} +{"train_loss": 0.007539788726717234, "global_step": 15683, "epoch": 131, "lr": 8.910380590607952e-05} +{"train_loss": 0.008149756118655205, "global_step": 15684, "epoch": 131, "lr": 8.910242519994337e-05} +{"train_loss": 0.005659363232553005, "global_step": 15685, "epoch": 131, "lr": 8.910104441703381e-05} +{"train_loss": 0.0065367757342755795, "global_step": 15686, "epoch": 131, "lr": 8.909966355735351e-05} +{"train_loss": 0.006948583293706179, "global_step": 15687, "epoch": 131, "lr": 8.90982826209052e-05} +{"train_loss": 0.00851364154368639, "global_step": 15688, "epoch": 131, "lr": 8.90969016076916e-05} +{"train_loss": 0.009079206734895706, "global_step": 15689, "epoch": 131, "lr": 8.90955205177154e-05} +{"train_loss": 0.00539366714656353, "global_step": 15690, "epoch": 131, "lr": 8.909413935097932e-05} +{"train_loss": 0.006264487747102976, "global_step": 15691, "epoch": 131, "lr": 8.909275810748608e-05} +{"train_loss": 0.005244527477771044, "global_step": 15692, "epoch": 131, "lr": 8.909137678723839e-05} +{"train_loss": 0.006692302413284779, "global_step": 15693, "epoch": 131, "lr": 8.908999539023896e-05} +{"train_loss": 0.006163923069834709, "global_step": 15694, "epoch": 131, "lr": 8.908861391649048e-05} +{"train_loss": 0.006829685531556606, "global_step": 15695, "epoch": 131, "lr": 8.90872323659957e-05} +{"train_loss": 0.00558851845562458, "global_step": 15696, "epoch": 131, "lr": 8.908585073875732e-05} +{"train_loss": 0.007615128066390753, "global_step": 15697, "epoch": 131, "lr": 8.908446903477803e-05} +{"train_loss": 0.005239372607320547, "global_step": 15698, "epoch": 131, "lr": 8.908308725406059e-05} +{"train_loss": 0.0045213401317596436, "global_step": 15699, "epoch": 131, "lr": 8.908170539660764e-05} +{"train_loss": 0.005992532707750797, "global_step": 15700, "epoch": 131, "lr": 8.908032346242196e-05} +{"train_loss": 0.005609505344182253, "global_step": 15701, "epoch": 131, "lr": 8.907894145150625e-05} +{"train_loss": 0.0062962910160422325, "global_step": 15702, "epoch": 131, "lr": 8.90775593638632e-05} +{"train_loss": 0.006369906943291426, "global_step": 15703, "epoch": 131, "lr": 8.907617719949554e-05} +{"train_loss": 0.002903652610257268, "global_step": 15704, "epoch": 131, "lr": 8.907479495840598e-05} +{"train_loss": 0.004195862449705601, "global_step": 15705, "epoch": 131, "lr": 8.907341264059723e-05} +{"train_loss": 0.005154519807547331, "global_step": 15706, "epoch": 131, "lr": 8.907203024607202e-05} +{"train_loss": 0.006700205096207997, "global_step": 15707, "epoch": 131, "lr": 8.907064777483305e-05, "val_loss": 0.014726396650075912} +{"train_loss": 0.00412734504789114, "global_step": 15708, "epoch": 132, "lr": 8.906926522688304e-05} +{"train_loss": 0.005457722116261721, "global_step": 15709, "epoch": 132, "lr": 8.90678826022247e-05} +{"train_loss": 0.006082137115299702, "global_step": 15710, "epoch": 132, "lr": 8.906649990086073e-05} +{"train_loss": 0.00669610220938921, "global_step": 15711, "epoch": 132, "lr": 8.906511712279389e-05} +{"train_loss": 0.007756785023957491, "global_step": 15712, "epoch": 132, "lr": 8.906373426802683e-05} +{"train_loss": 0.004910042509436607, "global_step": 15713, "epoch": 132, "lr": 8.906235133656234e-05} +{"train_loss": 0.005159591790288687, "global_step": 15714, "epoch": 132, "lr": 8.906096832840308e-05} +{"train_loss": 0.004047144204378128, "global_step": 15715, "epoch": 132, "lr": 8.905958524355176e-05} +{"train_loss": 0.008210072293877602, "global_step": 15716, "epoch": 132, "lr": 8.905820208201115e-05} +{"train_loss": 0.007649900857359171, "global_step": 15717, "epoch": 132, "lr": 8.905681884378391e-05} +{"train_loss": 0.005831562448292971, "global_step": 15718, "epoch": 132, "lr": 8.90554355288728e-05} +{"train_loss": 0.007452376652508974, "global_step": 15719, "epoch": 132, "lr": 8.905405213728049e-05} +{"train_loss": 0.00537107465788722, "global_step": 15720, "epoch": 132, "lr": 8.905266866900973e-05} +{"train_loss": 0.005106139462441206, "global_step": 15721, "epoch": 132, "lr": 8.905128512406323e-05} +{"train_loss": 0.0049650464206933975, "global_step": 15722, "epoch": 132, "lr": 8.90499015024437e-05} +{"train_loss": 0.007625875994563103, "global_step": 15723, "epoch": 132, "lr": 8.904851780415388e-05} +{"train_loss": 0.005041135475039482, "global_step": 15724, "epoch": 132, "lr": 8.904713402919645e-05} +{"train_loss": 0.007038016803562641, "global_step": 15725, "epoch": 132, "lr": 8.904575017757414e-05} +{"train_loss": 0.00588314700871706, "global_step": 15726, "epoch": 132, "lr": 8.904436624928968e-05} +{"train_loss": 0.00483685452491045, "global_step": 15727, "epoch": 132, "lr": 8.904298224434577e-05} +{"train_loss": 0.006724445149302483, "global_step": 15728, "epoch": 132, "lr": 8.904159816274514e-05} +{"train_loss": 0.006675321143120527, "global_step": 15729, "epoch": 132, "lr": 8.904021400449051e-05} +{"train_loss": 0.005383057985454798, "global_step": 15730, "epoch": 132, "lr": 8.903882976958457e-05} +{"train_loss": 0.0067840199917554855, "global_step": 15731, "epoch": 132, "lr": 8.903744545803008e-05} +{"train_loss": 0.004693277180194855, "global_step": 15732, "epoch": 132, "lr": 8.903606106982974e-05} +{"train_loss": 0.004093295428901911, "global_step": 15733, "epoch": 132, "lr": 8.903467660498625e-05} +{"train_loss": 0.004616846330463886, "global_step": 15734, "epoch": 132, "lr": 8.903329206350234e-05} +{"train_loss": 0.005842403043061495, "global_step": 15735, "epoch": 132, "lr": 8.903190744538074e-05} +{"train_loss": 0.008437713608145714, "global_step": 15736, "epoch": 132, "lr": 8.903052275062415e-05} +{"train_loss": 0.006431443616747856, "global_step": 15737, "epoch": 132, "lr": 8.902913797923531e-05} +{"train_loss": 0.008337782695889473, "global_step": 15738, "epoch": 132, "lr": 8.902775313121692e-05} +{"train_loss": 0.004754282534122467, "global_step": 15739, "epoch": 132, "lr": 8.90263682065717e-05} +{"train_loss": 0.0036858702078461647, "global_step": 15740, "epoch": 132, "lr": 8.902498320530239e-05} +{"train_loss": 0.005506378598511219, "global_step": 15741, "epoch": 132, "lr": 8.902359812741169e-05} +{"train_loss": 0.004540084861218929, "global_step": 15742, "epoch": 132, "lr": 8.902221297290232e-05} +{"train_loss": 0.008165751583874226, "global_step": 15743, "epoch": 132, "lr": 8.902082774177702e-05} +{"train_loss": 0.008642641827464104, "global_step": 15744, "epoch": 132, "lr": 8.901944243403848e-05} +{"train_loss": 0.007398063316941261, "global_step": 15745, "epoch": 132, "lr": 8.901805704968942e-05} +{"train_loss": 0.007904302328824997, "global_step": 15746, "epoch": 132, "lr": 8.901667158873259e-05} +{"train_loss": 0.0031422721222043037, "global_step": 15747, "epoch": 132, "lr": 8.901528605117069e-05} +{"train_loss": 0.007327420637011528, "global_step": 15748, "epoch": 132, "lr": 8.901390043700645e-05} +{"train_loss": 0.008465101942420006, "global_step": 15749, "epoch": 132, "lr": 8.901251474624257e-05} +{"train_loss": 0.004879770800471306, "global_step": 15750, "epoch": 132, "lr": 8.901112897888179e-05} +{"train_loss": 0.005511291790753603, "global_step": 15751, "epoch": 132, "lr": 8.900974313492685e-05} +{"train_loss": 0.006219320464879274, "global_step": 15752, "epoch": 132, "lr": 8.900835721438042e-05} +{"train_loss": 0.007006428204476833, "global_step": 15753, "epoch": 132, "lr": 8.900697121724525e-05} +{"train_loss": 0.006628143135458231, "global_step": 15754, "epoch": 132, "lr": 8.900558514352407e-05} +{"train_loss": 0.007547765038907528, "global_step": 15755, "epoch": 132, "lr": 8.900419899321958e-05} +{"train_loss": 0.007552207913249731, "global_step": 15756, "epoch": 132, "lr": 8.900281276633453e-05} +{"train_loss": 0.004661110229790211, "global_step": 15757, "epoch": 132, "lr": 8.900142646287159e-05} +{"train_loss": 0.006214910186827183, "global_step": 15758, "epoch": 132, "lr": 8.900004008283355e-05} +{"train_loss": 0.009906341321766376, "global_step": 15759, "epoch": 132, "lr": 8.899865362622308e-05} +{"train_loss": 0.007462596520781517, "global_step": 15760, "epoch": 132, "lr": 8.899726709304293e-05} +{"train_loss": 0.005744569469243288, "global_step": 15761, "epoch": 132, "lr": 8.899588048329581e-05} +{"train_loss": 0.0050502922385931015, "global_step": 15762, "epoch": 132, "lr": 8.899449379698443e-05} +{"train_loss": 0.008461239747703075, "global_step": 15763, "epoch": 132, "lr": 8.899310703411155e-05} +{"train_loss": 0.008155365474522114, "global_step": 15764, "epoch": 132, "lr": 8.899172019467986e-05} +{"train_loss": 0.0065846010111272335, "global_step": 15765, "epoch": 132, "lr": 8.899033327869208e-05} +{"train_loss": 0.009523115120828152, "global_step": 15766, "epoch": 132, "lr": 8.898894628615097e-05} +{"train_loss": 0.008355788886547089, "global_step": 15767, "epoch": 132, "lr": 8.898755921705921e-05} +{"train_loss": 0.00890517421066761, "global_step": 15768, "epoch": 132, "lr": 8.898617207141956e-05} +{"train_loss": 0.007667883299291134, "global_step": 15769, "epoch": 132, "lr": 8.898478484923472e-05} +{"train_loss": 0.005905786994844675, "global_step": 15770, "epoch": 132, "lr": 8.89833975505074e-05} +{"train_loss": 0.006635480560362339, "global_step": 15771, "epoch": 132, "lr": 8.898201017524037e-05} +{"train_loss": 0.0061804563738405704, "global_step": 15772, "epoch": 132, "lr": 8.898062272343633e-05} +{"train_loss": 0.009892201982438564, "global_step": 15773, "epoch": 132, "lr": 8.897923519509799e-05} +{"train_loss": 0.006647935602813959, "global_step": 15774, "epoch": 132, "lr": 8.897784759022806e-05} +{"train_loss": 0.010386805050075054, "global_step": 15775, "epoch": 132, "lr": 8.897645990882932e-05} +{"train_loss": 0.00440786499530077, "global_step": 15776, "epoch": 132, "lr": 8.897507215090448e-05} +{"train_loss": 0.004094437696039677, "global_step": 15777, "epoch": 132, "lr": 8.897368431645623e-05} +{"train_loss": 0.009455478750169277, "global_step": 15778, "epoch": 132, "lr": 8.897229640548731e-05} +{"train_loss": 0.00601908378303051, "global_step": 15779, "epoch": 132, "lr": 8.897090841800046e-05} +{"train_loss": 0.009251613169908524, "global_step": 15780, "epoch": 132, "lr": 8.89695203539984e-05} +{"train_loss": 0.0067351143807172775, "global_step": 15781, "epoch": 132, "lr": 8.896813221348382e-05} +{"train_loss": 0.0074209896847605705, "global_step": 15782, "epoch": 132, "lr": 8.89667439964595e-05} +{"train_loss": 0.00859871320426464, "global_step": 15783, "epoch": 132, "lr": 8.896535570292814e-05} +{"train_loss": 0.009270284324884415, "global_step": 15784, "epoch": 132, "lr": 8.896396733289247e-05} +{"train_loss": 0.0085939671844244, "global_step": 15785, "epoch": 132, "lr": 8.89625788863552e-05} +{"train_loss": 0.010325110517442226, "global_step": 15786, "epoch": 132, "lr": 8.896119036331907e-05} +{"train_loss": 0.005530655849725008, "global_step": 15787, "epoch": 132, "lr": 8.89598017637868e-05} +{"train_loss": 0.006410724483430386, "global_step": 15788, "epoch": 132, "lr": 8.895841308776114e-05} +{"train_loss": 0.009489870630204678, "global_step": 15789, "epoch": 132, "lr": 8.895702433524479e-05} +{"train_loss": 0.009814927354454994, "global_step": 15790, "epoch": 132, "lr": 8.895563550624049e-05} +{"train_loss": 0.0037062636110931635, "global_step": 15791, "epoch": 132, "lr": 8.895424660075096e-05} +{"train_loss": 0.00503620645031333, "global_step": 15792, "epoch": 132, "lr": 8.895285761877892e-05} +{"train_loss": 0.006068346090614796, "global_step": 15793, "epoch": 132, "lr": 8.895146856032712e-05} +{"train_loss": 0.0056597343645989895, "global_step": 15794, "epoch": 132, "lr": 8.895007942539826e-05} +{"train_loss": 0.00830100104212761, "global_step": 15795, "epoch": 132, "lr": 8.894869021399508e-05} +{"train_loss": 0.007222235668450594, "global_step": 15796, "epoch": 132, "lr": 8.894730092612031e-05} +{"train_loss": 0.007514966186136007, "global_step": 15797, "epoch": 132, "lr": 8.894591156177667e-05} +{"train_loss": 0.006890809629112482, "global_step": 15798, "epoch": 132, "lr": 8.894452212096691e-05} +{"train_loss": 0.00906632374972105, "global_step": 15799, "epoch": 132, "lr": 8.894313260369372e-05} +{"train_loss": 0.005892486311495304, "global_step": 15800, "epoch": 132, "lr": 8.894174300995986e-05} +{"train_loss": 0.0051847416907548904, "global_step": 15801, "epoch": 132, "lr": 8.894035333976806e-05} +{"train_loss": 0.007501012645661831, "global_step": 15802, "epoch": 132, "lr": 8.893896359312102e-05} +{"train_loss": 0.006654439028352499, "global_step": 15803, "epoch": 132, "lr": 8.893757377002149e-05} +{"train_loss": 0.005977076478302479, "global_step": 15804, "epoch": 132, "lr": 8.89361838704722e-05} +{"train_loss": 0.007584139704704285, "global_step": 15805, "epoch": 132, "lr": 8.893479389447586e-05} +{"train_loss": 0.008234115317463875, "global_step": 15806, "epoch": 132, "lr": 8.893340384203521e-05} +{"train_loss": 0.01161960233002901, "global_step": 15807, "epoch": 132, "lr": 8.893201371315299e-05} +{"train_loss": 0.005848087836056948, "global_step": 15808, "epoch": 132, "lr": 8.893062350783192e-05} +{"train_loss": 0.006166398990899324, "global_step": 15809, "epoch": 132, "lr": 8.892923322607474e-05} +{"train_loss": 0.006053395103663206, "global_step": 15810, "epoch": 132, "lr": 8.892784286788415e-05} +{"train_loss": 0.0072534214705228806, "global_step": 15811, "epoch": 132, "lr": 8.892645243326291e-05} +{"train_loss": 0.007783537730574608, "global_step": 15812, "epoch": 132, "lr": 8.892506192221374e-05} +{"train_loss": 0.007162765599787235, "global_step": 15813, "epoch": 132, "lr": 8.892367133473936e-05} +{"train_loss": 0.005322823766618967, "global_step": 15814, "epoch": 132, "lr": 8.892228067084252e-05} +{"train_loss": 0.005480207968503237, "global_step": 15815, "epoch": 132, "lr": 8.892088993052594e-05} +{"train_loss": 0.00868965219706297, "global_step": 15816, "epoch": 132, "lr": 8.891949911379236e-05} +{"train_loss": 0.007199534215033054, "global_step": 15817, "epoch": 132, "lr": 8.891810822064449e-05} +{"train_loss": 0.002815915970131755, "global_step": 15818, "epoch": 132, "lr": 8.891671725108506e-05} +{"train_loss": 0.005393421743065119, "global_step": 15819, "epoch": 132, "lr": 8.891532620511682e-05} +{"train_loss": 0.004782764241099358, "global_step": 15820, "epoch": 132, "lr": 8.89139350827425e-05} +{"train_loss": 0.011346773244440556, "global_step": 15821, "epoch": 132, "lr": 8.891254388396483e-05} +{"train_loss": 0.0036348821595311165, "global_step": 15822, "epoch": 132, "lr": 8.891115260878653e-05} +{"train_loss": 0.007648048456758261, "global_step": 15823, "epoch": 132, "lr": 8.890976125721036e-05} +{"train_loss": 0.008149489760398865, "global_step": 15824, "epoch": 132, "lr": 8.890836982923901e-05} +{"train_loss": 0.006499953102320433, "global_step": 15825, "epoch": 132, "lr": 8.890697832487522e-05} +{"train_loss": 0.006732554088871018, "global_step": 15826, "epoch": 132, "lr": 8.890558674412174e-05, "val_loss": 0.015476357191801071} +{"train_loss": 0.006278547458350658, "global_step": 15827, "epoch": 133, "lr": 8.89041950869813e-05} +{"train_loss": 0.007096599787473679, "global_step": 15828, "epoch": 133, "lr": 8.890280335345666e-05} +{"train_loss": 0.006426307372748852, "global_step": 15829, "epoch": 133, "lr": 8.89014115435505e-05} +{"train_loss": 0.008550833910703659, "global_step": 15830, "epoch": 133, "lr": 8.890001965726555e-05} +{"train_loss": 0.007137707434594631, "global_step": 15831, "epoch": 133, "lr": 8.88986276946046e-05} +{"train_loss": 0.005174865014851093, "global_step": 15832, "epoch": 133, "lr": 8.889723565557033e-05} +{"train_loss": 0.007744730915874243, "global_step": 15833, "epoch": 133, "lr": 8.889584354016552e-05} +{"train_loss": 0.0069798873737454414, "global_step": 15834, "epoch": 133, "lr": 8.889445134839284e-05} +{"train_loss": 0.006069740280508995, "global_step": 15835, "epoch": 133, "lr": 8.88930590802551e-05} +{"train_loss": 0.006289372686296701, "global_step": 15836, "epoch": 133, "lr": 8.889166673575496e-05} +{"train_loss": 0.009063014760613441, "global_step": 15837, "epoch": 133, "lr": 8.88902743148952e-05} +{"train_loss": 0.005286511965095997, "global_step": 15838, "epoch": 133, "lr": 8.888888181767854e-05} +{"train_loss": 0.008585703559219837, "global_step": 15839, "epoch": 133, "lr": 8.888748924410773e-05} +{"train_loss": 0.007137706037610769, "global_step": 15840, "epoch": 133, "lr": 8.888609659418548e-05} +{"train_loss": 0.006145311053842306, "global_step": 15841, "epoch": 133, "lr": 8.888470386791453e-05} +{"train_loss": 0.006884654518216848, "global_step": 15842, "epoch": 133, "lr": 8.888331106529762e-05} +{"train_loss": 0.005955126602202654, "global_step": 15843, "epoch": 133, "lr": 8.888191818633746e-05} +{"train_loss": 0.005230567418038845, "global_step": 15844, "epoch": 133, "lr": 8.888052523103682e-05} +{"train_loss": 0.0073414333164691925, "global_step": 15845, "epoch": 133, "lr": 8.887913219939844e-05} +{"train_loss": 0.009738558903336525, "global_step": 15846, "epoch": 133, "lr": 8.887773909142502e-05} +{"train_loss": 0.00801561027765274, "global_step": 15847, "epoch": 133, "lr": 8.887634590711933e-05} +{"train_loss": 0.005924811586737633, "global_step": 15848, "epoch": 133, "lr": 8.88749526464841e-05} +{"train_loss": 0.008132977411150932, "global_step": 15849, "epoch": 133, "lr": 8.887355930952201e-05} +{"train_loss": 0.004604834597557783, "global_step": 15850, "epoch": 133, "lr": 8.887216589623586e-05} +{"train_loss": 0.005123491398990154, "global_step": 15851, "epoch": 133, "lr": 8.887077240662837e-05} +{"train_loss": 0.005200813990086317, "global_step": 15852, "epoch": 133, "lr": 8.886937884070228e-05} +{"train_loss": 0.0049690017476677895, "global_step": 15853, "epoch": 133, "lr": 8.886798519846029e-05} +{"train_loss": 0.006593191530555487, "global_step": 15854, "epoch": 133, "lr": 8.886659147990519e-05} +{"train_loss": 0.00813438929617405, "global_step": 15855, "epoch": 133, "lr": 8.886519768503967e-05} +{"train_loss": 0.0064842295832931995, "global_step": 15856, "epoch": 133, "lr": 8.88638038138665e-05} +{"train_loss": 0.008689614944159985, "global_step": 15857, "epoch": 133, "lr": 8.886240986638839e-05} +{"train_loss": 0.004096542950719595, "global_step": 15858, "epoch": 133, "lr": 8.886101584260811e-05} +{"train_loss": 0.006067189387977123, "global_step": 15859, "epoch": 133, "lr": 8.885962174252836e-05} +{"train_loss": 0.004080935847014189, "global_step": 15860, "epoch": 133, "lr": 8.88582275661519e-05} +{"train_loss": 0.007498592603951693, "global_step": 15861, "epoch": 133, "lr": 8.885683331348147e-05} +{"train_loss": 0.00547729292884469, "global_step": 15862, "epoch": 133, "lr": 8.885543898451978e-05} +{"train_loss": 0.006316331680864096, "global_step": 15863, "epoch": 133, "lr": 8.88540445792696e-05} +{"train_loss": 0.007123391143977642, "global_step": 15864, "epoch": 133, "lr": 8.885265009773364e-05} +{"train_loss": 0.00794513151049614, "global_step": 15865, "epoch": 133, "lr": 8.885125553991468e-05} +{"train_loss": 0.006875710561871529, "global_step": 15866, "epoch": 133, "lr": 8.884986090581542e-05} +{"train_loss": 0.009701680392026901, "global_step": 15867, "epoch": 133, "lr": 8.884846619543859e-05} +{"train_loss": 0.006523464806377888, "global_step": 15868, "epoch": 133, "lr": 8.884707140878696e-05} +{"train_loss": 0.005450741853564978, "global_step": 15869, "epoch": 133, "lr": 8.884567654586326e-05} +{"train_loss": 0.007964050397276878, "global_step": 15870, "epoch": 133, "lr": 8.884428160667023e-05} +{"train_loss": 0.007826346904039383, "global_step": 15871, "epoch": 133, "lr": 8.884288659121058e-05} +{"train_loss": 0.004696939140558243, "global_step": 15872, "epoch": 133, "lr": 8.884149149948708e-05} +{"train_loss": 0.005068832542747259, "global_step": 15873, "epoch": 133, "lr": 8.884009633150248e-05} +{"train_loss": 0.003908770624548197, "global_step": 15874, "epoch": 133, "lr": 8.883870108725947e-05} +{"train_loss": 0.005062203388661146, "global_step": 15875, "epoch": 133, "lr": 8.883730576676083e-05} +{"train_loss": 0.006741207093000412, "global_step": 15876, "epoch": 133, "lr": 8.883591037000932e-05} +{"train_loss": 0.005281713791191578, "global_step": 15877, "epoch": 133, "lr": 8.883451489700761e-05} +{"train_loss": 0.008663502521812916, "global_step": 15878, "epoch": 133, "lr": 8.883311934775849e-05} +{"train_loss": 0.01228329073637724, "global_step": 15879, "epoch": 133, "lr": 8.88317237222647e-05} +{"train_loss": 0.00797322392463684, "global_step": 15880, "epoch": 133, "lr": 8.883032802052895e-05} +{"train_loss": 0.006975655443966389, "global_step": 15881, "epoch": 133, "lr": 8.882893224255402e-05} +{"train_loss": 0.005829768255352974, "global_step": 15882, "epoch": 133, "lr": 8.882753638834262e-05} +{"train_loss": 0.008466813713312149, "global_step": 15883, "epoch": 133, "lr": 8.88261404578975e-05} +{"train_loss": 0.0051802643574774265, "global_step": 15884, "epoch": 133, "lr": 8.88247444512214e-05} +{"train_loss": 0.006396681535989046, "global_step": 15885, "epoch": 133, "lr": 8.882334836831706e-05} +{"train_loss": 0.007569142151623964, "global_step": 15886, "epoch": 133, "lr": 8.882195220918723e-05} +{"train_loss": 0.00754524813964963, "global_step": 15887, "epoch": 133, "lr": 8.882055597383463e-05} +{"train_loss": 0.00552706653252244, "global_step": 15888, "epoch": 133, "lr": 8.881915966226203e-05} +{"train_loss": 0.004757487680763006, "global_step": 15889, "epoch": 133, "lr": 8.881776327447215e-05} +{"train_loss": 0.008588693104684353, "global_step": 15890, "epoch": 133, "lr": 8.881636681046774e-05} +{"train_loss": 0.007932290434837341, "global_step": 15891, "epoch": 133, "lr": 8.881497027025155e-05} +{"train_loss": 0.0063017127104103565, "global_step": 15892, "epoch": 133, "lr": 8.881357365382631e-05} +{"train_loss": 0.007862288504838943, "global_step": 15893, "epoch": 133, "lr": 8.881217696119476e-05} +{"train_loss": 0.0067061264999210835, "global_step": 15894, "epoch": 133, "lr": 8.881078019235965e-05} +{"train_loss": 0.004846096970140934, "global_step": 15895, "epoch": 133, "lr": 8.880938334732372e-05} +{"train_loss": 0.007321661803871393, "global_step": 15896, "epoch": 133, "lr": 8.88079864260897e-05} +{"train_loss": 0.0061906250193715096, "global_step": 15897, "epoch": 133, "lr": 8.880658942866036e-05} +{"train_loss": 0.011881956830620766, "global_step": 15898, "epoch": 133, "lr": 8.880519235503842e-05} +{"train_loss": 0.007701532915234566, "global_step": 15899, "epoch": 133, "lr": 8.880379520522664e-05} +{"train_loss": 0.006907668896019459, "global_step": 15900, "epoch": 133, "lr": 8.880239797922773e-05} +{"train_loss": 0.005354647524654865, "global_step": 15901, "epoch": 133, "lr": 8.880100067704447e-05} +{"train_loss": 0.004570504650473595, "global_step": 15902, "epoch": 133, "lr": 8.87996032986796e-05} +{"train_loss": 0.009539999067783356, "global_step": 15903, "epoch": 133, "lr": 8.879820584413586e-05} +{"train_loss": 0.008464407175779343, "global_step": 15904, "epoch": 133, "lr": 8.879680831341595e-05} +{"train_loss": 0.0064821611158549786, "global_step": 15905, "epoch": 133, "lr": 8.879541070652268e-05} +{"train_loss": 0.009572935290634632, "global_step": 15906, "epoch": 133, "lr": 8.879401302345878e-05} +{"train_loss": 0.007178712636232376, "global_step": 15907, "epoch": 133, "lr": 8.879261526422695e-05} +{"train_loss": 0.006161001045256853, "global_step": 15908, "epoch": 133, "lr": 8.879121742882998e-05} +{"train_loss": 0.00557269062846899, "global_step": 15909, "epoch": 133, "lr": 8.87898195172706e-05} +{"train_loss": 0.009626248851418495, "global_step": 15910, "epoch": 133, "lr": 8.878842152955153e-05} +{"train_loss": 0.006179896183311939, "global_step": 15911, "epoch": 133, "lr": 8.878702346567557e-05} +{"train_loss": 0.007560244761407375, "global_step": 15912, "epoch": 133, "lr": 8.878562532564543e-05} +{"train_loss": 0.006253332365304232, "global_step": 15913, "epoch": 133, "lr": 8.878422710946384e-05} +{"train_loss": 0.007785213179886341, "global_step": 15914, "epoch": 133, "lr": 8.878282881713358e-05} +{"train_loss": 0.010936316102743149, "global_step": 15915, "epoch": 133, "lr": 8.878143044865737e-05} +{"train_loss": 0.008556372486054897, "global_step": 15916, "epoch": 133, "lr": 8.878003200403796e-05} +{"train_loss": 0.006526369135826826, "global_step": 15917, "epoch": 133, "lr": 8.87786334832781e-05} +{"train_loss": 0.007230641786009073, "global_step": 15918, "epoch": 133, "lr": 8.877723488638055e-05} +{"train_loss": 0.006853532046079636, "global_step": 15919, "epoch": 133, "lr": 8.877583621334803e-05} +{"train_loss": 0.004638747312128544, "global_step": 15920, "epoch": 133, "lr": 8.87744374641833e-05} +{"train_loss": 0.0040308707393705845, "global_step": 15921, "epoch": 133, "lr": 8.877303863888911e-05} +{"train_loss": 0.00451975641772151, "global_step": 15922, "epoch": 133, "lr": 8.87716397374682e-05} +{"train_loss": 0.006738296709954739, "global_step": 15923, "epoch": 133, "lr": 8.87702407599233e-05} +{"train_loss": 0.008754520677030087, "global_step": 15924, "epoch": 133, "lr": 8.87688417062572e-05} +{"train_loss": 0.0071063172072172165, "global_step": 15925, "epoch": 133, "lr": 8.876744257647261e-05} +{"train_loss": 0.006060381885617971, "global_step": 15926, "epoch": 133, "lr": 8.876604337057228e-05} +{"train_loss": 0.006945513654500246, "global_step": 15927, "epoch": 133, "lr": 8.876464408855898e-05} +{"train_loss": 0.00759553536772728, "global_step": 15928, "epoch": 133, "lr": 8.876324473043545e-05} +{"train_loss": 0.007925769314169884, "global_step": 15929, "epoch": 133, "lr": 8.876184529620441e-05} +{"train_loss": 0.005975788459181786, "global_step": 15930, "epoch": 133, "lr": 8.876044578586864e-05} +{"train_loss": 0.005458969157189131, "global_step": 15931, "epoch": 133, "lr": 8.875904619943086e-05} +{"train_loss": 0.009047683328390121, "global_step": 15932, "epoch": 133, "lr": 8.875764653689385e-05} +{"train_loss": 0.008979693055152893, "global_step": 15933, "epoch": 133, "lr": 8.875624679826034e-05} +{"train_loss": 0.005987927783280611, "global_step": 15934, "epoch": 133, "lr": 8.875484698353307e-05} +{"train_loss": 0.0062162368558347225, "global_step": 15935, "epoch": 133, "lr": 8.87534470927148e-05} +{"train_loss": 0.006522777024656534, "global_step": 15936, "epoch": 133, "lr": 8.875204712580828e-05} +{"train_loss": 0.0062157814390957355, "global_step": 15937, "epoch": 133, "lr": 8.875064708281626e-05} +{"train_loss": 0.005946266930550337, "global_step": 15938, "epoch": 133, "lr": 8.874924696374148e-05} +{"train_loss": 0.006863201968371868, "global_step": 15939, "epoch": 133, "lr": 8.87478467685867e-05} +{"train_loss": 0.007210597861558199, "global_step": 15940, "epoch": 133, "lr": 8.874644649735464e-05} +{"train_loss": 0.006366630084812641, "global_step": 15941, "epoch": 133, "lr": 8.874504615004809e-05} +{"train_loss": 0.005893663968890905, "global_step": 15942, "epoch": 133, "lr": 8.874364572666978e-05} +{"train_loss": 0.011057255789637566, "global_step": 15943, "epoch": 133, "lr": 8.874224522722247e-05} +{"train_loss": 0.005335033405572176, "global_step": 15944, "epoch": 133, "lr": 8.87408446517089e-05} +{"train_loss": 0.006878039897458644, "global_step": 15945, "epoch": 133, "lr": 8.87394440001318e-05, "val_loss": 0.016388988122344017} +{"train_loss": 0.006404302082955837, "global_step": 15946, "epoch": 134, "lr": 8.873804327249395e-05} +{"train_loss": 0.008259669877588749, "global_step": 15947, "epoch": 134, "lr": 8.873664246879809e-05} +{"train_loss": 0.005620116833597422, "global_step": 15948, "epoch": 134, "lr": 8.873524158904697e-05} +{"train_loss": 0.007927033118903637, "global_step": 15949, "epoch": 134, "lr": 8.873384063324335e-05} +{"train_loss": 0.005967685487121344, "global_step": 15950, "epoch": 134, "lr": 8.873243960138998e-05} +{"train_loss": 0.006549436133354902, "global_step": 15951, "epoch": 134, "lr": 8.873103849348957e-05} +{"train_loss": 0.006916188169270754, "global_step": 15952, "epoch": 134, "lr": 8.872963730954492e-05} +{"train_loss": 0.006242590025067329, "global_step": 15953, "epoch": 134, "lr": 8.872823604955877e-05} +{"train_loss": 0.008135414682328701, "global_step": 15954, "epoch": 134, "lr": 8.872683471353387e-05} +{"train_loss": 0.007441033609211445, "global_step": 15955, "epoch": 134, "lr": 8.872543330147296e-05} +{"train_loss": 0.005032687447965145, "global_step": 15956, "epoch": 134, "lr": 8.87240318133788e-05} +{"train_loss": 0.006783875171095133, "global_step": 15957, "epoch": 134, "lr": 8.872263024925413e-05} +{"train_loss": 0.007422780618071556, "global_step": 15958, "epoch": 134, "lr": 8.872122860910172e-05} +{"train_loss": 0.007486899383366108, "global_step": 15959, "epoch": 134, "lr": 8.871982689292433e-05} +{"train_loss": 0.0057647135108709335, "global_step": 15960, "epoch": 134, "lr": 8.871842510072468e-05} +{"train_loss": 0.004121188074350357, "global_step": 15961, "epoch": 134, "lr": 8.871702323250554e-05} +{"train_loss": 0.006569346878677607, "global_step": 15962, "epoch": 134, "lr": 8.871562128826967e-05} +{"train_loss": 0.009186393581330776, "global_step": 15963, "epoch": 134, "lr": 8.87142192680198e-05} +{"train_loss": 0.008867260068655014, "global_step": 15964, "epoch": 134, "lr": 8.871281717175871e-05} +{"train_loss": 0.006112484727054834, "global_step": 15965, "epoch": 134, "lr": 8.871141499948914e-05} +{"train_loss": 0.004383711609989405, "global_step": 15966, "epoch": 134, "lr": 8.871001275121382e-05} +{"train_loss": 0.007138838060200214, "global_step": 15967, "epoch": 134, "lr": 8.870861042693554e-05} +{"train_loss": 0.0035891723819077015, "global_step": 15968, "epoch": 134, "lr": 8.870720802665705e-05} +{"train_loss": 0.007714816834777594, "global_step": 15969, "epoch": 134, "lr": 8.870580555038108e-05} +{"train_loss": 0.006002009846270084, "global_step": 15970, "epoch": 134, "lr": 8.87044029981104e-05} +{"train_loss": 0.005678337998688221, "global_step": 15971, "epoch": 134, "lr": 8.870300036984776e-05} +{"train_loss": 0.006693988107144833, "global_step": 15972, "epoch": 134, "lr": 8.870159766559592e-05} +{"train_loss": 0.006512417457997799, "global_step": 15973, "epoch": 134, "lr": 8.870019488535761e-05} +{"train_loss": 0.007868143729865551, "global_step": 15974, "epoch": 134, "lr": 8.86987920291356e-05} +{"train_loss": 0.0069196829572319984, "global_step": 15975, "epoch": 134, "lr": 8.869738909693266e-05} +{"train_loss": 0.00498627033084631, "global_step": 15976, "epoch": 134, "lr": 8.869598608875154e-05} +{"train_loss": 0.007142811082303524, "global_step": 15977, "epoch": 134, "lr": 8.869458300459496e-05} +{"train_loss": 0.008807322010397911, "global_step": 15978, "epoch": 134, "lr": 8.869317984446572e-05} +{"train_loss": 0.005271353293210268, "global_step": 15979, "epoch": 134, "lr": 8.869177660836655e-05} +{"train_loss": 0.006640761159360409, "global_step": 15980, "epoch": 134, "lr": 8.869037329630021e-05} +{"train_loss": 0.010435743257403374, "global_step": 15981, "epoch": 134, "lr": 8.868896990826945e-05} +{"train_loss": 0.005573988426476717, "global_step": 15982, "epoch": 134, "lr": 8.868756644427704e-05} +{"train_loss": 0.008965743705630302, "global_step": 15983, "epoch": 134, "lr": 8.868616290432571e-05} +{"train_loss": 0.0066187032498419285, "global_step": 15984, "epoch": 134, "lr": 8.868475928841825e-05} +{"train_loss": 0.0076542142778635025, "global_step": 15985, "epoch": 134, "lr": 8.868335559655739e-05} +{"train_loss": 0.007418016903102398, "global_step": 15986, "epoch": 134, "lr": 8.868195182874591e-05} +{"train_loss": 0.007593423593789339, "global_step": 15987, "epoch": 134, "lr": 8.868054798498653e-05} +{"train_loss": 0.00523875979706645, "global_step": 15988, "epoch": 134, "lr": 8.867914406528203e-05} +{"train_loss": 0.008121581748127937, "global_step": 15989, "epoch": 134, "lr": 8.867774006963516e-05} +{"train_loss": 0.005410728044807911, "global_step": 15990, "epoch": 134, "lr": 8.867633599804868e-05} +{"train_loss": 0.00583912106230855, "global_step": 15991, "epoch": 134, "lr": 8.867493185052536e-05} +{"train_loss": 0.009073815308511257, "global_step": 15992, "epoch": 134, "lr": 8.867352762706793e-05} +{"train_loss": 0.0060010128654539585, "global_step": 15993, "epoch": 134, "lr": 8.867212332767916e-05} +{"train_loss": 0.005464700050652027, "global_step": 15994, "epoch": 134, "lr": 8.867071895236181e-05} +{"train_loss": 0.008181175217032433, "global_step": 15995, "epoch": 134, "lr": 8.866931450111864e-05} +{"train_loss": 0.007707581855356693, "global_step": 15996, "epoch": 134, "lr": 8.86679099739524e-05} +{"train_loss": 0.0037615024484694004, "global_step": 15997, "epoch": 134, "lr": 8.866650537086585e-05} +{"train_loss": 0.005989641882479191, "global_step": 15998, "epoch": 134, "lr": 8.866510069186174e-05} +{"train_loss": 0.005079549737274647, "global_step": 15999, "epoch": 134, "lr": 8.866369593694285e-05} +{"train_loss": 0.010269025340676308, "global_step": 16000, "epoch": 134, "lr": 8.866229110611191e-05} +{"train_loss": 0.006225548218935728, "global_step": 16001, "epoch": 134, "lr": 8.866088619937169e-05} +{"train_loss": 0.007515233941376209, "global_step": 16002, "epoch": 134, "lr": 8.865948121672496e-05} +{"train_loss": 0.005562750156968832, "global_step": 16003, "epoch": 134, "lr": 8.865807615817447e-05} +{"train_loss": 0.009241084568202496, "global_step": 16004, "epoch": 134, "lr": 8.865667102372297e-05} +{"train_loss": 0.00790480338037014, "global_step": 16005, "epoch": 134, "lr": 8.865526581337324e-05} +{"train_loss": 0.006685697007924318, "global_step": 16006, "epoch": 134, "lr": 8.865386052712801e-05} +{"train_loss": 0.0063003962859511375, "global_step": 16007, "epoch": 134, "lr": 8.865245516499005e-05} +{"train_loss": 0.008579447865486145, "global_step": 16008, "epoch": 134, "lr": 8.865104972696215e-05} +{"train_loss": 0.004318917170166969, "global_step": 16009, "epoch": 134, "lr": 8.864964421304703e-05} +{"train_loss": 0.0043786740861833096, "global_step": 16010, "epoch": 134, "lr": 8.864823862324745e-05} +{"train_loss": 0.004876749124377966, "global_step": 16011, "epoch": 134, "lr": 8.86468329575662e-05} +{"train_loss": 0.0045653753913939, "global_step": 16012, "epoch": 134, "lr": 8.8645427216006e-05} +{"train_loss": 0.005139055196195841, "global_step": 16013, "epoch": 134, "lr": 8.864402139856964e-05} +{"train_loss": 0.007412464823573828, "global_step": 16014, "epoch": 134, "lr": 8.864261550525989e-05} +{"train_loss": 0.006624679546803236, "global_step": 16015, "epoch": 134, "lr": 8.864120953607948e-05} +{"train_loss": 0.006118024233728647, "global_step": 16016, "epoch": 134, "lr": 8.863980349103119e-05} +{"train_loss": 0.005457398481667042, "global_step": 16017, "epoch": 134, "lr": 8.863839737011777e-05} +{"train_loss": 0.005883124656975269, "global_step": 16018, "epoch": 134, "lr": 8.863699117334197e-05} +{"train_loss": 0.007644428871572018, "global_step": 16019, "epoch": 134, "lr": 8.863558490070658e-05} +{"train_loss": 0.005565466824918985, "global_step": 16020, "epoch": 134, "lr": 8.863417855221435e-05} +{"train_loss": 0.006512013264000416, "global_step": 16021, "epoch": 134, "lr": 8.863277212786802e-05} +{"train_loss": 0.006023875903338194, "global_step": 16022, "epoch": 134, "lr": 8.863136562767039e-05} +{"train_loss": 0.008341103792190552, "global_step": 16023, "epoch": 134, "lr": 8.862995905162419e-05} +{"train_loss": 0.005160103086382151, "global_step": 16024, "epoch": 134, "lr": 8.86285523997322e-05} +{"train_loss": 0.006680675316601992, "global_step": 16025, "epoch": 134, "lr": 8.862714567199717e-05} +{"train_loss": 0.005996780935674906, "global_step": 16026, "epoch": 134, "lr": 8.862573886842188e-05} +{"train_loss": 0.005316075868904591, "global_step": 16027, "epoch": 134, "lr": 8.862433198900906e-05} +{"train_loss": 0.004321604035794735, "global_step": 16028, "epoch": 134, "lr": 8.862292503376148e-05} +{"train_loss": 0.006000041030347347, "global_step": 16029, "epoch": 134, "lr": 8.862151800268193e-05} +{"train_loss": 0.005550449248403311, "global_step": 16030, "epoch": 134, "lr": 8.862011089577316e-05} +{"train_loss": 0.005759795196354389, "global_step": 16031, "epoch": 134, "lr": 8.861870371303793e-05} +{"train_loss": 0.008887558244168758, "global_step": 16032, "epoch": 134, "lr": 8.861729645447898e-05} +{"train_loss": 0.00692120473831892, "global_step": 16033, "epoch": 134, "lr": 8.861588912009911e-05} +{"train_loss": 0.008487789891660213, "global_step": 16034, "epoch": 134, "lr": 8.861448170990106e-05} +{"train_loss": 0.0047501372173428535, "global_step": 16035, "epoch": 134, "lr": 8.86130742238876e-05} +{"train_loss": 0.005275646224617958, "global_step": 16036, "epoch": 134, "lr": 8.861166666206152e-05} +{"train_loss": 0.004789190366864204, "global_step": 16037, "epoch": 134, "lr": 8.861025902442552e-05} +{"train_loss": 0.007869884371757507, "global_step": 16038, "epoch": 134, "lr": 8.860885131098242e-05} +{"train_loss": 0.007149037905037403, "global_step": 16039, "epoch": 134, "lr": 8.860744352173495e-05} +{"train_loss": 0.005499935243278742, "global_step": 16040, "epoch": 134, "lr": 8.860603565668591e-05} +{"train_loss": 0.00491585535928607, "global_step": 16041, "epoch": 134, "lr": 8.860462771583804e-05} +{"train_loss": 0.008838276378810406, "global_step": 16042, "epoch": 134, "lr": 8.860321969919409e-05} +{"train_loss": 0.004670999478548765, "global_step": 16043, "epoch": 134, "lr": 8.860181160675687e-05} +{"train_loss": 0.009354501031339169, "global_step": 16044, "epoch": 134, "lr": 8.860040343852908e-05} +{"train_loss": 0.0073682083748281, "global_step": 16045, "epoch": 134, "lr": 8.859899519451356e-05} +{"train_loss": 0.004522165283560753, "global_step": 16046, "epoch": 134, "lr": 8.859758687471302e-05} +{"train_loss": 0.00883612409234047, "global_step": 16047, "epoch": 134, "lr": 8.859617847913024e-05} +{"train_loss": 0.003996104001998901, "global_step": 16048, "epoch": 134, "lr": 8.8594770007768e-05} +{"train_loss": 0.0078218849375844, "global_step": 16049, "epoch": 134, "lr": 8.859336146062903e-05} +{"train_loss": 0.0063764965161681175, "global_step": 16050, "epoch": 134, "lr": 8.859195283771612e-05} +{"train_loss": 0.00649860268458724, "global_step": 16051, "epoch": 134, "lr": 8.859054413903205e-05} +{"train_loss": 0.004189581144601107, "global_step": 16052, "epoch": 134, "lr": 8.858913536457956e-05} +{"train_loss": 0.008512955158948898, "global_step": 16053, "epoch": 134, "lr": 8.858772651436142e-05} +{"train_loss": 0.006046661641448736, "global_step": 16054, "epoch": 134, "lr": 8.858631758838042e-05} +{"train_loss": 0.006145225837826729, "global_step": 16055, "epoch": 134, "lr": 8.85849085866393e-05} +{"train_loss": 0.006417372729629278, "global_step": 16056, "epoch": 134, "lr": 8.858349950914083e-05} +{"train_loss": 0.006024195812642574, "global_step": 16057, "epoch": 134, "lr": 8.858209035588778e-05} +{"train_loss": 0.00524927768856287, "global_step": 16058, "epoch": 134, "lr": 8.858068112688292e-05} +{"train_loss": 0.0058642905205488205, "global_step": 16059, "epoch": 134, "lr": 8.857927182212902e-05} +{"train_loss": 0.007958296686410904, "global_step": 16060, "epoch": 134, "lr": 8.857786244162882e-05} +{"train_loss": 0.00408859783783555, "global_step": 16061, "epoch": 134, "lr": 8.857645298538512e-05} +{"train_loss": 0.004526153206825256, "global_step": 16062, "epoch": 134, "lr": 8.857504345340068e-05} +{"train_loss": 0.009424678049981594, "global_step": 16063, "epoch": 134, "lr": 8.857363384567828e-05} +{"train_loss": 0.006521934287293869, "global_step": 16064, "epoch": 134, "lr": 8.857222416222064e-05, "val_loss": 0.016664016991853714} +{"train_loss": 0.0030917536932975054, "global_step": 16065, "epoch": 135, "lr": 8.857081440303058e-05} +{"train_loss": 0.004765971098095179, "global_step": 16066, "epoch": 135, "lr": 8.856940456811084e-05} +{"train_loss": 0.008036796003580093, "global_step": 16067, "epoch": 135, "lr": 8.856799465746418e-05} +{"train_loss": 0.005738282110542059, "global_step": 16068, "epoch": 135, "lr": 8.85665846710934e-05} +{"train_loss": 0.00736437551677227, "global_step": 16069, "epoch": 135, "lr": 8.856517460900124e-05} +{"train_loss": 0.005029756110161543, "global_step": 16070, "epoch": 135, "lr": 8.85637644711905e-05} +{"train_loss": 0.003502550069242716, "global_step": 16071, "epoch": 135, "lr": 8.856235425766392e-05} +{"train_loss": 0.004980709403753281, "global_step": 16072, "epoch": 135, "lr": 8.856094396842427e-05} +{"train_loss": 0.0044213589280843735, "global_step": 16073, "epoch": 135, "lr": 8.855953360347433e-05} +{"train_loss": 0.005236118100583553, "global_step": 16074, "epoch": 135, "lr": 8.855812316281686e-05} +{"train_loss": 0.0072380658239126205, "global_step": 16075, "epoch": 135, "lr": 8.855671264645465e-05} +{"train_loss": 0.004892904311418533, "global_step": 16076, "epoch": 135, "lr": 8.855530205439042e-05} +{"train_loss": 0.007019722368568182, "global_step": 16077, "epoch": 135, "lr": 8.8553891386627e-05} +{"train_loss": 0.004318288993090391, "global_step": 16078, "epoch": 135, "lr": 8.855248064316714e-05} +{"train_loss": 0.0047836690209805965, "global_step": 16079, "epoch": 135, "lr": 8.855106982401358e-05} +{"train_loss": 0.003984044771641493, "global_step": 16080, "epoch": 135, "lr": 8.854965892916913e-05} +{"train_loss": 0.007286929991096258, "global_step": 16081, "epoch": 135, "lr": 8.854824795863654e-05} +{"train_loss": 0.005061884876340628, "global_step": 16082, "epoch": 135, "lr": 8.854683691241859e-05} +{"train_loss": 0.005755221471190453, "global_step": 16083, "epoch": 135, "lr": 8.854542579051804e-05} +{"train_loss": 0.006942876148968935, "global_step": 16084, "epoch": 135, "lr": 8.854401459293764e-05} +{"train_loss": 0.005484743043780327, "global_step": 16085, "epoch": 135, "lr": 8.85426033196802e-05} +{"train_loss": 0.0034348582848906517, "global_step": 16086, "epoch": 135, "lr": 8.854119197074849e-05} +{"train_loss": 0.005028220359236002, "global_step": 16087, "epoch": 135, "lr": 8.853978054614527e-05} +{"train_loss": 0.005726912524551153, "global_step": 16088, "epoch": 135, "lr": 8.853836904587329e-05} +{"train_loss": 0.0050130849704146385, "global_step": 16089, "epoch": 135, "lr": 8.853695746993535e-05} +{"train_loss": 0.00795786827802658, "global_step": 16090, "epoch": 135, "lr": 8.85355458183342e-05} +{"train_loss": 0.006887165363878012, "global_step": 16091, "epoch": 135, "lr": 8.853413409107263e-05} +{"train_loss": 0.004043372813612223, "global_step": 16092, "epoch": 135, "lr": 8.85327222881534e-05} +{"train_loss": 0.008512589149177074, "global_step": 16093, "epoch": 135, "lr": 8.853131040957929e-05} +{"train_loss": 0.00304955942556262, "global_step": 16094, "epoch": 135, "lr": 8.852989845535306e-05} +{"train_loss": 0.004845128860324621, "global_step": 16095, "epoch": 135, "lr": 8.852848642547751e-05} +{"train_loss": 0.004272265359759331, "global_step": 16096, "epoch": 135, "lr": 8.85270743199554e-05} +{"train_loss": 0.004139356315135956, "global_step": 16097, "epoch": 135, "lr": 8.852566213878947e-05} +{"train_loss": 0.005836732219904661, "global_step": 16098, "epoch": 135, "lr": 8.852424988198252e-05} +{"train_loss": 0.006179048214107752, "global_step": 16099, "epoch": 135, "lr": 8.852283754953732e-05} +{"train_loss": 0.004360854625701904, "global_step": 16100, "epoch": 135, "lr": 8.852142514145665e-05} +{"train_loss": 0.007192743010818958, "global_step": 16101, "epoch": 135, "lr": 8.852001265774329e-05} +{"train_loss": 0.0026830281130969524, "global_step": 16102, "epoch": 135, "lr": 8.851860009839999e-05} +{"train_loss": 0.0049321711994707584, "global_step": 16103, "epoch": 135, "lr": 8.851718746342954e-05} +{"train_loss": 0.007787695154547691, "global_step": 16104, "epoch": 135, "lr": 8.85157747528347e-05} +{"train_loss": 0.0056947972625494, "global_step": 16105, "epoch": 135, "lr": 8.851436196661825e-05} +{"train_loss": 0.005162492394447327, "global_step": 16106, "epoch": 135, "lr": 8.851294910478296e-05} +{"train_loss": 0.005714903585612774, "global_step": 16107, "epoch": 135, "lr": 8.851153616733162e-05} +{"train_loss": 0.007406739518046379, "global_step": 16108, "epoch": 135, "lr": 8.8510123154267e-05} +{"train_loss": 0.0073692770674824715, "global_step": 16109, "epoch": 135, "lr": 8.850871006559186e-05} +{"train_loss": 0.0038652638904750347, "global_step": 16110, "epoch": 135, "lr": 8.850729690130897e-05} +{"train_loss": 0.006899338215589523, "global_step": 16111, "epoch": 135, "lr": 8.850588366142112e-05} +{"train_loss": 0.005137783475220203, "global_step": 16112, "epoch": 135, "lr": 8.850447034593109e-05} +{"train_loss": 0.009967896156013012, "global_step": 16113, "epoch": 135, "lr": 8.850305695484163e-05} +{"train_loss": 0.006217524874955416, "global_step": 16114, "epoch": 135, "lr": 8.850164348815555e-05} +{"train_loss": 0.005612634588032961, "global_step": 16115, "epoch": 135, "lr": 8.85002299458756e-05} +{"train_loss": 0.004656116012483835, "global_step": 16116, "epoch": 135, "lr": 8.849881632800455e-05} +{"train_loss": 0.011262891814112663, "global_step": 16117, "epoch": 135, "lr": 8.84974026345452e-05} +{"train_loss": 0.008505402132868767, "global_step": 16118, "epoch": 135, "lr": 8.84959888655003e-05} +{"train_loss": 0.005957203451544046, "global_step": 16119, "epoch": 135, "lr": 8.849457502087266e-05} +{"train_loss": 0.0052192737348377705, "global_step": 16120, "epoch": 135, "lr": 8.849316110066503e-05} +{"train_loss": 0.007222122512757778, "global_step": 16121, "epoch": 135, "lr": 8.849174710488018e-05} +{"train_loss": 0.004717243369668722, "global_step": 16122, "epoch": 135, "lr": 8.84903330335209e-05} +{"train_loss": 0.0069129206240177155, "global_step": 16123, "epoch": 135, "lr": 8.848891888658997e-05} +{"train_loss": 0.009526818059384823, "global_step": 16124, "epoch": 135, "lr": 8.848750466409015e-05} +{"train_loss": 0.008384020999073982, "global_step": 16125, "epoch": 135, "lr": 8.848609036602423e-05} +{"train_loss": 0.006124281790107489, "global_step": 16126, "epoch": 135, "lr": 8.848467599239498e-05} +{"train_loss": 0.00667806901037693, "global_step": 16127, "epoch": 135, "lr": 8.848326154320518e-05} +{"train_loss": 0.00792575441300869, "global_step": 16128, "epoch": 135, "lr": 8.84818470184576e-05} +{"train_loss": 0.004400948528200388, "global_step": 16129, "epoch": 135, "lr": 8.848043241815504e-05} +{"train_loss": 0.005204640328884125, "global_step": 16130, "epoch": 135, "lr": 8.847901774230027e-05} +{"train_loss": 0.007542089093476534, "global_step": 16131, "epoch": 135, "lr": 8.847760299089605e-05} +{"train_loss": 0.008848356083035469, "global_step": 16132, "epoch": 135, "lr": 8.847618816394516e-05} +{"train_loss": 0.005913714412599802, "global_step": 16133, "epoch": 135, "lr": 8.847477326145039e-05} +{"train_loss": 0.005826759617775679, "global_step": 16134, "epoch": 135, "lr": 8.847335828341451e-05} +{"train_loss": 0.004459225572645664, "global_step": 16135, "epoch": 135, "lr": 8.84719432298403e-05} +{"train_loss": 0.006818683352321386, "global_step": 16136, "epoch": 135, "lr": 8.847052810073056e-05} +{"train_loss": 0.00898648425936699, "global_step": 16137, "epoch": 135, "lr": 8.846911289608801e-05} +{"train_loss": 0.005159102380275726, "global_step": 16138, "epoch": 135, "lr": 8.846769761591549e-05} +{"train_loss": 0.00677363108843565, "global_step": 16139, "epoch": 135, "lr": 8.846628226021576e-05} +{"train_loss": 0.007929257117211819, "global_step": 16140, "epoch": 135, "lr": 8.846486682899159e-05} +{"train_loss": 0.006692857481539249, "global_step": 16141, "epoch": 135, "lr": 8.846345132224577e-05} +{"train_loss": 0.008891912177205086, "global_step": 16142, "epoch": 135, "lr": 8.846203573998105e-05} +{"train_loss": 0.0066656083799898624, "global_step": 16143, "epoch": 135, "lr": 8.846062008220026e-05} +{"train_loss": 0.005821996368467808, "global_step": 16144, "epoch": 135, "lr": 8.845920434890614e-05} +{"train_loss": 0.008482391014695168, "global_step": 16145, "epoch": 135, "lr": 8.845778854010146e-05} +{"train_loss": 0.006022136192768812, "global_step": 16146, "epoch": 135, "lr": 8.845637265578905e-05} +{"train_loss": 0.009992904029786587, "global_step": 16147, "epoch": 135, "lr": 8.845495669597163e-05} +{"train_loss": 0.007512595504522324, "global_step": 16148, "epoch": 135, "lr": 8.845354066065203e-05} +{"train_loss": 0.0059684389270842075, "global_step": 16149, "epoch": 135, "lr": 8.845212454983303e-05} +{"train_loss": 0.005693928804248571, "global_step": 16150, "epoch": 135, "lr": 8.845070836351736e-05} +{"train_loss": 0.010012205690145493, "global_step": 16151, "epoch": 135, "lr": 8.844929210170785e-05} +{"train_loss": 0.004331100732088089, "global_step": 16152, "epoch": 135, "lr": 8.844787576440726e-05} +{"train_loss": 0.006669680122286081, "global_step": 16153, "epoch": 135, "lr": 8.844645935161837e-05} +{"train_loss": 0.00434739887714386, "global_step": 16154, "epoch": 135, "lr": 8.844504286334396e-05} +{"train_loss": 0.00926339253783226, "global_step": 16155, "epoch": 135, "lr": 8.844362629958682e-05} +{"train_loss": 0.00454770028591156, "global_step": 16156, "epoch": 135, "lr": 8.844220966034973e-05} +{"train_loss": 0.0064544109627604485, "global_step": 16157, "epoch": 135, "lr": 8.844079294563548e-05} +{"train_loss": 0.008108336478471756, "global_step": 16158, "epoch": 135, "lr": 8.843937615544682e-05} +{"train_loss": 0.006646068301051855, "global_step": 16159, "epoch": 135, "lr": 8.843795928978656e-05} +{"train_loss": 0.00433893408626318, "global_step": 16160, "epoch": 135, "lr": 8.843654234865746e-05} +{"train_loss": 0.006452999077737331, "global_step": 16161, "epoch": 135, "lr": 8.843512533206233e-05} +{"train_loss": 0.0056290715001523495, "global_step": 16162, "epoch": 135, "lr": 8.843370824000393e-05} +{"train_loss": 0.006485921796411276, "global_step": 16163, "epoch": 135, "lr": 8.843229107248505e-05} +{"train_loss": 0.008580508641898632, "global_step": 16164, "epoch": 135, "lr": 8.843087382950847e-05} +{"train_loss": 0.006705152336508036, "global_step": 16165, "epoch": 135, "lr": 8.842945651107699e-05} +{"train_loss": 0.008982693776488304, "global_step": 16166, "epoch": 135, "lr": 8.842803911719337e-05} +{"train_loss": 0.005002142395824194, "global_step": 16167, "epoch": 135, "lr": 8.84266216478604e-05} +{"train_loss": 0.006604637484997511, "global_step": 16168, "epoch": 135, "lr": 8.842520410308087e-05} +{"train_loss": 0.006087568588554859, "global_step": 16169, "epoch": 135, "lr": 8.842378648285754e-05} +{"train_loss": 0.006242810748517513, "global_step": 16170, "epoch": 135, "lr": 8.842236878719324e-05} +{"train_loss": 0.0049912165850400925, "global_step": 16171, "epoch": 135, "lr": 8.842095101609069e-05} +{"train_loss": 0.00558243365958333, "global_step": 16172, "epoch": 135, "lr": 8.841953316955272e-05} +{"train_loss": 0.00794397946447134, "global_step": 16173, "epoch": 135, "lr": 8.84181152475821e-05} +{"train_loss": 0.005773857701569796, "global_step": 16174, "epoch": 135, "lr": 8.841669725018163e-05} +{"train_loss": 0.008185693994164467, "global_step": 16175, "epoch": 135, "lr": 8.841527917735406e-05} +{"train_loss": 0.008011875674128532, "global_step": 16176, "epoch": 135, "lr": 8.841386102910219e-05} +{"train_loss": 0.006094391457736492, "global_step": 16177, "epoch": 135, "lr": 8.841244280542883e-05} +{"train_loss": 0.005888530984520912, "global_step": 16178, "epoch": 135, "lr": 8.841102450633673e-05} +{"train_loss": 0.010789332911372185, "global_step": 16179, "epoch": 135, "lr": 8.840960613182868e-05} +{"train_loss": 0.0032912406604737043, "global_step": 16180, "epoch": 135, "lr": 8.840818768190749e-05} +{"train_loss": 0.0073791854083538055, "global_step": 16181, "epoch": 135, "lr": 8.840676915657591e-05} +{"train_loss": 0.007297966629266739, "global_step": 16182, "epoch": 135, "lr": 8.840535055583674e-05} +{"train_loss": 0.006272872690768803, "global_step": 16183, "epoch": 135, "lr": 8.840393187969278e-05, "val_loss": 0.014989765360951424, "train_action_mse_error": 0.00017567809845786542} +{"train_loss": 0.00745534198358655, "global_step": 16184, "epoch": 136, "lr": 8.84025131281468e-05} +{"train_loss": 0.005314894951879978, "global_step": 16185, "epoch": 136, "lr": 8.840109430120158e-05} +{"train_loss": 0.006142320577055216, "global_step": 16186, "epoch": 136, "lr": 8.839967539885992e-05} +{"train_loss": 0.008078266866505146, "global_step": 16187, "epoch": 136, "lr": 8.83982564211246e-05} +{"train_loss": 0.004238717257976532, "global_step": 16188, "epoch": 136, "lr": 8.839683736799841e-05} +{"train_loss": 0.004713417496532202, "global_step": 16189, "epoch": 136, "lr": 8.839541823948411e-05} +{"train_loss": 0.005618754308670759, "global_step": 16190, "epoch": 136, "lr": 8.839399903558454e-05} +{"train_loss": 0.006703123450279236, "global_step": 16191, "epoch": 136, "lr": 8.839257975630244e-05} +{"train_loss": 0.004432186018675566, "global_step": 16192, "epoch": 136, "lr": 8.839116040164062e-05} +{"train_loss": 0.007018880918622017, "global_step": 16193, "epoch": 136, "lr": 8.838974097160185e-05} +{"train_loss": 0.004114678595215082, "global_step": 16194, "epoch": 136, "lr": 8.838832146618892e-05} +{"train_loss": 0.008706854656338692, "global_step": 16195, "epoch": 136, "lr": 8.838690188540462e-05} +{"train_loss": 0.005275617819279432, "global_step": 16196, "epoch": 136, "lr": 8.838548222925174e-05} +{"train_loss": 0.006448122672736645, "global_step": 16197, "epoch": 136, "lr": 8.838406249773308e-05} +{"train_loss": 0.005533517803996801, "global_step": 16198, "epoch": 136, "lr": 8.838264269085142e-05} +{"train_loss": 0.008624959737062454, "global_step": 16199, "epoch": 136, "lr": 8.838122280860953e-05} +{"train_loss": 0.008255073800683022, "global_step": 16200, "epoch": 136, "lr": 8.837980285101019e-05} +{"train_loss": 0.002608594950288534, "global_step": 16201, "epoch": 136, "lr": 8.837838281805621e-05} +{"train_loss": 0.0067335451021790504, "global_step": 16202, "epoch": 136, "lr": 8.83769627097504e-05} +{"train_loss": 0.003937877248972654, "global_step": 16203, "epoch": 136, "lr": 8.837554252609552e-05} +{"train_loss": 0.007042247802019119, "global_step": 16204, "epoch": 136, "lr": 8.837412226709436e-05} +{"train_loss": 0.0065256934612989426, "global_step": 16205, "epoch": 136, "lr": 8.83727019327497e-05} +{"train_loss": 0.006595898885279894, "global_step": 16206, "epoch": 136, "lr": 8.837128152306435e-05} +{"train_loss": 0.005989434663206339, "global_step": 16207, "epoch": 136, "lr": 8.836986103804109e-05} +{"train_loss": 0.00429744366556406, "global_step": 16208, "epoch": 136, "lr": 8.83684404776827e-05} +{"train_loss": 0.005471985321491957, "global_step": 16209, "epoch": 136, "lr": 8.836701984199196e-05} +{"train_loss": 0.00987737625837326, "global_step": 16210, "epoch": 136, "lr": 8.83655991309717e-05} +{"train_loss": 0.0035221371799707413, "global_step": 16211, "epoch": 136, "lr": 8.836417834462467e-05} +{"train_loss": 0.003313274821266532, "global_step": 16212, "epoch": 136, "lr": 8.836275748295369e-05} +{"train_loss": 0.006318447180092335, "global_step": 16213, "epoch": 136, "lr": 8.836133654596153e-05} +{"train_loss": 0.006831628270447254, "global_step": 16214, "epoch": 136, "lr": 8.835991553365097e-05} +{"train_loss": 0.0073548974469304085, "global_step": 16215, "epoch": 136, "lr": 8.835849444602482e-05} +{"train_loss": 0.004936947021633387, "global_step": 16216, "epoch": 136, "lr": 8.835707328308587e-05} +{"train_loss": 0.006996606010943651, "global_step": 16217, "epoch": 136, "lr": 8.835565204483691e-05} +{"train_loss": 0.007117071188986301, "global_step": 16218, "epoch": 136, "lr": 8.835423073128072e-05} +{"train_loss": 0.0091179758310318, "global_step": 16219, "epoch": 136, "lr": 8.835280934242009e-05} +{"train_loss": 0.006295913364738226, "global_step": 16220, "epoch": 136, "lr": 8.835138787825781e-05} +{"train_loss": 0.00591604458168149, "global_step": 16221, "epoch": 136, "lr": 8.834996633879669e-05} +{"train_loss": 0.006270894315093756, "global_step": 16222, "epoch": 136, "lr": 8.83485447240395e-05} +{"train_loss": 0.007338080555200577, "global_step": 16223, "epoch": 136, "lr": 8.834712303398906e-05} +{"train_loss": 0.0057060206308960915, "global_step": 16224, "epoch": 136, "lr": 8.834570126864811e-05} +{"train_loss": 0.006483298726379871, "global_step": 16225, "epoch": 136, "lr": 8.83442794280195e-05} +{"train_loss": 0.004722962621599436, "global_step": 16226, "epoch": 136, "lr": 8.834285751210598e-05} +{"train_loss": 0.004272261634469032, "global_step": 16227, "epoch": 136, "lr": 8.834143552091035e-05} +{"train_loss": 0.005457152612507343, "global_step": 16228, "epoch": 136, "lr": 8.834001345443541e-05} +{"train_loss": 0.007637680042535067, "global_step": 16229, "epoch": 136, "lr": 8.833859131268396e-05} +{"train_loss": 0.005742611363530159, "global_step": 16230, "epoch": 136, "lr": 8.833716909565877e-05} +{"train_loss": 0.006290254183113575, "global_step": 16231, "epoch": 136, "lr": 8.833574680336265e-05} +{"train_loss": 0.0054724072106182575, "global_step": 16232, "epoch": 136, "lr": 8.833432443579839e-05} +{"train_loss": 0.0074942149221897125, "global_step": 16233, "epoch": 136, "lr": 8.833290199296878e-05} +{"train_loss": 0.005140276625752449, "global_step": 16234, "epoch": 136, "lr": 8.83314794748766e-05} +{"train_loss": 0.005277466494590044, "global_step": 16235, "epoch": 136, "lr": 8.833005688152467e-05} +{"train_loss": 0.004816366359591484, "global_step": 16236, "epoch": 136, "lr": 8.832863421291574e-05} +{"train_loss": 0.008147579617798328, "global_step": 16237, "epoch": 136, "lr": 8.832721146905267e-05} +{"train_loss": 0.004593727178871632, "global_step": 16238, "epoch": 136, "lr": 8.83257886499382e-05} +{"train_loss": 0.00426145363599062, "global_step": 16239, "epoch": 136, "lr": 8.832436575557514e-05} +{"train_loss": 0.005976113025099039, "global_step": 16240, "epoch": 136, "lr": 8.832294278596627e-05} +{"train_loss": 0.005880171898752451, "global_step": 16241, "epoch": 136, "lr": 8.83215197411144e-05} +{"train_loss": 0.006983394734561443, "global_step": 16242, "epoch": 136, "lr": 8.832009662102232e-05} +{"train_loss": 0.004722838755697012, "global_step": 16243, "epoch": 136, "lr": 8.831867342569284e-05} +{"train_loss": 0.006633582524955273, "global_step": 16244, "epoch": 136, "lr": 8.831725015512872e-05} +{"train_loss": 0.007010035682469606, "global_step": 16245, "epoch": 136, "lr": 8.831582680933279e-05} +{"train_loss": 0.005536195822060108, "global_step": 16246, "epoch": 136, "lr": 8.83144033883078e-05} +{"train_loss": 0.005031809210777283, "global_step": 16247, "epoch": 136, "lr": 8.83129798920566e-05} +{"train_loss": 0.006245241034775972, "global_step": 16248, "epoch": 136, "lr": 8.831155632058194e-05} +{"train_loss": 0.007943466305732727, "global_step": 16249, "epoch": 136, "lr": 8.831013267388665e-05} +{"train_loss": 0.006333617027848959, "global_step": 16250, "epoch": 136, "lr": 8.83087089519735e-05} +{"train_loss": 0.005452896002680063, "global_step": 16251, "epoch": 136, "lr": 8.830728515484527e-05} +{"train_loss": 0.005717017687857151, "global_step": 16252, "epoch": 136, "lr": 8.83058612825048e-05} +{"train_loss": 0.007485603913664818, "global_step": 16253, "epoch": 136, "lr": 8.830443733495487e-05} +{"train_loss": 0.006278750486671925, "global_step": 16254, "epoch": 136, "lr": 8.830301331219825e-05} +{"train_loss": 0.0066660325974226, "global_step": 16255, "epoch": 136, "lr": 8.830158921423776e-05} +{"train_loss": 0.00514973932877183, "global_step": 16256, "epoch": 136, "lr": 8.830016504107622e-05} +{"train_loss": 0.00836365669965744, "global_step": 16257, "epoch": 136, "lr": 8.829874079271635e-05} +{"train_loss": 0.006446391809731722, "global_step": 16258, "epoch": 136, "lr": 8.829731646916104e-05} +{"train_loss": 0.006176949944347143, "global_step": 16259, "epoch": 136, "lr": 8.829589207041302e-05} +{"train_loss": 0.00563867436721921, "global_step": 16260, "epoch": 136, "lr": 8.829446759647511e-05} +{"train_loss": 0.006431525573134422, "global_step": 16261, "epoch": 136, "lr": 8.829304304735008e-05} +{"train_loss": 0.009108445607125759, "global_step": 16262, "epoch": 136, "lr": 8.829161842304079e-05} +{"train_loss": 0.004787078592926264, "global_step": 16263, "epoch": 136, "lr": 8.829019372354997e-05} +{"train_loss": 0.006892787758260965, "global_step": 16264, "epoch": 136, "lr": 8.828876894888046e-05} +{"train_loss": 0.005782940424978733, "global_step": 16265, "epoch": 136, "lr": 8.828734409903504e-05} +{"train_loss": 0.009320798330008984, "global_step": 16266, "epoch": 136, "lr": 8.828591917401651e-05} +{"train_loss": 0.005745743401348591, "global_step": 16267, "epoch": 136, "lr": 8.828449417382766e-05} +{"train_loss": 0.006978733465075493, "global_step": 16268, "epoch": 136, "lr": 8.828306909847131e-05} +{"train_loss": 0.008534750901162624, "global_step": 16269, "epoch": 136, "lr": 8.828164394795024e-05} +{"train_loss": 0.005838995799422264, "global_step": 16270, "epoch": 136, "lr": 8.828021872226724e-05} +{"train_loss": 0.005491240881383419, "global_step": 16271, "epoch": 136, "lr": 8.827879342142513e-05} +{"train_loss": 0.005690224003046751, "global_step": 16272, "epoch": 136, "lr": 8.82773680454267e-05} +{"train_loss": 0.006080476101487875, "global_step": 16273, "epoch": 136, "lr": 8.827594259427475e-05} +{"train_loss": 0.003890023799613118, "global_step": 16274, "epoch": 136, "lr": 8.827451706797205e-05} +{"train_loss": 0.00614704517647624, "global_step": 16275, "epoch": 136, "lr": 8.827309146652145e-05} +{"train_loss": 0.005309710744768381, "global_step": 16276, "epoch": 136, "lr": 8.827166578992572e-05} +{"train_loss": 0.007256705313920975, "global_step": 16277, "epoch": 136, "lr": 8.827024003818766e-05} +{"train_loss": 0.004925555549561977, "global_step": 16278, "epoch": 136, "lr": 8.826881421131008e-05} +{"train_loss": 0.00577941257506609, "global_step": 16279, "epoch": 136, "lr": 8.826738830929576e-05} +{"train_loss": 0.004612376447767019, "global_step": 16280, "epoch": 136, "lr": 8.82659623321475e-05} +{"train_loss": 0.007743933703750372, "global_step": 16281, "epoch": 136, "lr": 8.826453627986814e-05} +{"train_loss": 0.008323597721755505, "global_step": 16282, "epoch": 136, "lr": 8.826311015246044e-05} +{"train_loss": 0.0045471638441085815, "global_step": 16283, "epoch": 136, "lr": 8.82616839499272e-05} +{"train_loss": 0.005335604771971703, "global_step": 16284, "epoch": 136, "lr": 8.826025767227125e-05} +{"train_loss": 0.007243265397846699, "global_step": 16285, "epoch": 136, "lr": 8.825883131949536e-05} +{"train_loss": 0.004973416682332754, "global_step": 16286, "epoch": 136, "lr": 8.825740489160235e-05} +{"train_loss": 0.004823358729481697, "global_step": 16287, "epoch": 136, "lr": 8.825597838859501e-05} +{"train_loss": 0.006352228112518787, "global_step": 16288, "epoch": 136, "lr": 8.825455181047612e-05} +{"train_loss": 0.00544607313349843, "global_step": 16289, "epoch": 136, "lr": 8.825312515724853e-05} +{"train_loss": 0.005992010701447725, "global_step": 16290, "epoch": 136, "lr": 8.825169842891502e-05} +{"train_loss": 0.004978763870894909, "global_step": 16291, "epoch": 136, "lr": 8.825027162547838e-05} +{"train_loss": 0.005970621015876532, "global_step": 16292, "epoch": 136, "lr": 8.824884474694141e-05} +{"train_loss": 0.006751968525350094, "global_step": 16293, "epoch": 136, "lr": 8.824741779330692e-05} +{"train_loss": 0.0049029081128537655, "global_step": 16294, "epoch": 136, "lr": 8.824599076457773e-05} +{"train_loss": 0.004273028578609228, "global_step": 16295, "epoch": 136, "lr": 8.82445636607566e-05} +{"train_loss": 0.003908452112227678, "global_step": 16296, "epoch": 136, "lr": 8.824313648184636e-05} +{"train_loss": 0.00635052053257823, "global_step": 16297, "epoch": 136, "lr": 8.824170922784981e-05} +{"train_loss": 0.00861487165093422, "global_step": 16298, "epoch": 136, "lr": 8.824028189876976e-05} +{"train_loss": 0.0037428541108965874, "global_step": 16299, "epoch": 136, "lr": 8.823885449460899e-05} +{"train_loss": 0.0060346852988004684, "global_step": 16300, "epoch": 136, "lr": 8.823742701537032e-05} +{"train_loss": 0.004029217641800642, "global_step": 16301, "epoch": 136, "lr": 8.823599946105654e-05} +{"train_loss": 0.00606365259658514, "global_step": 16302, "epoch": 136, "lr": 8.823457183167047e-05, "val_loss": 0.013737296685576439} +{"train_loss": 0.005716077517718077, "global_step": 16303, "epoch": 137, "lr": 8.823314412721489e-05} +{"train_loss": 0.006115350406616926, "global_step": 16304, "epoch": 137, "lr": 8.823171634769263e-05} +{"train_loss": 0.004888418596237898, "global_step": 16305, "epoch": 137, "lr": 8.823028849310647e-05} +{"train_loss": 0.004893858917057514, "global_step": 16306, "epoch": 137, "lr": 8.822886056345922e-05} +{"train_loss": 0.0066856141202151775, "global_step": 16307, "epoch": 137, "lr": 8.82274325587537e-05} +{"train_loss": 0.005053025670349598, "global_step": 16308, "epoch": 137, "lr": 8.822600447899269e-05} +{"train_loss": 0.0048514073714613914, "global_step": 16309, "epoch": 137, "lr": 8.8224576324179e-05} +{"train_loss": 0.007102074567228556, "global_step": 16310, "epoch": 137, "lr": 8.822314809431544e-05} +{"train_loss": 0.005538429599255323, "global_step": 16311, "epoch": 137, "lr": 8.822171978940483e-05} +{"train_loss": 0.004622476641088724, "global_step": 16312, "epoch": 137, "lr": 8.822029140944993e-05} +{"train_loss": 0.005639894865453243, "global_step": 16313, "epoch": 137, "lr": 8.82188629544536e-05} +{"train_loss": 0.006114507559686899, "global_step": 16314, "epoch": 137, "lr": 8.821743442441858e-05} +{"train_loss": 0.011127645149827003, "global_step": 16315, "epoch": 137, "lr": 8.821600581934774e-05} +{"train_loss": 0.007447317708283663, "global_step": 16316, "epoch": 137, "lr": 8.821457713924385e-05} +{"train_loss": 0.007901809178292751, "global_step": 16317, "epoch": 137, "lr": 8.821314838410972e-05} +{"train_loss": 0.006343217100948095, "global_step": 16318, "epoch": 137, "lr": 8.821171955394815e-05} +{"train_loss": 0.004893995821475983, "global_step": 16319, "epoch": 137, "lr": 8.821029064876195e-05} +{"train_loss": 0.007318705320358276, "global_step": 16320, "epoch": 137, "lr": 8.820886166855394e-05} +{"train_loss": 0.006059356965124607, "global_step": 16321, "epoch": 137, "lr": 8.82074326133269e-05} +{"train_loss": 0.0064079854637384415, "global_step": 16322, "epoch": 137, "lr": 8.820600348308363e-05} +{"train_loss": 0.003964165225625038, "global_step": 16323, "epoch": 137, "lr": 8.820457427782698e-05} +{"train_loss": 0.005826982669532299, "global_step": 16324, "epoch": 137, "lr": 8.820314499755973e-05} +{"train_loss": 0.010358676314353943, "global_step": 16325, "epoch": 137, "lr": 8.820171564228468e-05} +{"train_loss": 0.006695686373859644, "global_step": 16326, "epoch": 137, "lr": 8.820028621200463e-05} +{"train_loss": 0.005924334283918142, "global_step": 16327, "epoch": 137, "lr": 8.819885670672241e-05} +{"train_loss": 0.0066103688441216946, "global_step": 16328, "epoch": 137, "lr": 8.819742712644083e-05} +{"train_loss": 0.0087973577901721, "global_step": 16329, "epoch": 137, "lr": 8.819599747116268e-05} +{"train_loss": 0.005031771957874298, "global_step": 16330, "epoch": 137, "lr": 8.819456774089075e-05} +{"train_loss": 0.01161945890635252, "global_step": 16331, "epoch": 137, "lr": 8.819313793562787e-05} +{"train_loss": 0.006213950924575329, "global_step": 16332, "epoch": 137, "lr": 8.819170805537685e-05} +{"train_loss": 0.005890979431569576, "global_step": 16333, "epoch": 137, "lr": 8.819027810014049e-05} +{"train_loss": 0.005835836287587881, "global_step": 16334, "epoch": 137, "lr": 8.81888480699216e-05} +{"train_loss": 0.008191912434995174, "global_step": 16335, "epoch": 137, "lr": 8.818741796472299e-05} +{"train_loss": 0.0058187078684568405, "global_step": 16336, "epoch": 137, "lr": 8.818598778454746e-05} +{"train_loss": 0.007668881211429834, "global_step": 16337, "epoch": 137, "lr": 8.818455752939783e-05} +{"train_loss": 0.008967157453298569, "global_step": 16338, "epoch": 137, "lr": 8.818312719927689e-05} +{"train_loss": 0.010064817033708096, "global_step": 16339, "epoch": 137, "lr": 8.818169679418747e-05} +{"train_loss": 0.008033293299376965, "global_step": 16340, "epoch": 137, "lr": 8.818026631413235e-05} +{"train_loss": 0.004480068571865559, "global_step": 16341, "epoch": 137, "lr": 8.817883575911436e-05} +{"train_loss": 0.00841736514121294, "global_step": 16342, "epoch": 137, "lr": 8.817740512913633e-05} +{"train_loss": 0.006579933688044548, "global_step": 16343, "epoch": 137, "lr": 8.817597442420102e-05} +{"train_loss": 0.009007437154650688, "global_step": 16344, "epoch": 137, "lr": 8.817454364431126e-05} +{"train_loss": 0.008367100730538368, "global_step": 16345, "epoch": 137, "lr": 8.817311278946987e-05} +{"train_loss": 0.007184057496488094, "global_step": 16346, "epoch": 137, "lr": 8.817168185967966e-05} +{"train_loss": 0.004112175665795803, "global_step": 16347, "epoch": 137, "lr": 8.817025085494342e-05} +{"train_loss": 0.005924494471400976, "global_step": 16348, "epoch": 137, "lr": 8.816881977526396e-05} +{"train_loss": 0.005503315012902021, "global_step": 16349, "epoch": 137, "lr": 8.816738862064413e-05} +{"train_loss": 0.005386796314269304, "global_step": 16350, "epoch": 137, "lr": 8.816595739108669e-05} +{"train_loss": 0.007057527080178261, "global_step": 16351, "epoch": 137, "lr": 8.816452608659447e-05} +{"train_loss": 0.005587216001003981, "global_step": 16352, "epoch": 137, "lr": 8.816309470717028e-05} +{"train_loss": 0.006765712518244982, "global_step": 16353, "epoch": 137, "lr": 8.816166325281694e-05} +{"train_loss": 0.006413409952074289, "global_step": 16354, "epoch": 137, "lr": 8.816023172353725e-05} +{"train_loss": 0.006231858395040035, "global_step": 16355, "epoch": 137, "lr": 8.815880011933402e-05} +{"train_loss": 0.006549880839884281, "global_step": 16356, "epoch": 137, "lr": 8.815736844021005e-05} +{"train_loss": 0.005321495700627565, "global_step": 16357, "epoch": 137, "lr": 8.815593668616818e-05} +{"train_loss": 0.006305999122560024, "global_step": 16358, "epoch": 137, "lr": 8.81545048572112e-05} +{"train_loss": 0.005592325236648321, "global_step": 16359, "epoch": 137, "lr": 8.815307295334192e-05} +{"train_loss": 0.004565147683024406, "global_step": 16360, "epoch": 137, "lr": 8.815164097456316e-05} +{"train_loss": 0.005979923065751791, "global_step": 16361, "epoch": 137, "lr": 8.815020892087772e-05} +{"train_loss": 0.005903047975152731, "global_step": 16362, "epoch": 137, "lr": 8.814877679228844e-05} +{"train_loss": 0.006831732112914324, "global_step": 16363, "epoch": 137, "lr": 8.81473445887981e-05} +{"train_loss": 0.005218398291617632, "global_step": 16364, "epoch": 137, "lr": 8.814591231040951e-05} +{"train_loss": 0.006334667094051838, "global_step": 16365, "epoch": 137, "lr": 8.814447995712553e-05} +{"train_loss": 0.0062692840583622456, "global_step": 16366, "epoch": 137, "lr": 8.814304752894892e-05} +{"train_loss": 0.0038504451513290405, "global_step": 16367, "epoch": 137, "lr": 8.814161502588251e-05} +{"train_loss": 0.00528704421594739, "global_step": 16368, "epoch": 137, "lr": 8.814018244792913e-05} +{"train_loss": 0.006717553362250328, "global_step": 16369, "epoch": 137, "lr": 8.813874979509156e-05} +{"train_loss": 0.0070820762775838375, "global_step": 16370, "epoch": 137, "lr": 8.813731706737263e-05} +{"train_loss": 0.004601277410984039, "global_step": 16371, "epoch": 137, "lr": 8.813588426477515e-05} +{"train_loss": 0.008652198128402233, "global_step": 16372, "epoch": 137, "lr": 8.813445138730195e-05} +{"train_loss": 0.004604050889611244, "global_step": 16373, "epoch": 137, "lr": 8.813301843495581e-05} +{"train_loss": 0.007224267814308405, "global_step": 16374, "epoch": 137, "lr": 8.813158540773956e-05} +{"train_loss": 0.00681418227031827, "global_step": 16375, "epoch": 137, "lr": 8.813015230565604e-05} +{"train_loss": 0.004567211493849754, "global_step": 16376, "epoch": 137, "lr": 8.812871912870803e-05} +{"train_loss": 0.005529775284230709, "global_step": 16377, "epoch": 137, "lr": 8.812728587689834e-05} +{"train_loss": 0.0055778431706130505, "global_step": 16378, "epoch": 137, "lr": 8.812585255022982e-05} +{"train_loss": 0.007975767366588116, "global_step": 16379, "epoch": 137, "lr": 8.812441914870524e-05} +{"train_loss": 0.00504308519884944, "global_step": 16380, "epoch": 137, "lr": 8.812298567232746e-05} +{"train_loss": 0.012668169103562832, "global_step": 16381, "epoch": 137, "lr": 8.812155212109925e-05} +{"train_loss": 0.005571545567363501, "global_step": 16382, "epoch": 137, "lr": 8.812011849502343e-05} +{"train_loss": 0.0045793186873197556, "global_step": 16383, "epoch": 137, "lr": 8.811868479410286e-05} +{"train_loss": 0.00501384399831295, "global_step": 16384, "epoch": 137, "lr": 8.811725101834033e-05} +{"train_loss": 0.00571882538497448, "global_step": 16385, "epoch": 137, "lr": 8.811581716773863e-05} +{"train_loss": 0.00644946563988924, "global_step": 16386, "epoch": 137, "lr": 8.81143832423006e-05} +{"train_loss": 0.0047570872120559216, "global_step": 16387, "epoch": 137, "lr": 8.811294924202907e-05} +{"train_loss": 0.006422010250389576, "global_step": 16388, "epoch": 137, "lr": 8.811151516692679e-05} +{"train_loss": 0.006583675276488066, "global_step": 16389, "epoch": 137, "lr": 8.811008101699665e-05} +{"train_loss": 0.006067757029086351, "global_step": 16390, "epoch": 137, "lr": 8.810864679224145e-05} +{"train_loss": 0.005837759003043175, "global_step": 16391, "epoch": 137, "lr": 8.810721249266398e-05} +{"train_loss": 0.008256340399384499, "global_step": 16392, "epoch": 137, "lr": 8.810577811826706e-05} +{"train_loss": 0.0056012594141066074, "global_step": 16393, "epoch": 137, "lr": 8.810434366905354e-05} +{"train_loss": 0.008452723734080791, "global_step": 16394, "epoch": 137, "lr": 8.81029091450262e-05} +{"train_loss": 0.006074148695915937, "global_step": 16395, "epoch": 137, "lr": 8.810147454618784e-05} +{"train_loss": 0.004515823908150196, "global_step": 16396, "epoch": 137, "lr": 8.810003987254134e-05} +{"train_loss": 0.006915820762515068, "global_step": 16397, "epoch": 137, "lr": 8.809860512408948e-05} +{"train_loss": 0.007352346088737249, "global_step": 16398, "epoch": 137, "lr": 8.809717030083506e-05} +{"train_loss": 0.007244028616696596, "global_step": 16399, "epoch": 137, "lr": 8.809573540278094e-05} +{"train_loss": 0.00613782275468111, "global_step": 16400, "epoch": 137, "lr": 8.80943004299299e-05} +{"train_loss": 0.004795397166162729, "global_step": 16401, "epoch": 137, "lr": 8.809286538228476e-05} +{"train_loss": 0.007235047873109579, "global_step": 16402, "epoch": 137, "lr": 8.809143025984836e-05} +{"train_loss": 0.0063461498357355595, "global_step": 16403, "epoch": 137, "lr": 8.808999506262352e-05} +{"train_loss": 0.005638860631734133, "global_step": 16404, "epoch": 137, "lr": 8.808855979061302e-05} +{"train_loss": 0.0038804386276751757, "global_step": 16405, "epoch": 137, "lr": 8.808712444381972e-05} +{"train_loss": 0.007166258059442043, "global_step": 16406, "epoch": 137, "lr": 8.808568902224641e-05} +{"train_loss": 0.003928044810891151, "global_step": 16407, "epoch": 137, "lr": 8.808425352589592e-05} +{"train_loss": 0.00414410000666976, "global_step": 16408, "epoch": 137, "lr": 8.808281795477107e-05} +{"train_loss": 0.004019538871943951, "global_step": 16409, "epoch": 137, "lr": 8.808138230887467e-05} +{"train_loss": 0.007131190970540047, "global_step": 16410, "epoch": 137, "lr": 8.807994658820954e-05} +{"train_loss": 0.00947329867631197, "global_step": 16411, "epoch": 137, "lr": 8.807851079277852e-05} +{"train_loss": 0.005235855933278799, "global_step": 16412, "epoch": 137, "lr": 8.80770749225844e-05} +{"train_loss": 0.005608755629509687, "global_step": 16413, "epoch": 137, "lr": 8.807563897763003e-05} +{"train_loss": 0.0071848537772893906, "global_step": 16414, "epoch": 137, "lr": 8.807420295791818e-05} +{"train_loss": 0.00767801608890295, "global_step": 16415, "epoch": 137, "lr": 8.807276686345172e-05} +{"train_loss": 0.008055630140006542, "global_step": 16416, "epoch": 137, "lr": 8.807133069423345e-05} +{"train_loss": 0.0062184263952076435, "global_step": 16417, "epoch": 137, "lr": 8.806989445026617e-05} +{"train_loss": 0.005275201518088579, "global_step": 16418, "epoch": 137, "lr": 8.806845813155274e-05} +{"train_loss": 0.005680138245224953, "global_step": 16419, "epoch": 137, "lr": 8.806702173809595e-05} +{"train_loss": 0.006719786673784256, "global_step": 16420, "epoch": 137, "lr": 8.806558526989864e-05} +{"train_loss": 0.006388011057822018, "global_step": 16421, "epoch": 137, "lr": 8.806414872696361e-05, "val_loss": 0.01717280223965645} +{"train_loss": 0.004705558996647596, "global_step": 16422, "epoch": 138, "lr": 8.80627121092937e-05} +{"train_loss": 0.005773765034973621, "global_step": 16423, "epoch": 138, "lr": 8.806127541689171e-05} +{"train_loss": 0.005194060504436493, "global_step": 16424, "epoch": 138, "lr": 8.805983864976048e-05} +{"train_loss": 0.0077485376968979836, "global_step": 16425, "epoch": 138, "lr": 8.805840180790282e-05} +{"train_loss": 0.004329986870288849, "global_step": 16426, "epoch": 138, "lr": 8.805696489132156e-05} +{"train_loss": 0.007437497843056917, "global_step": 16427, "epoch": 138, "lr": 8.80555279000195e-05} +{"train_loss": 0.004620712250471115, "global_step": 16428, "epoch": 138, "lr": 8.80540908339995e-05} +{"train_loss": 0.0068791937083005905, "global_step": 16429, "epoch": 138, "lr": 8.805265369326433e-05} +{"train_loss": 0.005765055306255817, "global_step": 16430, "epoch": 138, "lr": 8.805121647781685e-05} +{"train_loss": 0.006758071947842836, "global_step": 16431, "epoch": 138, "lr": 8.804977918765989e-05} +{"train_loss": 0.004900461994111538, "global_step": 16432, "epoch": 138, "lr": 8.804834182279622e-05} +{"train_loss": 0.006419516168534756, "global_step": 16433, "epoch": 138, "lr": 8.804690438322872e-05} +{"train_loss": 0.005209063179790974, "global_step": 16434, "epoch": 138, "lr": 8.804546686896019e-05} +{"train_loss": 0.0033521042205393314, "global_step": 16435, "epoch": 138, "lr": 8.804402927999344e-05} +{"train_loss": 0.006069267634302378, "global_step": 16436, "epoch": 138, "lr": 8.80425916163313e-05} +{"train_loss": 0.003804320702329278, "global_step": 16437, "epoch": 138, "lr": 8.80411538779766e-05} +{"train_loss": 0.006582395639270544, "global_step": 16438, "epoch": 138, "lr": 8.803971606493216e-05} +{"train_loss": 0.004968402907252312, "global_step": 16439, "epoch": 138, "lr": 8.803827817720081e-05} +{"train_loss": 0.0052713071927428246, "global_step": 16440, "epoch": 138, "lr": 8.803684021478536e-05} +{"train_loss": 0.005737680476158857, "global_step": 16441, "epoch": 138, "lr": 8.803540217768862e-05} +{"train_loss": 0.004771495703607798, "global_step": 16442, "epoch": 138, "lr": 8.803396406591345e-05} +{"train_loss": 0.004811595659703016, "global_step": 16443, "epoch": 138, "lr": 8.803252587946264e-05} +{"train_loss": 0.004226398654282093, "global_step": 16444, "epoch": 138, "lr": 8.803108761833904e-05} +{"train_loss": 0.006552912760525942, "global_step": 16445, "epoch": 138, "lr": 8.802964928254547e-05} +{"train_loss": 0.006552697159349918, "global_step": 16446, "epoch": 138, "lr": 8.802821087208473e-05} +{"train_loss": 0.00621361518278718, "global_step": 16447, "epoch": 138, "lr": 8.802677238695968e-05} +{"train_loss": 0.007054239511489868, "global_step": 16448, "epoch": 138, "lr": 8.802533382717311e-05} +{"train_loss": 0.007327091880142689, "global_step": 16449, "epoch": 138, "lr": 8.802389519272787e-05} +{"train_loss": 0.005550714675337076, "global_step": 16450, "epoch": 138, "lr": 8.802245648362676e-05} +{"train_loss": 0.0059030549600720406, "global_step": 16451, "epoch": 138, "lr": 8.802101769987262e-05} +{"train_loss": 0.008554610423743725, "global_step": 16452, "epoch": 138, "lr": 8.801957884146827e-05} +{"train_loss": 0.0053940629586577415, "global_step": 16453, "epoch": 138, "lr": 8.801813990841657e-05} +{"train_loss": 0.005623835604637861, "global_step": 16454, "epoch": 138, "lr": 8.801670090072027e-05} +{"train_loss": 0.004315664991736412, "global_step": 16455, "epoch": 138, "lr": 8.801526181838227e-05} +{"train_loss": 0.003833813825622201, "global_step": 16456, "epoch": 138, "lr": 8.801382266140536e-05} +{"train_loss": 0.008276863023638725, "global_step": 16457, "epoch": 138, "lr": 8.801238342979236e-05} +{"train_loss": 0.0071971602737903595, "global_step": 16458, "epoch": 138, "lr": 8.801094412354611e-05} +{"train_loss": 0.00781065272167325, "global_step": 16459, "epoch": 138, "lr": 8.800950474266944e-05} +{"train_loss": 0.006249136291444302, "global_step": 16460, "epoch": 138, "lr": 8.800806528716516e-05} +{"train_loss": 0.006605358328670263, "global_step": 16461, "epoch": 138, "lr": 8.800662575703611e-05} +{"train_loss": 0.005495584569871426, "global_step": 16462, "epoch": 138, "lr": 8.80051861522851e-05} +{"train_loss": 0.005082036834210157, "global_step": 16463, "epoch": 138, "lr": 8.800374647291498e-05} +{"train_loss": 0.005264627747237682, "global_step": 16464, "epoch": 138, "lr": 8.800230671892856e-05} +{"train_loss": 0.00446327356621623, "global_step": 16465, "epoch": 138, "lr": 8.800086689032867e-05} +{"train_loss": 0.005419926252216101, "global_step": 16466, "epoch": 138, "lr": 8.799942698711814e-05} +{"train_loss": 0.007219398859888315, "global_step": 16467, "epoch": 138, "lr": 8.79979870092998e-05} +{"train_loss": 0.010213864967226982, "global_step": 16468, "epoch": 138, "lr": 8.799654695687644e-05} +{"train_loss": 0.0060674468986690044, "global_step": 16469, "epoch": 138, "lr": 8.799510682985096e-05} +{"train_loss": 0.005023246631026268, "global_step": 16470, "epoch": 138, "lr": 8.799366662822613e-05} +{"train_loss": 0.006641080137342215, "global_step": 16471, "epoch": 138, "lr": 8.799222635200479e-05} +{"train_loss": 0.003856267314404249, "global_step": 16472, "epoch": 138, "lr": 8.799078600118977e-05} +{"train_loss": 0.003994661848992109, "global_step": 16473, "epoch": 138, "lr": 8.79893455757839e-05} +{"train_loss": 0.01007462665438652, "global_step": 16474, "epoch": 138, "lr": 8.798790507579004e-05} +{"train_loss": 0.008418475277721882, "global_step": 16475, "epoch": 138, "lr": 8.798646450121095e-05} +{"train_loss": 0.004302326589822769, "global_step": 16476, "epoch": 138, "lr": 8.798502385204952e-05} +{"train_loss": 0.006930840201675892, "global_step": 16477, "epoch": 138, "lr": 8.798358312830854e-05} +{"train_loss": 0.008413054049015045, "global_step": 16478, "epoch": 138, "lr": 8.798214232999085e-05} +{"train_loss": 0.004786211531609297, "global_step": 16479, "epoch": 138, "lr": 8.79807014570993e-05} +{"train_loss": 0.00941815972328186, "global_step": 16480, "epoch": 138, "lr": 8.797926050963667e-05} +{"train_loss": 0.007529755122959614, "global_step": 16481, "epoch": 138, "lr": 8.797781948760584e-05} +{"train_loss": 0.007449575699865818, "global_step": 16482, "epoch": 138, "lr": 8.79763783910096e-05} +{"train_loss": 0.005772101227194071, "global_step": 16483, "epoch": 138, "lr": 8.797493721985082e-05} +{"train_loss": 0.006149758119136095, "global_step": 16484, "epoch": 138, "lr": 8.797349597413231e-05} +{"train_loss": 0.007759838365018368, "global_step": 16485, "epoch": 138, "lr": 8.797205465385688e-05} +{"train_loss": 0.007138303481042385, "global_step": 16486, "epoch": 138, "lr": 8.79706132590274e-05} +{"train_loss": 0.006702693644911051, "global_step": 16487, "epoch": 138, "lr": 8.796917178964666e-05} +{"train_loss": 0.006759149022400379, "global_step": 16488, "epoch": 138, "lr": 8.79677302457175e-05} +{"train_loss": 0.008477811701595783, "global_step": 16489, "epoch": 138, "lr": 8.796628862724277e-05} +{"train_loss": 0.004257630556821823, "global_step": 16490, "epoch": 138, "lr": 8.79648469342253e-05} +{"train_loss": 0.0057574789971113205, "global_step": 16491, "epoch": 138, "lr": 8.796340516666787e-05} +{"train_loss": 0.007222326006740332, "global_step": 16492, "epoch": 138, "lr": 8.796196332457338e-05} +{"train_loss": 0.006923787761479616, "global_step": 16493, "epoch": 138, "lr": 8.796052140794464e-05} +{"train_loss": 0.00527165038511157, "global_step": 16494, "epoch": 138, "lr": 8.795907941678446e-05} +{"train_loss": 0.007573350332677364, "global_step": 16495, "epoch": 138, "lr": 8.795763735109567e-05} +{"train_loss": 0.005870706867426634, "global_step": 16496, "epoch": 138, "lr": 8.795619521088112e-05} +{"train_loss": 0.0061529772356152534, "global_step": 16497, "epoch": 138, "lr": 8.795475299614365e-05} +{"train_loss": 0.0029611908830702305, "global_step": 16498, "epoch": 138, "lr": 8.795331070688606e-05} +{"train_loss": 0.005941582843661308, "global_step": 16499, "epoch": 138, "lr": 8.795186834311121e-05} +{"train_loss": 0.006116906646639109, "global_step": 16500, "epoch": 138, "lr": 8.795042590482192e-05} +{"train_loss": 0.004898592829704285, "global_step": 16501, "epoch": 138, "lr": 8.794898339202102e-05} +{"train_loss": 0.004838248714804649, "global_step": 16502, "epoch": 138, "lr": 8.794754080471135e-05} +{"train_loss": 0.004432179965078831, "global_step": 16503, "epoch": 138, "lr": 8.794609814289573e-05} +{"train_loss": 0.006991486996412277, "global_step": 16504, "epoch": 138, "lr": 8.7944655406577e-05} +{"train_loss": 0.007531994488090277, "global_step": 16505, "epoch": 138, "lr": 8.7943212595758e-05} +{"train_loss": 0.009844551794230938, "global_step": 16506, "epoch": 138, "lr": 8.794176971044156e-05} +{"train_loss": 0.0051063732244074345, "global_step": 16507, "epoch": 138, "lr": 8.79403267506305e-05} +{"train_loss": 0.0066919089294970036, "global_step": 16508, "epoch": 138, "lr": 8.793888371632765e-05} +{"train_loss": 0.006604945287108421, "global_step": 16509, "epoch": 138, "lr": 8.793744060753588e-05} +{"train_loss": 0.005389457568526268, "global_step": 16510, "epoch": 138, "lr": 8.7935997424258e-05} +{"train_loss": 0.004803537856787443, "global_step": 16511, "epoch": 138, "lr": 8.793455416649682e-05} +{"train_loss": 0.007346217054873705, "global_step": 16512, "epoch": 138, "lr": 8.79331108342552e-05} +{"train_loss": 0.006479588337242603, "global_step": 16513, "epoch": 138, "lr": 8.793166742753598e-05} +{"train_loss": 0.005626026075333357, "global_step": 16514, "epoch": 138, "lr": 8.793022394634197e-05} +{"train_loss": 0.006054141093045473, "global_step": 16515, "epoch": 138, "lr": 8.792878039067602e-05} +{"train_loss": 0.00488731823861599, "global_step": 16516, "epoch": 138, "lr": 8.792733676054096e-05} +{"train_loss": 0.0053114998154342175, "global_step": 16517, "epoch": 138, "lr": 8.792589305593965e-05} +{"train_loss": 0.004788929130882025, "global_step": 16518, "epoch": 138, "lr": 8.792444927687489e-05} +{"train_loss": 0.005689436104148626, "global_step": 16519, "epoch": 138, "lr": 8.792300542334952e-05} +{"train_loss": 0.0070276823826134205, "global_step": 16520, "epoch": 138, "lr": 8.792156149536637e-05} +{"train_loss": 0.007814155891537666, "global_step": 16521, "epoch": 138, "lr": 8.79201174929283e-05} +{"train_loss": 0.007050337735563517, "global_step": 16522, "epoch": 138, "lr": 8.791867341603812e-05} +{"train_loss": 0.005476155783981085, "global_step": 16523, "epoch": 138, "lr": 8.791722926469868e-05} +{"train_loss": 0.004034169018268585, "global_step": 16524, "epoch": 138, "lr": 8.791578503891281e-05} +{"train_loss": 0.005199418403208256, "global_step": 16525, "epoch": 138, "lr": 8.791434073868335e-05} +{"train_loss": 0.005460978951305151, "global_step": 16526, "epoch": 138, "lr": 8.791289636401315e-05} +{"train_loss": 0.00596575578674674, "global_step": 16527, "epoch": 138, "lr": 8.7911451914905e-05} +{"train_loss": 0.005913678091019392, "global_step": 16528, "epoch": 138, "lr": 8.791000739136176e-05} +{"train_loss": 0.005440768785774708, "global_step": 16529, "epoch": 138, "lr": 8.790856279338629e-05} +{"train_loss": 0.0059299590066075325, "global_step": 16530, "epoch": 138, "lr": 8.79071181209814e-05} +{"train_loss": 0.004772969987243414, "global_step": 16531, "epoch": 138, "lr": 8.790567337414994e-05} +{"train_loss": 0.008470377884805202, "global_step": 16532, "epoch": 138, "lr": 8.790422855289473e-05} +{"train_loss": 0.00432643573731184, "global_step": 16533, "epoch": 138, "lr": 8.790278365721863e-05} +{"train_loss": 0.005744161084294319, "global_step": 16534, "epoch": 138, "lr": 8.790133868712445e-05} +{"train_loss": 0.00827766116708517, "global_step": 16535, "epoch": 138, "lr": 8.789989364261505e-05} +{"train_loss": 0.006014027167111635, "global_step": 16536, "epoch": 138, "lr": 8.789844852369325e-05} +{"train_loss": 0.007746370043605566, "global_step": 16537, "epoch": 138, "lr": 8.789700333036191e-05} +{"train_loss": 0.00946460198611021, "global_step": 16538, "epoch": 138, "lr": 8.789555806262383e-05} +{"train_loss": 0.00449812738224864, "global_step": 16539, "epoch": 138, "lr": 8.789411272048188e-05} +{"train_loss": 0.006114792078733444, "global_step": 16540, "epoch": 138, "lr": 8.789266730393889e-05, "val_loss": 0.016965819522738457} +{"train_loss": 0.006334101315587759, "global_step": 16541, "epoch": 139, "lr": 8.789122181299769e-05} +{"train_loss": 0.005962579045444727, "global_step": 16542, "epoch": 139, "lr": 8.788977624766115e-05} +{"train_loss": 0.005917234346270561, "global_step": 16543, "epoch": 139, "lr": 8.788833060793205e-05} +{"train_loss": 0.00768641009926796, "global_step": 16544, "epoch": 139, "lr": 8.788688489381327e-05} +{"train_loss": 0.005066224839538336, "global_step": 16545, "epoch": 139, "lr": 8.788543910530765e-05} +{"train_loss": 0.004905511625111103, "global_step": 16546, "epoch": 139, "lr": 8.788399324241801e-05} +{"train_loss": 0.007459401153028011, "global_step": 16547, "epoch": 139, "lr": 8.78825473051472e-05} +{"train_loss": 0.0047448971308767796, "global_step": 16548, "epoch": 139, "lr": 8.788110129349805e-05} +{"train_loss": 0.004375785123556852, "global_step": 16549, "epoch": 139, "lr": 8.78796552074734e-05} +{"train_loss": 0.006033676210790873, "global_step": 16550, "epoch": 139, "lr": 8.78782090470761e-05} +{"train_loss": 0.006550722289830446, "global_step": 16551, "epoch": 139, "lr": 8.787676281230899e-05} +{"train_loss": 0.006961731240153313, "global_step": 16552, "epoch": 139, "lr": 8.787531650317489e-05} +{"train_loss": 0.007631910499185324, "global_step": 16553, "epoch": 139, "lr": 8.787387011967666e-05} +{"train_loss": 0.009812365286052227, "global_step": 16554, "epoch": 139, "lr": 8.787242366181714e-05} +{"train_loss": 0.004203694872558117, "global_step": 16555, "epoch": 139, "lr": 8.787097712959914e-05} +{"train_loss": 0.004690582398325205, "global_step": 16556, "epoch": 139, "lr": 8.786953052302554e-05} +{"train_loss": 0.00661223940551281, "global_step": 16557, "epoch": 139, "lr": 8.786808384209916e-05} +{"train_loss": 0.006856953259557486, "global_step": 16558, "epoch": 139, "lr": 8.786663708682283e-05} +{"train_loss": 0.005406958982348442, "global_step": 16559, "epoch": 139, "lr": 8.786519025719943e-05} +{"train_loss": 0.006401251535862684, "global_step": 16560, "epoch": 139, "lr": 8.786374335323175e-05} +{"train_loss": 0.005493166856467724, "global_step": 16561, "epoch": 139, "lr": 8.786229637492267e-05} +{"train_loss": 0.008252582512795925, "global_step": 16562, "epoch": 139, "lr": 8.7860849322275e-05} +{"train_loss": 0.008782248012721539, "global_step": 16563, "epoch": 139, "lr": 8.785940219529161e-05} +{"train_loss": 0.004742865916341543, "global_step": 16564, "epoch": 139, "lr": 8.785795499397533e-05} +{"train_loss": 0.0089380769059062, "global_step": 16565, "epoch": 139, "lr": 8.785650771832899e-05} +{"train_loss": 0.004409346729516983, "global_step": 16566, "epoch": 139, "lr": 8.785506036835546e-05} +{"train_loss": 0.0052103316411376, "global_step": 16567, "epoch": 139, "lr": 8.785361294405754e-05} +{"train_loss": 0.008372063748538494, "global_step": 16568, "epoch": 139, "lr": 8.785216544543811e-05} +{"train_loss": 0.0036861358676105738, "global_step": 16569, "epoch": 139, "lr": 8.785071787249999e-05} +{"train_loss": 0.006401421502232552, "global_step": 16570, "epoch": 139, "lr": 8.784927022524603e-05} +{"train_loss": 0.005267763044685125, "global_step": 16571, "epoch": 139, "lr": 8.784782250367907e-05} +{"train_loss": 0.003497692756354809, "global_step": 16572, "epoch": 139, "lr": 8.784637470780198e-05} +{"train_loss": 0.005501756444573402, "global_step": 16573, "epoch": 139, "lr": 8.784492683761754e-05} +{"train_loss": 0.0037550022825598717, "global_step": 16574, "epoch": 139, "lr": 8.784347889312864e-05} +{"train_loss": 0.004900849424302578, "global_step": 16575, "epoch": 139, "lr": 8.784203087433811e-05} +{"train_loss": 0.006891695316880941, "global_step": 16576, "epoch": 139, "lr": 8.784058278124881e-05} +{"train_loss": 0.006382668390870094, "global_step": 16577, "epoch": 139, "lr": 8.783913461386355e-05} +{"train_loss": 0.0065107932314276695, "global_step": 16578, "epoch": 139, "lr": 8.78376863721852e-05} +{"train_loss": 0.008736427873373032, "global_step": 16579, "epoch": 139, "lr": 8.783623805621659e-05} +{"train_loss": 0.004350860603153706, "global_step": 16580, "epoch": 139, "lr": 8.783478966596058e-05} +{"train_loss": 0.006484341807663441, "global_step": 16581, "epoch": 139, "lr": 8.783334120142e-05} +{"train_loss": 0.006577164400368929, "global_step": 16582, "epoch": 139, "lr": 8.78318926625977e-05} +{"train_loss": 0.004973982460796833, "global_step": 16583, "epoch": 139, "lr": 8.78304440494965e-05} +{"train_loss": 0.005133914295583963, "global_step": 16584, "epoch": 139, "lr": 8.782899536211928e-05} +{"train_loss": 0.006170750595629215, "global_step": 16585, "epoch": 139, "lr": 8.782754660046888e-05} +{"train_loss": 0.00541330361738801, "global_step": 16586, "epoch": 139, "lr": 8.782609776454811e-05} +{"train_loss": 0.0051562245935201645, "global_step": 16587, "epoch": 139, "lr": 8.782464885435985e-05} +{"train_loss": 0.003551588160917163, "global_step": 16588, "epoch": 139, "lr": 8.782319986990694e-05} +{"train_loss": 0.006537625100463629, "global_step": 16589, "epoch": 139, "lr": 8.78217508111922e-05} +{"train_loss": 0.007115507032722235, "global_step": 16590, "epoch": 139, "lr": 8.782030167821851e-05} +{"train_loss": 0.004940437152981758, "global_step": 16591, "epoch": 139, "lr": 8.781885247098869e-05} +{"train_loss": 0.009160575456917286, "global_step": 16592, "epoch": 139, "lr": 8.78174031895056e-05} +{"train_loss": 0.005004760809242725, "global_step": 16593, "epoch": 139, "lr": 8.781595383377207e-05} +{"train_loss": 0.008416952565312386, "global_step": 16594, "epoch": 139, "lr": 8.781450440379095e-05} +{"train_loss": 0.007162901107221842, "global_step": 16595, "epoch": 139, "lr": 8.78130548995651e-05} +{"train_loss": 0.004659298341721296, "global_step": 16596, "epoch": 139, "lr": 8.781160532109735e-05} +{"train_loss": 0.009326914325356483, "global_step": 16597, "epoch": 139, "lr": 8.781015566839057e-05} +{"train_loss": 0.00542082916945219, "global_step": 16598, "epoch": 139, "lr": 8.780870594144758e-05} +{"train_loss": 0.0061830682680010796, "global_step": 16599, "epoch": 139, "lr": 8.780725614027123e-05} +{"train_loss": 0.005439897999167442, "global_step": 16600, "epoch": 139, "lr": 8.780580626486437e-05} +{"train_loss": 0.009595043025910854, "global_step": 16601, "epoch": 139, "lr": 8.780435631522985e-05} +{"train_loss": 0.006949754431843758, "global_step": 16602, "epoch": 139, "lr": 8.78029062913705e-05} +{"train_loss": 0.0056119211949408054, "global_step": 16603, "epoch": 139, "lr": 8.780145619328921e-05} +{"train_loss": 0.004523088689893484, "global_step": 16604, "epoch": 139, "lr": 8.78000060209888e-05} +{"train_loss": 0.007680941838771105, "global_step": 16605, "epoch": 139, "lr": 8.77985557744721e-05} +{"train_loss": 0.007040919736027718, "global_step": 16606, "epoch": 139, "lr": 8.779710545374198e-05} +{"train_loss": 0.0077026961371302605, "global_step": 16607, "epoch": 139, "lr": 8.779565505880128e-05} +{"train_loss": 0.00681608822196722, "global_step": 16608, "epoch": 139, "lr": 8.779420458965286e-05} +{"train_loss": 0.005843290593475103, "global_step": 16609, "epoch": 139, "lr": 8.779275404629954e-05} +{"train_loss": 0.010350181721150875, "global_step": 16610, "epoch": 139, "lr": 8.77913034287442e-05} +{"train_loss": 0.006863890215754509, "global_step": 16611, "epoch": 139, "lr": 8.778985273698966e-05} +{"train_loss": 0.006621573586016893, "global_step": 16612, "epoch": 139, "lr": 8.778840197103876e-05} +{"train_loss": 0.004798220004886389, "global_step": 16613, "epoch": 139, "lr": 8.778695113089441e-05} +{"train_loss": 0.008788030594587326, "global_step": 16614, "epoch": 139, "lr": 8.77855002165594e-05} +{"train_loss": 0.007768469862639904, "global_step": 16615, "epoch": 139, "lr": 8.77840492280366e-05} +{"train_loss": 0.006723581813275814, "global_step": 16616, "epoch": 139, "lr": 8.778259816532887e-05} +{"train_loss": 0.00593161815777421, "global_step": 16617, "epoch": 139, "lr": 8.778114702843903e-05} +{"train_loss": 0.007278877310454845, "global_step": 16618, "epoch": 139, "lr": 8.777969581736995e-05} +{"train_loss": 0.011264574714004993, "global_step": 16619, "epoch": 139, "lr": 8.777824453212446e-05} +{"train_loss": 0.006285958923399448, "global_step": 16620, "epoch": 139, "lr": 8.777679317270543e-05} +{"train_loss": 0.006815208122134209, "global_step": 16621, "epoch": 139, "lr": 8.777534173911572e-05} +{"train_loss": 0.0066947173327207565, "global_step": 16622, "epoch": 139, "lr": 8.777389023135814e-05} +{"train_loss": 0.006510057952255011, "global_step": 16623, "epoch": 139, "lr": 8.777243864943557e-05} +{"train_loss": 0.011881864629685879, "global_step": 16624, "epoch": 139, "lr": 8.777098699335084e-05} +{"train_loss": 0.006182672455906868, "global_step": 16625, "epoch": 139, "lr": 8.776953526310683e-05} +{"train_loss": 0.004812906961888075, "global_step": 16626, "epoch": 139, "lr": 8.776808345870638e-05} +{"train_loss": 0.010089630261063576, "global_step": 16627, "epoch": 139, "lr": 8.77666315801523e-05} +{"train_loss": 0.00830716360360384, "global_step": 16628, "epoch": 139, "lr": 8.77651796274475e-05} +{"train_loss": 0.0051195076666772366, "global_step": 16629, "epoch": 139, "lr": 8.77637276005948e-05} +{"train_loss": 0.009680340066552162, "global_step": 16630, "epoch": 139, "lr": 8.776227549959706e-05} +{"train_loss": 0.005838023964315653, "global_step": 16631, "epoch": 139, "lr": 8.776082332445711e-05} +{"train_loss": 0.006192418280988932, "global_step": 16632, "epoch": 139, "lr": 8.775937107517783e-05} +{"train_loss": 0.0075003644451498985, "global_step": 16633, "epoch": 139, "lr": 8.775791875176204e-05} +{"train_loss": 0.0043586441315710545, "global_step": 16634, "epoch": 139, "lr": 8.775646635421264e-05} +{"train_loss": 0.01059024315327406, "global_step": 16635, "epoch": 139, "lr": 8.775501388253244e-05} +{"train_loss": 0.006149889435619116, "global_step": 16636, "epoch": 139, "lr": 8.77535613367243e-05} +{"train_loss": 0.006866593845188618, "global_step": 16637, "epoch": 139, "lr": 8.775210871679107e-05} +{"train_loss": 0.00762744527310133, "global_step": 16638, "epoch": 139, "lr": 8.775065602273562e-05} +{"train_loss": 0.00861617922782898, "global_step": 16639, "epoch": 139, "lr": 8.774920325456078e-05} +{"train_loss": 0.006986862048506737, "global_step": 16640, "epoch": 139, "lr": 8.774775041226943e-05} +{"train_loss": 0.009297942742705345, "global_step": 16641, "epoch": 139, "lr": 8.774629749586438e-05} +{"train_loss": 0.006246870383620262, "global_step": 16642, "epoch": 139, "lr": 8.774484450534852e-05} +{"train_loss": 0.007579153403639793, "global_step": 16643, "epoch": 139, "lr": 8.77433914407247e-05} +{"train_loss": 0.0074790907092392445, "global_step": 16644, "epoch": 139, "lr": 8.774193830199575e-05} +{"train_loss": 0.009024005383253098, "global_step": 16645, "epoch": 139, "lr": 8.774048508916454e-05} +{"train_loss": 0.011010943911969662, "global_step": 16646, "epoch": 139, "lr": 8.773903180223392e-05} +{"train_loss": 0.00707273231819272, "global_step": 16647, "epoch": 139, "lr": 8.773757844120673e-05} +{"train_loss": 0.006861723028123379, "global_step": 16648, "epoch": 139, "lr": 8.773612500608586e-05} +{"train_loss": 0.009978865273296833, "global_step": 16649, "epoch": 139, "lr": 8.773467149687413e-05} +{"train_loss": 0.0063387202098965645, "global_step": 16650, "epoch": 139, "lr": 8.77332179135744e-05} +{"train_loss": 0.005540123209357262, "global_step": 16651, "epoch": 139, "lr": 8.773176425618953e-05} +{"train_loss": 0.005948923993855715, "global_step": 16652, "epoch": 139, "lr": 8.773031052472237e-05} +{"train_loss": 0.006974825169891119, "global_step": 16653, "epoch": 139, "lr": 8.772885671917578e-05} +{"train_loss": 0.008259475231170654, "global_step": 16654, "epoch": 139, "lr": 8.77274028395526e-05} +{"train_loss": 0.006321986671537161, "global_step": 16655, "epoch": 139, "lr": 8.772594888585572e-05} +{"train_loss": 0.005345786456018686, "global_step": 16656, "epoch": 139, "lr": 8.772449485808794e-05} +{"train_loss": 0.005960423965007067, "global_step": 16657, "epoch": 139, "lr": 8.772304075625217e-05} +{"train_loss": 0.00787852331995964, "global_step": 16658, "epoch": 139, "lr": 8.772158658035122e-05} +{"train_loss": 0.006694556910450719, "global_step": 16659, "epoch": 139, "lr": 8.772013233038797e-05, "val_loss": 0.010322167538106441} +{"train_loss": 0.006688628811389208, "global_step": 16660, "epoch": 140, "lr": 8.771867800636527e-05} +{"train_loss": 0.006561811547726393, "global_step": 16661, "epoch": 140, "lr": 8.771722360828598e-05} +{"train_loss": 0.007467754650861025, "global_step": 16662, "epoch": 140, "lr": 8.771576913615294e-05} +{"train_loss": 0.009884065017104149, "global_step": 16663, "epoch": 140, "lr": 8.771431458996903e-05} +{"train_loss": 0.006420785095542669, "global_step": 16664, "epoch": 140, "lr": 8.77128599697371e-05} +{"train_loss": 0.007399377413094044, "global_step": 16665, "epoch": 140, "lr": 8.771140527545998e-05} +{"train_loss": 0.006408215034753084, "global_step": 16666, "epoch": 140, "lr": 8.770995050714055e-05} +{"train_loss": 0.006538075394928455, "global_step": 16667, "epoch": 140, "lr": 8.770849566478166e-05} +{"train_loss": 0.006484390236437321, "global_step": 16668, "epoch": 140, "lr": 8.770704074838618e-05} +{"train_loss": 0.004700967576354742, "global_step": 16669, "epoch": 140, "lr": 8.770558575795694e-05} +{"train_loss": 0.009101307019591331, "global_step": 16670, "epoch": 140, "lr": 8.770413069349681e-05} +{"train_loss": 0.005110481288284063, "global_step": 16671, "epoch": 140, "lr": 8.770267555500866e-05} +{"train_loss": 0.005515031982213259, "global_step": 16672, "epoch": 140, "lr": 8.770122034249533e-05} +{"train_loss": 0.005410409532487392, "global_step": 16673, "epoch": 140, "lr": 8.769976505595967e-05} +{"train_loss": 0.006401614751666784, "global_step": 16674, "epoch": 140, "lr": 8.769830969540456e-05} +{"train_loss": 0.0071555390022695065, "global_step": 16675, "epoch": 140, "lr": 8.769685426083284e-05} +{"train_loss": 0.006193702109158039, "global_step": 16676, "epoch": 140, "lr": 8.769539875224737e-05} +{"train_loss": 0.007410599384456873, "global_step": 16677, "epoch": 140, "lr": 8.769394316965102e-05} +{"train_loss": 0.005094184540212154, "global_step": 16678, "epoch": 140, "lr": 8.769248751304664e-05} +{"train_loss": 0.006631479132920504, "global_step": 16679, "epoch": 140, "lr": 8.769103178243709e-05} +{"train_loss": 0.007000467739999294, "global_step": 16680, "epoch": 140, "lr": 8.768957597782522e-05} +{"train_loss": 0.00644131563603878, "global_step": 16681, "epoch": 140, "lr": 8.768812009921389e-05} +{"train_loss": 0.006375040393322706, "global_step": 16682, "epoch": 140, "lr": 8.768666414660597e-05} +{"train_loss": 0.005408263765275478, "global_step": 16683, "epoch": 140, "lr": 8.768520812000431e-05} +{"train_loss": 0.006501747295260429, "global_step": 16684, "epoch": 140, "lr": 8.768375201941177e-05} +{"train_loss": 0.006632576696574688, "global_step": 16685, "epoch": 140, "lr": 8.768229584483121e-05} +{"train_loss": 0.006965939421206713, "global_step": 16686, "epoch": 140, "lr": 8.768083959626548e-05} +{"train_loss": 0.007185106165707111, "global_step": 16687, "epoch": 140, "lr": 8.767938327371745e-05} +{"train_loss": 0.005708486307412386, "global_step": 16688, "epoch": 140, "lr": 8.767792687718998e-05} +{"train_loss": 0.006964405998587608, "global_step": 16689, "epoch": 140, "lr": 8.767647040668591e-05} +{"train_loss": 0.0035132276825606823, "global_step": 16690, "epoch": 140, "lr": 8.767501386220814e-05} +{"train_loss": 0.005742976441979408, "global_step": 16691, "epoch": 140, "lr": 8.767355724375949e-05} +{"train_loss": 0.0047678700648248196, "global_step": 16692, "epoch": 140, "lr": 8.767210055134286e-05} +{"train_loss": 0.006968146190047264, "global_step": 16693, "epoch": 140, "lr": 8.767064378496106e-05} +{"train_loss": 0.01037713885307312, "global_step": 16694, "epoch": 140, "lr": 8.766918694461699e-05} +{"train_loss": 0.013500545173883438, "global_step": 16695, "epoch": 140, "lr": 8.766773003031348e-05} +{"train_loss": 0.007083996199071407, "global_step": 16696, "epoch": 140, "lr": 8.766627304205341e-05} +{"train_loss": 0.003184054745361209, "global_step": 16697, "epoch": 140, "lr": 8.766481597983964e-05} +{"train_loss": 0.00459316186606884, "global_step": 16698, "epoch": 140, "lr": 8.766335884367502e-05} +{"train_loss": 0.006596285384148359, "global_step": 16699, "epoch": 140, "lr": 8.766190163356243e-05} +{"train_loss": 0.010453314520418644, "global_step": 16700, "epoch": 140, "lr": 8.766044434950474e-05} +{"train_loss": 0.006961558014154434, "global_step": 16701, "epoch": 140, "lr": 8.765898699150475e-05} +{"train_loss": 0.004497767426073551, "global_step": 16702, "epoch": 140, "lr": 8.765752955956539e-05} +{"train_loss": 0.010513088665902615, "global_step": 16703, "epoch": 140, "lr": 8.765607205368947e-05} +{"train_loss": 0.006363565102219582, "global_step": 16704, "epoch": 140, "lr": 8.76546144738799e-05} +{"train_loss": 0.008313982747495174, "global_step": 16705, "epoch": 140, "lr": 8.76531568201395e-05} +{"train_loss": 0.007857021875679493, "global_step": 16706, "epoch": 140, "lr": 8.765169909247115e-05} +{"train_loss": 0.0052774338982999325, "global_step": 16707, "epoch": 140, "lr": 8.765024129087773e-05} +{"train_loss": 0.00621744804084301, "global_step": 16708, "epoch": 140, "lr": 8.764878341536207e-05} +{"train_loss": 0.006773142144083977, "global_step": 16709, "epoch": 140, "lr": 8.764732546592705e-05} +{"train_loss": 0.00817052461206913, "global_step": 16710, "epoch": 140, "lr": 8.764586744257552e-05} +{"train_loss": 0.006597717758268118, "global_step": 16711, "epoch": 140, "lr": 8.764440934531035e-05} +{"train_loss": 0.0066265808418393135, "global_step": 16712, "epoch": 140, "lr": 8.764295117413441e-05} +{"train_loss": 0.008203920908272266, "global_step": 16713, "epoch": 140, "lr": 8.764149292905056e-05} +{"train_loss": 0.005618115421384573, "global_step": 16714, "epoch": 140, "lr": 8.764003461006166e-05} +{"train_loss": 0.005556496791541576, "global_step": 16715, "epoch": 140, "lr": 8.763857621717058e-05} +{"train_loss": 0.007551637943834066, "global_step": 16716, "epoch": 140, "lr": 8.763711775038015e-05} +{"train_loss": 0.005702857859432697, "global_step": 16717, "epoch": 140, "lr": 8.763565920969329e-05} +{"train_loss": 0.006723899394273758, "global_step": 16718, "epoch": 140, "lr": 8.763420059511281e-05} +{"train_loss": 0.006817540153861046, "global_step": 16719, "epoch": 140, "lr": 8.763274190664161e-05} +{"train_loss": 0.00651547871530056, "global_step": 16720, "epoch": 140, "lr": 8.763128314428254e-05} +{"train_loss": 0.006827855948358774, "global_step": 16721, "epoch": 140, "lr": 8.762982430803848e-05} +{"train_loss": 0.007344425655901432, "global_step": 16722, "epoch": 140, "lr": 8.762836539791225e-05} +{"train_loss": 0.005912430118769407, "global_step": 16723, "epoch": 140, "lr": 8.762690641390677e-05} +{"train_loss": 0.008115377277135849, "global_step": 16724, "epoch": 140, "lr": 8.762544735602487e-05} +{"train_loss": 0.006583509501069784, "global_step": 16725, "epoch": 140, "lr": 8.762398822426942e-05} +{"train_loss": 0.008656632155179977, "global_step": 16726, "epoch": 140, "lr": 8.76225290186433e-05} +{"train_loss": 0.007742246612906456, "global_step": 16727, "epoch": 140, "lr": 8.762106973914936e-05} +{"train_loss": 0.010084632784128189, "global_step": 16728, "epoch": 140, "lr": 8.761961038579046e-05} +{"train_loss": 0.004557723645120859, "global_step": 16729, "epoch": 140, "lr": 8.761815095856948e-05} +{"train_loss": 0.0040065087378025055, "global_step": 16730, "epoch": 140, "lr": 8.761669145748927e-05} +{"train_loss": 0.0049891397356987, "global_step": 16731, "epoch": 140, "lr": 8.761523188255272e-05} +{"train_loss": 0.0053354715928435326, "global_step": 16732, "epoch": 140, "lr": 8.761377223376268e-05} +{"train_loss": 0.0075418357737362385, "global_step": 16733, "epoch": 140, "lr": 8.7612312511122e-05} +{"train_loss": 0.007296553812921047, "global_step": 16734, "epoch": 140, "lr": 8.761085271463359e-05} +{"train_loss": 0.0028192985337227583, "global_step": 16735, "epoch": 140, "lr": 8.760939284430027e-05} +{"train_loss": 0.005549107678234577, "global_step": 16736, "epoch": 140, "lr": 8.760793290012492e-05} +{"train_loss": 0.005606963764876127, "global_step": 16737, "epoch": 140, "lr": 8.760647288211042e-05} +{"train_loss": 0.00709393247961998, "global_step": 16738, "epoch": 140, "lr": 8.760501279025963e-05} +{"train_loss": 0.004832826554775238, "global_step": 16739, "epoch": 140, "lr": 8.760355262457541e-05} +{"train_loss": 0.005490903742611408, "global_step": 16740, "epoch": 140, "lr": 8.760209238506064e-05} +{"train_loss": 0.0077635785564780235, "global_step": 16741, "epoch": 140, "lr": 8.760063207171818e-05} +{"train_loss": 0.005779185798019171, "global_step": 16742, "epoch": 140, "lr": 8.759917168455088e-05} +{"train_loss": 0.004318839870393276, "global_step": 16743, "epoch": 140, "lr": 8.759771122356163e-05} +{"train_loss": 0.007880131714046001, "global_step": 16744, "epoch": 140, "lr": 8.75962506887533e-05} +{"train_loss": 0.0061296867206692696, "global_step": 16745, "epoch": 140, "lr": 8.759479008012874e-05} +{"train_loss": 0.00741065526381135, "global_step": 16746, "epoch": 140, "lr": 8.759332939769083e-05} +{"train_loss": 0.007563160266727209, "global_step": 16747, "epoch": 140, "lr": 8.759186864144243e-05} +{"train_loss": 0.004774901550263166, "global_step": 16748, "epoch": 140, "lr": 8.75904078113864e-05} +{"train_loss": 0.00558581342920661, "global_step": 16749, "epoch": 140, "lr": 8.758894690752563e-05} +{"train_loss": 0.005341888405382633, "global_step": 16750, "epoch": 140, "lr": 8.758748592986298e-05} +{"train_loss": 0.00833186786621809, "global_step": 16751, "epoch": 140, "lr": 8.758602487840133e-05} +{"train_loss": 0.005924324970692396, "global_step": 16752, "epoch": 140, "lr": 8.758456375314353e-05} +{"train_loss": 0.006172572262585163, "global_step": 16753, "epoch": 140, "lr": 8.758310255409246e-05} +{"train_loss": 0.004383801948279142, "global_step": 16754, "epoch": 140, "lr": 8.758164128125098e-05} +{"train_loss": 0.006001635920256376, "global_step": 16755, "epoch": 140, "lr": 8.758017993462193e-05} +{"train_loss": 0.006630935240536928, "global_step": 16756, "epoch": 140, "lr": 8.757871851420825e-05} +{"train_loss": 0.00651439419016242, "global_step": 16757, "epoch": 140, "lr": 8.757725702001275e-05} +{"train_loss": 0.005785568617284298, "global_step": 16758, "epoch": 140, "lr": 8.757579545203833e-05} +{"train_loss": 0.006593001075088978, "global_step": 16759, "epoch": 140, "lr": 8.757433381028785e-05} +{"train_loss": 0.0054938611574471, "global_step": 16760, "epoch": 140, "lr": 8.757287209476417e-05} +{"train_loss": 0.006604707334190607, "global_step": 16761, "epoch": 140, "lr": 8.757141030547017e-05} +{"train_loss": 0.010215725749731064, "global_step": 16762, "epoch": 140, "lr": 8.756994844240873e-05} +{"train_loss": 0.006225325632840395, "global_step": 16763, "epoch": 140, "lr": 8.756848650558271e-05} +{"train_loss": 0.006403104867786169, "global_step": 16764, "epoch": 140, "lr": 8.756702449499499e-05} +{"train_loss": 0.0051949420012533665, "global_step": 16765, "epoch": 140, "lr": 8.756556241064841e-05} +{"train_loss": 0.005768163595348597, "global_step": 16766, "epoch": 140, "lr": 8.756410025254588e-05} +{"train_loss": 0.007241363637149334, "global_step": 16767, "epoch": 140, "lr": 8.756263802069025e-05} +{"train_loss": 0.0058854809030890465, "global_step": 16768, "epoch": 140, "lr": 8.756117571508438e-05} +{"train_loss": 0.0074072908610105515, "global_step": 16769, "epoch": 140, "lr": 8.755971333573115e-05} +{"train_loss": 0.006025918293744326, "global_step": 16770, "epoch": 140, "lr": 8.755825088263345e-05} +{"train_loss": 0.006691410206258297, "global_step": 16771, "epoch": 140, "lr": 8.755678835579412e-05} +{"train_loss": 0.007497304119169712, "global_step": 16772, "epoch": 140, "lr": 8.755532575521608e-05} +{"train_loss": 0.006539419759064913, "global_step": 16773, "epoch": 140, "lr": 8.755386308090214e-05} +{"train_loss": 0.006591239012777805, "global_step": 16774, "epoch": 140, "lr": 8.755240033285521e-05} +{"train_loss": 0.004720067605376244, "global_step": 16775, "epoch": 140, "lr": 8.755093751107816e-05} +{"train_loss": 0.006960633210837841, "global_step": 16776, "epoch": 140, "lr": 8.754947461557385e-05} +{"train_loss": 0.005221382714807987, "global_step": 16777, "epoch": 140, "lr": 8.754801164634517e-05} +{"train_loss": 0.006547595194282652, "global_step": 16778, "epoch": 140, "lr": 8.754654860339496e-05, "val_loss": 0.014568045735359192, "train_action_mse_error": 0.00018352271581534296} +{"train_loss": 0.005736344028264284, "global_step": 16779, "epoch": 141, "lr": 8.754508548672613e-05} +{"train_loss": 0.007067963946610689, "global_step": 16780, "epoch": 141, "lr": 8.754362229634152e-05} +{"train_loss": 0.004977181553840637, "global_step": 16781, "epoch": 141, "lr": 8.754215903224404e-05} +{"train_loss": 0.0060093761421740055, "global_step": 16782, "epoch": 141, "lr": 8.754069569443653e-05} +{"train_loss": 0.004584580659866333, "global_step": 16783, "epoch": 141, "lr": 8.753923228292186e-05} +{"train_loss": 0.008566233329474926, "global_step": 16784, "epoch": 141, "lr": 8.753776879770295e-05} +{"train_loss": 0.004402130842208862, "global_step": 16785, "epoch": 141, "lr": 8.753630523878261e-05} +{"train_loss": 0.00830826349556446, "global_step": 16786, "epoch": 141, "lr": 8.753484160616377e-05} +{"train_loss": 0.005264823790639639, "global_step": 16787, "epoch": 141, "lr": 8.753337789984926e-05} +{"train_loss": 0.006971904542297125, "global_step": 16788, "epoch": 141, "lr": 8.753191411984198e-05} +{"train_loss": 0.00571090541779995, "global_step": 16789, "epoch": 141, "lr": 8.753045026614479e-05} +{"train_loss": 0.007014223840087652, "global_step": 16790, "epoch": 141, "lr": 8.752898633876059e-05} +{"train_loss": 0.005551357753574848, "global_step": 16791, "epoch": 141, "lr": 8.752752233769221e-05} +{"train_loss": 0.008605367504060268, "global_step": 16792, "epoch": 141, "lr": 8.752605826294255e-05} +{"train_loss": 0.005875225644558668, "global_step": 16793, "epoch": 141, "lr": 8.75245941145145e-05} +{"train_loss": 0.005502126179635525, "global_step": 16794, "epoch": 141, "lr": 8.752312989241091e-05} +{"train_loss": 0.007796640042215586, "global_step": 16795, "epoch": 141, "lr": 8.752166559663467e-05} +{"train_loss": 0.005239735823124647, "global_step": 16796, "epoch": 141, "lr": 8.752020122718864e-05} +{"train_loss": 0.0054677631705999374, "global_step": 16797, "epoch": 141, "lr": 8.751873678407571e-05} +{"train_loss": 0.0054068355821073055, "global_step": 16798, "epoch": 141, "lr": 8.751727226729875e-05} +{"train_loss": 0.007982826791703701, "global_step": 16799, "epoch": 141, "lr": 8.751580767686063e-05} +{"train_loss": 0.005659083370119333, "global_step": 16800, "epoch": 141, "lr": 8.751434301276422e-05} +{"train_loss": 0.005635482259094715, "global_step": 16801, "epoch": 141, "lr": 8.751287827501242e-05} +{"train_loss": 0.008187642320990562, "global_step": 16802, "epoch": 141, "lr": 8.751141346360809e-05} +{"train_loss": 0.0050591700710356236, "global_step": 16803, "epoch": 141, "lr": 8.75099485785541e-05} +{"train_loss": 0.005041609983891249, "global_step": 16804, "epoch": 141, "lr": 8.750848361985333e-05} +{"train_loss": 0.003991761710494757, "global_step": 16805, "epoch": 141, "lr": 8.750701858750868e-05} +{"train_loss": 0.00721147283911705, "global_step": 16806, "epoch": 141, "lr": 8.750555348152298e-05} +{"train_loss": 0.00712869968265295, "global_step": 16807, "epoch": 141, "lr": 8.750408830189915e-05} +{"train_loss": 0.00812830775976181, "global_step": 16808, "epoch": 141, "lr": 8.750262304864004e-05} +{"train_loss": 0.006579200271517038, "global_step": 16809, "epoch": 141, "lr": 8.750115772174855e-05} +{"train_loss": 0.008453670889139175, "global_step": 16810, "epoch": 141, "lr": 8.749969232122752e-05} +{"train_loss": 0.004921138286590576, "global_step": 16811, "epoch": 141, "lr": 8.749822684707987e-05} +{"train_loss": 0.0065527805127203465, "global_step": 16812, "epoch": 141, "lr": 8.749676129930844e-05} +{"train_loss": 0.004858002066612244, "global_step": 16813, "epoch": 141, "lr": 8.749529567791614e-05} +{"train_loss": 0.009186972863972187, "global_step": 16814, "epoch": 141, "lr": 8.749382998290583e-05} +{"train_loss": 0.0033405793365091085, "global_step": 16815, "epoch": 141, "lr": 8.74923642142804e-05} +{"train_loss": 0.007540442515164614, "global_step": 16816, "epoch": 141, "lr": 8.74908983720427e-05} +{"train_loss": 0.007095555309206247, "global_step": 16817, "epoch": 141, "lr": 8.748943245619563e-05} +{"train_loss": 0.0052769239991903305, "global_step": 16818, "epoch": 141, "lr": 8.748796646674207e-05} +{"train_loss": 0.005951050203293562, "global_step": 16819, "epoch": 141, "lr": 8.748650040368489e-05} +{"train_loss": 0.007309489417821169, "global_step": 16820, "epoch": 141, "lr": 8.748503426702698e-05} +{"train_loss": 0.004047528840601444, "global_step": 16821, "epoch": 141, "lr": 8.748356805677121e-05} +{"train_loss": 0.007360403425991535, "global_step": 16822, "epoch": 141, "lr": 8.748210177292044e-05} +{"train_loss": 0.006942437961697578, "global_step": 16823, "epoch": 141, "lr": 8.748063541547757e-05} +{"train_loss": 0.00662354426458478, "global_step": 16824, "epoch": 141, "lr": 8.747916898444549e-05} +{"train_loss": 0.007060966454446316, "global_step": 16825, "epoch": 141, "lr": 8.747770247982708e-05} +{"train_loss": 0.005498415790498257, "global_step": 16826, "epoch": 141, "lr": 8.747623590162517e-05} +{"train_loss": 0.006686306558549404, "global_step": 16827, "epoch": 141, "lr": 8.74747692498427e-05} +{"train_loss": 0.008457890711724758, "global_step": 16828, "epoch": 141, "lr": 8.747330252448251e-05} +{"train_loss": 0.008455275557935238, "global_step": 16829, "epoch": 141, "lr": 8.747183572554748e-05} +{"train_loss": 0.009250413626432419, "global_step": 16830, "epoch": 141, "lr": 8.747036885304055e-05} +{"train_loss": 0.0037066657096147537, "global_step": 16831, "epoch": 141, "lr": 8.74689019069645e-05} +{"train_loss": 0.005269051995128393, "global_step": 16832, "epoch": 141, "lr": 8.74674348873223e-05} +{"train_loss": 0.007059148512780666, "global_step": 16833, "epoch": 141, "lr": 8.74659677941168e-05} +{"train_loss": 0.00784474890679121, "global_step": 16834, "epoch": 141, "lr": 8.746450062735086e-05} +{"train_loss": 0.005521466489881277, "global_step": 16835, "epoch": 141, "lr": 8.746303338702737e-05} +{"train_loss": 0.007319328375160694, "global_step": 16836, "epoch": 141, "lr": 8.746156607314922e-05} +{"train_loss": 0.007384797558188438, "global_step": 16837, "epoch": 141, "lr": 8.746009868571928e-05} +{"train_loss": 0.006110513582825661, "global_step": 16838, "epoch": 141, "lr": 8.745863122474045e-05} +{"train_loss": 0.0052710059098899364, "global_step": 16839, "epoch": 141, "lr": 8.74571636902156e-05} +{"train_loss": 0.005778870545327663, "global_step": 16840, "epoch": 141, "lr": 8.74556960821476e-05} +{"train_loss": 0.004291211254894733, "global_step": 16841, "epoch": 141, "lr": 8.745422840053936e-05} +{"train_loss": 0.005458996165543795, "global_step": 16842, "epoch": 141, "lr": 8.745276064539373e-05} +{"train_loss": 0.007470220793038607, "global_step": 16843, "epoch": 141, "lr": 8.74512928167136e-05} +{"train_loss": 0.006849647965282202, "global_step": 16844, "epoch": 141, "lr": 8.744982491450188e-05} +{"train_loss": 0.0056690918281674385, "global_step": 16845, "epoch": 141, "lr": 8.74483569387614e-05} +{"train_loss": 0.007278377655893564, "global_step": 16846, "epoch": 141, "lr": 8.744688888949511e-05} +{"train_loss": 0.008461199700832367, "global_step": 16847, "epoch": 141, "lr": 8.744542076670582e-05} +{"train_loss": 0.005452521611005068, "global_step": 16848, "epoch": 141, "lr": 8.744395257039646e-05} +{"train_loss": 0.009195438586175442, "global_step": 16849, "epoch": 141, "lr": 8.744248430056991e-05} +{"train_loss": 0.006047117989510298, "global_step": 16850, "epoch": 141, "lr": 8.744101595722902e-05} +{"train_loss": 0.0054037789814174175, "global_step": 16851, "epoch": 141, "lr": 8.743954754037671e-05} +{"train_loss": 0.004058001097291708, "global_step": 16852, "epoch": 141, "lr": 8.743807905001584e-05} +{"train_loss": 0.0037038817536085844, "global_step": 16853, "epoch": 141, "lr": 8.743661048614931e-05} +{"train_loss": 0.006231341976672411, "global_step": 16854, "epoch": 141, "lr": 8.743514184877999e-05} +{"train_loss": 0.006034584250301123, "global_step": 16855, "epoch": 141, "lr": 8.743367313791078e-05} +{"train_loss": 0.0041222600266337395, "global_step": 16856, "epoch": 141, "lr": 8.743220435354453e-05} +{"train_loss": 0.00820433534681797, "global_step": 16857, "epoch": 141, "lr": 8.743073549568417e-05} +{"train_loss": 0.005763588473200798, "global_step": 16858, "epoch": 141, "lr": 8.742926656433254e-05} +{"train_loss": 0.005504379514604807, "global_step": 16859, "epoch": 141, "lr": 8.742779755949256e-05} +{"train_loss": 0.007755281403660774, "global_step": 16860, "epoch": 141, "lr": 8.742632848116707e-05} +{"train_loss": 0.006273316219449043, "global_step": 16861, "epoch": 141, "lr": 8.7424859329359e-05} +{"train_loss": 0.0047511267475783825, "global_step": 16862, "epoch": 141, "lr": 8.742339010407122e-05} +{"train_loss": 0.006546305492520332, "global_step": 16863, "epoch": 141, "lr": 8.742192080530663e-05} +{"train_loss": 0.0052998242899775505, "global_step": 16864, "epoch": 141, "lr": 8.742045143306806e-05} +{"train_loss": 0.007016581948846579, "global_step": 16865, "epoch": 141, "lr": 8.741898198735845e-05} +{"train_loss": 0.006605540402233601, "global_step": 16866, "epoch": 141, "lr": 8.741751246818066e-05} +{"train_loss": 0.007197865750640631, "global_step": 16867, "epoch": 141, "lr": 8.74160428755376e-05} +{"train_loss": 0.005538857541978359, "global_step": 16868, "epoch": 141, "lr": 8.741457320943211e-05} +{"train_loss": 0.009598102420568466, "global_step": 16869, "epoch": 141, "lr": 8.741310346986711e-05} +{"train_loss": 0.00662964815273881, "global_step": 16870, "epoch": 141, "lr": 8.74116336568455e-05} +{"train_loss": 0.0054039424285292625, "global_step": 16871, "epoch": 141, "lr": 8.741016377037013e-05} +{"train_loss": 0.005816874094307423, "global_step": 16872, "epoch": 141, "lr": 8.740869381044388e-05} +{"train_loss": 0.005637488327920437, "global_step": 16873, "epoch": 141, "lr": 8.74072237770697e-05} +{"train_loss": 0.007239001337438822, "global_step": 16874, "epoch": 141, "lr": 8.740575367025039e-05} +{"train_loss": 0.004865614697337151, "global_step": 16875, "epoch": 141, "lr": 8.740428348998891e-05} +{"train_loss": 0.004145528189837933, "global_step": 16876, "epoch": 141, "lr": 8.740281323628809e-05} +{"train_loss": 0.006490549072623253, "global_step": 16877, "epoch": 141, "lr": 8.740134290915085e-05} +{"train_loss": 0.005157062783837318, "global_step": 16878, "epoch": 141, "lr": 8.739987250858007e-05} +{"train_loss": 0.0052575962617993355, "global_step": 16879, "epoch": 141, "lr": 8.739840203457863e-05} +{"train_loss": 0.006785445846617222, "global_step": 16880, "epoch": 141, "lr": 8.739693148714945e-05} +{"train_loss": 0.004775994922965765, "global_step": 16881, "epoch": 141, "lr": 8.739546086629536e-05} +{"train_loss": 0.005688226781785488, "global_step": 16882, "epoch": 141, "lr": 8.73939901720193e-05} +{"train_loss": 0.004340107087045908, "global_step": 16883, "epoch": 141, "lr": 8.739251940432411e-05} +{"train_loss": 0.004779343958944082, "global_step": 16884, "epoch": 141, "lr": 8.739104856321271e-05} +{"train_loss": 0.005774193909019232, "global_step": 16885, "epoch": 141, "lr": 8.7389577648688e-05} +{"train_loss": 0.0076067280024290085, "global_step": 16886, "epoch": 141, "lr": 8.738810666075283e-05} +{"train_loss": 0.004907000344246626, "global_step": 16887, "epoch": 141, "lr": 8.738663559941012e-05} +{"train_loss": 0.005670217797160149, "global_step": 16888, "epoch": 141, "lr": 8.738516446466275e-05} +{"train_loss": 0.007549051195383072, "global_step": 16889, "epoch": 141, "lr": 8.738369325651358e-05} +{"train_loss": 0.005919689312577248, "global_step": 16890, "epoch": 141, "lr": 8.738222197496553e-05} +{"train_loss": 0.004104380961507559, "global_step": 16891, "epoch": 141, "lr": 8.73807506200215e-05} +{"train_loss": 0.0067632137797772884, "global_step": 16892, "epoch": 141, "lr": 8.737927919168434e-05} +{"train_loss": 0.005344776436686516, "global_step": 16893, "epoch": 141, "lr": 8.737780768995696e-05} +{"train_loss": 0.006831103935837746, "global_step": 16894, "epoch": 141, "lr": 8.737633611484226e-05} +{"train_loss": 0.006710190325975418, "global_step": 16895, "epoch": 141, "lr": 8.737486446634311e-05} +{"train_loss": 0.007278150413185358, "global_step": 16896, "epoch": 141, "lr": 8.73733927444624e-05} +{"train_loss": 0.006231292338744432, "global_step": 16897, "epoch": 141, "lr": 8.737192094920303e-05, "val_loss": 0.023084836080670357} +{"train_loss": 0.004280924331396818, "global_step": 16898, "epoch": 142, "lr": 8.73704490805679e-05} +{"train_loss": 0.005684633739292622, "global_step": 16899, "epoch": 142, "lr": 8.736897713855987e-05} +{"train_loss": 0.0056185671128332615, "global_step": 16900, "epoch": 142, "lr": 8.736750512318184e-05} +{"train_loss": 0.00572872394695878, "global_step": 16901, "epoch": 142, "lr": 8.736603303443671e-05} +{"train_loss": 0.005553895607590675, "global_step": 16902, "epoch": 142, "lr": 8.736456087232738e-05} +{"train_loss": 0.004624116700142622, "global_step": 16903, "epoch": 142, "lr": 8.736308863685672e-05} +{"train_loss": 0.007106896489858627, "global_step": 16904, "epoch": 142, "lr": 8.736161632802761e-05} +{"train_loss": 0.00924643874168396, "global_step": 16905, "epoch": 142, "lr": 8.736014394584297e-05} +{"train_loss": 0.005859775934368372, "global_step": 16906, "epoch": 142, "lr": 8.73586714903057e-05} +{"train_loss": 0.00446003582328558, "global_step": 16907, "epoch": 142, "lr": 8.735719896141865e-05} +{"train_loss": 0.00437351455911994, "global_step": 16908, "epoch": 142, "lr": 8.735572635918472e-05} +{"train_loss": 0.006020424421876669, "global_step": 16909, "epoch": 142, "lr": 8.735425368360684e-05} +{"train_loss": 0.010380808264017105, "global_step": 16910, "epoch": 142, "lr": 8.735278093468785e-05} +{"train_loss": 0.006265362724661827, "global_step": 16911, "epoch": 142, "lr": 8.735130811243067e-05} +{"train_loss": 0.008241691626608372, "global_step": 16912, "epoch": 142, "lr": 8.734983521683819e-05} +{"train_loss": 0.004678888712078333, "global_step": 16913, "epoch": 142, "lr": 8.73483622479133e-05} +{"train_loss": 0.006144245155155659, "global_step": 16914, "epoch": 142, "lr": 8.73468892056589e-05} +{"train_loss": 0.004933950956910849, "global_step": 16915, "epoch": 142, "lr": 8.734541609007785e-05} +{"train_loss": 0.006256441585719585, "global_step": 16916, "epoch": 142, "lr": 8.734394290117307e-05} +{"train_loss": 0.005342147313058376, "global_step": 16917, "epoch": 142, "lr": 8.734246963894746e-05} +{"train_loss": 0.006209148094058037, "global_step": 16918, "epoch": 142, "lr": 8.734099630340389e-05} +{"train_loss": 0.006329918745905161, "global_step": 16919, "epoch": 142, "lr": 8.733952289454527e-05} +{"train_loss": 0.00806588213890791, "global_step": 16920, "epoch": 142, "lr": 8.733804941237448e-05} +{"train_loss": 0.005404744762927294, "global_step": 16921, "epoch": 142, "lr": 8.733657585689443e-05} +{"train_loss": 0.006765314377844334, "global_step": 16922, "epoch": 142, "lr": 8.7335102228108e-05} +{"train_loss": 0.007341329008340836, "global_step": 16923, "epoch": 142, "lr": 8.733362852601807e-05} +{"train_loss": 0.0036133956164121628, "global_step": 16924, "epoch": 142, "lr": 8.733215475062757e-05} +{"train_loss": 0.007338360883295536, "global_step": 16925, "epoch": 142, "lr": 8.733068090193937e-05} +{"train_loss": 0.007146361283957958, "global_step": 16926, "epoch": 142, "lr": 8.732920697995634e-05} +{"train_loss": 0.004195021465420723, "global_step": 16927, "epoch": 142, "lr": 8.732773298468143e-05} +{"train_loss": 0.004170888569205999, "global_step": 16928, "epoch": 142, "lr": 8.732625891611749e-05} +{"train_loss": 0.0040868367068469524, "global_step": 16929, "epoch": 142, "lr": 8.732478477426743e-05} +{"train_loss": 0.005037042312324047, "global_step": 16930, "epoch": 142, "lr": 8.732331055913414e-05} +{"train_loss": 0.0038879471831023693, "global_step": 16931, "epoch": 142, "lr": 8.732183627072052e-05} +{"train_loss": 0.00487022427842021, "global_step": 16932, "epoch": 142, "lr": 8.732036190902946e-05} +{"train_loss": 0.006967791821807623, "global_step": 16933, "epoch": 142, "lr": 8.731888747406388e-05} +{"train_loss": 0.008335436694324017, "global_step": 16934, "epoch": 142, "lr": 8.731741296582662e-05} +{"train_loss": 0.006504223216325045, "global_step": 16935, "epoch": 142, "lr": 8.731593838432062e-05} +{"train_loss": 0.004005882423371077, "global_step": 16936, "epoch": 142, "lr": 8.731446372954875e-05} +{"train_loss": 0.004918443504720926, "global_step": 16937, "epoch": 142, "lr": 8.731298900151392e-05} +{"train_loss": 0.008673039264976978, "global_step": 16938, "epoch": 142, "lr": 8.731151420021903e-05} +{"train_loss": 0.007344114128500223, "global_step": 16939, "epoch": 142, "lr": 8.731003932566697e-05} +{"train_loss": 0.003780307248234749, "global_step": 16940, "epoch": 142, "lr": 8.730856437786063e-05} +{"train_loss": 0.005952050909399986, "global_step": 16941, "epoch": 142, "lr": 8.730708935680292e-05} +{"train_loss": 0.006481424439698458, "global_step": 16942, "epoch": 142, "lr": 8.730561426249671e-05} +{"train_loss": 0.005990507081151009, "global_step": 16943, "epoch": 142, "lr": 8.730413909494492e-05} +{"train_loss": 0.007717988453805447, "global_step": 16944, "epoch": 142, "lr": 8.730266385415043e-05} +{"train_loss": 0.006118078716099262, "global_step": 16945, "epoch": 142, "lr": 8.730118854011615e-05} +{"train_loss": 0.0036605140194296837, "global_step": 16946, "epoch": 142, "lr": 8.729971315284497e-05} +{"train_loss": 0.005921903531998396, "global_step": 16947, "epoch": 142, "lr": 8.729823769233979e-05} +{"train_loss": 0.00384659506380558, "global_step": 16948, "epoch": 142, "lr": 8.729676215860351e-05} +{"train_loss": 0.004429129417985678, "global_step": 16949, "epoch": 142, "lr": 8.729528655163901e-05} +{"train_loss": 0.008814450353384018, "global_step": 16950, "epoch": 142, "lr": 8.729381087144922e-05} +{"train_loss": 0.006357209291309118, "global_step": 16951, "epoch": 142, "lr": 8.729233511803699e-05} +{"train_loss": 0.004063200205564499, "global_step": 16952, "epoch": 142, "lr": 8.729085929140526e-05} +{"train_loss": 0.00425832811743021, "global_step": 16953, "epoch": 142, "lr": 8.72893833915569e-05} +{"train_loss": 0.007223040331155062, "global_step": 16954, "epoch": 142, "lr": 8.728790741849484e-05} +{"train_loss": 0.00804433785378933, "global_step": 16955, "epoch": 142, "lr": 8.728643137222195e-05} +{"train_loss": 0.004769239109009504, "global_step": 16956, "epoch": 142, "lr": 8.728495525274113e-05} +{"train_loss": 0.005879403557628393, "global_step": 16957, "epoch": 142, "lr": 8.728347906005527e-05} +{"train_loss": 0.004537299275398254, "global_step": 16958, "epoch": 142, "lr": 8.728200279416729e-05} +{"train_loss": 0.004306082613766193, "global_step": 16959, "epoch": 142, "lr": 8.72805264550801e-05} +{"train_loss": 0.004956760909408331, "global_step": 16960, "epoch": 142, "lr": 8.727905004279656e-05} +{"train_loss": 0.007389421574771404, "global_step": 16961, "epoch": 142, "lr": 8.72775735573196e-05} +{"train_loss": 0.004379878286272287, "global_step": 16962, "epoch": 142, "lr": 8.72760969986521e-05} +{"train_loss": 0.004783358424901962, "global_step": 16963, "epoch": 142, "lr": 8.727462036679696e-05} +{"train_loss": 0.005807889625430107, "global_step": 16964, "epoch": 142, "lr": 8.72731436617571e-05} +{"train_loss": 0.0037450511008501053, "global_step": 16965, "epoch": 142, "lr": 8.727166688353539e-05} +{"train_loss": 0.0071899318136274815, "global_step": 16966, "epoch": 142, "lr": 8.727019003213475e-05} +{"train_loss": 0.006505207624286413, "global_step": 16967, "epoch": 142, "lr": 8.726871310755808e-05} +{"train_loss": 0.006159715820103884, "global_step": 16968, "epoch": 142, "lr": 8.726723610980826e-05} +{"train_loss": 0.007817775011062622, "global_step": 16969, "epoch": 142, "lr": 8.72657590388882e-05} +{"train_loss": 0.004562229849398136, "global_step": 16970, "epoch": 142, "lr": 8.726428189480082e-05} +{"train_loss": 0.006247764453291893, "global_step": 16971, "epoch": 142, "lr": 8.7262804677549e-05} +{"train_loss": 0.004200046416372061, "global_step": 16972, "epoch": 142, "lr": 8.726132738713563e-05} +{"train_loss": 0.0056321388110518456, "global_step": 16973, "epoch": 142, "lr": 8.725985002356365e-05} +{"train_loss": 0.00553195970132947, "global_step": 16974, "epoch": 142, "lr": 8.72583725868359e-05} +{"train_loss": 0.007461901754140854, "global_step": 16975, "epoch": 142, "lr": 8.725689507695536e-05} +{"train_loss": 0.004375542048364878, "global_step": 16976, "epoch": 142, "lr": 8.725541749392487e-05} +{"train_loss": 0.006587289739400148, "global_step": 16977, "epoch": 142, "lr": 8.725393983774734e-05} +{"train_loss": 0.004762537311762571, "global_step": 16978, "epoch": 142, "lr": 8.725246210842569e-05} +{"train_loss": 0.00567625043913722, "global_step": 16979, "epoch": 142, "lr": 8.725098430596279e-05} +{"train_loss": 0.006248588673770428, "global_step": 16980, "epoch": 142, "lr": 8.724950643036157e-05} +{"train_loss": 0.005835643969476223, "global_step": 16981, "epoch": 142, "lr": 8.724802848162492e-05} +{"train_loss": 0.00564621202647686, "global_step": 16982, "epoch": 142, "lr": 8.724655045975576e-05} +{"train_loss": 0.003890963736921549, "global_step": 16983, "epoch": 142, "lr": 8.724507236475696e-05} +{"train_loss": 0.006466110702604055, "global_step": 16984, "epoch": 142, "lr": 8.724359419663146e-05} +{"train_loss": 0.004441717639565468, "global_step": 16985, "epoch": 142, "lr": 8.724211595538213e-05} +{"train_loss": 0.00494290329515934, "global_step": 16986, "epoch": 142, "lr": 8.724063764101189e-05} +{"train_loss": 0.006675771437585354, "global_step": 16987, "epoch": 142, "lr": 8.723915925352361e-05} +{"train_loss": 0.0045835524797439575, "global_step": 16988, "epoch": 142, "lr": 8.723768079292025e-05} +{"train_loss": 0.007212357595562935, "global_step": 16989, "epoch": 142, "lr": 8.723620225920468e-05} +{"train_loss": 0.006446412764489651, "global_step": 16990, "epoch": 142, "lr": 8.723472365237978e-05} +{"train_loss": 0.004456050228327513, "global_step": 16991, "epoch": 142, "lr": 8.723324497244852e-05} +{"train_loss": 0.007765268441289663, "global_step": 16992, "epoch": 142, "lr": 8.723176621941374e-05} +{"train_loss": 0.005616040900349617, "global_step": 16993, "epoch": 142, "lr": 8.723028739327834e-05} +{"train_loss": 0.005131689831614494, "global_step": 16994, "epoch": 142, "lr": 8.722880849404527e-05} +{"train_loss": 0.0047943489626049995, "global_step": 16995, "epoch": 142, "lr": 8.722732952171742e-05} +{"train_loss": 0.008458024822175503, "global_step": 16996, "epoch": 142, "lr": 8.722585047629768e-05} +{"train_loss": 0.004924295470118523, "global_step": 16997, "epoch": 142, "lr": 8.722437135778897e-05} +{"train_loss": 0.005654615815728903, "global_step": 16998, "epoch": 142, "lr": 8.722289216619417e-05} +{"train_loss": 0.005706793628633022, "global_step": 16999, "epoch": 142, "lr": 8.722141290151618e-05} +{"train_loss": 0.005631599109619856, "global_step": 17000, "epoch": 142, "lr": 8.721993356375795e-05} +{"train_loss": 0.0049392543733119965, "global_step": 17001, "epoch": 142, "lr": 8.721845415292235e-05} +{"train_loss": 0.007711908780038357, "global_step": 17002, "epoch": 142, "lr": 8.721697466901229e-05} +{"train_loss": 0.006534612271934748, "global_step": 17003, "epoch": 142, "lr": 8.721549511203066e-05} +{"train_loss": 0.0066762520000338554, "global_step": 17004, "epoch": 142, "lr": 8.72140154819804e-05} +{"train_loss": 0.005452625919133425, "global_step": 17005, "epoch": 142, "lr": 8.721253577886441e-05} +{"train_loss": 0.006669625174254179, "global_step": 17006, "epoch": 142, "lr": 8.721105600268555e-05} +{"train_loss": 0.006577807012945414, "global_step": 17007, "epoch": 142, "lr": 8.720957615344678e-05} +{"train_loss": 0.0038221341092139482, "global_step": 17008, "epoch": 142, "lr": 8.720809623115096e-05} +{"train_loss": 0.007968267425894737, "global_step": 17009, "epoch": 142, "lr": 8.720661623580104e-05} +{"train_loss": 0.005693371873348951, "global_step": 17010, "epoch": 142, "lr": 8.72051361673999e-05} +{"train_loss": 0.008526830933988094, "global_step": 17011, "epoch": 142, "lr": 8.720365602595044e-05} +{"train_loss": 0.005955930333584547, "global_step": 17012, "epoch": 142, "lr": 8.720217581145557e-05} +{"train_loss": 0.005171830300241709, "global_step": 17013, "epoch": 142, "lr": 8.720069552391824e-05} +{"train_loss": 0.004847055301070213, "global_step": 17014, "epoch": 142, "lr": 8.719921516334129e-05} +{"train_loss": 0.007442856207489967, "global_step": 17015, "epoch": 142, "lr": 8.719773472972766e-05} +{"train_loss": 0.005871769132781304, "global_step": 17016, "epoch": 142, "lr": 8.719625422308025e-05, "val_loss": 0.009821089915931225} +{"train_loss": 0.004860571585595608, "global_step": 17017, "epoch": 143, "lr": 8.719477364340196e-05} +{"train_loss": 0.005315401125699282, "global_step": 17018, "epoch": 143, "lr": 8.719329299069571e-05} +{"train_loss": 0.005202540196478367, "global_step": 17019, "epoch": 143, "lr": 8.71918122649644e-05} +{"train_loss": 0.006785562727600336, "global_step": 17020, "epoch": 143, "lr": 8.719033146621096e-05} +{"train_loss": 0.010767875239253044, "global_step": 17021, "epoch": 143, "lr": 8.718885059443826e-05} +{"train_loss": 0.004027009941637516, "global_step": 17022, "epoch": 143, "lr": 8.718736964964923e-05} +{"train_loss": 0.004385682754218578, "global_step": 17023, "epoch": 143, "lr": 8.718588863184676e-05} +{"train_loss": 0.008313012309372425, "global_step": 17024, "epoch": 143, "lr": 8.718440754103378e-05} +{"train_loss": 0.00830114260315895, "global_step": 17025, "epoch": 143, "lr": 8.71829263772132e-05} +{"train_loss": 0.007994704879820347, "global_step": 17026, "epoch": 143, "lr": 8.71814451403879e-05} +{"train_loss": 0.007900155149400234, "global_step": 17027, "epoch": 143, "lr": 8.717996383056081e-05} +{"train_loss": 0.007409663405269384, "global_step": 17028, "epoch": 143, "lr": 8.717848244773485e-05} +{"train_loss": 0.009394960477948189, "global_step": 17029, "epoch": 143, "lr": 8.71770009919129e-05} +{"train_loss": 0.005220734514296055, "global_step": 17030, "epoch": 143, "lr": 8.717551946309788e-05} +{"train_loss": 0.006260413210839033, "global_step": 17031, "epoch": 143, "lr": 8.717403786129269e-05} +{"train_loss": 0.006286153104156256, "global_step": 17032, "epoch": 143, "lr": 8.717255618650026e-05} +{"train_loss": 0.0076852161437273026, "global_step": 17033, "epoch": 143, "lr": 8.717107443872348e-05} +{"train_loss": 0.006207889877259731, "global_step": 17034, "epoch": 143, "lr": 8.716959261796526e-05} +{"train_loss": 0.005817480850964785, "global_step": 17035, "epoch": 143, "lr": 8.716811072422852e-05} +{"train_loss": 0.005590471904724836, "global_step": 17036, "epoch": 143, "lr": 8.716662875751618e-05} +{"train_loss": 0.007044964004307985, "global_step": 17037, "epoch": 143, "lr": 8.716514671783112e-05} +{"train_loss": 0.00764884427189827, "global_step": 17038, "epoch": 143, "lr": 8.716366460517626e-05} +{"train_loss": 0.00794251635670662, "global_step": 17039, "epoch": 143, "lr": 8.716218241955454e-05} +{"train_loss": 0.005617518909275532, "global_step": 17040, "epoch": 143, "lr": 8.716070016096882e-05} +{"train_loss": 0.007913668639957905, "global_step": 17041, "epoch": 143, "lr": 8.715921782942205e-05} +{"train_loss": 0.005813555791974068, "global_step": 17042, "epoch": 143, "lr": 8.715773542491712e-05} +{"train_loss": 0.005009352695196867, "global_step": 17043, "epoch": 143, "lr": 8.715625294745694e-05} +{"train_loss": 0.0051912786439061165, "global_step": 17044, "epoch": 143, "lr": 8.715477039704443e-05} +{"train_loss": 0.008555551990866661, "global_step": 17045, "epoch": 143, "lr": 8.71532877736825e-05} +{"train_loss": 0.004311094060540199, "global_step": 17046, "epoch": 143, "lr": 8.715180507737406e-05} +{"train_loss": 0.004992416128516197, "global_step": 17047, "epoch": 143, "lr": 8.715032230812202e-05} +{"train_loss": 0.007311154156923294, "global_step": 17048, "epoch": 143, "lr": 8.714883946592929e-05} +{"train_loss": 0.005054989829659462, "global_step": 17049, "epoch": 143, "lr": 8.714735655079878e-05} +{"train_loss": 0.007174555212259293, "global_step": 17050, "epoch": 143, "lr": 8.71458735627334e-05} +{"train_loss": 0.0066492739133536816, "global_step": 17051, "epoch": 143, "lr": 8.714439050173608e-05} +{"train_loss": 0.008747976273298264, "global_step": 17052, "epoch": 143, "lr": 8.714290736780973e-05} +{"train_loss": 0.00436242762953043, "global_step": 17053, "epoch": 143, "lr": 8.714142416095721e-05} +{"train_loss": 0.007104047108441591, "global_step": 17054, "epoch": 143, "lr": 8.713994088118149e-05} +{"train_loss": 0.00989466905593872, "global_step": 17055, "epoch": 143, "lr": 8.713845752848547e-05} +{"train_loss": 0.009456975385546684, "global_step": 17056, "epoch": 143, "lr": 8.713697410287205e-05} +{"train_loss": 0.006470005493611097, "global_step": 17057, "epoch": 143, "lr": 8.713549060434416e-05} +{"train_loss": 0.003645205171778798, "global_step": 17058, "epoch": 143, "lr": 8.713400703290469e-05} +{"train_loss": 0.005926148500293493, "global_step": 17059, "epoch": 143, "lr": 8.713252338855655e-05} +{"train_loss": 0.005217480007559061, "global_step": 17060, "epoch": 143, "lr": 8.713103967130269e-05} +{"train_loss": 0.0037093386054039, "global_step": 17061, "epoch": 143, "lr": 8.712955588114599e-05} +{"train_loss": 0.006839631590992212, "global_step": 17062, "epoch": 143, "lr": 8.712807201808939e-05} +{"train_loss": 0.008987128734588623, "global_step": 17063, "epoch": 143, "lr": 8.712658808213577e-05} +{"train_loss": 0.005800351966172457, "global_step": 17064, "epoch": 143, "lr": 8.712510407328806e-05} +{"train_loss": 0.008290501311421394, "global_step": 17065, "epoch": 143, "lr": 8.712361999154919e-05} +{"train_loss": 0.007910840213298798, "global_step": 17066, "epoch": 143, "lr": 8.712213583692203e-05} +{"train_loss": 0.0077382349409163, "global_step": 17067, "epoch": 143, "lr": 8.712065160940957e-05} +{"train_loss": 0.00646686227992177, "global_step": 17068, "epoch": 143, "lr": 8.711916730901464e-05} +{"train_loss": 0.004943951964378357, "global_step": 17069, "epoch": 143, "lr": 8.711768293574019e-05} +{"train_loss": 0.004499274771660566, "global_step": 17070, "epoch": 143, "lr": 8.711619848958914e-05} +{"train_loss": 0.004508044570684433, "global_step": 17071, "epoch": 143, "lr": 8.711471397056441e-05} +{"train_loss": 0.007957867346704006, "global_step": 17072, "epoch": 143, "lr": 8.71132293786689e-05} +{"train_loss": 0.004678879864513874, "global_step": 17073, "epoch": 143, "lr": 8.711174471390552e-05} +{"train_loss": 0.007965472526848316, "global_step": 17074, "epoch": 143, "lr": 8.71102599762772e-05} +{"train_loss": 0.007592388894408941, "global_step": 17075, "epoch": 143, "lr": 8.710877516578683e-05} +{"train_loss": 0.006227938458323479, "global_step": 17076, "epoch": 143, "lr": 8.710729028243739e-05} +{"train_loss": 0.007510815747082233, "global_step": 17077, "epoch": 143, "lr": 8.710580532623171e-05} +{"train_loss": 0.00630700308829546, "global_step": 17078, "epoch": 143, "lr": 8.710432029717276e-05} +{"train_loss": 0.007946065627038479, "global_step": 17079, "epoch": 143, "lr": 8.710283519526345e-05} +{"train_loss": 0.006855362560600042, "global_step": 17080, "epoch": 143, "lr": 8.710135002050667e-05} +{"train_loss": 0.0061761788092553616, "global_step": 17081, "epoch": 143, "lr": 8.709986477290534e-05} +{"train_loss": 0.005815635900944471, "global_step": 17082, "epoch": 143, "lr": 8.709837945246242e-05} +{"train_loss": 0.005428805015981197, "global_step": 17083, "epoch": 143, "lr": 8.709689405918078e-05} +{"train_loss": 0.006009121425449848, "global_step": 17084, "epoch": 143, "lr": 8.709540859306336e-05} +{"train_loss": 0.006042851135134697, "global_step": 17085, "epoch": 143, "lr": 8.709392305411306e-05} +{"train_loss": 0.003712128382176161, "global_step": 17086, "epoch": 143, "lr": 8.709243744233282e-05} +{"train_loss": 0.006689064670354128, "global_step": 17087, "epoch": 143, "lr": 8.709095175772552e-05} +{"train_loss": 0.009546501561999321, "global_step": 17088, "epoch": 143, "lr": 8.70894660002941e-05} +{"train_loss": 0.0054300990886986256, "global_step": 17089, "epoch": 143, "lr": 8.70879801700415e-05} +{"train_loss": 0.007762011606246233, "global_step": 17090, "epoch": 143, "lr": 8.70864942669706e-05} +{"train_loss": 0.006351762916892767, "global_step": 17091, "epoch": 143, "lr": 8.708500829108433e-05} +{"train_loss": 0.004537515342235565, "global_step": 17092, "epoch": 143, "lr": 8.70835222423856e-05} +{"train_loss": 0.011628394015133381, "global_step": 17093, "epoch": 143, "lr": 8.708203612087736e-05} +{"train_loss": 0.006532709579914808, "global_step": 17094, "epoch": 143, "lr": 8.708054992656247e-05} +{"train_loss": 0.004805985372513533, "global_step": 17095, "epoch": 143, "lr": 8.707906365944391e-05} +{"train_loss": 0.007604626938700676, "global_step": 17096, "epoch": 143, "lr": 8.707757731952455e-05} +{"train_loss": 0.007840326055884361, "global_step": 17097, "epoch": 143, "lr": 8.707609090680734e-05} +{"train_loss": 0.008361877873539925, "global_step": 17098, "epoch": 143, "lr": 8.707460442129519e-05} +{"train_loss": 0.006742749363183975, "global_step": 17099, "epoch": 143, "lr": 8.7073117862991e-05} +{"train_loss": 0.006028089206665754, "global_step": 17100, "epoch": 143, "lr": 8.70716312318977e-05} +{"train_loss": 0.006911950651556253, "global_step": 17101, "epoch": 143, "lr": 8.707014452801822e-05} +{"train_loss": 0.004505263175815344, "global_step": 17102, "epoch": 143, "lr": 8.706865775135548e-05} +{"train_loss": 0.005170134827494621, "global_step": 17103, "epoch": 143, "lr": 8.706717090191238e-05} +{"train_loss": 0.010288767516613007, "global_step": 17104, "epoch": 143, "lr": 8.706568397969188e-05} +{"train_loss": 0.005967448931187391, "global_step": 17105, "epoch": 143, "lr": 8.706419698469683e-05} +{"train_loss": 0.0062378766015172005, "global_step": 17106, "epoch": 143, "lr": 8.706270991693021e-05} +{"train_loss": 0.006248741410672665, "global_step": 17107, "epoch": 143, "lr": 8.706122277639492e-05} +{"train_loss": 0.004727902356535196, "global_step": 17108, "epoch": 143, "lr": 8.705973556309387e-05} +{"train_loss": 0.006177947856485844, "global_step": 17109, "epoch": 143, "lr": 8.705824827702999e-05} +{"train_loss": 0.004889644682407379, "global_step": 17110, "epoch": 143, "lr": 8.70567609182062e-05} +{"train_loss": 0.005786608438938856, "global_step": 17111, "epoch": 143, "lr": 8.705527348662541e-05} +{"train_loss": 0.005999951623380184, "global_step": 17112, "epoch": 143, "lr": 8.705378598229057e-05} +{"train_loss": 0.0053933775052428246, "global_step": 17113, "epoch": 143, "lr": 8.705229840520455e-05} +{"train_loss": 0.007786639500409365, "global_step": 17114, "epoch": 143, "lr": 8.705081075537033e-05} +{"train_loss": 0.005465735215693712, "global_step": 17115, "epoch": 143, "lr": 8.704932303279078e-05} +{"train_loss": 0.004164081998169422, "global_step": 17116, "epoch": 143, "lr": 8.704783523746885e-05} +{"train_loss": 0.006569602061063051, "global_step": 17117, "epoch": 143, "lr": 8.704634736940747e-05} +{"train_loss": 0.006788942962884903, "global_step": 17118, "epoch": 143, "lr": 8.704485942860951e-05} +{"train_loss": 0.007038779556751251, "global_step": 17119, "epoch": 143, "lr": 8.704337141507796e-05} +{"train_loss": 0.0067335679195821285, "global_step": 17120, "epoch": 143, "lr": 8.704188332881569e-05} +{"train_loss": 0.0042745331302285194, "global_step": 17121, "epoch": 143, "lr": 8.704039516982565e-05} +{"train_loss": 0.004814266227185726, "global_step": 17122, "epoch": 143, "lr": 8.703890693811074e-05} +{"train_loss": 0.006248076446354389, "global_step": 17123, "epoch": 143, "lr": 8.70374186336739e-05} +{"train_loss": 0.006247138604521751, "global_step": 17124, "epoch": 143, "lr": 8.703593025651804e-05} +{"train_loss": 0.004074131138622761, "global_step": 17125, "epoch": 143, "lr": 8.703444180664608e-05} +{"train_loss": 0.005003966391086578, "global_step": 17126, "epoch": 143, "lr": 8.703295328406097e-05} +{"train_loss": 0.005515181925147772, "global_step": 17127, "epoch": 143, "lr": 8.703146468876559e-05} +{"train_loss": 0.006659675855189562, "global_step": 17128, "epoch": 143, "lr": 8.70299760207629e-05} +{"train_loss": 0.004410327412188053, "global_step": 17129, "epoch": 143, "lr": 8.702848728005582e-05} +{"train_loss": 0.004774474538862705, "global_step": 17130, "epoch": 143, "lr": 8.702699846664724e-05} +{"train_loss": 0.005083155818283558, "global_step": 17131, "epoch": 143, "lr": 8.702550958054012e-05} +{"train_loss": 0.005693088285624981, "global_step": 17132, "epoch": 143, "lr": 8.702402062173736e-05} +{"train_loss": 0.007191619835793972, "global_step": 17133, "epoch": 143, "lr": 8.70225315902419e-05} +{"train_loss": 0.0037434445694088936, "global_step": 17134, "epoch": 143, "lr": 8.702104248605663e-05} +{"train_loss": 0.006392675516500818, "global_step": 17135, "epoch": 143, "lr": 8.701955330918452e-05, "val_loss": 0.015177050605416298} +{"train_loss": 0.007675594184547663, "global_step": 17136, "epoch": 144, "lr": 8.701806405962846e-05} +{"train_loss": 0.005047472193837166, "global_step": 17137, "epoch": 144, "lr": 8.70165747373914e-05} +{"train_loss": 0.007278551813215017, "global_step": 17138, "epoch": 144, "lr": 8.701508534247623e-05} +{"train_loss": 0.00891517661511898, "global_step": 17139, "epoch": 144, "lr": 8.701359587488591e-05} +{"train_loss": 0.005748796742409468, "global_step": 17140, "epoch": 144, "lr": 8.701210633462334e-05} +{"train_loss": 0.004272878170013428, "global_step": 17141, "epoch": 144, "lr": 8.701061672169147e-05} +{"train_loss": 0.007368170190602541, "global_step": 17142, "epoch": 144, "lr": 8.700912703609319e-05} +{"train_loss": 0.005041295196861029, "global_step": 17143, "epoch": 144, "lr": 8.700763727783145e-05} +{"train_loss": 0.006113918498158455, "global_step": 17144, "epoch": 144, "lr": 8.700614744690916e-05} +{"train_loss": 0.004498207475990057, "global_step": 17145, "epoch": 144, "lr": 8.700465754332927e-05} +{"train_loss": 0.008039169013500214, "global_step": 17146, "epoch": 144, "lr": 8.700316756709467e-05} +{"train_loss": 0.006160517688840628, "global_step": 17147, "epoch": 144, "lr": 8.700167751820831e-05} +{"train_loss": 0.006132281851023436, "global_step": 17148, "epoch": 144, "lr": 8.700018739667312e-05} +{"train_loss": 0.006527938414365053, "global_step": 17149, "epoch": 144, "lr": 8.699869720249201e-05} +{"train_loss": 0.009206867776811123, "global_step": 17150, "epoch": 144, "lr": 8.69972069356679e-05} +{"train_loss": 0.005319313611835241, "global_step": 17151, "epoch": 144, "lr": 8.699571659620374e-05} +{"train_loss": 0.004586033523082733, "global_step": 17152, "epoch": 144, "lr": 8.699422618410243e-05} +{"train_loss": 0.00817151553928852, "global_step": 17153, "epoch": 144, "lr": 8.699273569936692e-05} +{"train_loss": 0.005858346354216337, "global_step": 17154, "epoch": 144, "lr": 8.69912451420001e-05} +{"train_loss": 0.006291843019425869, "global_step": 17155, "epoch": 144, "lr": 8.698975451200495e-05} +{"train_loss": 0.007361655123531818, "global_step": 17156, "epoch": 144, "lr": 8.698826380938436e-05} +{"train_loss": 0.007474910467863083, "global_step": 17157, "epoch": 144, "lr": 8.698677303414127e-05} +{"train_loss": 0.004364796914160252, "global_step": 17158, "epoch": 144, "lr": 8.698528218627861e-05} +{"train_loss": 0.007467928342521191, "global_step": 17159, "epoch": 144, "lr": 8.698379126579929e-05} +{"train_loss": 0.003202403662726283, "global_step": 17160, "epoch": 144, "lr": 8.698230027270624e-05} +{"train_loss": 0.004027157556265593, "global_step": 17161, "epoch": 144, "lr": 8.69808092070024e-05} +{"train_loss": 0.01081227045506239, "global_step": 17162, "epoch": 144, "lr": 8.69793180686907e-05} +{"train_loss": 0.006599420215934515, "global_step": 17163, "epoch": 144, "lr": 8.697782685777405e-05} +{"train_loss": 0.00514642521739006, "global_step": 17164, "epoch": 144, "lr": 8.69763355742554e-05} +{"train_loss": 0.005047857761383057, "global_step": 17165, "epoch": 144, "lr": 8.697484421813764e-05} +{"train_loss": 0.004420817829668522, "global_step": 17166, "epoch": 144, "lr": 8.697335278942374e-05} +{"train_loss": 0.006333629135042429, "global_step": 17167, "epoch": 144, "lr": 8.697186128811662e-05} +{"train_loss": 0.0033517591655254364, "global_step": 17168, "epoch": 144, "lr": 8.697036971421919e-05} +{"train_loss": 0.00917559303343296, "global_step": 17169, "epoch": 144, "lr": 8.696887806773439e-05} +{"train_loss": 0.007858174853026867, "global_step": 17170, "epoch": 144, "lr": 8.696738634866515e-05} +{"train_loss": 0.005229451693594456, "global_step": 17171, "epoch": 144, "lr": 8.696589455701439e-05} +{"train_loss": 0.008073942735791206, "global_step": 17172, "epoch": 144, "lr": 8.696440269278506e-05} +{"train_loss": 0.006504237186163664, "global_step": 17173, "epoch": 144, "lr": 8.696291075598006e-05} +{"train_loss": 0.006552720908075571, "global_step": 17174, "epoch": 144, "lr": 8.696141874660233e-05} +{"train_loss": 0.005473533179610968, "global_step": 17175, "epoch": 144, "lr": 8.69599266646548e-05} +{"train_loss": 0.005618206225335598, "global_step": 17176, "epoch": 144, "lr": 8.695843451014042e-05} +{"train_loss": 0.006147583946585655, "global_step": 17177, "epoch": 144, "lr": 8.695694228306211e-05} +{"train_loss": 0.006187931168824434, "global_step": 17178, "epoch": 144, "lr": 8.695544998342277e-05} +{"train_loss": 0.0047244783490896225, "global_step": 17179, "epoch": 144, "lr": 8.695395761122536e-05} +{"train_loss": 0.004479043185710907, "global_step": 17180, "epoch": 144, "lr": 8.69524651664728e-05} +{"train_loss": 0.00807362049818039, "global_step": 17181, "epoch": 144, "lr": 8.695097264916802e-05} +{"train_loss": 0.004279333166778088, "global_step": 17182, "epoch": 144, "lr": 8.694948005931395e-05} +{"train_loss": 0.006260125897824764, "global_step": 17183, "epoch": 144, "lr": 8.694798739691353e-05} +{"train_loss": 0.004308918956667185, "global_step": 17184, "epoch": 144, "lr": 8.694649466196969e-05} +{"train_loss": 0.005821454804390669, "global_step": 17185, "epoch": 144, "lr": 8.694500185448536e-05} +{"train_loss": 0.008448604494333267, "global_step": 17186, "epoch": 144, "lr": 8.694350897446344e-05} +{"train_loss": 0.007346720900386572, "global_step": 17187, "epoch": 144, "lr": 8.69420160219069e-05} +{"train_loss": 0.004585078917443752, "global_step": 17188, "epoch": 144, "lr": 8.694052299681867e-05} +{"train_loss": 0.00757829612120986, "global_step": 17189, "epoch": 144, "lr": 8.693902989920165e-05} +{"train_loss": 0.007782357279211283, "global_step": 17190, "epoch": 144, "lr": 8.69375367290588e-05} +{"train_loss": 0.006225371267646551, "global_step": 17191, "epoch": 144, "lr": 8.693604348639304e-05} +{"train_loss": 0.007458331063389778, "global_step": 17192, "epoch": 144, "lr": 8.693455017120732e-05} +{"train_loss": 0.00538861658424139, "global_step": 17193, "epoch": 144, "lr": 8.693305678350454e-05} +{"train_loss": 0.005270852707326412, "global_step": 17194, "epoch": 144, "lr": 8.693156332328766e-05} +{"train_loss": 0.005230285692960024, "global_step": 17195, "epoch": 144, "lr": 8.69300697905596e-05} +{"train_loss": 0.004677271470427513, "global_step": 17196, "epoch": 144, "lr": 8.692857618532328e-05} +{"train_loss": 0.004870013799518347, "global_step": 17197, "epoch": 144, "lr": 8.692708250758165e-05} +{"train_loss": 0.005063861608505249, "global_step": 17198, "epoch": 144, "lr": 8.692558875733764e-05} +{"train_loss": 0.006242045667022467, "global_step": 17199, "epoch": 144, "lr": 8.692409493459419e-05} +{"train_loss": 0.0072309053502976894, "global_step": 17200, "epoch": 144, "lr": 8.692260103935421e-05} +{"train_loss": 0.005268294829875231, "global_step": 17201, "epoch": 144, "lr": 8.692110707162067e-05} +{"train_loss": 0.00386147852987051, "global_step": 17202, "epoch": 144, "lr": 8.691961303139646e-05} +{"train_loss": 0.005771378520876169, "global_step": 17203, "epoch": 144, "lr": 8.691811891868453e-05} +{"train_loss": 0.003106339368969202, "global_step": 17204, "epoch": 144, "lr": 8.691662473348783e-05} +{"train_loss": 0.007136585656553507, "global_step": 17205, "epoch": 144, "lr": 8.691513047580928e-05} +{"train_loss": 0.004666982218623161, "global_step": 17206, "epoch": 144, "lr": 8.691363614565182e-05} +{"train_loss": 0.00517111923545599, "global_step": 17207, "epoch": 144, "lr": 8.691214174301838e-05} +{"train_loss": 0.005080884322524071, "global_step": 17208, "epoch": 144, "lr": 8.691064726791187e-05} +{"train_loss": 0.004386540502309799, "global_step": 17209, "epoch": 144, "lr": 8.690915272033527e-05} +{"train_loss": 0.0044447146356105804, "global_step": 17210, "epoch": 144, "lr": 8.690765810029149e-05} +{"train_loss": 0.0044251540675759315, "global_step": 17211, "epoch": 144, "lr": 8.690616340778346e-05} +{"train_loss": 0.006111410446465015, "global_step": 17212, "epoch": 144, "lr": 8.690466864281412e-05} +{"train_loss": 0.007108510937541723, "global_step": 17213, "epoch": 144, "lr": 8.690317380538642e-05} +{"train_loss": 0.005440251901745796, "global_step": 17214, "epoch": 144, "lr": 8.690167889550326e-05} +{"train_loss": 0.007746169809252024, "global_step": 17215, "epoch": 144, "lr": 8.690018391316761e-05} +{"train_loss": 0.007344063371419907, "global_step": 17216, "epoch": 144, "lr": 8.689868885838238e-05} +{"train_loss": 0.005438238848000765, "global_step": 17217, "epoch": 144, "lr": 8.689719373115053e-05} +{"train_loss": 0.007159899920225143, "global_step": 17218, "epoch": 144, "lr": 8.689569853147497e-05} +{"train_loss": 0.0041622379794716835, "global_step": 17219, "epoch": 144, "lr": 8.689420325935866e-05} +{"train_loss": 0.007478705607354641, "global_step": 17220, "epoch": 144, "lr": 8.689270791480452e-05} +{"train_loss": 0.005348352715373039, "global_step": 17221, "epoch": 144, "lr": 8.689121249781548e-05} +{"train_loss": 0.006697693839669228, "global_step": 17222, "epoch": 144, "lr": 8.688971700839447e-05} +{"train_loss": 0.005781346466392279, "global_step": 17223, "epoch": 144, "lr": 8.688822144654448e-05} +{"train_loss": 0.005117031279951334, "global_step": 17224, "epoch": 144, "lr": 8.68867258122684e-05} +{"train_loss": 0.00473020039498806, "global_step": 17225, "epoch": 144, "lr": 8.688523010556915e-05} +{"train_loss": 0.003906670957803726, "global_step": 17226, "epoch": 144, "lr": 8.688373432644972e-05} +{"train_loss": 0.003993640653789043, "global_step": 17227, "epoch": 144, "lr": 8.688223847491301e-05} +{"train_loss": 0.006717833224684, "global_step": 17228, "epoch": 144, "lr": 8.688074255096194e-05} +{"train_loss": 0.004442237783223391, "global_step": 17229, "epoch": 144, "lr": 8.68792465545995e-05} +{"train_loss": 0.0053334543481469154, "global_step": 17230, "epoch": 144, "lr": 8.68777504858286e-05} +{"train_loss": 0.008190976455807686, "global_step": 17231, "epoch": 144, "lr": 8.687625434465216e-05} +{"train_loss": 0.0055864956229925156, "global_step": 17232, "epoch": 144, "lr": 8.687475813107315e-05} +{"train_loss": 0.00479933014139533, "global_step": 17233, "epoch": 144, "lr": 8.687326184509448e-05} +{"train_loss": 0.0035011472646147013, "global_step": 17234, "epoch": 144, "lr": 8.68717654867191e-05} +{"train_loss": 0.005783811677247286, "global_step": 17235, "epoch": 144, "lr": 8.687026905594995e-05} +{"train_loss": 0.0043580192141234875, "global_step": 17236, "epoch": 144, "lr": 8.686877255278998e-05} +{"train_loss": 0.007067447993904352, "global_step": 17237, "epoch": 144, "lr": 8.68672759772421e-05} +{"train_loss": 0.005630095023661852, "global_step": 17238, "epoch": 144, "lr": 8.686577932930926e-05} +{"train_loss": 0.0069462331011891365, "global_step": 17239, "epoch": 144, "lr": 8.68642826089944e-05} +{"train_loss": 0.004158315248787403, "global_step": 17240, "epoch": 144, "lr": 8.686278581630047e-05} +{"train_loss": 0.006784819532185793, "global_step": 17241, "epoch": 144, "lr": 8.686128895123038e-05} +{"train_loss": 0.006133561953902245, "global_step": 17242, "epoch": 144, "lr": 8.685979201378712e-05} +{"train_loss": 0.004847997333854437, "global_step": 17243, "epoch": 144, "lr": 8.685829500397356e-05} +{"train_loss": 0.004781050607562065, "global_step": 17244, "epoch": 144, "lr": 8.685679792179268e-05} +{"train_loss": 0.0035773981362581253, "global_step": 17245, "epoch": 144, "lr": 8.685530076724743e-05} +{"train_loss": 0.006362814921885729, "global_step": 17246, "epoch": 144, "lr": 8.685380354034074e-05} +{"train_loss": 0.00598822021856904, "global_step": 17247, "epoch": 144, "lr": 8.685230624107554e-05} +{"train_loss": 0.004907327238470316, "global_step": 17248, "epoch": 144, "lr": 8.685080886945476e-05} +{"train_loss": 0.005273524206131697, "global_step": 17249, "epoch": 144, "lr": 8.684931142548136e-05} +{"train_loss": 0.007600463926792145, "global_step": 17250, "epoch": 144, "lr": 8.684781390915828e-05} +{"train_loss": 0.0067975460551679134, "global_step": 17251, "epoch": 144, "lr": 8.684631632048845e-05} +{"train_loss": 0.003997775260359049, "global_step": 17252, "epoch": 144, "lr": 8.684481865947482e-05} +{"train_loss": 0.006115301512181759, "global_step": 17253, "epoch": 144, "lr": 8.684332092612031e-05} +{"train_loss": 0.005883750075302204, "global_step": 17254, "epoch": 144, "lr": 8.684182312042789e-05, "val_loss": 0.017622143030166626} +{"train_loss": 0.006704248953610659, "global_step": 17255, "epoch": 145, "lr": 8.684032524240048e-05} +{"train_loss": 0.006151827517896891, "global_step": 17256, "epoch": 145, "lr": 8.683882729204102e-05} +{"train_loss": 0.006684241816401482, "global_step": 17257, "epoch": 145, "lr": 8.683732926935246e-05} +{"train_loss": 0.0053757065907120705, "global_step": 17258, "epoch": 145, "lr": 8.683583117433776e-05} +{"train_loss": 0.006690404377877712, "global_step": 17259, "epoch": 145, "lr": 8.683433300699983e-05} +{"train_loss": 0.005996920634061098, "global_step": 17260, "epoch": 145, "lr": 8.683283476734161e-05} +{"train_loss": 0.00912598054856062, "global_step": 17261, "epoch": 145, "lr": 8.683133645536607e-05} +{"train_loss": 0.00537765072658658, "global_step": 17262, "epoch": 145, "lr": 8.682983807107612e-05} +{"train_loss": 0.004640510771423578, "global_step": 17263, "epoch": 145, "lr": 8.682833961447473e-05} +{"train_loss": 0.006638564635068178, "global_step": 17264, "epoch": 145, "lr": 8.682684108556483e-05} +{"train_loss": 0.0060758874751627445, "global_step": 17265, "epoch": 145, "lr": 8.682534248434935e-05} +{"train_loss": 0.008546296507120132, "global_step": 17266, "epoch": 145, "lr": 8.682384381083124e-05} +{"train_loss": 0.0037250318564474583, "global_step": 17267, "epoch": 145, "lr": 8.682234506501347e-05} +{"train_loss": 0.004526217933744192, "global_step": 17268, "epoch": 145, "lr": 8.682084624689894e-05} +{"train_loss": 0.004343951120972633, "global_step": 17269, "epoch": 145, "lr": 8.681934735649063e-05} +{"train_loss": 0.007111624348908663, "global_step": 17270, "epoch": 145, "lr": 8.681784839379145e-05} +{"train_loss": 0.006791309919208288, "global_step": 17271, "epoch": 145, "lr": 8.681634935880435e-05} +{"train_loss": 0.008597144857048988, "global_step": 17272, "epoch": 145, "lr": 8.68148502515323e-05} +{"train_loss": 0.007084920071065426, "global_step": 17273, "epoch": 145, "lr": 8.681335107197823e-05} +{"train_loss": 0.005075171589851379, "global_step": 17274, "epoch": 145, "lr": 8.681185182014507e-05} +{"train_loss": 0.007208521012216806, "global_step": 17275, "epoch": 145, "lr": 8.681035249603577e-05} +{"train_loss": 0.008153766393661499, "global_step": 17276, "epoch": 145, "lr": 8.680885309965327e-05} +{"train_loss": 0.007336054462939501, "global_step": 17277, "epoch": 145, "lr": 8.680735363100052e-05} +{"train_loss": 0.005330005660653114, "global_step": 17278, "epoch": 145, "lr": 8.680585409008047e-05} +{"train_loss": 0.00757326977327466, "global_step": 17279, "epoch": 145, "lr": 8.680435447689606e-05} +{"train_loss": 0.006481032352894545, "global_step": 17280, "epoch": 145, "lr": 8.680285479145023e-05} +{"train_loss": 0.0062205856665968895, "global_step": 17281, "epoch": 145, "lr": 8.680135503374592e-05} +{"train_loss": 0.006287594325840473, "global_step": 17282, "epoch": 145, "lr": 8.679985520378609e-05} +{"train_loss": 0.005625614896416664, "global_step": 17283, "epoch": 145, "lr": 8.679835530157366e-05} +{"train_loss": 0.007855962961912155, "global_step": 17284, "epoch": 145, "lr": 8.67968553271116e-05} +{"train_loss": 0.00451201107352972, "global_step": 17285, "epoch": 145, "lr": 8.679535528040286e-05} +{"train_loss": 0.0077300406992435455, "global_step": 17286, "epoch": 145, "lr": 8.679385516145035e-05} +{"train_loss": 0.006876374129205942, "global_step": 17287, "epoch": 145, "lr": 8.679235497025704e-05} +{"train_loss": 0.005900013260543346, "global_step": 17288, "epoch": 145, "lr": 8.679085470682588e-05} +{"train_loss": 0.0056818826124072075, "global_step": 17289, "epoch": 145, "lr": 8.67893543711598e-05} +{"train_loss": 0.007157828658819199, "global_step": 17290, "epoch": 145, "lr": 8.678785396326174e-05} +{"train_loss": 0.007402692921459675, "global_step": 17291, "epoch": 145, "lr": 8.678635348313468e-05} +{"train_loss": 0.003764065681025386, "global_step": 17292, "epoch": 145, "lr": 8.678485293078155e-05} +{"train_loss": 0.010050710290670395, "global_step": 17293, "epoch": 145, "lr": 8.678335230620529e-05} +{"train_loss": 0.006931291427463293, "global_step": 17294, "epoch": 145, "lr": 8.678185160940883e-05} +{"train_loss": 0.00927580613642931, "global_step": 17295, "epoch": 145, "lr": 8.678035084039513e-05} +{"train_loss": 0.007813227362930775, "global_step": 17296, "epoch": 145, "lr": 8.677884999916716e-05} +{"train_loss": 0.005901035852730274, "global_step": 17297, "epoch": 145, "lr": 8.677734908572783e-05} +{"train_loss": 0.006146955769509077, "global_step": 17298, "epoch": 145, "lr": 8.677584810008012e-05} +{"train_loss": 0.006813654210418463, "global_step": 17299, "epoch": 145, "lr": 8.677434704222695e-05} +{"train_loss": 0.006561717949807644, "global_step": 17300, "epoch": 145, "lr": 8.67728459121713e-05} +{"train_loss": 0.0047533512115478516, "global_step": 17301, "epoch": 145, "lr": 8.677134470991607e-05} +{"train_loss": 0.0053815944120287895, "global_step": 17302, "epoch": 145, "lr": 8.676984343546425e-05} +{"train_loss": 0.006619506049901247, "global_step": 17303, "epoch": 145, "lr": 8.676834208881877e-05} +{"train_loss": 0.006941409315913916, "global_step": 17304, "epoch": 145, "lr": 8.676684066998255e-05} +{"train_loss": 0.00525679113343358, "global_step": 17305, "epoch": 145, "lr": 8.676533917895859e-05} +{"train_loss": 0.00936419703066349, "global_step": 17306, "epoch": 145, "lr": 8.676383761574983e-05} +{"train_loss": 0.006950377486646175, "global_step": 17307, "epoch": 145, "lr": 8.676233598035917e-05} +{"train_loss": 0.005959013942629099, "global_step": 17308, "epoch": 145, "lr": 8.676083427278961e-05} +{"train_loss": 0.008035309612751007, "global_step": 17309, "epoch": 145, "lr": 8.675933249304407e-05} +{"train_loss": 0.00507002230733633, "global_step": 17310, "epoch": 145, "lr": 8.675783064112551e-05} +{"train_loss": 0.005539323668926954, "global_step": 17311, "epoch": 145, "lr": 8.675632871703689e-05} +{"train_loss": 0.00378032517619431, "global_step": 17312, "epoch": 145, "lr": 8.675482672078112e-05} +{"train_loss": 0.006534726824611425, "global_step": 17313, "epoch": 145, "lr": 8.675332465236119e-05} +{"train_loss": 0.004912523552775383, "global_step": 17314, "epoch": 145, "lr": 8.675182251178005e-05} +{"train_loss": 0.002912097377702594, "global_step": 17315, "epoch": 145, "lr": 8.67503202990406e-05} +{"train_loss": 0.0059061008505523205, "global_step": 17316, "epoch": 145, "lr": 8.674881801414584e-05} +{"train_loss": 0.009418402798473835, "global_step": 17317, "epoch": 145, "lr": 8.67473156570987e-05} +{"train_loss": 0.007065318524837494, "global_step": 17318, "epoch": 145, "lr": 8.674581322790214e-05} +{"train_loss": 0.005158080719411373, "global_step": 17319, "epoch": 145, "lr": 8.674431072655909e-05} +{"train_loss": 0.007493744138628244, "global_step": 17320, "epoch": 145, "lr": 8.67428081530725e-05} +{"train_loss": 0.006232407875359058, "global_step": 17321, "epoch": 145, "lr": 8.674130550744535e-05} +{"train_loss": 0.005597210023552179, "global_step": 17322, "epoch": 145, "lr": 8.673980278968057e-05} +{"train_loss": 0.005176699720323086, "global_step": 17323, "epoch": 145, "lr": 8.673829999978112e-05} +{"train_loss": 0.00647353520616889, "global_step": 17324, "epoch": 145, "lr": 8.673679713774991e-05} +{"train_loss": 0.003522897604852915, "global_step": 17325, "epoch": 145, "lr": 8.673529420358996e-05} +{"train_loss": 0.005201292224228382, "global_step": 17326, "epoch": 145, "lr": 8.673379119730416e-05} +{"train_loss": 0.006174627225846052, "global_step": 17327, "epoch": 145, "lr": 8.67322881188955e-05} +{"train_loss": 0.009241670370101929, "global_step": 17328, "epoch": 145, "lr": 8.673078496836692e-05} +{"train_loss": 0.006048427429050207, "global_step": 17329, "epoch": 145, "lr": 8.672928174572136e-05} +{"train_loss": 0.008211548440158367, "global_step": 17330, "epoch": 145, "lr": 8.672777845096178e-05} +{"train_loss": 0.004288994707167149, "global_step": 17331, "epoch": 145, "lr": 8.672627508409112e-05} +{"train_loss": 0.008032327517867088, "global_step": 17332, "epoch": 145, "lr": 8.672477164511236e-05} +{"train_loss": 0.005409449804574251, "global_step": 17333, "epoch": 145, "lr": 8.672326813402842e-05} +{"train_loss": 0.008813496679067612, "global_step": 17334, "epoch": 145, "lr": 8.672176455084227e-05} +{"train_loss": 0.007069223560392857, "global_step": 17335, "epoch": 145, "lr": 8.672026089555688e-05} +{"train_loss": 0.006425925064831972, "global_step": 17336, "epoch": 145, "lr": 8.671875716817514e-05} +{"train_loss": 0.0052101630717515945, "global_step": 17337, "epoch": 145, "lr": 8.671725336870007e-05} +{"train_loss": 0.0072282892651855946, "global_step": 17338, "epoch": 145, "lr": 8.671574949713459e-05} +{"train_loss": 0.004857139196246862, "global_step": 17339, "epoch": 145, "lr": 8.671424555348167e-05} +{"train_loss": 0.004465095233172178, "global_step": 17340, "epoch": 145, "lr": 8.671274153774425e-05} +{"train_loss": 0.006177445407956839, "global_step": 17341, "epoch": 145, "lr": 8.671123744992526e-05} +{"train_loss": 0.0070754894986748695, "global_step": 17342, "epoch": 145, "lr": 8.67097332900277e-05} +{"train_loss": 0.007141806650906801, "global_step": 17343, "epoch": 145, "lr": 8.670822905805449e-05} +{"train_loss": 0.006100660189986229, "global_step": 17344, "epoch": 145, "lr": 8.670672475400859e-05} +{"train_loss": 0.006867202930152416, "global_step": 17345, "epoch": 145, "lr": 8.670522037789297e-05} +{"train_loss": 0.004835581406950951, "global_step": 17346, "epoch": 145, "lr": 8.670371592971056e-05} +{"train_loss": 0.003986714873462915, "global_step": 17347, "epoch": 145, "lr": 8.670221140946433e-05} +{"train_loss": 0.007811857853084803, "global_step": 17348, "epoch": 145, "lr": 8.670070681715723e-05} +{"train_loss": 0.0059781973250210285, "global_step": 17349, "epoch": 145, "lr": 8.669920215279222e-05} +{"train_loss": 0.009637772105634212, "global_step": 17350, "epoch": 145, "lr": 8.669769741637224e-05} +{"train_loss": 0.0052748797461390495, "global_step": 17351, "epoch": 145, "lr": 8.669619260790025e-05} +{"train_loss": 0.007485339883714914, "global_step": 17352, "epoch": 145, "lr": 8.66946877273792e-05} +{"train_loss": 0.005858482792973518, "global_step": 17353, "epoch": 145, "lr": 8.669318277481207e-05} +{"train_loss": 0.005675592925399542, "global_step": 17354, "epoch": 145, "lr": 8.669167775020177e-05} +{"train_loss": 0.007136673200875521, "global_step": 17355, "epoch": 145, "lr": 8.66901726535513e-05} +{"train_loss": 0.00705931568518281, "global_step": 17356, "epoch": 145, "lr": 8.66886674848636e-05} +{"train_loss": 0.006980425212532282, "global_step": 17357, "epoch": 145, "lr": 8.668716224414159e-05} +{"train_loss": 0.004404967650771141, "global_step": 17358, "epoch": 145, "lr": 8.668565693138829e-05} +{"train_loss": 0.00588808162137866, "global_step": 17359, "epoch": 145, "lr": 8.66841515466066e-05} +{"train_loss": 0.0034219431690871716, "global_step": 17360, "epoch": 145, "lr": 8.668264608979952e-05} +{"train_loss": 0.007028230465948582, "global_step": 17361, "epoch": 145, "lr": 8.668114056096996e-05} +{"train_loss": 0.00541266892105341, "global_step": 17362, "epoch": 145, "lr": 8.667963496012093e-05} +{"train_loss": 0.003497351659461856, "global_step": 17363, "epoch": 145, "lr": 8.667812928725531e-05} +{"train_loss": 0.007767816074192524, "global_step": 17364, "epoch": 145, "lr": 8.667662354237613e-05} +{"train_loss": 0.005481368396431208, "global_step": 17365, "epoch": 145, "lr": 8.667511772548633e-05} +{"train_loss": 0.0067176721058785915, "global_step": 17366, "epoch": 145, "lr": 8.667361183658884e-05} +{"train_loss": 0.005460591986775398, "global_step": 17367, "epoch": 145, "lr": 8.667210587568662e-05} +{"train_loss": 0.005059417337179184, "global_step": 17368, "epoch": 145, "lr": 8.667059984278264e-05} +{"train_loss": 0.0055253347381949425, "global_step": 17369, "epoch": 145, "lr": 8.666909373787988e-05} +{"train_loss": 0.005683309398591518, "global_step": 17370, "epoch": 145, "lr": 8.666758756098126e-05} +{"train_loss": 0.004031339194625616, "global_step": 17371, "epoch": 145, "lr": 8.666608131208974e-05} +{"train_loss": 0.005982784554362297, "global_step": 17372, "epoch": 145, "lr": 8.666457499120829e-05} +{"train_loss": 0.006283426262093943, "global_step": 17373, "epoch": 145, "lr": 8.666306859833985e-05, "val_loss": 0.012594563886523247, "train_action_mse_error": 0.00015895406249910593} +{"train_loss": 0.003168563824146986, "global_step": 17374, "epoch": 146, "lr": 8.666156213348743e-05} +{"train_loss": 0.005169219803065062, "global_step": 17375, "epoch": 146, "lr": 8.666005559665392e-05} +{"train_loss": 0.005160295404493809, "global_step": 17376, "epoch": 146, "lr": 8.665854898784231e-05} +{"train_loss": 0.007126248441636562, "global_step": 17377, "epoch": 146, "lr": 8.665704230705557e-05} +{"train_loss": 0.005226651672273874, "global_step": 17378, "epoch": 146, "lr": 8.665553555429663e-05} +{"train_loss": 0.004863449838012457, "global_step": 17379, "epoch": 146, "lr": 8.665402872956846e-05} +{"train_loss": 0.00571117689833045, "global_step": 17380, "epoch": 146, "lr": 8.665252183287403e-05} +{"train_loss": 0.00551840802654624, "global_step": 17381, "epoch": 146, "lr": 8.665101486421628e-05} +{"train_loss": 0.00709870271384716, "global_step": 17382, "epoch": 146, "lr": 8.664950782359819e-05} +{"train_loss": 0.003696972504258156, "global_step": 17383, "epoch": 146, "lr": 8.66480007110227e-05} +{"train_loss": 0.005423915106803179, "global_step": 17384, "epoch": 146, "lr": 8.664649352649277e-05} +{"train_loss": 0.00343959778547287, "global_step": 17385, "epoch": 146, "lr": 8.664498627001136e-05} +{"train_loss": 0.004474700894206762, "global_step": 17386, "epoch": 146, "lr": 8.664347894158145e-05} +{"train_loss": 0.005542391445487738, "global_step": 17387, "epoch": 146, "lr": 8.664197154120598e-05} +{"train_loss": 0.004406480118632317, "global_step": 17388, "epoch": 146, "lr": 8.66404640688879e-05} +{"train_loss": 0.005901836324483156, "global_step": 17389, "epoch": 146, "lr": 8.66389565246302e-05} +{"train_loss": 0.0034573639277368784, "global_step": 17390, "epoch": 146, "lr": 8.663744890843583e-05} +{"train_loss": 0.007185962051153183, "global_step": 17391, "epoch": 146, "lr": 8.663594122030773e-05} +{"train_loss": 0.005965446121990681, "global_step": 17392, "epoch": 146, "lr": 8.663443346024888e-05} +{"train_loss": 0.00421320041641593, "global_step": 17393, "epoch": 146, "lr": 8.663292562826222e-05} +{"train_loss": 0.003271478693932295, "global_step": 17394, "epoch": 146, "lr": 8.663141772435073e-05} +{"train_loss": 0.004330198280513287, "global_step": 17395, "epoch": 146, "lr": 8.662990974851736e-05} +{"train_loss": 0.006178490351885557, "global_step": 17396, "epoch": 146, "lr": 8.66284017007651e-05} +{"train_loss": 0.0043276650831103325, "global_step": 17397, "epoch": 146, "lr": 8.662689358109687e-05} +{"train_loss": 0.0075994511134922504, "global_step": 17398, "epoch": 146, "lr": 8.662538538951565e-05} +{"train_loss": 0.00532309478148818, "global_step": 17399, "epoch": 146, "lr": 8.662387712602439e-05} +{"train_loss": 0.007098834961652756, "global_step": 17400, "epoch": 146, "lr": 8.662236879062606e-05} +{"train_loss": 0.0057217394933104515, "global_step": 17401, "epoch": 146, "lr": 8.662086038332364e-05} +{"train_loss": 0.004622309003025293, "global_step": 17402, "epoch": 146, "lr": 8.661935190412005e-05} +{"train_loss": 0.006562473718076944, "global_step": 17403, "epoch": 146, "lr": 8.661784335301828e-05} +{"train_loss": 0.0035078590735793114, "global_step": 17404, "epoch": 146, "lr": 8.66163347300213e-05} +{"train_loss": 0.005692311096936464, "global_step": 17405, "epoch": 146, "lr": 8.661482603513204e-05} +{"train_loss": 0.009264769963920116, "global_step": 17406, "epoch": 146, "lr": 8.66133172683535e-05} +{"train_loss": 0.004601686727255583, "global_step": 17407, "epoch": 146, "lr": 8.661180842968862e-05} +{"train_loss": 0.004797757603228092, "global_step": 17408, "epoch": 146, "lr": 8.661029951914035e-05} +{"train_loss": 0.0031239467207342386, "global_step": 17409, "epoch": 146, "lr": 8.660879053671168e-05} +{"train_loss": 0.007502691354602575, "global_step": 17410, "epoch": 146, "lr": 8.660728148240556e-05} +{"train_loss": 0.0048881834372878075, "global_step": 17411, "epoch": 146, "lr": 8.660577235622496e-05} +{"train_loss": 0.006388920824974775, "global_step": 17412, "epoch": 146, "lr": 8.660426315817282e-05} +{"train_loss": 0.007015961222350597, "global_step": 17413, "epoch": 146, "lr": 8.660275388825213e-05} +{"train_loss": 0.006032662000507116, "global_step": 17414, "epoch": 146, "lr": 8.660124454646583e-05} +{"train_loss": 0.0056812819093465805, "global_step": 17415, "epoch": 146, "lr": 8.659973513281691e-05} +{"train_loss": 0.0029780680779367685, "global_step": 17416, "epoch": 146, "lr": 8.659822564730833e-05} +{"train_loss": 0.004174468107521534, "global_step": 17417, "epoch": 146, "lr": 8.659671608994303e-05} +{"train_loss": 0.010417316108942032, "global_step": 17418, "epoch": 146, "lr": 8.659520646072399e-05} +{"train_loss": 0.006395549979060888, "global_step": 17419, "epoch": 146, "lr": 8.659369675965418e-05} +{"train_loss": 0.004199547693133354, "global_step": 17420, "epoch": 146, "lr": 8.659218698673655e-05} +{"train_loss": 0.0080020222812891, "global_step": 17421, "epoch": 146, "lr": 8.659067714197407e-05} +{"train_loss": 0.004606918897479773, "global_step": 17422, "epoch": 146, "lr": 8.65891672253697e-05} +{"train_loss": 0.007435670122504234, "global_step": 17423, "epoch": 146, "lr": 8.658765723692641e-05} +{"train_loss": 0.006228436715900898, "global_step": 17424, "epoch": 146, "lr": 8.658614717664717e-05} +{"train_loss": 0.004214792046695948, "global_step": 17425, "epoch": 146, "lr": 8.658463704453492e-05} +{"train_loss": 0.006363025400787592, "global_step": 17426, "epoch": 146, "lr": 8.658312684059267e-05} +{"train_loss": 0.00447220541536808, "global_step": 17427, "epoch": 146, "lr": 8.658161656482333e-05} +{"train_loss": 0.008686435408890247, "global_step": 17428, "epoch": 146, "lr": 8.658010621722992e-05} +{"train_loss": 0.004670214839279652, "global_step": 17429, "epoch": 146, "lr": 8.657859579781538e-05} +{"train_loss": 0.0027728374116122723, "global_step": 17430, "epoch": 146, "lr": 8.657708530658266e-05} +{"train_loss": 0.005840678699314594, "global_step": 17431, "epoch": 146, "lr": 8.657557474353475e-05} +{"train_loss": 0.004206872079521418, "global_step": 17432, "epoch": 146, "lr": 8.657406410867459e-05} +{"train_loss": 0.006067263428121805, "global_step": 17433, "epoch": 146, "lr": 8.657255340200518e-05} +{"train_loss": 0.006156240589916706, "global_step": 17434, "epoch": 146, "lr": 8.657104262352947e-05} +{"train_loss": 0.004937557503581047, "global_step": 17435, "epoch": 146, "lr": 8.656953177325041e-05} +{"train_loss": 0.0045681968331336975, "global_step": 17436, "epoch": 146, "lr": 8.6568020851171e-05} +{"train_loss": 0.006359445862472057, "global_step": 17437, "epoch": 146, "lr": 8.656650985729417e-05} +{"train_loss": 0.005907168611884117, "global_step": 17438, "epoch": 146, "lr": 8.656499879162291e-05} +{"train_loss": 0.00858288537710905, "global_step": 17439, "epoch": 146, "lr": 8.656348765416018e-05} +{"train_loss": 0.005016506649553776, "global_step": 17440, "epoch": 146, "lr": 8.656197644490895e-05} +{"train_loss": 0.004190642852336168, "global_step": 17441, "epoch": 146, "lr": 8.65604651638722e-05} +{"train_loss": 0.0030528786592185497, "global_step": 17442, "epoch": 146, "lr": 8.655895381105285e-05} +{"train_loss": 0.010940920561552048, "global_step": 17443, "epoch": 146, "lr": 8.655744238645393e-05} +{"train_loss": 0.004919277038425207, "global_step": 17444, "epoch": 146, "lr": 8.655593089007836e-05} +{"train_loss": 0.007378505077213049, "global_step": 17445, "epoch": 146, "lr": 8.655441932192913e-05} +{"train_loss": 0.0076307086274027824, "global_step": 17446, "epoch": 146, "lr": 8.65529076820092e-05} +{"train_loss": 0.003387016011402011, "global_step": 17447, "epoch": 146, "lr": 8.655139597032156e-05} +{"train_loss": 0.007608958054333925, "global_step": 17448, "epoch": 146, "lr": 8.654988418686913e-05} +{"train_loss": 0.004270737059414387, "global_step": 17449, "epoch": 146, "lr": 8.654837233165494e-05} +{"train_loss": 0.007424370851367712, "global_step": 17450, "epoch": 146, "lr": 8.65468604046819e-05} +{"train_loss": 0.005530987400561571, "global_step": 17451, "epoch": 146, "lr": 8.6545348405953e-05} +{"train_loss": 0.006069181486964226, "global_step": 17452, "epoch": 146, "lr": 8.654383633547124e-05} +{"train_loss": 0.006697386968880892, "global_step": 17453, "epoch": 146, "lr": 8.654232419323954e-05} +{"train_loss": 0.007029395550489426, "global_step": 17454, "epoch": 146, "lr": 8.65408119792609e-05} +{"train_loss": 0.006436172407120466, "global_step": 17455, "epoch": 146, "lr": 8.653929969353828e-05} +{"train_loss": 0.0051624970510602, "global_step": 17456, "epoch": 146, "lr": 8.653778733607463e-05} +{"train_loss": 0.004490166902542114, "global_step": 17457, "epoch": 146, "lr": 8.653627490687295e-05} +{"train_loss": 0.007498299703001976, "global_step": 17458, "epoch": 146, "lr": 8.65347624059362e-05} +{"train_loss": 0.004441129509359598, "global_step": 17459, "epoch": 146, "lr": 8.653324983326736e-05} +{"train_loss": 0.0040166242979466915, "global_step": 17460, "epoch": 146, "lr": 8.653173718886937e-05} +{"train_loss": 0.005636824760586023, "global_step": 17461, "epoch": 146, "lr": 8.653022447274523e-05} +{"train_loss": 0.00738693680614233, "global_step": 17462, "epoch": 146, "lr": 8.652871168489787e-05} +{"train_loss": 0.0051374277099967, "global_step": 17463, "epoch": 146, "lr": 8.652719882533031e-05} +{"train_loss": 0.009845620021224022, "global_step": 17464, "epoch": 146, "lr": 8.652568589404549e-05} +{"train_loss": 0.006772713735699654, "global_step": 17465, "epoch": 146, "lr": 8.65241728910464e-05} +{"train_loss": 0.005416092462837696, "global_step": 17466, "epoch": 146, "lr": 8.652265981633598e-05} +{"train_loss": 0.004450201988220215, "global_step": 17467, "epoch": 146, "lr": 8.652114666991724e-05} +{"train_loss": 0.004983170423656702, "global_step": 17468, "epoch": 146, "lr": 8.651963345179311e-05} +{"train_loss": 0.0054566520266234875, "global_step": 17469, "epoch": 146, "lr": 8.651812016196659e-05} +{"train_loss": 0.0033621808979660273, "global_step": 17470, "epoch": 146, "lr": 8.651660680044065e-05} +{"train_loss": 0.0074599748477339745, "global_step": 17471, "epoch": 146, "lr": 8.651509336721823e-05} +{"train_loss": 0.0034507159143686295, "global_step": 17472, "epoch": 146, "lr": 8.651357986230236e-05} +{"train_loss": 0.003183797700330615, "global_step": 17473, "epoch": 146, "lr": 8.651206628569594e-05} +{"train_loss": 0.004991444293409586, "global_step": 17474, "epoch": 146, "lr": 8.651055263740201e-05} +{"train_loss": 0.004679507110267878, "global_step": 17475, "epoch": 146, "lr": 8.65090389174235e-05} +{"train_loss": 0.006130019668489695, "global_step": 17476, "epoch": 146, "lr": 8.650752512576339e-05} +{"train_loss": 0.004169880878180265, "global_step": 17477, "epoch": 146, "lr": 8.650601126242464e-05} +{"train_loss": 0.0044633434154093266, "global_step": 17478, "epoch": 146, "lr": 8.650449732741026e-05} +{"train_loss": 0.006368540693074465, "global_step": 17479, "epoch": 146, "lr": 8.650298332072318e-05} +{"train_loss": 0.004756467416882515, "global_step": 17480, "epoch": 146, "lr": 8.650146924236642e-05} +{"train_loss": 0.00467625493183732, "global_step": 17481, "epoch": 146, "lr": 8.64999550923429e-05} +{"train_loss": 0.006656658835709095, "global_step": 17482, "epoch": 146, "lr": 8.649844087065561e-05} +{"train_loss": 0.005322467070072889, "global_step": 17483, "epoch": 146, "lr": 8.649692657730756e-05} +{"train_loss": 0.004315655212849379, "global_step": 17484, "epoch": 146, "lr": 8.649541221230169e-05} +{"train_loss": 0.0031202484387904406, "global_step": 17485, "epoch": 146, "lr": 8.649389777564095e-05} +{"train_loss": 0.0054709454998373985, "global_step": 17486, "epoch": 146, "lr": 8.649238326732835e-05} +{"train_loss": 0.00641644885763526, "global_step": 17487, "epoch": 146, "lr": 8.649086868736687e-05} +{"train_loss": 0.004694656934589148, "global_step": 17488, "epoch": 146, "lr": 8.648935403575947e-05} +{"train_loss": 0.004838997032493353, "global_step": 17489, "epoch": 146, "lr": 8.64878393125091e-05} +{"train_loss": 0.004613813944160938, "global_step": 17490, "epoch": 146, "lr": 8.648632451761876e-05} +{"train_loss": 0.004517506342381239, "global_step": 17491, "epoch": 146, "lr": 8.648480965109143e-05} +{"train_loss": 0.00549750412743883, "global_step": 17492, "epoch": 146, "lr": 8.648329471293008e-05, "val_loss": 0.016306232661008835} +{"train_loss": 0.008272209204733372, "global_step": 17493, "epoch": 147, "lr": 8.648177970313767e-05} +{"train_loss": 0.0056044189259409904, "global_step": 17494, "epoch": 147, "lr": 8.648026462171717e-05} +{"train_loss": 0.006780729163438082, "global_step": 17495, "epoch": 147, "lr": 8.647874946867158e-05} +{"train_loss": 0.007549651432782412, "global_step": 17496, "epoch": 147, "lr": 8.647723424400387e-05} +{"train_loss": 0.0035192377399653196, "global_step": 17497, "epoch": 147, "lr": 8.6475718947717e-05} +{"train_loss": 0.006970187649130821, "global_step": 17498, "epoch": 147, "lr": 8.647420357981395e-05} +{"train_loss": 0.004841831512749195, "global_step": 17499, "epoch": 147, "lr": 8.64726881402977e-05} +{"train_loss": 0.003189113922417164, "global_step": 17500, "epoch": 147, "lr": 8.647117262917122e-05} +{"train_loss": 0.0042594908736646175, "global_step": 17501, "epoch": 147, "lr": 8.64696570464375e-05} +{"train_loss": 0.00311337155289948, "global_step": 17502, "epoch": 147, "lr": 8.646814139209948e-05} +{"train_loss": 0.005421781446784735, "global_step": 17503, "epoch": 147, "lr": 8.646662566616018e-05} +{"train_loss": 0.003245763713493943, "global_step": 17504, "epoch": 147, "lr": 8.646510986862255e-05} +{"train_loss": 0.007162902969866991, "global_step": 17505, "epoch": 147, "lr": 8.646359399948959e-05} +{"train_loss": 0.004463854245841503, "global_step": 17506, "epoch": 147, "lr": 8.646207805876425e-05} +{"train_loss": 0.004963402636349201, "global_step": 17507, "epoch": 147, "lr": 8.64605620464495e-05} +{"train_loss": 0.005894934758543968, "global_step": 17508, "epoch": 147, "lr": 8.645904596254835e-05} +{"train_loss": 0.003726016962900758, "global_step": 17509, "epoch": 147, "lr": 8.645752980706374e-05} +{"train_loss": 0.0049670785665512085, "global_step": 17510, "epoch": 147, "lr": 8.645601357999868e-05} +{"train_loss": 0.006331921089440584, "global_step": 17511, "epoch": 147, "lr": 8.645449728135613e-05} +{"train_loss": 0.005789803806692362, "global_step": 17512, "epoch": 147, "lr": 8.645298091113908e-05} +{"train_loss": 0.00471140630543232, "global_step": 17513, "epoch": 147, "lr": 8.645146446935046e-05} +{"train_loss": 0.007828522473573685, "global_step": 17514, "epoch": 147, "lr": 8.644994795599331e-05} +{"train_loss": 0.0066272662952542305, "global_step": 17515, "epoch": 147, "lr": 8.644843137107059e-05} +{"train_loss": 0.006196158472448587, "global_step": 17516, "epoch": 147, "lr": 8.644691471458525e-05} +{"train_loss": 0.004761823918670416, "global_step": 17517, "epoch": 147, "lr": 8.64453979865403e-05} +{"train_loss": 0.0061841984279453754, "global_step": 17518, "epoch": 147, "lr": 8.64438811869387e-05} +{"train_loss": 0.005287619307637215, "global_step": 17519, "epoch": 147, "lr": 8.644236431578342e-05} +{"train_loss": 0.00565734738484025, "global_step": 17520, "epoch": 147, "lr": 8.644084737307746e-05} +{"train_loss": 0.0065986220724880695, "global_step": 17521, "epoch": 147, "lr": 8.643933035882378e-05} +{"train_loss": 0.007533719763159752, "global_step": 17522, "epoch": 147, "lr": 8.64378132730254e-05} +{"train_loss": 0.004589497111737728, "global_step": 17523, "epoch": 147, "lr": 8.643629611568525e-05} +{"train_loss": 0.005692098755389452, "global_step": 17524, "epoch": 147, "lr": 8.643477888680631e-05} +{"train_loss": 0.00631225248798728, "global_step": 17525, "epoch": 147, "lr": 8.643326158639159e-05} +{"train_loss": 0.005348208360373974, "global_step": 17526, "epoch": 147, "lr": 8.643174421444404e-05} +{"train_loss": 0.007447375915944576, "global_step": 17527, "epoch": 147, "lr": 8.643022677096665e-05} +{"train_loss": 0.003448938252404332, "global_step": 17528, "epoch": 147, "lr": 8.642870925596243e-05} +{"train_loss": 0.00494520366191864, "global_step": 17529, "epoch": 147, "lr": 8.642719166943432e-05} +{"train_loss": 0.005260500591248274, "global_step": 17530, "epoch": 147, "lr": 8.642567401138529e-05} +{"train_loss": 0.005838682409375906, "global_step": 17531, "epoch": 147, "lr": 8.642415628181836e-05} +{"train_loss": 0.004464748781174421, "global_step": 17532, "epoch": 147, "lr": 8.642263848073648e-05} +{"train_loss": 0.0073898364789783955, "global_step": 17533, "epoch": 147, "lr": 8.642112060814265e-05} +{"train_loss": 0.008795100264251232, "global_step": 17534, "epoch": 147, "lr": 8.641960266403983e-05} +{"train_loss": 0.00570131279528141, "global_step": 17535, "epoch": 147, "lr": 8.641808464843103e-05} +{"train_loss": 0.0054701571352779865, "global_step": 17536, "epoch": 147, "lr": 8.64165665613192e-05} +{"train_loss": 0.010483578778803349, "global_step": 17537, "epoch": 147, "lr": 8.641504840270733e-05} +{"train_loss": 0.009466825984418392, "global_step": 17538, "epoch": 147, "lr": 8.64135301725984e-05} +{"train_loss": 0.006289458367973566, "global_step": 17539, "epoch": 147, "lr": 8.64120118709954e-05} +{"train_loss": 0.007971281185746193, "global_step": 17540, "epoch": 147, "lr": 8.64104934979013e-05} +{"train_loss": 0.006859074346721172, "global_step": 17541, "epoch": 147, "lr": 8.640897505331908e-05} +{"train_loss": 0.005815053358674049, "global_step": 17542, "epoch": 147, "lr": 8.640745653725176e-05} +{"train_loss": 0.004182782955467701, "global_step": 17543, "epoch": 147, "lr": 8.640593794970224e-05} +{"train_loss": 0.008678946644067764, "global_step": 17544, "epoch": 147, "lr": 8.640441929067357e-05} +{"train_loss": 0.005608049221336842, "global_step": 17545, "epoch": 147, "lr": 8.640290056016873e-05} +{"train_loss": 0.009787109680473804, "global_step": 17546, "epoch": 147, "lr": 8.640138175819068e-05} +{"train_loss": 0.00847549643367529, "global_step": 17547, "epoch": 147, "lr": 8.639986288474239e-05} +{"train_loss": 0.004693932365626097, "global_step": 17548, "epoch": 147, "lr": 8.639834393982686e-05} +{"train_loss": 0.006014740094542503, "global_step": 17549, "epoch": 147, "lr": 8.639682492344707e-05} +{"train_loss": 0.005256257019937038, "global_step": 17550, "epoch": 147, "lr": 8.639530583560603e-05} +{"train_loss": 0.00622772891074419, "global_step": 17551, "epoch": 147, "lr": 8.639378667630667e-05} +{"train_loss": 0.006353387143462896, "global_step": 17552, "epoch": 147, "lr": 8.639226744555199e-05} +{"train_loss": 0.007272197864949703, "global_step": 17553, "epoch": 147, "lr": 8.6390748143345e-05} +{"train_loss": 0.008237200789153576, "global_step": 17554, "epoch": 147, "lr": 8.638922876968865e-05} +{"train_loss": 0.007511839736253023, "global_step": 17555, "epoch": 147, "lr": 8.638770932458594e-05} +{"train_loss": 0.005934544373303652, "global_step": 17556, "epoch": 147, "lr": 8.638618980803985e-05} +{"train_loss": 0.005013248883187771, "global_step": 17557, "epoch": 147, "lr": 8.638467022005337e-05} +{"train_loss": 0.004909576382488012, "global_step": 17558, "epoch": 147, "lr": 8.638315056062946e-05} +{"train_loss": 0.010084224864840508, "global_step": 17559, "epoch": 147, "lr": 8.638163082977115e-05} +{"train_loss": 0.006006267387419939, "global_step": 17560, "epoch": 147, "lr": 8.638011102748137e-05} +{"train_loss": 0.004643196705728769, "global_step": 17561, "epoch": 147, "lr": 8.637859115376314e-05} +{"train_loss": 0.007309682667255402, "global_step": 17562, "epoch": 147, "lr": 8.637707120861942e-05} +{"train_loss": 0.006187922786921263, "global_step": 17563, "epoch": 147, "lr": 8.637555119205323e-05} +{"train_loss": 0.006335125770419836, "global_step": 17564, "epoch": 147, "lr": 8.63740311040675e-05} +{"train_loss": 0.008031781762838364, "global_step": 17565, "epoch": 147, "lr": 8.637251094466527e-05} +{"train_loss": 0.005482158623635769, "global_step": 17566, "epoch": 147, "lr": 8.637099071384951e-05} +{"train_loss": 0.007061124313622713, "global_step": 17567, "epoch": 147, "lr": 8.636947041162317e-05} +{"train_loss": 0.007065868936479092, "global_step": 17568, "epoch": 147, "lr": 8.636795003798927e-05} +{"train_loss": 0.007147911936044693, "global_step": 17569, "epoch": 147, "lr": 8.636642959295078e-05} +{"train_loss": 0.008980244398117065, "global_step": 17570, "epoch": 147, "lr": 8.63649090765107e-05} +{"train_loss": 0.0060668024234473705, "global_step": 17571, "epoch": 147, "lr": 8.6363388488672e-05} +{"train_loss": 0.004884673282504082, "global_step": 17572, "epoch": 147, "lr": 8.636186782943769e-05} +{"train_loss": 0.0054076677188277245, "global_step": 17573, "epoch": 147, "lr": 8.63603470988107e-05} +{"train_loss": 0.0053937300108373165, "global_step": 17574, "epoch": 147, "lr": 8.635882629679408e-05} +{"train_loss": 0.005873311776667833, "global_step": 17575, "epoch": 147, "lr": 8.63573054233908e-05} +{"train_loss": 0.0073845600709319115, "global_step": 17576, "epoch": 147, "lr": 8.63557844786038e-05} +{"train_loss": 0.006179632153362036, "global_step": 17577, "epoch": 147, "lr": 8.635426346243613e-05} +{"train_loss": 0.003237024648115039, "global_step": 17578, "epoch": 147, "lr": 8.635274237489073e-05} +{"train_loss": 0.009871548041701317, "global_step": 17579, "epoch": 147, "lr": 8.635122121597062e-05} +{"train_loss": 0.003940383903682232, "global_step": 17580, "epoch": 147, "lr": 8.634969998567875e-05} +{"train_loss": 0.00694007333368063, "global_step": 17581, "epoch": 147, "lr": 8.634817868401815e-05} +{"train_loss": 0.006340800318866968, "global_step": 17582, "epoch": 147, "lr": 8.634665731099177e-05} +{"train_loss": 0.008291594684123993, "global_step": 17583, "epoch": 147, "lr": 8.634513586660262e-05} +{"train_loss": 0.006609971169382334, "global_step": 17584, "epoch": 147, "lr": 8.634361435085367e-05} +{"train_loss": 0.006224869750440121, "global_step": 17585, "epoch": 147, "lr": 8.634209276374792e-05} +{"train_loss": 0.005570037290453911, "global_step": 17586, "epoch": 147, "lr": 8.634057110528835e-05} +{"train_loss": 0.007175589445978403, "global_step": 17587, "epoch": 147, "lr": 8.633904937547796e-05} +{"train_loss": 0.004349747207015753, "global_step": 17588, "epoch": 147, "lr": 8.633752757431972e-05} +{"train_loss": 0.005086785182356834, "global_step": 17589, "epoch": 147, "lr": 8.633600570181663e-05} +{"train_loss": 0.0077133760787546635, "global_step": 17590, "epoch": 147, "lr": 8.633448375797169e-05} +{"train_loss": 0.00567668117582798, "global_step": 17591, "epoch": 147, "lr": 8.633296174278784e-05} +{"train_loss": 0.00524765532463789, "global_step": 17592, "epoch": 147, "lr": 8.633143965626812e-05} +{"train_loss": 0.0030593289993703365, "global_step": 17593, "epoch": 147, "lr": 8.63299174984155e-05} +{"train_loss": 0.005877463612705469, "global_step": 17594, "epoch": 147, "lr": 8.632839526923297e-05} +{"train_loss": 0.00426797941327095, "global_step": 17595, "epoch": 147, "lr": 8.63268729687235e-05} +{"train_loss": 0.004389000590890646, "global_step": 17596, "epoch": 147, "lr": 8.632535059689011e-05} +{"train_loss": 0.005646090023219585, "global_step": 17597, "epoch": 147, "lr": 8.632382815373578e-05} +{"train_loss": 0.0065992302261292934, "global_step": 17598, "epoch": 147, "lr": 8.63223056392635e-05} +{"train_loss": 0.003872663015499711, "global_step": 17599, "epoch": 147, "lr": 8.632078305347624e-05} +{"train_loss": 0.004339816980063915, "global_step": 17600, "epoch": 147, "lr": 8.6319260396377e-05} +{"train_loss": 0.005250347778201103, "global_step": 17601, "epoch": 147, "lr": 8.631773766796878e-05} +{"train_loss": 0.007161133456975222, "global_step": 17602, "epoch": 147, "lr": 8.631621486825456e-05} +{"train_loss": 0.005135654471814632, "global_step": 17603, "epoch": 147, "lr": 8.631469199723732e-05} +{"train_loss": 0.007001347839832306, "global_step": 17604, "epoch": 147, "lr": 8.631316905492009e-05} +{"train_loss": 0.0065502505749464035, "global_step": 17605, "epoch": 147, "lr": 8.63116460413058e-05} +{"train_loss": 0.00445071654394269, "global_step": 17606, "epoch": 147, "lr": 8.631012295639748e-05} +{"train_loss": 0.0066252341493964195, "global_step": 17607, "epoch": 147, "lr": 8.630859980019813e-05} +{"train_loss": 0.005915827117860317, "global_step": 17608, "epoch": 147, "lr": 8.630707657271071e-05} +{"train_loss": 0.005871726665645838, "global_step": 17609, "epoch": 147, "lr": 8.630555327393823e-05} +{"train_loss": 0.0045671286061406136, "global_step": 17610, "epoch": 147, "lr": 8.630402990388367e-05} +{"train_loss": 0.0060423485437768095, "global_step": 17611, "epoch": 147, "lr": 8.630250646255003e-05, "val_loss": 0.02686784788966179} +{"train_loss": 0.005304540973156691, "global_step": 17612, "epoch": 148, "lr": 8.630098294994028e-05} +{"train_loss": 0.0038955537602305412, "global_step": 17613, "epoch": 148, "lr": 8.629945936605746e-05} +{"train_loss": 0.006012336816638708, "global_step": 17614, "epoch": 148, "lr": 8.629793571090452e-05} +{"train_loss": 0.002800636226311326, "global_step": 17615, "epoch": 148, "lr": 8.629641198448445e-05} +{"train_loss": 0.006388422567397356, "global_step": 17616, "epoch": 148, "lr": 8.629488818680026e-05} +{"train_loss": 0.007126845885068178, "global_step": 17617, "epoch": 148, "lr": 8.629336431785493e-05} +{"train_loss": 0.004306122660636902, "global_step": 17618, "epoch": 148, "lr": 8.629184037765145e-05} +{"train_loss": 0.005865304730832577, "global_step": 17619, "epoch": 148, "lr": 8.629031636619282e-05} +{"train_loss": 0.004699053708463907, "global_step": 17620, "epoch": 148, "lr": 8.628879228348204e-05} +{"train_loss": 0.006886007729917765, "global_step": 17621, "epoch": 148, "lr": 8.62872681295221e-05} +{"train_loss": 0.0035390269476920366, "global_step": 17622, "epoch": 148, "lr": 8.628574390431596e-05} +{"train_loss": 0.0050375210121273994, "global_step": 17623, "epoch": 148, "lr": 8.628421960786666e-05} +{"train_loss": 0.004165267571806908, "global_step": 17624, "epoch": 148, "lr": 8.628269524017717e-05} +{"train_loss": 0.005550194997340441, "global_step": 17625, "epoch": 148, "lr": 8.628117080125049e-05} +{"train_loss": 0.004023713991045952, "global_step": 17626, "epoch": 148, "lr": 8.627964629108958e-05} +{"train_loss": 0.005494048818945885, "global_step": 17627, "epoch": 148, "lr": 8.627812170969749e-05} +{"train_loss": 0.004235010128468275, "global_step": 17628, "epoch": 148, "lr": 8.627659705707716e-05} +{"train_loss": 0.005292522720992565, "global_step": 17629, "epoch": 148, "lr": 8.627507233323162e-05} +{"train_loss": 0.008716495707631111, "global_step": 17630, "epoch": 148, "lr": 8.627354753816386e-05} +{"train_loss": 0.004739007912576199, "global_step": 17631, "epoch": 148, "lr": 8.627202267187684e-05} +{"train_loss": 0.0052353092469275, "global_step": 17632, "epoch": 148, "lr": 8.62704977343736e-05} +{"train_loss": 0.008461421355605125, "global_step": 17633, "epoch": 148, "lr": 8.626897272565711e-05} +{"train_loss": 0.0037383916787803173, "global_step": 17634, "epoch": 148, "lr": 8.626744764573036e-05} +{"train_loss": 0.005198164843022823, "global_step": 17635, "epoch": 148, "lr": 8.626592249459635e-05} +{"train_loss": 0.004521226044744253, "global_step": 17636, "epoch": 148, "lr": 8.626439727225809e-05} +{"train_loss": 0.0038333467673510313, "global_step": 17637, "epoch": 148, "lr": 8.626287197871854e-05} +{"train_loss": 0.005653216037899256, "global_step": 17638, "epoch": 148, "lr": 8.626134661398071e-05} +{"train_loss": 0.003867174033075571, "global_step": 17639, "epoch": 148, "lr": 8.625982117804763e-05} +{"train_loss": 0.007619666401296854, "global_step": 17640, "epoch": 148, "lr": 8.625829567092225e-05} +{"train_loss": 0.004233922343701124, "global_step": 17641, "epoch": 148, "lr": 8.625677009260757e-05} +{"train_loss": 0.0034322061110287905, "global_step": 17642, "epoch": 148, "lr": 8.62552444431066e-05} +{"train_loss": 0.005482305772602558, "global_step": 17643, "epoch": 148, "lr": 8.625371872242233e-05} +{"train_loss": 0.004562364425510168, "global_step": 17644, "epoch": 148, "lr": 8.625219293055777e-05} +{"train_loss": 0.008239508606493473, "global_step": 17645, "epoch": 148, "lr": 8.62506670675159e-05} +{"train_loss": 0.009106356650590897, "global_step": 17646, "epoch": 148, "lr": 8.62491411332997e-05} +{"train_loss": 0.006622415501624346, "global_step": 17647, "epoch": 148, "lr": 8.624761512791219e-05} +{"train_loss": 0.007837149314582348, "global_step": 17648, "epoch": 148, "lr": 8.624608905135638e-05} +{"train_loss": 0.005666328594088554, "global_step": 17649, "epoch": 148, "lr": 8.624456290363523e-05} +{"train_loss": 0.007014242000877857, "global_step": 17650, "epoch": 148, "lr": 8.624303668475176e-05} +{"train_loss": 0.005820535589009523, "global_step": 17651, "epoch": 148, "lr": 8.624151039470895e-05} +{"train_loss": 0.006441394332796335, "global_step": 17652, "epoch": 148, "lr": 8.623998403350981e-05} +{"train_loss": 0.003736340906471014, "global_step": 17653, "epoch": 148, "lr": 8.623845760115733e-05} +{"train_loss": 0.003215603996068239, "global_step": 17654, "epoch": 148, "lr": 8.623693109765452e-05} +{"train_loss": 0.007144314702600241, "global_step": 17655, "epoch": 148, "lr": 8.623540452300436e-05} +{"train_loss": 0.005305035505443811, "global_step": 17656, "epoch": 148, "lr": 8.623387787720986e-05} +{"train_loss": 0.004237792920321226, "global_step": 17657, "epoch": 148, "lr": 8.6232351160274e-05} +{"train_loss": 0.006672439631074667, "global_step": 17658, "epoch": 148, "lr": 8.623082437219981e-05} +{"train_loss": 0.004918364342302084, "global_step": 17659, "epoch": 148, "lr": 8.622929751299025e-05} +{"train_loss": 0.005963840056210756, "global_step": 17660, "epoch": 148, "lr": 8.622777058264832e-05} +{"train_loss": 0.0064650108106434345, "global_step": 17661, "epoch": 148, "lr": 8.622624358117706e-05} +{"train_loss": 0.005355120170861483, "global_step": 17662, "epoch": 148, "lr": 8.622471650857944e-05} +{"train_loss": 0.005978332366794348, "global_step": 17663, "epoch": 148, "lr": 8.622318936485845e-05} +{"train_loss": 0.008264360018074512, "global_step": 17664, "epoch": 148, "lr": 8.622166215001711e-05} +{"train_loss": 0.007942572236061096, "global_step": 17665, "epoch": 148, "lr": 8.622013486405838e-05} +{"train_loss": 0.005642368458211422, "global_step": 17666, "epoch": 148, "lr": 8.62186075069853e-05} +{"train_loss": 0.005296100862324238, "global_step": 17667, "epoch": 148, "lr": 8.621708007880085e-05} +{"train_loss": 0.006507312413305044, "global_step": 17668, "epoch": 148, "lr": 8.621555257950804e-05} +{"train_loss": 0.00661961967125535, "global_step": 17669, "epoch": 148, "lr": 8.621402500910985e-05} +{"train_loss": 0.006522498093545437, "global_step": 17670, "epoch": 148, "lr": 8.62124973676093e-05} +{"train_loss": 0.0056449673138558865, "global_step": 17671, "epoch": 148, "lr": 8.621096965500939e-05} +{"train_loss": 0.0064802709966897964, "global_step": 17672, "epoch": 148, "lr": 8.62094418713131e-05} +{"train_loss": 0.007258728612214327, "global_step": 17673, "epoch": 148, "lr": 8.620791401652343e-05} +{"train_loss": 0.0061791809275746346, "global_step": 17674, "epoch": 148, "lr": 8.62063860906434e-05} +{"train_loss": 0.004162533208727837, "global_step": 17675, "epoch": 148, "lr": 8.620485809367599e-05} +{"train_loss": 0.00792607944458723, "global_step": 17676, "epoch": 148, "lr": 8.620333002562422e-05} +{"train_loss": 0.008163204416632652, "global_step": 17677, "epoch": 148, "lr": 8.620180188649107e-05} +{"train_loss": 0.003917194902896881, "global_step": 17678, "epoch": 148, "lr": 8.620027367627955e-05} +{"train_loss": 0.011484029702842236, "global_step": 17679, "epoch": 148, "lr": 8.619874539499267e-05} +{"train_loss": 0.005442759953439236, "global_step": 17680, "epoch": 148, "lr": 8.619721704263342e-05} +{"train_loss": 0.007726794108748436, "global_step": 17681, "epoch": 148, "lr": 8.61956886192048e-05} +{"train_loss": 0.00531691825017333, "global_step": 17682, "epoch": 148, "lr": 8.61941601247098e-05} +{"train_loss": 0.008065329864621162, "global_step": 17683, "epoch": 148, "lr": 8.619263155915144e-05} +{"train_loss": 0.006540324073284864, "global_step": 17684, "epoch": 148, "lr": 8.619110292253272e-05} +{"train_loss": 0.00701133394613862, "global_step": 17685, "epoch": 148, "lr": 8.618957421485662e-05} +{"train_loss": 0.006563643459230661, "global_step": 17686, "epoch": 148, "lr": 8.618804543612617e-05} +{"train_loss": 0.006002636160701513, "global_step": 17687, "epoch": 148, "lr": 8.618651658634436e-05} +{"train_loss": 0.008773407898843288, "global_step": 17688, "epoch": 148, "lr": 8.61849876655142e-05} +{"train_loss": 0.007174843922257423, "global_step": 17689, "epoch": 148, "lr": 8.618345867363866e-05} +{"train_loss": 0.005539423786103725, "global_step": 17690, "epoch": 148, "lr": 8.618192961072078e-05} +{"train_loss": 0.005217922851443291, "global_step": 17691, "epoch": 148, "lr": 8.618040047676355e-05} +{"train_loss": 0.007921066135168076, "global_step": 17692, "epoch": 148, "lr": 8.617887127176996e-05} +{"train_loss": 0.004156594164669514, "global_step": 17693, "epoch": 148, "lr": 8.617734199574302e-05} +{"train_loss": 0.007769588381052017, "global_step": 17694, "epoch": 148, "lr": 8.617581264868572e-05} +{"train_loss": 0.00726596312597394, "global_step": 17695, "epoch": 148, "lr": 8.61742832306011e-05} +{"train_loss": 0.003927590325474739, "global_step": 17696, "epoch": 148, "lr": 8.617275374149213e-05} +{"train_loss": 0.005890743341296911, "global_step": 17697, "epoch": 148, "lr": 8.617122418136183e-05} +{"train_loss": 0.006680426187813282, "global_step": 17698, "epoch": 148, "lr": 8.616969455021318e-05} +{"train_loss": 0.006687865126878023, "global_step": 17699, "epoch": 148, "lr": 8.616816484804921e-05} +{"train_loss": 0.00608288636431098, "global_step": 17700, "epoch": 148, "lr": 8.616663507487293e-05} +{"train_loss": 0.006594749633222818, "global_step": 17701, "epoch": 148, "lr": 8.616510523068731e-05} +{"train_loss": 0.00844525545835495, "global_step": 17702, "epoch": 148, "lr": 8.616357531549535e-05} +{"train_loss": 0.00914793275296688, "global_step": 17703, "epoch": 148, "lr": 8.616204532930011e-05} +{"train_loss": 0.005130171775817871, "global_step": 17704, "epoch": 148, "lr": 8.616051527210453e-05} +{"train_loss": 0.006638723891228437, "global_step": 17705, "epoch": 148, "lr": 8.615898514391163e-05} +{"train_loss": 0.0061357044614851475, "global_step": 17706, "epoch": 148, "lr": 8.615745494472447e-05} +{"train_loss": 0.00598199712112546, "global_step": 17707, "epoch": 148, "lr": 8.615592467454599e-05} +{"train_loss": 0.009285986423492432, "global_step": 17708, "epoch": 148, "lr": 8.61543943333792e-05} +{"train_loss": 0.004212371539324522, "global_step": 17709, "epoch": 148, "lr": 8.615286392122712e-05} +{"train_loss": 0.005591738037765026, "global_step": 17710, "epoch": 148, "lr": 8.615133343809277e-05} +{"train_loss": 0.004698642995208502, "global_step": 17711, "epoch": 148, "lr": 8.614980288397914e-05} +{"train_loss": 0.007503649219870567, "global_step": 17712, "epoch": 148, "lr": 8.614827225888922e-05} +{"train_loss": 0.0052258954383432865, "global_step": 17713, "epoch": 148, "lr": 8.614674156282602e-05} +{"train_loss": 0.004711424466222525, "global_step": 17714, "epoch": 148, "lr": 8.614521079579259e-05} +{"train_loss": 0.008384688757359982, "global_step": 17715, "epoch": 148, "lr": 8.614367995779187e-05} +{"train_loss": 0.00740176672115922, "global_step": 17716, "epoch": 148, "lr": 8.614214904882691e-05} +{"train_loss": 0.004390557762235403, "global_step": 17717, "epoch": 148, "lr": 8.61406180689007e-05} +{"train_loss": 0.00661533372476697, "global_step": 17718, "epoch": 148, "lr": 8.613908701801624e-05} +{"train_loss": 0.007091099862009287, "global_step": 17719, "epoch": 148, "lr": 8.613755589617656e-05} +{"train_loss": 0.004855398088693619, "global_step": 17720, "epoch": 148, "lr": 8.613602470338463e-05} +{"train_loss": 0.0057984995655715466, "global_step": 17721, "epoch": 148, "lr": 8.613449343964349e-05} +{"train_loss": 0.0063973767682909966, "global_step": 17722, "epoch": 148, "lr": 8.613296210495612e-05} +{"train_loss": 0.007789911236613989, "global_step": 17723, "epoch": 148, "lr": 8.613143069932555e-05} +{"train_loss": 0.005131903104484081, "global_step": 17724, "epoch": 148, "lr": 8.612989922275477e-05} +{"train_loss": 0.0051480368711054325, "global_step": 17725, "epoch": 148, "lr": 8.612836767524679e-05} +{"train_loss": 0.009498503059148788, "global_step": 17726, "epoch": 148, "lr": 8.612683605680463e-05} +{"train_loss": 0.00468872208148241, "global_step": 17727, "epoch": 148, "lr": 8.612530436743128e-05} +{"train_loss": 0.005579413380473852, "global_step": 17728, "epoch": 148, "lr": 8.612377260712976e-05} +{"train_loss": 0.004953380208462477, "global_step": 17729, "epoch": 148, "lr": 8.612224077590307e-05} +{"train_loss": 0.0060317139571704785, "global_step": 17730, "epoch": 148, "lr": 8.61207088737542e-05, "val_loss": 0.018199089914560318} +{"train_loss": 0.006968913599848747, "global_step": 17731, "epoch": 149, "lr": 8.61191769006862e-05} +{"train_loss": 0.006496758665889502, "global_step": 17732, "epoch": 149, "lr": 8.611764485670206e-05} +{"train_loss": 0.005628406070172787, "global_step": 17733, "epoch": 149, "lr": 8.611611274180478e-05} +{"train_loss": 0.005219339393079281, "global_step": 17734, "epoch": 149, "lr": 8.611458055599734e-05} +{"train_loss": 0.005556074436753988, "global_step": 17735, "epoch": 149, "lr": 8.611304829928282e-05} +{"train_loss": 0.00619015796110034, "global_step": 17736, "epoch": 149, "lr": 8.611151597166416e-05} +{"train_loss": 0.0027572924736887217, "global_step": 17737, "epoch": 149, "lr": 8.610998357314441e-05} +{"train_loss": 0.0072343661449849606, "global_step": 17738, "epoch": 149, "lr": 8.610845110372657e-05} +{"train_loss": 0.004967934917658567, "global_step": 17739, "epoch": 149, "lr": 8.610691856341362e-05} +{"train_loss": 0.005333921872079372, "global_step": 17740, "epoch": 149, "lr": 8.610538595220863e-05} +{"train_loss": 0.005485684610903263, "global_step": 17741, "epoch": 149, "lr": 8.610385327011454e-05} +{"train_loss": 0.004844977520406246, "global_step": 17742, "epoch": 149, "lr": 8.610232051713441e-05} +{"train_loss": 0.00331145990639925, "global_step": 17743, "epoch": 149, "lr": 8.610078769327121e-05} +{"train_loss": 0.007959868758916855, "global_step": 17744, "epoch": 149, "lr": 8.609925479852798e-05} +{"train_loss": 0.006328356917947531, "global_step": 17745, "epoch": 149, "lr": 8.609772183290774e-05} +{"train_loss": 0.002666797023266554, "global_step": 17746, "epoch": 149, "lr": 8.609618879641345e-05} +{"train_loss": 0.00496074091643095, "global_step": 17747, "epoch": 149, "lr": 8.609465568904816e-05} +{"train_loss": 0.005598139483481646, "global_step": 17748, "epoch": 149, "lr": 8.609312251081488e-05} +{"train_loss": 0.005238307639956474, "global_step": 17749, "epoch": 149, "lr": 8.609158926171658e-05} +{"train_loss": 0.004729634150862694, "global_step": 17750, "epoch": 149, "lr": 8.609005594175634e-05} +{"train_loss": 0.004651798866689205, "global_step": 17751, "epoch": 149, "lr": 8.608852255093711e-05} +{"train_loss": 0.00500137684866786, "global_step": 17752, "epoch": 149, "lr": 8.608698908926191e-05} +{"train_loss": 0.006298120133578777, "global_step": 17753, "epoch": 149, "lr": 8.60854555567338e-05} +{"train_loss": 0.005382892210036516, "global_step": 17754, "epoch": 149, "lr": 8.608392195335572e-05} +{"train_loss": 0.005520549602806568, "global_step": 17755, "epoch": 149, "lr": 8.608238827913072e-05} +{"train_loss": 0.007280245423316956, "global_step": 17756, "epoch": 149, "lr": 8.60808545340618e-05} +{"train_loss": 0.006704092491418123, "global_step": 17757, "epoch": 149, "lr": 8.607932071815199e-05} +{"train_loss": 0.005802283063530922, "global_step": 17758, "epoch": 149, "lr": 8.607778683140428e-05} +{"train_loss": 0.007568676024675369, "global_step": 17759, "epoch": 149, "lr": 8.60762528738217e-05} +{"train_loss": 0.00789384450763464, "global_step": 17760, "epoch": 149, "lr": 8.607471884540725e-05} +{"train_loss": 0.004205598495900631, "global_step": 17761, "epoch": 149, "lr": 8.607318474616394e-05} +{"train_loss": 0.008892858400940895, "global_step": 17762, "epoch": 149, "lr": 8.607165057609478e-05} +{"train_loss": 0.005971012637019157, "global_step": 17763, "epoch": 149, "lr": 8.607011633520279e-05} +{"train_loss": 0.005055527668446302, "global_step": 17764, "epoch": 149, "lr": 8.606858202349098e-05} +{"train_loss": 0.004541492555290461, "global_step": 17765, "epoch": 149, "lr": 8.606704764096237e-05} +{"train_loss": 0.003952749073505402, "global_step": 17766, "epoch": 149, "lr": 8.606551318761996e-05} +{"train_loss": 0.0035483359824866056, "global_step": 17767, "epoch": 149, "lr": 8.606397866346676e-05} +{"train_loss": 0.006274634972214699, "global_step": 17768, "epoch": 149, "lr": 8.606244406850581e-05} +{"train_loss": 0.004030163865536451, "global_step": 17769, "epoch": 149, "lr": 8.60609094027401e-05} +{"train_loss": 0.00606930535286665, "global_step": 17770, "epoch": 149, "lr": 8.605937466617264e-05} +{"train_loss": 0.0056879534386098385, "global_step": 17771, "epoch": 149, "lr": 8.605783985880645e-05} +{"train_loss": 0.004347410053014755, "global_step": 17772, "epoch": 149, "lr": 8.605630498064454e-05} +{"train_loss": 0.007018443197011948, "global_step": 17773, "epoch": 149, "lr": 8.605477003168993e-05} +{"train_loss": 0.006620085798203945, "global_step": 17774, "epoch": 149, "lr": 8.605323501194562e-05} +{"train_loss": 0.007099004928022623, "global_step": 17775, "epoch": 149, "lr": 8.605169992141466e-05} +{"train_loss": 0.00757182203233242, "global_step": 17776, "epoch": 149, "lr": 8.605016476010002e-05} +{"train_loss": 0.007990730926394463, "global_step": 17777, "epoch": 149, "lr": 8.604862952800474e-05} +{"train_loss": 0.005684773903340101, "global_step": 17778, "epoch": 149, "lr": 8.604709422513182e-05} +{"train_loss": 0.006483214441686869, "global_step": 17779, "epoch": 149, "lr": 8.604555885148429e-05} +{"train_loss": 0.006268785800784826, "global_step": 17780, "epoch": 149, "lr": 8.604402340706515e-05} +{"train_loss": 0.00573976943269372, "global_step": 17781, "epoch": 149, "lr": 8.604248789187744e-05} +{"train_loss": 0.005577121861279011, "global_step": 17782, "epoch": 149, "lr": 8.604095230592412e-05} +{"train_loss": 0.003832063404843211, "global_step": 17783, "epoch": 149, "lr": 8.603941664920827e-05} +{"train_loss": 0.007999017834663391, "global_step": 17784, "epoch": 149, "lr": 8.603788092173286e-05} +{"train_loss": 0.006638256832957268, "global_step": 17785, "epoch": 149, "lr": 8.603634512350093e-05} +{"train_loss": 0.005103094037622213, "global_step": 17786, "epoch": 149, "lr": 8.603480925451549e-05} +{"train_loss": 0.0056758541613817215, "global_step": 17787, "epoch": 149, "lr": 8.603327331477952e-05} +{"train_loss": 0.004100331105291843, "global_step": 17788, "epoch": 149, "lr": 8.60317373042961e-05} +{"train_loss": 0.006337759084999561, "global_step": 17789, "epoch": 149, "lr": 8.603020122306821e-05} +{"train_loss": 0.003561236197128892, "global_step": 17790, "epoch": 149, "lr": 8.602866507109886e-05} +{"train_loss": 0.006916997954249382, "global_step": 17791, "epoch": 149, "lr": 8.602712884839108e-05} +{"train_loss": 0.0035144933499395847, "global_step": 17792, "epoch": 149, "lr": 8.602559255494789e-05} +{"train_loss": 0.004487986676394939, "global_step": 17793, "epoch": 149, "lr": 8.602405619077228e-05} +{"train_loss": 0.005895966198295355, "global_step": 17794, "epoch": 149, "lr": 8.60225197558673e-05} +{"train_loss": 0.007441339548677206, "global_step": 17795, "epoch": 149, "lr": 8.602098325023593e-05} +{"train_loss": 0.0043900939635932446, "global_step": 17796, "epoch": 149, "lr": 8.601944667388124e-05} +{"train_loss": 0.003044687444344163, "global_step": 17797, "epoch": 149, "lr": 8.601791002680619e-05} +{"train_loss": 0.005210323259234428, "global_step": 17798, "epoch": 149, "lr": 8.601637330901383e-05} +{"train_loss": 0.005298437085002661, "global_step": 17799, "epoch": 149, "lr": 8.601483652050717e-05} +{"train_loss": 0.004889538045972586, "global_step": 17800, "epoch": 149, "lr": 8.601329966128921e-05} +{"train_loss": 0.004357383586466312, "global_step": 17801, "epoch": 149, "lr": 8.6011762731363e-05} +{"train_loss": 0.004844640381634235, "global_step": 17802, "epoch": 149, "lr": 8.601022573073154e-05} +{"train_loss": 0.005742429755628109, "global_step": 17803, "epoch": 149, "lr": 8.600868865939784e-05} +{"train_loss": 0.011681076139211655, "global_step": 17804, "epoch": 149, "lr": 8.600715151736493e-05} +{"train_loss": 0.0038799066096544266, "global_step": 17805, "epoch": 149, "lr": 8.600561430463583e-05} +{"train_loss": 0.006938416510820389, "global_step": 17806, "epoch": 149, "lr": 8.600407702121356e-05} +{"train_loss": 0.0034432364627718925, "global_step": 17807, "epoch": 149, "lr": 8.600253966710112e-05} +{"train_loss": 0.004245140589773655, "global_step": 17808, "epoch": 149, "lr": 8.600100224230154e-05} +{"train_loss": 0.008016913197934628, "global_step": 17809, "epoch": 149, "lr": 8.599946474681784e-05} +{"train_loss": 0.004978028126060963, "global_step": 17810, "epoch": 149, "lr": 8.599792718065304e-05} +{"train_loss": 0.007894626818597317, "global_step": 17811, "epoch": 149, "lr": 8.599638954381015e-05} +{"train_loss": 0.0070845745503902435, "global_step": 17812, "epoch": 149, "lr": 8.59948518362922e-05} +{"train_loss": 0.004337735008448362, "global_step": 17813, "epoch": 149, "lr": 8.59933140581022e-05} +{"train_loss": 0.00433765584602952, "global_step": 17814, "epoch": 149, "lr": 8.599177620924317e-05} +{"train_loss": 0.006575764622539282, "global_step": 17815, "epoch": 149, "lr": 8.599023828971814e-05} +{"train_loss": 0.004806051962077618, "global_step": 17816, "epoch": 149, "lr": 8.598870029953012e-05} +{"train_loss": 0.00795014388859272, "global_step": 17817, "epoch": 149, "lr": 8.598716223868213e-05} +{"train_loss": 0.0066459146328270435, "global_step": 17818, "epoch": 149, "lr": 8.598562410717719e-05} +{"train_loss": 0.005464194808155298, "global_step": 17819, "epoch": 149, "lr": 8.598408590501832e-05} +{"train_loss": 0.005178498104214668, "global_step": 17820, "epoch": 149, "lr": 8.598254763220855e-05} +{"train_loss": 0.007254967000335455, "global_step": 17821, "epoch": 149, "lr": 8.598100928875088e-05} +{"train_loss": 0.0046510156244039536, "global_step": 17822, "epoch": 149, "lr": 8.597947087464837e-05} +{"train_loss": 0.005880265962332487, "global_step": 17823, "epoch": 149, "lr": 8.597793238990398e-05} +{"train_loss": 0.004432946443557739, "global_step": 17824, "epoch": 149, "lr": 8.597639383452079e-05} +{"train_loss": 0.0075925602577626705, "global_step": 17825, "epoch": 149, "lr": 8.597485520850177e-05} +{"train_loss": 0.005681659560650587, "global_step": 17826, "epoch": 149, "lr": 8.597331651184997e-05} +{"train_loss": 0.0057561504654586315, "global_step": 17827, "epoch": 149, "lr": 8.597177774456842e-05} +{"train_loss": 0.0041748881340026855, "global_step": 17828, "epoch": 149, "lr": 8.597023890666011e-05} +{"train_loss": 0.008785257115960121, "global_step": 17829, "epoch": 149, "lr": 8.59686999981281e-05} +{"train_loss": 0.005056770984083414, "global_step": 17830, "epoch": 149, "lr": 8.596716101897537e-05} +{"train_loss": 0.004075280856341124, "global_step": 17831, "epoch": 149, "lr": 8.596562196920497e-05} +{"train_loss": 0.009067917242646217, "global_step": 17832, "epoch": 149, "lr": 8.596408284881992e-05} +{"train_loss": 0.003653512569144368, "global_step": 17833, "epoch": 149, "lr": 8.596254365782322e-05} +{"train_loss": 0.005124002229422331, "global_step": 17834, "epoch": 149, "lr": 8.596100439621793e-05} +{"train_loss": 0.003636021399870515, "global_step": 17835, "epoch": 149, "lr": 8.595946506400703e-05} +{"train_loss": 0.005429356824606657, "global_step": 17836, "epoch": 149, "lr": 8.595792566119356e-05} +{"train_loss": 0.005973217077553272, "global_step": 17837, "epoch": 149, "lr": 8.595638618778054e-05} +{"train_loss": 0.00700974278151989, "global_step": 17838, "epoch": 149, "lr": 8.595484664377103e-05} +{"train_loss": 0.005004674196243286, "global_step": 17839, "epoch": 149, "lr": 8.5953307029168e-05} +{"train_loss": 0.005846566520631313, "global_step": 17840, "epoch": 149, "lr": 8.595176734397449e-05} +{"train_loss": 0.004404771141707897, "global_step": 17841, "epoch": 149, "lr": 8.595022758819353e-05} +{"train_loss": 0.005606973078101873, "global_step": 17842, "epoch": 149, "lr": 8.594868776182815e-05} +{"train_loss": 0.004702380858361721, "global_step": 17843, "epoch": 149, "lr": 8.594714786488135e-05} +{"train_loss": 0.005185412243008614, "global_step": 17844, "epoch": 149, "lr": 8.594560789735616e-05} +{"train_loss": 0.004236366134136915, "global_step": 17845, "epoch": 149, "lr": 8.59440678592556e-05} +{"train_loss": 0.00767907639965415, "global_step": 17846, "epoch": 149, "lr": 8.594252775058271e-05} +{"train_loss": 0.004509900696575642, "global_step": 17847, "epoch": 149, "lr": 8.594098757134052e-05} +{"train_loss": 0.007543530315160751, "global_step": 17848, "epoch": 149, "lr": 8.593944732153203e-05} +{"train_loss": 0.005655713631779331, "global_step": 17849, "epoch": 149, "lr": 8.59379070011603e-05, "val_loss": 0.011026996187865734} +{"train_loss": 0.004727195482701063, "global_step": 17850, "epoch": 150, "lr": 8.59363666102283e-05} +{"train_loss": 0.007102032192051411, "global_step": 17851, "epoch": 150, "lr": 8.59348261487391e-05} +{"train_loss": 0.0037821349687874317, "global_step": 17852, "epoch": 150, "lr": 8.593328561669568e-05} +{"train_loss": 0.0048170569352805614, "global_step": 17853, "epoch": 150, "lr": 8.593174501410111e-05} +{"train_loss": 0.005678034853190184, "global_step": 17854, "epoch": 150, "lr": 8.593020434095839e-05} +{"train_loss": 0.003855001414194703, "global_step": 17855, "epoch": 150, "lr": 8.592866359727058e-05} +{"train_loss": 0.007894116453826427, "global_step": 17856, "epoch": 150, "lr": 8.592712278304064e-05} +{"train_loss": 0.006640176754444838, "global_step": 17857, "epoch": 150, "lr": 8.592558189827166e-05} +{"train_loss": 0.005820940714329481, "global_step": 17858, "epoch": 150, "lr": 8.592404094296663e-05} +{"train_loss": 0.004388995002955198, "global_step": 17859, "epoch": 150, "lr": 8.592249991712859e-05} +{"train_loss": 0.006635337136685848, "global_step": 17860, "epoch": 150, "lr": 8.592095882076054e-05} +{"train_loss": 0.007880025543272495, "global_step": 17861, "epoch": 150, "lr": 8.591941765386555e-05} +{"train_loss": 0.005073825363069773, "global_step": 17862, "epoch": 150, "lr": 8.59178764164466e-05} +{"train_loss": 0.005778490100055933, "global_step": 17863, "epoch": 150, "lr": 8.591633510850675e-05} +{"train_loss": 0.00612374534830451, "global_step": 17864, "epoch": 150, "lr": 8.5914793730049e-05} +{"train_loss": 0.006647984031587839, "global_step": 17865, "epoch": 150, "lr": 8.59132522810764e-05} +{"train_loss": 0.00484919548034668, "global_step": 17866, "epoch": 150, "lr": 8.591171076159197e-05} +{"train_loss": 0.005872194655239582, "global_step": 17867, "epoch": 150, "lr": 8.591016917159874e-05} +{"train_loss": 0.005828567780554295, "global_step": 17868, "epoch": 150, "lr": 8.590862751109969e-05} +{"train_loss": 0.0033154564443975687, "global_step": 17869, "epoch": 150, "lr": 8.590708578009791e-05} +{"train_loss": 0.00814907718449831, "global_step": 17870, "epoch": 150, "lr": 8.590554397859642e-05} +{"train_loss": 0.006944306660443544, "global_step": 17871, "epoch": 150, "lr": 8.590400210659822e-05} +{"train_loss": 0.0038398122414946556, "global_step": 17872, "epoch": 150, "lr": 8.590246016410634e-05} +{"train_loss": 0.0114534180611372, "global_step": 17873, "epoch": 150, "lr": 8.590091815112382e-05} +{"train_loss": 0.0062697771936655045, "global_step": 17874, "epoch": 150, "lr": 8.589937606765367e-05} +{"train_loss": 0.0036133592948317528, "global_step": 17875, "epoch": 150, "lr": 8.589783391369894e-05} +{"train_loss": 0.006111827678978443, "global_step": 17876, "epoch": 150, "lr": 8.589629168926265e-05} +{"train_loss": 0.0054696183651685715, "global_step": 17877, "epoch": 150, "lr": 8.589474939434783e-05} +{"train_loss": 0.004339902196079493, "global_step": 17878, "epoch": 150, "lr": 8.589320702895751e-05} +{"train_loss": 0.007710988167673349, "global_step": 17879, "epoch": 150, "lr": 8.589166459309469e-05} +{"train_loss": 0.006558447610586882, "global_step": 17880, "epoch": 150, "lr": 8.589012208676243e-05} +{"train_loss": 0.0052590989507734776, "global_step": 17881, "epoch": 150, "lr": 8.588857950996377e-05} +{"train_loss": 0.006793898530304432, "global_step": 17882, "epoch": 150, "lr": 8.588703686270169e-05} +{"train_loss": 0.011280488222837448, "global_step": 17883, "epoch": 150, "lr": 8.588549414497926e-05} +{"train_loss": 0.005234763491898775, "global_step": 17884, "epoch": 150, "lr": 8.588395135679948e-05} +{"train_loss": 0.007360831368714571, "global_step": 17885, "epoch": 150, "lr": 8.588240849816542e-05} +{"train_loss": 0.008282407186925411, "global_step": 17886, "epoch": 150, "lr": 8.588086556908007e-05} +{"train_loss": 0.0055958544835448265, "global_step": 17887, "epoch": 150, "lr": 8.587932256954647e-05} +{"train_loss": 0.008665530011057854, "global_step": 17888, "epoch": 150, "lr": 8.587777949956768e-05} +{"train_loss": 0.005933274049311876, "global_step": 17889, "epoch": 150, "lr": 8.587623635914668e-05} +{"train_loss": 0.007914403453469276, "global_step": 17890, "epoch": 150, "lr": 8.587469314828651e-05} +{"train_loss": 0.005753223318606615, "global_step": 17891, "epoch": 150, "lr": 8.587314986699025e-05} +{"train_loss": 0.004384265281260014, "global_step": 17892, "epoch": 150, "lr": 8.587160651526086e-05} +{"train_loss": 0.0046221972443163395, "global_step": 17893, "epoch": 150, "lr": 8.587006309310141e-05} +{"train_loss": 0.005810888018459082, "global_step": 17894, "epoch": 150, "lr": 8.586851960051494e-05} +{"train_loss": 0.007521428633481264, "global_step": 17895, "epoch": 150, "lr": 8.586697603750445e-05} +{"train_loss": 0.005931363441050053, "global_step": 17896, "epoch": 150, "lr": 8.586543240407299e-05} +{"train_loss": 0.006938875187188387, "global_step": 17897, "epoch": 150, "lr": 8.586388870022357e-05} +{"train_loss": 0.009394818916916847, "global_step": 17898, "epoch": 150, "lr": 8.586234492595925e-05} +{"train_loss": 0.0059472196735441685, "global_step": 17899, "epoch": 150, "lr": 8.586080108128304e-05} +{"train_loss": 0.008149235509335995, "global_step": 17900, "epoch": 150, "lr": 8.585925716619798e-05} +{"train_loss": 0.008875105530023575, "global_step": 17901, "epoch": 150, "lr": 8.58577131807071e-05} +{"train_loss": 0.00871127750724554, "global_step": 17902, "epoch": 150, "lr": 8.585616912481345e-05} +{"train_loss": 0.005360041279345751, "global_step": 17903, "epoch": 150, "lr": 8.585462499852001e-05} +{"train_loss": 0.006945135537534952, "global_step": 17904, "epoch": 150, "lr": 8.585308080182986e-05} +{"train_loss": 0.008008995093405247, "global_step": 17905, "epoch": 150, "lr": 8.585153653474602e-05} +{"train_loss": 0.005033639259636402, "global_step": 17906, "epoch": 150, "lr": 8.584999219727152e-05} +{"train_loss": 0.005712045356631279, "global_step": 17907, "epoch": 150, "lr": 8.584844778940938e-05} +{"train_loss": 0.006762128788977861, "global_step": 17908, "epoch": 150, "lr": 8.584690331116265e-05} +{"train_loss": 0.004827212076634169, "global_step": 17909, "epoch": 150, "lr": 8.584535876253434e-05} +{"train_loss": 0.008153969421982765, "global_step": 17910, "epoch": 150, "lr": 8.584381414352751e-05} +{"train_loss": 0.005925411358475685, "global_step": 17911, "epoch": 150, "lr": 8.584226945414519e-05} +{"train_loss": 0.004678499884903431, "global_step": 17912, "epoch": 150, "lr": 8.58407246943904e-05} +{"train_loss": 0.005363169126212597, "global_step": 17913, "epoch": 150, "lr": 8.583917986426617e-05} +{"train_loss": 0.005483703222125769, "global_step": 17914, "epoch": 150, "lr": 8.583763496377553e-05} +{"train_loss": 0.005417088512331247, "global_step": 17915, "epoch": 150, "lr": 8.583608999292153e-05} +{"train_loss": 0.00977269932627678, "global_step": 17916, "epoch": 150, "lr": 8.583454495170719e-05} +{"train_loss": 0.004842571914196014, "global_step": 17917, "epoch": 150, "lr": 8.583299984013556e-05} +{"train_loss": 0.00519576808437705, "global_step": 17918, "epoch": 150, "lr": 8.583145465820967e-05} +{"train_loss": 0.004583438392728567, "global_step": 17919, "epoch": 150, "lr": 8.582990940593252e-05} +{"train_loss": 0.009097552858293056, "global_step": 17920, "epoch": 150, "lr": 8.582836408330718e-05} +{"train_loss": 0.0064438520930707455, "global_step": 17921, "epoch": 150, "lr": 8.58268186903367e-05} +{"train_loss": 0.0033016756642609835, "global_step": 17922, "epoch": 150, "lr": 8.582527322702407e-05} +{"train_loss": 0.0068109771236777306, "global_step": 17923, "epoch": 150, "lr": 8.582372769337235e-05} +{"train_loss": 0.007425694726407528, "global_step": 17924, "epoch": 150, "lr": 8.582218208938455e-05} +{"train_loss": 0.006579077802598476, "global_step": 17925, "epoch": 150, "lr": 8.582063641506374e-05} +{"train_loss": 0.00437988480553031, "global_step": 17926, "epoch": 150, "lr": 8.581909067041292e-05} +{"train_loss": 0.00803905725479126, "global_step": 17927, "epoch": 150, "lr": 8.581754485543517e-05} +{"train_loss": 0.005376189481467009, "global_step": 17928, "epoch": 150, "lr": 8.581599897013348e-05} +{"train_loss": 0.004639160819351673, "global_step": 17929, "epoch": 150, "lr": 8.58144530145109e-05} +{"train_loss": 0.006535595282912254, "global_step": 17930, "epoch": 150, "lr": 8.581290698857047e-05} +{"train_loss": 0.0067041837610304356, "global_step": 17931, "epoch": 150, "lr": 8.581136089231523e-05} +{"train_loss": 0.006276054307818413, "global_step": 17932, "epoch": 150, "lr": 8.580981472574819e-05} +{"train_loss": 0.00412409845739603, "global_step": 17933, "epoch": 150, "lr": 8.580826848887243e-05} +{"train_loss": 0.006083332933485508, "global_step": 17934, "epoch": 150, "lr": 8.580672218169095e-05} +{"train_loss": 0.003175396705046296, "global_step": 17935, "epoch": 150, "lr": 8.58051758042068e-05} +{"train_loss": 0.005687060300260782, "global_step": 17936, "epoch": 150, "lr": 8.580362935642299e-05} +{"train_loss": 0.006539986934512854, "global_step": 17937, "epoch": 150, "lr": 8.580208283834259e-05} +{"train_loss": 0.006245438475161791, "global_step": 17938, "epoch": 150, "lr": 8.580053624996865e-05} +{"train_loss": 0.004881280940026045, "global_step": 17939, "epoch": 150, "lr": 8.579898959130415e-05} +{"train_loss": 0.005185609217733145, "global_step": 17940, "epoch": 150, "lr": 8.579744286235216e-05} +{"train_loss": 0.006294450256973505, "global_step": 17941, "epoch": 150, "lr": 8.579589606311573e-05} +{"train_loss": 0.006854066159576178, "global_step": 17942, "epoch": 150, "lr": 8.579434919359789e-05} +{"train_loss": 0.004337586462497711, "global_step": 17943, "epoch": 150, "lr": 8.579280225380165e-05} +{"train_loss": 0.008933654054999352, "global_step": 17944, "epoch": 150, "lr": 8.579125524373009e-05} +{"train_loss": 0.004467396065592766, "global_step": 17945, "epoch": 150, "lr": 8.578970816338621e-05} +{"train_loss": 0.007337798364460468, "global_step": 17946, "epoch": 150, "lr": 8.578816101277305e-05} +{"train_loss": 0.005127323791384697, "global_step": 17947, "epoch": 150, "lr": 8.578661379189366e-05} +{"train_loss": 0.007545365020632744, "global_step": 17948, "epoch": 150, "lr": 8.578506650075109e-05} +{"train_loss": 0.006147335283458233, "global_step": 17949, "epoch": 150, "lr": 8.578351913934837e-05} +{"train_loss": 0.007198513951152563, "global_step": 17950, "epoch": 150, "lr": 8.578197170768853e-05} +{"train_loss": 0.005058960523456335, "global_step": 17951, "epoch": 150, "lr": 8.57804242057746e-05} +{"train_loss": 0.003996580373495817, "global_step": 17952, "epoch": 150, "lr": 8.577887663360963e-05} +{"train_loss": 0.005444787908345461, "global_step": 17953, "epoch": 150, "lr": 8.577732899119666e-05} +{"train_loss": 0.005963315721601248, "global_step": 17954, "epoch": 150, "lr": 8.577578127853874e-05} +{"train_loss": 0.00666957488283515, "global_step": 17955, "epoch": 150, "lr": 8.577423349563889e-05} +{"train_loss": 0.005302584730088711, "global_step": 17956, "epoch": 150, "lr": 8.577268564250014e-05} +{"train_loss": 0.01118437759578228, "global_step": 17957, "epoch": 150, "lr": 8.577113771912556e-05} +{"train_loss": 0.003895436180755496, "global_step": 17958, "epoch": 150, "lr": 8.576958972551816e-05} +{"train_loss": 0.004486382938921452, "global_step": 17959, "epoch": 150, "lr": 8.576804166168099e-05} +{"train_loss": 0.005195994861423969, "global_step": 17960, "epoch": 150, "lr": 8.576649352761712e-05} +{"train_loss": 0.0061409990303218365, "global_step": 17961, "epoch": 150, "lr": 8.576494532332953e-05} +{"train_loss": 0.007568450178951025, "global_step": 17962, "epoch": 150, "lr": 8.576339704882131e-05} +{"train_loss": 0.003915883135050535, "global_step": 17963, "epoch": 150, "lr": 8.576184870409547e-05} +{"train_loss": 0.0035994439385831356, "global_step": 17964, "epoch": 150, "lr": 8.576030028915507e-05} +{"train_loss": 0.003082908922806382, "global_step": 17965, "epoch": 150, "lr": 8.575875180400313e-05} +{"train_loss": 0.010595576837658882, "global_step": 17966, "epoch": 150, "lr": 8.575720324864271e-05} +{"train_loss": 0.006382466293871403, "global_step": 17967, "epoch": 150, "lr": 8.575565462307684e-05} +{"train_loss": 0.006138121822708044, "global_step": 17968, "epoch": 150, "lr": 8.575410592730854e-05, "val_loss": 0.016003888100385666, "train_action_mse_error": 0.0001613156491657719} +{"train_loss": 0.006083368323743343, "global_step": 17969, "epoch": 151, "lr": 8.575255716134091e-05} +{"train_loss": 0.004762405063956976, "global_step": 17970, "epoch": 151, "lr": 8.575100832517693e-05} +{"train_loss": 0.004528351128101349, "global_step": 17971, "epoch": 151, "lr": 8.574945941881967e-05} +{"train_loss": 0.009788574650883675, "global_step": 17972, "epoch": 151, "lr": 8.574791044227217e-05} +{"train_loss": 0.0035371885169297457, "global_step": 17973, "epoch": 151, "lr": 8.574636139553745e-05} +{"train_loss": 0.008125427179038525, "global_step": 17974, "epoch": 151, "lr": 8.574481227861859e-05} +{"train_loss": 0.004495496395975351, "global_step": 17975, "epoch": 151, "lr": 8.57432630915186e-05} +{"train_loss": 0.004495651926845312, "global_step": 17976, "epoch": 151, "lr": 8.574171383424053e-05} +{"train_loss": 0.00750434584915638, "global_step": 17977, "epoch": 151, "lr": 8.574016450678743e-05} +{"train_loss": 0.006515056826174259, "global_step": 17978, "epoch": 151, "lr": 8.573861510916232e-05} +{"train_loss": 0.003102558897808194, "global_step": 17979, "epoch": 151, "lr": 8.573706564136827e-05} +{"train_loss": 0.006461380980908871, "global_step": 17980, "epoch": 151, "lr": 8.57355161034083e-05} +{"train_loss": 0.006639222148805857, "global_step": 17981, "epoch": 151, "lr": 8.573396649528548e-05} +{"train_loss": 0.005661024246364832, "global_step": 17982, "epoch": 151, "lr": 8.573241681700283e-05} +{"train_loss": 0.005228848662227392, "global_step": 17983, "epoch": 151, "lr": 8.573086706856339e-05} +{"train_loss": 0.0061998991295695305, "global_step": 17984, "epoch": 151, "lr": 8.572931724997021e-05} +{"train_loss": 0.00581163726747036, "global_step": 17985, "epoch": 151, "lr": 8.572776736122635e-05} +{"train_loss": 0.008552796207368374, "global_step": 17986, "epoch": 151, "lr": 8.57262174023348e-05} +{"train_loss": 0.005490222480148077, "global_step": 17987, "epoch": 151, "lr": 8.572466737329867e-05} +{"train_loss": 0.004176832269877195, "global_step": 17988, "epoch": 151, "lr": 8.572311727412095e-05} +{"train_loss": 0.0069906883873045444, "global_step": 17989, "epoch": 151, "lr": 8.572156710480473e-05} +{"train_loss": 0.005805992055684328, "global_step": 17990, "epoch": 151, "lr": 8.5720016865353e-05} +{"train_loss": 0.0047874441370368, "global_step": 17991, "epoch": 151, "lr": 8.571846655576885e-05} +{"train_loss": 0.0059447502717375755, "global_step": 17992, "epoch": 151, "lr": 8.57169161760553e-05} +{"train_loss": 0.004975949879735708, "global_step": 17993, "epoch": 151, "lr": 8.571536572621541e-05} +{"train_loss": 0.0056253718212246895, "global_step": 17994, "epoch": 151, "lr": 8.571381520625222e-05} +{"train_loss": 0.005809724796563387, "global_step": 17995, "epoch": 151, "lr": 8.571226461616876e-05} +{"train_loss": 0.007925104349851608, "global_step": 17996, "epoch": 151, "lr": 8.571071395596808e-05} +{"train_loss": 0.004459584131836891, "global_step": 17997, "epoch": 151, "lr": 8.570916322565324e-05} +{"train_loss": 0.004279370419681072, "global_step": 17998, "epoch": 151, "lr": 8.570761242522726e-05} +{"train_loss": 0.00680018262937665, "global_step": 17999, "epoch": 151, "lr": 8.57060615546932e-05} +{"train_loss": 0.006697417702525854, "global_step": 18000, "epoch": 151, "lr": 8.57045106140541e-05} +{"train_loss": 0.00916130281984806, "global_step": 18001, "epoch": 151, "lr": 8.570295960331303e-05} +{"train_loss": 0.005292421672493219, "global_step": 18002, "epoch": 151, "lr": 8.5701408522473e-05} +{"train_loss": 0.00554308108985424, "global_step": 18003, "epoch": 151, "lr": 8.569985737153705e-05} +{"train_loss": 0.006068470422178507, "global_step": 18004, "epoch": 151, "lr": 8.569830615050827e-05} +{"train_loss": 0.006116051692515612, "global_step": 18005, "epoch": 151, "lr": 8.569675485938966e-05} +{"train_loss": 0.009893628768622875, "global_step": 18006, "epoch": 151, "lr": 8.56952034981843e-05} +{"train_loss": 0.00525688799098134, "global_step": 18007, "epoch": 151, "lr": 8.569365206689521e-05} +{"train_loss": 0.0059800343587994576, "global_step": 18008, "epoch": 151, "lr": 8.569210056552546e-05} +{"train_loss": 0.006373671814799309, "global_step": 18009, "epoch": 151, "lr": 8.569054899407806e-05} +{"train_loss": 0.006491419859230518, "global_step": 18010, "epoch": 151, "lr": 8.568899735255612e-05} +{"train_loss": 0.005531833972781897, "global_step": 18011, "epoch": 151, "lr": 8.568744564096262e-05} +{"train_loss": 0.006093040574342012, "global_step": 18012, "epoch": 151, "lr": 8.568589385930064e-05} +{"train_loss": 0.004907766357064247, "global_step": 18013, "epoch": 151, "lr": 8.568434200757321e-05} +{"train_loss": 0.004945168737322092, "global_step": 18014, "epoch": 151, "lr": 8.568279008578339e-05} +{"train_loss": 0.006443896796554327, "global_step": 18015, "epoch": 151, "lr": 8.568123809393423e-05} +{"train_loss": 0.0044609843753278255, "global_step": 18016, "epoch": 151, "lr": 8.567968603202876e-05} +{"train_loss": 0.008942042477428913, "global_step": 18017, "epoch": 151, "lr": 8.567813390007004e-05} +{"train_loss": 0.005907590035349131, "global_step": 18018, "epoch": 151, "lr": 8.567658169806114e-05} +{"train_loss": 0.006005688104778528, "global_step": 18019, "epoch": 151, "lr": 8.567502942600507e-05} +{"train_loss": 0.007284507155418396, "global_step": 18020, "epoch": 151, "lr": 8.567347708390487e-05} +{"train_loss": 0.0037549789994955063, "global_step": 18021, "epoch": 151, "lr": 8.567192467176364e-05} +{"train_loss": 0.007165377959609032, "global_step": 18022, "epoch": 151, "lr": 8.567037218958438e-05} +{"train_loss": 0.006850117351859808, "global_step": 18023, "epoch": 151, "lr": 8.566881963737015e-05} +{"train_loss": 0.007022743113338947, "global_step": 18024, "epoch": 151, "lr": 8.566726701512402e-05} +{"train_loss": 0.0035597640089690685, "global_step": 18025, "epoch": 151, "lr": 8.5665714322849e-05} +{"train_loss": 0.004992453847080469, "global_step": 18026, "epoch": 151, "lr": 8.566416156054817e-05} +{"train_loss": 0.004883868619799614, "global_step": 18027, "epoch": 151, "lr": 8.566260872822459e-05} +{"train_loss": 0.0058060395531356335, "global_step": 18028, "epoch": 151, "lr": 8.566105582588126e-05} +{"train_loss": 0.007117139641195536, "global_step": 18029, "epoch": 151, "lr": 8.565950285352126e-05} +{"train_loss": 0.005431576166301966, "global_step": 18030, "epoch": 151, "lr": 8.565794981114766e-05} +{"train_loss": 0.005826731212437153, "global_step": 18031, "epoch": 151, "lr": 8.565639669876345e-05} +{"train_loss": 0.0046545835211873055, "global_step": 18032, "epoch": 151, "lr": 8.565484351637175e-05} +{"train_loss": 0.008688697591423988, "global_step": 18033, "epoch": 151, "lr": 8.565329026397555e-05} +{"train_loss": 0.006578843574970961, "global_step": 18034, "epoch": 151, "lr": 8.565173694157792e-05} +{"train_loss": 0.004887512419372797, "global_step": 18035, "epoch": 151, "lr": 8.565018354918192e-05} +{"train_loss": 0.005748285911977291, "global_step": 18036, "epoch": 151, "lr": 8.564863008679061e-05} +{"train_loss": 0.0036826313007622957, "global_step": 18037, "epoch": 151, "lr": 8.564707655440701e-05} +{"train_loss": 0.007002671714872122, "global_step": 18038, "epoch": 151, "lr": 8.564552295203416e-05} +{"train_loss": 0.006842814851552248, "global_step": 18039, "epoch": 151, "lr": 8.564396927967518e-05} +{"train_loss": 0.007954934611916542, "global_step": 18040, "epoch": 151, "lr": 8.564241553733304e-05} +{"train_loss": 0.004587436094880104, "global_step": 18041, "epoch": 151, "lr": 8.564086172501083e-05} +{"train_loss": 0.005112428218126297, "global_step": 18042, "epoch": 151, "lr": 8.56393078427116e-05} +{"train_loss": 0.009732149541378021, "global_step": 18043, "epoch": 151, "lr": 8.56377538904384e-05} +{"train_loss": 0.007712779566645622, "global_step": 18044, "epoch": 151, "lr": 8.563619986819428e-05} +{"train_loss": 0.005840853322297335, "global_step": 18045, "epoch": 151, "lr": 8.563464577598228e-05} +{"train_loss": 0.005786885507404804, "global_step": 18046, "epoch": 151, "lr": 8.563309161380546e-05} +{"train_loss": 0.004924078471958637, "global_step": 18047, "epoch": 151, "lr": 8.563153738166688e-05} +{"train_loss": 0.006903873290866613, "global_step": 18048, "epoch": 151, "lr": 8.562998307956958e-05} +{"train_loss": 0.0038267243653535843, "global_step": 18049, "epoch": 151, "lr": 8.562842870751662e-05} +{"train_loss": 0.007881156168878078, "global_step": 18050, "epoch": 151, "lr": 8.562687426551104e-05} +{"train_loss": 0.007329726126044989, "global_step": 18051, "epoch": 151, "lr": 8.562531975355589e-05} +{"train_loss": 0.008075742982327938, "global_step": 18052, "epoch": 151, "lr": 8.562376517165424e-05} +{"train_loss": 0.005180001258850098, "global_step": 18053, "epoch": 151, "lr": 8.562221051980913e-05} +{"train_loss": 0.005152358673512936, "global_step": 18054, "epoch": 151, "lr": 8.562065579802362e-05} +{"train_loss": 0.0035734721459448338, "global_step": 18055, "epoch": 151, "lr": 8.561910100630074e-05} +{"train_loss": 0.008779428899288177, "global_step": 18056, "epoch": 151, "lr": 8.561754614464359e-05} +{"train_loss": 0.0072353375144302845, "global_step": 18057, "epoch": 151, "lr": 8.561599121305518e-05} +{"train_loss": 0.004646231420338154, "global_step": 18058, "epoch": 151, "lr": 8.561443621153857e-05} +{"train_loss": 0.005719324573874474, "global_step": 18059, "epoch": 151, "lr": 8.561288114009682e-05} +{"train_loss": 0.004850930534303188, "global_step": 18060, "epoch": 151, "lr": 8.561132599873299e-05} +{"train_loss": 0.008618171326816082, "global_step": 18061, "epoch": 151, "lr": 8.560977078745013e-05} +{"train_loss": 0.006706446874886751, "global_step": 18062, "epoch": 151, "lr": 8.560821550625128e-05} +{"train_loss": 0.003866089042276144, "global_step": 18063, "epoch": 151, "lr": 8.56066601551395e-05} +{"train_loss": 0.005409227218478918, "global_step": 18064, "epoch": 151, "lr": 8.560510473411785e-05} +{"train_loss": 0.007674552965909243, "global_step": 18065, "epoch": 151, "lr": 8.560354924318938e-05} +{"train_loss": 0.0037806499749422073, "global_step": 18066, "epoch": 151, "lr": 8.560199368235715e-05} +{"train_loss": 0.007104078307747841, "global_step": 18067, "epoch": 151, "lr": 8.560043805162421e-05} +{"train_loss": 0.006069857161492109, "global_step": 18068, "epoch": 151, "lr": 8.559888235099361e-05} +{"train_loss": 0.0033997753635048866, "global_step": 18069, "epoch": 151, "lr": 8.559732658046841e-05} +{"train_loss": 0.00812975037842989, "global_step": 18070, "epoch": 151, "lr": 8.559577074005167e-05} +{"train_loss": 0.006216572131961584, "global_step": 18071, "epoch": 151, "lr": 8.559421482974641e-05} +{"train_loss": 0.0038707826752215624, "global_step": 18072, "epoch": 151, "lr": 8.559265884955574e-05} +{"train_loss": 0.006068631540983915, "global_step": 18073, "epoch": 151, "lr": 8.559110279948267e-05} +{"train_loss": 0.00519418902695179, "global_step": 18074, "epoch": 151, "lr": 8.558954667953028e-05} +{"train_loss": 0.005340637173503637, "global_step": 18075, "epoch": 151, "lr": 8.55879904897016e-05} +{"train_loss": 0.005955844186246395, "global_step": 18076, "epoch": 151, "lr": 8.558643422999974e-05} +{"train_loss": 0.005866246297955513, "global_step": 18077, "epoch": 151, "lr": 8.558487790042769e-05} +{"train_loss": 0.00752445962280035, "global_step": 18078, "epoch": 151, "lr": 8.558332150098853e-05} +{"train_loss": 0.005207138601690531, "global_step": 18079, "epoch": 151, "lr": 8.558176503168533e-05} +{"train_loss": 0.004137267824262381, "global_step": 18080, "epoch": 151, "lr": 8.558020849252114e-05} +{"train_loss": 0.006986088119447231, "global_step": 18081, "epoch": 151, "lr": 8.5578651883499e-05} +{"train_loss": 0.003834337927401066, "global_step": 18082, "epoch": 151, "lr": 8.557709520462199e-05} +{"train_loss": 0.003983843140304089, "global_step": 18083, "epoch": 151, "lr": 8.557553845589315e-05} +{"train_loss": 0.0037460403982549906, "global_step": 18084, "epoch": 151, "lr": 8.557398163731553e-05} +{"train_loss": 0.0048134056851267815, "global_step": 18085, "epoch": 151, "lr": 8.557242474889223e-05} +{"train_loss": 0.008739291690289974, "global_step": 18086, "epoch": 151, "lr": 8.557086779062625e-05} +{"train_loss": 0.005952371165015492, "global_step": 18087, "epoch": 151, "lr": 8.556931076252066e-05, "val_loss": 0.017675727605819702} +{"train_loss": 0.005223322194069624, "global_step": 18088, "epoch": 152, "lr": 8.556775366457854e-05} +{"train_loss": 0.007889644242823124, "global_step": 18089, "epoch": 152, "lr": 8.556619649680295e-05} +{"train_loss": 0.005458008963614702, "global_step": 18090, "epoch": 152, "lr": 8.556463925919691e-05} +{"train_loss": 0.005311253946274519, "global_step": 18091, "epoch": 152, "lr": 8.556308195176353e-05} +{"train_loss": 0.005339449737221003, "global_step": 18092, "epoch": 152, "lr": 8.55615245745058e-05} +{"train_loss": 0.0064580622129142284, "global_step": 18093, "epoch": 152, "lr": 8.555996712742685e-05} +{"train_loss": 0.007481754291802645, "global_step": 18094, "epoch": 152, "lr": 8.555840961052968e-05} +{"train_loss": 0.005017551127821207, "global_step": 18095, "epoch": 152, "lr": 8.555685202381738e-05} +{"train_loss": 0.007670082617551088, "global_step": 18096, "epoch": 152, "lr": 8.5555294367293e-05} +{"train_loss": 0.008089575916528702, "global_step": 18097, "epoch": 152, "lr": 8.555373664095957e-05} +{"train_loss": 0.00489850202575326, "global_step": 18098, "epoch": 152, "lr": 8.555217884482023e-05} +{"train_loss": 0.007692976854741573, "global_step": 18099, "epoch": 152, "lr": 8.555062097887796e-05} +{"train_loss": 0.006203118246048689, "global_step": 18100, "epoch": 152, "lr": 8.554906304313583e-05} +{"train_loss": 0.007851514965295792, "global_step": 18101, "epoch": 152, "lr": 8.554750503759693e-05} +{"train_loss": 0.005646917503327131, "global_step": 18102, "epoch": 152, "lr": 8.55459469622643e-05} +{"train_loss": 0.0038272917736321688, "global_step": 18103, "epoch": 152, "lr": 8.554438881714099e-05} +{"train_loss": 0.004531961865723133, "global_step": 18104, "epoch": 152, "lr": 8.554283060223008e-05} +{"train_loss": 0.005335716530680656, "global_step": 18105, "epoch": 152, "lr": 8.554127231753461e-05} +{"train_loss": 0.00820302963256836, "global_step": 18106, "epoch": 152, "lr": 8.553971396305767e-05} +{"train_loss": 0.007219844963401556, "global_step": 18107, "epoch": 152, "lr": 8.553815553880228e-05} +{"train_loss": 0.006000156048685312, "global_step": 18108, "epoch": 152, "lr": 8.553659704477152e-05} +{"train_loss": 0.0064324974082410336, "global_step": 18109, "epoch": 152, "lr": 8.553503848096844e-05} +{"train_loss": 0.005253927316516638, "global_step": 18110, "epoch": 152, "lr": 8.553347984739612e-05} +{"train_loss": 0.00533481827005744, "global_step": 18111, "epoch": 152, "lr": 8.553192114405761e-05} +{"train_loss": 0.005603388417512178, "global_step": 18112, "epoch": 152, "lr": 8.553036237095597e-05} +{"train_loss": 0.005888568703085184, "global_step": 18113, "epoch": 152, "lr": 8.552880352809425e-05} +{"train_loss": 0.005637316964566708, "global_step": 18114, "epoch": 152, "lr": 8.552724461547552e-05} +{"train_loss": 0.006453422829508781, "global_step": 18115, "epoch": 152, "lr": 8.552568563310286e-05} +{"train_loss": 0.005561294034123421, "global_step": 18116, "epoch": 152, "lr": 8.55241265809793e-05} +{"train_loss": 0.005929642356932163, "global_step": 18117, "epoch": 152, "lr": 8.55225674591079e-05} +{"train_loss": 0.007050611078739166, "global_step": 18118, "epoch": 152, "lr": 8.552100826749174e-05} +{"train_loss": 0.005411503370851278, "global_step": 18119, "epoch": 152, "lr": 8.551944900613389e-05} +{"train_loss": 0.005010650958865881, "global_step": 18120, "epoch": 152, "lr": 8.551788967503738e-05} +{"train_loss": 0.0036497090477496386, "global_step": 18121, "epoch": 152, "lr": 8.55163302742053e-05} +{"train_loss": 0.008844678290188313, "global_step": 18122, "epoch": 152, "lr": 8.551477080364069e-05} +{"train_loss": 0.004724153783172369, "global_step": 18123, "epoch": 152, "lr": 8.551321126334663e-05} +{"train_loss": 0.005445971619337797, "global_step": 18124, "epoch": 152, "lr": 8.551165165332616e-05} +{"train_loss": 0.0038989372551441193, "global_step": 18125, "epoch": 152, "lr": 8.551009197358237e-05} +{"train_loss": 0.002871330361813307, "global_step": 18126, "epoch": 152, "lr": 8.55085322241183e-05} +{"train_loss": 0.006574542727321386, "global_step": 18127, "epoch": 152, "lr": 8.550697240493703e-05} +{"train_loss": 0.008650017902255058, "global_step": 18128, "epoch": 152, "lr": 8.55054125160416e-05} +{"train_loss": 0.0055052791722118855, "global_step": 18129, "epoch": 152, "lr": 8.550385255743509e-05} +{"train_loss": 0.006164649035781622, "global_step": 18130, "epoch": 152, "lr": 8.550229252912056e-05} +{"train_loss": 0.0064495098777115345, "global_step": 18131, "epoch": 152, "lr": 8.550073243110108e-05} +{"train_loss": 0.006266895215958357, "global_step": 18132, "epoch": 152, "lr": 8.549917226337968e-05} +{"train_loss": 0.006423492915928364, "global_step": 18133, "epoch": 152, "lr": 8.549761202595948e-05} +{"train_loss": 0.0048936824314296246, "global_step": 18134, "epoch": 152, "lr": 8.549605171884349e-05} +{"train_loss": 0.004325260873883963, "global_step": 18135, "epoch": 152, "lr": 8.549449134203481e-05} +{"train_loss": 0.0060663651674985886, "global_step": 18136, "epoch": 152, "lr": 8.549293089553648e-05} +{"train_loss": 0.005854628048837185, "global_step": 18137, "epoch": 152, "lr": 8.549137037935156e-05} +{"train_loss": 0.004542342387139797, "global_step": 18138, "epoch": 152, "lr": 8.548980979348315e-05} +{"train_loss": 0.003967340104281902, "global_step": 18139, "epoch": 152, "lr": 8.548824913793427e-05} +{"train_loss": 0.006417617667466402, "global_step": 18140, "epoch": 152, "lr": 8.548668841270801e-05} +{"train_loss": 0.00540809566155076, "global_step": 18141, "epoch": 152, "lr": 8.548512761780742e-05} +{"train_loss": 0.0058052996173501015, "global_step": 18142, "epoch": 152, "lr": 8.548356675323559e-05} +{"train_loss": 0.008179737254977226, "global_step": 18143, "epoch": 152, "lr": 8.548200581899557e-05} +{"train_loss": 0.0061204093508422375, "global_step": 18144, "epoch": 152, "lr": 8.548044481509042e-05} +{"train_loss": 0.0044202860444784164, "global_step": 18145, "epoch": 152, "lr": 8.547888374152318e-05} +{"train_loss": 0.00604196498170495, "global_step": 18146, "epoch": 152, "lr": 8.547732259829696e-05} +{"train_loss": 0.010124540887773037, "global_step": 18147, "epoch": 152, "lr": 8.547576138541482e-05} +{"train_loss": 0.004339832346886396, "global_step": 18148, "epoch": 152, "lr": 8.547420010287978e-05} +{"train_loss": 0.00624326104298234, "global_step": 18149, "epoch": 152, "lr": 8.547263875069498e-05} +{"train_loss": 0.008025002665817738, "global_step": 18150, "epoch": 152, "lr": 8.547107732886341e-05} +{"train_loss": 0.006526182405650616, "global_step": 18151, "epoch": 152, "lr": 8.546951583738819e-05} +{"train_loss": 0.006658249534666538, "global_step": 18152, "epoch": 152, "lr": 8.546795427627236e-05} +{"train_loss": 0.004809938371181488, "global_step": 18153, "epoch": 152, "lr": 8.546639264551899e-05} +{"train_loss": 0.00410704268142581, "global_step": 18154, "epoch": 152, "lr": 8.546483094513114e-05} +{"train_loss": 0.008981969207525253, "global_step": 18155, "epoch": 152, "lr": 8.546326917511189e-05} +{"train_loss": 0.004712904337793589, "global_step": 18156, "epoch": 152, "lr": 8.546170733546429e-05} +{"train_loss": 0.00543248699977994, "global_step": 18157, "epoch": 152, "lr": 8.546014542619143e-05} +{"train_loss": 0.004869060590863228, "global_step": 18158, "epoch": 152, "lr": 8.545858344729636e-05} +{"train_loss": 0.006656198762357235, "global_step": 18159, "epoch": 152, "lr": 8.545702139878214e-05} +{"train_loss": 0.007266332395374775, "global_step": 18160, "epoch": 152, "lr": 8.545545928065187e-05} +{"train_loss": 0.006141030695289373, "global_step": 18161, "epoch": 152, "lr": 8.545389709290857e-05} +{"train_loss": 0.004112015012651682, "global_step": 18162, "epoch": 152, "lr": 8.545233483555533e-05} +{"train_loss": 0.003582840785384178, "global_step": 18163, "epoch": 152, "lr": 8.545077250859522e-05} +{"train_loss": 0.004813595674932003, "global_step": 18164, "epoch": 152, "lr": 8.54492101120313e-05} +{"train_loss": 0.008639340288937092, "global_step": 18165, "epoch": 152, "lr": 8.544764764586667e-05} +{"train_loss": 0.006872714962810278, "global_step": 18166, "epoch": 152, "lr": 8.544608511010434e-05} +{"train_loss": 0.00476494338363409, "global_step": 18167, "epoch": 152, "lr": 8.544452250474744e-05} +{"train_loss": 0.005401900969445705, "global_step": 18168, "epoch": 152, "lr": 8.5442959829799e-05} +{"train_loss": 0.0054811448790133, "global_step": 18169, "epoch": 152, "lr": 8.544139708526208e-05} +{"train_loss": 0.007086875382810831, "global_step": 18170, "epoch": 152, "lr": 8.543983427113977e-05} +{"train_loss": 0.0064942254684865475, "global_step": 18171, "epoch": 152, "lr": 8.543827138743513e-05} +{"train_loss": 0.004321593791246414, "global_step": 18172, "epoch": 152, "lr": 8.543670843415121e-05} +{"train_loss": 0.009118327870965004, "global_step": 18173, "epoch": 152, "lr": 8.543514541129115e-05} +{"train_loss": 0.0077962614595890045, "global_step": 18174, "epoch": 152, "lr": 8.543358231885792e-05} +{"train_loss": 0.004029723349958658, "global_step": 18175, "epoch": 152, "lr": 8.543201915685466e-05} +{"train_loss": 0.007646390702575445, "global_step": 18176, "epoch": 152, "lr": 8.54304559252844e-05} +{"train_loss": 0.005640791729092598, "global_step": 18177, "epoch": 152, "lr": 8.542889262415024e-05} +{"train_loss": 0.007356422487646341, "global_step": 18178, "epoch": 152, "lr": 8.542732925345522e-05} +{"train_loss": 0.007599166128784418, "global_step": 18179, "epoch": 152, "lr": 8.542576581320243e-05} +{"train_loss": 0.005848097614943981, "global_step": 18180, "epoch": 152, "lr": 8.542420230339494e-05} +{"train_loss": 0.004692206624895334, "global_step": 18181, "epoch": 152, "lr": 8.54226387240358e-05} +{"train_loss": 0.007047050166875124, "global_step": 18182, "epoch": 152, "lr": 8.542107507512812e-05} +{"train_loss": 0.005357122048735619, "global_step": 18183, "epoch": 152, "lr": 8.541951135667492e-05} +{"train_loss": 0.005969373043626547, "global_step": 18184, "epoch": 152, "lr": 8.54179475686793e-05} +{"train_loss": 0.005763291381299496, "global_step": 18185, "epoch": 152, "lr": 8.541638371114433e-05} +{"train_loss": 0.005997323896735907, "global_step": 18186, "epoch": 152, "lr": 8.541481978407307e-05} +{"train_loss": 0.006442433688789606, "global_step": 18187, "epoch": 152, "lr": 8.541325578746859e-05} +{"train_loss": 0.006719847675412893, "global_step": 18188, "epoch": 152, "lr": 8.541169172133397e-05} +{"train_loss": 0.00924629159271717, "global_step": 18189, "epoch": 152, "lr": 8.541012758567226e-05} +{"train_loss": 0.004308296367526054, "global_step": 18190, "epoch": 152, "lr": 8.540856338048656e-05} +{"train_loss": 0.006052720360457897, "global_step": 18191, "epoch": 152, "lr": 8.540699910577994e-05} +{"train_loss": 0.005625539924949408, "global_step": 18192, "epoch": 152, "lr": 8.540543476155545e-05} +{"train_loss": 0.0030964782927185297, "global_step": 18193, "epoch": 152, "lr": 8.540387034781617e-05} +{"train_loss": 0.0035704001784324646, "global_step": 18194, "epoch": 152, "lr": 8.540230586456517e-05} +{"train_loss": 0.006175644230097532, "global_step": 18195, "epoch": 152, "lr": 8.540074131180554e-05} +{"train_loss": 0.0041953083127737045, "global_step": 18196, "epoch": 152, "lr": 8.539917668954032e-05} +{"train_loss": 0.006214772816747427, "global_step": 18197, "epoch": 152, "lr": 8.539761199777259e-05} +{"train_loss": 0.005693709943443537, "global_step": 18198, "epoch": 152, "lr": 8.539604723650544e-05} +{"train_loss": 0.006744483485817909, "global_step": 18199, "epoch": 152, "lr": 8.539448240574194e-05} +{"train_loss": 0.00674755172803998, "global_step": 18200, "epoch": 152, "lr": 8.539291750548517e-05} +{"train_loss": 0.006342699751257896, "global_step": 18201, "epoch": 152, "lr": 8.539135253573817e-05} +{"train_loss": 0.005848592147231102, "global_step": 18202, "epoch": 152, "lr": 8.538978749650402e-05} +{"train_loss": 0.01026896107941866, "global_step": 18203, "epoch": 152, "lr": 8.538822238778582e-05} +{"train_loss": 0.004150120075792074, "global_step": 18204, "epoch": 152, "lr": 8.538665720958662e-05} +{"train_loss": 0.007670299615710974, "global_step": 18205, "epoch": 152, "lr": 8.538509196190949e-05} +{"train_loss": 0.006009108302801722, "global_step": 18206, "epoch": 152, "lr": 8.538352664475753e-05, "val_loss": 0.012686053290963173} +{"train_loss": 0.007746141403913498, "global_step": 18207, "epoch": 153, "lr": 8.538196125813378e-05} +{"train_loss": 0.008009525015950203, "global_step": 18208, "epoch": 153, "lr": 8.538039580204134e-05} +{"train_loss": 0.0047126947902143, "global_step": 18209, "epoch": 153, "lr": 8.537883027648326e-05} +{"train_loss": 0.0037827969063073397, "global_step": 18210, "epoch": 153, "lr": 8.537726468146264e-05} +{"train_loss": 0.004216314759105444, "global_step": 18211, "epoch": 153, "lr": 8.537569901698255e-05} +{"train_loss": 0.005583957303315401, "global_step": 18212, "epoch": 153, "lr": 8.537413328304602e-05} +{"train_loss": 0.004502926953136921, "global_step": 18213, "epoch": 153, "lr": 8.537256747965618e-05} +{"train_loss": 0.005921666976064444, "global_step": 18214, "epoch": 153, "lr": 8.537100160681609e-05} +{"train_loss": 0.008066504262387753, "global_step": 18215, "epoch": 153, "lr": 8.53694356645288e-05} +{"train_loss": 0.007925828918814659, "global_step": 18216, "epoch": 153, "lr": 8.536786965279742e-05} +{"train_loss": 0.006214338820427656, "global_step": 18217, "epoch": 153, "lr": 8.536630357162499e-05} +{"train_loss": 0.004594055004417896, "global_step": 18218, "epoch": 153, "lr": 8.536473742101461e-05} +{"train_loss": 0.004775890614837408, "global_step": 18219, "epoch": 153, "lr": 8.536317120096934e-05} +{"train_loss": 0.005378939677029848, "global_step": 18220, "epoch": 153, "lr": 8.536160491149226e-05} +{"train_loss": 0.005850289948284626, "global_step": 18221, "epoch": 153, "lr": 8.536003855258645e-05} +{"train_loss": 0.005123491864651442, "global_step": 18222, "epoch": 153, "lr": 8.535847212425498e-05} +{"train_loss": 0.005685112439095974, "global_step": 18223, "epoch": 153, "lr": 8.535690562650094e-05} +{"train_loss": 0.003487603971734643, "global_step": 18224, "epoch": 153, "lr": 8.535533905932738e-05} +{"train_loss": 0.004568404518067837, "global_step": 18225, "epoch": 153, "lr": 8.535377242273739e-05} +{"train_loss": 0.006333788391202688, "global_step": 18226, "epoch": 153, "lr": 8.535220571673406e-05} +{"train_loss": 0.004963667131960392, "global_step": 18227, "epoch": 153, "lr": 8.535063894132043e-05} +{"train_loss": 0.0056295800022780895, "global_step": 18228, "epoch": 153, "lr": 8.53490720964996e-05} +{"train_loss": 0.004345544148236513, "global_step": 18229, "epoch": 153, "lr": 8.534750518227466e-05} +{"train_loss": 0.005186931230127811, "global_step": 18230, "epoch": 153, "lr": 8.534593819864864e-05} +{"train_loss": 0.0057455794885754585, "global_step": 18231, "epoch": 153, "lr": 8.534437114562468e-05} +{"train_loss": 0.0042604077607393265, "global_step": 18232, "epoch": 153, "lr": 8.53428040232058e-05} +{"train_loss": 0.00461994856595993, "global_step": 18233, "epoch": 153, "lr": 8.534123683139512e-05} +{"train_loss": 0.006565128453075886, "global_step": 18234, "epoch": 153, "lr": 8.533966957019568e-05} +{"train_loss": 0.004399564582854509, "global_step": 18235, "epoch": 153, "lr": 8.533810223961058e-05} +{"train_loss": 0.0072633493691682816, "global_step": 18236, "epoch": 153, "lr": 8.53365348396429e-05} +{"train_loss": 0.006025098729878664, "global_step": 18237, "epoch": 153, "lr": 8.533496737029569e-05} +{"train_loss": 0.006572081707417965, "global_step": 18238, "epoch": 153, "lr": 8.533339983157206e-05} +{"train_loss": 0.004705903120338917, "global_step": 18239, "epoch": 153, "lr": 8.533183222347507e-05} +{"train_loss": 0.005423090886324644, "global_step": 18240, "epoch": 153, "lr": 8.53302645460078e-05} +{"train_loss": 0.004183081444352865, "global_step": 18241, "epoch": 153, "lr": 8.532869679917334e-05} +{"train_loss": 0.005689211655408144, "global_step": 18242, "epoch": 153, "lr": 8.532712898297476e-05} +{"train_loss": 0.006028617266565561, "global_step": 18243, "epoch": 153, "lr": 8.532556109741511e-05} +{"train_loss": 0.00690540112555027, "global_step": 18244, "epoch": 153, "lr": 8.532399314249753e-05} +{"train_loss": 0.00420455913990736, "global_step": 18245, "epoch": 153, "lr": 8.532242511822504e-05} +{"train_loss": 0.003920307848602533, "global_step": 18246, "epoch": 153, "lr": 8.532085702460076e-05} +{"train_loss": 0.005369706079363823, "global_step": 18247, "epoch": 153, "lr": 8.531928886162773e-05} +{"train_loss": 0.008375180885195732, "global_step": 18248, "epoch": 153, "lr": 8.531772062930906e-05} +{"train_loss": 0.007253427058458328, "global_step": 18249, "epoch": 153, "lr": 8.531615232764782e-05} +{"train_loss": 0.004876341205090284, "global_step": 18250, "epoch": 153, "lr": 8.531458395664709e-05} +{"train_loss": 0.005035816691815853, "global_step": 18251, "epoch": 153, "lr": 8.531301551630992e-05} +{"train_loss": 0.00817684456706047, "global_step": 18252, "epoch": 153, "lr": 8.531144700663945e-05} +{"train_loss": 0.00807963591068983, "global_step": 18253, "epoch": 153, "lr": 8.530987842763871e-05} +{"train_loss": 0.005270048044621944, "global_step": 18254, "epoch": 153, "lr": 8.530830977931081e-05} +{"train_loss": 0.005740839522331953, "global_step": 18255, "epoch": 153, "lr": 8.530674106165881e-05} +{"train_loss": 0.009228885173797607, "global_step": 18256, "epoch": 153, "lr": 8.530517227468578e-05} +{"train_loss": 0.0045791566371917725, "global_step": 18257, "epoch": 153, "lr": 8.530360341839483e-05} +{"train_loss": 0.008736207149922848, "global_step": 18258, "epoch": 153, "lr": 8.530203449278903e-05} +{"train_loss": 0.0033664635848253965, "global_step": 18259, "epoch": 153, "lr": 8.530046549787145e-05} +{"train_loss": 0.010553862899541855, "global_step": 18260, "epoch": 153, "lr": 8.529889643364519e-05} +{"train_loss": 0.010205759666860104, "global_step": 18261, "epoch": 153, "lr": 8.52973273001133e-05} +{"train_loss": 0.006988749839365482, "global_step": 18262, "epoch": 153, "lr": 8.529575809727888e-05} +{"train_loss": 0.005772759206593037, "global_step": 18263, "epoch": 153, "lr": 8.529418882514501e-05} +{"train_loss": 0.005870096851140261, "global_step": 18264, "epoch": 153, "lr": 8.529261948371478e-05} +{"train_loss": 0.004748085979372263, "global_step": 18265, "epoch": 153, "lr": 8.529105007299128e-05} +{"train_loss": 0.007469339296221733, "global_step": 18266, "epoch": 153, "lr": 8.528948059297754e-05} +{"train_loss": 0.003930439241230488, "global_step": 18267, "epoch": 153, "lr": 8.52879110436767e-05} +{"train_loss": 0.00868607684969902, "global_step": 18268, "epoch": 153, "lr": 8.52863414250918e-05} +{"train_loss": 0.008453200571238995, "global_step": 18269, "epoch": 153, "lr": 8.528477173722593e-05} +{"train_loss": 0.007805096451193094, "global_step": 18270, "epoch": 153, "lr": 8.52832019800822e-05} +{"train_loss": 0.006591365672647953, "global_step": 18271, "epoch": 153, "lr": 8.528163215366367e-05} +{"train_loss": 0.0094106150791049, "global_step": 18272, "epoch": 153, "lr": 8.528006225797342e-05} +{"train_loss": 0.005250574089586735, "global_step": 18273, "epoch": 153, "lr": 8.527849229301453e-05} +{"train_loss": 0.011445802636444569, "global_step": 18274, "epoch": 153, "lr": 8.527692225879009e-05} +{"train_loss": 0.003908607177436352, "global_step": 18275, "epoch": 153, "lr": 8.52753521553032e-05} +{"train_loss": 0.006955673918128014, "global_step": 18276, "epoch": 153, "lr": 8.527378198255691e-05} +{"train_loss": 0.008003035560250282, "global_step": 18277, "epoch": 153, "lr": 8.527221174055431e-05} +{"train_loss": 0.010047376155853271, "global_step": 18278, "epoch": 153, "lr": 8.52706414292985e-05} +{"train_loss": 0.007334399037063122, "global_step": 18279, "epoch": 153, "lr": 8.526907104879255e-05} +{"train_loss": 0.005526165943592787, "global_step": 18280, "epoch": 153, "lr": 8.526750059903957e-05} +{"train_loss": 0.007272705435752869, "global_step": 18281, "epoch": 153, "lr": 8.52659300800426e-05} +{"train_loss": 0.005776095204055309, "global_step": 18282, "epoch": 153, "lr": 8.526435949180473e-05} +{"train_loss": 0.005890207830816507, "global_step": 18283, "epoch": 153, "lr": 8.526278883432907e-05} +{"train_loss": 0.006180721800774336, "global_step": 18284, "epoch": 153, "lr": 8.526121810761871e-05} +{"train_loss": 0.008276033215224743, "global_step": 18285, "epoch": 153, "lr": 8.52596473116767e-05} +{"train_loss": 0.006801149807870388, "global_step": 18286, "epoch": 153, "lr": 8.525807644650614e-05} +{"train_loss": 0.007687165401875973, "global_step": 18287, "epoch": 153, "lr": 8.52565055121101e-05} +{"train_loss": 0.004826701711863279, "global_step": 18288, "epoch": 153, "lr": 8.525493450849169e-05} +{"train_loss": 0.007831013761460781, "global_step": 18289, "epoch": 153, "lr": 8.5253363435654e-05} +{"train_loss": 0.005402734503149986, "global_step": 18290, "epoch": 153, "lr": 8.525179229360007e-05} +{"train_loss": 0.006444127764552832, "global_step": 18291, "epoch": 153, "lr": 8.525022108233302e-05} +{"train_loss": 0.004365939646959305, "global_step": 18292, "epoch": 153, "lr": 8.524864980185594e-05} +{"train_loss": 0.00932501070201397, "global_step": 18293, "epoch": 153, "lr": 8.524707845217189e-05} +{"train_loss": 0.0045227548107504845, "global_step": 18294, "epoch": 153, "lr": 8.524550703328397e-05} +{"train_loss": 0.006445583887398243, "global_step": 18295, "epoch": 153, "lr": 8.524393554519525e-05} +{"train_loss": 0.006258734967559576, "global_step": 18296, "epoch": 153, "lr": 8.524236398790883e-05} +{"train_loss": 0.0041223387233912945, "global_step": 18297, "epoch": 153, "lr": 8.524079236142782e-05} +{"train_loss": 0.004374528303742409, "global_step": 18298, "epoch": 153, "lr": 8.523922066575526e-05} +{"train_loss": 0.007915759459137917, "global_step": 18299, "epoch": 153, "lr": 8.523764890089425e-05} +{"train_loss": 0.004433761816471815, "global_step": 18300, "epoch": 153, "lr": 8.523607706684788e-05} +{"train_loss": 0.006022911053150892, "global_step": 18301, "epoch": 153, "lr": 8.523450516361926e-05} +{"train_loss": 0.006452326197177172, "global_step": 18302, "epoch": 153, "lr": 8.523293319121144e-05} +{"train_loss": 0.007419905159622431, "global_step": 18303, "epoch": 153, "lr": 8.523136114962751e-05} +{"train_loss": 0.011028077453374863, "global_step": 18304, "epoch": 153, "lr": 8.522978903887058e-05} +{"train_loss": 0.00564147112891078, "global_step": 18305, "epoch": 153, "lr": 8.522821685894372e-05} +{"train_loss": 0.00658925948664546, "global_step": 18306, "epoch": 153, "lr": 8.522664460985001e-05} +{"train_loss": 0.008164622820913792, "global_step": 18307, "epoch": 153, "lr": 8.522507229159255e-05} +{"train_loss": 0.004096102900803089, "global_step": 18308, "epoch": 153, "lr": 8.522349990417442e-05} +{"train_loss": 0.003843080485239625, "global_step": 18309, "epoch": 153, "lr": 8.522192744759873e-05} +{"train_loss": 0.0035388795658946037, "global_step": 18310, "epoch": 153, "lr": 8.522035492186853e-05} +{"train_loss": 0.00727252708747983, "global_step": 18311, "epoch": 153, "lr": 8.521878232698692e-05} +{"train_loss": 0.009518606588244438, "global_step": 18312, "epoch": 153, "lr": 8.5217209662957e-05} +{"train_loss": 0.008739462122321129, "global_step": 18313, "epoch": 153, "lr": 8.521563692978187e-05} +{"train_loss": 0.006331377197057009, "global_step": 18314, "epoch": 153, "lr": 8.521406412746458e-05} +{"train_loss": 0.0059718238189816475, "global_step": 18315, "epoch": 153, "lr": 8.521249125600825e-05} +{"train_loss": 0.005160068161785603, "global_step": 18316, "epoch": 153, "lr": 8.521091831541596e-05} +{"train_loss": 0.005448995623737574, "global_step": 18317, "epoch": 153, "lr": 8.520934530569078e-05} +{"train_loss": 0.007152959704399109, "global_step": 18318, "epoch": 153, "lr": 8.520777222683581e-05} +{"train_loss": 0.0038686173502355814, "global_step": 18319, "epoch": 153, "lr": 8.520619907885415e-05} +{"train_loss": 0.005024050362408161, "global_step": 18320, "epoch": 153, "lr": 8.520462586174887e-05} +{"train_loss": 0.0035498845390975475, "global_step": 18321, "epoch": 153, "lr": 8.520305257552305e-05} +{"train_loss": 0.004936743061989546, "global_step": 18322, "epoch": 153, "lr": 8.520147922017984e-05} +{"train_loss": 0.0073264287784695625, "global_step": 18323, "epoch": 153, "lr": 8.519990579572225e-05} +{"train_loss": 0.007460953202098608, "global_step": 18324, "epoch": 153, "lr": 8.519833230215344e-05} +{"train_loss": 0.0062292642214437245, "global_step": 18325, "epoch": 153, "lr": 8.519675873947643e-05, "val_loss": 0.02141615003347397} +{"train_loss": 0.006283754948526621, "global_step": 18326, "epoch": 154, "lr": 8.519518510769438e-05} +{"train_loss": 0.006623507477343082, "global_step": 18327, "epoch": 154, "lr": 8.519361140681031e-05} +{"train_loss": 0.006519705522805452, "global_step": 18328, "epoch": 154, "lr": 8.519203763682738e-05} +{"train_loss": 0.007163298316299915, "global_step": 18329, "epoch": 154, "lr": 8.51904637977486e-05} +{"train_loss": 0.004487332887947559, "global_step": 18330, "epoch": 154, "lr": 8.518888988957715e-05} +{"train_loss": 0.005330988671630621, "global_step": 18331, "epoch": 154, "lr": 8.518731591231604e-05} +{"train_loss": 0.0075411018915474415, "global_step": 18332, "epoch": 154, "lr": 8.518574186596839e-05} +{"train_loss": 0.004774203058332205, "global_step": 18333, "epoch": 154, "lr": 8.518416775053731e-05} +{"train_loss": 0.005558823235332966, "global_step": 18334, "epoch": 154, "lr": 8.518259356602588e-05} +{"train_loss": 0.007979005575180054, "global_step": 18335, "epoch": 154, "lr": 8.518101931243718e-05} +{"train_loss": 0.006502452772110701, "global_step": 18336, "epoch": 154, "lr": 8.517944498977431e-05} +{"train_loss": 0.003675493411719799, "global_step": 18337, "epoch": 154, "lr": 8.517787059804036e-05} +{"train_loss": 0.006051790900528431, "global_step": 18338, "epoch": 154, "lr": 8.517629613723841e-05} +{"train_loss": 0.00527802063152194, "global_step": 18339, "epoch": 154, "lr": 8.517472160737156e-05} +{"train_loss": 0.008249092847108841, "global_step": 18340, "epoch": 154, "lr": 8.517314700844293e-05} +{"train_loss": 0.006022285204380751, "global_step": 18341, "epoch": 154, "lr": 8.517157234045555e-05} +{"train_loss": 0.005485581699758768, "global_step": 18342, "epoch": 154, "lr": 8.516999760341255e-05} +{"train_loss": 0.006750111468136311, "global_step": 18343, "epoch": 154, "lr": 8.516842279731702e-05} +{"train_loss": 0.007481881882995367, "global_step": 18344, "epoch": 154, "lr": 8.516684792217207e-05} +{"train_loss": 0.008407926186919212, "global_step": 18345, "epoch": 154, "lr": 8.516527297798073e-05} +{"train_loss": 0.006574271246790886, "global_step": 18346, "epoch": 154, "lr": 8.516369796474616e-05} +{"train_loss": 0.004460599273443222, "global_step": 18347, "epoch": 154, "lr": 8.516212288247145e-05} +{"train_loss": 0.004550757352262735, "global_step": 18348, "epoch": 154, "lr": 8.516054773115964e-05} +{"train_loss": 0.010365545749664307, "global_step": 18349, "epoch": 154, "lr": 8.515897251081384e-05} +{"train_loss": 0.005959006492048502, "global_step": 18350, "epoch": 154, "lr": 8.515739722143716e-05} +{"train_loss": 0.00469430536031723, "global_step": 18351, "epoch": 154, "lr": 8.51558218630327e-05} +{"train_loss": 0.007229663897305727, "global_step": 18352, "epoch": 154, "lr": 8.515424643560354e-05} +{"train_loss": 0.007105831988155842, "global_step": 18353, "epoch": 154, "lr": 8.515267093915276e-05} +{"train_loss": 0.009791660122573376, "global_step": 18354, "epoch": 154, "lr": 8.515109537368346e-05} +{"train_loss": 0.003143881680443883, "global_step": 18355, "epoch": 154, "lr": 8.514951973919876e-05} +{"train_loss": 0.0028362281154841185, "global_step": 18356, "epoch": 154, "lr": 8.514794403570172e-05} +{"train_loss": 0.0059206061996519566, "global_step": 18357, "epoch": 154, "lr": 8.514636826319547e-05} +{"train_loss": 0.008096140809357166, "global_step": 18358, "epoch": 154, "lr": 8.514479242168305e-05} +{"train_loss": 0.009481332264840603, "global_step": 18359, "epoch": 154, "lr": 8.514321651116759e-05} +{"train_loss": 0.005098762456327677, "global_step": 18360, "epoch": 154, "lr": 8.514164053165219e-05} +{"train_loss": 0.003907390870153904, "global_step": 18361, "epoch": 154, "lr": 8.514006448313994e-05} +{"train_loss": 0.006555210333317518, "global_step": 18362, "epoch": 154, "lr": 8.51384883656339e-05} +{"train_loss": 0.005458645988255739, "global_step": 18363, "epoch": 154, "lr": 8.513691217913722e-05} +{"train_loss": 0.006265660282224417, "global_step": 18364, "epoch": 154, "lr": 8.513533592365295e-05} +{"train_loss": 0.005691873840987682, "global_step": 18365, "epoch": 154, "lr": 8.513375959918421e-05} +{"train_loss": 0.004842789378017187, "global_step": 18366, "epoch": 154, "lr": 8.513218320573408e-05} +{"train_loss": 0.006404276005923748, "global_step": 18367, "epoch": 154, "lr": 8.513060674330567e-05} +{"train_loss": 0.0044456846080720425, "global_step": 18368, "epoch": 154, "lr": 8.512903021190206e-05} +{"train_loss": 0.007885447703301907, "global_step": 18369, "epoch": 154, "lr": 8.512745361152634e-05} +{"train_loss": 0.006889938376843929, "global_step": 18370, "epoch": 154, "lr": 8.512587694218164e-05} +{"train_loss": 0.007346396334469318, "global_step": 18371, "epoch": 154, "lr": 8.5124300203871e-05} +{"train_loss": 0.006604402791708708, "global_step": 18372, "epoch": 154, "lr": 8.512272339659759e-05} +{"train_loss": 0.007476008031517267, "global_step": 18373, "epoch": 154, "lr": 8.512114652036446e-05} +{"train_loss": 0.0036868806928396225, "global_step": 18374, "epoch": 154, "lr": 8.51195695751747e-05} +{"train_loss": 0.005796167533844709, "global_step": 18375, "epoch": 154, "lr": 8.511799256103142e-05} +{"train_loss": 0.008490110747516155, "global_step": 18376, "epoch": 154, "lr": 8.511641547793769e-05} +{"train_loss": 0.007463579997420311, "global_step": 18377, "epoch": 154, "lr": 8.511483832589666e-05} +{"train_loss": 0.005753568839281797, "global_step": 18378, "epoch": 154, "lr": 8.511326110491138e-05} +{"train_loss": 0.003172066528350115, "global_step": 18379, "epoch": 154, "lr": 8.511168381498498e-05} +{"train_loss": 0.004301737993955612, "global_step": 18380, "epoch": 154, "lr": 8.511010645612052e-05} +{"train_loss": 0.006340438965708017, "global_step": 18381, "epoch": 154, "lr": 8.510852902832114e-05} +{"train_loss": 0.007434387691318989, "global_step": 18382, "epoch": 154, "lr": 8.51069515315899e-05} +{"train_loss": 0.004258858505636454, "global_step": 18383, "epoch": 154, "lr": 8.51053739659299e-05} +{"train_loss": 0.003568231128156185, "global_step": 18384, "epoch": 154, "lr": 8.510379633134426e-05} +{"train_loss": 0.0037826639600098133, "global_step": 18385, "epoch": 154, "lr": 8.510221862783608e-05} +{"train_loss": 0.008381366729736328, "global_step": 18386, "epoch": 154, "lr": 8.510064085540842e-05} +{"train_loss": 0.005892068613320589, "global_step": 18387, "epoch": 154, "lr": 8.50990630140644e-05} +{"train_loss": 0.007095912005752325, "global_step": 18388, "epoch": 154, "lr": 8.509748510380714e-05} +{"train_loss": 0.006001344881951809, "global_step": 18389, "epoch": 154, "lr": 8.509590712463971e-05} +{"train_loss": 0.007676450535655022, "global_step": 18390, "epoch": 154, "lr": 8.509432907656521e-05} +{"train_loss": 0.004781391005963087, "global_step": 18391, "epoch": 154, "lr": 8.509275095958676e-05} +{"train_loss": 0.00597976241260767, "global_step": 18392, "epoch": 154, "lr": 8.509117277370743e-05} +{"train_loss": 0.003969494253396988, "global_step": 18393, "epoch": 154, "lr": 8.508959451893033e-05} +{"train_loss": 0.004301003646105528, "global_step": 18394, "epoch": 154, "lr": 8.508801619525856e-05} +{"train_loss": 0.00585631188005209, "global_step": 18395, "epoch": 154, "lr": 8.508643780269522e-05} +{"train_loss": 0.006566033232957125, "global_step": 18396, "epoch": 154, "lr": 8.508485934124342e-05} +{"train_loss": 0.005307281855493784, "global_step": 18397, "epoch": 154, "lr": 8.508328081090622e-05} +{"train_loss": 0.0046189348213374615, "global_step": 18398, "epoch": 154, "lr": 8.508170221168678e-05} +{"train_loss": 0.00782080926001072, "global_step": 18399, "epoch": 154, "lr": 8.508012354358814e-05} +{"train_loss": 0.005420622415840626, "global_step": 18400, "epoch": 154, "lr": 8.507854480661344e-05} +{"train_loss": 0.004297097213566303, "global_step": 18401, "epoch": 154, "lr": 8.507696600076576e-05} +{"train_loss": 0.0056574526242911816, "global_step": 18402, "epoch": 154, "lr": 8.507538712604819e-05} +{"train_loss": 0.006798547692596912, "global_step": 18403, "epoch": 154, "lr": 8.507380818246387e-05} +{"train_loss": 0.004920410457998514, "global_step": 18404, "epoch": 154, "lr": 8.507222917001585e-05} +{"train_loss": 0.004115424118936062, "global_step": 18405, "epoch": 154, "lr": 8.507065008870727e-05} +{"train_loss": 0.005112043581902981, "global_step": 18406, "epoch": 154, "lr": 8.506907093854122e-05} +{"train_loss": 0.009018647484481335, "global_step": 18407, "epoch": 154, "lr": 8.506749171952078e-05} +{"train_loss": 0.00481243385002017, "global_step": 18408, "epoch": 154, "lr": 8.506591243164908e-05} +{"train_loss": 0.0047533633187413216, "global_step": 18409, "epoch": 154, "lr": 8.506433307492921e-05} +{"train_loss": 0.006092661526054144, "global_step": 18410, "epoch": 154, "lr": 8.506275364936425e-05} +{"train_loss": 0.00420294888317585, "global_step": 18411, "epoch": 154, "lr": 8.506117415495732e-05} +{"train_loss": 0.006438951473683119, "global_step": 18412, "epoch": 154, "lr": 8.505959459171153e-05} +{"train_loss": 0.006783723831176758, "global_step": 18413, "epoch": 154, "lr": 8.505801495962997e-05} +{"train_loss": 0.005408150609582663, "global_step": 18414, "epoch": 154, "lr": 8.505643525871575e-05} +{"train_loss": 0.004710051696747541, "global_step": 18415, "epoch": 154, "lr": 8.505485548897197e-05} +{"train_loss": 0.0072441017255187035, "global_step": 18416, "epoch": 154, "lr": 8.505327565040172e-05} +{"train_loss": 0.006435438524931669, "global_step": 18417, "epoch": 154, "lr": 8.505169574300808e-05} +{"train_loss": 0.005419311113655567, "global_step": 18418, "epoch": 154, "lr": 8.50501157667942e-05} +{"train_loss": 0.004800900816917419, "global_step": 18419, "epoch": 154, "lr": 8.504853572176316e-05} +{"train_loss": 0.008274883031845093, "global_step": 18420, "epoch": 154, "lr": 8.504695560791808e-05} +{"train_loss": 0.004946256056427956, "global_step": 18421, "epoch": 154, "lr": 8.504537542526203e-05} +{"train_loss": 0.004412690177559853, "global_step": 18422, "epoch": 154, "lr": 8.504379517379815e-05} +{"train_loss": 0.007960168644785881, "global_step": 18423, "epoch": 154, "lr": 8.50422148535295e-05} +{"train_loss": 0.0045609744265675545, "global_step": 18424, "epoch": 154, "lr": 8.504063446445923e-05} +{"train_loss": 0.009518442675471306, "global_step": 18425, "epoch": 154, "lr": 8.503905400659039e-05} +{"train_loss": 0.0028695417568087578, "global_step": 18426, "epoch": 154, "lr": 8.503747347992612e-05} +{"train_loss": 0.004568371456116438, "global_step": 18427, "epoch": 154, "lr": 8.503589288446951e-05} +{"train_loss": 0.007220536470413208, "global_step": 18428, "epoch": 154, "lr": 8.503431222022369e-05} +{"train_loss": 0.004963374696671963, "global_step": 18429, "epoch": 154, "lr": 8.503273148719171e-05} +{"train_loss": 0.005647522397339344, "global_step": 18430, "epoch": 154, "lr": 8.503115068537673e-05} +{"train_loss": 0.006077323574572802, "global_step": 18431, "epoch": 154, "lr": 8.50295698147818e-05} +{"train_loss": 0.007537210360169411, "global_step": 18432, "epoch": 154, "lr": 8.502798887541008e-05} +{"train_loss": 0.006123202387243509, "global_step": 18433, "epoch": 154, "lr": 8.502640786726463e-05} +{"train_loss": 0.005354313645511866, "global_step": 18434, "epoch": 154, "lr": 8.502482679034858e-05} +{"train_loss": 0.0068127745762467384, "global_step": 18435, "epoch": 154, "lr": 8.502324564466501e-05} +{"train_loss": 0.004803365096449852, "global_step": 18436, "epoch": 154, "lr": 8.502166443021705e-05} +{"train_loss": 0.004824049770832062, "global_step": 18437, "epoch": 154, "lr": 8.50200831470078e-05} +{"train_loss": 0.007414554711431265, "global_step": 18438, "epoch": 154, "lr": 8.501850179504034e-05} +{"train_loss": 0.005534053314477205, "global_step": 18439, "epoch": 154, "lr": 8.501692037431782e-05} +{"train_loss": 0.0064123827032744884, "global_step": 18440, "epoch": 154, "lr": 8.501533888484328e-05} +{"train_loss": 0.006389903370290995, "global_step": 18441, "epoch": 154, "lr": 8.50137573266199e-05} +{"train_loss": 0.0038715640548616648, "global_step": 18442, "epoch": 154, "lr": 8.501217569965072e-05} +{"train_loss": 0.0051152268424630165, "global_step": 18443, "epoch": 154, "lr": 8.501059400393888e-05} +{"train_loss": 0.005962336809617006, "global_step": 18444, "epoch": 154, "lr": 8.500901223948748e-05, "val_loss": 0.018473975360393524} +{"train_loss": 0.00414342200383544, "global_step": 18445, "epoch": 155, "lr": 8.500743040629964e-05} +{"train_loss": 0.007030325476080179, "global_step": 18446, "epoch": 155, "lr": 8.500584850437843e-05} +{"train_loss": 0.0034389710053801537, "global_step": 18447, "epoch": 155, "lr": 8.500426653372699e-05} +{"train_loss": 0.004397896584123373, "global_step": 18448, "epoch": 155, "lr": 8.50026844943484e-05} +{"train_loss": 0.006793208420276642, "global_step": 18449, "epoch": 155, "lr": 8.500110238624578e-05} +{"train_loss": 0.00697238277643919, "global_step": 18450, "epoch": 155, "lr": 8.499952020942226e-05} +{"train_loss": 0.004704903345555067, "global_step": 18451, "epoch": 155, "lr": 8.49979379638809e-05} +{"train_loss": 0.005655056796967983, "global_step": 18452, "epoch": 155, "lr": 8.499635564962482e-05} +{"train_loss": 0.005302076227962971, "global_step": 18453, "epoch": 155, "lr": 8.499477326665715e-05} +{"train_loss": 0.004213137086480856, "global_step": 18454, "epoch": 155, "lr": 8.499319081498098e-05} +{"train_loss": 0.004019244574010372, "global_step": 18455, "epoch": 155, "lr": 8.499160829459941e-05} +{"train_loss": 0.006898311898112297, "global_step": 18456, "epoch": 155, "lr": 8.499002570551555e-05} +{"train_loss": 0.004303087946027517, "global_step": 18457, "epoch": 155, "lr": 8.498844304773253e-05} +{"train_loss": 0.004782270174473524, "global_step": 18458, "epoch": 155, "lr": 8.498686032125342e-05} +{"train_loss": 0.007425519172102213, "global_step": 18459, "epoch": 155, "lr": 8.498527752608138e-05} +{"train_loss": 0.004124763887375593, "global_step": 18460, "epoch": 155, "lr": 8.498369466221945e-05} +{"train_loss": 0.00440655741840601, "global_step": 18461, "epoch": 155, "lr": 8.498211172967078e-05} +{"train_loss": 0.004121743142604828, "global_step": 18462, "epoch": 155, "lr": 8.498052872843849e-05} +{"train_loss": 0.0036731224972754717, "global_step": 18463, "epoch": 155, "lr": 8.497894565852566e-05} +{"train_loss": 0.006105491425842047, "global_step": 18464, "epoch": 155, "lr": 8.49773625199354e-05} +{"train_loss": 0.005129270255565643, "global_step": 18465, "epoch": 155, "lr": 8.497577931267084e-05} +{"train_loss": 0.006897416897118092, "global_step": 18466, "epoch": 155, "lr": 8.497419603673507e-05} +{"train_loss": 0.005289948545396328, "global_step": 18467, "epoch": 155, "lr": 8.497261269213119e-05} +{"train_loss": 0.003518695244565606, "global_step": 18468, "epoch": 155, "lr": 8.497102927886232e-05} +{"train_loss": 0.005301660392433405, "global_step": 18469, "epoch": 155, "lr": 8.496944579693157e-05} +{"train_loss": 0.0032286413479596376, "global_step": 18470, "epoch": 155, "lr": 8.496786224634206e-05} +{"train_loss": 0.006323291454464197, "global_step": 18471, "epoch": 155, "lr": 8.49662786270969e-05} +{"train_loss": 0.004635616671293974, "global_step": 18472, "epoch": 155, "lr": 8.496469493919916e-05} +{"train_loss": 0.007588923908770084, "global_step": 18473, "epoch": 155, "lr": 8.4963111182652e-05} +{"train_loss": 0.005549009423702955, "global_step": 18474, "epoch": 155, "lr": 8.49615273574585e-05} +{"train_loss": 0.004892691038548946, "global_step": 18475, "epoch": 155, "lr": 8.495994346362177e-05} +{"train_loss": 0.006874977145344019, "global_step": 18476, "epoch": 155, "lr": 8.495835950114493e-05} +{"train_loss": 0.007087738253176212, "global_step": 18477, "epoch": 155, "lr": 8.495677547003108e-05} +{"train_loss": 0.0036846480797976255, "global_step": 18478, "epoch": 155, "lr": 8.495519137028334e-05} +{"train_loss": 0.006562643218785524, "global_step": 18479, "epoch": 155, "lr": 8.495360720190482e-05} +{"train_loss": 0.006400929763913155, "global_step": 18480, "epoch": 155, "lr": 8.495202296489861e-05} +{"train_loss": 0.008387163281440735, "global_step": 18481, "epoch": 155, "lr": 8.495043865926786e-05} +{"train_loss": 0.00927874818444252, "global_step": 18482, "epoch": 155, "lr": 8.494885428501564e-05} +{"train_loss": 0.007497380021959543, "global_step": 18483, "epoch": 155, "lr": 8.49472698421451e-05} +{"train_loss": 0.0036974381655454636, "global_step": 18484, "epoch": 155, "lr": 8.49456853306593e-05} +{"train_loss": 0.008091832511126995, "global_step": 18485, "epoch": 155, "lr": 8.494410075056141e-05} +{"train_loss": 0.007047074381262064, "global_step": 18486, "epoch": 155, "lr": 8.494251610185449e-05} +{"train_loss": 0.006389555521309376, "global_step": 18487, "epoch": 155, "lr": 8.494093138454167e-05} +{"train_loss": 0.008631735108792782, "global_step": 18488, "epoch": 155, "lr": 8.493934659862608e-05} +{"train_loss": 0.006412470247596502, "global_step": 18489, "epoch": 155, "lr": 8.493776174411081e-05} +{"train_loss": 0.0069038947112858295, "global_step": 18490, "epoch": 155, "lr": 8.493617682099897e-05} +{"train_loss": 0.0045822737738490105, "global_step": 18491, "epoch": 155, "lr": 8.493459182929369e-05} +{"train_loss": 0.004190923646092415, "global_step": 18492, "epoch": 155, "lr": 8.493300676899806e-05} +{"train_loss": 0.0052977558225393295, "global_step": 18493, "epoch": 155, "lr": 8.49314216401152e-05} +{"train_loss": 0.0047341883182525635, "global_step": 18494, "epoch": 155, "lr": 8.492983644264824e-05} +{"train_loss": 0.0036905319429934025, "global_step": 18495, "epoch": 155, "lr": 8.492825117660028e-05} +{"train_loss": 0.0056826276704669, "global_step": 18496, "epoch": 155, "lr": 8.492666584197442e-05} +{"train_loss": 0.006084301043301821, "global_step": 18497, "epoch": 155, "lr": 8.49250804387738e-05} +{"train_loss": 0.006652279756963253, "global_step": 18498, "epoch": 155, "lr": 8.49234949670015e-05} +{"train_loss": 0.008044352754950523, "global_step": 18499, "epoch": 155, "lr": 8.492190942666066e-05} +{"train_loss": 0.0041366866789758205, "global_step": 18500, "epoch": 155, "lr": 8.492032381775437e-05} +{"train_loss": 0.004488801583647728, "global_step": 18501, "epoch": 155, "lr": 8.491873814028575e-05} +{"train_loss": 0.005731946788728237, "global_step": 18502, "epoch": 155, "lr": 8.491715239425793e-05} +{"train_loss": 0.004459851421415806, "global_step": 18503, "epoch": 155, "lr": 8.491556657967402e-05} +{"train_loss": 0.005948742851614952, "global_step": 18504, "epoch": 155, "lr": 8.491398069653709e-05} +{"train_loss": 0.00517678540199995, "global_step": 18505, "epoch": 155, "lr": 8.491239474485031e-05} +{"train_loss": 0.004814349114894867, "global_step": 18506, "epoch": 155, "lr": 8.491080872461679e-05} +{"train_loss": 0.006056119687855244, "global_step": 18507, "epoch": 155, "lr": 8.49092226358396e-05} +{"train_loss": 0.00572921009734273, "global_step": 18508, "epoch": 155, "lr": 8.490763647852188e-05} +{"train_loss": 0.004216894507408142, "global_step": 18509, "epoch": 155, "lr": 8.490605025266676e-05} +{"train_loss": 0.004242205526679754, "global_step": 18510, "epoch": 155, "lr": 8.490446395827734e-05} +{"train_loss": 0.006107718218117952, "global_step": 18511, "epoch": 155, "lr": 8.490287759535673e-05} +{"train_loss": 0.004351317882537842, "global_step": 18512, "epoch": 155, "lr": 8.490129116390805e-05} +{"train_loss": 0.004724656231701374, "global_step": 18513, "epoch": 155, "lr": 8.489970466393442e-05} +{"train_loss": 0.005095740780234337, "global_step": 18514, "epoch": 155, "lr": 8.489811809543894e-05} +{"train_loss": 0.003886606078594923, "global_step": 18515, "epoch": 155, "lr": 8.489653145842474e-05} +{"train_loss": 0.006165855098515749, "global_step": 18516, "epoch": 155, "lr": 8.489494475289492e-05} +{"train_loss": 0.0031282149720937014, "global_step": 18517, "epoch": 155, "lr": 8.48933579788526e-05} +{"train_loss": 0.0058096605353057384, "global_step": 18518, "epoch": 155, "lr": 8.489177113630092e-05} +{"train_loss": 0.004690054338425398, "global_step": 18519, "epoch": 155, "lr": 8.489018422524295e-05} +{"train_loss": 0.005017393734306097, "global_step": 18520, "epoch": 155, "lr": 8.488859724568183e-05} +{"train_loss": 0.004665420390665531, "global_step": 18521, "epoch": 155, "lr": 8.48870101976207e-05} +{"train_loss": 0.00259064557030797, "global_step": 18522, "epoch": 155, "lr": 8.488542308106264e-05} +{"train_loss": 0.005122481379657984, "global_step": 18523, "epoch": 155, "lr": 8.488383589601078e-05} +{"train_loss": 0.0068109845742583275, "global_step": 18524, "epoch": 155, "lr": 8.488224864246825e-05} +{"train_loss": 0.0035741638857871294, "global_step": 18525, "epoch": 155, "lr": 8.488066132043812e-05} +{"train_loss": 0.006161544006317854, "global_step": 18526, "epoch": 155, "lr": 8.487907392992356e-05} +{"train_loss": 0.007468393072485924, "global_step": 18527, "epoch": 155, "lr": 8.487748647092766e-05} +{"train_loss": 0.004527012351900339, "global_step": 18528, "epoch": 155, "lr": 8.487589894345353e-05} +{"train_loss": 0.004996524658054113, "global_step": 18529, "epoch": 155, "lr": 8.487431134750432e-05} +{"train_loss": 0.006132334936410189, "global_step": 18530, "epoch": 155, "lr": 8.487272368308311e-05} +{"train_loss": 0.004817203618586063, "global_step": 18531, "epoch": 155, "lr": 8.487113595019303e-05} +{"train_loss": 0.0048845806159079075, "global_step": 18532, "epoch": 155, "lr": 8.486954814883721e-05} +{"train_loss": 0.004813020117580891, "global_step": 18533, "epoch": 155, "lr": 8.486796027901875e-05} +{"train_loss": 0.009293239563703537, "global_step": 18534, "epoch": 155, "lr": 8.486637234074078e-05} +{"train_loss": 0.004680752754211426, "global_step": 18535, "epoch": 155, "lr": 8.486478433400641e-05} +{"train_loss": 0.006599193438887596, "global_step": 18536, "epoch": 155, "lr": 8.486319625881878e-05} +{"train_loss": 0.00800840463489294, "global_step": 18537, "epoch": 155, "lr": 8.486160811518097e-05} +{"train_loss": 0.009053869172930717, "global_step": 18538, "epoch": 155, "lr": 8.486001990309611e-05} +{"train_loss": 0.008881955407559872, "global_step": 18539, "epoch": 155, "lr": 8.485843162256734e-05} +{"train_loss": 0.003449725918471813, "global_step": 18540, "epoch": 155, "lr": 8.485684327359775e-05} +{"train_loss": 0.007165983319282532, "global_step": 18541, "epoch": 155, "lr": 8.485525485619049e-05} +{"train_loss": 0.004490738734602928, "global_step": 18542, "epoch": 155, "lr": 8.485366637034864e-05} +{"train_loss": 0.005948869977146387, "global_step": 18543, "epoch": 155, "lr": 8.485207781607535e-05} +{"train_loss": 0.005358917638659477, "global_step": 18544, "epoch": 155, "lr": 8.485048919337373e-05} +{"train_loss": 0.007471473887562752, "global_step": 18545, "epoch": 155, "lr": 8.484890050224689e-05} +{"train_loss": 0.005703237373381853, "global_step": 18546, "epoch": 155, "lr": 8.484731174269798e-05} +{"train_loss": 0.0044269864447414875, "global_step": 18547, "epoch": 155, "lr": 8.484572291473008e-05} +{"train_loss": 0.0061016385443508625, "global_step": 18548, "epoch": 155, "lr": 8.484413401834632e-05} +{"train_loss": 0.003814416006207466, "global_step": 18549, "epoch": 155, "lr": 8.484254505354983e-05} +{"train_loss": 0.003939082380384207, "global_step": 18550, "epoch": 155, "lr": 8.484095602034372e-05} +{"train_loss": 0.006455490365624428, "global_step": 18551, "epoch": 155, "lr": 8.483936691873112e-05} +{"train_loss": 0.006079031620174646, "global_step": 18552, "epoch": 155, "lr": 8.483777774871515e-05} +{"train_loss": 0.003588554449379444, "global_step": 18553, "epoch": 155, "lr": 8.483618851029894e-05} +{"train_loss": 0.0042436979711055756, "global_step": 18554, "epoch": 155, "lr": 8.483459920348557e-05} +{"train_loss": 0.005715346895158291, "global_step": 18555, "epoch": 155, "lr": 8.483300982827818e-05} +{"train_loss": 0.0044180164113640785, "global_step": 18556, "epoch": 155, "lr": 8.483142038467992e-05} +{"train_loss": 0.005980309564620256, "global_step": 18557, "epoch": 155, "lr": 8.482983087269387e-05} +{"train_loss": 0.005405796226114035, "global_step": 18558, "epoch": 155, "lr": 8.482824129232318e-05} +{"train_loss": 0.0046726069413125515, "global_step": 18559, "epoch": 155, "lr": 8.482665164357095e-05} +{"train_loss": 0.005102019291371107, "global_step": 18560, "epoch": 155, "lr": 8.482506192644031e-05} +{"train_loss": 0.006182878278195858, "global_step": 18561, "epoch": 155, "lr": 8.482347214093439e-05} +{"train_loss": 0.00657653110101819, "global_step": 18562, "epoch": 155, "lr": 8.48218822870563e-05} +{"train_loss": 0.005535302210223524, "global_step": 18563, "epoch": 155, "lr": 8.482029236480915e-05, "val_loss": 0.01205528900027275, "train_action_mse_error": 0.00014182282029651105} +{"train_loss": 0.0025688798632472754, "global_step": 18564, "epoch": 156, "lr": 8.481870237419609e-05} +{"train_loss": 0.0068250312469899654, "global_step": 18565, "epoch": 156, "lr": 8.481711231522023e-05} +{"train_loss": 0.0031206330750137568, "global_step": 18566, "epoch": 156, "lr": 8.481552218788468e-05} +{"train_loss": 0.004536191467195749, "global_step": 18567, "epoch": 156, "lr": 8.481393199219258e-05} +{"train_loss": 0.007014372851699591, "global_step": 18568, "epoch": 156, "lr": 8.481234172814706e-05} +{"train_loss": 0.007328817620873451, "global_step": 18569, "epoch": 156, "lr": 8.481075139575118e-05} +{"train_loss": 0.004207789432257414, "global_step": 18570, "epoch": 156, "lr": 8.480916099500816e-05} +{"train_loss": 0.0045966170728206635, "global_step": 18571, "epoch": 156, "lr": 8.480757052592104e-05} +{"train_loss": 0.007046440150588751, "global_step": 18572, "epoch": 156, "lr": 8.480597998849298e-05} +{"train_loss": 0.006433433387428522, "global_step": 18573, "epoch": 156, "lr": 8.48043893827271e-05} +{"train_loss": 0.00513959676027298, "global_step": 18574, "epoch": 156, "lr": 8.480279870862652e-05} +{"train_loss": 0.007538207340985537, "global_step": 18575, "epoch": 156, "lr": 8.480120796619434e-05} +{"train_loss": 0.005220451857894659, "global_step": 18576, "epoch": 156, "lr": 8.479961715543374e-05} +{"train_loss": 0.007466783281415701, "global_step": 18577, "epoch": 156, "lr": 8.47980262763478e-05} +{"train_loss": 0.006743569392710924, "global_step": 18578, "epoch": 156, "lr": 8.479643532893965e-05} +{"train_loss": 0.004741941578686237, "global_step": 18579, "epoch": 156, "lr": 8.479484431321242e-05} +{"train_loss": 0.005316604860126972, "global_step": 18580, "epoch": 156, "lr": 8.479325322916923e-05} +{"train_loss": 0.006059239152818918, "global_step": 18581, "epoch": 156, "lr": 8.47916620768132e-05} +{"train_loss": 0.0055300211533904076, "global_step": 18582, "epoch": 156, "lr": 8.479007085614745e-05} +{"train_loss": 0.004557386972010136, "global_step": 18583, "epoch": 156, "lr": 8.478847956717513e-05} +{"train_loss": 0.0049912892282009125, "global_step": 18584, "epoch": 156, "lr": 8.478688820989933e-05} +{"train_loss": 0.005246692802757025, "global_step": 18585, "epoch": 156, "lr": 8.478529678432321e-05} +{"train_loss": 0.005487420130521059, "global_step": 18586, "epoch": 156, "lr": 8.478370529044985e-05} +{"train_loss": 0.005271731875836849, "global_step": 18587, "epoch": 156, "lr": 8.478211372828242e-05} +{"train_loss": 0.006182604469358921, "global_step": 18588, "epoch": 156, "lr": 8.478052209782404e-05} +{"train_loss": 0.004111899994313717, "global_step": 18589, "epoch": 156, "lr": 8.477893039907779e-05} +{"train_loss": 0.006810234393924475, "global_step": 18590, "epoch": 156, "lr": 8.477733863204685e-05} +{"train_loss": 0.006708209402859211, "global_step": 18591, "epoch": 156, "lr": 8.47757467967343e-05} +{"train_loss": 0.005195956211537123, "global_step": 18592, "epoch": 156, "lr": 8.47741548931433e-05} +{"train_loss": 0.0061600785702466965, "global_step": 18593, "epoch": 156, "lr": 8.477256292127696e-05} +{"train_loss": 0.0036068938206881285, "global_step": 18594, "epoch": 156, "lr": 8.47709708811384e-05} +{"train_loss": 0.006836278364062309, "global_step": 18595, "epoch": 156, "lr": 8.476937877273075e-05} +{"train_loss": 0.0034913895651698112, "global_step": 18596, "epoch": 156, "lr": 8.476778659605715e-05} +{"train_loss": 0.005406435113400221, "global_step": 18597, "epoch": 156, "lr": 8.476619435112072e-05} +{"train_loss": 0.002936101285740733, "global_step": 18598, "epoch": 156, "lr": 8.476460203792458e-05} +{"train_loss": 0.004388931207358837, "global_step": 18599, "epoch": 156, "lr": 8.476300965647186e-05} +{"train_loss": 0.0031307016033679247, "global_step": 18600, "epoch": 156, "lr": 8.476141720676567e-05} +{"train_loss": 0.00340926181524992, "global_step": 18601, "epoch": 156, "lr": 8.475982468880916e-05} +{"train_loss": 0.004857718013226986, "global_step": 18602, "epoch": 156, "lr": 8.475823210260545e-05} +{"train_loss": 0.005076396744698286, "global_step": 18603, "epoch": 156, "lr": 8.475663944815766e-05} +{"train_loss": 0.0052563901990652084, "global_step": 18604, "epoch": 156, "lr": 8.475504672546892e-05} +{"train_loss": 0.003190862713381648, "global_step": 18605, "epoch": 156, "lr": 8.475345393454237e-05} +{"train_loss": 0.0043149832636117935, "global_step": 18606, "epoch": 156, "lr": 8.475186107538111e-05} +{"train_loss": 0.00311833037994802, "global_step": 18607, "epoch": 156, "lr": 8.47502681479883e-05} +{"train_loss": 0.006854644976556301, "global_step": 18608, "epoch": 156, "lr": 8.474867515236705e-05} +{"train_loss": 0.005281366873532534, "global_step": 18609, "epoch": 156, "lr": 8.474708208852046e-05} +{"train_loss": 0.00836675800383091, "global_step": 18610, "epoch": 156, "lr": 8.474548895645172e-05} +{"train_loss": 0.005093663930892944, "global_step": 18611, "epoch": 156, "lr": 8.47438957561639e-05} +{"train_loss": 0.004946964327245951, "global_step": 18612, "epoch": 156, "lr": 8.474230248766017e-05} +{"train_loss": 0.008061468601226807, "global_step": 18613, "epoch": 156, "lr": 8.474070915094363e-05} +{"train_loss": 0.0037105532828718424, "global_step": 18614, "epoch": 156, "lr": 8.473911574601743e-05} +{"train_loss": 0.005506123881787062, "global_step": 18615, "epoch": 156, "lr": 8.473752227288469e-05} +{"train_loss": 0.00889823492616415, "global_step": 18616, "epoch": 156, "lr": 8.473592873154852e-05} +{"train_loss": 0.003547611879184842, "global_step": 18617, "epoch": 156, "lr": 8.473433512201208e-05} +{"train_loss": 0.004549711477011442, "global_step": 18618, "epoch": 156, "lr": 8.473274144427848e-05} +{"train_loss": 0.007668905425816774, "global_step": 18619, "epoch": 156, "lr": 8.473114769835085e-05} +{"train_loss": 0.003756718710064888, "global_step": 18620, "epoch": 156, "lr": 8.472955388423231e-05} +{"train_loss": 0.008266769349575043, "global_step": 18621, "epoch": 156, "lr": 8.472796000192602e-05} +{"train_loss": 0.0064704869873821735, "global_step": 18622, "epoch": 156, "lr": 8.47263660514351e-05} +{"train_loss": 0.006782409735023975, "global_step": 18623, "epoch": 156, "lr": 8.472477203276263e-05} +{"train_loss": 0.003335012588649988, "global_step": 18624, "epoch": 156, "lr": 8.47231779459118e-05} +{"train_loss": 0.004924689419567585, "global_step": 18625, "epoch": 156, "lr": 8.472158379088573e-05} +{"train_loss": 0.004414783325046301, "global_step": 18626, "epoch": 156, "lr": 8.471998956768753e-05} +{"train_loss": 0.004713273141533136, "global_step": 18627, "epoch": 156, "lr": 8.471839527632035e-05} +{"train_loss": 0.0034370373468846083, "global_step": 18628, "epoch": 156, "lr": 8.47168009167873e-05} +{"train_loss": 0.00816839374601841, "global_step": 18629, "epoch": 156, "lr": 8.471520648909152e-05} +{"train_loss": 0.010303604416549206, "global_step": 18630, "epoch": 156, "lr": 8.471361199323616e-05} +{"train_loss": 0.006729049142450094, "global_step": 18631, "epoch": 156, "lr": 8.47120174292243e-05} +{"train_loss": 0.004445735365152359, "global_step": 18632, "epoch": 156, "lr": 8.471042279705912e-05} +{"train_loss": 0.0068977223709225655, "global_step": 18633, "epoch": 156, "lr": 8.470882809674373e-05} +{"train_loss": 0.008335280232131481, "global_step": 18634, "epoch": 156, "lr": 8.470723332828127e-05} +{"train_loss": 0.006509345956146717, "global_step": 18635, "epoch": 156, "lr": 8.470563849167485e-05} +{"train_loss": 0.007144252769649029, "global_step": 18636, "epoch": 156, "lr": 8.470404358692764e-05} +{"train_loss": 0.008590771816670895, "global_step": 18637, "epoch": 156, "lr": 8.470244861404273e-05} +{"train_loss": 0.007590441964566708, "global_step": 18638, "epoch": 156, "lr": 8.470085357302327e-05} +{"train_loss": 0.004959451500326395, "global_step": 18639, "epoch": 156, "lr": 8.46992584638724e-05} +{"train_loss": 0.005735310725867748, "global_step": 18640, "epoch": 156, "lr": 8.469766328659323e-05} +{"train_loss": 0.005749175325036049, "global_step": 18641, "epoch": 156, "lr": 8.469606804118892e-05} +{"train_loss": 0.00856917817145586, "global_step": 18642, "epoch": 156, "lr": 8.469447272766258e-05} +{"train_loss": 0.004477369599044323, "global_step": 18643, "epoch": 156, "lr": 8.469287734601735e-05} +{"train_loss": 0.007893664762377739, "global_step": 18644, "epoch": 156, "lr": 8.469128189625637e-05} +{"train_loss": 0.006991006899625063, "global_step": 18645, "epoch": 156, "lr": 8.468968637838275e-05} +{"train_loss": 0.009005359373986721, "global_step": 18646, "epoch": 156, "lr": 8.468809079239964e-05} +{"train_loss": 0.0031978883780539036, "global_step": 18647, "epoch": 156, "lr": 8.468649513831019e-05} +{"train_loss": 0.004738863091915846, "global_step": 18648, "epoch": 156, "lr": 8.468489941611748e-05} +{"train_loss": 0.005265479441732168, "global_step": 18649, "epoch": 156, "lr": 8.46833036258247e-05} +{"train_loss": 0.005189172923564911, "global_step": 18650, "epoch": 156, "lr": 8.468170776743494e-05} +{"train_loss": 0.00578915374353528, "global_step": 18651, "epoch": 156, "lr": 8.468011184095137e-05} +{"train_loss": 0.00674001919105649, "global_step": 18652, "epoch": 156, "lr": 8.467851584637709e-05} +{"train_loss": 0.004163879901170731, "global_step": 18653, "epoch": 156, "lr": 8.467691978371526e-05} +{"train_loss": 0.004912734031677246, "global_step": 18654, "epoch": 156, "lr": 8.4675323652969e-05} +{"train_loss": 0.007521900348365307, "global_step": 18655, "epoch": 156, "lr": 8.467372745414143e-05} +{"train_loss": 0.004937966354191303, "global_step": 18656, "epoch": 156, "lr": 8.467213118723572e-05} +{"train_loss": 0.0055832769721746445, "global_step": 18657, "epoch": 156, "lr": 8.467053485225499e-05} +{"train_loss": 0.0040725283324718475, "global_step": 18658, "epoch": 156, "lr": 8.466893844920236e-05} +{"train_loss": 0.005626889411360025, "global_step": 18659, "epoch": 156, "lr": 8.466734197808097e-05} +{"train_loss": 0.007397053763270378, "global_step": 18660, "epoch": 156, "lr": 8.466574543889397e-05} +{"train_loss": 0.006066943984478712, "global_step": 18661, "epoch": 156, "lr": 8.466414883164447e-05} +{"train_loss": 0.010039737448096275, "global_step": 18662, "epoch": 156, "lr": 8.466255215633561e-05} +{"train_loss": 0.005039765499532223, "global_step": 18663, "epoch": 156, "lr": 8.466095541297055e-05} +{"train_loss": 0.004490536637604237, "global_step": 18664, "epoch": 156, "lr": 8.465935860155239e-05} +{"train_loss": 0.006932062096893787, "global_step": 18665, "epoch": 156, "lr": 8.465776172208428e-05} +{"train_loss": 0.006054476369172335, "global_step": 18666, "epoch": 156, "lr": 8.465616477456938e-05} +{"train_loss": 0.005103759467601776, "global_step": 18667, "epoch": 156, "lr": 8.465456775901079e-05} +{"train_loss": 0.005169849377125502, "global_step": 18668, "epoch": 156, "lr": 8.465297067541166e-05} +{"train_loss": 0.007633950561285019, "global_step": 18669, "epoch": 156, "lr": 8.465137352377513e-05} +{"train_loss": 0.005645201541483402, "global_step": 18670, "epoch": 156, "lr": 8.464977630410431e-05} +{"train_loss": 0.005461891181766987, "global_step": 18671, "epoch": 156, "lr": 8.464817901640238e-05} +{"train_loss": 0.009358827024698257, "global_step": 18672, "epoch": 156, "lr": 8.464658166067243e-05} +{"train_loss": 0.0071450634859502316, "global_step": 18673, "epoch": 156, "lr": 8.464498423691763e-05} +{"train_loss": 0.003497887635603547, "global_step": 18674, "epoch": 156, "lr": 8.46433867451411e-05} +{"train_loss": 0.009106709621846676, "global_step": 18675, "epoch": 156, "lr": 8.4641789185346e-05} +{"train_loss": 0.003695581341162324, "global_step": 18676, "epoch": 156, "lr": 8.464019155753542e-05} +{"train_loss": 0.0050042602233588696, "global_step": 18677, "epoch": 156, "lr": 8.463859386171254e-05} +{"train_loss": 0.0065033407881855965, "global_step": 18678, "epoch": 156, "lr": 8.463699609788048e-05} +{"train_loss": 0.005746776238083839, "global_step": 18679, "epoch": 156, "lr": 8.463539826604238e-05} +{"train_loss": 0.004945481661707163, "global_step": 18680, "epoch": 156, "lr": 8.463380036620139e-05} +{"train_loss": 0.004517498891800642, "global_step": 18681, "epoch": 156, "lr": 8.46322023983606e-05} +{"train_loss": 0.005714963589395795, "global_step": 18682, "epoch": 156, "lr": 8.463060436252321e-05, "val_loss": 0.01893359236419201} +{"train_loss": 0.0034578002523630857, "global_step": 18683, "epoch": 157, "lr": 8.462900625869231e-05} +{"train_loss": 0.006892639212310314, "global_step": 18684, "epoch": 157, "lr": 8.462740808687106e-05} +{"train_loss": 0.004080010112375021, "global_step": 18685, "epoch": 157, "lr": 8.46258098470626e-05} +{"train_loss": 0.004427395761013031, "global_step": 18686, "epoch": 157, "lr": 8.462421153927006e-05} +{"train_loss": 0.006556092761456966, "global_step": 18687, "epoch": 157, "lr": 8.462261316349658e-05} +{"train_loss": 0.006286778952926397, "global_step": 18688, "epoch": 157, "lr": 8.462101471974528e-05} +{"train_loss": 0.003996263258159161, "global_step": 18689, "epoch": 157, "lr": 8.461941620801934e-05} +{"train_loss": 0.008949005976319313, "global_step": 18690, "epoch": 157, "lr": 8.461781762832187e-05} +{"train_loss": 0.005015164613723755, "global_step": 18691, "epoch": 157, "lr": 8.4616218980656e-05} +{"train_loss": 0.004458751063793898, "global_step": 18692, "epoch": 157, "lr": 8.461462026502489e-05} +{"train_loss": 0.006157184951007366, "global_step": 18693, "epoch": 157, "lr": 8.461302148143168e-05} +{"train_loss": 0.008158220909535885, "global_step": 18694, "epoch": 157, "lr": 8.461142262987949e-05} +{"train_loss": 0.006119015160948038, "global_step": 18695, "epoch": 157, "lr": 8.460982371037147e-05} +{"train_loss": 0.003806587541475892, "global_step": 18696, "epoch": 157, "lr": 8.460822472291077e-05} +{"train_loss": 0.0077329664491117, "global_step": 18697, "epoch": 157, "lr": 8.460662566750051e-05} +{"train_loss": 0.002936457982286811, "global_step": 18698, "epoch": 157, "lr": 8.460502654414383e-05} +{"train_loss": 0.005013532470911741, "global_step": 18699, "epoch": 157, "lr": 8.460342735284388e-05} +{"train_loss": 0.004760516341775656, "global_step": 18700, "epoch": 157, "lr": 8.460182809360379e-05} +{"train_loss": 0.004342339001595974, "global_step": 18701, "epoch": 157, "lr": 8.460022876642672e-05} +{"train_loss": 0.004330276977270842, "global_step": 18702, "epoch": 157, "lr": 8.459862937131581e-05} +{"train_loss": 0.004359664395451546, "global_step": 18703, "epoch": 157, "lr": 8.459702990827416e-05} +{"train_loss": 0.00828457996249199, "global_step": 18704, "epoch": 157, "lr": 8.459543037730496e-05} +{"train_loss": 0.005808438640087843, "global_step": 18705, "epoch": 157, "lr": 8.459383077841132e-05} +{"train_loss": 0.005651755258440971, "global_step": 18706, "epoch": 157, "lr": 8.459223111159639e-05} +{"train_loss": 0.00648478651419282, "global_step": 18707, "epoch": 157, "lr": 8.459063137686332e-05} +{"train_loss": 0.007657362148165703, "global_step": 18708, "epoch": 157, "lr": 8.458903157421522e-05} +{"train_loss": 0.008192939683794975, "global_step": 18709, "epoch": 157, "lr": 8.458743170365527e-05} +{"train_loss": 0.006245387252420187, "global_step": 18710, "epoch": 157, "lr": 8.458583176518657e-05} +{"train_loss": 0.005753801669925451, "global_step": 18711, "epoch": 157, "lr": 8.45842317588123e-05} +{"train_loss": 0.004722982179373503, "global_step": 18712, "epoch": 157, "lr": 8.458263168453558e-05} +{"train_loss": 0.007126418873667717, "global_step": 18713, "epoch": 157, "lr": 8.458103154235957e-05} +{"train_loss": 0.006498024798929691, "global_step": 18714, "epoch": 157, "lr": 8.457943133228738e-05} +{"train_loss": 0.005988784600049257, "global_step": 18715, "epoch": 157, "lr": 8.457783105432219e-05} +{"train_loss": 0.0042479196563363075, "global_step": 18716, "epoch": 157, "lr": 8.457623070846711e-05} +{"train_loss": 0.007621391210705042, "global_step": 18717, "epoch": 157, "lr": 8.45746302947253e-05} +{"train_loss": 0.004363820422440767, "global_step": 18718, "epoch": 157, "lr": 8.45730298130999e-05} +{"train_loss": 0.007917821407318115, "global_step": 18719, "epoch": 157, "lr": 8.457142926359405e-05} +{"train_loss": 0.005066231824457645, "global_step": 18720, "epoch": 157, "lr": 8.456982864621088e-05} +{"train_loss": 0.00562272546812892, "global_step": 18721, "epoch": 157, "lr": 8.456822796095355e-05} +{"train_loss": 0.00381681090220809, "global_step": 18722, "epoch": 157, "lr": 8.45666272078252e-05} +{"train_loss": 0.009226075373589993, "global_step": 18723, "epoch": 157, "lr": 8.456502638682897e-05} +{"train_loss": 0.004312101751565933, "global_step": 18724, "epoch": 157, "lr": 8.4563425497968e-05} +{"train_loss": 0.0033569280058145523, "global_step": 18725, "epoch": 157, "lr": 8.456182454124544e-05} +{"train_loss": 0.0062239039689302444, "global_step": 18726, "epoch": 157, "lr": 8.456022351666444e-05} +{"train_loss": 0.004266653209924698, "global_step": 18727, "epoch": 157, "lr": 8.455862242422812e-05} +{"train_loss": 0.005619005300104618, "global_step": 18728, "epoch": 157, "lr": 8.455702126393963e-05} +{"train_loss": 0.0043416800908744335, "global_step": 18729, "epoch": 157, "lr": 8.455542003580215e-05} +{"train_loss": 0.0047645848244428635, "global_step": 18730, "epoch": 157, "lr": 8.455381873981877e-05} +{"train_loss": 0.0066452715545892715, "global_step": 18731, "epoch": 157, "lr": 8.455221737599265e-05} +{"train_loss": 0.0051285699009895325, "global_step": 18732, "epoch": 157, "lr": 8.455061594432696e-05} +{"train_loss": 0.004027105402201414, "global_step": 18733, "epoch": 157, "lr": 8.454901444482483e-05} +{"train_loss": 0.005863855127245188, "global_step": 18734, "epoch": 157, "lr": 8.45474128774894e-05} +{"train_loss": 0.006388538982719183, "global_step": 18735, "epoch": 157, "lr": 8.454581124232382e-05} +{"train_loss": 0.0072343130595982075, "global_step": 18736, "epoch": 157, "lr": 8.45442095393312e-05} +{"train_loss": 0.005762639921158552, "global_step": 18737, "epoch": 157, "lr": 8.454260776851475e-05} +{"train_loss": 0.0033151123207062483, "global_step": 18738, "epoch": 157, "lr": 8.454100592987755e-05} +{"train_loss": 0.006586187984794378, "global_step": 18739, "epoch": 157, "lr": 8.45394040234228e-05} +{"train_loss": 0.0073832557536661625, "global_step": 18740, "epoch": 157, "lr": 8.453780204915361e-05} +{"train_loss": 0.009444370865821838, "global_step": 18741, "epoch": 157, "lr": 8.453620000707314e-05} +{"train_loss": 0.008108057081699371, "global_step": 18742, "epoch": 157, "lr": 8.453459789718452e-05} +{"train_loss": 0.008975796401500702, "global_step": 18743, "epoch": 157, "lr": 8.453299571949092e-05} +{"train_loss": 0.00821208581328392, "global_step": 18744, "epoch": 157, "lr": 8.453139347399546e-05} +{"train_loss": 0.006151834037154913, "global_step": 18745, "epoch": 157, "lr": 8.45297911607013e-05} +{"train_loss": 0.00734329130500555, "global_step": 18746, "epoch": 157, "lr": 8.45281887796116e-05} +{"train_loss": 0.006271593738347292, "global_step": 18747, "epoch": 157, "lr": 8.452658633072948e-05} +{"train_loss": 0.007522033993154764, "global_step": 18748, "epoch": 157, "lr": 8.452498381405808e-05} +{"train_loss": 0.0061263456009328365, "global_step": 18749, "epoch": 157, "lr": 8.452338122960057e-05} +{"train_loss": 0.005163175519555807, "global_step": 18750, "epoch": 157, "lr": 8.45217785773601e-05} +{"train_loss": 0.006353003904223442, "global_step": 18751, "epoch": 157, "lr": 8.45201758573398e-05} +{"train_loss": 0.00468475092202425, "global_step": 18752, "epoch": 157, "lr": 8.451857306954282e-05} +{"train_loss": 0.007885324768722057, "global_step": 18753, "epoch": 157, "lr": 8.451697021397233e-05} +{"train_loss": 0.009147971868515015, "global_step": 18754, "epoch": 157, "lr": 8.451536729063145e-05} +{"train_loss": 0.007589645683765411, "global_step": 18755, "epoch": 157, "lr": 8.451376429952331e-05} +{"train_loss": 0.003833700204268098, "global_step": 18756, "epoch": 157, "lr": 8.451216124065109e-05} +{"train_loss": 0.004751989152282476, "global_step": 18757, "epoch": 157, "lr": 8.451055811401793e-05} +{"train_loss": 0.007849117740988731, "global_step": 18758, "epoch": 157, "lr": 8.450895491962699e-05} +{"train_loss": 0.009222844615578651, "global_step": 18759, "epoch": 157, "lr": 8.45073516574814e-05} +{"train_loss": 0.004714954644441605, "global_step": 18760, "epoch": 157, "lr": 8.450574832758431e-05} +{"train_loss": 0.003677201224491, "global_step": 18761, "epoch": 157, "lr": 8.450414492993886e-05} +{"train_loss": 0.00503949262201786, "global_step": 18762, "epoch": 157, "lr": 8.450254146454822e-05} +{"train_loss": 0.006797755602747202, "global_step": 18763, "epoch": 157, "lr": 8.450093793141551e-05} +{"train_loss": 0.007764545269310474, "global_step": 18764, "epoch": 157, "lr": 8.44993343305439e-05} +{"train_loss": 0.005207858048379421, "global_step": 18765, "epoch": 157, "lr": 8.449773066193654e-05} +{"train_loss": 0.004028362222015858, "global_step": 18766, "epoch": 157, "lr": 8.449612692559656e-05} +{"train_loss": 0.00681960117071867, "global_step": 18767, "epoch": 157, "lr": 8.449452312152714e-05} +{"train_loss": 0.008927343413233757, "global_step": 18768, "epoch": 157, "lr": 8.449291924973139e-05} +{"train_loss": 0.005973135586827993, "global_step": 18769, "epoch": 157, "lr": 8.449131531021248e-05} +{"train_loss": 0.006906585767865181, "global_step": 18770, "epoch": 157, "lr": 8.448971130297356e-05} +{"train_loss": 0.005643454845994711, "global_step": 18771, "epoch": 157, "lr": 8.448810722801779e-05} +{"train_loss": 0.005659035407006741, "global_step": 18772, "epoch": 157, "lr": 8.448650308534829e-05} +{"train_loss": 0.006488035898655653, "global_step": 18773, "epoch": 157, "lr": 8.448489887496822e-05} +{"train_loss": 0.006056117359548807, "global_step": 18774, "epoch": 157, "lr": 8.448329459688076e-05} +{"train_loss": 0.0051924544386565685, "global_step": 18775, "epoch": 157, "lr": 8.448169025108901e-05} +{"train_loss": 0.006345770321786404, "global_step": 18776, "epoch": 157, "lr": 8.448008583759616e-05} +{"train_loss": 0.004457527305930853, "global_step": 18777, "epoch": 157, "lr": 8.447848135640532e-05} +{"train_loss": 0.005497755017131567, "global_step": 18778, "epoch": 157, "lr": 8.44768768075197e-05} +{"train_loss": 0.005581853911280632, "global_step": 18779, "epoch": 157, "lr": 8.44752721909424e-05} +{"train_loss": 0.007625488564372063, "global_step": 18780, "epoch": 157, "lr": 8.447366750667659e-05} +{"train_loss": 0.005472318734973669, "global_step": 18781, "epoch": 157, "lr": 8.447206275472541e-05} +{"train_loss": 0.004515096545219421, "global_step": 18782, "epoch": 157, "lr": 8.447045793509202e-05} +{"train_loss": 0.007481784094125032, "global_step": 18783, "epoch": 157, "lr": 8.446885304777957e-05} +{"train_loss": 0.0051666367799043655, "global_step": 18784, "epoch": 157, "lr": 8.44672480927912e-05} +{"train_loss": 0.004844893701374531, "global_step": 18785, "epoch": 157, "lr": 8.446564307013009e-05} +{"train_loss": 0.004688314162194729, "global_step": 18786, "epoch": 157, "lr": 8.446403797979937e-05} +{"train_loss": 0.004847191274166107, "global_step": 18787, "epoch": 157, "lr": 8.446243282180218e-05} +{"train_loss": 0.008220228366553783, "global_step": 18788, "epoch": 157, "lr": 8.446082759614168e-05} +{"train_loss": 0.004284649156033993, "global_step": 18789, "epoch": 157, "lr": 8.445922230282105e-05} +{"train_loss": 0.00580187002196908, "global_step": 18790, "epoch": 157, "lr": 8.44576169418434e-05} +{"train_loss": 0.005187576171010733, "global_step": 18791, "epoch": 157, "lr": 8.445601151321193e-05} +{"train_loss": 0.008197113871574402, "global_step": 18792, "epoch": 157, "lr": 8.445440601692973e-05} +{"train_loss": 0.0047420295886695385, "global_step": 18793, "epoch": 157, "lr": 8.4452800453e-05} +{"train_loss": 0.005475538782775402, "global_step": 18794, "epoch": 157, "lr": 8.445119482142585e-05} +{"train_loss": 0.00618733512237668, "global_step": 18795, "epoch": 157, "lr": 8.444958912221048e-05} +{"train_loss": 0.004797378554940224, "global_step": 18796, "epoch": 157, "lr": 8.444798335535702e-05} +{"train_loss": 0.005378641653805971, "global_step": 18797, "epoch": 157, "lr": 8.444637752086864e-05} +{"train_loss": 0.0054224515333771706, "global_step": 18798, "epoch": 157, "lr": 8.444477161874846e-05} +{"train_loss": 0.006223314441740513, "global_step": 18799, "epoch": 157, "lr": 8.444316564899966e-05} +{"train_loss": 0.006413170602172613, "global_step": 18800, "epoch": 157, "lr": 8.444155961162536e-05} +{"train_loss": 0.00595347532423354, "global_step": 18801, "epoch": 157, "lr": 8.443995350662877e-05, "val_loss": 0.013876394368708134} +{"train_loss": 0.004970872309058905, "global_step": 18802, "epoch": 158, "lr": 8.443834733401299e-05} +{"train_loss": 0.008193569257855415, "global_step": 18803, "epoch": 158, "lr": 8.443674109378121e-05} +{"train_loss": 0.005885821767151356, "global_step": 18804, "epoch": 158, "lr": 8.443513478593656e-05} +{"train_loss": 0.0034899439197033644, "global_step": 18805, "epoch": 158, "lr": 8.44335284104822e-05} +{"train_loss": 0.007303493097424507, "global_step": 18806, "epoch": 158, "lr": 8.443192196742129e-05} +{"train_loss": 0.004845497664064169, "global_step": 18807, "epoch": 158, "lr": 8.443031545675697e-05} +{"train_loss": 0.006445514038205147, "global_step": 18808, "epoch": 158, "lr": 8.442870887849242e-05} +{"train_loss": 0.005897600669413805, "global_step": 18809, "epoch": 158, "lr": 8.442710223263075e-05} +{"train_loss": 0.004723175894469023, "global_step": 18810, "epoch": 158, "lr": 8.442549551917518e-05} +{"train_loss": 0.004643175285309553, "global_step": 18811, "epoch": 158, "lr": 8.442388873812881e-05} +{"train_loss": 0.003783997381106019, "global_step": 18812, "epoch": 158, "lr": 8.44222818894948e-05} +{"train_loss": 0.004296937957406044, "global_step": 18813, "epoch": 158, "lr": 8.442067497327632e-05} +{"train_loss": 0.006399862933903933, "global_step": 18814, "epoch": 158, "lr": 8.441906798947654e-05} +{"train_loss": 0.006061631720513105, "global_step": 18815, "epoch": 158, "lr": 8.441746093809859e-05} +{"train_loss": 0.005255646537989378, "global_step": 18816, "epoch": 158, "lr": 8.441585381914562e-05} +{"train_loss": 0.00557665666565299, "global_step": 18817, "epoch": 158, "lr": 8.44142466326208e-05} +{"train_loss": 0.007098520174622536, "global_step": 18818, "epoch": 158, "lr": 8.44126393785273e-05} +{"train_loss": 0.00538278603926301, "global_step": 18819, "epoch": 158, "lr": 8.441103205686824e-05} +{"train_loss": 0.00446299510076642, "global_step": 18820, "epoch": 158, "lr": 8.44094246676468e-05} +{"train_loss": 0.0038937150966376066, "global_step": 18821, "epoch": 158, "lr": 8.440781721086615e-05} +{"train_loss": 0.004047419410198927, "global_step": 18822, "epoch": 158, "lr": 8.440620968652942e-05} +{"train_loss": 0.004249898251146078, "global_step": 18823, "epoch": 158, "lr": 8.440460209463976e-05} +{"train_loss": 0.004580188542604446, "global_step": 18824, "epoch": 158, "lr": 8.440299443520035e-05} +{"train_loss": 0.005227631889283657, "global_step": 18825, "epoch": 158, "lr": 8.440138670821433e-05} +{"train_loss": 0.0038819240871816874, "global_step": 18826, "epoch": 158, "lr": 8.439977891368486e-05} +{"train_loss": 0.007883649319410324, "global_step": 18827, "epoch": 158, "lr": 8.439817105161509e-05} +{"train_loss": 0.004510083701461554, "global_step": 18828, "epoch": 158, "lr": 8.439656312200821e-05} +{"train_loss": 0.006473494693636894, "global_step": 18829, "epoch": 158, "lr": 8.439495512486733e-05} +{"train_loss": 0.0032895084004849195, "global_step": 18830, "epoch": 158, "lr": 8.439334706019565e-05} +{"train_loss": 0.008197355084121227, "global_step": 18831, "epoch": 158, "lr": 8.43917389279963e-05} +{"train_loss": 0.004640053492039442, "global_step": 18832, "epoch": 158, "lr": 8.439013072827244e-05} +{"train_loss": 0.0035491513554006815, "global_step": 18833, "epoch": 158, "lr": 8.438852246102725e-05} +{"train_loss": 0.007894288748502731, "global_step": 18834, "epoch": 158, "lr": 8.438691412626384e-05} +{"train_loss": 0.0039520952850580215, "global_step": 18835, "epoch": 158, "lr": 8.438530572398542e-05} +{"train_loss": 0.0057080890983343124, "global_step": 18836, "epoch": 158, "lr": 8.438369725419513e-05} +{"train_loss": 0.006315344478935003, "global_step": 18837, "epoch": 158, "lr": 8.43820887168961e-05} +{"train_loss": 0.005183667875826359, "global_step": 18838, "epoch": 158, "lr": 8.438048011209152e-05} +{"train_loss": 0.006645073648542166, "global_step": 18839, "epoch": 158, "lr": 8.437887143978456e-05} +{"train_loss": 0.004180938005447388, "global_step": 18840, "epoch": 158, "lr": 8.437726269997832e-05} +{"train_loss": 0.004325613379478455, "global_step": 18841, "epoch": 158, "lr": 8.437565389267603e-05} +{"train_loss": 0.00895120482891798, "global_step": 18842, "epoch": 158, "lr": 8.437404501788082e-05} +{"train_loss": 0.005380467977374792, "global_step": 18843, "epoch": 158, "lr": 8.437243607559582e-05} +{"train_loss": 0.004821605980396271, "global_step": 18844, "epoch": 158, "lr": 8.437082706582423e-05} +{"train_loss": 0.005501011852174997, "global_step": 18845, "epoch": 158, "lr": 8.436921798856919e-05} +{"train_loss": 0.0038486949633806944, "global_step": 18846, "epoch": 158, "lr": 8.436760884383386e-05} +{"train_loss": 0.0064810593612492085, "global_step": 18847, "epoch": 158, "lr": 8.436599963162141e-05} +{"train_loss": 0.0050966390408575535, "global_step": 18848, "epoch": 158, "lr": 8.436439035193499e-05} +{"train_loss": 0.0045673721469938755, "global_step": 18849, "epoch": 158, "lr": 8.436278100477775e-05} +{"train_loss": 0.003361751092597842, "global_step": 18850, "epoch": 158, "lr": 8.436117159015287e-05} +{"train_loss": 0.007201957516372204, "global_step": 18851, "epoch": 158, "lr": 8.435956210806349e-05} +{"train_loss": 0.005751897115260363, "global_step": 18852, "epoch": 158, "lr": 8.435795255851279e-05} +{"train_loss": 0.0043377261608839035, "global_step": 18853, "epoch": 158, "lr": 8.435634294150392e-05} +{"train_loss": 0.004897611681371927, "global_step": 18854, "epoch": 158, "lr": 8.435473325704005e-05} +{"train_loss": 0.0044984943233430386, "global_step": 18855, "epoch": 158, "lr": 8.43531235051243e-05} +{"train_loss": 0.004745228216052055, "global_step": 18856, "epoch": 158, "lr": 8.435151368575988e-05} +{"train_loss": 0.0071272156201303005, "global_step": 18857, "epoch": 158, "lr": 8.434990379894993e-05} +{"train_loss": 0.0045621744357049465, "global_step": 18858, "epoch": 158, "lr": 8.434829384469762e-05} +{"train_loss": 0.007130774203687906, "global_step": 18859, "epoch": 158, "lr": 8.434668382300611e-05} +{"train_loss": 0.004196884110569954, "global_step": 18860, "epoch": 158, "lr": 8.434507373387856e-05} +{"train_loss": 0.0055559417232871056, "global_step": 18861, "epoch": 158, "lr": 8.434346357731811e-05} +{"train_loss": 0.004734877031296492, "global_step": 18862, "epoch": 158, "lr": 8.434185335332795e-05} +{"train_loss": 0.0031001262832432985, "global_step": 18863, "epoch": 158, "lr": 8.434024306191121e-05} +{"train_loss": 0.006200655363500118, "global_step": 18864, "epoch": 158, "lr": 8.433863270307109e-05} +{"train_loss": 0.006745535880327225, "global_step": 18865, "epoch": 158, "lr": 8.433702227681073e-05} +{"train_loss": 0.0041018337942659855, "global_step": 18866, "epoch": 158, "lr": 8.433541178313329e-05} +{"train_loss": 0.004838425200432539, "global_step": 18867, "epoch": 158, "lr": 8.433380122204195e-05} +{"train_loss": 0.004073295276612043, "global_step": 18868, "epoch": 158, "lr": 8.433219059353986e-05} +{"train_loss": 0.005826103035360575, "global_step": 18869, "epoch": 158, "lr": 8.433057989763017e-05} +{"train_loss": 0.006306140683591366, "global_step": 18870, "epoch": 158, "lr": 8.432896913431605e-05} +{"train_loss": 0.005658227484673262, "global_step": 18871, "epoch": 158, "lr": 8.432735830360068e-05} +{"train_loss": 0.007690587546676397, "global_step": 18872, "epoch": 158, "lr": 8.43257474054872e-05} +{"train_loss": 0.007280396763235331, "global_step": 18873, "epoch": 158, "lr": 8.432413643997878e-05} +{"train_loss": 0.007730650249868631, "global_step": 18874, "epoch": 158, "lr": 8.432252540707859e-05} +{"train_loss": 0.006325656082481146, "global_step": 18875, "epoch": 158, "lr": 8.432091430678979e-05} +{"train_loss": 0.005334860645234585, "global_step": 18876, "epoch": 158, "lr": 8.431930313911554e-05} +{"train_loss": 0.007255627308040857, "global_step": 18877, "epoch": 158, "lr": 8.4317691904059e-05} +{"train_loss": 0.005119302310049534, "global_step": 18878, "epoch": 158, "lr": 8.431608060162335e-05} +{"train_loss": 0.006134958006441593, "global_step": 18879, "epoch": 158, "lr": 8.431446923181174e-05} +{"train_loss": 0.003942430019378662, "global_step": 18880, "epoch": 158, "lr": 8.431285779462732e-05} +{"train_loss": 0.007727121002972126, "global_step": 18881, "epoch": 158, "lr": 8.431124629007327e-05} +{"train_loss": 0.007034521549940109, "global_step": 18882, "epoch": 158, "lr": 8.430963471815277e-05} +{"train_loss": 0.0044870199635624886, "global_step": 18883, "epoch": 158, "lr": 8.430802307886895e-05} +{"train_loss": 0.005663520190864801, "global_step": 18884, "epoch": 158, "lr": 8.430641137222501e-05} +{"train_loss": 0.006103838793933392, "global_step": 18885, "epoch": 158, "lr": 8.43047995982241e-05} +{"train_loss": 0.006448222789913416, "global_step": 18886, "epoch": 158, "lr": 8.430318775686936e-05} +{"train_loss": 0.004108020104467869, "global_step": 18887, "epoch": 158, "lr": 8.4301575848164e-05} +{"train_loss": 0.0040900991298258305, "global_step": 18888, "epoch": 158, "lr": 8.429996387211114e-05} +{"train_loss": 0.0040980856865644455, "global_step": 18889, "epoch": 158, "lr": 8.429835182871397e-05} +{"train_loss": 0.00615777587518096, "global_step": 18890, "epoch": 158, "lr": 8.429673971797564e-05} +{"train_loss": 0.00780410785228014, "global_step": 18891, "epoch": 158, "lr": 8.429512753989934e-05} +{"train_loss": 0.006511886138468981, "global_step": 18892, "epoch": 158, "lr": 8.429351529448823e-05} +{"train_loss": 0.003998125903308392, "global_step": 18893, "epoch": 158, "lr": 8.429190298174546e-05} +{"train_loss": 0.004698850214481354, "global_step": 18894, "epoch": 158, "lr": 8.429029060167419e-05} +{"train_loss": 0.003963808063417673, "global_step": 18895, "epoch": 158, "lr": 8.42886781542776e-05} +{"train_loss": 0.004756654147058725, "global_step": 18896, "epoch": 158, "lr": 8.428706563955887e-05} +{"train_loss": 0.0026791864074766636, "global_step": 18897, "epoch": 158, "lr": 8.428545305752113e-05} +{"train_loss": 0.004683974664658308, "global_step": 18898, "epoch": 158, "lr": 8.428384040816757e-05} +{"train_loss": 0.0041495198383927345, "global_step": 18899, "epoch": 158, "lr": 8.428222769150136e-05} +{"train_loss": 0.0051656924188137054, "global_step": 18900, "epoch": 158, "lr": 8.428061490752565e-05} +{"train_loss": 0.005220094230026007, "global_step": 18901, "epoch": 158, "lr": 8.427900205624361e-05} +{"train_loss": 0.004634426441043615, "global_step": 18902, "epoch": 158, "lr": 8.427738913765844e-05} +{"train_loss": 0.006610116921365261, "global_step": 18903, "epoch": 158, "lr": 8.427577615177324e-05} +{"train_loss": 0.0031218738295137882, "global_step": 18904, "epoch": 158, "lr": 8.427416309859125e-05} +{"train_loss": 0.006118980702012777, "global_step": 18905, "epoch": 158, "lr": 8.427254997811558e-05} +{"train_loss": 0.0030383248813450336, "global_step": 18906, "epoch": 158, "lr": 8.427093679034943e-05} +{"train_loss": 0.005835561081767082, "global_step": 18907, "epoch": 158, "lr": 8.426932353529596e-05} +{"train_loss": 0.006409810855984688, "global_step": 18908, "epoch": 158, "lr": 8.426771021295832e-05} +{"train_loss": 0.0053207422606647015, "global_step": 18909, "epoch": 158, "lr": 8.42660968233397e-05} +{"train_loss": 0.004581010900437832, "global_step": 18910, "epoch": 158, "lr": 8.426448336644326e-05} +{"train_loss": 0.006086395122110844, "global_step": 18911, "epoch": 158, "lr": 8.426286984227216e-05} +{"train_loss": 0.006707219406962395, "global_step": 18912, "epoch": 158, "lr": 8.42612562508296e-05} +{"train_loss": 0.004732787609100342, "global_step": 18913, "epoch": 158, "lr": 8.42596425921187e-05} +{"train_loss": 0.007065747864544392, "global_step": 18914, "epoch": 158, "lr": 8.425802886614265e-05} +{"train_loss": 0.004265832714736462, "global_step": 18915, "epoch": 158, "lr": 8.425641507290462e-05} +{"train_loss": 0.006211303640156984, "global_step": 18916, "epoch": 158, "lr": 8.425480121240779e-05} +{"train_loss": 0.006762112025171518, "global_step": 18917, "epoch": 158, "lr": 8.425318728465532e-05} +{"train_loss": 0.007164434529840946, "global_step": 18918, "epoch": 158, "lr": 8.425157328965036e-05} +{"train_loss": 0.00617866450920701, "global_step": 18919, "epoch": 158, "lr": 8.424995922739611e-05} +{"train_loss": 0.005432983255796447, "global_step": 18920, "epoch": 158, "lr": 8.424834509789572e-05, "val_loss": 0.0158687736839056} +{"train_loss": 0.005985538009554148, "global_step": 18921, "epoch": 159, "lr": 8.424673090115237e-05} +{"train_loss": 0.004390422720462084, "global_step": 18922, "epoch": 159, "lr": 8.42451166371692e-05} +{"train_loss": 0.003938667010515928, "global_step": 18923, "epoch": 159, "lr": 8.424350230594944e-05} +{"train_loss": 0.004179618787020445, "global_step": 18924, "epoch": 159, "lr": 8.424188790749618e-05} +{"train_loss": 0.006105318199843168, "global_step": 18925, "epoch": 159, "lr": 8.424027344181267e-05} +{"train_loss": 0.004553498234599829, "global_step": 18926, "epoch": 159, "lr": 8.423865890890201e-05} +{"train_loss": 0.003121576039120555, "global_step": 18927, "epoch": 159, "lr": 8.423704430876742e-05} +{"train_loss": 0.005197486374527216, "global_step": 18928, "epoch": 159, "lr": 8.423542964141204e-05} +{"train_loss": 0.005487452726811171, "global_step": 18929, "epoch": 159, "lr": 8.423381490683906e-05} +{"train_loss": 0.006495373789221048, "global_step": 18930, "epoch": 159, "lr": 8.423220010505164e-05} +{"train_loss": 0.005721726920455694, "global_step": 18931, "epoch": 159, "lr": 8.423058523605294e-05} +{"train_loss": 0.004312284290790558, "global_step": 18932, "epoch": 159, "lr": 8.422897029984616e-05} +{"train_loss": 0.004995075520128012, "global_step": 18933, "epoch": 159, "lr": 8.422735529643444e-05} +{"train_loss": 0.0044560362584888935, "global_step": 18934, "epoch": 159, "lr": 8.422574022582097e-05} +{"train_loss": 0.00499358493834734, "global_step": 18935, "epoch": 159, "lr": 8.42241250880089e-05} +{"train_loss": 0.006100307684391737, "global_step": 18936, "epoch": 159, "lr": 8.422250988300146e-05} +{"train_loss": 0.004485743585973978, "global_step": 18937, "epoch": 159, "lr": 8.422089461080174e-05} +{"train_loss": 0.00459898030385375, "global_step": 18938, "epoch": 159, "lr": 8.421927927141295e-05} +{"train_loss": 0.005329831037670374, "global_step": 18939, "epoch": 159, "lr": 8.421766386483827e-05} +{"train_loss": 0.007273986004292965, "global_step": 18940, "epoch": 159, "lr": 8.421604839108086e-05} +{"train_loss": 0.003952661994844675, "global_step": 18941, "epoch": 159, "lr": 8.421443285014392e-05} +{"train_loss": 0.005585954524576664, "global_step": 18942, "epoch": 159, "lr": 8.421281724203056e-05} +{"train_loss": 0.00538464542478323, "global_step": 18943, "epoch": 159, "lr": 8.421120156674402e-05} +{"train_loss": 0.005358650349080563, "global_step": 18944, "epoch": 159, "lr": 8.420958582428742e-05} +{"train_loss": 0.004353486001491547, "global_step": 18945, "epoch": 159, "lr": 8.420797001466394e-05} +{"train_loss": 0.005775074008852243, "global_step": 18946, "epoch": 159, "lr": 8.420635413787679e-05} +{"train_loss": 0.0028667792212218046, "global_step": 18947, "epoch": 159, "lr": 8.420473819392912e-05} +{"train_loss": 0.0049551078118383884, "global_step": 18948, "epoch": 159, "lr": 8.420312218282409e-05} +{"train_loss": 0.00618051178753376, "global_step": 18949, "epoch": 159, "lr": 8.420150610456488e-05} +{"train_loss": 0.0036333652678877115, "global_step": 18950, "epoch": 159, "lr": 8.419988995915467e-05} +{"train_loss": 0.005703238304704428, "global_step": 18951, "epoch": 159, "lr": 8.419827374659663e-05} +{"train_loss": 0.005745009984821081, "global_step": 18952, "epoch": 159, "lr": 8.419665746689393e-05} +{"train_loss": 0.007285106927156448, "global_step": 18953, "epoch": 159, "lr": 8.419504112004975e-05} +{"train_loss": 0.007793613243848085, "global_step": 18954, "epoch": 159, "lr": 8.419342470606726e-05} +{"train_loss": 0.004593695048242807, "global_step": 18955, "epoch": 159, "lr": 8.419180822494963e-05} +{"train_loss": 0.005063833203166723, "global_step": 18956, "epoch": 159, "lr": 8.419019167670004e-05} +{"train_loss": 0.006341973785310984, "global_step": 18957, "epoch": 159, "lr": 8.418857506132167e-05} +{"train_loss": 0.005200738552957773, "global_step": 18958, "epoch": 159, "lr": 8.418695837881767e-05} +{"train_loss": 0.005320380907505751, "global_step": 18959, "epoch": 159, "lr": 8.418534162919125e-05} +{"train_loss": 0.00709904870018363, "global_step": 18960, "epoch": 159, "lr": 8.418372481244554e-05} +{"train_loss": 0.005935654975473881, "global_step": 18961, "epoch": 159, "lr": 8.418210792858377e-05} +{"train_loss": 0.0071649192832410336, "global_step": 18962, "epoch": 159, "lr": 8.418049097760904e-05} +{"train_loss": 0.00420122966170311, "global_step": 18963, "epoch": 159, "lr": 8.41788739595246e-05} +{"train_loss": 0.0030585387721657753, "global_step": 18964, "epoch": 159, "lr": 8.417725687433358e-05} +{"train_loss": 0.006709766574203968, "global_step": 18965, "epoch": 159, "lr": 8.417563972203916e-05} +{"train_loss": 0.005292659625411034, "global_step": 18966, "epoch": 159, "lr": 8.417402250264455e-05} +{"train_loss": 0.0062514967285096645, "global_step": 18967, "epoch": 159, "lr": 8.417240521615289e-05} +{"train_loss": 0.00407683989033103, "global_step": 18968, "epoch": 159, "lr": 8.417078786256734e-05} +{"train_loss": 0.004964926745742559, "global_step": 18969, "epoch": 159, "lr": 8.416917044189112e-05} +{"train_loss": 0.004725562874227762, "global_step": 18970, "epoch": 159, "lr": 8.416755295412737e-05} +{"train_loss": 0.006641169544309378, "global_step": 18971, "epoch": 159, "lr": 8.416593539927928e-05} +{"train_loss": 0.005758322309702635, "global_step": 18972, "epoch": 159, "lr": 8.416431777735005e-05} +{"train_loss": 0.004586705006659031, "global_step": 18973, "epoch": 159, "lr": 8.416270008834282e-05} +{"train_loss": 0.0043694437481462955, "global_step": 18974, "epoch": 159, "lr": 8.416108233226077e-05} +{"train_loss": 0.00281177437864244, "global_step": 18975, "epoch": 159, "lr": 8.415946450910707e-05} +{"train_loss": 0.0038661095313727856, "global_step": 18976, "epoch": 159, "lr": 8.415784661888493e-05} +{"train_loss": 0.005609775427728891, "global_step": 18977, "epoch": 159, "lr": 8.415622866159751e-05} +{"train_loss": 0.004172562155872583, "global_step": 18978, "epoch": 159, "lr": 8.415461063724798e-05} +{"train_loss": 0.0031022829934954643, "global_step": 18979, "epoch": 159, "lr": 8.415299254583952e-05} +{"train_loss": 0.005005558952689171, "global_step": 18980, "epoch": 159, "lr": 8.415137438737531e-05} +{"train_loss": 0.0032560157123953104, "global_step": 18981, "epoch": 159, "lr": 8.414975616185852e-05} +{"train_loss": 0.004804752301424742, "global_step": 18982, "epoch": 159, "lr": 8.414813786929234e-05} +{"train_loss": 0.0048426478169858456, "global_step": 18983, "epoch": 159, "lr": 8.414651950967993e-05} +{"train_loss": 0.0059698899276554585, "global_step": 18984, "epoch": 159, "lr": 8.414490108302448e-05} +{"train_loss": 0.005608664359897375, "global_step": 18985, "epoch": 159, "lr": 8.414328258932916e-05} +{"train_loss": 0.004311659839004278, "global_step": 18986, "epoch": 159, "lr": 8.414166402859717e-05} +{"train_loss": 0.0053854347206652164, "global_step": 18987, "epoch": 159, "lr": 8.414004540083166e-05} +{"train_loss": 0.004286114126443863, "global_step": 18988, "epoch": 159, "lr": 8.413842670603581e-05} +{"train_loss": 0.005834726616740227, "global_step": 18989, "epoch": 159, "lr": 8.413680794421282e-05} +{"train_loss": 0.004357248079031706, "global_step": 18990, "epoch": 159, "lr": 8.413518911536584e-05} +{"train_loss": 0.0055208997800946236, "global_step": 18991, "epoch": 159, "lr": 8.413357021949807e-05} +{"train_loss": 0.005085329990833998, "global_step": 18992, "epoch": 159, "lr": 8.413195125661269e-05} +{"train_loss": 0.007074230816215277, "global_step": 18993, "epoch": 159, "lr": 8.413033222671287e-05} +{"train_loss": 0.003932918421924114, "global_step": 18994, "epoch": 159, "lr": 8.412871312980177e-05} +{"train_loss": 0.00481372931972146, "global_step": 18995, "epoch": 159, "lr": 8.41270939658826e-05} +{"train_loss": 0.00330470222979784, "global_step": 18996, "epoch": 159, "lr": 8.412547473495854e-05} +{"train_loss": 0.003962785936892033, "global_step": 18997, "epoch": 159, "lr": 8.412385543703273e-05} +{"train_loss": 0.005972580052912235, "global_step": 18998, "epoch": 159, "lr": 8.412223607210839e-05} +{"train_loss": 0.004435517825186253, "global_step": 18999, "epoch": 159, "lr": 8.412061664018869e-05} +{"train_loss": 0.004732772707939148, "global_step": 19000, "epoch": 159, "lr": 8.411899714127679e-05} +{"train_loss": 0.006170355249196291, "global_step": 19001, "epoch": 159, "lr": 8.41173775753759e-05} +{"train_loss": 0.00579355051741004, "global_step": 19002, "epoch": 159, "lr": 8.411575794248916e-05} +{"train_loss": 0.003947771154344082, "global_step": 19003, "epoch": 159, "lr": 8.41141382426198e-05} +{"train_loss": 0.0034065835643559694, "global_step": 19004, "epoch": 159, "lr": 8.411251847577095e-05} +{"train_loss": 0.0062646144069731236, "global_step": 19005, "epoch": 159, "lr": 8.411089864194583e-05} +{"train_loss": 0.006397857330739498, "global_step": 19006, "epoch": 159, "lr": 8.41092787411476e-05} +{"train_loss": 0.0036566280759871006, "global_step": 19007, "epoch": 159, "lr": 8.410765877337945e-05} +{"train_loss": 0.004839772824198008, "global_step": 19008, "epoch": 159, "lr": 8.410603873864456e-05} +{"train_loss": 0.003423236543312669, "global_step": 19009, "epoch": 159, "lr": 8.410441863694609e-05} +{"train_loss": 0.003978298511356115, "global_step": 19010, "epoch": 159, "lr": 8.410279846828726e-05} +{"train_loss": 0.008226750418543816, "global_step": 19011, "epoch": 159, "lr": 8.410117823267122e-05} +{"train_loss": 0.008432870730757713, "global_step": 19012, "epoch": 159, "lr": 8.409955793010116e-05} +{"train_loss": 0.005178626161068678, "global_step": 19013, "epoch": 159, "lr": 8.409793756058024e-05} +{"train_loss": 0.0064316256903111935, "global_step": 19014, "epoch": 159, "lr": 8.409631712411168e-05} +{"train_loss": 0.004728941712528467, "global_step": 19015, "epoch": 159, "lr": 8.409469662069864e-05} +{"train_loss": 0.0063224961049854755, "global_step": 19016, "epoch": 159, "lr": 8.409307605034431e-05} +{"train_loss": 0.0033712389413267374, "global_step": 19017, "epoch": 159, "lr": 8.409145541305188e-05} +{"train_loss": 0.005995674058794975, "global_step": 19018, "epoch": 159, "lr": 8.40898347088245e-05} +{"train_loss": 0.00647336570546031, "global_step": 19019, "epoch": 159, "lr": 8.408821393766538e-05} +{"train_loss": 0.0025706090964376926, "global_step": 19020, "epoch": 159, "lr": 8.408659309957769e-05} +{"train_loss": 0.005659196991473436, "global_step": 19021, "epoch": 159, "lr": 8.408497219456462e-05} +{"train_loss": 0.004172997083514929, "global_step": 19022, "epoch": 159, "lr": 8.408335122262934e-05} +{"train_loss": 0.006851400248706341, "global_step": 19023, "epoch": 159, "lr": 8.408173018377505e-05} +{"train_loss": 0.004311725031584501, "global_step": 19024, "epoch": 159, "lr": 8.408010907800492e-05} +{"train_loss": 0.006041149143129587, "global_step": 19025, "epoch": 159, "lr": 8.407848790532215e-05} +{"train_loss": 0.00594230554997921, "global_step": 19026, "epoch": 159, "lr": 8.407686666572989e-05} +{"train_loss": 0.003275893395766616, "global_step": 19027, "epoch": 159, "lr": 8.407524535923134e-05} +{"train_loss": 0.004085536114871502, "global_step": 19028, "epoch": 159, "lr": 8.407362398582971e-05} +{"train_loss": 0.0057355924509465694, "global_step": 19029, "epoch": 159, "lr": 8.407200254552814e-05} +{"train_loss": 0.008389590308070183, "global_step": 19030, "epoch": 159, "lr": 8.407038103832985e-05} +{"train_loss": 0.0044356584548950195, "global_step": 19031, "epoch": 159, "lr": 8.4068759464238e-05} +{"train_loss": 0.0033247557003051043, "global_step": 19032, "epoch": 159, "lr": 8.406713782325577e-05} +{"train_loss": 0.004857892170548439, "global_step": 19033, "epoch": 159, "lr": 8.406551611538635e-05} +{"train_loss": 0.004083841107785702, "global_step": 19034, "epoch": 159, "lr": 8.406389434063295e-05} +{"train_loss": 0.0041938479989767075, "global_step": 19035, "epoch": 159, "lr": 8.406227249899872e-05} +{"train_loss": 0.005299179814755917, "global_step": 19036, "epoch": 159, "lr": 8.406065059048686e-05} +{"train_loss": 0.004442878533154726, "global_step": 19037, "epoch": 159, "lr": 8.405902861510055e-05} +{"train_loss": 0.006900655571371317, "global_step": 19038, "epoch": 159, "lr": 8.405740657284298e-05} +{"train_loss": 0.005136842005925269, "global_step": 19039, "epoch": 159, "lr": 8.405578446371731e-05, "val_loss": 0.020589470863342285} +{"train_loss": 0.0075812991708517075, "global_step": 19040, "epoch": 160, "lr": 8.405416228772677e-05} +{"train_loss": 0.00524216378107667, "global_step": 19041, "epoch": 160, "lr": 8.40525400448745e-05} +{"train_loss": 0.007947588339447975, "global_step": 19042, "epoch": 160, "lr": 8.405091773516374e-05} +{"train_loss": 0.004887102171778679, "global_step": 19043, "epoch": 160, "lr": 8.404929535859763e-05} +{"train_loss": 0.0044976635836064816, "global_step": 19044, "epoch": 160, "lr": 8.404767291517934e-05} +{"train_loss": 0.005876349750906229, "global_step": 19045, "epoch": 160, "lr": 8.40460504049121e-05} +{"train_loss": 0.005587064195424318, "global_step": 19046, "epoch": 160, "lr": 8.404442782779906e-05} +{"train_loss": 0.005837625358253717, "global_step": 19047, "epoch": 160, "lr": 8.404280518384345e-05} +{"train_loss": 0.005410187877714634, "global_step": 19048, "epoch": 160, "lr": 8.404118247304842e-05} +{"train_loss": 0.006160742603242397, "global_step": 19049, "epoch": 160, "lr": 8.403955969541716e-05} +{"train_loss": 0.0061177825555205345, "global_step": 19050, "epoch": 160, "lr": 8.403793685095288e-05} +{"train_loss": 0.0044333674013614655, "global_step": 19051, "epoch": 160, "lr": 8.403631393965871e-05} +{"train_loss": 0.007132640108466148, "global_step": 19052, "epoch": 160, "lr": 8.403469096153789e-05} +{"train_loss": 0.004849739372730255, "global_step": 19053, "epoch": 160, "lr": 8.40330679165936e-05} +{"train_loss": 0.005067893769592047, "global_step": 19054, "epoch": 160, "lr": 8.4031444804829e-05} +{"train_loss": 0.004168841987848282, "global_step": 19055, "epoch": 160, "lr": 8.402982162624732e-05} +{"train_loss": 0.007833307608962059, "global_step": 19056, "epoch": 160, "lr": 8.402819838085169e-05} +{"train_loss": 0.005434925202280283, "global_step": 19057, "epoch": 160, "lr": 8.402657506864536e-05} +{"train_loss": 0.0032367403618991375, "global_step": 19058, "epoch": 160, "lr": 8.402495168963147e-05} +{"train_loss": 0.005115237087011337, "global_step": 19059, "epoch": 160, "lr": 8.402332824381321e-05} +{"train_loss": 0.00733796413987875, "global_step": 19060, "epoch": 160, "lr": 8.40217047311938e-05} +{"train_loss": 0.006082995794713497, "global_step": 19061, "epoch": 160, "lr": 8.402008115177639e-05} +{"train_loss": 0.004274600185453892, "global_step": 19062, "epoch": 160, "lr": 8.40184575055642e-05} +{"train_loss": 0.0052644116804003716, "global_step": 19063, "epoch": 160, "lr": 8.40168337925604e-05} +{"train_loss": 0.004753855522722006, "global_step": 19064, "epoch": 160, "lr": 8.401521001276818e-05} +{"train_loss": 0.0065928976982831955, "global_step": 19065, "epoch": 160, "lr": 8.401358616619072e-05} +{"train_loss": 0.003835741663351655, "global_step": 19066, "epoch": 160, "lr": 8.401196225283123e-05} +{"train_loss": 0.004308920353651047, "global_step": 19067, "epoch": 160, "lr": 8.401033827269287e-05} +{"train_loss": 0.006140336859971285, "global_step": 19068, "epoch": 160, "lr": 8.400871422577886e-05} +{"train_loss": 0.006117960438132286, "global_step": 19069, "epoch": 160, "lr": 8.400709011209237e-05} +{"train_loss": 0.0038757706061005592, "global_step": 19070, "epoch": 160, "lr": 8.400546593163658e-05} +{"train_loss": 0.009127169847488403, "global_step": 19071, "epoch": 160, "lr": 8.400384168441471e-05} +{"train_loss": 0.0045149303041398525, "global_step": 19072, "epoch": 160, "lr": 8.400221737042991e-05} +{"train_loss": 0.0054869274608790874, "global_step": 19073, "epoch": 160, "lr": 8.400059298968541e-05} +{"train_loss": 0.005669138394296169, "global_step": 19074, "epoch": 160, "lr": 8.399896854218437e-05} +{"train_loss": 0.006535978987812996, "global_step": 19075, "epoch": 160, "lr": 8.399734402792998e-05} +{"train_loss": 0.0030791552271693945, "global_step": 19076, "epoch": 160, "lr": 8.399571944692544e-05} +{"train_loss": 0.006586323957890272, "global_step": 19077, "epoch": 160, "lr": 8.399409479917393e-05} +{"train_loss": 0.006414060480892658, "global_step": 19078, "epoch": 160, "lr": 8.399247008467865e-05} +{"train_loss": 0.006317305378615856, "global_step": 19079, "epoch": 160, "lr": 8.399084530344279e-05} +{"train_loss": 0.0048330994322896, "global_step": 19080, "epoch": 160, "lr": 8.398922045546955e-05} +{"train_loss": 0.0037222199607640505, "global_step": 19081, "epoch": 160, "lr": 8.398759554076208e-05} +{"train_loss": 0.0048430245369672775, "global_step": 19082, "epoch": 160, "lr": 8.398597055932363e-05} +{"train_loss": 0.0037783572915941477, "global_step": 19083, "epoch": 160, "lr": 8.398434551115732e-05} +{"train_loss": 0.003219109494239092, "global_step": 19084, "epoch": 160, "lr": 8.39827203962664e-05} +{"train_loss": 0.006212505977600813, "global_step": 19085, "epoch": 160, "lr": 8.398109521465404e-05} +{"train_loss": 0.006296155974268913, "global_step": 19086, "epoch": 160, "lr": 8.397946996632343e-05} +{"train_loss": 0.00542197423055768, "global_step": 19087, "epoch": 160, "lr": 8.397784465127777e-05} +{"train_loss": 0.00530362268909812, "global_step": 19088, "epoch": 160, "lr": 8.397621926952022e-05} +{"train_loss": 0.003166220150887966, "global_step": 19089, "epoch": 160, "lr": 8.3974593821054e-05} +{"train_loss": 0.004168146289885044, "global_step": 19090, "epoch": 160, "lr": 8.39729683058823e-05} +{"train_loss": 0.00493170041590929, "global_step": 19091, "epoch": 160, "lr": 8.39713427240083e-05} +{"train_loss": 0.004753417335450649, "global_step": 19092, "epoch": 160, "lr": 8.396971707543521e-05} +{"train_loss": 0.004869581665843725, "global_step": 19093, "epoch": 160, "lr": 8.396809136016618e-05} +{"train_loss": 0.007343452423810959, "global_step": 19094, "epoch": 160, "lr": 8.396646557820446e-05} +{"train_loss": 0.005113005638122559, "global_step": 19095, "epoch": 160, "lr": 8.39648397295532e-05} +{"train_loss": 0.0038861162029206753, "global_step": 19096, "epoch": 160, "lr": 8.396321381421561e-05} +{"train_loss": 0.003787076100707054, "global_step": 19097, "epoch": 160, "lr": 8.396158783219489e-05} +{"train_loss": 0.0038974639028310776, "global_step": 19098, "epoch": 160, "lr": 8.395996178349421e-05} +{"train_loss": 0.008831239305436611, "global_step": 19099, "epoch": 160, "lr": 8.395833566811677e-05} +{"train_loss": 0.004906174726784229, "global_step": 19100, "epoch": 160, "lr": 8.395670948606577e-05} +{"train_loss": 0.006077461410313845, "global_step": 19101, "epoch": 160, "lr": 8.39550832373444e-05} +{"train_loss": 0.008195515722036362, "global_step": 19102, "epoch": 160, "lr": 8.395345692195585e-05} +{"train_loss": 0.0037501512560993433, "global_step": 19103, "epoch": 160, "lr": 8.395183053990331e-05} +{"train_loss": 0.005846125073730946, "global_step": 19104, "epoch": 160, "lr": 8.395020409118999e-05} +{"train_loss": 0.0030654571019113064, "global_step": 19105, "epoch": 160, "lr": 8.394857757581907e-05} +{"train_loss": 0.00583519134670496, "global_step": 19106, "epoch": 160, "lr": 8.394695099379372e-05} +{"train_loss": 0.0042452337220311165, "global_step": 19107, "epoch": 160, "lr": 8.39453243451172e-05} +{"train_loss": 0.005987634416669607, "global_step": 19108, "epoch": 160, "lr": 8.394369762979263e-05} +{"train_loss": 0.0033868011087179184, "global_step": 19109, "epoch": 160, "lr": 8.394207084782324e-05} +{"train_loss": 0.005873618647456169, "global_step": 19110, "epoch": 160, "lr": 8.394044399921222e-05} +{"train_loss": 0.005565206054598093, "global_step": 19111, "epoch": 160, "lr": 8.393881708396278e-05} +{"train_loss": 0.004249165765941143, "global_step": 19112, "epoch": 160, "lr": 8.393719010207807e-05} +{"train_loss": 0.0044252220541238785, "global_step": 19113, "epoch": 160, "lr": 8.393556305356134e-05} +{"train_loss": 0.004661667160689831, "global_step": 19114, "epoch": 160, "lr": 8.393393593841576e-05} +{"train_loss": 0.004816305823624134, "global_step": 19115, "epoch": 160, "lr": 8.39323087566445e-05} +{"train_loss": 0.0054033356718719006, "global_step": 19116, "epoch": 160, "lr": 8.393068150825078e-05} +{"train_loss": 0.004092648159712553, "global_step": 19117, "epoch": 160, "lr": 8.392905419323782e-05} +{"train_loss": 0.004705651197582483, "global_step": 19118, "epoch": 160, "lr": 8.392742681160877e-05} +{"train_loss": 0.004207113292068243, "global_step": 19119, "epoch": 160, "lr": 8.392579936336682e-05} +{"train_loss": 0.0044599054381251335, "global_step": 19120, "epoch": 160, "lr": 8.392417184851521e-05} +{"train_loss": 0.005157019942998886, "global_step": 19121, "epoch": 160, "lr": 8.39225442670571e-05} +{"train_loss": 0.00881536677479744, "global_step": 19122, "epoch": 160, "lr": 8.392091661899571e-05} +{"train_loss": 0.0075138225220143795, "global_step": 19123, "epoch": 160, "lr": 8.391928890433422e-05} +{"train_loss": 0.0035830121487379074, "global_step": 19124, "epoch": 160, "lr": 8.391766112307584e-05} +{"train_loss": 0.004233197774738073, "global_step": 19125, "epoch": 160, "lr": 8.391603327522375e-05} +{"train_loss": 0.006227151025086641, "global_step": 19126, "epoch": 160, "lr": 8.391440536078114e-05} +{"train_loss": 0.004762852098792791, "global_step": 19127, "epoch": 160, "lr": 8.391277737975123e-05} +{"train_loss": 0.0038153822533786297, "global_step": 19128, "epoch": 160, "lr": 8.39111493321372e-05} +{"train_loss": 0.00372930895537138, "global_step": 19129, "epoch": 160, "lr": 8.390952121794225e-05} +{"train_loss": 0.006236815359443426, "global_step": 19130, "epoch": 160, "lr": 8.390789303716959e-05} +{"train_loss": 0.004761223681271076, "global_step": 19131, "epoch": 160, "lr": 8.39062647898224e-05} +{"train_loss": 0.00407975260168314, "global_step": 19132, "epoch": 160, "lr": 8.390463647590387e-05} +{"train_loss": 0.00534074055030942, "global_step": 19133, "epoch": 160, "lr": 8.39030080954172e-05} +{"train_loss": 0.004700617399066687, "global_step": 19134, "epoch": 160, "lr": 8.390137964836562e-05} +{"train_loss": 0.003107977332547307, "global_step": 19135, "epoch": 160, "lr": 8.389975113475229e-05} +{"train_loss": 0.007473386824131012, "global_step": 19136, "epoch": 160, "lr": 8.389812255458043e-05} +{"train_loss": 0.0047116405330598354, "global_step": 19137, "epoch": 160, "lr": 8.389649390785321e-05} +{"train_loss": 0.005686045158654451, "global_step": 19138, "epoch": 160, "lr": 8.389486519457387e-05} +{"train_loss": 0.003159652929753065, "global_step": 19139, "epoch": 160, "lr": 8.389323641474557e-05} +{"train_loss": 0.004462473094463348, "global_step": 19140, "epoch": 160, "lr": 8.389160756837151e-05} +{"train_loss": 0.00571411894634366, "global_step": 19141, "epoch": 160, "lr": 8.388997865545492e-05} +{"train_loss": 0.004293899983167648, "global_step": 19142, "epoch": 160, "lr": 8.388834967599897e-05} +{"train_loss": 0.005705729592591524, "global_step": 19143, "epoch": 160, "lr": 8.388672063000687e-05} +{"train_loss": 0.0048238011077046394, "global_step": 19144, "epoch": 160, "lr": 8.388509151748181e-05} +{"train_loss": 0.004835823550820351, "global_step": 19145, "epoch": 160, "lr": 8.388346233842699e-05} +{"train_loss": 0.005860100965946913, "global_step": 19146, "epoch": 160, "lr": 8.388183309284561e-05} +{"train_loss": 0.010252301581203938, "global_step": 19147, "epoch": 160, "lr": 8.388020378074086e-05} +{"train_loss": 0.004830232355743647, "global_step": 19148, "epoch": 160, "lr": 8.387857440211597e-05} +{"train_loss": 0.006397579796612263, "global_step": 19149, "epoch": 160, "lr": 8.387694495697411e-05} +{"train_loss": 0.005466316360980272, "global_step": 19150, "epoch": 160, "lr": 8.38753154453185e-05} +{"train_loss": 0.006273813080042601, "global_step": 19151, "epoch": 160, "lr": 8.387368586715231e-05} +{"train_loss": 0.0031784989405423403, "global_step": 19152, "epoch": 160, "lr": 8.387205622247877e-05} +{"train_loss": 0.0035358481109142303, "global_step": 19153, "epoch": 160, "lr": 8.387042651130106e-05} +{"train_loss": 0.006380700971931219, "global_step": 19154, "epoch": 160, "lr": 8.386879673362237e-05} +{"train_loss": 0.003522655926644802, "global_step": 19155, "epoch": 160, "lr": 8.386716688944595e-05} +{"train_loss": 0.007801894564181566, "global_step": 19156, "epoch": 160, "lr": 8.386553697877495e-05} +{"train_loss": 0.004979513585567474, "global_step": 19157, "epoch": 160, "lr": 8.386390700161258e-05} +{"train_loss": 0.005280059055980889, "global_step": 19158, "epoch": 160, "lr": 8.386227695796205e-05, "val_loss": 0.011300057172775269, "train_action_mse_error": 0.00017722192569635808} +{"train_loss": 0.008913344703614712, "global_step": 19159, "epoch": 161, "lr": 8.386064684782655e-05} +{"train_loss": 0.005997906439006329, "global_step": 19160, "epoch": 161, "lr": 8.38590166712093e-05} +{"train_loss": 0.005600334610790014, "global_step": 19161, "epoch": 161, "lr": 8.385738642811349e-05} +{"train_loss": 0.0045911772176623344, "global_step": 19162, "epoch": 161, "lr": 8.38557561185423e-05} +{"train_loss": 0.007137802429497242, "global_step": 19163, "epoch": 161, "lr": 8.385412574249896e-05} +{"train_loss": 0.004679804667830467, "global_step": 19164, "epoch": 161, "lr": 8.385249529998666e-05} +{"train_loss": 0.004945053718984127, "global_step": 19165, "epoch": 161, "lr": 8.385086479100861e-05} +{"train_loss": 0.005169510841369629, "global_step": 19166, "epoch": 161, "lr": 8.384923421556799e-05} +{"train_loss": 0.0065347859635949135, "global_step": 19167, "epoch": 161, "lr": 8.384760357366803e-05} +{"train_loss": 0.005704777780920267, "global_step": 19168, "epoch": 161, "lr": 8.38459728653119e-05} +{"train_loss": 0.005149072967469692, "global_step": 19169, "epoch": 161, "lr": 8.384434209050284e-05} +{"train_loss": 0.0031650273595005274, "global_step": 19170, "epoch": 161, "lr": 8.3842711249244e-05} +{"train_loss": 0.0066824848763644695, "global_step": 19171, "epoch": 161, "lr": 8.384108034153864e-05} +{"train_loss": 0.004660408478230238, "global_step": 19172, "epoch": 161, "lr": 8.383944936738992e-05} +{"train_loss": 0.008306709118187428, "global_step": 19173, "epoch": 161, "lr": 8.383781832680106e-05} +{"train_loss": 0.0045241001062095165, "global_step": 19174, "epoch": 161, "lr": 8.383618721977526e-05} +{"train_loss": 0.004220272414386272, "global_step": 19175, "epoch": 161, "lr": 8.383455604631573e-05} +{"train_loss": 0.005242302082479, "global_step": 19176, "epoch": 161, "lr": 8.383292480642565e-05} +{"train_loss": 0.0050964741967618465, "global_step": 19177, "epoch": 161, "lr": 8.383129350010823e-05} +{"train_loss": 0.005220624152570963, "global_step": 19178, "epoch": 161, "lr": 8.382966212736669e-05} +{"train_loss": 0.00594640988856554, "global_step": 19179, "epoch": 161, "lr": 8.382803068820421e-05} +{"train_loss": 0.007265730760991573, "global_step": 19180, "epoch": 161, "lr": 8.382639918262406e-05} +{"train_loss": 0.00984558928757906, "global_step": 19181, "epoch": 161, "lr": 8.382476761062933e-05} +{"train_loss": 0.009377246722579002, "global_step": 19182, "epoch": 161, "lr": 8.38231359722233e-05} +{"train_loss": 0.007039508782327175, "global_step": 19183, "epoch": 161, "lr": 8.382150426740916e-05} +{"train_loss": 0.00782562792301178, "global_step": 19184, "epoch": 161, "lr": 8.38198724961901e-05} +{"train_loss": 0.010165175423026085, "global_step": 19185, "epoch": 161, "lr": 8.381824065856934e-05} +{"train_loss": 0.005842292681336403, "global_step": 19186, "epoch": 161, "lr": 8.381660875455008e-05} +{"train_loss": 0.004662166349589825, "global_step": 19187, "epoch": 161, "lr": 8.381497678413552e-05} +{"train_loss": 0.006449682638049126, "global_step": 19188, "epoch": 161, "lr": 8.381334474732885e-05} +{"train_loss": 0.005010128021240234, "global_step": 19189, "epoch": 161, "lr": 8.38117126441333e-05} +{"train_loss": 0.005026140715926886, "global_step": 19190, "epoch": 161, "lr": 8.381008047455208e-05} +{"train_loss": 0.006887541618198156, "global_step": 19191, "epoch": 161, "lr": 8.380844823858836e-05} +{"train_loss": 0.007503061555325985, "global_step": 19192, "epoch": 161, "lr": 8.380681593624537e-05} +{"train_loss": 0.007183507084846497, "global_step": 19193, "epoch": 161, "lr": 8.380518356752631e-05} +{"train_loss": 0.004308708943426609, "global_step": 19194, "epoch": 161, "lr": 8.380355113243439e-05} +{"train_loss": 0.005774756893515587, "global_step": 19195, "epoch": 161, "lr": 8.38019186309728e-05} +{"train_loss": 0.00460081547498703, "global_step": 19196, "epoch": 161, "lr": 8.380028606314475e-05} +{"train_loss": 0.0038726232014596462, "global_step": 19197, "epoch": 161, "lr": 8.379865342895346e-05} +{"train_loss": 0.005948392674326897, "global_step": 19198, "epoch": 161, "lr": 8.379702072840212e-05} +{"train_loss": 0.009069845080375671, "global_step": 19199, "epoch": 161, "lr": 8.379538796149394e-05} +{"train_loss": 0.004515423439443111, "global_step": 19200, "epoch": 161, "lr": 8.379375512823214e-05} +{"train_loss": 0.005807273555546999, "global_step": 19201, "epoch": 161, "lr": 8.379212222861988e-05} +{"train_loss": 0.004155523143708706, "global_step": 19202, "epoch": 161, "lr": 8.379048926266042e-05} +{"train_loss": 0.006518156733363867, "global_step": 19203, "epoch": 161, "lr": 8.378885623035694e-05} +{"train_loss": 0.008991654962301254, "global_step": 19204, "epoch": 161, "lr": 8.378722313171265e-05} +{"train_loss": 0.00354940933175385, "global_step": 19205, "epoch": 161, "lr": 8.378558996673075e-05} +{"train_loss": 0.008497493341565132, "global_step": 19206, "epoch": 161, "lr": 8.378395673541448e-05} +{"train_loss": 0.005989468656480312, "global_step": 19207, "epoch": 161, "lr": 8.3782323437767e-05} +{"train_loss": 0.004970585461705923, "global_step": 19208, "epoch": 161, "lr": 8.378069007379154e-05} +{"train_loss": 0.007062452379614115, "global_step": 19209, "epoch": 161, "lr": 8.37790566434913e-05} +{"train_loss": 0.004985625855624676, "global_step": 19210, "epoch": 161, "lr": 8.37774231468695e-05} +{"train_loss": 0.0035694679245352745, "global_step": 19211, "epoch": 161, "lr": 8.377578958392933e-05} +{"train_loss": 0.005193250719457865, "global_step": 19212, "epoch": 161, "lr": 8.377415595467401e-05} +{"train_loss": 0.006792380474507809, "global_step": 19213, "epoch": 161, "lr": 8.377252225910674e-05} +{"train_loss": 0.004964455030858517, "global_step": 19214, "epoch": 161, "lr": 8.377088849723072e-05} +{"train_loss": 0.004637401085346937, "global_step": 19215, "epoch": 161, "lr": 8.376925466904919e-05} +{"train_loss": 0.006884654983878136, "global_step": 19216, "epoch": 161, "lr": 8.376762077456532e-05} +{"train_loss": 0.005253563169389963, "global_step": 19217, "epoch": 161, "lr": 8.376598681378234e-05} +{"train_loss": 0.004803485237061977, "global_step": 19218, "epoch": 161, "lr": 8.376435278670346e-05} +{"train_loss": 0.005031239241361618, "global_step": 19219, "epoch": 161, "lr": 8.376271869333187e-05} +{"train_loss": 0.007220471277832985, "global_step": 19220, "epoch": 161, "lr": 8.37610845336708e-05} +{"train_loss": 0.004489137791097164, "global_step": 19221, "epoch": 161, "lr": 8.375945030772342e-05} +{"train_loss": 0.008969161659479141, "global_step": 19222, "epoch": 161, "lr": 8.3757816015493e-05} +{"train_loss": 0.005594226997345686, "global_step": 19223, "epoch": 161, "lr": 8.375618165698269e-05} +{"train_loss": 0.006685678381472826, "global_step": 19224, "epoch": 161, "lr": 8.375454723219575e-05} +{"train_loss": 0.006767771206796169, "global_step": 19225, "epoch": 161, "lr": 8.375291274113535e-05} +{"train_loss": 0.005876927636563778, "global_step": 19226, "epoch": 161, "lr": 8.37512781838047e-05} +{"train_loss": 0.006201927084475756, "global_step": 19227, "epoch": 161, "lr": 8.374964356020702e-05} +{"train_loss": 0.00604374660179019, "global_step": 19228, "epoch": 161, "lr": 8.374800887034554e-05} +{"train_loss": 0.003391201375052333, "global_step": 19229, "epoch": 161, "lr": 8.374637411422344e-05} +{"train_loss": 0.006494507659226656, "global_step": 19230, "epoch": 161, "lr": 8.374473929184395e-05} +{"train_loss": 0.009412065148353577, "global_step": 19231, "epoch": 161, "lr": 8.374310440321025e-05} +{"train_loss": 0.006456868257373571, "global_step": 19232, "epoch": 161, "lr": 8.374146944832559e-05} +{"train_loss": 0.0034397209528833628, "global_step": 19233, "epoch": 161, "lr": 8.373983442719313e-05} +{"train_loss": 0.003783097490668297, "global_step": 19234, "epoch": 161, "lr": 8.373819933981614e-05} +{"train_loss": 0.008891947567462921, "global_step": 19235, "epoch": 161, "lr": 8.373656418619777e-05} +{"train_loss": 0.0072479709051549435, "global_step": 19236, "epoch": 161, "lr": 8.373492896634129e-05} +{"train_loss": 0.004026293288916349, "global_step": 19237, "epoch": 161, "lr": 8.373329368024987e-05} +{"train_loss": 0.004982903134077787, "global_step": 19238, "epoch": 161, "lr": 8.373165832792673e-05} +{"train_loss": 0.007727933116257191, "global_step": 19239, "epoch": 161, "lr": 8.373002290937508e-05} +{"train_loss": 0.007246923632919788, "global_step": 19240, "epoch": 161, "lr": 8.372838742459815e-05} +{"train_loss": 0.0050925081595778465, "global_step": 19241, "epoch": 161, "lr": 8.372675187359911e-05} +{"train_loss": 0.007288722321391106, "global_step": 19242, "epoch": 161, "lr": 8.37251162563812e-05} +{"train_loss": 0.005827142857015133, "global_step": 19243, "epoch": 161, "lr": 8.372348057294766e-05} +{"train_loss": 0.005543341860175133, "global_step": 19244, "epoch": 161, "lr": 8.372184482330163e-05} +{"train_loss": 0.004902353510260582, "global_step": 19245, "epoch": 161, "lr": 8.372020900744636e-05} +{"train_loss": 0.007403173018246889, "global_step": 19246, "epoch": 161, "lr": 8.37185731253851e-05} +{"train_loss": 0.004537290893495083, "global_step": 19247, "epoch": 161, "lr": 8.371693717712099e-05} +{"train_loss": 0.005143076181411743, "global_step": 19248, "epoch": 161, "lr": 8.371530116265729e-05} +{"train_loss": 0.005719874985516071, "global_step": 19249, "epoch": 161, "lr": 8.37136650819972e-05} +{"train_loss": 0.005194410681724548, "global_step": 19250, "epoch": 161, "lr": 8.371202893514391e-05} +{"train_loss": 0.003729365300387144, "global_step": 19251, "epoch": 161, "lr": 8.371039272210069e-05} +{"train_loss": 0.004703940823674202, "global_step": 19252, "epoch": 161, "lr": 8.370875644287067e-05} +{"train_loss": 0.007496190257370472, "global_step": 19253, "epoch": 161, "lr": 8.370712009745714e-05} +{"train_loss": 0.004612923599779606, "global_step": 19254, "epoch": 161, "lr": 8.370548368586327e-05} +{"train_loss": 0.0030730017460882664, "global_step": 19255, "epoch": 161, "lr": 8.370384720809228e-05} +{"train_loss": 0.006888607516884804, "global_step": 19256, "epoch": 161, "lr": 8.37022106641474e-05} +{"train_loss": 0.007281636353582144, "global_step": 19257, "epoch": 161, "lr": 8.370057405403182e-05} +{"train_loss": 0.002877347869798541, "global_step": 19258, "epoch": 161, "lr": 8.369893737774877e-05} +{"train_loss": 0.0030053930822759867, "global_step": 19259, "epoch": 161, "lr": 8.369730063530144e-05} +{"train_loss": 0.00699051097035408, "global_step": 19260, "epoch": 161, "lr": 8.369566382669307e-05} +{"train_loss": 0.007358086761087179, "global_step": 19261, "epoch": 161, "lr": 8.369402695192687e-05} +{"train_loss": 0.009815879166126251, "global_step": 19262, "epoch": 161, "lr": 8.369239001100603e-05} +{"train_loss": 0.00640353886410594, "global_step": 19263, "epoch": 161, "lr": 8.36907530039338e-05} +{"train_loss": 0.006616489961743355, "global_step": 19264, "epoch": 161, "lr": 8.368911593071338e-05} +{"train_loss": 0.006691079121083021, "global_step": 19265, "epoch": 161, "lr": 8.368747879134797e-05} +{"train_loss": 0.0035997412633150816, "global_step": 19266, "epoch": 161, "lr": 8.36858415858408e-05} +{"train_loss": 0.007210037671029568, "global_step": 19267, "epoch": 161, "lr": 8.368420431419507e-05} +{"train_loss": 0.004619518294930458, "global_step": 19268, "epoch": 161, "lr": 8.368256697641401e-05} +{"train_loss": 0.005758340936154127, "global_step": 19269, "epoch": 161, "lr": 8.368092957250083e-05} +{"train_loss": 0.005465678405016661, "global_step": 19270, "epoch": 161, "lr": 8.367929210245873e-05} +{"train_loss": 0.003176062135025859, "global_step": 19271, "epoch": 161, "lr": 8.367765456629096e-05} +{"train_loss": 0.007521427236497402, "global_step": 19272, "epoch": 161, "lr": 8.36760169640007e-05} +{"train_loss": 0.006481239106506109, "global_step": 19273, "epoch": 161, "lr": 8.367437929559116e-05} +{"train_loss": 0.006749110296368599, "global_step": 19274, "epoch": 161, "lr": 8.36727415610656e-05} +{"train_loss": 0.006417700555175543, "global_step": 19275, "epoch": 161, "lr": 8.36711037604272e-05} +{"train_loss": 0.0037433842662721872, "global_step": 19276, "epoch": 161, "lr": 8.366946589367919e-05} +{"train_loss": 0.005918894563762455, "global_step": 19277, "epoch": 161, "lr": 8.366782796082478e-05, "val_loss": 0.017322726547718048} +{"train_loss": 0.005802720319479704, "global_step": 19278, "epoch": 162, "lr": 8.366618996186718e-05} +{"train_loss": 0.004156878218054771, "global_step": 19279, "epoch": 162, "lr": 8.366455189680962e-05} +{"train_loss": 0.0057123927399516106, "global_step": 19280, "epoch": 162, "lr": 8.366291376565532e-05} +{"train_loss": 0.007909341715276241, "global_step": 19281, "epoch": 162, "lr": 8.366127556840746e-05} +{"train_loss": 0.0064621311612427235, "global_step": 19282, "epoch": 162, "lr": 8.365963730506929e-05} +{"train_loss": 0.005746107082813978, "global_step": 19283, "epoch": 162, "lr": 8.365799897564402e-05} +{"train_loss": 0.004056322388350964, "global_step": 19284, "epoch": 162, "lr": 8.365636058013487e-05} +{"train_loss": 0.0036724512465298176, "global_step": 19285, "epoch": 162, "lr": 8.365472211854504e-05} +{"train_loss": 0.004438953474164009, "global_step": 19286, "epoch": 162, "lr": 8.365308359087777e-05} +{"train_loss": 0.004985243082046509, "global_step": 19287, "epoch": 162, "lr": 8.365144499713627e-05} +{"train_loss": 0.0035961985122412443, "global_step": 19288, "epoch": 162, "lr": 8.364980633732373e-05} +{"train_loss": 0.0044550104066729546, "global_step": 19289, "epoch": 162, "lr": 8.364816761144341e-05} +{"train_loss": 0.004976043477654457, "global_step": 19290, "epoch": 162, "lr": 8.36465288194985e-05} +{"train_loss": 0.0073403250426054, "global_step": 19291, "epoch": 162, "lr": 8.364488996149222e-05} +{"train_loss": 0.004934493452310562, "global_step": 19292, "epoch": 162, "lr": 8.364325103742781e-05} +{"train_loss": 0.004812667611986399, "global_step": 19293, "epoch": 162, "lr": 8.364161204730846e-05} +{"train_loss": 0.004126110579818487, "global_step": 19294, "epoch": 162, "lr": 8.36399729911374e-05} +{"train_loss": 0.004190504550933838, "global_step": 19295, "epoch": 162, "lr": 8.363833386891784e-05} +{"train_loss": 0.00316569278948009, "global_step": 19296, "epoch": 162, "lr": 8.363669468065302e-05} +{"train_loss": 0.004349685274064541, "global_step": 19297, "epoch": 162, "lr": 8.363505542634614e-05} +{"train_loss": 0.007746059447526932, "global_step": 19298, "epoch": 162, "lr": 8.363341610600042e-05} +{"train_loss": 0.00449310103431344, "global_step": 19299, "epoch": 162, "lr": 8.363177671961908e-05} +{"train_loss": 0.003781820647418499, "global_step": 19300, "epoch": 162, "lr": 8.363013726720532e-05} +{"train_loss": 0.004610976669937372, "global_step": 19301, "epoch": 162, "lr": 8.36284977487624e-05} +{"train_loss": 0.004191966727375984, "global_step": 19302, "epoch": 162, "lr": 8.362685816429352e-05} +{"train_loss": 0.005376553162932396, "global_step": 19303, "epoch": 162, "lr": 8.36252185138019e-05} +{"train_loss": 0.0052010598592460155, "global_step": 19304, "epoch": 162, "lr": 8.362357879729073e-05} +{"train_loss": 0.004559202119708061, "global_step": 19305, "epoch": 162, "lr": 8.362193901476328e-05} +{"train_loss": 0.006678191479295492, "global_step": 19306, "epoch": 162, "lr": 8.362029916622274e-05} +{"train_loss": 0.0064677889458835125, "global_step": 19307, "epoch": 162, "lr": 8.361865925167232e-05} +{"train_loss": 0.005606154445558786, "global_step": 19308, "epoch": 162, "lr": 8.361701927111527e-05} +{"train_loss": 0.0063386824913322926, "global_step": 19309, "epoch": 162, "lr": 8.361537922455479e-05} +{"train_loss": 0.0038425875827670097, "global_step": 19310, "epoch": 162, "lr": 8.36137391119941e-05} +{"train_loss": 0.004416214302182198, "global_step": 19311, "epoch": 162, "lr": 8.361209893343642e-05} +{"train_loss": 0.005055862013250589, "global_step": 19312, "epoch": 162, "lr": 8.361045868888499e-05} +{"train_loss": 0.006387877743691206, "global_step": 19313, "epoch": 162, "lr": 8.3608818378343e-05} +{"train_loss": 0.004502664320170879, "global_step": 19314, "epoch": 162, "lr": 8.36071780018137e-05} +{"train_loss": 0.006048121955245733, "global_step": 19315, "epoch": 162, "lr": 8.360553755930028e-05} +{"train_loss": 0.005302839446812868, "global_step": 19316, "epoch": 162, "lr": 8.360389705080598e-05} +{"train_loss": 0.007073369808495045, "global_step": 19317, "epoch": 162, "lr": 8.360225647633404e-05} +{"train_loss": 0.005528145469725132, "global_step": 19318, "epoch": 162, "lr": 8.360061583588764e-05} +{"train_loss": 0.005875987000763416, "global_step": 19319, "epoch": 162, "lr": 8.359897512947003e-05} +{"train_loss": 0.0069443597458302975, "global_step": 19320, "epoch": 162, "lr": 8.359733435708441e-05} +{"train_loss": 0.006600157357752323, "global_step": 19321, "epoch": 162, "lr": 8.359569351873402e-05} +{"train_loss": 0.008540818467736244, "global_step": 19322, "epoch": 162, "lr": 8.359405261442207e-05} +{"train_loss": 0.0042608738876879215, "global_step": 19323, "epoch": 162, "lr": 8.359241164415178e-05} +{"train_loss": 0.006611147429794073, "global_step": 19324, "epoch": 162, "lr": 8.359077060792642e-05} +{"train_loss": 0.0049267783761024475, "global_step": 19325, "epoch": 162, "lr": 8.358912950574913e-05} +{"train_loss": 0.0067351930774748325, "global_step": 19326, "epoch": 162, "lr": 8.358748833762317e-05} +{"train_loss": 0.006385517306625843, "global_step": 19327, "epoch": 162, "lr": 8.358584710355178e-05} +{"train_loss": 0.004875676706433296, "global_step": 19328, "epoch": 162, "lr": 8.358420580353816e-05} +{"train_loss": 0.006590655539184809, "global_step": 19329, "epoch": 162, "lr": 8.358256443758555e-05} +{"train_loss": 0.004136018455028534, "global_step": 19330, "epoch": 162, "lr": 8.358092300569716e-05} +{"train_loss": 0.004152253270149231, "global_step": 19331, "epoch": 162, "lr": 8.357928150787622e-05} +{"train_loss": 0.00440027192234993, "global_step": 19332, "epoch": 162, "lr": 8.357763994412595e-05} +{"train_loss": 0.004762438591569662, "global_step": 19333, "epoch": 162, "lr": 8.357599831444955e-05} +{"train_loss": 0.006942304782569408, "global_step": 19334, "epoch": 162, "lr": 8.357435661885026e-05} +{"train_loss": 0.004836350679397583, "global_step": 19335, "epoch": 162, "lr": 8.357271485733134e-05} +{"train_loss": 0.004302039742469788, "global_step": 19336, "epoch": 162, "lr": 8.357107302989595e-05} +{"train_loss": 0.005056661553680897, "global_step": 19337, "epoch": 162, "lr": 8.356943113654739e-05} +{"train_loss": 0.009117829613387585, "global_step": 19338, "epoch": 162, "lr": 8.356778917728879e-05} +{"train_loss": 0.007558238226920366, "global_step": 19339, "epoch": 162, "lr": 8.356614715212345e-05} +{"train_loss": 0.0054237376898527145, "global_step": 19340, "epoch": 162, "lr": 8.356450506105456e-05} +{"train_loss": 0.004536093212664127, "global_step": 19341, "epoch": 162, "lr": 8.356286290408533e-05} +{"train_loss": 0.004534521605819464, "global_step": 19342, "epoch": 162, "lr": 8.356122068121902e-05} +{"train_loss": 0.004978636745363474, "global_step": 19343, "epoch": 162, "lr": 8.355957839245885e-05} +{"train_loss": 0.008039469830691814, "global_step": 19344, "epoch": 162, "lr": 8.355793603780801e-05} +{"train_loss": 0.0029481530655175447, "global_step": 19345, "epoch": 162, "lr": 8.355629361726976e-05} +{"train_loss": 0.0050714584067463875, "global_step": 19346, "epoch": 162, "lr": 8.355465113084733e-05} +{"train_loss": 0.0055315326899290085, "global_step": 19347, "epoch": 162, "lr": 8.35530085785439e-05} +{"train_loss": 0.00677338894456625, "global_step": 19348, "epoch": 162, "lr": 8.355136596036272e-05} +{"train_loss": 0.005530704744160175, "global_step": 19349, "epoch": 162, "lr": 8.354972327630705e-05} +{"train_loss": 0.005162357352674007, "global_step": 19350, "epoch": 162, "lr": 8.354808052638006e-05} +{"train_loss": 0.0034540279302746058, "global_step": 19351, "epoch": 162, "lr": 8.354643771058498e-05} +{"train_loss": 0.0062195053324103355, "global_step": 19352, "epoch": 162, "lr": 8.354479482892509e-05} +{"train_loss": 0.006317867431789637, "global_step": 19353, "epoch": 162, "lr": 8.354315188140355e-05} +{"train_loss": 0.0071627236902713776, "global_step": 19354, "epoch": 162, "lr": 8.354150886802364e-05} +{"train_loss": 0.004786267876625061, "global_step": 19355, "epoch": 162, "lr": 8.353986578878855e-05} +{"train_loss": 0.0037847484927624464, "global_step": 19356, "epoch": 162, "lr": 8.353822264370153e-05} +{"train_loss": 0.0073816897347569466, "global_step": 19357, "epoch": 162, "lr": 8.353657943276576e-05} +{"train_loss": 0.004226283170282841, "global_step": 19358, "epoch": 162, "lr": 8.353493615598452e-05} +{"train_loss": 0.00444219121709466, "global_step": 19359, "epoch": 162, "lr": 8.353329281336102e-05} +{"train_loss": 0.005252329166978598, "global_step": 19360, "epoch": 162, "lr": 8.353164940489846e-05} +{"train_loss": 0.004732341971248388, "global_step": 19361, "epoch": 162, "lr": 8.353000593060011e-05} +{"train_loss": 0.007788953371345997, "global_step": 19362, "epoch": 162, "lr": 8.352836239046917e-05} +{"train_loss": 0.004214830230921507, "global_step": 19363, "epoch": 162, "lr": 8.352671878450887e-05} +{"train_loss": 0.0050466894172132015, "global_step": 19364, "epoch": 162, "lr": 8.352507511272245e-05} +{"train_loss": 0.004815391730517149, "global_step": 19365, "epoch": 162, "lr": 8.352343137511311e-05} +{"train_loss": 0.005964827723801136, "global_step": 19366, "epoch": 162, "lr": 8.35217875716841e-05} +{"train_loss": 0.002866125898435712, "global_step": 19367, "epoch": 162, "lr": 8.352014370243863e-05} +{"train_loss": 0.006553668063133955, "global_step": 19368, "epoch": 162, "lr": 8.351849976737997e-05} +{"train_loss": 0.0037087812088429928, "global_step": 19369, "epoch": 162, "lr": 8.351685576651129e-05} +{"train_loss": 0.005119756795465946, "global_step": 19370, "epoch": 162, "lr": 8.351521169983585e-05} +{"train_loss": 0.004899153020232916, "global_step": 19371, "epoch": 162, "lr": 8.35135675673569e-05} +{"train_loss": 0.0033232762943953276, "global_step": 19372, "epoch": 162, "lr": 8.35119233690776e-05} +{"train_loss": 0.006645002402365208, "global_step": 19373, "epoch": 162, "lr": 8.351027910500123e-05} +{"train_loss": 0.00688900938257575, "global_step": 19374, "epoch": 162, "lr": 8.350863477513102e-05} +{"train_loss": 0.005351144354790449, "global_step": 19375, "epoch": 162, "lr": 8.350699037947018e-05} +{"train_loss": 0.003948912024497986, "global_step": 19376, "epoch": 162, "lr": 8.350534591802192e-05} +{"train_loss": 0.00856466218829155, "global_step": 19377, "epoch": 162, "lr": 8.350370139078953e-05} +{"train_loss": 0.004665856249630451, "global_step": 19378, "epoch": 162, "lr": 8.350205679777619e-05} +{"train_loss": 0.005243716761469841, "global_step": 19379, "epoch": 162, "lr": 8.350041213898511e-05} +{"train_loss": 0.0063543301075696945, "global_step": 19380, "epoch": 162, "lr": 8.34987674144196e-05} +{"train_loss": 0.004646315239369869, "global_step": 19381, "epoch": 162, "lr": 8.349712262408281e-05} +{"train_loss": 0.003911520354449749, "global_step": 19382, "epoch": 162, "lr": 8.3495477767978e-05} +{"train_loss": 0.005223571322858334, "global_step": 19383, "epoch": 162, "lr": 8.349383284610841e-05} +{"train_loss": 0.003780422965064645, "global_step": 19384, "epoch": 162, "lr": 8.349218785847723e-05} +{"train_loss": 0.006480622570961714, "global_step": 19385, "epoch": 162, "lr": 8.349054280508774e-05} +{"train_loss": 0.005689744837582111, "global_step": 19386, "epoch": 162, "lr": 8.348889768594314e-05} +{"train_loss": 0.005522030871361494, "global_step": 19387, "epoch": 162, "lr": 8.348725250104669e-05} +{"train_loss": 0.006044649984687567, "global_step": 19388, "epoch": 162, "lr": 8.348560725040158e-05} +{"train_loss": 0.003606125945225358, "global_step": 19389, "epoch": 162, "lr": 8.348396193401104e-05} +{"train_loss": 0.0029290777165442705, "global_step": 19390, "epoch": 162, "lr": 8.348231655187834e-05} +{"train_loss": 0.0045440420508384705, "global_step": 19391, "epoch": 162, "lr": 8.348067110400668e-05} +{"train_loss": 0.004451256711035967, "global_step": 19392, "epoch": 162, "lr": 8.34790255903993e-05} +{"train_loss": 0.007922559976577759, "global_step": 19393, "epoch": 162, "lr": 8.347738001105943e-05} +{"train_loss": 0.006331285461783409, "global_step": 19394, "epoch": 162, "lr": 8.34757343659903e-05} +{"train_loss": 0.003911053296178579, "global_step": 19395, "epoch": 162, "lr": 8.347408865519514e-05} +{"train_loss": 0.005319330997827674, "global_step": 19396, "epoch": 162, "lr": 8.347244287867719e-05, "val_loss": 0.02448105253279209} +{"train_loss": 0.00503227673470974, "global_step": 19397, "epoch": 163, "lr": 8.347079703643967e-05} +{"train_loss": 0.004373203497380018, "global_step": 19398, "epoch": 163, "lr": 8.346915112848581e-05} +{"train_loss": 0.00438147597014904, "global_step": 19399, "epoch": 163, "lr": 8.346750515481887e-05} +{"train_loss": 0.003294724738225341, "global_step": 19400, "epoch": 163, "lr": 8.346585911544204e-05} +{"train_loss": 0.0033211293630301952, "global_step": 19401, "epoch": 163, "lr": 8.346421301035858e-05} +{"train_loss": 0.004380056168884039, "global_step": 19402, "epoch": 163, "lr": 8.34625668395717e-05} +{"train_loss": 0.004808304365724325, "global_step": 19403, "epoch": 163, "lr": 8.346092060308465e-05} +{"train_loss": 0.006356860976666212, "global_step": 19404, "epoch": 163, "lr": 8.345927430090065e-05} +{"train_loss": 0.008556402288377285, "global_step": 19405, "epoch": 163, "lr": 8.345762793302296e-05} +{"train_loss": 0.004155989270657301, "global_step": 19406, "epoch": 163, "lr": 8.345598149945478e-05} +{"train_loss": 0.006286990363150835, "global_step": 19407, "epoch": 163, "lr": 8.345433500019935e-05} +{"train_loss": 0.0044600991532206535, "global_step": 19408, "epoch": 163, "lr": 8.345268843525992e-05} +{"train_loss": 0.007115548942238092, "global_step": 19409, "epoch": 163, "lr": 8.345104180463969e-05} +{"train_loss": 0.006229300517588854, "global_step": 19410, "epoch": 163, "lr": 8.344939510834194e-05} +{"train_loss": 0.004712632857263088, "global_step": 19411, "epoch": 163, "lr": 8.344774834636986e-05} +{"train_loss": 0.006697554606944323, "global_step": 19412, "epoch": 163, "lr": 8.344610151872671e-05} +{"train_loss": 0.00468837795779109, "global_step": 19413, "epoch": 163, "lr": 8.34444546254157e-05} +{"train_loss": 0.006568468175828457, "global_step": 19414, "epoch": 163, "lr": 8.344280766644008e-05} +{"train_loss": 0.0034094008151441813, "global_step": 19415, "epoch": 163, "lr": 8.344116064180307e-05} +{"train_loss": 0.006344927940517664, "global_step": 19416, "epoch": 163, "lr": 8.343951355150793e-05} +{"train_loss": 0.004993523936718702, "global_step": 19417, "epoch": 163, "lr": 8.343786639555787e-05} +{"train_loss": 0.005649579223245382, "global_step": 19418, "epoch": 163, "lr": 8.343621917395614e-05} +{"train_loss": 0.0038025658577680588, "global_step": 19419, "epoch": 163, "lr": 8.343457188670596e-05} +{"train_loss": 0.003162446664646268, "global_step": 19420, "epoch": 163, "lr": 8.343292453381058e-05} +{"train_loss": 0.007375609595328569, "global_step": 19421, "epoch": 163, "lr": 8.343127711527321e-05} +{"train_loss": 0.0037421819288283587, "global_step": 19422, "epoch": 163, "lr": 8.34296296310971e-05} +{"train_loss": 0.006120031233876944, "global_step": 19423, "epoch": 163, "lr": 8.342798208128549e-05} +{"train_loss": 0.004015082493424416, "global_step": 19424, "epoch": 163, "lr": 8.34263344658416e-05} +{"train_loss": 0.005362378433346748, "global_step": 19425, "epoch": 163, "lr": 8.342468678476868e-05} +{"train_loss": 0.005874975584447384, "global_step": 19426, "epoch": 163, "lr": 8.342303903806997e-05} +{"train_loss": 0.003821434685960412, "global_step": 19427, "epoch": 163, "lr": 8.342139122574866e-05} +{"train_loss": 0.0063114045187830925, "global_step": 19428, "epoch": 163, "lr": 8.341974334780804e-05} +{"train_loss": 0.004522772040218115, "global_step": 19429, "epoch": 163, "lr": 8.341809540425132e-05} +{"train_loss": 0.0044081308878958225, "global_step": 19430, "epoch": 163, "lr": 8.341644739508175e-05} +{"train_loss": 0.00903459545224905, "global_step": 19431, "epoch": 163, "lr": 8.341479932030256e-05} +{"train_loss": 0.003969756420701742, "global_step": 19432, "epoch": 163, "lr": 8.341315117991697e-05} +{"train_loss": 0.0039152586832642555, "global_step": 19433, "epoch": 163, "lr": 8.341150297392822e-05} +{"train_loss": 0.004562593996524811, "global_step": 19434, "epoch": 163, "lr": 8.340985470233956e-05} +{"train_loss": 0.003474595956504345, "global_step": 19435, "epoch": 163, "lr": 8.340820636515421e-05} +{"train_loss": 0.009874146431684494, "global_step": 19436, "epoch": 163, "lr": 8.340655796237545e-05} +{"train_loss": 0.006176114547997713, "global_step": 19437, "epoch": 163, "lr": 8.340490949400645e-05} +{"train_loss": 0.007345900405198336, "global_step": 19438, "epoch": 163, "lr": 8.340326096005049e-05} +{"train_loss": 0.005310744978487492, "global_step": 19439, "epoch": 163, "lr": 8.340161236051078e-05} +{"train_loss": 0.004038387443870306, "global_step": 19440, "epoch": 163, "lr": 8.339996369539061e-05} +{"train_loss": 0.00538880517706275, "global_step": 19441, "epoch": 163, "lr": 8.339831496469315e-05} +{"train_loss": 0.006428688298910856, "global_step": 19442, "epoch": 163, "lr": 8.339666616842167e-05} +{"train_loss": 0.00413260143250227, "global_step": 19443, "epoch": 163, "lr": 8.33950173065794e-05} +{"train_loss": 0.0064627500250935555, "global_step": 19444, "epoch": 163, "lr": 8.33933683791696e-05} +{"train_loss": 0.0034814905375242233, "global_step": 19445, "epoch": 163, "lr": 8.339171938619547e-05} +{"train_loss": 0.006744345650076866, "global_step": 19446, "epoch": 163, "lr": 8.339007032766027e-05} +{"train_loss": 0.0063288332894444466, "global_step": 19447, "epoch": 163, "lr": 8.338842120356723e-05} +{"train_loss": 0.007716348860412836, "global_step": 19448, "epoch": 163, "lr": 8.338677201391961e-05} +{"train_loss": 0.004778355360031128, "global_step": 19449, "epoch": 163, "lr": 8.338512275872062e-05} +{"train_loss": 0.004805167205631733, "global_step": 19450, "epoch": 163, "lr": 8.33834734379735e-05} +{"train_loss": 0.004325065296143293, "global_step": 19451, "epoch": 163, "lr": 8.338182405168151e-05} +{"train_loss": 0.005932618398219347, "global_step": 19452, "epoch": 163, "lr": 8.338017459984786e-05} +{"train_loss": 0.005398153327405453, "global_step": 19453, "epoch": 163, "lr": 8.337852508247582e-05} +{"train_loss": 0.005682527087628841, "global_step": 19454, "epoch": 163, "lr": 8.337687549956859e-05} +{"train_loss": 0.00893603079020977, "global_step": 19455, "epoch": 163, "lr": 8.337522585112945e-05} +{"train_loss": 0.0039772759191691875, "global_step": 19456, "epoch": 163, "lr": 8.337357613716162e-05} +{"train_loss": 0.00406976044178009, "global_step": 19457, "epoch": 163, "lr": 8.337192635766833e-05} +{"train_loss": 0.0031966608949005604, "global_step": 19458, "epoch": 163, "lr": 8.337027651265283e-05} +{"train_loss": 0.006666797678917646, "global_step": 19459, "epoch": 163, "lr": 8.336862660211836e-05} +{"train_loss": 0.003478537779301405, "global_step": 19460, "epoch": 163, "lr": 8.336697662606814e-05} +{"train_loss": 0.008437102660536766, "global_step": 19461, "epoch": 163, "lr": 8.336532658450545e-05} +{"train_loss": 0.005060380790382624, "global_step": 19462, "epoch": 163, "lr": 8.33636764774335e-05} +{"train_loss": 0.006868398282676935, "global_step": 19463, "epoch": 163, "lr": 8.336202630485554e-05} +{"train_loss": 0.004092202987521887, "global_step": 19464, "epoch": 163, "lr": 8.33603760667748e-05} +{"train_loss": 0.006085467990487814, "global_step": 19465, "epoch": 163, "lr": 8.335872576319452e-05} +{"train_loss": 0.005844780709594488, "global_step": 19466, "epoch": 163, "lr": 8.335707539411795e-05} +{"train_loss": 0.005340216215699911, "global_step": 19467, "epoch": 163, "lr": 8.335542495954831e-05} +{"train_loss": 0.005131823942065239, "global_step": 19468, "epoch": 163, "lr": 8.335377445948889e-05} +{"train_loss": 0.007489881478250027, "global_step": 19469, "epoch": 163, "lr": 8.335212389394287e-05} +{"train_loss": 0.004614987410604954, "global_step": 19470, "epoch": 163, "lr": 8.335047326291352e-05} +{"train_loss": 0.005397560074925423, "global_step": 19471, "epoch": 163, "lr": 8.33488225664041e-05} +{"train_loss": 0.0046454924158751965, "global_step": 19472, "epoch": 163, "lr": 8.33471718044178e-05} +{"train_loss": 0.005409194156527519, "global_step": 19473, "epoch": 163, "lr": 8.334552097695791e-05} +{"train_loss": 0.005983924493193626, "global_step": 19474, "epoch": 163, "lr": 8.334387008402766e-05} +{"train_loss": 0.004442514386028051, "global_step": 19475, "epoch": 163, "lr": 8.334221912563027e-05} +{"train_loss": 0.005075996741652489, "global_step": 19476, "epoch": 163, "lr": 8.3340568101769e-05} +{"train_loss": 0.003949479665607214, "global_step": 19477, "epoch": 163, "lr": 8.333891701244708e-05} +{"train_loss": 0.006507740821689367, "global_step": 19478, "epoch": 163, "lr": 8.333726585766774e-05} +{"train_loss": 0.006224552635103464, "global_step": 19479, "epoch": 163, "lr": 8.333561463743427e-05} +{"train_loss": 0.004925190936774015, "global_step": 19480, "epoch": 163, "lr": 8.333396335174988e-05} +{"train_loss": 0.0034363691229373217, "global_step": 19481, "epoch": 163, "lr": 8.333231200061781e-05} +{"train_loss": 0.011035824194550514, "global_step": 19482, "epoch": 163, "lr": 8.33306605840413e-05} +{"train_loss": 0.005408892408013344, "global_step": 19483, "epoch": 163, "lr": 8.332900910202359e-05} +{"train_loss": 0.005535087548196316, "global_step": 19484, "epoch": 163, "lr": 8.332735755456795e-05} +{"train_loss": 0.003174134064465761, "global_step": 19485, "epoch": 163, "lr": 8.33257059416776e-05} +{"train_loss": 0.004575324710458517, "global_step": 19486, "epoch": 163, "lr": 8.332405426335579e-05} +{"train_loss": 0.005497958045452833, "global_step": 19487, "epoch": 163, "lr": 8.332240251960574e-05} +{"train_loss": 0.006027767900377512, "global_step": 19488, "epoch": 163, "lr": 8.332075071043074e-05} +{"train_loss": 0.004244616255164146, "global_step": 19489, "epoch": 163, "lr": 8.3319098835834e-05} +{"train_loss": 0.0037084948271512985, "global_step": 19490, "epoch": 163, "lr": 8.331744689581875e-05} +{"train_loss": 0.007473485544323921, "global_step": 19491, "epoch": 163, "lr": 8.331579489038826e-05} +{"train_loss": 0.004267100244760513, "global_step": 19492, "epoch": 163, "lr": 8.331414281954578e-05} +{"train_loss": 0.008264079689979553, "global_step": 19493, "epoch": 163, "lr": 8.331249068329452e-05} +{"train_loss": 0.0044391825795173645, "global_step": 19494, "epoch": 163, "lr": 8.331083848163776e-05} +{"train_loss": 0.006048410199582577, "global_step": 19495, "epoch": 163, "lr": 8.330918621457872e-05} +{"train_loss": 0.006846277974545956, "global_step": 19496, "epoch": 163, "lr": 8.330753388212065e-05} +{"train_loss": 0.007152278907597065, "global_step": 19497, "epoch": 163, "lr": 8.33058814842668e-05} +{"train_loss": 0.0038278326392173767, "global_step": 19498, "epoch": 163, "lr": 8.33042290210204e-05} +{"train_loss": 0.006371035240590572, "global_step": 19499, "epoch": 163, "lr": 8.330257649238471e-05} +{"train_loss": 0.00700779166072607, "global_step": 19500, "epoch": 163, "lr": 8.330092389836297e-05} +{"train_loss": 0.007736771367490292, "global_step": 19501, "epoch": 163, "lr": 8.329927123895843e-05} +{"train_loss": 0.005155292339622974, "global_step": 19502, "epoch": 163, "lr": 8.329761851417432e-05} +{"train_loss": 0.007801814470440149, "global_step": 19503, "epoch": 163, "lr": 8.329596572401391e-05} +{"train_loss": 0.00851094163954258, "global_step": 19504, "epoch": 163, "lr": 8.32943128684804e-05} +{"train_loss": 0.004648536443710327, "global_step": 19505, "epoch": 163, "lr": 8.329265994757708e-05} +{"train_loss": 0.0057111033238470554, "global_step": 19506, "epoch": 163, "lr": 8.329100696130718e-05} +{"train_loss": 0.005467980168759823, "global_step": 19507, "epoch": 163, "lr": 8.328935390967394e-05} +{"train_loss": 0.006746967788785696, "global_step": 19508, "epoch": 163, "lr": 8.328770079268062e-05} +{"train_loss": 0.00540201598778367, "global_step": 19509, "epoch": 163, "lr": 8.328604761033043e-05} +{"train_loss": 0.006949775852262974, "global_step": 19510, "epoch": 163, "lr": 8.328439436262667e-05} +{"train_loss": 0.0048178331926465034, "global_step": 19511, "epoch": 163, "lr": 8.328274104957254e-05} +{"train_loss": 0.0036783397663384676, "global_step": 19512, "epoch": 163, "lr": 8.328108767117131e-05} +{"train_loss": 0.006412406452000141, "global_step": 19513, "epoch": 163, "lr": 8.327943422742623e-05} +{"train_loss": 0.0065062930807471275, "global_step": 19514, "epoch": 163, "lr": 8.327778071834052e-05} +{"train_loss": 0.0055059173336143, "global_step": 19515, "epoch": 163, "lr": 8.327612714391744e-05, "val_loss": 0.01600421592593193} +{"train_loss": 0.0036981592420488596, "global_step": 19516, "epoch": 164, "lr": 8.327447350416025e-05} +{"train_loss": 0.006652976851910353, "global_step": 19517, "epoch": 164, "lr": 8.327281979907219e-05} +{"train_loss": 0.004532308783382177, "global_step": 19518, "epoch": 164, "lr": 8.32711660286565e-05} +{"train_loss": 0.004739065654575825, "global_step": 19519, "epoch": 164, "lr": 8.326951219291644e-05} +{"train_loss": 0.003567840438336134, "global_step": 19520, "epoch": 164, "lr": 8.326785829185522e-05} +{"train_loss": 0.003460489446297288, "global_step": 19521, "epoch": 164, "lr": 8.326620432547613e-05} +{"train_loss": 0.004816947504878044, "global_step": 19522, "epoch": 164, "lr": 8.326455029378239e-05} +{"train_loss": 0.005417253356426954, "global_step": 19523, "epoch": 164, "lr": 8.326289619677727e-05} +{"train_loss": 0.004878838546574116, "global_step": 19524, "epoch": 164, "lr": 8.326124203446402e-05} +{"train_loss": 0.006420033518224955, "global_step": 19525, "epoch": 164, "lr": 8.325958780684586e-05} +{"train_loss": 0.0032985995057970285, "global_step": 19526, "epoch": 164, "lr": 8.325793351392605e-05} +{"train_loss": 0.006487079430371523, "global_step": 19527, "epoch": 164, "lr": 8.325627915570784e-05} +{"train_loss": 0.0035273537505418062, "global_step": 19528, "epoch": 164, "lr": 8.32546247321945e-05} +{"train_loss": 0.005109952297061682, "global_step": 19529, "epoch": 164, "lr": 8.325297024338923e-05} +{"train_loss": 0.004507008474320173, "global_step": 19530, "epoch": 164, "lr": 8.325131568929532e-05} +{"train_loss": 0.005450239405035973, "global_step": 19531, "epoch": 164, "lr": 8.324966106991601e-05} +{"train_loss": 0.003507760586217046, "global_step": 19532, "epoch": 164, "lr": 8.324800638525453e-05} +{"train_loss": 0.00566889438778162, "global_step": 19533, "epoch": 164, "lr": 8.324635163531414e-05} +{"train_loss": 0.0044835591688752174, "global_step": 19534, "epoch": 164, "lr": 8.32446968200981e-05} +{"train_loss": 0.0034213117323815823, "global_step": 19535, "epoch": 164, "lr": 8.324304193960964e-05} +{"train_loss": 0.006085120607167482, "global_step": 19536, "epoch": 164, "lr": 8.324138699385203e-05} +{"train_loss": 0.0034901755861938, "global_step": 19537, "epoch": 164, "lr": 8.323973198282851e-05} +{"train_loss": 0.0038383984938263893, "global_step": 19538, "epoch": 164, "lr": 8.323807690654231e-05} +{"train_loss": 0.005506900139153004, "global_step": 19539, "epoch": 164, "lr": 8.323642176499671e-05} +{"train_loss": 0.004209388978779316, "global_step": 19540, "epoch": 164, "lr": 8.323476655819493e-05} +{"train_loss": 0.007570898160338402, "global_step": 19541, "epoch": 164, "lr": 8.323311128614024e-05} +{"train_loss": 0.0032022343948483467, "global_step": 19542, "epoch": 164, "lr": 8.32314559488359e-05} +{"train_loss": 0.0049199252389371395, "global_step": 19543, "epoch": 164, "lr": 8.322980054628516e-05} +{"train_loss": 0.004432552959769964, "global_step": 19544, "epoch": 164, "lr": 8.322814507849122e-05} +{"train_loss": 0.0057721673510968685, "global_step": 19545, "epoch": 164, "lr": 8.32264895454574e-05} +{"train_loss": 0.004600904416292906, "global_step": 19546, "epoch": 164, "lr": 8.32248339471869e-05} +{"train_loss": 0.00536674028262496, "global_step": 19547, "epoch": 164, "lr": 8.322317828368298e-05} +{"train_loss": 0.007299327291548252, "global_step": 19548, "epoch": 164, "lr": 8.32215225549489e-05} +{"train_loss": 0.0050246985629200935, "global_step": 19549, "epoch": 164, "lr": 8.321986676098792e-05} +{"train_loss": 0.0036965461913496256, "global_step": 19550, "epoch": 164, "lr": 8.321821090180329e-05} +{"train_loss": 0.003434224287047982, "global_step": 19551, "epoch": 164, "lr": 8.321655497739824e-05} +{"train_loss": 0.005983536131680012, "global_step": 19552, "epoch": 164, "lr": 8.321489898777603e-05} +{"train_loss": 0.005822761915624142, "global_step": 19553, "epoch": 164, "lr": 8.321324293293992e-05} +{"train_loss": 0.006392051465809345, "global_step": 19554, "epoch": 164, "lr": 8.321158681289316e-05} +{"train_loss": 0.004733330570161343, "global_step": 19555, "epoch": 164, "lr": 8.320993062763899e-05} +{"train_loss": 0.0055056228302419186, "global_step": 19556, "epoch": 164, "lr": 8.320827437718068e-05} +{"train_loss": 0.006938959006220102, "global_step": 19557, "epoch": 164, "lr": 8.320661806152145e-05} +{"train_loss": 0.0042032115161418915, "global_step": 19558, "epoch": 164, "lr": 8.32049616806646e-05} +{"train_loss": 0.0041137076914310455, "global_step": 19559, "epoch": 164, "lr": 8.320330523461334e-05} +{"train_loss": 0.006020502652972937, "global_step": 19560, "epoch": 164, "lr": 8.320164872337093e-05} +{"train_loss": 0.006010259967297316, "global_step": 19561, "epoch": 164, "lr": 8.319999214694064e-05} +{"train_loss": 0.004277434200048447, "global_step": 19562, "epoch": 164, "lr": 8.319833550532572e-05} +{"train_loss": 0.008378453552722931, "global_step": 19563, "epoch": 164, "lr": 8.319667879852941e-05} +{"train_loss": 0.0042045083828270435, "global_step": 19564, "epoch": 164, "lr": 8.319502202655496e-05} +{"train_loss": 0.0044005513191223145, "global_step": 19565, "epoch": 164, "lr": 8.319336518940563e-05} +{"train_loss": 0.0056442818604409695, "global_step": 19566, "epoch": 164, "lr": 8.319170828708467e-05} +{"train_loss": 0.0057446314021945, "global_step": 19567, "epoch": 164, "lr": 8.319005131959534e-05} +{"train_loss": 0.004587988834828138, "global_step": 19568, "epoch": 164, "lr": 8.31883942869409e-05} +{"train_loss": 0.003917879890650511, "global_step": 19569, "epoch": 164, "lr": 8.31867371891246e-05} +{"train_loss": 0.0024035321548581123, "global_step": 19570, "epoch": 164, "lr": 8.318508002614966e-05} +{"train_loss": 0.006817938759922981, "global_step": 19571, "epoch": 164, "lr": 8.318342279801938e-05} +{"train_loss": 0.005946765653789043, "global_step": 19572, "epoch": 164, "lr": 8.318176550473698e-05} +{"train_loss": 0.003866717452183366, "global_step": 19573, "epoch": 164, "lr": 8.318010814630574e-05} +{"train_loss": 0.00311484606936574, "global_step": 19574, "epoch": 164, "lr": 8.317845072272891e-05} +{"train_loss": 0.00449969619512558, "global_step": 19575, "epoch": 164, "lr": 8.317679323400973e-05} +{"train_loss": 0.004310435615479946, "global_step": 19576, "epoch": 164, "lr": 8.317513568015146e-05} +{"train_loss": 0.007644134573638439, "global_step": 19577, "epoch": 164, "lr": 8.317347806115734e-05} +{"train_loss": 0.004471189342439175, "global_step": 19578, "epoch": 164, "lr": 8.317182037703067e-05} +{"train_loss": 0.004836380481719971, "global_step": 19579, "epoch": 164, "lr": 8.317016262777464e-05} +{"train_loss": 0.0037245675921440125, "global_step": 19580, "epoch": 164, "lr": 8.316850481339256e-05} +{"train_loss": 0.005474903155118227, "global_step": 19581, "epoch": 164, "lr": 8.316684693388767e-05} +{"train_loss": 0.004454083740711212, "global_step": 19582, "epoch": 164, "lr": 8.31651889892632e-05} +{"train_loss": 0.00450137909501791, "global_step": 19583, "epoch": 164, "lr": 8.316353097952244e-05} +{"train_loss": 0.005016962066292763, "global_step": 19584, "epoch": 164, "lr": 8.316187290466863e-05} +{"train_loss": 0.004279740154743195, "global_step": 19585, "epoch": 164, "lr": 8.316021476470501e-05} +{"train_loss": 0.003983025439083576, "global_step": 19586, "epoch": 164, "lr": 8.315855655963486e-05} +{"train_loss": 0.006712818052619696, "global_step": 19587, "epoch": 164, "lr": 8.315689828946145e-05} +{"train_loss": 0.003524291329085827, "global_step": 19588, "epoch": 164, "lr": 8.315523995418797e-05} +{"train_loss": 0.00311074685305357, "global_step": 19589, "epoch": 164, "lr": 8.315358155381775e-05} +{"train_loss": 0.00443741399794817, "global_step": 19590, "epoch": 164, "lr": 8.3151923088354e-05} +{"train_loss": 0.006008012220263481, "global_step": 19591, "epoch": 164, "lr": 8.31502645578e-05} +{"train_loss": 0.0029577172826975584, "global_step": 19592, "epoch": 164, "lr": 8.314860596215899e-05} +{"train_loss": 0.008241426199674606, "global_step": 19593, "epoch": 164, "lr": 8.314694730143423e-05} +{"train_loss": 0.004144772887229919, "global_step": 19594, "epoch": 164, "lr": 8.3145288575629e-05} +{"train_loss": 0.003204799722880125, "global_step": 19595, "epoch": 164, "lr": 8.314362978474652e-05} +{"train_loss": 0.004610039293766022, "global_step": 19596, "epoch": 164, "lr": 8.314197092879005e-05} +{"train_loss": 0.005029269959777594, "global_step": 19597, "epoch": 164, "lr": 8.31403120077629e-05} +{"train_loss": 0.0038740753661841154, "global_step": 19598, "epoch": 164, "lr": 8.313865302166825e-05} +{"train_loss": 0.004382661543786526, "global_step": 19599, "epoch": 164, "lr": 8.31369939705094e-05} +{"train_loss": 0.005638015456497669, "global_step": 19600, "epoch": 164, "lr": 8.313533485428962e-05} +{"train_loss": 0.003391210688278079, "global_step": 19601, "epoch": 164, "lr": 8.313367567301215e-05} +{"train_loss": 0.00512103084474802, "global_step": 19602, "epoch": 164, "lr": 8.313201642668024e-05} +{"train_loss": 0.004025588743388653, "global_step": 19603, "epoch": 164, "lr": 8.313035711529716e-05} +{"train_loss": 0.004945570137351751, "global_step": 19604, "epoch": 164, "lr": 8.312869773886616e-05} +{"train_loss": 0.004378124140202999, "global_step": 19605, "epoch": 164, "lr": 8.312703829739049e-05} +{"train_loss": 0.006469374988228083, "global_step": 19606, "epoch": 164, "lr": 8.312537879087344e-05} +{"train_loss": 0.0044801305048167706, "global_step": 19607, "epoch": 164, "lr": 8.312371921931823e-05} +{"train_loss": 0.003572652814909816, "global_step": 19608, "epoch": 164, "lr": 8.312205958272814e-05} +{"train_loss": 0.003961635287851095, "global_step": 19609, "epoch": 164, "lr": 8.312039988110642e-05} +{"train_loss": 0.002583750756457448, "global_step": 19610, "epoch": 164, "lr": 8.311874011445635e-05} +{"train_loss": 0.004371406976133585, "global_step": 19611, "epoch": 164, "lr": 8.311708028278115e-05} +{"train_loss": 0.003327096113935113, "global_step": 19612, "epoch": 164, "lr": 8.311542038608413e-05} +{"train_loss": 0.006416054908186197, "global_step": 19613, "epoch": 164, "lr": 8.311376042436851e-05} +{"train_loss": 0.0033894283697009087, "global_step": 19614, "epoch": 164, "lr": 8.311210039763755e-05} +{"train_loss": 0.005753337871283293, "global_step": 19615, "epoch": 164, "lr": 8.311044030589452e-05} +{"train_loss": 0.002574342768639326, "global_step": 19616, "epoch": 164, "lr": 8.310878014914268e-05} +{"train_loss": 0.007116489112377167, "global_step": 19617, "epoch": 164, "lr": 8.310711992738529e-05} +{"train_loss": 0.0038599721156060696, "global_step": 19618, "epoch": 164, "lr": 8.31054596406256e-05} +{"train_loss": 0.00659649632871151, "global_step": 19619, "epoch": 164, "lr": 8.310379928886688e-05} +{"train_loss": 0.004304814618080854, "global_step": 19620, "epoch": 164, "lr": 8.310213887211238e-05} +{"train_loss": 0.004166433122009039, "global_step": 19621, "epoch": 164, "lr": 8.310047839036538e-05} +{"train_loss": 0.007046461571007967, "global_step": 19622, "epoch": 164, "lr": 8.309881784362912e-05} +{"train_loss": 0.0031019661109894514, "global_step": 19623, "epoch": 164, "lr": 8.309715723190688e-05} +{"train_loss": 0.004041736945509911, "global_step": 19624, "epoch": 164, "lr": 8.309549655520188e-05} +{"train_loss": 0.002955622272565961, "global_step": 19625, "epoch": 164, "lr": 8.309383581351744e-05} +{"train_loss": 0.006424995139241219, "global_step": 19626, "epoch": 164, "lr": 8.309217500685675e-05} +{"train_loss": 0.005209018941968679, "global_step": 19627, "epoch": 164, "lr": 8.309051413522314e-05} +{"train_loss": 0.003502799663692713, "global_step": 19628, "epoch": 164, "lr": 8.308885319861983e-05} +{"train_loss": 0.006064210552722216, "global_step": 19629, "epoch": 164, "lr": 8.30871921970501e-05} +{"train_loss": 0.008171770721673965, "global_step": 19630, "epoch": 164, "lr": 8.308553113051721e-05} +{"train_loss": 0.00534897530451417, "global_step": 19631, "epoch": 164, "lr": 8.30838699990244e-05} +{"train_loss": 0.005122798029333353, "global_step": 19632, "epoch": 164, "lr": 8.308220880257494e-05} +{"train_loss": 0.0054841372184455395, "global_step": 19633, "epoch": 164, "lr": 8.308054754117211e-05} +{"train_loss": 0.00487292735610439, "global_step": 19634, "epoch": 164, "lr": 8.307888621481915e-05, "val_loss": 0.011872691102325916} +{"train_loss": 0.003407185198739171, "global_step": 19635, "epoch": 165, "lr": 8.307722482351934e-05} +{"train_loss": 0.005353880114853382, "global_step": 19636, "epoch": 165, "lr": 8.307556336727593e-05} +{"train_loss": 0.004703981801867485, "global_step": 19637, "epoch": 165, "lr": 8.307390184609219e-05} +{"train_loss": 0.004627676215022802, "global_step": 19638, "epoch": 165, "lr": 8.307224025997136e-05} +{"train_loss": 0.004633601289242506, "global_step": 19639, "epoch": 165, "lr": 8.307057860891672e-05} +{"train_loss": 0.006924131419509649, "global_step": 19640, "epoch": 165, "lr": 8.306891689293155e-05} +{"train_loss": 0.005334088113158941, "global_step": 19641, "epoch": 165, "lr": 8.306725511201908e-05} +{"train_loss": 0.004853802267462015, "global_step": 19642, "epoch": 165, "lr": 8.306559326618259e-05} +{"train_loss": 0.004154806956648827, "global_step": 19643, "epoch": 165, "lr": 8.306393135542535e-05} +{"train_loss": 0.00832388736307621, "global_step": 19644, "epoch": 165, "lr": 8.306226937975061e-05} +{"train_loss": 0.004502228461205959, "global_step": 19645, "epoch": 165, "lr": 8.306060733916164e-05} +{"train_loss": 0.0037894914858043194, "global_step": 19646, "epoch": 165, "lr": 8.305894523366169e-05} +{"train_loss": 0.008102980442345142, "global_step": 19647, "epoch": 165, "lr": 8.305728306325403e-05} +{"train_loss": 0.0064508928917348385, "global_step": 19648, "epoch": 165, "lr": 8.305562082794194e-05} +{"train_loss": 0.005729380529373884, "global_step": 19649, "epoch": 165, "lr": 8.305395852772864e-05} +{"train_loss": 0.006015240214765072, "global_step": 19650, "epoch": 165, "lr": 8.305229616261746e-05} +{"train_loss": 0.006229921244084835, "global_step": 19651, "epoch": 165, "lr": 8.305063373261162e-05} +{"train_loss": 0.00417381851002574, "global_step": 19652, "epoch": 165, "lr": 8.304897123771438e-05} +{"train_loss": 0.004103929735720158, "global_step": 19653, "epoch": 165, "lr": 8.304730867792902e-05} +{"train_loss": 0.005791065748780966, "global_step": 19654, "epoch": 165, "lr": 8.30456460532588e-05} +{"train_loss": 0.005523028317838907, "global_step": 19655, "epoch": 165, "lr": 8.304398336370698e-05} +{"train_loss": 0.007345070131123066, "global_step": 19656, "epoch": 165, "lr": 8.304232060927683e-05} +{"train_loss": 0.0030981453601270914, "global_step": 19657, "epoch": 165, "lr": 8.304065778997163e-05} +{"train_loss": 0.0059769367799162865, "global_step": 19658, "epoch": 165, "lr": 8.30389949057946e-05} +{"train_loss": 0.006087844260036945, "global_step": 19659, "epoch": 165, "lr": 8.303733195674905e-05} +{"train_loss": 0.0029271391686052084, "global_step": 19660, "epoch": 165, "lr": 8.303566894283824e-05} +{"train_loss": 0.0029111842159181833, "global_step": 19661, "epoch": 165, "lr": 8.30340058640654e-05} +{"train_loss": 0.0036874564830213785, "global_step": 19662, "epoch": 165, "lr": 8.303234272043385e-05} +{"train_loss": 0.004930645227432251, "global_step": 19663, "epoch": 165, "lr": 8.303067951194679e-05} +{"train_loss": 0.004856472834944725, "global_step": 19664, "epoch": 165, "lr": 8.302901623860753e-05} +{"train_loss": 0.00415596691891551, "global_step": 19665, "epoch": 165, "lr": 8.302735290041933e-05} +{"train_loss": 0.0036492468789219856, "global_step": 19666, "epoch": 165, "lr": 8.302568949738545e-05} +{"train_loss": 0.004396416712552309, "global_step": 19667, "epoch": 165, "lr": 8.302402602950917e-05} +{"train_loss": 0.0041437577456235886, "global_step": 19668, "epoch": 165, "lr": 8.302236249679371e-05} +{"train_loss": 0.0045211100950837135, "global_step": 19669, "epoch": 165, "lr": 8.30206988992424e-05} +{"train_loss": 0.00522173848003149, "global_step": 19670, "epoch": 165, "lr": 8.301903523685846e-05} +{"train_loss": 0.007037715055048466, "global_step": 19671, "epoch": 165, "lr": 8.301737150964517e-05} +{"train_loss": 0.004455359186977148, "global_step": 19672, "epoch": 165, "lr": 8.301570771760581e-05} +{"train_loss": 0.007476157508790493, "global_step": 19673, "epoch": 165, "lr": 8.301404386074362e-05} +{"train_loss": 0.0057859402149915695, "global_step": 19674, "epoch": 165, "lr": 8.301237993906189e-05} +{"train_loss": 0.003899897448718548, "global_step": 19675, "epoch": 165, "lr": 8.301071595256388e-05} +{"train_loss": 0.005246897228062153, "global_step": 19676, "epoch": 165, "lr": 8.300905190125287e-05} +{"train_loss": 0.00919376965612173, "global_step": 19677, "epoch": 165, "lr": 8.300738778513209e-05} +{"train_loss": 0.0035722251050174236, "global_step": 19678, "epoch": 165, "lr": 8.300572360420484e-05} +{"train_loss": 0.0035548866726458073, "global_step": 19679, "epoch": 165, "lr": 8.300405935847437e-05} +{"train_loss": 0.0052886358462274075, "global_step": 19680, "epoch": 165, "lr": 8.300239504794397e-05} +{"train_loss": 0.008391951210796833, "global_step": 19681, "epoch": 165, "lr": 8.300073067261689e-05} +{"train_loss": 0.005983214359730482, "global_step": 19682, "epoch": 165, "lr": 8.29990662324964e-05} +{"train_loss": 0.0038422029465436935, "global_step": 19683, "epoch": 165, "lr": 8.299740172758577e-05} +{"train_loss": 0.003737356746569276, "global_step": 19684, "epoch": 165, "lr": 8.299573715788824e-05} +{"train_loss": 0.007635652087628841, "global_step": 19685, "epoch": 165, "lr": 8.299407252340715e-05} +{"train_loss": 0.005346393678337336, "global_step": 19686, "epoch": 165, "lr": 8.299240782414568e-05} +{"train_loss": 0.0055307867005467415, "global_step": 19687, "epoch": 165, "lr": 8.299074306010717e-05} +{"train_loss": 0.005245128646492958, "global_step": 19688, "epoch": 165, "lr": 8.298907823129486e-05} +{"train_loss": 0.00578276114538312, "global_step": 19689, "epoch": 165, "lr": 8.298741333771201e-05} +{"train_loss": 0.004437230061739683, "global_step": 19690, "epoch": 165, "lr": 8.29857483793619e-05} +{"train_loss": 0.006431705318391323, "global_step": 19691, "epoch": 165, "lr": 8.298408335624778e-05} +{"train_loss": 0.0044304863549768925, "global_step": 19692, "epoch": 165, "lr": 8.298241826837297e-05} +{"train_loss": 0.006498326081782579, "global_step": 19693, "epoch": 165, "lr": 8.298075311574069e-05} +{"train_loss": 0.0056559550575912, "global_step": 19694, "epoch": 165, "lr": 8.297908789835422e-05} +{"train_loss": 0.0064264927059412, "global_step": 19695, "epoch": 165, "lr": 8.297742261621684e-05} +{"train_loss": 0.0028405014891177416, "global_step": 19696, "epoch": 165, "lr": 8.297575726933182e-05} +{"train_loss": 0.0026788068935275078, "global_step": 19697, "epoch": 165, "lr": 8.297409185770242e-05} +{"train_loss": 0.003671137848868966, "global_step": 19698, "epoch": 165, "lr": 8.297242638133188e-05} +{"train_loss": 0.006157224997878075, "global_step": 19699, "epoch": 165, "lr": 8.297076084022355e-05} +{"train_loss": 0.008582593873143196, "global_step": 19700, "epoch": 165, "lr": 8.296909523438064e-05} +{"train_loss": 0.003729467745870352, "global_step": 19701, "epoch": 165, "lr": 8.296742956380643e-05} +{"train_loss": 0.0049650282599031925, "global_step": 19702, "epoch": 165, "lr": 8.296576382850419e-05} +{"train_loss": 0.006024824921041727, "global_step": 19703, "epoch": 165, "lr": 8.29640980284772e-05} +{"train_loss": 0.004055168479681015, "global_step": 19704, "epoch": 165, "lr": 8.296243216372872e-05} +{"train_loss": 0.0031654543709009886, "global_step": 19705, "epoch": 165, "lr": 8.296076623426204e-05} +{"train_loss": 0.004033992532640696, "global_step": 19706, "epoch": 165, "lr": 8.29591002400804e-05} +{"train_loss": 0.005401396192610264, "global_step": 19707, "epoch": 165, "lr": 8.29574341811871e-05} +{"train_loss": 0.008312787860631943, "global_step": 19708, "epoch": 165, "lr": 8.295576805758538e-05} +{"train_loss": 0.004438336472958326, "global_step": 19709, "epoch": 165, "lr": 8.295410186927855e-05} +{"train_loss": 0.0046785492449998856, "global_step": 19710, "epoch": 165, "lr": 8.295243561626986e-05} +{"train_loss": 0.0046221474185585976, "global_step": 19711, "epoch": 165, "lr": 8.295076929856258e-05} +{"train_loss": 0.006786546669900417, "global_step": 19712, "epoch": 165, "lr": 8.294910291615998e-05} +{"train_loss": 0.004886398557573557, "global_step": 19713, "epoch": 165, "lr": 8.294743646906533e-05} +{"train_loss": 0.004377075470983982, "global_step": 19714, "epoch": 165, "lr": 8.294576995728193e-05} +{"train_loss": 0.004630083683878183, "global_step": 19715, "epoch": 165, "lr": 8.294410338081302e-05} +{"train_loss": 0.004488452337682247, "global_step": 19716, "epoch": 165, "lr": 8.294243673966187e-05} +{"train_loss": 0.002929295878857374, "global_step": 19717, "epoch": 165, "lr": 8.294077003383179e-05} +{"train_loss": 0.00865259300917387, "global_step": 19718, "epoch": 165, "lr": 8.2939103263326e-05} +{"train_loss": 0.0062831128016114235, "global_step": 19719, "epoch": 165, "lr": 8.293743642814782e-05} +{"train_loss": 0.003943673800677061, "global_step": 19720, "epoch": 165, "lr": 8.293576952830049e-05} +{"train_loss": 0.006129723973572254, "global_step": 19721, "epoch": 165, "lr": 8.293410256378731e-05} +{"train_loss": 0.0037882057949900627, "global_step": 19722, "epoch": 165, "lr": 8.293243553461152e-05} +{"train_loss": 0.004364417400211096, "global_step": 19723, "epoch": 165, "lr": 8.293076844077642e-05} +{"train_loss": 0.004987678490579128, "global_step": 19724, "epoch": 165, "lr": 8.292910128228527e-05} +{"train_loss": 0.005572495050728321, "global_step": 19725, "epoch": 165, "lr": 8.292743405914136e-05} +{"train_loss": 0.006004963535815477, "global_step": 19726, "epoch": 165, "lr": 8.292576677134794e-05} +{"train_loss": 0.004572113510221243, "global_step": 19727, "epoch": 165, "lr": 8.29240994189083e-05} +{"train_loss": 0.004810904152691364, "global_step": 19728, "epoch": 165, "lr": 8.29224320018257e-05} +{"train_loss": 0.005294795613735914, "global_step": 19729, "epoch": 165, "lr": 8.292076452010342e-05} +{"train_loss": 0.004661188926547766, "global_step": 19730, "epoch": 165, "lr": 8.291909697374476e-05} +{"train_loss": 0.0029895526822656393, "global_step": 19731, "epoch": 165, "lr": 8.291742936275296e-05} +{"train_loss": 0.005543718580156565, "global_step": 19732, "epoch": 165, "lr": 8.291576168713128e-05} +{"train_loss": 0.007795696146786213, "global_step": 19733, "epoch": 165, "lr": 8.291409394688303e-05} +{"train_loss": 0.0034043288324028254, "global_step": 19734, "epoch": 165, "lr": 8.291242614201148e-05} +{"train_loss": 0.007539608981460333, "global_step": 19735, "epoch": 165, "lr": 8.29107582725199e-05} +{"train_loss": 0.004292767494916916, "global_step": 19736, "epoch": 165, "lr": 8.290909033841157e-05} +{"train_loss": 0.003995207604020834, "global_step": 19737, "epoch": 165, "lr": 8.290742233968973e-05} +{"train_loss": 0.005032227374613285, "global_step": 19738, "epoch": 165, "lr": 8.29057542763577e-05} +{"train_loss": 0.0035837930627167225, "global_step": 19739, "epoch": 165, "lr": 8.290408614841874e-05} +{"train_loss": 0.004465121775865555, "global_step": 19740, "epoch": 165, "lr": 8.290241795587611e-05} +{"train_loss": 0.0038423407822847366, "global_step": 19741, "epoch": 165, "lr": 8.29007496987331e-05} +{"train_loss": 0.006247357930988073, "global_step": 19742, "epoch": 165, "lr": 8.289908137699299e-05} +{"train_loss": 0.005301177967339754, "global_step": 19743, "epoch": 165, "lr": 8.289741299065905e-05} +{"train_loss": 0.008239639922976494, "global_step": 19744, "epoch": 165, "lr": 8.289574453973455e-05} +{"train_loss": 0.0056976922787725925, "global_step": 19745, "epoch": 165, "lr": 8.289407602422276e-05} +{"train_loss": 0.009438065811991692, "global_step": 19746, "epoch": 165, "lr": 8.289240744412699e-05} +{"train_loss": 0.004211368504911661, "global_step": 19747, "epoch": 165, "lr": 8.289073879945046e-05} +{"train_loss": 0.0031592922750860453, "global_step": 19748, "epoch": 165, "lr": 8.28890700901965e-05} +{"train_loss": 0.006662044208496809, "global_step": 19749, "epoch": 165, "lr": 8.288740131636837e-05} +{"train_loss": 0.0064173052087426186, "global_step": 19750, "epoch": 165, "lr": 8.288573247796934e-05} +{"train_loss": 0.004894113168120384, "global_step": 19751, "epoch": 165, "lr": 8.288406357500267e-05} +{"train_loss": 0.004058688413351774, "global_step": 19752, "epoch": 165, "lr": 8.288239460747165e-05} +{"train_loss": 0.005199511860254682, "global_step": 19753, "epoch": 165, "lr": 8.288072557537958e-05, "val_loss": 0.023779386654496193, "train_action_mse_error": 0.00013800764281768352} +{"train_loss": 0.004876012448221445, "global_step": 19754, "epoch": 166, "lr": 8.287905647872971e-05} +{"train_loss": 0.006518930662423372, "global_step": 19755, "epoch": 166, "lr": 8.287738731752533e-05} +{"train_loss": 0.008059779182076454, "global_step": 19756, "epoch": 166, "lr": 8.28757180917697e-05} +{"train_loss": 0.003223357954993844, "global_step": 19757, "epoch": 166, "lr": 8.287404880146613e-05} +{"train_loss": 0.004334297962486744, "global_step": 19758, "epoch": 166, "lr": 8.287237944661786e-05} +{"train_loss": 0.003888003993779421, "global_step": 19759, "epoch": 166, "lr": 8.28707100272282e-05} +{"train_loss": 0.0051945289596915245, "global_step": 19760, "epoch": 166, "lr": 8.28690405433004e-05} +{"train_loss": 0.00510961189866066, "global_step": 19761, "epoch": 166, "lr": 8.286737099483776e-05} +{"train_loss": 0.00449163094162941, "global_step": 19762, "epoch": 166, "lr": 8.286570138184353e-05} +{"train_loss": 0.0060367705300450325, "global_step": 19763, "epoch": 166, "lr": 8.286403170432104e-05} +{"train_loss": 0.00550636975094676, "global_step": 19764, "epoch": 166, "lr": 8.28623619622735e-05} +{"train_loss": 0.004238843452185392, "global_step": 19765, "epoch": 166, "lr": 8.286069215570424e-05} +{"train_loss": 0.007539596874266863, "global_step": 19766, "epoch": 166, "lr": 8.285902228461652e-05} +{"train_loss": 0.00598136568441987, "global_step": 19767, "epoch": 166, "lr": 8.285735234901362e-05} +{"train_loss": 0.004932154901325703, "global_step": 19768, "epoch": 166, "lr": 8.285568234889882e-05} +{"train_loss": 0.007401888258755207, "global_step": 19769, "epoch": 166, "lr": 8.285401228427541e-05} +{"train_loss": 0.003229683032259345, "global_step": 19770, "epoch": 166, "lr": 8.285234215514664e-05} +{"train_loss": 0.006040752399712801, "global_step": 19771, "epoch": 166, "lr": 8.285067196151579e-05} +{"train_loss": 0.004128958564251661, "global_step": 19772, "epoch": 166, "lr": 8.284900170338618e-05} +{"train_loss": 0.00386754609644413, "global_step": 19773, "epoch": 166, "lr": 8.284733138076106e-05} +{"train_loss": 0.005185226909816265, "global_step": 19774, "epoch": 166, "lr": 8.28456609936437e-05} +{"train_loss": 0.003817962948232889, "global_step": 19775, "epoch": 166, "lr": 8.284399054203742e-05} +{"train_loss": 0.00533946743234992, "global_step": 19776, "epoch": 166, "lr": 8.284232002594546e-05} +{"train_loss": 0.006250204052776098, "global_step": 19777, "epoch": 166, "lr": 8.284064944537111e-05} +{"train_loss": 0.004125046078115702, "global_step": 19778, "epoch": 166, "lr": 8.283897880031766e-05} +{"train_loss": 0.00457922276109457, "global_step": 19779, "epoch": 166, "lr": 8.283730809078838e-05} +{"train_loss": 0.0028898329474031925, "global_step": 19780, "epoch": 166, "lr": 8.283563731678655e-05} +{"train_loss": 0.005670889746397734, "global_step": 19781, "epoch": 166, "lr": 8.283396647831547e-05} +{"train_loss": 0.006113047245889902, "global_step": 19782, "epoch": 166, "lr": 8.283229557537838e-05} +{"train_loss": 0.004335233010351658, "global_step": 19783, "epoch": 166, "lr": 8.283062460797858e-05} +{"train_loss": 0.005524264182895422, "global_step": 19784, "epoch": 166, "lr": 8.28289535761194e-05} +{"train_loss": 0.002832517260685563, "global_step": 19785, "epoch": 166, "lr": 8.282728247980405e-05} +{"train_loss": 0.005462591536343098, "global_step": 19786, "epoch": 166, "lr": 8.282561131903583e-05} +{"train_loss": 0.003466825932264328, "global_step": 19787, "epoch": 166, "lr": 8.282394009381803e-05} +{"train_loss": 0.003961142152547836, "global_step": 19788, "epoch": 166, "lr": 8.282226880415394e-05} +{"train_loss": 0.004064943175762892, "global_step": 19789, "epoch": 166, "lr": 8.282059745004683e-05} +{"train_loss": 0.003850105684250593, "global_step": 19790, "epoch": 166, "lr": 8.281892603149998e-05} +{"train_loss": 0.00579353142529726, "global_step": 19791, "epoch": 166, "lr": 8.281725454851668e-05} +{"train_loss": 0.0036882562562823296, "global_step": 19792, "epoch": 166, "lr": 8.281558300110021e-05} +{"train_loss": 0.004071624018251896, "global_step": 19793, "epoch": 166, "lr": 8.281391138925384e-05} +{"train_loss": 0.0066379099152982235, "global_step": 19794, "epoch": 166, "lr": 8.281223971298086e-05} +{"train_loss": 0.005755043588578701, "global_step": 19795, "epoch": 166, "lr": 8.281056797228458e-05} +{"train_loss": 0.0041803596541285515, "global_step": 19796, "epoch": 166, "lr": 8.280889616716821e-05} +{"train_loss": 0.005227202083915472, "global_step": 19797, "epoch": 166, "lr": 8.28072242976351e-05} +{"train_loss": 0.0034691591281443834, "global_step": 19798, "epoch": 166, "lr": 8.28055523636885e-05} +{"train_loss": 0.004650572780519724, "global_step": 19799, "epoch": 166, "lr": 8.280388036533171e-05} +{"train_loss": 0.004583984613418579, "global_step": 19800, "epoch": 166, "lr": 8.280220830256802e-05} +{"train_loss": 0.0045213340781629086, "global_step": 19801, "epoch": 166, "lr": 8.280053617540069e-05} +{"train_loss": 0.004856149200350046, "global_step": 19802, "epoch": 166, "lr": 8.2798863983833e-05} +{"train_loss": 0.0055879042483866215, "global_step": 19803, "epoch": 166, "lr": 8.279719172786826e-05} +{"train_loss": 0.005218972451984882, "global_step": 19804, "epoch": 166, "lr": 8.279551940750973e-05} +{"train_loss": 0.006600051186978817, "global_step": 19805, "epoch": 166, "lr": 8.279384702276069e-05} +{"train_loss": 0.005229294765740633, "global_step": 19806, "epoch": 166, "lr": 8.279217457362445e-05} +{"train_loss": 0.004313045181334019, "global_step": 19807, "epoch": 166, "lr": 8.279050206010428e-05} +{"train_loss": 0.0050811609253287315, "global_step": 19808, "epoch": 166, "lr": 8.278882948220346e-05} +{"train_loss": 0.004591909237205982, "global_step": 19809, "epoch": 166, "lr": 8.278715683992526e-05} +{"train_loss": 0.006124590523540974, "global_step": 19810, "epoch": 166, "lr": 8.2785484133273e-05} +{"train_loss": 0.004252856597304344, "global_step": 19811, "epoch": 166, "lr": 8.278381136224993e-05} +{"train_loss": 0.0036111134104430676, "global_step": 19812, "epoch": 166, "lr": 8.278213852685937e-05} +{"train_loss": 0.006224782671779394, "global_step": 19813, "epoch": 166, "lr": 8.278046562710456e-05} +{"train_loss": 0.0034940792247653008, "global_step": 19814, "epoch": 166, "lr": 8.277879266298882e-05} +{"train_loss": 0.0048281303606927395, "global_step": 19815, "epoch": 166, "lr": 8.277711963451543e-05} +{"train_loss": 0.0056051271967589855, "global_step": 19816, "epoch": 166, "lr": 8.277544654168765e-05} +{"train_loss": 0.004765716381371021, "global_step": 19817, "epoch": 166, "lr": 8.277377338450878e-05} +{"train_loss": 0.0064921071752905846, "global_step": 19818, "epoch": 166, "lr": 8.277210016298212e-05} +{"train_loss": 0.005011746659874916, "global_step": 19819, "epoch": 166, "lr": 8.277042687711094e-05} +{"train_loss": 0.002845410956069827, "global_step": 19820, "epoch": 166, "lr": 8.276875352689853e-05} +{"train_loss": 0.005161704961210489, "global_step": 19821, "epoch": 166, "lr": 8.276708011234817e-05} +{"train_loss": 0.007397470995783806, "global_step": 19822, "epoch": 166, "lr": 8.276540663346315e-05} +{"train_loss": 0.00479717506095767, "global_step": 19823, "epoch": 166, "lr": 8.276373309024676e-05} +{"train_loss": 0.00453718239441514, "global_step": 19824, "epoch": 166, "lr": 8.276205948270226e-05} +{"train_loss": 0.0049528940580785275, "global_step": 19825, "epoch": 166, "lr": 8.276038581083299e-05} +{"train_loss": 0.0030924812890589237, "global_step": 19826, "epoch": 166, "lr": 8.275871207464218e-05} +{"train_loss": 0.0031826833728700876, "global_step": 19827, "epoch": 166, "lr": 8.275703827413314e-05} +{"train_loss": 0.008200766518712044, "global_step": 19828, "epoch": 166, "lr": 8.275536440930915e-05} +{"train_loss": 0.005914008244872093, "global_step": 19829, "epoch": 166, "lr": 8.275369048017351e-05} +{"train_loss": 0.003281237091869116, "global_step": 19830, "epoch": 166, "lr": 8.27520164867295e-05} +{"train_loss": 0.005666395649313927, "global_step": 19831, "epoch": 166, "lr": 8.275034242898039e-05} +{"train_loss": 0.006684804800897837, "global_step": 19832, "epoch": 166, "lr": 8.27486683069295e-05} +{"train_loss": 0.007791012525558472, "global_step": 19833, "epoch": 166, "lr": 8.27469941205801e-05} +{"train_loss": 0.005040754564106464, "global_step": 19834, "epoch": 166, "lr": 8.274531986993545e-05} +{"train_loss": 0.00312607130035758, "global_step": 19835, "epoch": 166, "lr": 8.274364555499888e-05} +{"train_loss": 0.003767743008211255, "global_step": 19836, "epoch": 166, "lr": 8.274197117577366e-05} +{"train_loss": 0.00554924039170146, "global_step": 19837, "epoch": 166, "lr": 8.274029673226308e-05} +{"train_loss": 0.003120019566267729, "global_step": 19838, "epoch": 166, "lr": 8.273862222447041e-05} +{"train_loss": 0.0046532172709703445, "global_step": 19839, "epoch": 166, "lr": 8.273694765239898e-05} +{"train_loss": 0.003977588843554258, "global_step": 19840, "epoch": 166, "lr": 8.273527301605203e-05} +{"train_loss": 0.007290129084140062, "global_step": 19841, "epoch": 166, "lr": 8.273359831543288e-05} +{"train_loss": 0.005861317273229361, "global_step": 19842, "epoch": 166, "lr": 8.27319235505448e-05} +{"train_loss": 0.0037276586517691612, "global_step": 19843, "epoch": 166, "lr": 8.273024872139107e-05} +{"train_loss": 0.002937012119218707, "global_step": 19844, "epoch": 166, "lr": 8.272857382797502e-05} +{"train_loss": 0.006739665754139423, "global_step": 19845, "epoch": 166, "lr": 8.27268988702999e-05} +{"train_loss": 0.006422640290111303, "global_step": 19846, "epoch": 166, "lr": 8.2725223848369e-05} +{"train_loss": 0.0039423201233148575, "global_step": 19847, "epoch": 166, "lr": 8.272354876218565e-05} +{"train_loss": 0.003615201683714986, "global_step": 19848, "epoch": 166, "lr": 8.272187361175307e-05} +{"train_loss": 0.005390168633311987, "global_step": 19849, "epoch": 166, "lr": 8.272019839707461e-05} +{"train_loss": 0.004324900917708874, "global_step": 19850, "epoch": 166, "lr": 8.271852311815353e-05} +{"train_loss": 0.0035669063217937946, "global_step": 19851, "epoch": 166, "lr": 8.271684777499314e-05} +{"train_loss": 0.007955670356750488, "global_step": 19852, "epoch": 166, "lr": 8.271517236759669e-05} +{"train_loss": 0.004884242080152035, "global_step": 19853, "epoch": 166, "lr": 8.271349689596751e-05} +{"train_loss": 0.0067400638945400715, "global_step": 19854, "epoch": 166, "lr": 8.271182136010886e-05} +{"train_loss": 0.00359933590516448, "global_step": 19855, "epoch": 166, "lr": 8.271014576002406e-05} +{"train_loss": 0.006429907400161028, "global_step": 19856, "epoch": 166, "lr": 8.270847009571638e-05} +{"train_loss": 0.0036666947416961193, "global_step": 19857, "epoch": 166, "lr": 8.270679436718911e-05} +{"train_loss": 0.0042640212923288345, "global_step": 19858, "epoch": 166, "lr": 8.270511857444554e-05} +{"train_loss": 0.004822313319891691, "global_step": 19859, "epoch": 166, "lr": 8.270344271748898e-05} +{"train_loss": 0.0038691575173288584, "global_step": 19860, "epoch": 166, "lr": 8.270176679632269e-05} +{"train_loss": 0.004554225131869316, "global_step": 19861, "epoch": 166, "lr": 8.270009081094996e-05} +{"train_loss": 0.004855553153902292, "global_step": 19862, "epoch": 166, "lr": 8.269841476137412e-05} +{"train_loss": 0.004441316705197096, "global_step": 19863, "epoch": 166, "lr": 8.269673864759843e-05} +{"train_loss": 0.002732549561187625, "global_step": 19864, "epoch": 166, "lr": 8.269506246962617e-05} +{"train_loss": 0.005038238596171141, "global_step": 19865, "epoch": 166, "lr": 8.269338622746066e-05} +{"train_loss": 0.006918296217918396, "global_step": 19866, "epoch": 166, "lr": 8.269170992110519e-05} +{"train_loss": 0.005862405523657799, "global_step": 19867, "epoch": 166, "lr": 8.269003355056303e-05} +{"train_loss": 0.005126715637743473, "global_step": 19868, "epoch": 166, "lr": 8.268835711583748e-05} +{"train_loss": 0.008249680511653423, "global_step": 19869, "epoch": 166, "lr": 8.268668061693183e-05} +{"train_loss": 0.0034455943387001753, "global_step": 19870, "epoch": 166, "lr": 8.268500405384938e-05} +{"train_loss": 0.005494787823408842, "global_step": 19871, "epoch": 166, "lr": 8.268332742659341e-05} +{"train_loss": 0.004958194050499622, "global_step": 19872, "epoch": 166, "lr": 8.268165073516724e-05, "val_loss": 0.015683040022850037} +{"train_loss": 0.003157012863084674, "global_step": 19873, "epoch": 167, "lr": 8.267997397957412e-05} +{"train_loss": 0.006456452887505293, "global_step": 19874, "epoch": 167, "lr": 8.267829715981737e-05} +{"train_loss": 0.0031261672265827656, "global_step": 19875, "epoch": 167, "lr": 8.267662027590027e-05} +{"train_loss": 0.0052010612562298775, "global_step": 19876, "epoch": 167, "lr": 8.267494332782613e-05} +{"train_loss": 0.006133356597274542, "global_step": 19877, "epoch": 167, "lr": 8.267326631559821e-05} +{"train_loss": 0.006616190541535616, "global_step": 19878, "epoch": 167, "lr": 8.267158923921983e-05} +{"train_loss": 0.004087212961167097, "global_step": 19879, "epoch": 167, "lr": 8.266991209869428e-05} +{"train_loss": 0.003218297613784671, "global_step": 19880, "epoch": 167, "lr": 8.266823489402483e-05} +{"train_loss": 0.006044019479304552, "global_step": 19881, "epoch": 167, "lr": 8.26665576252148e-05} +{"train_loss": 0.005117015913128853, "global_step": 19882, "epoch": 167, "lr": 8.266488029226749e-05} +{"train_loss": 0.002929645124822855, "global_step": 19883, "epoch": 167, "lr": 8.266320289518617e-05} +{"train_loss": 0.005985802970826626, "global_step": 19884, "epoch": 167, "lr": 8.266152543397414e-05} +{"train_loss": 0.005316976923495531, "global_step": 19885, "epoch": 167, "lr": 8.265984790863469e-05} +{"train_loss": 0.005607613828033209, "global_step": 19886, "epoch": 167, "lr": 8.265817031917111e-05} +{"train_loss": 0.0044798944145441055, "global_step": 19887, "epoch": 167, "lr": 8.26564926655867e-05} +{"train_loss": 0.006121357437223196, "global_step": 19888, "epoch": 167, "lr": 8.265481494788478e-05} +{"train_loss": 0.004525794647634029, "global_step": 19889, "epoch": 167, "lr": 8.265313716606859e-05} +{"train_loss": 0.0027382296975702047, "global_step": 19890, "epoch": 167, "lr": 8.265145932014148e-05} +{"train_loss": 0.004294180311262608, "global_step": 19891, "epoch": 167, "lr": 8.26497814101067e-05} +{"train_loss": 0.0051637208089232445, "global_step": 19892, "epoch": 167, "lr": 8.264810343596757e-05} +{"train_loss": 0.003776153549551964, "global_step": 19893, "epoch": 167, "lr": 8.264642539772737e-05} +{"train_loss": 0.005395837593823671, "global_step": 19894, "epoch": 167, "lr": 8.264474729538942e-05} +{"train_loss": 0.005201405845582485, "global_step": 19895, "epoch": 167, "lr": 8.264306912895698e-05} +{"train_loss": 0.006584384944289923, "global_step": 19896, "epoch": 167, "lr": 8.264139089843337e-05} +{"train_loss": 0.005154287442564964, "global_step": 19897, "epoch": 167, "lr": 8.263971260382186e-05} +{"train_loss": 0.0034304040018469095, "global_step": 19898, "epoch": 167, "lr": 8.263803424512577e-05} +{"train_loss": 0.004708585329353809, "global_step": 19899, "epoch": 167, "lr": 8.263635582234839e-05} +{"train_loss": 0.005116267595440149, "global_step": 19900, "epoch": 167, "lr": 8.263467733549301e-05} +{"train_loss": 0.004225804004818201, "global_step": 19901, "epoch": 167, "lr": 8.263299878456294e-05} +{"train_loss": 0.0034093777649104595, "global_step": 19902, "epoch": 167, "lr": 8.263132016956145e-05} +{"train_loss": 0.0034969141706824303, "global_step": 19903, "epoch": 167, "lr": 8.262964149049184e-05} +{"train_loss": 0.00501237390562892, "global_step": 19904, "epoch": 167, "lr": 8.262796274735743e-05} +{"train_loss": 0.00537957064807415, "global_step": 19905, "epoch": 167, "lr": 8.26262839401615e-05} +{"train_loss": 0.003714738879352808, "global_step": 19906, "epoch": 167, "lr": 8.262460506890733e-05} +{"train_loss": 0.005352332256734371, "global_step": 19907, "epoch": 167, "lr": 8.262292613359826e-05} +{"train_loss": 0.0046064588241279125, "global_step": 19908, "epoch": 167, "lr": 8.262124713423755e-05} +{"train_loss": 0.004487196449190378, "global_step": 19909, "epoch": 167, "lr": 8.261956807082849e-05} +{"train_loss": 0.004974631126970053, "global_step": 19910, "epoch": 167, "lr": 8.261788894337441e-05} +{"train_loss": 0.007419934496283531, "global_step": 19911, "epoch": 167, "lr": 8.261620975187858e-05} +{"train_loss": 0.004403149243444204, "global_step": 19912, "epoch": 167, "lr": 8.261453049634431e-05} +{"train_loss": 0.0047164177522063255, "global_step": 19913, "epoch": 167, "lr": 8.261285117677491e-05} +{"train_loss": 0.006772034801542759, "global_step": 19914, "epoch": 167, "lr": 8.261117179317364e-05} +{"train_loss": 0.006700264289975166, "global_step": 19915, "epoch": 167, "lr": 8.260949234554383e-05} +{"train_loss": 0.003382398746907711, "global_step": 19916, "epoch": 167, "lr": 8.260781283388876e-05} +{"train_loss": 0.0032813672441989183, "global_step": 19917, "epoch": 167, "lr": 8.260613325821173e-05} +{"train_loss": 0.006508497521281242, "global_step": 19918, "epoch": 167, "lr": 8.260445361851604e-05} +{"train_loss": 0.004845093470066786, "global_step": 19919, "epoch": 167, "lr": 8.2602773914805e-05} +{"train_loss": 0.004438948351889849, "global_step": 19920, "epoch": 167, "lr": 8.260109414708189e-05} +{"train_loss": 0.003357867244631052, "global_step": 19921, "epoch": 167, "lr": 8.259941431535001e-05} +{"train_loss": 0.004596385173499584, "global_step": 19922, "epoch": 167, "lr": 8.259773441961267e-05} +{"train_loss": 0.0029617133550345898, "global_step": 19923, "epoch": 167, "lr": 8.259605445987315e-05} +{"train_loss": 0.007944677956402302, "global_step": 19924, "epoch": 167, "lr": 8.259437443613477e-05} +{"train_loss": 0.005216365214437246, "global_step": 19925, "epoch": 167, "lr": 8.259269434840082e-05} +{"train_loss": 0.0041912323795259, "global_step": 19926, "epoch": 167, "lr": 8.25910141966746e-05} +{"train_loss": 0.0065384660847485065, "global_step": 19927, "epoch": 167, "lr": 8.258933398095939e-05} +{"train_loss": 0.0038044662214815617, "global_step": 19928, "epoch": 167, "lr": 8.258765370125852e-05} +{"train_loss": 0.004991085268557072, "global_step": 19929, "epoch": 167, "lr": 8.258597335757525e-05} +{"train_loss": 0.00288205174729228, "global_step": 19930, "epoch": 167, "lr": 8.258429294991292e-05} +{"train_loss": 0.006484791170805693, "global_step": 19931, "epoch": 167, "lr": 8.25826124782748e-05} +{"train_loss": 0.00490263057872653, "global_step": 19932, "epoch": 167, "lr": 8.258093194266423e-05} +{"train_loss": 0.0071665821596980095, "global_step": 19933, "epoch": 167, "lr": 8.257925134308446e-05} +{"train_loss": 0.003955803345888853, "global_step": 19934, "epoch": 167, "lr": 8.25775706795388e-05} +{"train_loss": 0.004616349004209042, "global_step": 19935, "epoch": 167, "lr": 8.257588995203058e-05} +{"train_loss": 0.005384967662394047, "global_step": 19936, "epoch": 167, "lr": 8.257420916056308e-05} +{"train_loss": 0.005602279677987099, "global_step": 19937, "epoch": 167, "lr": 8.257252830513958e-05} +{"train_loss": 0.0038336629513651133, "global_step": 19938, "epoch": 167, "lr": 8.257084738576342e-05} +{"train_loss": 0.006963461637496948, "global_step": 19939, "epoch": 167, "lr": 8.256916640243788e-05} +{"train_loss": 0.004069473594427109, "global_step": 19940, "epoch": 167, "lr": 8.256748535516625e-05} +{"train_loss": 0.003580329241231084, "global_step": 19941, "epoch": 167, "lr": 8.256580424395185e-05} +{"train_loss": 0.005982464645057917, "global_step": 19942, "epoch": 167, "lr": 8.256412306879797e-05} +{"train_loss": 0.0058448477648198605, "global_step": 19943, "epoch": 167, "lr": 8.256244182970791e-05} +{"train_loss": 0.0026150874327868223, "global_step": 19944, "epoch": 167, "lr": 8.256076052668499e-05} +{"train_loss": 0.0034038671292364597, "global_step": 19945, "epoch": 167, "lr": 8.255907915973247e-05} +{"train_loss": 0.003949717618525028, "global_step": 19946, "epoch": 167, "lr": 8.255739772885369e-05} +{"train_loss": 0.005908550228923559, "global_step": 19947, "epoch": 167, "lr": 8.255571623405194e-05} +{"train_loss": 0.00271564070135355, "global_step": 19948, "epoch": 167, "lr": 8.255403467533051e-05} +{"train_loss": 0.0035638592671602964, "global_step": 19949, "epoch": 167, "lr": 8.255235305269273e-05} +{"train_loss": 0.006231515668332577, "global_step": 19950, "epoch": 167, "lr": 8.255067136614188e-05} +{"train_loss": 0.0056620435789227486, "global_step": 19951, "epoch": 167, "lr": 8.254898961568125e-05} +{"train_loss": 0.003989031538367271, "global_step": 19952, "epoch": 167, "lr": 8.254730780131416e-05} +{"train_loss": 0.0055077653378248215, "global_step": 19953, "epoch": 167, "lr": 8.25456259230439e-05} +{"train_loss": 0.0061910864897072315, "global_step": 19954, "epoch": 167, "lr": 8.25439439808738e-05} +{"train_loss": 0.005381870549172163, "global_step": 19955, "epoch": 167, "lr": 8.254226197480712e-05} +{"train_loss": 0.005560177844017744, "global_step": 19956, "epoch": 167, "lr": 8.25405799048472e-05} +{"train_loss": 0.006196779198944569, "global_step": 19957, "epoch": 167, "lr": 8.253889777099733e-05} +{"train_loss": 0.0041605085134506226, "global_step": 19958, "epoch": 167, "lr": 8.253721557326081e-05} +{"train_loss": 0.005087490659207106, "global_step": 19959, "epoch": 167, "lr": 8.253553331164095e-05} +{"train_loss": 0.003637998830527067, "global_step": 19960, "epoch": 167, "lr": 8.253385098614101e-05} +{"train_loss": 0.005634843371808529, "global_step": 19961, "epoch": 167, "lr": 8.253216859676436e-05} +{"train_loss": 0.004775464069098234, "global_step": 19962, "epoch": 167, "lr": 8.253048614351428e-05} +{"train_loss": 0.0030735679902136326, "global_step": 19963, "epoch": 167, "lr": 8.252880362639405e-05} +{"train_loss": 0.006033577956259251, "global_step": 19964, "epoch": 167, "lr": 8.252712104540698e-05} +{"train_loss": 0.00581183098256588, "global_step": 19965, "epoch": 167, "lr": 8.25254384005564e-05} +{"train_loss": 0.006223834119737148, "global_step": 19966, "epoch": 167, "lr": 8.252375569184559e-05} +{"train_loss": 0.005478001199662685, "global_step": 19967, "epoch": 167, "lr": 8.252207291927787e-05} +{"train_loss": 0.006497287657111883, "global_step": 19968, "epoch": 167, "lr": 8.252039008285652e-05} +{"train_loss": 0.004129288252443075, "global_step": 19969, "epoch": 167, "lr": 8.251870718258487e-05} +{"train_loss": 0.0027686641551554203, "global_step": 19970, "epoch": 167, "lr": 8.25170242184662e-05} +{"train_loss": 0.006241000257432461, "global_step": 19971, "epoch": 167, "lr": 8.251534119050383e-05} +{"train_loss": 0.005263513419777155, "global_step": 19972, "epoch": 167, "lr": 8.251365809870108e-05} +{"train_loss": 0.0038748998194932938, "global_step": 19973, "epoch": 167, "lr": 8.251197494306122e-05} +{"train_loss": 0.004675472620874643, "global_step": 19974, "epoch": 167, "lr": 8.251029172358757e-05} +{"train_loss": 0.004915222525596619, "global_step": 19975, "epoch": 167, "lr": 8.250860844028343e-05} +{"train_loss": 0.006126081105321646, "global_step": 19976, "epoch": 167, "lr": 8.250692509315213e-05} +{"train_loss": 0.0057399095967411995, "global_step": 19977, "epoch": 167, "lr": 8.250524168219693e-05} +{"train_loss": 0.007127279881387949, "global_step": 19978, "epoch": 167, "lr": 8.250355820742118e-05} +{"train_loss": 0.0035004126839339733, "global_step": 19979, "epoch": 167, "lr": 8.250187466882816e-05} +{"train_loss": 0.00499007198959589, "global_step": 19980, "epoch": 167, "lr": 8.250019106642117e-05} +{"train_loss": 0.006119012366980314, "global_step": 19981, "epoch": 167, "lr": 8.249850740020355e-05} +{"train_loss": 0.006923815235495567, "global_step": 19982, "epoch": 167, "lr": 8.249682367017858e-05} +{"train_loss": 0.009058437310159206, "global_step": 19983, "epoch": 167, "lr": 8.249513987634956e-05} +{"train_loss": 0.004058064427226782, "global_step": 19984, "epoch": 167, "lr": 8.24934560187198e-05} +{"train_loss": 0.004626715090125799, "global_step": 19985, "epoch": 167, "lr": 8.249177209729262e-05} +{"train_loss": 0.005290116649121046, "global_step": 19986, "epoch": 167, "lr": 8.24900881120713e-05} +{"train_loss": 0.005069154780358076, "global_step": 19987, "epoch": 167, "lr": 8.248840406305918e-05} +{"train_loss": 0.003376611741259694, "global_step": 19988, "epoch": 167, "lr": 8.248671995025953e-05} +{"train_loss": 0.003467629663646221, "global_step": 19989, "epoch": 167, "lr": 8.24850357736757e-05} +{"train_loss": 0.008511761203408241, "global_step": 19990, "epoch": 167, "lr": 8.248335153331097e-05} +{"train_loss": 0.004972072408198058, "global_step": 19991, "epoch": 167, "lr": 8.248166722916863e-05, "val_loss": 0.017913950607180595} +{"train_loss": 0.007385783363133669, "global_step": 19992, "epoch": 168, "lr": 8.247998286125203e-05} +{"train_loss": 0.0054788668639957905, "global_step": 19993, "epoch": 168, "lr": 8.247829842956443e-05} +{"train_loss": 0.0048245773650705814, "global_step": 19994, "epoch": 168, "lr": 8.247661393410919e-05} +{"train_loss": 0.004846170544624329, "global_step": 19995, "epoch": 168, "lr": 8.247492937488957e-05} +{"train_loss": 0.004013998433947563, "global_step": 19996, "epoch": 168, "lr": 8.247324475190888e-05} +{"train_loss": 0.005439976695924997, "global_step": 19997, "epoch": 168, "lr": 8.247156006517047e-05} +{"train_loss": 0.006638416089117527, "global_step": 19998, "epoch": 168, "lr": 8.24698753146776e-05} +{"train_loss": 0.006781857460737228, "global_step": 19999, "epoch": 168, "lr": 8.246819050043362e-05} +{"train_loss": 0.0050940727815032005, "global_step": 20000, "epoch": 168, "lr": 8.24665056224418e-05} +{"train_loss": 0.004503094591200352, "global_step": 20001, "epoch": 168, "lr": 8.246482068070547e-05} +{"train_loss": 0.006351051386445761, "global_step": 20002, "epoch": 168, "lr": 8.246313567522794e-05} +{"train_loss": 0.004308752249926329, "global_step": 20003, "epoch": 168, "lr": 8.24614506060125e-05} +{"train_loss": 0.00419963663443923, "global_step": 20004, "epoch": 168, "lr": 8.245976547306248e-05} +{"train_loss": 0.0069151767529547215, "global_step": 20005, "epoch": 168, "lr": 8.245808027638117e-05} +{"train_loss": 0.004203291609883308, "global_step": 20006, "epoch": 168, "lr": 8.245639501597189e-05} +{"train_loss": 0.0053374795243144035, "global_step": 20007, "epoch": 168, "lr": 8.245470969183795e-05} +{"train_loss": 0.005142877344042063, "global_step": 20008, "epoch": 168, "lr": 8.245302430398265e-05} +{"train_loss": 0.00491657480597496, "global_step": 20009, "epoch": 168, "lr": 8.24513388524093e-05} +{"train_loss": 0.0035835299640893936, "global_step": 20010, "epoch": 168, "lr": 8.244965333712123e-05} +{"train_loss": 0.003564076032489538, "global_step": 20011, "epoch": 168, "lr": 8.244796775812172e-05} +{"train_loss": 0.006510515697300434, "global_step": 20012, "epoch": 168, "lr": 8.244628211541408e-05} +{"train_loss": 0.0036659161560237408, "global_step": 20013, "epoch": 168, "lr": 8.244459640900165e-05} +{"train_loss": 0.006838307250291109, "global_step": 20014, "epoch": 168, "lr": 8.244291063888771e-05} +{"train_loss": 0.004384579136967659, "global_step": 20015, "epoch": 168, "lr": 8.244122480507559e-05} +{"train_loss": 0.003096026601269841, "global_step": 20016, "epoch": 168, "lr": 8.24395389075686e-05} +{"train_loss": 0.0057886457070708275, "global_step": 20017, "epoch": 168, "lr": 8.243785294637001e-05} +{"train_loss": 0.005157915875315666, "global_step": 20018, "epoch": 168, "lr": 8.243616692148318e-05} +{"train_loss": 0.006610470358282328, "global_step": 20019, "epoch": 168, "lr": 8.243448083291141e-05} +{"train_loss": 0.0037986126262694597, "global_step": 20020, "epoch": 168, "lr": 8.243279468065799e-05} +{"train_loss": 0.005132091697305441, "global_step": 20021, "epoch": 168, "lr": 8.243110846472624e-05} +{"train_loss": 0.0040527405217289925, "global_step": 20022, "epoch": 168, "lr": 8.242942218511947e-05} +{"train_loss": 0.009213032200932503, "global_step": 20023, "epoch": 168, "lr": 8.242773584184101e-05} +{"train_loss": 0.005200079642236233, "global_step": 20024, "epoch": 168, "lr": 8.242604943489415e-05} +{"train_loss": 0.005846192594617605, "global_step": 20025, "epoch": 168, "lr": 8.24243629642822e-05} +{"train_loss": 0.0033522499725222588, "global_step": 20026, "epoch": 168, "lr": 8.242267643000849e-05} +{"train_loss": 0.0034662007819861174, "global_step": 20027, "epoch": 168, "lr": 8.24209898320763e-05} +{"train_loss": 0.002883759792894125, "global_step": 20028, "epoch": 168, "lr": 8.241930317048897e-05} +{"train_loss": 0.003973192535340786, "global_step": 20029, "epoch": 168, "lr": 8.24176164452498e-05} +{"train_loss": 0.006129307672381401, "global_step": 20030, "epoch": 168, "lr": 8.241592965636211e-05} +{"train_loss": 0.004227886442095041, "global_step": 20031, "epoch": 168, "lr": 8.24142428038292e-05} +{"train_loss": 0.005184120498597622, "global_step": 20032, "epoch": 168, "lr": 8.24125558876544e-05} +{"train_loss": 0.004567284137010574, "global_step": 20033, "epoch": 168, "lr": 8.241086890784099e-05} +{"train_loss": 0.0033046023454517126, "global_step": 20034, "epoch": 168, "lr": 8.240918186439231e-05} +{"train_loss": 0.003615760011598468, "global_step": 20035, "epoch": 168, "lr": 8.240749475731166e-05} +{"train_loss": 0.007347537204623222, "global_step": 20036, "epoch": 168, "lr": 8.240580758660235e-05} +{"train_loss": 0.00368315982632339, "global_step": 20037, "epoch": 168, "lr": 8.24041203522677e-05} +{"train_loss": 0.0046076904982328415, "global_step": 20038, "epoch": 168, "lr": 8.240243305431104e-05} +{"train_loss": 0.004575327038764954, "global_step": 20039, "epoch": 168, "lr": 8.240074569273567e-05} +{"train_loss": 0.003475258592516184, "global_step": 20040, "epoch": 168, "lr": 8.239905826754486e-05} +{"train_loss": 0.004019506741315126, "global_step": 20041, "epoch": 168, "lr": 8.239737077874198e-05} +{"train_loss": 0.005296229850500822, "global_step": 20042, "epoch": 168, "lr": 8.239568322633033e-05} +{"train_loss": 0.003847825573757291, "global_step": 20043, "epoch": 168, "lr": 8.23939956103132e-05} +{"train_loss": 0.0036996561102569103, "global_step": 20044, "epoch": 168, "lr": 8.239230793069394e-05} +{"train_loss": 0.0036914441734552383, "global_step": 20045, "epoch": 168, "lr": 8.239062018747583e-05} +{"train_loss": 0.003123744623735547, "global_step": 20046, "epoch": 168, "lr": 8.23889323806622e-05} +{"train_loss": 0.00393102690577507, "global_step": 20047, "epoch": 168, "lr": 8.238724451025637e-05} +{"train_loss": 0.004296697676181793, "global_step": 20048, "epoch": 168, "lr": 8.238555657626165e-05} +{"train_loss": 0.005514972377568483, "global_step": 20049, "epoch": 168, "lr": 8.238386857868134e-05} +{"train_loss": 0.0032772698905318975, "global_step": 20050, "epoch": 168, "lr": 8.238218051751876e-05} +{"train_loss": 0.0053552850149571896, "global_step": 20051, "epoch": 168, "lr": 8.238049239277723e-05} +{"train_loss": 0.0033425104338675737, "global_step": 20052, "epoch": 168, "lr": 8.237880420446007e-05} +{"train_loss": 0.00886109285056591, "global_step": 20053, "epoch": 168, "lr": 8.237711595257058e-05} +{"train_loss": 0.00885405857115984, "global_step": 20054, "epoch": 168, "lr": 8.237542763711208e-05} +{"train_loss": 0.004164779093116522, "global_step": 20055, "epoch": 168, "lr": 8.237373925808788e-05} +{"train_loss": 0.004168621730059385, "global_step": 20056, "epoch": 168, "lr": 8.237205081550132e-05} +{"train_loss": 0.0030501573346555233, "global_step": 20057, "epoch": 168, "lr": 8.237036230935568e-05} +{"train_loss": 0.003991149365901947, "global_step": 20058, "epoch": 168, "lr": 8.236867373965431e-05} +{"train_loss": 0.00552851427346468, "global_step": 20059, "epoch": 168, "lr": 8.236698510640051e-05} +{"train_loss": 0.006055950187146664, "global_step": 20060, "epoch": 168, "lr": 8.236529640959757e-05} +{"train_loss": 0.0064016361720860004, "global_step": 20061, "epoch": 168, "lr": 8.236360764924883e-05} +{"train_loss": 0.006042590830475092, "global_step": 20062, "epoch": 168, "lr": 8.236191882535762e-05} +{"train_loss": 0.007124430499970913, "global_step": 20063, "epoch": 168, "lr": 8.236022993792722e-05} +{"train_loss": 0.004811664577573538, "global_step": 20064, "epoch": 168, "lr": 8.235854098696098e-05} +{"train_loss": 0.00578464986756444, "global_step": 20065, "epoch": 168, "lr": 8.23568519724622e-05} +{"train_loss": 0.0029626362957060337, "global_step": 20066, "epoch": 168, "lr": 8.235516289443421e-05} +{"train_loss": 0.0063545615412294865, "global_step": 20067, "epoch": 168, "lr": 8.23534737528803e-05} +{"train_loss": 0.002953748218715191, "global_step": 20068, "epoch": 168, "lr": 8.23517845478038e-05} +{"train_loss": 0.00939185731112957, "global_step": 20069, "epoch": 168, "lr": 8.235009527920802e-05} +{"train_loss": 0.002505389042198658, "global_step": 20070, "epoch": 168, "lr": 8.23484059470963e-05} +{"train_loss": 0.0030634107533842325, "global_step": 20071, "epoch": 168, "lr": 8.234671655147194e-05} +{"train_loss": 0.0043555255979299545, "global_step": 20072, "epoch": 168, "lr": 8.234502709233825e-05} +{"train_loss": 0.004501288756728172, "global_step": 20073, "epoch": 168, "lr": 8.234333756969855e-05} +{"train_loss": 0.007121930364519358, "global_step": 20074, "epoch": 168, "lr": 8.234164798355617e-05} +{"train_loss": 0.004130862187594175, "global_step": 20075, "epoch": 168, "lr": 8.233995833391441e-05} +{"train_loss": 0.005660088267177343, "global_step": 20076, "epoch": 168, "lr": 8.233826862077662e-05} +{"train_loss": 0.00450637424364686, "global_step": 20077, "epoch": 168, "lr": 8.233657884414607e-05} +{"train_loss": 0.004387688357383013, "global_step": 20078, "epoch": 168, "lr": 8.233488900402612e-05} +{"train_loss": 0.0037539273034781218, "global_step": 20079, "epoch": 168, "lr": 8.233319910042006e-05} +{"train_loss": 0.004700754769146442, "global_step": 20080, "epoch": 168, "lr": 8.233150913333122e-05} +{"train_loss": 0.0047402638010680676, "global_step": 20081, "epoch": 168, "lr": 8.232981910276292e-05} +{"train_loss": 0.006642476189881563, "global_step": 20082, "epoch": 168, "lr": 8.232812900871846e-05} +{"train_loss": 0.00533932214602828, "global_step": 20083, "epoch": 168, "lr": 8.23264388512012e-05} +{"train_loss": 0.003899648319929838, "global_step": 20084, "epoch": 168, "lr": 8.23247486302144e-05} +{"train_loss": 0.006735149770975113, "global_step": 20085, "epoch": 168, "lr": 8.232305834576141e-05} +{"train_loss": 0.0025024698115885258, "global_step": 20086, "epoch": 168, "lr": 8.232136799784558e-05} +{"train_loss": 0.004973734263330698, "global_step": 20087, "epoch": 168, "lr": 8.231967758647016e-05} +{"train_loss": 0.004137110430747271, "global_step": 20088, "epoch": 168, "lr": 8.231798711163854e-05} +{"train_loss": 0.0033858749084174633, "global_step": 20089, "epoch": 168, "lr": 8.231629657335399e-05} +{"train_loss": 0.0041922470554709435, "global_step": 20090, "epoch": 168, "lr": 8.231460597161985e-05} +{"train_loss": 0.0046098604798316956, "global_step": 20091, "epoch": 168, "lr": 8.231291530643941e-05} +{"train_loss": 0.004631571471691132, "global_step": 20092, "epoch": 168, "lr": 8.231122457781604e-05} +{"train_loss": 0.006359637249261141, "global_step": 20093, "epoch": 168, "lr": 8.230953378575301e-05} +{"train_loss": 0.004489008337259293, "global_step": 20094, "epoch": 168, "lr": 8.230784293025367e-05} +{"train_loss": 0.005328961182385683, "global_step": 20095, "epoch": 168, "lr": 8.230615201132134e-05} +{"train_loss": 0.008064388297498226, "global_step": 20096, "epoch": 168, "lr": 8.230446102895933e-05} +{"train_loss": 0.006223637145012617, "global_step": 20097, "epoch": 168, "lr": 8.230276998317097e-05} +{"train_loss": 0.006255935411900282, "global_step": 20098, "epoch": 168, "lr": 8.230107887395955e-05} +{"train_loss": 0.005459454841911793, "global_step": 20099, "epoch": 168, "lr": 8.229938770132843e-05} +{"train_loss": 0.007636000402271748, "global_step": 20100, "epoch": 168, "lr": 8.22976964652809e-05} +{"train_loss": 0.004628846887499094, "global_step": 20101, "epoch": 168, "lr": 8.22960051658203e-05} +{"train_loss": 0.005051945801824331, "global_step": 20102, "epoch": 168, "lr": 8.229431380294996e-05} +{"train_loss": 0.004939098842442036, "global_step": 20103, "epoch": 168, "lr": 8.229262237667317e-05} +{"train_loss": 0.0030450737103819847, "global_step": 20104, "epoch": 168, "lr": 8.229093088699326e-05} +{"train_loss": 0.005007551517337561, "global_step": 20105, "epoch": 168, "lr": 8.228923933391357e-05} +{"train_loss": 0.0033118599094450474, "global_step": 20106, "epoch": 168, "lr": 8.228754771743738e-05} +{"train_loss": 0.003678311826661229, "global_step": 20107, "epoch": 168, "lr": 8.228585603756808e-05} +{"train_loss": 0.004320783074945211, "global_step": 20108, "epoch": 168, "lr": 8.228416429430892e-05} +{"train_loss": 0.005033449735492468, "global_step": 20109, "epoch": 168, "lr": 8.228247248766328e-05} +{"train_loss": 0.004930454280869174, "global_step": 20110, "epoch": 168, "lr": 8.228078061763442e-05, "val_loss": 0.010279913432896137} +{"train_loss": 0.005421903915703297, "global_step": 20111, "epoch": 169, "lr": 8.227908868422571e-05} +{"train_loss": 0.006921782158315182, "global_step": 20112, "epoch": 169, "lr": 8.227739668744046e-05} +{"train_loss": 0.005546684376895428, "global_step": 20113, "epoch": 169, "lr": 8.2275704627282e-05} +{"train_loss": 0.006944098975509405, "global_step": 20114, "epoch": 169, "lr": 8.227401250375364e-05} +{"train_loss": 0.004463928751647472, "global_step": 20115, "epoch": 169, "lr": 8.227232031685869e-05} +{"train_loss": 0.005626225378364325, "global_step": 20116, "epoch": 169, "lr": 8.227062806660051e-05} +{"train_loss": 0.006116835400462151, "global_step": 20117, "epoch": 169, "lr": 8.226893575298238e-05} +{"train_loss": 0.0045404089614748955, "global_step": 20118, "epoch": 169, "lr": 8.226724337600764e-05} +{"train_loss": 0.004298997577279806, "global_step": 20119, "epoch": 169, "lr": 8.226555093567963e-05} +{"train_loss": 0.0035115268547087908, "global_step": 20120, "epoch": 169, "lr": 8.226385843200164e-05} +{"train_loss": 0.0056684440933167934, "global_step": 20121, "epoch": 169, "lr": 8.226216586497702e-05} +{"train_loss": 0.004362898413091898, "global_step": 20122, "epoch": 169, "lr": 8.226047323460908e-05} +{"train_loss": 0.004197301343083382, "global_step": 20123, "epoch": 169, "lr": 8.225878054090114e-05} +{"train_loss": 0.006685784086585045, "global_step": 20124, "epoch": 169, "lr": 8.225708778385655e-05} +{"train_loss": 0.003033566754311323, "global_step": 20125, "epoch": 169, "lr": 8.225539496347862e-05} +{"train_loss": 0.006173447240144014, "global_step": 20126, "epoch": 169, "lr": 8.225370207977065e-05} +{"train_loss": 0.0033641632180660963, "global_step": 20127, "epoch": 169, "lr": 8.225200913273599e-05} +{"train_loss": 0.0051112244836986065, "global_step": 20128, "epoch": 169, "lr": 8.225031612237794e-05} +{"train_loss": 0.008779049851000309, "global_step": 20129, "epoch": 169, "lr": 8.224862304869986e-05} +{"train_loss": 0.002956492593511939, "global_step": 20130, "epoch": 169, "lr": 8.224692991170504e-05} +{"train_loss": 0.004253774415701628, "global_step": 20131, "epoch": 169, "lr": 8.224523671139683e-05} +{"train_loss": 0.003929796162992716, "global_step": 20132, "epoch": 169, "lr": 8.224354344777854e-05} +{"train_loss": 0.00577523885294795, "global_step": 20133, "epoch": 169, "lr": 8.224185012085349e-05} +{"train_loss": 0.002896078396588564, "global_step": 20134, "epoch": 169, "lr": 8.224015673062502e-05} +{"train_loss": 0.003394628409296274, "global_step": 20135, "epoch": 169, "lr": 8.223846327709643e-05} +{"train_loss": 0.004787365440279245, "global_step": 20136, "epoch": 169, "lr": 8.223676976027108e-05} +{"train_loss": 0.005400327034294605, "global_step": 20137, "epoch": 169, "lr": 8.223507618015228e-05} +{"train_loss": 0.006587420590221882, "global_step": 20138, "epoch": 169, "lr": 8.223338253674333e-05} +{"train_loss": 0.003288388019427657, "global_step": 20139, "epoch": 169, "lr": 8.223168883004759e-05} +{"train_loss": 0.005369636695832014, "global_step": 20140, "epoch": 169, "lr": 8.222999506006837e-05} +{"train_loss": 0.0036955494433641434, "global_step": 20141, "epoch": 169, "lr": 8.2228301226809e-05} +{"train_loss": 0.003210989059880376, "global_step": 20142, "epoch": 169, "lr": 8.22266073302728e-05} +{"train_loss": 0.003926103003323078, "global_step": 20143, "epoch": 169, "lr": 8.22249133704631e-05} +{"train_loss": 0.005653498228639364, "global_step": 20144, "epoch": 169, "lr": 8.222321934738324e-05} +{"train_loss": 0.0046010008081793785, "global_step": 20145, "epoch": 169, "lr": 8.222152526103651e-05} +{"train_loss": 0.004527484066784382, "global_step": 20146, "epoch": 169, "lr": 8.221983111142627e-05} +{"train_loss": 0.003466683905571699, "global_step": 20147, "epoch": 169, "lr": 8.221813689855584e-05} +{"train_loss": 0.00482947938144207, "global_step": 20148, "epoch": 169, "lr": 8.221644262242851e-05} +{"train_loss": 0.0057394434697926044, "global_step": 20149, "epoch": 169, "lr": 8.221474828304768e-05} +{"train_loss": 0.004924566950649023, "global_step": 20150, "epoch": 169, "lr": 8.22130538804166e-05} +{"train_loss": 0.002965409541502595, "global_step": 20151, "epoch": 169, "lr": 8.221135941453863e-05} +{"train_loss": 0.007684459909796715, "global_step": 20152, "epoch": 169, "lr": 8.220966488541712e-05} +{"train_loss": 0.0050340378656983376, "global_step": 20153, "epoch": 169, "lr": 8.220797029305536e-05} +{"train_loss": 0.005159767810255289, "global_step": 20154, "epoch": 169, "lr": 8.220627563745669e-05} +{"train_loss": 0.005123964510858059, "global_step": 20155, "epoch": 169, "lr": 8.220458091862444e-05} +{"train_loss": 0.005236856173723936, "global_step": 20156, "epoch": 169, "lr": 8.220288613656194e-05} +{"train_loss": 0.005343607161194086, "global_step": 20157, "epoch": 169, "lr": 8.220119129127252e-05} +{"train_loss": 0.005697300191968679, "global_step": 20158, "epoch": 169, "lr": 8.219949638275947e-05} +{"train_loss": 0.005234403535723686, "global_step": 20159, "epoch": 169, "lr": 8.219780141102618e-05} +{"train_loss": 0.0047968914732337, "global_step": 20160, "epoch": 169, "lr": 8.219610637607594e-05} +{"train_loss": 0.007262818980962038, "global_step": 20161, "epoch": 169, "lr": 8.219441127791207e-05} +{"train_loss": 0.006142290774732828, "global_step": 20162, "epoch": 169, "lr": 8.219271611653794e-05} +{"train_loss": 0.003813055343925953, "global_step": 20163, "epoch": 169, "lr": 8.219102089195682e-05} +{"train_loss": 0.005009210668504238, "global_step": 20164, "epoch": 169, "lr": 8.21893256041721e-05} +{"train_loss": 0.003821631893515587, "global_step": 20165, "epoch": 169, "lr": 8.218763025318707e-05} +{"train_loss": 0.004388998728245497, "global_step": 20166, "epoch": 169, "lr": 8.218593483900506e-05} +{"train_loss": 0.004781404044479132, "global_step": 20167, "epoch": 169, "lr": 8.21842393616294e-05} +{"train_loss": 0.005744283087551594, "global_step": 20168, "epoch": 169, "lr": 8.218254382106342e-05} +{"train_loss": 0.004028993658721447, "global_step": 20169, "epoch": 169, "lr": 8.218084821731047e-05} +{"train_loss": 0.0029121970292180777, "global_step": 20170, "epoch": 169, "lr": 8.217915255037388e-05} +{"train_loss": 0.005235309712588787, "global_step": 20171, "epoch": 169, "lr": 8.217745682025692e-05} +{"train_loss": 0.007065617945045233, "global_step": 20172, "epoch": 169, "lr": 8.217576102696298e-05} +{"train_loss": 0.007602514233440161, "global_step": 20173, "epoch": 169, "lr": 8.217406517049537e-05} +{"train_loss": 0.006429439410567284, "global_step": 20174, "epoch": 169, "lr": 8.217236925085743e-05} +{"train_loss": 0.003911120817065239, "global_step": 20175, "epoch": 169, "lr": 8.217067326805247e-05} +{"train_loss": 0.008543619886040688, "global_step": 20176, "epoch": 169, "lr": 8.216897722208383e-05} +{"train_loss": 0.0050454824231565, "global_step": 20177, "epoch": 169, "lr": 8.216728111295484e-05} +{"train_loss": 0.006268273573368788, "global_step": 20178, "epoch": 169, "lr": 8.216558494066884e-05} +{"train_loss": 0.0041525159031152725, "global_step": 20179, "epoch": 169, "lr": 8.216388870522914e-05} +{"train_loss": 0.002981337020173669, "global_step": 20180, "epoch": 169, "lr": 8.216219240663907e-05} +{"train_loss": 0.007436984684318304, "global_step": 20181, "epoch": 169, "lr": 8.216049604490199e-05} +{"train_loss": 0.0047168005257844925, "global_step": 20182, "epoch": 169, "lr": 8.21587996200212e-05} +{"train_loss": 0.0050676241517066956, "global_step": 20183, "epoch": 169, "lr": 8.215710313200004e-05} +{"train_loss": 0.004920525476336479, "global_step": 20184, "epoch": 169, "lr": 8.215540658084186e-05} +{"train_loss": 0.003610288957133889, "global_step": 20185, "epoch": 169, "lr": 8.215370996654996e-05} +{"train_loss": 0.007942127995193005, "global_step": 20186, "epoch": 169, "lr": 8.215201328912769e-05} +{"train_loss": 0.006212308537214994, "global_step": 20187, "epoch": 169, "lr": 8.215031654857838e-05} +{"train_loss": 0.004764179233461618, "global_step": 20188, "epoch": 169, "lr": 8.214861974490537e-05} +{"train_loss": 0.0036291866563260555, "global_step": 20189, "epoch": 169, "lr": 8.214692287811197e-05} +{"train_loss": 0.00583708705380559, "global_step": 20190, "epoch": 169, "lr": 8.214522594820151e-05} +{"train_loss": 0.005887923296540976, "global_step": 20191, "epoch": 169, "lr": 8.214352895517734e-05} +{"train_loss": 0.0029238846618682146, "global_step": 20192, "epoch": 169, "lr": 8.214183189904279e-05} +{"train_loss": 0.007268169429153204, "global_step": 20193, "epoch": 169, "lr": 8.214013477980118e-05} +{"train_loss": 0.0062398104928433895, "global_step": 20194, "epoch": 169, "lr": 8.213843759745584e-05} +{"train_loss": 0.005094446241855621, "global_step": 20195, "epoch": 169, "lr": 8.213674035201013e-05} +{"train_loss": 0.00410638190805912, "global_step": 20196, "epoch": 169, "lr": 8.213504304346735e-05} +{"train_loss": 0.005432811100035906, "global_step": 20197, "epoch": 169, "lr": 8.213334567183086e-05} +{"train_loss": 0.007374051958322525, "global_step": 20198, "epoch": 169, "lr": 8.213164823710397e-05} +{"train_loss": 0.004141159821301699, "global_step": 20199, "epoch": 169, "lr": 8.212995073929002e-05} +{"train_loss": 0.0060292440466582775, "global_step": 20200, "epoch": 169, "lr": 8.212825317839235e-05} +{"train_loss": 0.0044758012518286705, "global_step": 20201, "epoch": 169, "lr": 8.212655555441429e-05} +{"train_loss": 0.006426953244954348, "global_step": 20202, "epoch": 169, "lr": 8.212485786735916e-05} +{"train_loss": 0.007678242400288582, "global_step": 20203, "epoch": 169, "lr": 8.212316011723032e-05} +{"train_loss": 0.004864466842263937, "global_step": 20204, "epoch": 169, "lr": 8.212146230403106e-05} +{"train_loss": 0.0077461316250264645, "global_step": 20205, "epoch": 169, "lr": 8.211976442776476e-05} +{"train_loss": 0.005189398769289255, "global_step": 20206, "epoch": 169, "lr": 8.211806648843471e-05} +{"train_loss": 0.007149560377001762, "global_step": 20207, "epoch": 169, "lr": 8.21163684860443e-05} +{"train_loss": 0.004871951881796122, "global_step": 20208, "epoch": 169, "lr": 8.211467042059681e-05} +{"train_loss": 0.005741545464843512, "global_step": 20209, "epoch": 169, "lr": 8.211297229209562e-05} +{"train_loss": 0.006391357164829969, "global_step": 20210, "epoch": 169, "lr": 8.211127410054402e-05} +{"train_loss": 0.0037696133367717266, "global_step": 20211, "epoch": 169, "lr": 8.210957584594536e-05} +{"train_loss": 0.004543254617601633, "global_step": 20212, "epoch": 169, "lr": 8.2107877528303e-05} +{"train_loss": 0.003231859765946865, "global_step": 20213, "epoch": 169, "lr": 8.210617914762023e-05} +{"train_loss": 0.00563333835452795, "global_step": 20214, "epoch": 169, "lr": 8.210448070390042e-05} +{"train_loss": 0.004575841128826141, "global_step": 20215, "epoch": 169, "lr": 8.210278219714689e-05} +{"train_loss": 0.0036541656590998173, "global_step": 20216, "epoch": 169, "lr": 8.210108362736297e-05} +{"train_loss": 0.005992693826556206, "global_step": 20217, "epoch": 169, "lr": 8.209938499455201e-05} +{"train_loss": 0.0044771707616746426, "global_step": 20218, "epoch": 169, "lr": 8.209768629871733e-05} +{"train_loss": 0.005323897115886211, "global_step": 20219, "epoch": 169, "lr": 8.209598753986227e-05} +{"train_loss": 0.007451185490936041, "global_step": 20220, "epoch": 169, "lr": 8.209428871799019e-05} +{"train_loss": 0.008099282160401344, "global_step": 20221, "epoch": 169, "lr": 8.209258983310438e-05} +{"train_loss": 0.0036787616554647684, "global_step": 20222, "epoch": 169, "lr": 8.209089088520821e-05} +{"train_loss": 0.007303318474441767, "global_step": 20223, "epoch": 169, "lr": 8.2089191874305e-05} +{"train_loss": 0.005001425743103027, "global_step": 20224, "epoch": 169, "lr": 8.208749280039809e-05} +{"train_loss": 0.0040368083864450455, "global_step": 20225, "epoch": 169, "lr": 8.20857936634908e-05} +{"train_loss": 0.004587190225720406, "global_step": 20226, "epoch": 169, "lr": 8.208409446358651e-05} +{"train_loss": 0.01329062320291996, "global_step": 20227, "epoch": 169, "lr": 8.208239520068852e-05} +{"train_loss": 0.005631139501929283, "global_step": 20228, "epoch": 169, "lr": 8.208069587480017e-05} +{"train_loss": 0.005266013615882071, "global_step": 20229, "epoch": 169, "lr": 8.207899648592479e-05, "val_loss": 0.01129784993827343} +{"train_loss": 0.005636879708617926, "global_step": 20230, "epoch": 170, "lr": 8.207729703406574e-05} +{"train_loss": 0.004702556412667036, "global_step": 20231, "epoch": 170, "lr": 8.207559751922633e-05} +{"train_loss": 0.010807440616190434, "global_step": 20232, "epoch": 170, "lr": 8.207389794140993e-05} +{"train_loss": 0.0054655130952596664, "global_step": 20233, "epoch": 170, "lr": 8.207219830061986e-05} +{"train_loss": 0.008741904981434345, "global_step": 20234, "epoch": 170, "lr": 8.207049859685944e-05} +{"train_loss": 0.007935436442494392, "global_step": 20235, "epoch": 170, "lr": 8.206879883013204e-05} +{"train_loss": 0.00825971644371748, "global_step": 20236, "epoch": 170, "lr": 8.206709900044095e-05} +{"train_loss": 0.006313784047961235, "global_step": 20237, "epoch": 170, "lr": 8.206539910778956e-05} +{"train_loss": 0.0052752005867660046, "global_step": 20238, "epoch": 170, "lr": 8.206369915218117e-05} +{"train_loss": 0.0069534932263195515, "global_step": 20239, "epoch": 170, "lr": 8.206199913361915e-05} +{"train_loss": 0.01053300779312849, "global_step": 20240, "epoch": 170, "lr": 8.206029905210682e-05} +{"train_loss": 0.005134908482432365, "global_step": 20241, "epoch": 170, "lr": 8.205859890764751e-05} +{"train_loss": 0.00618230365216732, "global_step": 20242, "epoch": 170, "lr": 8.205689870024455e-05} +{"train_loss": 0.007251276634633541, "global_step": 20243, "epoch": 170, "lr": 8.205519842990132e-05} +{"train_loss": 0.004172027111053467, "global_step": 20244, "epoch": 170, "lr": 8.205349809662111e-05} +{"train_loss": 0.005184548441320658, "global_step": 20245, "epoch": 170, "lr": 8.205179770040732e-05} +{"train_loss": 0.004681500606238842, "global_step": 20246, "epoch": 170, "lr": 8.205009724126321e-05} +{"train_loss": 0.004862444940954447, "global_step": 20247, "epoch": 170, "lr": 8.204839671919218e-05} +{"train_loss": 0.004863588139414787, "global_step": 20248, "epoch": 170, "lr": 8.204669613419753e-05} +{"train_loss": 0.007663129363209009, "global_step": 20249, "epoch": 170, "lr": 8.204499548628262e-05} +{"train_loss": 0.005291132256388664, "global_step": 20250, "epoch": 170, "lr": 8.204329477545078e-05} +{"train_loss": 0.0064573935233056545, "global_step": 20251, "epoch": 170, "lr": 8.204159400170536e-05} +{"train_loss": 0.004893790930509567, "global_step": 20252, "epoch": 170, "lr": 8.203989316504971e-05} +{"train_loss": 0.0061705936677753925, "global_step": 20253, "epoch": 170, "lr": 8.203819226548713e-05} +{"train_loss": 0.005873568821698427, "global_step": 20254, "epoch": 170, "lr": 8.2036491303021e-05} +{"train_loss": 0.004304816480726004, "global_step": 20255, "epoch": 170, "lr": 8.203479027765463e-05} +{"train_loss": 0.005814509466290474, "global_step": 20256, "epoch": 170, "lr": 8.203308918939137e-05} +{"train_loss": 0.005028370302170515, "global_step": 20257, "epoch": 170, "lr": 8.203138803823458e-05} +{"train_loss": 0.004650224931538105, "global_step": 20258, "epoch": 170, "lr": 8.202968682418755e-05} +{"train_loss": 0.005898258648812771, "global_step": 20259, "epoch": 170, "lr": 8.202798554725369e-05} +{"train_loss": 0.005599651951342821, "global_step": 20260, "epoch": 170, "lr": 8.202628420743626e-05} +{"train_loss": 0.005195596721023321, "global_step": 20261, "epoch": 170, "lr": 8.202458280473867e-05} +{"train_loss": 0.005119656212627888, "global_step": 20262, "epoch": 170, "lr": 8.202288133916423e-05} +{"train_loss": 0.005868976935744286, "global_step": 20263, "epoch": 170, "lr": 8.202117981071628e-05} +{"train_loss": 0.00539750512689352, "global_step": 20264, "epoch": 170, "lr": 8.201947821939817e-05} +{"train_loss": 0.00563215184956789, "global_step": 20265, "epoch": 170, "lr": 8.201777656521323e-05} +{"train_loss": 0.004854766186326742, "global_step": 20266, "epoch": 170, "lr": 8.20160748481648e-05} +{"train_loss": 0.004662284627556801, "global_step": 20267, "epoch": 170, "lr": 8.201437306825624e-05} +{"train_loss": 0.00488290935754776, "global_step": 20268, "epoch": 170, "lr": 8.201267122549087e-05} +{"train_loss": 0.006844995077699423, "global_step": 20269, "epoch": 170, "lr": 8.201096931987204e-05} +{"train_loss": 0.006548787001520395, "global_step": 20270, "epoch": 170, "lr": 8.200926735140311e-05} +{"train_loss": 0.0052065616473555565, "global_step": 20271, "epoch": 170, "lr": 8.200756532008738e-05} +{"train_loss": 0.003708970034494996, "global_step": 20272, "epoch": 170, "lr": 8.200586322592822e-05} +{"train_loss": 0.005980056710541248, "global_step": 20273, "epoch": 170, "lr": 8.200416106892897e-05} +{"train_loss": 0.005323496647179127, "global_step": 20274, "epoch": 170, "lr": 8.200245884909296e-05} +{"train_loss": 0.0028724470175802708, "global_step": 20275, "epoch": 170, "lr": 8.200075656642355e-05} +{"train_loss": 0.00566088454797864, "global_step": 20276, "epoch": 170, "lr": 8.199905422092408e-05} +{"train_loss": 0.006498418282717466, "global_step": 20277, "epoch": 170, "lr": 8.199735181259787e-05} +{"train_loss": 0.007895275950431824, "global_step": 20278, "epoch": 170, "lr": 8.19956493414483e-05} +{"train_loss": 0.004333395045250654, "global_step": 20279, "epoch": 170, "lr": 8.199394680747868e-05} +{"train_loss": 0.003986019175499678, "global_step": 20280, "epoch": 170, "lr": 8.199224421069234e-05} +{"train_loss": 0.004845752846449614, "global_step": 20281, "epoch": 170, "lr": 8.199054155109267e-05} +{"train_loss": 0.004853792488574982, "global_step": 20282, "epoch": 170, "lr": 8.198883882868299e-05} +{"train_loss": 0.004273380618542433, "global_step": 20283, "epoch": 170, "lr": 8.198713604346664e-05} +{"train_loss": 0.0072916545905172825, "global_step": 20284, "epoch": 170, "lr": 8.198543319544696e-05} +{"train_loss": 0.0062040900811553, "global_step": 20285, "epoch": 170, "lr": 8.198373028462732e-05} +{"train_loss": 0.005105172283947468, "global_step": 20286, "epoch": 170, "lr": 8.198202731101101e-05} +{"train_loss": 0.004945899825543165, "global_step": 20287, "epoch": 170, "lr": 8.198032427460143e-05} +{"train_loss": 0.006075250916182995, "global_step": 20288, "epoch": 170, "lr": 8.19786211754019e-05} +{"train_loss": 0.0053581963293254375, "global_step": 20289, "epoch": 170, "lr": 8.197691801341575e-05} +{"train_loss": 0.00613464554771781, "global_step": 20290, "epoch": 170, "lr": 8.197521478864634e-05} +{"train_loss": 0.005406475625932217, "global_step": 20291, "epoch": 170, "lr": 8.197351150109701e-05} +{"train_loss": 0.005025026388466358, "global_step": 20292, "epoch": 170, "lr": 8.197180815077111e-05} +{"train_loss": 0.004865623079240322, "global_step": 20293, "epoch": 170, "lr": 8.197010473767199e-05} +{"train_loss": 0.005900225136429071, "global_step": 20294, "epoch": 170, "lr": 8.196840126180297e-05} +{"train_loss": 0.0035838375333696604, "global_step": 20295, "epoch": 170, "lr": 8.196669772316743e-05} +{"train_loss": 0.00664493115618825, "global_step": 20296, "epoch": 170, "lr": 8.196499412176867e-05} +{"train_loss": 0.00471618864685297, "global_step": 20297, "epoch": 170, "lr": 8.196329045761007e-05} +{"train_loss": 0.004431745503097773, "global_step": 20298, "epoch": 170, "lr": 8.196158673069496e-05} +{"train_loss": 0.005852590315043926, "global_step": 20299, "epoch": 170, "lr": 8.19598829410267e-05} +{"train_loss": 0.004489015322178602, "global_step": 20300, "epoch": 170, "lr": 8.195817908860861e-05} +{"train_loss": 0.004260360728949308, "global_step": 20301, "epoch": 170, "lr": 8.195647517344406e-05} +{"train_loss": 0.0034401086159050465, "global_step": 20302, "epoch": 170, "lr": 8.195477119553638e-05} +{"train_loss": 0.003317308146506548, "global_step": 20303, "epoch": 170, "lr": 8.195306715488893e-05} +{"train_loss": 0.005327749531716108, "global_step": 20304, "epoch": 170, "lr": 8.195136305150504e-05} +{"train_loss": 0.00545973377302289, "global_step": 20305, "epoch": 170, "lr": 8.194965888538806e-05} +{"train_loss": 0.004432510584592819, "global_step": 20306, "epoch": 170, "lr": 8.194795465654133e-05} +{"train_loss": 0.004886481445282698, "global_step": 20307, "epoch": 170, "lr": 8.194625036496821e-05} +{"train_loss": 0.006791525520384312, "global_step": 20308, "epoch": 170, "lr": 8.194454601067205e-05} +{"train_loss": 0.006088766269385815, "global_step": 20309, "epoch": 170, "lr": 8.194284159365617e-05} +{"train_loss": 0.004145523998886347, "global_step": 20310, "epoch": 170, "lr": 8.194113711392395e-05} +{"train_loss": 0.004349344875663519, "global_step": 20311, "epoch": 170, "lr": 8.193943257147871e-05} +{"train_loss": 0.003915214911103249, "global_step": 20312, "epoch": 170, "lr": 8.19377279663238e-05} +{"train_loss": 0.005183911882340908, "global_step": 20313, "epoch": 170, "lr": 8.193602329846259e-05} +{"train_loss": 0.005751431453973055, "global_step": 20314, "epoch": 170, "lr": 8.193431856789841e-05} +{"train_loss": 0.004089971072971821, "global_step": 20315, "epoch": 170, "lr": 8.193261377463459e-05} +{"train_loss": 0.004635028541088104, "global_step": 20316, "epoch": 170, "lr": 8.193090891867449e-05} +{"train_loss": 0.007766039576381445, "global_step": 20317, "epoch": 170, "lr": 8.192920400002149e-05} +{"train_loss": 0.005877366289496422, "global_step": 20318, "epoch": 170, "lr": 8.19274990186789e-05} +{"train_loss": 0.004593593068420887, "global_step": 20319, "epoch": 170, "lr": 8.192579397465005e-05} +{"train_loss": 0.005013147834688425, "global_step": 20320, "epoch": 170, "lr": 8.192408886793836e-05} +{"train_loss": 0.0035164132714271545, "global_step": 20321, "epoch": 170, "lr": 8.19223836985471e-05} +{"train_loss": 0.0036894616205245256, "global_step": 20322, "epoch": 170, "lr": 8.192067846647965e-05} +{"train_loss": 0.004571821540594101, "global_step": 20323, "epoch": 170, "lr": 8.191897317173937e-05} +{"train_loss": 0.003587016137316823, "global_step": 20324, "epoch": 170, "lr": 8.19172678143296e-05} +{"train_loss": 0.005907578859478235, "global_step": 20325, "epoch": 170, "lr": 8.191556239425366e-05} +{"train_loss": 0.002463149605318904, "global_step": 20326, "epoch": 170, "lr": 8.191385691151494e-05} +{"train_loss": 0.005212727468460798, "global_step": 20327, "epoch": 170, "lr": 8.191215136611678e-05} +{"train_loss": 0.007167702540755272, "global_step": 20328, "epoch": 170, "lr": 8.191044575806251e-05} +{"train_loss": 0.00479865912348032, "global_step": 20329, "epoch": 170, "lr": 8.19087400873555e-05} +{"train_loss": 0.005198820494115353, "global_step": 20330, "epoch": 170, "lr": 8.190703435399907e-05} +{"train_loss": 0.004845119081437588, "global_step": 20331, "epoch": 170, "lr": 8.19053285579966e-05} +{"train_loss": 0.005287597421556711, "global_step": 20332, "epoch": 170, "lr": 8.190362269935141e-05} +{"train_loss": 0.003354943124577403, "global_step": 20333, "epoch": 170, "lr": 8.190191677806687e-05} +{"train_loss": 0.002956484677270055, "global_step": 20334, "epoch": 170, "lr": 8.190021079414634e-05} +{"train_loss": 0.007017172873020172, "global_step": 20335, "epoch": 170, "lr": 8.189850474759314e-05} +{"train_loss": 0.003243420971557498, "global_step": 20336, "epoch": 170, "lr": 8.189679863841064e-05} +{"train_loss": 0.0060730897821486, "global_step": 20337, "epoch": 170, "lr": 8.189509246660218e-05} +{"train_loss": 0.005112293642014265, "global_step": 20338, "epoch": 170, "lr": 8.18933862321711e-05} +{"train_loss": 0.0041796364821493626, "global_step": 20339, "epoch": 170, "lr": 8.189167993512079e-05} +{"train_loss": 0.0030007788445800543, "global_step": 20340, "epoch": 170, "lr": 8.188997357545456e-05} +{"train_loss": 0.004107964690774679, "global_step": 20341, "epoch": 170, "lr": 8.188826715317577e-05} +{"train_loss": 0.005960836075246334, "global_step": 20342, "epoch": 170, "lr": 8.188656066828779e-05} +{"train_loss": 0.003921052441000938, "global_step": 20343, "epoch": 170, "lr": 8.188485412079394e-05} +{"train_loss": 0.003772352123633027, "global_step": 20344, "epoch": 170, "lr": 8.188314751069759e-05} +{"train_loss": 0.0036757488269358873, "global_step": 20345, "epoch": 170, "lr": 8.188144083800209e-05} +{"train_loss": 0.0056767938658595085, "global_step": 20346, "epoch": 170, "lr": 8.18797341027108e-05} +{"train_loss": 0.0066645327024161816, "global_step": 20347, "epoch": 170, "lr": 8.187802730482704e-05} +{"train_loss": 0.005317992912292355, "global_step": 20348, "epoch": 170, "lr": 8.187632044435416e-05, "val_loss": 0.013012639246881008, "train_action_mse_error": 0.00010792090324684978} +{"train_loss": 0.0034574309829622507, "global_step": 20349, "epoch": 171, "lr": 8.187461352129556e-05} +{"train_loss": 0.0056949760764837265, "global_step": 20350, "epoch": 171, "lr": 8.187290653565453e-05} +{"train_loss": 0.006155571900308132, "global_step": 20351, "epoch": 171, "lr": 8.18711994874345e-05} +{"train_loss": 0.003562555881217122, "global_step": 20352, "epoch": 171, "lr": 8.186949237663874e-05} +{"train_loss": 0.0032341713085770607, "global_step": 20353, "epoch": 171, "lr": 8.186778520327066e-05} +{"train_loss": 0.004799412097781897, "global_step": 20354, "epoch": 171, "lr": 8.186607796733356e-05} +{"train_loss": 0.005182879976928234, "global_step": 20355, "epoch": 171, "lr": 8.186437066883084e-05} +{"train_loss": 0.0056679341942071915, "global_step": 20356, "epoch": 171, "lr": 8.186266330776582e-05} +{"train_loss": 0.006394061725586653, "global_step": 20357, "epoch": 171, "lr": 8.186095588414187e-05} +{"train_loss": 0.004002145491540432, "global_step": 20358, "epoch": 171, "lr": 8.185924839796235e-05} +{"train_loss": 0.0036897086538374424, "global_step": 20359, "epoch": 171, "lr": 8.185754084923058e-05} +{"train_loss": 0.00501686567440629, "global_step": 20360, "epoch": 171, "lr": 8.185583323794995e-05} +{"train_loss": 0.006751390174031258, "global_step": 20361, "epoch": 171, "lr": 8.185412556412377e-05} +{"train_loss": 0.004803735297173262, "global_step": 20362, "epoch": 171, "lr": 8.185241782775543e-05} +{"train_loss": 0.003211840521544218, "global_step": 20363, "epoch": 171, "lr": 8.185071002884828e-05} +{"train_loss": 0.006077890750020742, "global_step": 20364, "epoch": 171, "lr": 8.184900216740565e-05} +{"train_loss": 0.006692762020975351, "global_step": 20365, "epoch": 171, "lr": 8.184729424343092e-05} +{"train_loss": 0.006141116376966238, "global_step": 20366, "epoch": 171, "lr": 8.184558625692742e-05} +{"train_loss": 0.005739870015531778, "global_step": 20367, "epoch": 171, "lr": 8.184387820789852e-05} +{"train_loss": 0.0038938678335398436, "global_step": 20368, "epoch": 171, "lr": 8.184217009634756e-05} +{"train_loss": 0.004566403571516275, "global_step": 20369, "epoch": 171, "lr": 8.184046192227791e-05} +{"train_loss": 0.004365427885204554, "global_step": 20370, "epoch": 171, "lr": 8.183875368569291e-05} +{"train_loss": 0.004183492623269558, "global_step": 20371, "epoch": 171, "lr": 8.183704538659593e-05} +{"train_loss": 0.006368027534335852, "global_step": 20372, "epoch": 171, "lr": 8.183533702499029e-05} +{"train_loss": 0.005327232647687197, "global_step": 20373, "epoch": 171, "lr": 8.183362860087937e-05} +{"train_loss": 0.004248735494911671, "global_step": 20374, "epoch": 171, "lr": 8.183192011426655e-05} +{"train_loss": 0.006095954682677984, "global_step": 20375, "epoch": 171, "lr": 8.183021156515512e-05} +{"train_loss": 0.0037597741466015577, "global_step": 20376, "epoch": 171, "lr": 8.18285029535485e-05} +{"train_loss": 0.003982788883149624, "global_step": 20377, "epoch": 171, "lr": 8.182679427944999e-05} +{"train_loss": 0.004700613673776388, "global_step": 20378, "epoch": 171, "lr": 8.182508554286299e-05} +{"train_loss": 0.0036597060970962048, "global_step": 20379, "epoch": 171, "lr": 8.182337674379082e-05} +{"train_loss": 0.005447122734040022, "global_step": 20380, "epoch": 171, "lr": 8.182166788223684e-05} +{"train_loss": 0.005935641471296549, "global_step": 20381, "epoch": 171, "lr": 8.181995895820444e-05} +{"train_loss": 0.002691574627533555, "global_step": 20382, "epoch": 171, "lr": 8.181824997169694e-05} +{"train_loss": 0.006671675946563482, "global_step": 20383, "epoch": 171, "lr": 8.18165409227177e-05} +{"train_loss": 0.0054890853352844715, "global_step": 20384, "epoch": 171, "lr": 8.181483181127008e-05} +{"train_loss": 0.00543562974780798, "global_step": 20385, "epoch": 171, "lr": 8.181312263735745e-05} +{"train_loss": 0.004160230979323387, "global_step": 20386, "epoch": 171, "lr": 8.181141340098314e-05} +{"train_loss": 0.005190630443394184, "global_step": 20387, "epoch": 171, "lr": 8.180970410215051e-05} +{"train_loss": 0.0025694421492516994, "global_step": 20388, "epoch": 171, "lr": 8.180799474086293e-05} +{"train_loss": 0.01164930872619152, "global_step": 20389, "epoch": 171, "lr": 8.180628531712378e-05} +{"train_loss": 0.005754889454692602, "global_step": 20390, "epoch": 171, "lr": 8.180457583093636e-05} +{"train_loss": 0.005127167794853449, "global_step": 20391, "epoch": 171, "lr": 8.180286628230404e-05} +{"train_loss": 0.007495350204408169, "global_step": 20392, "epoch": 171, "lr": 8.180115667123021e-05} +{"train_loss": 0.006837916560471058, "global_step": 20393, "epoch": 171, "lr": 8.179944699771821e-05} +{"train_loss": 0.006709645036607981, "global_step": 20394, "epoch": 171, "lr": 8.179773726177138e-05} +{"train_loss": 0.004999147262424231, "global_step": 20395, "epoch": 171, "lr": 8.17960274633931e-05} +{"train_loss": 0.004985506180673838, "global_step": 20396, "epoch": 171, "lr": 8.179431760258672e-05} +{"train_loss": 0.007043665274977684, "global_step": 20397, "epoch": 171, "lr": 8.17926076793556e-05} +{"train_loss": 0.005309367552399635, "global_step": 20398, "epoch": 171, "lr": 8.179089769370308e-05} +{"train_loss": 0.004913774318993092, "global_step": 20399, "epoch": 171, "lr": 8.17891876456325e-05} +{"train_loss": 0.006512588355690241, "global_step": 20400, "epoch": 171, "lr": 8.178747753514728e-05} +{"train_loss": 0.0033481204882264137, "global_step": 20401, "epoch": 171, "lr": 8.178576736225075e-05} +{"train_loss": 0.004800786729902029, "global_step": 20402, "epoch": 171, "lr": 8.178405712694624e-05} +{"train_loss": 0.005766662769019604, "global_step": 20403, "epoch": 171, "lr": 8.178234682923715e-05} +{"train_loss": 0.005350081250071526, "global_step": 20404, "epoch": 171, "lr": 8.17806364691268e-05} +{"train_loss": 0.007817033678293228, "global_step": 20405, "epoch": 171, "lr": 8.177892604661857e-05} +{"train_loss": 0.005612875800579786, "global_step": 20406, "epoch": 171, "lr": 8.177721556171582e-05} +{"train_loss": 0.005096827633678913, "global_step": 20407, "epoch": 171, "lr": 8.177550501442188e-05} +{"train_loss": 0.003986764699220657, "global_step": 20408, "epoch": 171, "lr": 8.177379440474016e-05} +{"train_loss": 0.005437080282717943, "global_step": 20409, "epoch": 171, "lr": 8.177208373267398e-05} +{"train_loss": 0.0041095479391515255, "global_step": 20410, "epoch": 171, "lr": 8.177037299822669e-05} +{"train_loss": 0.0052881790325045586, "global_step": 20411, "epoch": 171, "lr": 8.176866220140168e-05} +{"train_loss": 0.004557854495942593, "global_step": 20412, "epoch": 171, "lr": 8.176695134220231e-05} +{"train_loss": 0.009346002712845802, "global_step": 20413, "epoch": 171, "lr": 8.176524042063192e-05} +{"train_loss": 0.004720051772892475, "global_step": 20414, "epoch": 171, "lr": 8.176352943669385e-05} +{"train_loss": 0.006811711937189102, "global_step": 20415, "epoch": 171, "lr": 8.176181839039151e-05} +{"train_loss": 0.004095971118658781, "global_step": 20416, "epoch": 171, "lr": 8.176010728172822e-05} +{"train_loss": 0.008334959857165813, "global_step": 20417, "epoch": 171, "lr": 8.175839611070734e-05} +{"train_loss": 0.007111445069313049, "global_step": 20418, "epoch": 171, "lr": 8.175668487733228e-05} +{"train_loss": 0.0044798171147704124, "global_step": 20419, "epoch": 171, "lr": 8.175497358160633e-05} +{"train_loss": 0.005047874990850687, "global_step": 20420, "epoch": 171, "lr": 8.175326222353289e-05} +{"train_loss": 0.008246461860835552, "global_step": 20421, "epoch": 171, "lr": 8.175155080311531e-05} +{"train_loss": 0.004677706863731146, "global_step": 20422, "epoch": 171, "lr": 8.174983932035696e-05} +{"train_loss": 0.006081338506191969, "global_step": 20423, "epoch": 171, "lr": 8.17481277752612e-05} +{"train_loss": 0.004582669120281935, "global_step": 20424, "epoch": 171, "lr": 8.174641616783137e-05} +{"train_loss": 0.006688934750854969, "global_step": 20425, "epoch": 171, "lr": 8.174470449807084e-05} +{"train_loss": 0.003948525991290808, "global_step": 20426, "epoch": 171, "lr": 8.174299276598296e-05} +{"train_loss": 0.006095693912357092, "global_step": 20427, "epoch": 171, "lr": 8.174128097157114e-05} +{"train_loss": 0.003777763806283474, "global_step": 20428, "epoch": 171, "lr": 8.173956911483868e-05} +{"train_loss": 0.00651967991143465, "global_step": 20429, "epoch": 171, "lr": 8.173785719578898e-05} +{"train_loss": 0.004295479506254196, "global_step": 20430, "epoch": 171, "lr": 8.173614521442538e-05} +{"train_loss": 0.003888400737196207, "global_step": 20431, "epoch": 171, "lr": 8.173443317075126e-05} +{"train_loss": 0.0049774982035160065, "global_step": 20432, "epoch": 171, "lr": 8.173272106476997e-05} +{"train_loss": 0.003493363270536065, "global_step": 20433, "epoch": 171, "lr": 8.173100889648486e-05} +{"train_loss": 0.0055838944390416145, "global_step": 20434, "epoch": 171, "lr": 8.172929666589931e-05} +{"train_loss": 0.006554397288709879, "global_step": 20435, "epoch": 171, "lr": 8.172758437301668e-05} +{"train_loss": 0.004403833299875259, "global_step": 20436, "epoch": 171, "lr": 8.172587201784032e-05} +{"train_loss": 0.004167819395661354, "global_step": 20437, "epoch": 171, "lr": 8.172415960037361e-05} +{"train_loss": 0.0049774786457419395, "global_step": 20438, "epoch": 171, "lr": 8.17224471206199e-05} +{"train_loss": 0.004194335080683231, "global_step": 20439, "epoch": 171, "lr": 8.172073457858254e-05} +{"train_loss": 0.004331259056925774, "global_step": 20440, "epoch": 171, "lr": 8.17190219742649e-05} +{"train_loss": 0.006994422525167465, "global_step": 20441, "epoch": 171, "lr": 8.171730930767038e-05} +{"train_loss": 0.007727013435214758, "global_step": 20442, "epoch": 171, "lr": 8.17155965788023e-05} +{"train_loss": 0.004569122567772865, "global_step": 20443, "epoch": 171, "lr": 8.171388378766402e-05} +{"train_loss": 0.005787821486592293, "global_step": 20444, "epoch": 171, "lr": 8.171217093425894e-05} +{"train_loss": 0.004461128730326891, "global_step": 20445, "epoch": 171, "lr": 8.171045801859038e-05} +{"train_loss": 0.0051250159740448, "global_step": 20446, "epoch": 171, "lr": 8.170874504066174e-05} +{"train_loss": 0.006410073954612017, "global_step": 20447, "epoch": 171, "lr": 8.170703200047636e-05} +{"train_loss": 0.006988277193158865, "global_step": 20448, "epoch": 171, "lr": 8.17053188980376e-05} +{"train_loss": 0.005058031063526869, "global_step": 20449, "epoch": 171, "lr": 8.170360573334886e-05} +{"train_loss": 0.006250304635614157, "global_step": 20450, "epoch": 171, "lr": 8.170189250641344e-05} +{"train_loss": 0.007613263092935085, "global_step": 20451, "epoch": 171, "lr": 8.170017921723477e-05} +{"train_loss": 0.0029979259707033634, "global_step": 20452, "epoch": 171, "lr": 8.169846586581618e-05} +{"train_loss": 0.0065337177366018295, "global_step": 20453, "epoch": 171, "lr": 8.169675245216104e-05} +{"train_loss": 0.004891142249107361, "global_step": 20454, "epoch": 171, "lr": 8.16950389762727e-05} +{"train_loss": 0.005896097049117088, "global_step": 20455, "epoch": 171, "lr": 8.169332543815454e-05} +{"train_loss": 0.0051258644089102745, "global_step": 20456, "epoch": 171, "lr": 8.169161183780994e-05} +{"train_loss": 0.006410663947463036, "global_step": 20457, "epoch": 171, "lr": 8.168989817524221e-05} +{"train_loss": 0.0033860886469483376, "global_step": 20458, "epoch": 171, "lr": 8.168818445045478e-05} +{"train_loss": 0.005588015541434288, "global_step": 20459, "epoch": 171, "lr": 8.168647066345099e-05} +{"train_loss": 0.005679764784872532, "global_step": 20460, "epoch": 171, "lr": 8.168475681423418e-05} +{"train_loss": 0.005040514748543501, "global_step": 20461, "epoch": 171, "lr": 8.168304290280774e-05} +{"train_loss": 0.004034054931253195, "global_step": 20462, "epoch": 171, "lr": 8.168132892917503e-05} +{"train_loss": 0.00437968922778964, "global_step": 20463, "epoch": 171, "lr": 8.167961489333941e-05} +{"train_loss": 0.003891967935487628, "global_step": 20464, "epoch": 171, "lr": 8.167790079530426e-05} +{"train_loss": 0.008606741204857826, "global_step": 20465, "epoch": 171, "lr": 8.167618663507295e-05} +{"train_loss": 0.003604358993470669, "global_step": 20466, "epoch": 171, "lr": 8.16744724126488e-05} +{"train_loss": 0.00531550869541321, "global_step": 20467, "epoch": 171, "lr": 8.167275812803523e-05, "val_loss": 0.026376590132713318} +{"train_loss": 0.005231885705143213, "global_step": 20468, "epoch": 172, "lr": 8.167104378123558e-05} +{"train_loss": 0.003407601499930024, "global_step": 20469, "epoch": 172, "lr": 8.16693293722532e-05} +{"train_loss": 0.004354392644017935, "global_step": 20470, "epoch": 172, "lr": 8.16676149010915e-05} +{"train_loss": 0.0025133220478892326, "global_step": 20471, "epoch": 172, "lr": 8.166590036775382e-05} +{"train_loss": 0.005165735259652138, "global_step": 20472, "epoch": 172, "lr": 8.16641857722435e-05} +{"train_loss": 0.0031542745418846607, "global_step": 20473, "epoch": 172, "lr": 8.166247111456396e-05} +{"train_loss": 0.0053833420388400555, "global_step": 20474, "epoch": 172, "lr": 8.166075639471853e-05} +{"train_loss": 0.006325843743979931, "global_step": 20475, "epoch": 172, "lr": 8.16590416127106e-05} +{"train_loss": 0.004069124814122915, "global_step": 20476, "epoch": 172, "lr": 8.165732676854352e-05} +{"train_loss": 0.003101819194853306, "global_step": 20477, "epoch": 172, "lr": 8.165561186222066e-05} +{"train_loss": 0.004300667438656092, "global_step": 20478, "epoch": 172, "lr": 8.165389689374539e-05} +{"train_loss": 0.006475850008428097, "global_step": 20479, "epoch": 172, "lr": 8.165218186312106e-05} +{"train_loss": 0.0039547099731862545, "global_step": 20480, "epoch": 172, "lr": 8.165046677035107e-05} +{"train_loss": 0.004531340207904577, "global_step": 20481, "epoch": 172, "lr": 8.164875161543875e-05} +{"train_loss": 0.003004561411216855, "global_step": 20482, "epoch": 172, "lr": 8.16470363983875e-05} +{"train_loss": 0.003054949687793851, "global_step": 20483, "epoch": 172, "lr": 8.16453211192007e-05} +{"train_loss": 0.004821682348847389, "global_step": 20484, "epoch": 172, "lr": 8.164360577788165e-05} +{"train_loss": 0.0039017300587147474, "global_step": 20485, "epoch": 172, "lr": 8.164189037443377e-05} +{"train_loss": 0.006563572213053703, "global_step": 20486, "epoch": 172, "lr": 8.164017490886044e-05} +{"train_loss": 0.00413279514759779, "global_step": 20487, "epoch": 172, "lr": 8.163845938116499e-05} +{"train_loss": 0.005380941554903984, "global_step": 20488, "epoch": 172, "lr": 8.16367437913508e-05} +{"train_loss": 0.003727869363501668, "global_step": 20489, "epoch": 172, "lr": 8.163502813942125e-05} +{"train_loss": 0.005254747811704874, "global_step": 20490, "epoch": 172, "lr": 8.163331242537971e-05} +{"train_loss": 0.007669446058571339, "global_step": 20491, "epoch": 172, "lr": 8.163159664922954e-05} +{"train_loss": 0.0054986136965453625, "global_step": 20492, "epoch": 172, "lr": 8.16298808109741e-05} +{"train_loss": 0.00543705141171813, "global_step": 20493, "epoch": 172, "lr": 8.162816491061678e-05} +{"train_loss": 0.004446340724825859, "global_step": 20494, "epoch": 172, "lr": 8.162644894816092e-05} +{"train_loss": 0.0048719788901507854, "global_step": 20495, "epoch": 172, "lr": 8.162473292360991e-05} +{"train_loss": 0.0029545912984758615, "global_step": 20496, "epoch": 172, "lr": 8.162301683696714e-05} +{"train_loss": 0.006879474967718124, "global_step": 20497, "epoch": 172, "lr": 8.162130068823593e-05} +{"train_loss": 0.0034591490402817726, "global_step": 20498, "epoch": 172, "lr": 8.161958447741967e-05} +{"train_loss": 0.0033988438080996275, "global_step": 20499, "epoch": 172, "lr": 8.161786820452176e-05} +{"train_loss": 0.00376895722001791, "global_step": 20500, "epoch": 172, "lr": 8.161615186954552e-05} +{"train_loss": 0.006432355847209692, "global_step": 20501, "epoch": 172, "lr": 8.161443547249435e-05} +{"train_loss": 0.0035126153379678726, "global_step": 20502, "epoch": 172, "lr": 8.161271901337162e-05} +{"train_loss": 0.005495897959917784, "global_step": 20503, "epoch": 172, "lr": 8.161100249218067e-05} +{"train_loss": 0.002636139513924718, "global_step": 20504, "epoch": 172, "lr": 8.160928590892492e-05} +{"train_loss": 0.004148020874708891, "global_step": 20505, "epoch": 172, "lr": 8.160756926360771e-05} +{"train_loss": 0.004659587983042002, "global_step": 20506, "epoch": 172, "lr": 8.160585255623241e-05} +{"train_loss": 0.003786026732996106, "global_step": 20507, "epoch": 172, "lr": 8.160413578680239e-05} +{"train_loss": 0.004132911562919617, "global_step": 20508, "epoch": 172, "lr": 8.160241895532103e-05} +{"train_loss": 0.00558755686506629, "global_step": 20509, "epoch": 172, "lr": 8.160070206179171e-05} +{"train_loss": 0.0027251827996224165, "global_step": 20510, "epoch": 172, "lr": 8.159898510621778e-05} +{"train_loss": 0.004546932876110077, "global_step": 20511, "epoch": 172, "lr": 8.159726808860261e-05} +{"train_loss": 0.004284131806343794, "global_step": 20512, "epoch": 172, "lr": 8.159555100894958e-05} +{"train_loss": 0.008319991640746593, "global_step": 20513, "epoch": 172, "lr": 8.159383386726207e-05} +{"train_loss": 0.0035125247668474913, "global_step": 20514, "epoch": 172, "lr": 8.159211666354342e-05} +{"train_loss": 0.0032280427403748035, "global_step": 20515, "epoch": 172, "lr": 8.159039939779706e-05} +{"train_loss": 0.0051366970874369144, "global_step": 20516, "epoch": 172, "lr": 8.15886820700263e-05} +{"train_loss": 0.004388057626783848, "global_step": 20517, "epoch": 172, "lr": 8.158696468023454e-05} +{"train_loss": 0.005170003976672888, "global_step": 20518, "epoch": 172, "lr": 8.158524722842515e-05} +{"train_loss": 0.006771002896130085, "global_step": 20519, "epoch": 172, "lr": 8.158352971460151e-05} +{"train_loss": 0.007309634238481522, "global_step": 20520, "epoch": 172, "lr": 8.1581812138767e-05} +{"train_loss": 0.0058562858030200005, "global_step": 20521, "epoch": 172, "lr": 8.158009450092494e-05} +{"train_loss": 0.0034971912391483784, "global_step": 20522, "epoch": 172, "lr": 8.157837680107877e-05} +{"train_loss": 0.002743621589615941, "global_step": 20523, "epoch": 172, "lr": 8.157665903923179e-05} +{"train_loss": 0.004803923424333334, "global_step": 20524, "epoch": 172, "lr": 8.157494121538745e-05} +{"train_loss": 0.007437400985509157, "global_step": 20525, "epoch": 172, "lr": 8.157322332954907e-05} +{"train_loss": 0.004592048469930887, "global_step": 20526, "epoch": 172, "lr": 8.157150538172004e-05} +{"train_loss": 0.006243085954338312, "global_step": 20527, "epoch": 172, "lr": 8.156978737190375e-05} +{"train_loss": 0.004587871488183737, "global_step": 20528, "epoch": 172, "lr": 8.156806930010353e-05} +{"train_loss": 0.005208128597587347, "global_step": 20529, "epoch": 172, "lr": 8.15663511663228e-05} +{"train_loss": 0.004116836469620466, "global_step": 20530, "epoch": 172, "lr": 8.156463297056489e-05} +{"train_loss": 0.004093652591109276, "global_step": 20531, "epoch": 172, "lr": 8.156291471283322e-05} +{"train_loss": 0.008323109708726406, "global_step": 20532, "epoch": 172, "lr": 8.156119639313111e-05} +{"train_loss": 0.0035285691265016794, "global_step": 20533, "epoch": 172, "lr": 8.155947801146199e-05} +{"train_loss": 0.00398960430175066, "global_step": 20534, "epoch": 172, "lr": 8.155775956782919e-05} +{"train_loss": 0.005241881590336561, "global_step": 20535, "epoch": 172, "lr": 8.155604106223611e-05} +{"train_loss": 0.005369273014366627, "global_step": 20536, "epoch": 172, "lr": 8.15543224946861e-05} +{"train_loss": 0.0037419642321765423, "global_step": 20537, "epoch": 172, "lr": 8.155260386518256e-05} +{"train_loss": 0.005269802641123533, "global_step": 20538, "epoch": 172, "lr": 8.155088517372885e-05} +{"train_loss": 0.0059792953543365, "global_step": 20539, "epoch": 172, "lr": 8.154916642032835e-05} +{"train_loss": 0.006512628402560949, "global_step": 20540, "epoch": 172, "lr": 8.154744760498443e-05} +{"train_loss": 0.004796426277607679, "global_step": 20541, "epoch": 172, "lr": 8.154572872770048e-05} +{"train_loss": 0.004920691251754761, "global_step": 20542, "epoch": 172, "lr": 8.154400978847985e-05} +{"train_loss": 0.005332707427442074, "global_step": 20543, "epoch": 172, "lr": 8.154229078732591e-05} +{"train_loss": 0.012037846259772778, "global_step": 20544, "epoch": 172, "lr": 8.154057172424208e-05} +{"train_loss": 0.004648992326110601, "global_step": 20545, "epoch": 172, "lr": 8.153885259923168e-05} +{"train_loss": 0.006210152991116047, "global_step": 20546, "epoch": 172, "lr": 8.153713341229814e-05} +{"train_loss": 0.00372683210298419, "global_step": 20547, "epoch": 172, "lr": 8.153541416344479e-05} +{"train_loss": 0.008528604172170162, "global_step": 20548, "epoch": 172, "lr": 8.153369485267504e-05} +{"train_loss": 0.003799332771450281, "global_step": 20549, "epoch": 172, "lr": 8.153197547999222e-05} +{"train_loss": 0.008726208470761776, "global_step": 20550, "epoch": 172, "lr": 8.153025604539977e-05} +{"train_loss": 0.003954728599637747, "global_step": 20551, "epoch": 172, "lr": 8.152853654890101e-05} +{"train_loss": 0.005375016015022993, "global_step": 20552, "epoch": 172, "lr": 8.152681699049936e-05} +{"train_loss": 0.007863562554121017, "global_step": 20553, "epoch": 172, "lr": 8.152509737019813e-05} +{"train_loss": 0.009943144395947456, "global_step": 20554, "epoch": 172, "lr": 8.152337768800077e-05} +{"train_loss": 0.0033714796882122755, "global_step": 20555, "epoch": 172, "lr": 8.152165794391062e-05} +{"train_loss": 0.0055318488739430904, "global_step": 20556, "epoch": 172, "lr": 8.151993813793106e-05} +{"train_loss": 0.006928642280399799, "global_step": 20557, "epoch": 172, "lr": 8.151821827006548e-05} +{"train_loss": 0.007516501471400261, "global_step": 20558, "epoch": 172, "lr": 8.151649834031722e-05} +{"train_loss": 0.007434648461639881, "global_step": 20559, "epoch": 172, "lr": 8.15147783486897e-05} +{"train_loss": 0.004682672210037708, "global_step": 20560, "epoch": 172, "lr": 8.151305829518628e-05} +{"train_loss": 0.0056127822026610374, "global_step": 20561, "epoch": 172, "lr": 8.151133817981034e-05} +{"train_loss": 0.00523862149566412, "global_step": 20562, "epoch": 172, "lr": 8.150961800256524e-05} +{"train_loss": 0.005422339774668217, "global_step": 20563, "epoch": 172, "lr": 8.150789776345437e-05} +{"train_loss": 0.00700309919193387, "global_step": 20564, "epoch": 172, "lr": 8.150617746248113e-05} +{"train_loss": 0.00492988433688879, "global_step": 20565, "epoch": 172, "lr": 8.150445709964887e-05} +{"train_loss": 0.005303127691149712, "global_step": 20566, "epoch": 172, "lr": 8.150273667496098e-05} +{"train_loss": 0.007757491432130337, "global_step": 20567, "epoch": 172, "lr": 8.150101618842081e-05} +{"train_loss": 0.005911489482969046, "global_step": 20568, "epoch": 172, "lr": 8.149929564003177e-05} +{"train_loss": 0.004913438111543655, "global_step": 20569, "epoch": 172, "lr": 8.149757502979723e-05} +{"train_loss": 0.004409393761307001, "global_step": 20570, "epoch": 172, "lr": 8.149585435772057e-05} +{"train_loss": 0.003925404977053404, "global_step": 20571, "epoch": 172, "lr": 8.149413362380515e-05} +{"train_loss": 0.004491652362048626, "global_step": 20572, "epoch": 172, "lr": 8.149241282805437e-05} +{"train_loss": 0.006394998170435429, "global_step": 20573, "epoch": 172, "lr": 8.149069197047163e-05} +{"train_loss": 0.005009211599826813, "global_step": 20574, "epoch": 172, "lr": 8.148897105106024e-05} +{"train_loss": 0.004619996529072523, "global_step": 20575, "epoch": 172, "lr": 8.148725006982364e-05} +{"train_loss": 0.004160403273999691, "global_step": 20576, "epoch": 172, "lr": 8.148552902676518e-05} +{"train_loss": 0.005321061238646507, "global_step": 20577, "epoch": 172, "lr": 8.148380792188826e-05} +{"train_loss": 0.007348319515585899, "global_step": 20578, "epoch": 172, "lr": 8.148208675519624e-05} +{"train_loss": 0.005643210839480162, "global_step": 20579, "epoch": 172, "lr": 8.148036552669252e-05} +{"train_loss": 0.003251585178077221, "global_step": 20580, "epoch": 172, "lr": 8.147864423638042e-05} +{"train_loss": 0.004610602743923664, "global_step": 20581, "epoch": 172, "lr": 8.147692288426341e-05} +{"train_loss": 0.002933899173513055, "global_step": 20582, "epoch": 172, "lr": 8.14752014703448e-05} +{"train_loss": 0.004750341176986694, "global_step": 20583, "epoch": 172, "lr": 8.147347999462803e-05} +{"train_loss": 0.00708333496004343, "global_step": 20584, "epoch": 172, "lr": 8.147175845711641e-05} +{"train_loss": 0.004176185466349125, "global_step": 20585, "epoch": 172, "lr": 8.147003685781336e-05} +{"train_loss": 0.005114021486047061, "global_step": 20586, "epoch": 172, "lr": 8.146831519672225e-05, "val_loss": 0.012697887606918812} +{"train_loss": 0.00601332588121295, "global_step": 20587, "epoch": 173, "lr": 8.146659347384649e-05} +{"train_loss": 0.005547041073441505, "global_step": 20588, "epoch": 173, "lr": 8.146487168918941e-05} +{"train_loss": 0.004148774314671755, "global_step": 20589, "epoch": 173, "lr": 8.146314984275443e-05} +{"train_loss": 0.0026172788348048925, "global_step": 20590, "epoch": 173, "lr": 8.146142793454491e-05} +{"train_loss": 0.0023257089778780937, "global_step": 20591, "epoch": 173, "lr": 8.145970596456424e-05} +{"train_loss": 0.003309373278170824, "global_step": 20592, "epoch": 173, "lr": 8.145798393281579e-05} +{"train_loss": 0.004429335240274668, "global_step": 20593, "epoch": 173, "lr": 8.145626183930295e-05} +{"train_loss": 0.004759524948894978, "global_step": 20594, "epoch": 173, "lr": 8.145453968402912e-05} +{"train_loss": 0.004249064717441797, "global_step": 20595, "epoch": 173, "lr": 8.145281746699765e-05} +{"train_loss": 0.0056343539617955685, "global_step": 20596, "epoch": 173, "lr": 8.145109518821192e-05} +{"train_loss": 0.0024706521071493626, "global_step": 20597, "epoch": 173, "lr": 8.144937284767534e-05} +{"train_loss": 0.005504184868186712, "global_step": 20598, "epoch": 173, "lr": 8.144765044539128e-05} +{"train_loss": 0.007450752891600132, "global_step": 20599, "epoch": 173, "lr": 8.14459279813631e-05} +{"train_loss": 0.003854345763102174, "global_step": 20600, "epoch": 173, "lr": 8.144420545559422e-05} +{"train_loss": 0.003778159851208329, "global_step": 20601, "epoch": 173, "lr": 8.144248286808799e-05} +{"train_loss": 0.003289515618234873, "global_step": 20602, "epoch": 173, "lr": 8.144076021884781e-05} +{"train_loss": 0.003026357153430581, "global_step": 20603, "epoch": 173, "lr": 8.143903750787704e-05} +{"train_loss": 0.004334992729127407, "global_step": 20604, "epoch": 173, "lr": 8.143731473517911e-05} +{"train_loss": 0.00643908279016614, "global_step": 20605, "epoch": 173, "lr": 8.143559190075734e-05} +{"train_loss": 0.004648665897548199, "global_step": 20606, "epoch": 173, "lr": 8.143386900461517e-05} +{"train_loss": 0.003726484254002571, "global_step": 20607, "epoch": 173, "lr": 8.143214604675594e-05} +{"train_loss": 0.0037794290110468864, "global_step": 20608, "epoch": 173, "lr": 8.143042302718305e-05} +{"train_loss": 0.0035611791536211967, "global_step": 20609, "epoch": 173, "lr": 8.142869994589987e-05} +{"train_loss": 0.0037534425500780344, "global_step": 20610, "epoch": 173, "lr": 8.142697680290983e-05} +{"train_loss": 0.0032351769041270018, "global_step": 20611, "epoch": 173, "lr": 8.142525359821624e-05} +{"train_loss": 0.008567881770431995, "global_step": 20612, "epoch": 173, "lr": 8.142353033182255e-05} +{"train_loss": 0.005088679492473602, "global_step": 20613, "epoch": 173, "lr": 8.14218070037321e-05} +{"train_loss": 0.004223166964948177, "global_step": 20614, "epoch": 173, "lr": 8.14200836139483e-05} +{"train_loss": 0.003515692660585046, "global_step": 20615, "epoch": 173, "lr": 8.141836016247452e-05} +{"train_loss": 0.00746048241853714, "global_step": 20616, "epoch": 173, "lr": 8.141663664931414e-05} +{"train_loss": 0.0032701820600777864, "global_step": 20617, "epoch": 173, "lr": 8.141491307447055e-05} +{"train_loss": 0.004266162868589163, "global_step": 20618, "epoch": 173, "lr": 8.141318943794713e-05} +{"train_loss": 0.00497352983802557, "global_step": 20619, "epoch": 173, "lr": 8.141146573974729e-05} +{"train_loss": 0.005071008112281561, "global_step": 20620, "epoch": 173, "lr": 8.140974197987437e-05} +{"train_loss": 0.00715347845107317, "global_step": 20621, "epoch": 173, "lr": 8.140801815833179e-05} +{"train_loss": 0.004961090628057718, "global_step": 20622, "epoch": 173, "lr": 8.140629427512292e-05} +{"train_loss": 0.004329079296439886, "global_step": 20623, "epoch": 173, "lr": 8.140457033025113e-05} +{"train_loss": 0.005691239610314369, "global_step": 20624, "epoch": 173, "lr": 8.140284632371984e-05} +{"train_loss": 0.006082588341087103, "global_step": 20625, "epoch": 173, "lr": 8.140112225553243e-05} +{"train_loss": 0.0076895891688764095, "global_step": 20626, "epoch": 173, "lr": 8.139939812569224e-05} +{"train_loss": 0.006963114254176617, "global_step": 20627, "epoch": 173, "lr": 8.13976739342027e-05} +{"train_loss": 0.005222419276833534, "global_step": 20628, "epoch": 173, "lr": 8.139594968106719e-05} +{"train_loss": 0.00824753101915121, "global_step": 20629, "epoch": 173, "lr": 8.139422536628907e-05} +{"train_loss": 0.0039140693843364716, "global_step": 20630, "epoch": 173, "lr": 8.139250098987175e-05} +{"train_loss": 0.004378850106149912, "global_step": 20631, "epoch": 173, "lr": 8.139077655181861e-05} +{"train_loss": 0.006143013946712017, "global_step": 20632, "epoch": 173, "lr": 8.138905205213303e-05} +{"train_loss": 0.005225288216024637, "global_step": 20633, "epoch": 173, "lr": 8.138732749081841e-05} +{"train_loss": 0.005618975032120943, "global_step": 20634, "epoch": 173, "lr": 8.138560286787812e-05} +{"train_loss": 0.003281413810327649, "global_step": 20635, "epoch": 173, "lr": 8.138387818331554e-05} +{"train_loss": 0.005676967091858387, "global_step": 20636, "epoch": 173, "lr": 8.138215343713409e-05} +{"train_loss": 0.00603078119456768, "global_step": 20637, "epoch": 173, "lr": 8.138042862933711e-05} +{"train_loss": 0.002931798342615366, "global_step": 20638, "epoch": 173, "lr": 8.137870375992802e-05} +{"train_loss": 0.003786845365539193, "global_step": 20639, "epoch": 173, "lr": 8.13769788289102e-05} +{"train_loss": 0.009069472551345825, "global_step": 20640, "epoch": 173, "lr": 8.137525383628704e-05} +{"train_loss": 0.00784584041684866, "global_step": 20641, "epoch": 173, "lr": 8.137352878206193e-05} +{"train_loss": 0.006160794757306576, "global_step": 20642, "epoch": 173, "lr": 8.137180366623822e-05} +{"train_loss": 0.0064041768200695515, "global_step": 20643, "epoch": 173, "lr": 8.137007848881934e-05} +{"train_loss": 0.004473736509680748, "global_step": 20644, "epoch": 173, "lr": 8.136835324980866e-05} +{"train_loss": 0.0035500156227499247, "global_step": 20645, "epoch": 173, "lr": 8.136662794920958e-05} +{"train_loss": 0.0031578915659338236, "global_step": 20646, "epoch": 173, "lr": 8.136490258702547e-05} +{"train_loss": 0.004828035831451416, "global_step": 20647, "epoch": 173, "lr": 8.136317716325972e-05} +{"train_loss": 0.004233382176607847, "global_step": 20648, "epoch": 173, "lr": 8.136145167791571e-05} +{"train_loss": 0.003580735996365547, "global_step": 20649, "epoch": 173, "lr": 8.135972613099687e-05} +{"train_loss": 0.007508115377277136, "global_step": 20650, "epoch": 173, "lr": 8.135800052250653e-05} +{"train_loss": 0.007186437491327524, "global_step": 20651, "epoch": 173, "lr": 8.135627485244812e-05} +{"train_loss": 0.004999461583793163, "global_step": 20652, "epoch": 173, "lr": 8.135454912082503e-05} +{"train_loss": 0.003970252349972725, "global_step": 20653, "epoch": 173, "lr": 8.13528233276406e-05} +{"train_loss": 0.003256594529375434, "global_step": 20654, "epoch": 173, "lr": 8.135109747289827e-05} +{"train_loss": 0.005515292752534151, "global_step": 20655, "epoch": 173, "lr": 8.13493715566014e-05} +{"train_loss": 0.004793267231434584, "global_step": 20656, "epoch": 173, "lr": 8.134764557875341e-05} +{"train_loss": 0.005865407641977072, "global_step": 20657, "epoch": 173, "lr": 8.134591953935764e-05} +{"train_loss": 0.006266411859542131, "global_step": 20658, "epoch": 173, "lr": 8.134419343841752e-05} +{"train_loss": 0.006009313277900219, "global_step": 20659, "epoch": 173, "lr": 8.134246727593643e-05} +{"train_loss": 0.005947628524154425, "global_step": 20660, "epoch": 173, "lr": 8.134074105191774e-05} +{"train_loss": 0.0021564331836998463, "global_step": 20661, "epoch": 173, "lr": 8.133901476636486e-05} +{"train_loss": 0.0047309803776443005, "global_step": 20662, "epoch": 173, "lr": 8.133728841928117e-05} +{"train_loss": 0.005357538815587759, "global_step": 20663, "epoch": 173, "lr": 8.133556201067006e-05} +{"train_loss": 0.00532095180824399, "global_step": 20664, "epoch": 173, "lr": 8.133383554053493e-05} +{"train_loss": 0.004687433131039143, "global_step": 20665, "epoch": 173, "lr": 8.133210900887915e-05} +{"train_loss": 0.006912314798682928, "global_step": 20666, "epoch": 173, "lr": 8.133038241570614e-05} +{"train_loss": 0.007567789405584335, "global_step": 20667, "epoch": 173, "lr": 8.132865576101926e-05} +{"train_loss": 0.0059273736551404, "global_step": 20668, "epoch": 173, "lr": 8.132692904482191e-05} +{"train_loss": 0.007801647298038006, "global_step": 20669, "epoch": 173, "lr": 8.132520226711748e-05} +{"train_loss": 0.00926101952791214, "global_step": 20670, "epoch": 173, "lr": 8.132347542790937e-05} +{"train_loss": 0.0027296901680529118, "global_step": 20671, "epoch": 173, "lr": 8.132174852720096e-05} +{"train_loss": 0.005210353061556816, "global_step": 20672, "epoch": 173, "lr": 8.132002156499563e-05} +{"train_loss": 0.008507702499628067, "global_step": 20673, "epoch": 173, "lr": 8.131829454129679e-05} +{"train_loss": 0.00588199682533741, "global_step": 20674, "epoch": 173, "lr": 8.131656745610782e-05} +{"train_loss": 0.008519415743649006, "global_step": 20675, "epoch": 173, "lr": 8.131484030943213e-05} +{"train_loss": 0.006564189679920673, "global_step": 20676, "epoch": 173, "lr": 8.13131131012731e-05} +{"train_loss": 0.005733470898121595, "global_step": 20677, "epoch": 173, "lr": 8.13113858316341e-05} +{"train_loss": 0.007507988717406988, "global_step": 20678, "epoch": 173, "lr": 8.130965850051855e-05} +{"train_loss": 0.005449105519801378, "global_step": 20679, "epoch": 173, "lr": 8.130793110792983e-05} +{"train_loss": 0.00579416798427701, "global_step": 20680, "epoch": 173, "lr": 8.130620365387132e-05} +{"train_loss": 0.006171722896397114, "global_step": 20681, "epoch": 173, "lr": 8.130447613834643e-05} +{"train_loss": 0.007074344903230667, "global_step": 20682, "epoch": 173, "lr": 8.130274856135856e-05} +{"train_loss": 0.005984800402075052, "global_step": 20683, "epoch": 173, "lr": 8.130102092291108e-05} +{"train_loss": 0.006989669986069202, "global_step": 20684, "epoch": 173, "lr": 8.129929322300738e-05} +{"train_loss": 0.004726724233478308, "global_step": 20685, "epoch": 173, "lr": 8.129756546165087e-05} +{"train_loss": 0.005277996417135, "global_step": 20686, "epoch": 173, "lr": 8.129583763884492e-05} +{"train_loss": 0.0023900640662759542, "global_step": 20687, "epoch": 173, "lr": 8.129410975459294e-05} +{"train_loss": 0.009660793468356133, "global_step": 20688, "epoch": 173, "lr": 8.129238180889835e-05} +{"train_loss": 0.004582440480589867, "global_step": 20689, "epoch": 173, "lr": 8.129065380176448e-05} +{"train_loss": 0.0036626525688916445, "global_step": 20690, "epoch": 173, "lr": 8.128892573319477e-05} +{"train_loss": 0.0076110451482236385, "global_step": 20691, "epoch": 173, "lr": 8.12871976031926e-05} +{"train_loss": 0.007187873590737581, "global_step": 20692, "epoch": 173, "lr": 8.128546941176132e-05} +{"train_loss": 0.004399397410452366, "global_step": 20693, "epoch": 173, "lr": 8.12837411589044e-05} +{"train_loss": 0.0062586222775280476, "global_step": 20694, "epoch": 173, "lr": 8.128201284462518e-05} +{"train_loss": 0.005573754198849201, "global_step": 20695, "epoch": 173, "lr": 8.128028446892709e-05} +{"train_loss": 0.006333624478429556, "global_step": 20696, "epoch": 173, "lr": 8.127855603181349e-05} +{"train_loss": 0.005577160511165857, "global_step": 20697, "epoch": 173, "lr": 8.127682753328778e-05} +{"train_loss": 0.007841254584491253, "global_step": 20698, "epoch": 173, "lr": 8.127509897335337e-05} +{"train_loss": 0.00594613142311573, "global_step": 20699, "epoch": 173, "lr": 8.127337035201366e-05} +{"train_loss": 0.006457450333982706, "global_step": 20700, "epoch": 173, "lr": 8.127164166927199e-05} +{"train_loss": 0.005854459013789892, "global_step": 20701, "epoch": 173, "lr": 8.126991292513182e-05} +{"train_loss": 0.0038562549743801355, "global_step": 20702, "epoch": 173, "lr": 8.126818411959652e-05} +{"train_loss": 0.005357392597943544, "global_step": 20703, "epoch": 173, "lr": 8.126645525266947e-05} +{"train_loss": 0.0062741744332015514, "global_step": 20704, "epoch": 173, "lr": 8.126472632435407e-05} +{"train_loss": 0.005375249491331457, "global_step": 20705, "epoch": 173, "lr": 8.126299733465373e-05, "val_loss": 0.008151035755872726} +{"train_loss": 0.006261586211621761, "global_step": 20706, "epoch": 174, "lr": 8.126126828357184e-05} +{"train_loss": 0.0071307457983493805, "global_step": 20707, "epoch": 174, "lr": 8.125953917111177e-05} +{"train_loss": 0.009288976900279522, "global_step": 20708, "epoch": 174, "lr": 8.125780999727695e-05} +{"train_loss": 0.004240016918629408, "global_step": 20709, "epoch": 174, "lr": 8.125608076207076e-05} +{"train_loss": 0.008467590436339378, "global_step": 20710, "epoch": 174, "lr": 8.125435146549658e-05} +{"train_loss": 0.007181673310697079, "global_step": 20711, "epoch": 174, "lr": 8.125262210755784e-05} +{"train_loss": 0.004731662571430206, "global_step": 20712, "epoch": 174, "lr": 8.125089268825789e-05} +{"train_loss": 0.008043457753956318, "global_step": 20713, "epoch": 174, "lr": 8.124916320760017e-05} +{"train_loss": 0.007381269242614508, "global_step": 20714, "epoch": 174, "lr": 8.124743366558805e-05} +{"train_loss": 0.0056261224672198296, "global_step": 20715, "epoch": 174, "lr": 8.124570406222494e-05} +{"train_loss": 0.00482520367950201, "global_step": 20716, "epoch": 174, "lr": 8.124397439751423e-05} +{"train_loss": 0.005438348278403282, "global_step": 20717, "epoch": 174, "lr": 8.124224467145931e-05} +{"train_loss": 0.005829601548612118, "global_step": 20718, "epoch": 174, "lr": 8.124051488406357e-05} +{"train_loss": 0.004133164416998625, "global_step": 20719, "epoch": 174, "lr": 8.123878503533043e-05} +{"train_loss": 0.0033419702667742968, "global_step": 20720, "epoch": 174, "lr": 8.123705512526326e-05} +{"train_loss": 0.004311536438763142, "global_step": 20721, "epoch": 174, "lr": 8.123532515386548e-05} +{"train_loss": 0.003283093683421612, "global_step": 20722, "epoch": 174, "lr": 8.123359512114048e-05} +{"train_loss": 0.003075981279835105, "global_step": 20723, "epoch": 174, "lr": 8.123186502709163e-05} +{"train_loss": 0.004931586794555187, "global_step": 20724, "epoch": 174, "lr": 8.123013487172237e-05} +{"train_loss": 0.00506548909470439, "global_step": 20725, "epoch": 174, "lr": 8.122840465503607e-05} +{"train_loss": 0.00400790898129344, "global_step": 20726, "epoch": 174, "lr": 8.122667437703613e-05} +{"train_loss": 0.0070976875722408295, "global_step": 20727, "epoch": 174, "lr": 8.122494403772596e-05} +{"train_loss": 0.003564625047147274, "global_step": 20728, "epoch": 174, "lr": 8.122321363710896e-05} +{"train_loss": 0.0037807058542966843, "global_step": 20729, "epoch": 174, "lr": 8.12214831751885e-05} +{"train_loss": 0.0065902601927518845, "global_step": 20730, "epoch": 174, "lr": 8.121975265196798e-05} +{"train_loss": 0.0033592490945011377, "global_step": 20731, "epoch": 174, "lr": 8.121802206745083e-05} +{"train_loss": 0.005894017871469259, "global_step": 20732, "epoch": 174, "lr": 8.121629142164042e-05} +{"train_loss": 0.005411961115896702, "global_step": 20733, "epoch": 174, "lr": 8.121456071454017e-05} +{"train_loss": 0.0049803368747234344, "global_step": 20734, "epoch": 174, "lr": 8.121282994615345e-05} +{"train_loss": 0.005637805443257093, "global_step": 20735, "epoch": 174, "lr": 8.121109911648368e-05} +{"train_loss": 0.0037210851442068815, "global_step": 20736, "epoch": 174, "lr": 8.120936822553424e-05} +{"train_loss": 0.004603451583534479, "global_step": 20737, "epoch": 174, "lr": 8.120763727330856e-05} +{"train_loss": 0.0032012895680963993, "global_step": 20738, "epoch": 174, "lr": 8.120590625981e-05} +{"train_loss": 0.0058931466192007065, "global_step": 20739, "epoch": 174, "lr": 8.120417518504197e-05} +{"train_loss": 0.0041457535699009895, "global_step": 20740, "epoch": 174, "lr": 8.12024440490079e-05} +{"train_loss": 0.005643871612846851, "global_step": 20741, "epoch": 174, "lr": 8.120071285171115e-05} +{"train_loss": 0.005249068606644869, "global_step": 20742, "epoch": 174, "lr": 8.119898159315515e-05} +{"train_loss": 0.00582027668133378, "global_step": 20743, "epoch": 174, "lr": 8.119725027334326e-05} +{"train_loss": 0.005640587769448757, "global_step": 20744, "epoch": 174, "lr": 8.119551889227893e-05} +{"train_loss": 0.004256994929164648, "global_step": 20745, "epoch": 174, "lr": 8.119378744996551e-05} +{"train_loss": 0.0034819135908037424, "global_step": 20746, "epoch": 174, "lr": 8.119205594640642e-05} +{"train_loss": 0.005265212617814541, "global_step": 20747, "epoch": 174, "lr": 8.119032438160507e-05} +{"train_loss": 0.004845756106078625, "global_step": 20748, "epoch": 174, "lr": 8.118859275556486e-05} +{"train_loss": 0.004290195181965828, "global_step": 20749, "epoch": 174, "lr": 8.118686106828914e-05} +{"train_loss": 0.006592522840946913, "global_step": 20750, "epoch": 174, "lr": 8.118512931978138e-05} +{"train_loss": 0.005357112269848585, "global_step": 20751, "epoch": 174, "lr": 8.118339751004495e-05} +{"train_loss": 0.0048506902530789375, "global_step": 20752, "epoch": 174, "lr": 8.118166563908325e-05} +{"train_loss": 0.005096603184938431, "global_step": 20753, "epoch": 174, "lr": 8.117993370689968e-05} +{"train_loss": 0.007035253569483757, "global_step": 20754, "epoch": 174, "lr": 8.117820171349763e-05} +{"train_loss": 0.009172062389552593, "global_step": 20755, "epoch": 174, "lr": 8.117646965888052e-05} +{"train_loss": 0.0053891330026090145, "global_step": 20756, "epoch": 174, "lr": 8.117473754305174e-05} +{"train_loss": 0.005647815298289061, "global_step": 20757, "epoch": 174, "lr": 8.117300536601471e-05} +{"train_loss": 0.0047473059967160225, "global_step": 20758, "epoch": 174, "lr": 8.11712731277728e-05} +{"train_loss": 0.004353049211204052, "global_step": 20759, "epoch": 174, "lr": 8.116954082832944e-05} +{"train_loss": 0.005105192773044109, "global_step": 20760, "epoch": 174, "lr": 8.116780846768798e-05} +{"train_loss": 0.0060995896346867085, "global_step": 20761, "epoch": 174, "lr": 8.11660760458519e-05} +{"train_loss": 0.0033620852045714855, "global_step": 20762, "epoch": 174, "lr": 8.116434356282452e-05} +{"train_loss": 0.006096425466239452, "global_step": 20763, "epoch": 174, "lr": 8.116261101860932e-05} +{"train_loss": 0.006367597263306379, "global_step": 20764, "epoch": 174, "lr": 8.116087841320963e-05} +{"train_loss": 0.003794898046180606, "global_step": 20765, "epoch": 174, "lr": 8.11591457466289e-05} +{"train_loss": 0.007292379625141621, "global_step": 20766, "epoch": 174, "lr": 8.115741301887052e-05} +{"train_loss": 0.00434851786121726, "global_step": 20767, "epoch": 174, "lr": 8.115568022993788e-05} +{"train_loss": 0.005035900976508856, "global_step": 20768, "epoch": 174, "lr": 8.11539473798344e-05} +{"train_loss": 0.00469960505142808, "global_step": 20769, "epoch": 174, "lr": 8.115221446856344e-05} +{"train_loss": 0.005283050704747438, "global_step": 20770, "epoch": 174, "lr": 8.115048149612847e-05} +{"train_loss": 0.004367073532193899, "global_step": 20771, "epoch": 174, "lr": 8.114874846253287e-05} +{"train_loss": 0.0046668024733662605, "global_step": 20772, "epoch": 174, "lr": 8.114701536777999e-05} +{"train_loss": 0.006588960066437721, "global_step": 20773, "epoch": 174, "lr": 8.114528221187329e-05} +{"train_loss": 0.005216846242547035, "global_step": 20774, "epoch": 174, "lr": 8.114354899481615e-05} +{"train_loss": 0.005580310709774494, "global_step": 20775, "epoch": 174, "lr": 8.114181571661199e-05} +{"train_loss": 0.0075010680593550205, "global_step": 20776, "epoch": 174, "lr": 8.11400823772642e-05} +{"train_loss": 0.004310603719204664, "global_step": 20777, "epoch": 174, "lr": 8.113834897677618e-05} +{"train_loss": 0.004268085118383169, "global_step": 20778, "epoch": 174, "lr": 8.113661551515134e-05} +{"train_loss": 0.005593124311417341, "global_step": 20779, "epoch": 174, "lr": 8.113488199239309e-05} +{"train_loss": 0.007048267871141434, "global_step": 20780, "epoch": 174, "lr": 8.113314840850482e-05} +{"train_loss": 0.00456957658752799, "global_step": 20781, "epoch": 174, "lr": 8.113141476348993e-05} +{"train_loss": 0.004819881170988083, "global_step": 20782, "epoch": 174, "lr": 8.112968105735183e-05} +{"train_loss": 0.005783243104815483, "global_step": 20783, "epoch": 174, "lr": 8.112794729009394e-05} +{"train_loss": 0.004290893208235502, "global_step": 20784, "epoch": 174, "lr": 8.112621346171966e-05} +{"train_loss": 0.0037865731865167618, "global_step": 20785, "epoch": 174, "lr": 8.112447957223237e-05} +{"train_loss": 0.005139765329658985, "global_step": 20786, "epoch": 174, "lr": 8.112274562163549e-05} +{"train_loss": 0.006717780139297247, "global_step": 20787, "epoch": 174, "lr": 8.112101160993243e-05} +{"train_loss": 0.005165088456124067, "global_step": 20788, "epoch": 174, "lr": 8.111927753712658e-05} +{"train_loss": 0.005849878769367933, "global_step": 20789, "epoch": 174, "lr": 8.111754340322136e-05} +{"train_loss": 0.005170403514057398, "global_step": 20790, "epoch": 174, "lr": 8.111580920822018e-05} +{"train_loss": 0.007160273380577564, "global_step": 20791, "epoch": 174, "lr": 8.111407495212642e-05} +{"train_loss": 0.00635929312556982, "global_step": 20792, "epoch": 174, "lr": 8.111234063494349e-05} +{"train_loss": 0.006536354776471853, "global_step": 20793, "epoch": 174, "lr": 8.111060625667481e-05} +{"train_loss": 0.004129619803279638, "global_step": 20794, "epoch": 174, "lr": 8.110887181732379e-05} +{"train_loss": 0.006687580607831478, "global_step": 20795, "epoch": 174, "lr": 8.11071373168938e-05} +{"train_loss": 0.006296559236943722, "global_step": 20796, "epoch": 174, "lr": 8.110540275538829e-05} +{"train_loss": 0.008374224416911602, "global_step": 20797, "epoch": 174, "lr": 8.110366813281063e-05} +{"train_loss": 0.00462854839861393, "global_step": 20798, "epoch": 174, "lr": 8.110193344916425e-05} +{"train_loss": 0.00496843783184886, "global_step": 20799, "epoch": 174, "lr": 8.110019870445253e-05} +{"train_loss": 0.005765819922089577, "global_step": 20800, "epoch": 174, "lr": 8.109846389867891e-05} +{"train_loss": 0.008876497857272625, "global_step": 20801, "epoch": 174, "lr": 8.109672903184677e-05} +{"train_loss": 0.0059554544277489185, "global_step": 20802, "epoch": 174, "lr": 8.109499410395953e-05} +{"train_loss": 0.008152483031153679, "global_step": 20803, "epoch": 174, "lr": 8.10932591150206e-05} +{"train_loss": 0.007071834057569504, "global_step": 20804, "epoch": 174, "lr": 8.109152406503337e-05} +{"train_loss": 0.0027579767629504204, "global_step": 20805, "epoch": 174, "lr": 8.108978895400125e-05} +{"train_loss": 0.008781790733337402, "global_step": 20806, "epoch": 174, "lr": 8.108805378192765e-05} +{"train_loss": 0.00650141341611743, "global_step": 20807, "epoch": 174, "lr": 8.108631854881598e-05} +{"train_loss": 0.004370478447526693, "global_step": 20808, "epoch": 174, "lr": 8.108458325466963e-05} +{"train_loss": 0.005587889812886715, "global_step": 20809, "epoch": 174, "lr": 8.108284789949205e-05} +{"train_loss": 0.004057702608406544, "global_step": 20810, "epoch": 174, "lr": 8.10811124832866e-05} +{"train_loss": 0.0038563134148716927, "global_step": 20811, "epoch": 174, "lr": 8.107937700605672e-05} +{"train_loss": 0.0059092482551932335, "global_step": 20812, "epoch": 174, "lr": 8.107764146780579e-05} +{"train_loss": 0.005884082522243261, "global_step": 20813, "epoch": 174, "lr": 8.107590586853724e-05} +{"train_loss": 0.005472394172102213, "global_step": 20814, "epoch": 174, "lr": 8.107417020825445e-05} +{"train_loss": 0.004660028964281082, "global_step": 20815, "epoch": 174, "lr": 8.107243448696087e-05} +{"train_loss": 0.004672682378441095, "global_step": 20816, "epoch": 174, "lr": 8.107069870465989e-05} +{"train_loss": 0.005163644440472126, "global_step": 20817, "epoch": 174, "lr": 8.106896286135489e-05} +{"train_loss": 0.008466266095638275, "global_step": 20818, "epoch": 174, "lr": 8.106722695704932e-05} +{"train_loss": 0.007352420128881931, "global_step": 20819, "epoch": 174, "lr": 8.106549099174654e-05} +{"train_loss": 0.002851872704923153, "global_step": 20820, "epoch": 174, "lr": 8.106375496545001e-05} +{"train_loss": 0.004518942441791296, "global_step": 20821, "epoch": 174, "lr": 8.10620188781631e-05} +{"train_loss": 0.006549956742674112, "global_step": 20822, "epoch": 174, "lr": 8.106028272988926e-05} +{"train_loss": 0.007541435770690441, "global_step": 20823, "epoch": 174, "lr": 8.105854652063185e-05} +{"train_loss": 0.005481540706759992, "global_step": 20824, "epoch": 174, "lr": 8.105681025039432e-05, "val_loss": 0.01211574487388134} +{"train_loss": 0.005923050921410322, "global_step": 20825, "epoch": 175, "lr": 8.105507391918005e-05} +{"train_loss": 0.0032356486190110445, "global_step": 20826, "epoch": 175, "lr": 8.105333752699245e-05} +{"train_loss": 0.0029595692176371813, "global_step": 20827, "epoch": 175, "lr": 8.105160107383496e-05} +{"train_loss": 0.00647598784416914, "global_step": 20828, "epoch": 175, "lr": 8.104986455971096e-05} +{"train_loss": 0.004839736502617598, "global_step": 20829, "epoch": 175, "lr": 8.104812798462386e-05} +{"train_loss": 0.0037605923134833574, "global_step": 20830, "epoch": 175, "lr": 8.10463913485771e-05} +{"train_loss": 0.009460998699069023, "global_step": 20831, "epoch": 175, "lr": 8.104465465157404e-05} +{"train_loss": 0.004134080372750759, "global_step": 20832, "epoch": 175, "lr": 8.104291789361813e-05} +{"train_loss": 0.004991999827325344, "global_step": 20833, "epoch": 175, "lr": 8.104118107471277e-05} +{"train_loss": 0.004942228086292744, "global_step": 20834, "epoch": 175, "lr": 8.103944419486138e-05} +{"train_loss": 0.003777544479817152, "global_step": 20835, "epoch": 175, "lr": 8.103770725406734e-05} +{"train_loss": 0.0034608833957463503, "global_step": 20836, "epoch": 175, "lr": 8.103597025233407e-05} +{"train_loss": 0.00882125087082386, "global_step": 20837, "epoch": 175, "lr": 8.1034233189665e-05} +{"train_loss": 0.004016601946204901, "global_step": 20838, "epoch": 175, "lr": 8.103249606606352e-05} +{"train_loss": 0.007873743772506714, "global_step": 20839, "epoch": 175, "lr": 8.103075888153307e-05} +{"train_loss": 0.006846363190561533, "global_step": 20840, "epoch": 175, "lr": 8.102902163607702e-05} +{"train_loss": 0.0038749845698475838, "global_step": 20841, "epoch": 175, "lr": 8.102728432969882e-05} +{"train_loss": 0.0033878765534609556, "global_step": 20842, "epoch": 175, "lr": 8.102554696240183e-05} +{"train_loss": 0.0030387574806809425, "global_step": 20843, "epoch": 175, "lr": 8.102380953418952e-05} +{"train_loss": 0.003340735100209713, "global_step": 20844, "epoch": 175, "lr": 8.102207204506526e-05} +{"train_loss": 0.004581323359161615, "global_step": 20845, "epoch": 175, "lr": 8.102033449503248e-05} +{"train_loss": 0.004744408652186394, "global_step": 20846, "epoch": 175, "lr": 8.101859688409459e-05} +{"train_loss": 0.006572759710252285, "global_step": 20847, "epoch": 175, "lr": 8.101685921225501e-05} +{"train_loss": 0.0035695384722203016, "global_step": 20848, "epoch": 175, "lr": 8.101512147951713e-05} +{"train_loss": 0.005565802101045847, "global_step": 20849, "epoch": 175, "lr": 8.101338368588435e-05} +{"train_loss": 0.0063559734262526035, "global_step": 20850, "epoch": 175, "lr": 8.101164583136014e-05} +{"train_loss": 0.0046805888414382935, "global_step": 20851, "epoch": 175, "lr": 8.100990791594786e-05} +{"train_loss": 0.006761953700333834, "global_step": 20852, "epoch": 175, "lr": 8.100816993965094e-05} +{"train_loss": 0.006053978111594915, "global_step": 20853, "epoch": 175, "lr": 8.10064319024728e-05} +{"train_loss": 0.005491313524544239, "global_step": 20854, "epoch": 175, "lr": 8.100469380441683e-05} +{"train_loss": 0.004566607065498829, "global_step": 20855, "epoch": 175, "lr": 8.100295564548647e-05} +{"train_loss": 0.005123603157699108, "global_step": 20856, "epoch": 175, "lr": 8.10012174256851e-05} +{"train_loss": 0.003986581694334745, "global_step": 20857, "epoch": 175, "lr": 8.099947914501617e-05} +{"train_loss": 0.004615469835698605, "global_step": 20858, "epoch": 175, "lr": 8.099774080348306e-05} +{"train_loss": 0.00437906151637435, "global_step": 20859, "epoch": 175, "lr": 8.099600240108921e-05} +{"train_loss": 0.003884674981236458, "global_step": 20860, "epoch": 175, "lr": 8.0994263937838e-05} +{"train_loss": 0.004591570235788822, "global_step": 20861, "epoch": 175, "lr": 8.09925254137329e-05} +{"train_loss": 0.005278559867292643, "global_step": 20862, "epoch": 175, "lr": 8.099078682877726e-05} +{"train_loss": 0.006020150147378445, "global_step": 20863, "epoch": 175, "lr": 8.098904818297453e-05} +{"train_loss": 0.005222368519753218, "global_step": 20864, "epoch": 175, "lr": 8.098730947632811e-05} +{"train_loss": 0.005785101559013128, "global_step": 20865, "epoch": 175, "lr": 8.098557070884143e-05} +{"train_loss": 0.0032206482719630003, "global_step": 20866, "epoch": 175, "lr": 8.098383188051787e-05} +{"train_loss": 0.003985904622823, "global_step": 20867, "epoch": 175, "lr": 8.098209299136089e-05} +{"train_loss": 0.005164469126611948, "global_step": 20868, "epoch": 175, "lr": 8.098035404137387e-05} +{"train_loss": 0.00555479247123003, "global_step": 20869, "epoch": 175, "lr": 8.097861503056022e-05} +{"train_loss": 0.004379981197416782, "global_step": 20870, "epoch": 175, "lr": 8.097687595892338e-05} +{"train_loss": 0.005333001725375652, "global_step": 20871, "epoch": 175, "lr": 8.097513682646676e-05} +{"train_loss": 0.005127794574946165, "global_step": 20872, "epoch": 175, "lr": 8.097339763319376e-05} +{"train_loss": 0.0063578723929822445, "global_step": 20873, "epoch": 175, "lr": 8.09716583791078e-05} +{"train_loss": 0.007789256051182747, "global_step": 20874, "epoch": 175, "lr": 8.096991906421233e-05} +{"train_loss": 0.007885564118623734, "global_step": 20875, "epoch": 175, "lr": 8.09681796885107e-05} +{"train_loss": 0.004521246068179607, "global_step": 20876, "epoch": 175, "lr": 8.096644025200636e-05} +{"train_loss": 0.006619241554290056, "global_step": 20877, "epoch": 175, "lr": 8.096470075470272e-05} +{"train_loss": 0.0053199236281216145, "global_step": 20878, "epoch": 175, "lr": 8.096296119660322e-05} +{"train_loss": 0.005769162438809872, "global_step": 20879, "epoch": 175, "lr": 8.096122157771123e-05} +{"train_loss": 0.005209656432271004, "global_step": 20880, "epoch": 175, "lr": 8.09594818980302e-05} +{"train_loss": 0.003476174548268318, "global_step": 20881, "epoch": 175, "lr": 8.095774215756353e-05} +{"train_loss": 0.006489180494099855, "global_step": 20882, "epoch": 175, "lr": 8.095600235631464e-05} +{"train_loss": 0.0030991393141448498, "global_step": 20883, "epoch": 175, "lr": 8.095426249428695e-05} +{"train_loss": 0.006005174480378628, "global_step": 20884, "epoch": 175, "lr": 8.095252257148388e-05} +{"train_loss": 0.006798713468015194, "global_step": 20885, "epoch": 175, "lr": 8.095078258790883e-05} +{"train_loss": 0.004395002499222755, "global_step": 20886, "epoch": 175, "lr": 8.094904254356523e-05} +{"train_loss": 0.0029373872093856335, "global_step": 20887, "epoch": 175, "lr": 8.094730243845649e-05} +{"train_loss": 0.003789621638134122, "global_step": 20888, "epoch": 175, "lr": 8.094556227258601e-05} +{"train_loss": 0.00700982753187418, "global_step": 20889, "epoch": 175, "lr": 8.094382204595725e-05} +{"train_loss": 0.005589993204921484, "global_step": 20890, "epoch": 175, "lr": 8.094208175857361e-05} +{"train_loss": 0.006399764679372311, "global_step": 20891, "epoch": 175, "lr": 8.094034141043848e-05} +{"train_loss": 0.0025197311770170927, "global_step": 20892, "epoch": 175, "lr": 8.093860100155528e-05} +{"train_loss": 0.003996637649834156, "global_step": 20893, "epoch": 175, "lr": 8.093686053192747e-05} +{"train_loss": 0.00561604555696249, "global_step": 20894, "epoch": 175, "lr": 8.093512000155841e-05} +{"train_loss": 0.0036309114657342434, "global_step": 20895, "epoch": 175, "lr": 8.093337941045156e-05} +{"train_loss": 0.004714879672974348, "global_step": 20896, "epoch": 175, "lr": 8.093163875861032e-05} +{"train_loss": 0.007040061522275209, "global_step": 20897, "epoch": 175, "lr": 8.092989804603814e-05} +{"train_loss": 0.003008468309417367, "global_step": 20898, "epoch": 175, "lr": 8.092815727273839e-05} +{"train_loss": 0.008516652509570122, "global_step": 20899, "epoch": 175, "lr": 8.09264164387145e-05} +{"train_loss": 0.0058008222840726376, "global_step": 20900, "epoch": 175, "lr": 8.09246755439699e-05} +{"train_loss": 0.003622123971581459, "global_step": 20901, "epoch": 175, "lr": 8.092293458850802e-05} +{"train_loss": 0.004302970599383116, "global_step": 20902, "epoch": 175, "lr": 8.092119357233223e-05} +{"train_loss": 0.005286892410367727, "global_step": 20903, "epoch": 175, "lr": 8.091945249544601e-05} +{"train_loss": 0.008061070926487446, "global_step": 20904, "epoch": 175, "lr": 8.091771135785273e-05} +{"train_loss": 0.005555466283112764, "global_step": 20905, "epoch": 175, "lr": 8.091597015955583e-05} +{"train_loss": 0.005328700412064791, "global_step": 20906, "epoch": 175, "lr": 8.091422890055874e-05} +{"train_loss": 0.003028139006346464, "global_step": 20907, "epoch": 175, "lr": 8.091248758086484e-05} +{"train_loss": 0.004651564639061689, "global_step": 20908, "epoch": 175, "lr": 8.091074620047758e-05} +{"train_loss": 0.00521534588187933, "global_step": 20909, "epoch": 175, "lr": 8.090900475940037e-05} +{"train_loss": 0.006651062052696943, "global_step": 20910, "epoch": 175, "lr": 8.090726325763664e-05} +{"train_loss": 0.004230923019349575, "global_step": 20911, "epoch": 175, "lr": 8.090552169518981e-05} +{"train_loss": 0.005405945237725973, "global_step": 20912, "epoch": 175, "lr": 8.090378007206327e-05} +{"train_loss": 0.00319873308762908, "global_step": 20913, "epoch": 175, "lr": 8.090203838826047e-05} +{"train_loss": 0.005175712052732706, "global_step": 20914, "epoch": 175, "lr": 8.090029664378483e-05} +{"train_loss": 0.005194955971091986, "global_step": 20915, "epoch": 175, "lr": 8.089855483863972e-05} +{"train_loss": 0.006380212027579546, "global_step": 20916, "epoch": 175, "lr": 8.089681297282866e-05} +{"train_loss": 0.004455448593944311, "global_step": 20917, "epoch": 175, "lr": 8.089507104635495e-05} +{"train_loss": 0.004576859995722771, "global_step": 20918, "epoch": 175, "lr": 8.089332905922209e-05} +{"train_loss": 0.004825770389288664, "global_step": 20919, "epoch": 175, "lr": 8.089158701143349e-05} +{"train_loss": 0.004266115836799145, "global_step": 20920, "epoch": 175, "lr": 8.088984490299254e-05} +{"train_loss": 0.007284859195351601, "global_step": 20921, "epoch": 175, "lr": 8.088810273390269e-05} +{"train_loss": 0.0038282787427306175, "global_step": 20922, "epoch": 175, "lr": 8.088636050416736e-05} +{"train_loss": 0.004074165131896734, "global_step": 20923, "epoch": 175, "lr": 8.088461821378994e-05} +{"train_loss": 0.006743328180164099, "global_step": 20924, "epoch": 175, "lr": 8.088287586277389e-05} +{"train_loss": 0.0046884226612746716, "global_step": 20925, "epoch": 175, "lr": 8.08811334511226e-05} +{"train_loss": 0.0041391863487660885, "global_step": 20926, "epoch": 175, "lr": 8.087939097883951e-05} +{"train_loss": 0.006437179632484913, "global_step": 20927, "epoch": 175, "lr": 8.087764844592802e-05} +{"train_loss": 0.006419560872018337, "global_step": 20928, "epoch": 175, "lr": 8.087590585239159e-05} +{"train_loss": 0.003872513771057129, "global_step": 20929, "epoch": 175, "lr": 8.087416319823361e-05} +{"train_loss": 0.0038305160123854876, "global_step": 20930, "epoch": 175, "lr": 8.08724204834575e-05} +{"train_loss": 0.007680697366595268, "global_step": 20931, "epoch": 175, "lr": 8.08706777080667e-05} +{"train_loss": 0.0040907058864831924, "global_step": 20932, "epoch": 175, "lr": 8.086893487206462e-05} +{"train_loss": 0.004213343374431133, "global_step": 20933, "epoch": 175, "lr": 8.086719197545467e-05} +{"train_loss": 0.003404116490855813, "global_step": 20934, "epoch": 175, "lr": 8.086544901824032e-05} +{"train_loss": 0.004555764142423868, "global_step": 20935, "epoch": 175, "lr": 8.086370600042493e-05} +{"train_loss": 0.0057018836960196495, "global_step": 20936, "epoch": 175, "lr": 8.086196292201195e-05} +{"train_loss": 0.004675713833421469, "global_step": 20937, "epoch": 175, "lr": 8.086021978300482e-05} +{"train_loss": 0.005997358821332455, "global_step": 20938, "epoch": 175, "lr": 8.085847658340693e-05} +{"train_loss": 0.004062793217599392, "global_step": 20939, "epoch": 175, "lr": 8.085673332322173e-05} +{"train_loss": 0.0059721264988183975, "global_step": 20940, "epoch": 175, "lr": 8.085499000245262e-05} +{"train_loss": 0.004849513527005911, "global_step": 20941, "epoch": 175, "lr": 8.085324662110305e-05} +{"train_loss": 0.0032010118011385202, "global_step": 20942, "epoch": 175, "lr": 8.08515031791764e-05} +{"train_loss": 0.005084303154868363, "global_step": 20943, "epoch": 175, "lr": 8.084975967667614e-05, "val_loss": 0.016000032424926758, "train_action_mse_error": 0.00014754734002053738} +{"train_loss": 0.002679383847862482, "global_step": 20944, "epoch": 176, "lr": 8.084801611360566e-05} +{"train_loss": 0.00486270897090435, "global_step": 20945, "epoch": 176, "lr": 8.08462724899684e-05} +{"train_loss": 0.005711974110454321, "global_step": 20946, "epoch": 176, "lr": 8.084452880576778e-05} +{"train_loss": 0.006180198397487402, "global_step": 20947, "epoch": 176, "lr": 8.084278506100725e-05} +{"train_loss": 0.002795050386339426, "global_step": 20948, "epoch": 176, "lr": 8.084104125569017e-05} +{"train_loss": 0.005900012794882059, "global_step": 20949, "epoch": 176, "lr": 8.083929738982001e-05} +{"train_loss": 0.006319667678326368, "global_step": 20950, "epoch": 176, "lr": 8.083755346340019e-05} +{"train_loss": 0.002402673475444317, "global_step": 20951, "epoch": 176, "lr": 8.083580947643412e-05} +{"train_loss": 0.004432340152561665, "global_step": 20952, "epoch": 176, "lr": 8.083406542892524e-05} +{"train_loss": 0.0022285289596766233, "global_step": 20953, "epoch": 176, "lr": 8.083232132087697e-05} +{"train_loss": 0.0055941250175237656, "global_step": 20954, "epoch": 176, "lr": 8.083057715229272e-05} +{"train_loss": 0.003936576656997204, "global_step": 20955, "epoch": 176, "lr": 8.082883292317594e-05} +{"train_loss": 0.0034115693997591734, "global_step": 20956, "epoch": 176, "lr": 8.082708863353002e-05} +{"train_loss": 0.004413551185280085, "global_step": 20957, "epoch": 176, "lr": 8.082534428335841e-05} +{"train_loss": 0.004362180829048157, "global_step": 20958, "epoch": 176, "lr": 8.082359987266454e-05} +{"train_loss": 0.003068322781473398, "global_step": 20959, "epoch": 176, "lr": 8.082185540145182e-05} +{"train_loss": 0.004922306630760431, "global_step": 20960, "epoch": 176, "lr": 8.082011086972367e-05} +{"train_loss": 0.0046027228236198425, "global_step": 20961, "epoch": 176, "lr": 8.081836627748353e-05} +{"train_loss": 0.00407441658899188, "global_step": 20962, "epoch": 176, "lr": 8.081662162473485e-05} +{"train_loss": 0.0039244890213012695, "global_step": 20963, "epoch": 176, "lr": 8.081487691148099e-05} +{"train_loss": 0.004869373515248299, "global_step": 20964, "epoch": 176, "lr": 8.081313213772542e-05} +{"train_loss": 0.005311718210577965, "global_step": 20965, "epoch": 176, "lr": 8.081138730347156e-05} +{"train_loss": 0.0039438470266759396, "global_step": 20966, "epoch": 176, "lr": 8.080964240872283e-05} +{"train_loss": 0.007202010601758957, "global_step": 20967, "epoch": 176, "lr": 8.080789745348268e-05} +{"train_loss": 0.004189957864582539, "global_step": 20968, "epoch": 176, "lr": 8.080615243775446e-05} +{"train_loss": 0.0016189481830224395, "global_step": 20969, "epoch": 176, "lr": 8.08044073615417e-05} +{"train_loss": 0.0039060439448803663, "global_step": 20970, "epoch": 176, "lr": 8.080266222484776e-05} +{"train_loss": 0.003926553763449192, "global_step": 20971, "epoch": 176, "lr": 8.08009170276761e-05} +{"train_loss": 0.005379912443459034, "global_step": 20972, "epoch": 176, "lr": 8.079917177003011e-05} +{"train_loss": 0.004386603366583586, "global_step": 20973, "epoch": 176, "lr": 8.079742645191324e-05} +{"train_loss": 0.0034856745041906834, "global_step": 20974, "epoch": 176, "lr": 8.079568107332892e-05} +{"train_loss": 0.004403837025165558, "global_step": 20975, "epoch": 176, "lr": 8.079393563428057e-05} +{"train_loss": 0.005661026109009981, "global_step": 20976, "epoch": 176, "lr": 8.079219013477161e-05} +{"train_loss": 0.004439232405275106, "global_step": 20977, "epoch": 176, "lr": 8.079044457480547e-05} +{"train_loss": 0.0045908489264547825, "global_step": 20978, "epoch": 176, "lr": 8.07886989543856e-05} +{"train_loss": 0.0054155378602445126, "global_step": 20979, "epoch": 176, "lr": 8.07869532735154e-05} +{"train_loss": 0.005256550386548042, "global_step": 20980, "epoch": 176, "lr": 8.078520753219829e-05} +{"train_loss": 0.004893858917057514, "global_step": 20981, "epoch": 176, "lr": 8.078346173043774e-05} +{"train_loss": 0.004691386129707098, "global_step": 20982, "epoch": 176, "lr": 8.078171586823714e-05} +{"train_loss": 0.004891803953796625, "global_step": 20983, "epoch": 176, "lr": 8.077996994559993e-05} +{"train_loss": 0.006780367344617844, "global_step": 20984, "epoch": 176, "lr": 8.077822396252954e-05} +{"train_loss": 0.005237674806267023, "global_step": 20985, "epoch": 176, "lr": 8.07764779190294e-05} +{"train_loss": 0.006885952316224575, "global_step": 20986, "epoch": 176, "lr": 8.077473181510291e-05} +{"train_loss": 0.00333923427388072, "global_step": 20987, "epoch": 176, "lr": 8.077298565075354e-05} +{"train_loss": 0.003356875153258443, "global_step": 20988, "epoch": 176, "lr": 8.07712394259847e-05} +{"train_loss": 0.004712571389973164, "global_step": 20989, "epoch": 176, "lr": 8.076949314079983e-05} +{"train_loss": 0.006077769678086042, "global_step": 20990, "epoch": 176, "lr": 8.076774679520232e-05} +{"train_loss": 0.004237161949276924, "global_step": 20991, "epoch": 176, "lr": 8.076600038919565e-05} +{"train_loss": 0.006361702922731638, "global_step": 20992, "epoch": 176, "lr": 8.076425392278322e-05} +{"train_loss": 0.004038759507238865, "global_step": 20993, "epoch": 176, "lr": 8.076250739596845e-05} +{"train_loss": 0.007201222702860832, "global_step": 20994, "epoch": 176, "lr": 8.076076080875479e-05} +{"train_loss": 0.006535761523991823, "global_step": 20995, "epoch": 176, "lr": 8.075901416114566e-05} +{"train_loss": 0.0035082187969237566, "global_step": 20996, "epoch": 176, "lr": 8.07572674531445e-05} +{"train_loss": 0.007004540879279375, "global_step": 20997, "epoch": 176, "lr": 8.075552068475473e-05} +{"train_loss": 0.004571228753775358, "global_step": 20998, "epoch": 176, "lr": 8.075377385597979e-05} +{"train_loss": 0.003775293007493019, "global_step": 20999, "epoch": 176, "lr": 8.075202696682309e-05} +{"train_loss": 0.006031050346791744, "global_step": 21000, "epoch": 176, "lr": 8.075028001728805e-05} +{"train_loss": 0.010180617682635784, "global_step": 21001, "epoch": 176, "lr": 8.074853300737816e-05} +{"train_loss": 0.003485969267785549, "global_step": 21002, "epoch": 176, "lr": 8.074678593709679e-05} +{"train_loss": 0.003586880164220929, "global_step": 21003, "epoch": 176, "lr": 8.07450388064474e-05} +{"train_loss": 0.005977810826152563, "global_step": 21004, "epoch": 176, "lr": 8.074329161543339e-05} +{"train_loss": 0.007278170436620712, "global_step": 21005, "epoch": 176, "lr": 8.074154436405823e-05} +{"train_loss": 0.005205760709941387, "global_step": 21006, "epoch": 176, "lr": 8.073979705232533e-05} +{"train_loss": 0.005120075773447752, "global_step": 21007, "epoch": 176, "lr": 8.073804968023811e-05} +{"train_loss": 0.00839126855134964, "global_step": 21008, "epoch": 176, "lr": 8.073630224780002e-05} +{"train_loss": 0.003135171253234148, "global_step": 21009, "epoch": 176, "lr": 8.07345547550145e-05} +{"train_loss": 0.006052569951862097, "global_step": 21010, "epoch": 176, "lr": 8.073280720188494e-05} +{"train_loss": 0.005028128158301115, "global_step": 21011, "epoch": 176, "lr": 8.073105958841482e-05} +{"train_loss": 0.006764495279639959, "global_step": 21012, "epoch": 176, "lr": 8.072931191460752e-05} +{"train_loss": 0.0033122466411441565, "global_step": 21013, "epoch": 176, "lr": 8.072756418046652e-05} +{"train_loss": 0.004292813595384359, "global_step": 21014, "epoch": 176, "lr": 8.072581638599523e-05} +{"train_loss": 0.006885942071676254, "global_step": 21015, "epoch": 176, "lr": 8.072406853119707e-05} +{"train_loss": 0.004205051343888044, "global_step": 21016, "epoch": 176, "lr": 8.07223206160755e-05} +{"train_loss": 0.004638830665498972, "global_step": 21017, "epoch": 176, "lr": 8.072057264063393e-05} +{"train_loss": 0.008089768700301647, "global_step": 21018, "epoch": 176, "lr": 8.071882460487579e-05} +{"train_loss": 0.00755646638572216, "global_step": 21019, "epoch": 176, "lr": 8.071707650880452e-05} +{"train_loss": 0.0025400426238775253, "global_step": 21020, "epoch": 176, "lr": 8.071532835242355e-05} +{"train_loss": 0.00399730633944273, "global_step": 21021, "epoch": 176, "lr": 8.071358013573634e-05} +{"train_loss": 0.007412283681333065, "global_step": 21022, "epoch": 176, "lr": 8.071183185874627e-05} +{"train_loss": 0.005547528620809317, "global_step": 21023, "epoch": 176, "lr": 8.07100835214568e-05} +{"train_loss": 0.005372075363993645, "global_step": 21024, "epoch": 176, "lr": 8.070833512387138e-05} +{"train_loss": 0.005369932856410742, "global_step": 21025, "epoch": 176, "lr": 8.07065866659934e-05} +{"train_loss": 0.003383675590157509, "global_step": 21026, "epoch": 176, "lr": 8.070483814782634e-05} +{"train_loss": 0.003988353535532951, "global_step": 21027, "epoch": 176, "lr": 8.07030895693736e-05} +{"train_loss": 0.005354778375476599, "global_step": 21028, "epoch": 176, "lr": 8.070134093063862e-05} +{"train_loss": 0.003955998457968235, "global_step": 21029, "epoch": 176, "lr": 8.069959223162485e-05} +{"train_loss": 0.0048762233927845955, "global_step": 21030, "epoch": 176, "lr": 8.06978434723357e-05} +{"train_loss": 0.0029283049516379833, "global_step": 21031, "epoch": 176, "lr": 8.06960946527746e-05} +{"train_loss": 0.0036330888979136944, "global_step": 21032, "epoch": 176, "lr": 8.069434577294502e-05} +{"train_loss": 0.006744577083736658, "global_step": 21033, "epoch": 176, "lr": 8.069259683285036e-05} +{"train_loss": 0.0035645628813654184, "global_step": 21034, "epoch": 176, "lr": 8.069084783249407e-05} +{"train_loss": 0.0077920835465192795, "global_step": 21035, "epoch": 176, "lr": 8.068909877187959e-05} +{"train_loss": 0.004469351377338171, "global_step": 21036, "epoch": 176, "lr": 8.068734965101033e-05} +{"train_loss": 0.004238232970237732, "global_step": 21037, "epoch": 176, "lr": 8.068560046988973e-05} +{"train_loss": 0.005640481133013964, "global_step": 21038, "epoch": 176, "lr": 8.068385122852125e-05} +{"train_loss": 0.005508990492671728, "global_step": 21039, "epoch": 176, "lr": 8.06821019269083e-05} +{"train_loss": 0.004716762341558933, "global_step": 21040, "epoch": 176, "lr": 8.06803525650543e-05} +{"train_loss": 0.004494986496865749, "global_step": 21041, "epoch": 176, "lr": 8.067860314296274e-05} +{"train_loss": 0.005005537532269955, "global_step": 21042, "epoch": 176, "lr": 8.067685366063701e-05} +{"train_loss": 0.005575123708695173, "global_step": 21043, "epoch": 176, "lr": 8.067510411808054e-05} +{"train_loss": 0.003951591905206442, "global_step": 21044, "epoch": 176, "lr": 8.067335451529679e-05} +{"train_loss": 0.008714543655514717, "global_step": 21045, "epoch": 176, "lr": 8.06716048522892e-05} +{"train_loss": 0.0034603497479110956, "global_step": 21046, "epoch": 176, "lr": 8.066985512906116e-05} +{"train_loss": 0.0039650872349739075, "global_step": 21047, "epoch": 176, "lr": 8.066810534561616e-05} +{"train_loss": 0.00571749173104763, "global_step": 21048, "epoch": 176, "lr": 8.06663555019576e-05} +{"train_loss": 0.004695230629295111, "global_step": 21049, "epoch": 176, "lr": 8.066460559808893e-05} +{"train_loss": 0.007023405283689499, "global_step": 21050, "epoch": 176, "lr": 8.066285563401359e-05} +{"train_loss": 0.004322883673012257, "global_step": 21051, "epoch": 176, "lr": 8.066110560973499e-05} +{"train_loss": 0.008685784414410591, "global_step": 21052, "epoch": 176, "lr": 8.06593555252566e-05} +{"train_loss": 0.00600401358678937, "global_step": 21053, "epoch": 176, "lr": 8.065760538058184e-05} +{"train_loss": 0.005040979012846947, "global_step": 21054, "epoch": 176, "lr": 8.065585517571414e-05} +{"train_loss": 0.0065535749308764935, "global_step": 21055, "epoch": 176, "lr": 8.065410491065696e-05} +{"train_loss": 0.005062852054834366, "global_step": 21056, "epoch": 176, "lr": 8.06523545854137e-05} +{"train_loss": 0.00554093299433589, "global_step": 21057, "epoch": 176, "lr": 8.065060419998782e-05} +{"train_loss": 0.0032109252642840147, "global_step": 21058, "epoch": 176, "lr": 8.064885375438276e-05} +{"train_loss": 0.004082462750375271, "global_step": 21059, "epoch": 176, "lr": 8.064710324860196e-05} +{"train_loss": 0.005686478223651648, "global_step": 21060, "epoch": 176, "lr": 8.064535268264883e-05} +{"train_loss": 0.006174857262521982, "global_step": 21061, "epoch": 176, "lr": 8.064360205652683e-05} +{"train_loss": 0.005013420425566743, "global_step": 21062, "epoch": 176, "lr": 8.064185137023938e-05, "val_loss": 0.0134388767182827} +{"train_loss": 0.004290880635380745, "global_step": 21063, "epoch": 177, "lr": 8.064010062378995e-05} +{"train_loss": 0.006742102559655905, "global_step": 21064, "epoch": 177, "lr": 8.063834981718195e-05} +{"train_loss": 0.004811088554561138, "global_step": 21065, "epoch": 177, "lr": 8.063659895041881e-05} +{"train_loss": 0.004921916406601667, "global_step": 21066, "epoch": 177, "lr": 8.063484802350399e-05} +{"train_loss": 0.00905824638903141, "global_step": 21067, "epoch": 177, "lr": 8.063309703644092e-05} +{"train_loss": 0.005714526399970055, "global_step": 21068, "epoch": 177, "lr": 8.063134598923303e-05} +{"train_loss": 0.006291894242167473, "global_step": 21069, "epoch": 177, "lr": 8.062959488188377e-05} +{"train_loss": 0.009071274660527706, "global_step": 21070, "epoch": 177, "lr": 8.062784371439656e-05} +{"train_loss": 0.006566684227436781, "global_step": 21071, "epoch": 177, "lr": 8.062609248677487e-05} +{"train_loss": 0.0047908625565469265, "global_step": 21072, "epoch": 177, "lr": 8.062434119902211e-05} +{"train_loss": 0.005205865949392319, "global_step": 21073, "epoch": 177, "lr": 8.062258985114174e-05} +{"train_loss": 0.006437885574996471, "global_step": 21074, "epoch": 177, "lr": 8.062083844313717e-05} +{"train_loss": 0.004660191014409065, "global_step": 21075, "epoch": 177, "lr": 8.061908697501186e-05} +{"train_loss": 0.0047660572454333305, "global_step": 21076, "epoch": 177, "lr": 8.061733544676924e-05} +{"train_loss": 0.004688887391239405, "global_step": 21077, "epoch": 177, "lr": 8.061558385841276e-05} +{"train_loss": 0.008058151230216026, "global_step": 21078, "epoch": 177, "lr": 8.061383220994585e-05} +{"train_loss": 0.004685056395828724, "global_step": 21079, "epoch": 177, "lr": 8.061208050137196e-05} +{"train_loss": 0.005540361627936363, "global_step": 21080, "epoch": 177, "lr": 8.061032873269451e-05} +{"train_loss": 0.008445804007351398, "global_step": 21081, "epoch": 177, "lr": 8.060857690391694e-05} +{"train_loss": 0.005764108616858721, "global_step": 21082, "epoch": 177, "lr": 8.060682501504273e-05} +{"train_loss": 0.006539001129567623, "global_step": 21083, "epoch": 177, "lr": 8.060507306607525e-05} +{"train_loss": 0.005430803168565035, "global_step": 21084, "epoch": 177, "lr": 8.0603321057018e-05} +{"train_loss": 0.004851676058024168, "global_step": 21085, "epoch": 177, "lr": 8.06015689878744e-05} +{"train_loss": 0.007913009263575077, "global_step": 21086, "epoch": 177, "lr": 8.059981685864788e-05} +{"train_loss": 0.006412608548998833, "global_step": 21087, "epoch": 177, "lr": 8.05980646693419e-05} +{"train_loss": 0.003897626418620348, "global_step": 21088, "epoch": 177, "lr": 8.059631241995988e-05} +{"train_loss": 0.0053099519573152065, "global_step": 21089, "epoch": 177, "lr": 8.059456011050528e-05} +{"train_loss": 0.007986290380358696, "global_step": 21090, "epoch": 177, "lr": 8.059280774098151e-05} +{"train_loss": 0.007098012138158083, "global_step": 21091, "epoch": 177, "lr": 8.059105531139205e-05} +{"train_loss": 0.004647193010896444, "global_step": 21092, "epoch": 177, "lr": 8.058930282174031e-05} +{"train_loss": 0.006572767626494169, "global_step": 21093, "epoch": 177, "lr": 8.058755027202974e-05} +{"train_loss": 0.005426263436675072, "global_step": 21094, "epoch": 177, "lr": 8.05857976622638e-05} +{"train_loss": 0.005778314545750618, "global_step": 21095, "epoch": 177, "lr": 8.05840449924459e-05} +{"train_loss": 0.004236272536218166, "global_step": 21096, "epoch": 177, "lr": 8.058229226257949e-05} +{"train_loss": 0.004248127341270447, "global_step": 21097, "epoch": 177, "lr": 8.058053947266804e-05} +{"train_loss": 0.006344337482005358, "global_step": 21098, "epoch": 177, "lr": 8.057878662271494e-05} +{"train_loss": 0.007100874092429876, "global_step": 21099, "epoch": 177, "lr": 8.057703371272366e-05} +{"train_loss": 0.007427391596138477, "global_step": 21100, "epoch": 177, "lr": 8.057528074269765e-05} +{"train_loss": 0.0030239990446716547, "global_step": 21101, "epoch": 177, "lr": 8.057352771264035e-05} +{"train_loss": 0.0037342067807912827, "global_step": 21102, "epoch": 177, "lr": 8.057177462255518e-05} +{"train_loss": 0.004939476028084755, "global_step": 21103, "epoch": 177, "lr": 8.057002147244562e-05} +{"train_loss": 0.006637969519942999, "global_step": 21104, "epoch": 177, "lr": 8.056826826231508e-05} +{"train_loss": 0.004566804971545935, "global_step": 21105, "epoch": 177, "lr": 8.0566514992167e-05} +{"train_loss": 0.0033005515579134226, "global_step": 21106, "epoch": 177, "lr": 8.056476166200484e-05} +{"train_loss": 0.004941854625940323, "global_step": 21107, "epoch": 177, "lr": 8.056300827183203e-05} +{"train_loss": 0.004528951831161976, "global_step": 21108, "epoch": 177, "lr": 8.056125482165202e-05} +{"train_loss": 0.004797820001840591, "global_step": 21109, "epoch": 177, "lr": 8.055950131146826e-05} +{"train_loss": 0.005184700712561607, "global_step": 21110, "epoch": 177, "lr": 8.055774774128417e-05} +{"train_loss": 0.00659222062677145, "global_step": 21111, "epoch": 177, "lr": 8.055599411110321e-05} +{"train_loss": 0.0049405526369810104, "global_step": 21112, "epoch": 177, "lr": 8.055424042092883e-05} +{"train_loss": 0.00588343758136034, "global_step": 21113, "epoch": 177, "lr": 8.055248667076446e-05} +{"train_loss": 0.0043289680033922195, "global_step": 21114, "epoch": 177, "lr": 8.055073286061354e-05} +{"train_loss": 0.0036611531395465136, "global_step": 21115, "epoch": 177, "lr": 8.054897899047953e-05} +{"train_loss": 0.00740126334130764, "global_step": 21116, "epoch": 177, "lr": 8.054722506036585e-05} +{"train_loss": 0.0034270838368684053, "global_step": 21117, "epoch": 177, "lr": 8.054547107027596e-05} +{"train_loss": 0.007248326204717159, "global_step": 21118, "epoch": 177, "lr": 8.054371702021332e-05} +{"train_loss": 0.003526307176798582, "global_step": 21119, "epoch": 177, "lr": 8.054196291018133e-05} +{"train_loss": 0.005559886340051889, "global_step": 21120, "epoch": 177, "lr": 8.054020874018348e-05} +{"train_loss": 0.0067511191591620445, "global_step": 21121, "epoch": 177, "lr": 8.053845451022317e-05} +{"train_loss": 0.007573023438453674, "global_step": 21122, "epoch": 177, "lr": 8.053670022030389e-05} +{"train_loss": 0.005725028458982706, "global_step": 21123, "epoch": 177, "lr": 8.053494587042904e-05} +{"train_loss": 0.002823416842147708, "global_step": 21124, "epoch": 177, "lr": 8.05331914606021e-05} +{"train_loss": 0.004197676666080952, "global_step": 21125, "epoch": 177, "lr": 8.05314369908265e-05} +{"train_loss": 0.005384498741477728, "global_step": 21126, "epoch": 177, "lr": 8.052968246110568e-05} +{"train_loss": 0.004382329992949963, "global_step": 21127, "epoch": 177, "lr": 8.05279278714431e-05} +{"train_loss": 0.006870610173791647, "global_step": 21128, "epoch": 177, "lr": 8.052617322184217e-05} +{"train_loss": 0.008051261305809021, "global_step": 21129, "epoch": 177, "lr": 8.052441851230638e-05} +{"train_loss": 0.0030149943195283413, "global_step": 21130, "epoch": 177, "lr": 8.052266374283916e-05} +{"train_loss": 0.004822203423827887, "global_step": 21131, "epoch": 177, "lr": 8.052090891344395e-05} +{"train_loss": 0.00646281149238348, "global_step": 21132, "epoch": 177, "lr": 8.051915402412419e-05} +{"train_loss": 0.0055602495558559895, "global_step": 21133, "epoch": 177, "lr": 8.051739907488334e-05} +{"train_loss": 0.006497563328593969, "global_step": 21134, "epoch": 177, "lr": 8.051564406572481e-05} +{"train_loss": 0.00407360540702939, "global_step": 21135, "epoch": 177, "lr": 8.051388899665211e-05} +{"train_loss": 0.0051747774705290794, "global_step": 21136, "epoch": 177, "lr": 8.051213386766862e-05} +{"train_loss": 0.005314363166689873, "global_step": 21137, "epoch": 177, "lr": 8.051037867877782e-05} +{"train_loss": 0.004187156446278095, "global_step": 21138, "epoch": 177, "lr": 8.050862342998316e-05} +{"train_loss": 0.008264187723398209, "global_step": 21139, "epoch": 177, "lr": 8.050686812128808e-05} +{"train_loss": 0.0040424540638923645, "global_step": 21140, "epoch": 177, "lr": 8.050511275269602e-05} +{"train_loss": 0.007337961345911026, "global_step": 21141, "epoch": 177, "lr": 8.050335732421042e-05} +{"train_loss": 0.008127124048769474, "global_step": 21142, "epoch": 177, "lr": 8.050160183583476e-05} +{"train_loss": 0.009438717737793922, "global_step": 21143, "epoch": 177, "lr": 8.049984628757244e-05} +{"train_loss": 0.005415590945631266, "global_step": 21144, "epoch": 177, "lr": 8.049809067942693e-05} +{"train_loss": 0.004748655017465353, "global_step": 21145, "epoch": 177, "lr": 8.049633501140169e-05} +{"train_loss": 0.002990944078192115, "global_step": 21146, "epoch": 177, "lr": 8.049457928350013e-05} +{"train_loss": 0.0037222611717879772, "global_step": 21147, "epoch": 177, "lr": 8.049282349572575e-05} +{"train_loss": 0.0067180185578763485, "global_step": 21148, "epoch": 177, "lr": 8.049106764808196e-05} +{"train_loss": 0.004211129620671272, "global_step": 21149, "epoch": 177, "lr": 8.048931174057222e-05} +{"train_loss": 0.005451560486108065, "global_step": 21150, "epoch": 177, "lr": 8.048755577319997e-05} +{"train_loss": 0.0035456421319395304, "global_step": 21151, "epoch": 177, "lr": 8.048579974596865e-05} +{"train_loss": 0.005902174394577742, "global_step": 21152, "epoch": 177, "lr": 8.048404365888174e-05} +{"train_loss": 0.005031989421695471, "global_step": 21153, "epoch": 177, "lr": 8.048228751194265e-05} +{"train_loss": 0.004941912833601236, "global_step": 21154, "epoch": 177, "lr": 8.048053130515486e-05} +{"train_loss": 0.00514540821313858, "global_step": 21155, "epoch": 177, "lr": 8.047877503852179e-05} +{"train_loss": 0.0052455090917646885, "global_step": 21156, "epoch": 177, "lr": 8.047701871204691e-05} +{"train_loss": 0.003187658032402396, "global_step": 21157, "epoch": 177, "lr": 8.047526232573366e-05} +{"train_loss": 0.006804823875427246, "global_step": 21158, "epoch": 177, "lr": 8.047350587958548e-05} +{"train_loss": 0.008756187744438648, "global_step": 21159, "epoch": 177, "lr": 8.047174937360582e-05} +{"train_loss": 0.003949590027332306, "global_step": 21160, "epoch": 177, "lr": 8.046999280779815e-05} +{"train_loss": 0.006416269112378359, "global_step": 21161, "epoch": 177, "lr": 8.04682361821659e-05} +{"train_loss": 0.00549317616969347, "global_step": 21162, "epoch": 177, "lr": 8.046647949671253e-05} +{"train_loss": 0.004687709733843803, "global_step": 21163, "epoch": 177, "lr": 8.046472275144148e-05} +{"train_loss": 0.0028637086506932974, "global_step": 21164, "epoch": 177, "lr": 8.046296594635619e-05} +{"train_loss": 0.005676069762557745, "global_step": 21165, "epoch": 177, "lr": 8.046120908146013e-05} +{"train_loss": 0.003854432376101613, "global_step": 21166, "epoch": 177, "lr": 8.045945215675675e-05} +{"train_loss": 0.0033401253167539835, "global_step": 21167, "epoch": 177, "lr": 8.045769517224947e-05} +{"train_loss": 0.005475722718983889, "global_step": 21168, "epoch": 177, "lr": 8.045593812794176e-05} +{"train_loss": 0.005105064250528812, "global_step": 21169, "epoch": 177, "lr": 8.045418102383709e-05} +{"train_loss": 0.0071489205583930016, "global_step": 21170, "epoch": 177, "lr": 8.045242385993887e-05} +{"train_loss": 0.0045736306346952915, "global_step": 21171, "epoch": 177, "lr": 8.045066663625059e-05} +{"train_loss": 0.007079526782035828, "global_step": 21172, "epoch": 177, "lr": 8.044890935277566e-05} +{"train_loss": 0.006710604298859835, "global_step": 21173, "epoch": 177, "lr": 8.044715200951755e-05} +{"train_loss": 0.0050010234117507935, "global_step": 21174, "epoch": 177, "lr": 8.04453946064797e-05} +{"train_loss": 0.004529466852545738, "global_step": 21175, "epoch": 177, "lr": 8.04436371436656e-05} +{"train_loss": 0.005301992874592543, "global_step": 21176, "epoch": 177, "lr": 8.044187962107865e-05} +{"train_loss": 0.005592878442257643, "global_step": 21177, "epoch": 177, "lr": 8.044012203872233e-05} +{"train_loss": 0.0038466183468699455, "global_step": 21178, "epoch": 177, "lr": 8.043836439660007e-05} +{"train_loss": 0.006953033152967691, "global_step": 21179, "epoch": 177, "lr": 8.043660669471535e-05} +{"train_loss": 0.003410467179492116, "global_step": 21180, "epoch": 177, "lr": 8.043484893307161e-05} +{"train_loss": 0.005483090556657114, "global_step": 21181, "epoch": 177, "lr": 8.043309111167228e-05, "val_loss": 0.018673401325941086} +{"train_loss": 0.004517192952334881, "global_step": 21182, "epoch": 178, "lr": 8.043133323052082e-05} +{"train_loss": 0.006118037272244692, "global_step": 21183, "epoch": 178, "lr": 8.04295752896207e-05} +{"train_loss": 0.006348899565637112, "global_step": 21184, "epoch": 178, "lr": 8.042781728897536e-05} +{"train_loss": 0.0046945130452513695, "global_step": 21185, "epoch": 178, "lr": 8.042605922858825e-05} +{"train_loss": 0.0026975723449140787, "global_step": 21186, "epoch": 178, "lr": 8.042430110846282e-05} +{"train_loss": 0.004924124572426081, "global_step": 21187, "epoch": 178, "lr": 8.042254292860253e-05} +{"train_loss": 0.004281328525394201, "global_step": 21188, "epoch": 178, "lr": 8.042078468901082e-05} +{"train_loss": 0.003936309367418289, "global_step": 21189, "epoch": 178, "lr": 8.041902638969116e-05} +{"train_loss": 0.006828179582953453, "global_step": 21190, "epoch": 178, "lr": 8.041726803064699e-05} +{"train_loss": 0.004956903401762247, "global_step": 21191, "epoch": 178, "lr": 8.041550961188176e-05} +{"train_loss": 0.0036220327019691467, "global_step": 21192, "epoch": 178, "lr": 8.041375113339893e-05} +{"train_loss": 0.005094335880130529, "global_step": 21193, "epoch": 178, "lr": 8.041199259520194e-05} +{"train_loss": 0.007034548092633486, "global_step": 21194, "epoch": 178, "lr": 8.041023399729425e-05} +{"train_loss": 0.00398695282638073, "global_step": 21195, "epoch": 178, "lr": 8.040847533967933e-05} +{"train_loss": 0.003770646871998906, "global_step": 21196, "epoch": 178, "lr": 8.04067166223606e-05} +{"train_loss": 0.005132824182510376, "global_step": 21197, "epoch": 178, "lr": 8.040495784534155e-05} +{"train_loss": 0.005084659904241562, "global_step": 21198, "epoch": 178, "lr": 8.040319900862559e-05} +{"train_loss": 0.005207708105444908, "global_step": 21199, "epoch": 178, "lr": 8.040144011221621e-05} +{"train_loss": 0.004567690193653107, "global_step": 21200, "epoch": 178, "lr": 8.039968115611685e-05} +{"train_loss": 0.005061503499746323, "global_step": 21201, "epoch": 178, "lr": 8.039792214033096e-05} +{"train_loss": 0.003290774067863822, "global_step": 21202, "epoch": 178, "lr": 8.0396163064862e-05} +{"train_loss": 0.003372840816155076, "global_step": 21203, "epoch": 178, "lr": 8.039440392971342e-05} +{"train_loss": 0.00368873099796474, "global_step": 21204, "epoch": 178, "lr": 8.039264473488867e-05} +{"train_loss": 0.004128320142626762, "global_step": 21205, "epoch": 178, "lr": 8.039088548039123e-05} +{"train_loss": 0.004169600550085306, "global_step": 21206, "epoch": 178, "lr": 8.038912616622451e-05} +{"train_loss": 0.006659660022705793, "global_step": 21207, "epoch": 178, "lr": 8.0387366792392e-05} +{"train_loss": 0.003799505764618516, "global_step": 21208, "epoch": 178, "lr": 8.038560735889713e-05} +{"train_loss": 0.003281392389908433, "global_step": 21209, "epoch": 178, "lr": 8.038384786574337e-05} +{"train_loss": 0.004731758497655392, "global_step": 21210, "epoch": 178, "lr": 8.038208831293419e-05} +{"train_loss": 0.003839748678728938, "global_step": 21211, "epoch": 178, "lr": 8.038032870047301e-05} +{"train_loss": 0.004441566299647093, "global_step": 21212, "epoch": 178, "lr": 8.03785690283633e-05} +{"train_loss": 0.005448817275464535, "global_step": 21213, "epoch": 178, "lr": 8.037680929660852e-05} +{"train_loss": 0.005543649662286043, "global_step": 21214, "epoch": 178, "lr": 8.03750495052121e-05} +{"train_loss": 0.0030117719434201717, "global_step": 21215, "epoch": 178, "lr": 8.037328965417754e-05} +{"train_loss": 0.0036679694894701242, "global_step": 21216, "epoch": 178, "lr": 8.037152974350826e-05} +{"train_loss": 0.003652906510978937, "global_step": 21217, "epoch": 178, "lr": 8.036976977320774e-05} +{"train_loss": 0.005003951024264097, "global_step": 21218, "epoch": 178, "lr": 8.03680097432794e-05} +{"train_loss": 0.003926044330000877, "global_step": 21219, "epoch": 178, "lr": 8.036624965372672e-05} +{"train_loss": 0.00614300649613142, "global_step": 21220, "epoch": 178, "lr": 8.036448950455318e-05} +{"train_loss": 0.0029735774733126163, "global_step": 21221, "epoch": 178, "lr": 8.036272929576217e-05} +{"train_loss": 0.0030900374986231327, "global_step": 21222, "epoch": 178, "lr": 8.036096902735721e-05} +{"train_loss": 0.0022024239879101515, "global_step": 21223, "epoch": 178, "lr": 8.035920869934172e-05} +{"train_loss": 0.0033626030199229717, "global_step": 21224, "epoch": 178, "lr": 8.035744831171917e-05} +{"train_loss": 0.005337330978363752, "global_step": 21225, "epoch": 178, "lr": 8.035568786449301e-05} +{"train_loss": 0.002846220275387168, "global_step": 21226, "epoch": 178, "lr": 8.035392735766671e-05} +{"train_loss": 0.004030105657875538, "global_step": 21227, "epoch": 178, "lr": 8.03521667912437e-05} +{"train_loss": 0.00408773310482502, "global_step": 21228, "epoch": 178, "lr": 8.035040616522747e-05} +{"train_loss": 0.0027007036842405796, "global_step": 21229, "epoch": 178, "lr": 8.034864547962146e-05} +{"train_loss": 0.0031143082305788994, "global_step": 21230, "epoch": 178, "lr": 8.034688473442913e-05} +{"train_loss": 0.004366805776953697, "global_step": 21231, "epoch": 178, "lr": 8.034512392965392e-05} +{"train_loss": 0.002163827884942293, "global_step": 21232, "epoch": 178, "lr": 8.03433630652993e-05} +{"train_loss": 0.003587449435144663, "global_step": 21233, "epoch": 178, "lr": 8.034160214136874e-05} +{"train_loss": 0.004795108921825886, "global_step": 21234, "epoch": 178, "lr": 8.033984115786568e-05} +{"train_loss": 0.0032216119579970837, "global_step": 21235, "epoch": 178, "lr": 8.033808011479359e-05} +{"train_loss": 0.003234490053728223, "global_step": 21236, "epoch": 178, "lr": 8.033631901215591e-05} +{"train_loss": 0.006001480855047703, "global_step": 21237, "epoch": 178, "lr": 8.033455784995611e-05} +{"train_loss": 0.0036293051671236753, "global_step": 21238, "epoch": 178, "lr": 8.033279662819766e-05} +{"train_loss": 0.002268225885927677, "global_step": 21239, "epoch": 178, "lr": 8.033103534688399e-05} +{"train_loss": 0.00284219766035676, "global_step": 21240, "epoch": 178, "lr": 8.032927400601857e-05} +{"train_loss": 0.007109781727194786, "global_step": 21241, "epoch": 178, "lr": 8.032751260560487e-05} +{"train_loss": 0.004000800661742687, "global_step": 21242, "epoch": 178, "lr": 8.032575114564633e-05} +{"train_loss": 0.004360539838671684, "global_step": 21243, "epoch": 178, "lr": 8.032398962614643e-05} +{"train_loss": 0.0027133983094245195, "global_step": 21244, "epoch": 178, "lr": 8.03222280471086e-05} +{"train_loss": 0.0059957667253911495, "global_step": 21245, "epoch": 178, "lr": 8.032046640853633e-05} +{"train_loss": 0.003177710110321641, "global_step": 21246, "epoch": 178, "lr": 8.031870471043306e-05} +{"train_loss": 0.00451183645054698, "global_step": 21247, "epoch": 178, "lr": 8.031694295280225e-05} +{"train_loss": 0.0032778335735201836, "global_step": 21248, "epoch": 178, "lr": 8.031518113564737e-05} +{"train_loss": 0.003846488893032074, "global_step": 21249, "epoch": 178, "lr": 8.031341925897186e-05} +{"train_loss": 0.005039021372795105, "global_step": 21250, "epoch": 178, "lr": 8.031165732277919e-05} +{"train_loss": 0.0036989850923419, "global_step": 21251, "epoch": 178, "lr": 8.030989532707281e-05} +{"train_loss": 0.004959261044859886, "global_step": 21252, "epoch": 178, "lr": 8.03081332718562e-05} +{"train_loss": 0.007238535210490227, "global_step": 21253, "epoch": 178, "lr": 8.030637115713282e-05} +{"train_loss": 0.007443837821483612, "global_step": 21254, "epoch": 178, "lr": 8.03046089829061e-05} +{"train_loss": 0.0038102727849036455, "global_step": 21255, "epoch": 178, "lr": 8.030284674917953e-05} +{"train_loss": 0.003953814506530762, "global_step": 21256, "epoch": 178, "lr": 8.030108445595654e-05} +{"train_loss": 0.003192289499565959, "global_step": 21257, "epoch": 178, "lr": 8.029932210324063e-05} +{"train_loss": 0.008066046051681042, "global_step": 21258, "epoch": 178, "lr": 8.029755969103522e-05} +{"train_loss": 0.003879115218296647, "global_step": 21259, "epoch": 178, "lr": 8.029579721934379e-05} +{"train_loss": 0.007799074985086918, "global_step": 21260, "epoch": 178, "lr": 8.029403468816982e-05} +{"train_loss": 0.006077091675251722, "global_step": 21261, "epoch": 178, "lr": 8.029227209751673e-05} +{"train_loss": 0.0023639879655092955, "global_step": 21262, "epoch": 178, "lr": 8.029050944738801e-05} +{"train_loss": 0.006984802428632975, "global_step": 21263, "epoch": 178, "lr": 8.02887467377871e-05} +{"train_loss": 0.004672651179134846, "global_step": 21264, "epoch": 178, "lr": 8.028698396871748e-05} +{"train_loss": 0.003598050680011511, "global_step": 21265, "epoch": 178, "lr": 8.02852211401826e-05} +{"train_loss": 0.004747400525957346, "global_step": 21266, "epoch": 178, "lr": 8.028345825218592e-05} +{"train_loss": 0.006760116666555405, "global_step": 21267, "epoch": 178, "lr": 8.02816953047309e-05} +{"train_loss": 0.003990720491856337, "global_step": 21268, "epoch": 178, "lr": 8.027993229782101e-05} +{"train_loss": 0.004946095868945122, "global_step": 21269, "epoch": 178, "lr": 8.027816923145972e-05} +{"train_loss": 0.0044913762249052525, "global_step": 21270, "epoch": 178, "lr": 8.027640610565047e-05} +{"train_loss": 0.0038767741061747074, "global_step": 21271, "epoch": 178, "lr": 8.027464292039673e-05} +{"train_loss": 0.006177755072712898, "global_step": 21272, "epoch": 178, "lr": 8.027287967570196e-05} +{"train_loss": 0.0068988073617219925, "global_step": 21273, "epoch": 178, "lr": 8.027111637156964e-05} +{"train_loss": 0.004611695185303688, "global_step": 21274, "epoch": 178, "lr": 8.02693530080032e-05} +{"train_loss": 0.004156000446528196, "global_step": 21275, "epoch": 178, "lr": 8.026758958500612e-05} +{"train_loss": 0.0035937349312007427, "global_step": 21276, "epoch": 178, "lr": 8.026582610258188e-05} +{"train_loss": 0.007451927289366722, "global_step": 21277, "epoch": 178, "lr": 8.026406256073391e-05} +{"train_loss": 0.0031152896117419004, "global_step": 21278, "epoch": 178, "lr": 8.026229895946569e-05} +{"train_loss": 0.005014530848711729, "global_step": 21279, "epoch": 178, "lr": 8.026053529878068e-05} +{"train_loss": 0.005366908852010965, "global_step": 21280, "epoch": 178, "lr": 8.025877157868234e-05} +{"train_loss": 0.006295377854257822, "global_step": 21281, "epoch": 178, "lr": 8.025700779917414e-05} +{"train_loss": 0.00487243477255106, "global_step": 21282, "epoch": 178, "lr": 8.025524396025952e-05} +{"train_loss": 0.00478166900575161, "global_step": 21283, "epoch": 178, "lr": 8.025348006194197e-05} +{"train_loss": 0.0032352220732718706, "global_step": 21284, "epoch": 178, "lr": 8.025171610422495e-05} +{"train_loss": 0.005273786839097738, "global_step": 21285, "epoch": 178, "lr": 8.024995208711192e-05} +{"train_loss": 0.0048144846223294735, "global_step": 21286, "epoch": 178, "lr": 8.024818801060635e-05} +{"train_loss": 0.005368166137486696, "global_step": 21287, "epoch": 178, "lr": 8.024642387471166e-05} +{"train_loss": 0.0048484499566257, "global_step": 21288, "epoch": 178, "lr": 8.024465967943136e-05} +{"train_loss": 0.005777867045253515, "global_step": 21289, "epoch": 178, "lr": 8.024289542476891e-05} +{"train_loss": 0.007778987754136324, "global_step": 21290, "epoch": 178, "lr": 8.024113111072778e-05} +{"train_loss": 0.005067347548902035, "global_step": 21291, "epoch": 178, "lr": 8.02393667373114e-05} +{"train_loss": 0.003757011378183961, "global_step": 21292, "epoch": 178, "lr": 8.023760230452326e-05} +{"train_loss": 0.004304385744035244, "global_step": 21293, "epoch": 178, "lr": 8.023583781236681e-05} +{"train_loss": 0.004468051716685295, "global_step": 21294, "epoch": 178, "lr": 8.023407326084553e-05} +{"train_loss": 0.00411238195374608, "global_step": 21295, "epoch": 178, "lr": 8.023230864996287e-05} +{"train_loss": 0.004759626928716898, "global_step": 21296, "epoch": 178, "lr": 8.023054397972232e-05} +{"train_loss": 0.006910225376486778, "global_step": 21297, "epoch": 178, "lr": 8.022877925012731e-05} +{"train_loss": 0.004287305753678083, "global_step": 21298, "epoch": 178, "lr": 8.022701446118133e-05} +{"train_loss": 0.00484151765704155, "global_step": 21299, "epoch": 178, "lr": 8.022524961288783e-05} +{"train_loss": 0.004585911173514333, "global_step": 21300, "epoch": 178, "lr": 8.022348470525028e-05, "val_loss": 0.011663435027003288} +{"train_loss": 0.0031754891388118267, "global_step": 21301, "epoch": 179, "lr": 8.022171973827214e-05} +{"train_loss": 0.005962095223367214, "global_step": 21302, "epoch": 179, "lr": 8.021995471195691e-05} +{"train_loss": 0.006491424050182104, "global_step": 21303, "epoch": 179, "lr": 8.0218189626308e-05} +{"train_loss": 0.003909274935722351, "global_step": 21304, "epoch": 179, "lr": 8.021642448132893e-05} +{"train_loss": 0.00440081674605608, "global_step": 21305, "epoch": 179, "lr": 8.021465927702311e-05} +{"train_loss": 0.00537647120654583, "global_step": 21306, "epoch": 179, "lr": 8.021289401339405e-05} +{"train_loss": 0.005751708056777716, "global_step": 21307, "epoch": 179, "lr": 8.02111286904452e-05} +{"train_loss": 0.005573104601353407, "global_step": 21308, "epoch": 179, "lr": 8.020936330818001e-05} +{"train_loss": 0.005374603904783726, "global_step": 21309, "epoch": 179, "lr": 8.0207597866602e-05} +{"train_loss": 0.002489941194653511, "global_step": 21310, "epoch": 179, "lr": 8.020583236571457e-05} +{"train_loss": 0.0055727604776620865, "global_step": 21311, "epoch": 179, "lr": 8.020406680552122e-05} +{"train_loss": 0.0030930901411920786, "global_step": 21312, "epoch": 179, "lr": 8.020230118602541e-05} +{"train_loss": 0.005481217987835407, "global_step": 21313, "epoch": 179, "lr": 8.020053550723061e-05} +{"train_loss": 0.005122622475028038, "global_step": 21314, "epoch": 179, "lr": 8.019876976914028e-05} +{"train_loss": 0.0033913564402610064, "global_step": 21315, "epoch": 179, "lr": 8.019700397175789e-05} +{"train_loss": 0.004215500317513943, "global_step": 21316, "epoch": 179, "lr": 8.019523811508692e-05} +{"train_loss": 0.004774685017764568, "global_step": 21317, "epoch": 179, "lr": 8.019347219913083e-05} +{"train_loss": 0.004772006068378687, "global_step": 21318, "epoch": 179, "lr": 8.019170622389306e-05} +{"train_loss": 0.004658475052565336, "global_step": 21319, "epoch": 179, "lr": 8.018994018937712e-05} +{"train_loss": 0.005546894855797291, "global_step": 21320, "epoch": 179, "lr": 8.018817409558646e-05} +{"train_loss": 0.004725491628050804, "global_step": 21321, "epoch": 179, "lr": 8.018640794252454e-05} +{"train_loss": 0.0030639644246548414, "global_step": 21322, "epoch": 179, "lr": 8.018464173019483e-05} +{"train_loss": 0.005927132908254862, "global_step": 21323, "epoch": 179, "lr": 8.01828754586008e-05} +{"train_loss": 0.0035743284970521927, "global_step": 21324, "epoch": 179, "lr": 8.018110912774593e-05} +{"train_loss": 0.0032194459345191717, "global_step": 21325, "epoch": 179, "lr": 8.017934273763365e-05} +{"train_loss": 0.0040335156954824924, "global_step": 21326, "epoch": 179, "lr": 8.017757628826747e-05} +{"train_loss": 0.004612289369106293, "global_step": 21327, "epoch": 179, "lr": 8.017580977965084e-05} +{"train_loss": 0.005063469987362623, "global_step": 21328, "epoch": 179, "lr": 8.017404321178724e-05} +{"train_loss": 0.0023711323738098145, "global_step": 21329, "epoch": 179, "lr": 8.017227658468014e-05} +{"train_loss": 0.003570827189832926, "global_step": 21330, "epoch": 179, "lr": 8.017050989833297e-05} +{"train_loss": 0.002256621839478612, "global_step": 21331, "epoch": 179, "lr": 8.016874315274925e-05} +{"train_loss": 0.0056404611095786095, "global_step": 21332, "epoch": 179, "lr": 8.016697634793241e-05} +{"train_loss": 0.0021406076848506927, "global_step": 21333, "epoch": 179, "lr": 8.016520948388594e-05} +{"train_loss": 0.003818495199084282, "global_step": 21334, "epoch": 179, "lr": 8.01634425606133e-05} +{"train_loss": 0.006579747889190912, "global_step": 21335, "epoch": 179, "lr": 8.016167557811798e-05} +{"train_loss": 0.004160797223448753, "global_step": 21336, "epoch": 179, "lr": 8.015990853640342e-05} +{"train_loss": 0.003601754317060113, "global_step": 21337, "epoch": 179, "lr": 8.01581414354731e-05} +{"train_loss": 0.0033153435215353966, "global_step": 21338, "epoch": 179, "lr": 8.015637427533049e-05} +{"train_loss": 0.003204607404768467, "global_step": 21339, "epoch": 179, "lr": 8.015460705597907e-05} +{"train_loss": 0.003943352028727531, "global_step": 21340, "epoch": 179, "lr": 8.01528397774223e-05} +{"train_loss": 0.0031901157926768064, "global_step": 21341, "epoch": 179, "lr": 8.015107243966363e-05} +{"train_loss": 0.003589427564293146, "global_step": 21342, "epoch": 179, "lr": 8.014930504270657e-05} +{"train_loss": 0.0065268524922430515, "global_step": 21343, "epoch": 179, "lr": 8.014753758655458e-05} +{"train_loss": 0.007234570570290089, "global_step": 21344, "epoch": 179, "lr": 8.014577007121109e-05} +{"train_loss": 0.003250803565606475, "global_step": 21345, "epoch": 179, "lr": 8.014400249667963e-05} +{"train_loss": 0.004516164772212505, "global_step": 21346, "epoch": 179, "lr": 8.014223486296361e-05} +{"train_loss": 0.005475067067891359, "global_step": 21347, "epoch": 179, "lr": 8.014046717006656e-05} +{"train_loss": 0.003031097585335374, "global_step": 21348, "epoch": 179, "lr": 8.013869941799193e-05} +{"train_loss": 0.00442871218547225, "global_step": 21349, "epoch": 179, "lr": 8.013693160674316e-05} +{"train_loss": 0.003835445735603571, "global_step": 21350, "epoch": 179, "lr": 8.013516373632375e-05} +{"train_loss": 0.0039307111874222755, "global_step": 21351, "epoch": 179, "lr": 8.013339580673717e-05} +{"train_loss": 0.005787127651274204, "global_step": 21352, "epoch": 179, "lr": 8.013162781798688e-05} +{"train_loss": 0.005684676114469767, "global_step": 21353, "epoch": 179, "lr": 8.012985977007636e-05} +{"train_loss": 0.006444810424000025, "global_step": 21354, "epoch": 179, "lr": 8.01280916630091e-05} +{"train_loss": 0.004124377854168415, "global_step": 21355, "epoch": 179, "lr": 8.012632349678852e-05} +{"train_loss": 0.004152893554419279, "global_step": 21356, "epoch": 179, "lr": 8.012455527141813e-05} +{"train_loss": 0.0037690061144530773, "global_step": 21357, "epoch": 179, "lr": 8.01227869869014e-05} +{"train_loss": 0.005387750919908285, "global_step": 21358, "epoch": 179, "lr": 8.012101864324179e-05} +{"train_loss": 0.0037963269278407097, "global_step": 21359, "epoch": 179, "lr": 8.011925024044278e-05} +{"train_loss": 0.0033041357528418303, "global_step": 21360, "epoch": 179, "lr": 8.011748177850787e-05} +{"train_loss": 0.004564414266496897, "global_step": 21361, "epoch": 179, "lr": 8.011571325744047e-05} +{"train_loss": 0.0038345728535205126, "global_step": 21362, "epoch": 179, "lr": 8.011394467724409e-05} +{"train_loss": 0.005914855282753706, "global_step": 21363, "epoch": 179, "lr": 8.011217603792218e-05} +{"train_loss": 0.0048131695948541164, "global_step": 21364, "epoch": 179, "lr": 8.011040733947826e-05} +{"train_loss": 0.006688505876809359, "global_step": 21365, "epoch": 179, "lr": 8.010863858191575e-05} +{"train_loss": 0.004712148569524288, "global_step": 21366, "epoch": 179, "lr": 8.010686976523815e-05} +{"train_loss": 0.0031630168668925762, "global_step": 21367, "epoch": 179, "lr": 8.010510088944894e-05} +{"train_loss": 0.003427439136430621, "global_step": 21368, "epoch": 179, "lr": 8.010333195455156e-05} +{"train_loss": 0.004139631055295467, "global_step": 21369, "epoch": 179, "lr": 8.010156296054951e-05} +{"train_loss": 0.004772735293954611, "global_step": 21370, "epoch": 179, "lr": 8.009979390744626e-05} +{"train_loss": 0.004679007921367884, "global_step": 21371, "epoch": 179, "lr": 8.009802479524529e-05} +{"train_loss": 0.00464272266253829, "global_step": 21372, "epoch": 179, "lr": 8.009625562395004e-05} +{"train_loss": 0.004673918709158897, "global_step": 21373, "epoch": 179, "lr": 8.009448639356404e-05} +{"train_loss": 0.004536740481853485, "global_step": 21374, "epoch": 179, "lr": 8.009271710409071e-05} +{"train_loss": 0.004833946470171213, "global_step": 21375, "epoch": 179, "lr": 8.009094775553355e-05} +{"train_loss": 0.005271504167467356, "global_step": 21376, "epoch": 179, "lr": 8.008917834789602e-05} +{"train_loss": 0.005445320624858141, "global_step": 21377, "epoch": 179, "lr": 8.008740888118162e-05} +{"train_loss": 0.003895386354997754, "global_step": 21378, "epoch": 179, "lr": 8.00856393553938e-05} +{"train_loss": 0.004520879592746496, "global_step": 21379, "epoch": 179, "lr": 8.008386977053603e-05} +{"train_loss": 0.003671969287097454, "global_step": 21380, "epoch": 179, "lr": 8.008210012661182e-05} +{"train_loss": 0.002684171311557293, "global_step": 21381, "epoch": 179, "lr": 8.00803304236246e-05} +{"train_loss": 0.006772895343601704, "global_step": 21382, "epoch": 179, "lr": 8.007856066157786e-05} +{"train_loss": 0.011506679467856884, "global_step": 21383, "epoch": 179, "lr": 8.007679084047508e-05} +{"train_loss": 0.002674153773114085, "global_step": 21384, "epoch": 179, "lr": 8.007502096031975e-05} +{"train_loss": 0.0039854710921645164, "global_step": 21385, "epoch": 179, "lr": 8.007325102111534e-05} +{"train_loss": 0.0065520163625478745, "global_step": 21386, "epoch": 179, "lr": 8.007148102286528e-05} +{"train_loss": 0.0031941370107233524, "global_step": 21387, "epoch": 179, "lr": 8.00697109655731e-05} +{"train_loss": 0.003756351303309202, "global_step": 21388, "epoch": 179, "lr": 8.006794084924226e-05} +{"train_loss": 0.002938685705885291, "global_step": 21389, "epoch": 179, "lr": 8.006617067387621e-05} +{"train_loss": 0.00552788469940424, "global_step": 21390, "epoch": 179, "lr": 8.006440043947846e-05} +{"train_loss": 0.00406452314928174, "global_step": 21391, "epoch": 179, "lr": 8.006263014605246e-05} +{"train_loss": 0.00807185284793377, "global_step": 21392, "epoch": 179, "lr": 8.006085979360171e-05} +{"train_loss": 0.005153654143214226, "global_step": 21393, "epoch": 179, "lr": 8.005908938212968e-05} +{"train_loss": 0.006615315563976765, "global_step": 21394, "epoch": 179, "lr": 8.005731891163984e-05} +{"train_loss": 0.0075864028185606, "global_step": 21395, "epoch": 179, "lr": 8.005554838213565e-05} +{"train_loss": 0.005310446955263615, "global_step": 21396, "epoch": 179, "lr": 8.00537777936206e-05} +{"train_loss": 0.0050311884842813015, "global_step": 21397, "epoch": 179, "lr": 8.005200714609818e-05} +{"train_loss": 0.003970555495470762, "global_step": 21398, "epoch": 179, "lr": 8.005023643957185e-05} +{"train_loss": 0.005772528238594532, "global_step": 21399, "epoch": 179, "lr": 8.004846567404509e-05} +{"train_loss": 0.0075985137373209, "global_step": 21400, "epoch": 179, "lr": 8.004669484952139e-05} +{"train_loss": 0.0053222207352519035, "global_step": 21401, "epoch": 179, "lr": 8.004492396600419e-05} +{"train_loss": 0.006559412460774183, "global_step": 21402, "epoch": 179, "lr": 8.004315302349701e-05} +{"train_loss": 0.004127162508666515, "global_step": 21403, "epoch": 179, "lr": 8.00413820220033e-05} +{"train_loss": 0.00707100797444582, "global_step": 21404, "epoch": 179, "lr": 8.003961096152654e-05} +{"train_loss": 0.00443919887766242, "global_step": 21405, "epoch": 179, "lr": 8.003783984207023e-05} +{"train_loss": 0.003606051905080676, "global_step": 21406, "epoch": 179, "lr": 8.003606866363782e-05} +{"train_loss": 0.008601265028119087, "global_step": 21407, "epoch": 179, "lr": 8.003429742623281e-05} +{"train_loss": 0.004674585070461035, "global_step": 21408, "epoch": 179, "lr": 8.003252612985866e-05} +{"train_loss": 0.0047265454195439816, "global_step": 21409, "epoch": 179, "lr": 8.003075477451885e-05} +{"train_loss": 0.006000099238008261, "global_step": 21410, "epoch": 179, "lr": 8.002898336021686e-05} +{"train_loss": 0.005224226973950863, "global_step": 21411, "epoch": 179, "lr": 8.002721188695618e-05} +{"train_loss": 0.0050410060212016106, "global_step": 21412, "epoch": 179, "lr": 8.002544035474027e-05} +{"train_loss": 0.004870561882853508, "global_step": 21413, "epoch": 179, "lr": 8.002366876357261e-05} +{"train_loss": 0.006017700303345919, "global_step": 21414, "epoch": 179, "lr": 8.002189711345668e-05} +{"train_loss": 0.003825950901955366, "global_step": 21415, "epoch": 179, "lr": 8.002012540439596e-05} +{"train_loss": 0.004146801773458719, "global_step": 21416, "epoch": 179, "lr": 8.001835363639395e-05} +{"train_loss": 0.00786117184907198, "global_step": 21417, "epoch": 179, "lr": 8.00165818094541e-05} +{"train_loss": 0.004303746856749058, "global_step": 21418, "epoch": 179, "lr": 8.00148099235799e-05} +{"train_loss": 0.0047867129509877255, "global_step": 21419, "epoch": 179, "lr": 8.001303797877484e-05, "val_loss": 0.013322358950972557} +{"train_loss": 0.005811541806906462, "global_step": 21420, "epoch": 180, "lr": 8.001126597504235e-05} +{"train_loss": 0.006584973074495792, "global_step": 21421, "epoch": 180, "lr": 8.000949391238598e-05} +{"train_loss": 0.0038925842382013798, "global_step": 21422, "epoch": 180, "lr": 8.000772179080916e-05} +{"train_loss": 0.006901911459863186, "global_step": 21423, "epoch": 180, "lr": 8.00059496103154e-05} +{"train_loss": 0.003794681280851364, "global_step": 21424, "epoch": 180, "lr": 8.000417737090815e-05} +{"train_loss": 0.005701064132153988, "global_step": 21425, "epoch": 180, "lr": 8.00024050725909e-05} +{"train_loss": 0.003472109092399478, "global_step": 21426, "epoch": 180, "lr": 8.000063271536713e-05} +{"train_loss": 0.006509235594421625, "global_step": 21427, "epoch": 180, "lr": 7.999886029924034e-05} +{"train_loss": 0.006688230205327272, "global_step": 21428, "epoch": 180, "lr": 7.999708782421398e-05} +{"train_loss": 0.0059267194010317326, "global_step": 21429, "epoch": 180, "lr": 7.999531529029154e-05} +{"train_loss": 0.004888204857707024, "global_step": 21430, "epoch": 180, "lr": 7.999354269747652e-05} +{"train_loss": 0.004060032311826944, "global_step": 21431, "epoch": 180, "lr": 7.999177004577236e-05} +{"train_loss": 0.00630539795383811, "global_step": 21432, "epoch": 180, "lr": 7.998999733518258e-05} +{"train_loss": 0.0033702224027365446, "global_step": 21433, "epoch": 180, "lr": 7.998822456571064e-05} +{"train_loss": 0.0029547458980232477, "global_step": 21434, "epoch": 180, "lr": 7.998645173736002e-05} +{"train_loss": 0.003621955867856741, "global_step": 21435, "epoch": 180, "lr": 7.998467885013421e-05} +{"train_loss": 0.00672846008092165, "global_step": 21436, "epoch": 180, "lr": 7.99829059040367e-05} +{"train_loss": 0.008128407411277294, "global_step": 21437, "epoch": 180, "lr": 7.998113289907094e-05} +{"train_loss": 0.0042709833942353725, "global_step": 21438, "epoch": 180, "lr": 7.997935983524044e-05} +{"train_loss": 0.004557349719107151, "global_step": 21439, "epoch": 180, "lr": 7.997758671254865e-05} +{"train_loss": 0.0060984413139522076, "global_step": 21440, "epoch": 180, "lr": 7.997581353099908e-05} +{"train_loss": 0.003635527566075325, "global_step": 21441, "epoch": 180, "lr": 7.99740402905952e-05} +{"train_loss": 0.004151863045990467, "global_step": 21442, "epoch": 180, "lr": 7.997226699134051e-05} +{"train_loss": 0.006445626262575388, "global_step": 21443, "epoch": 180, "lr": 7.997049363323847e-05} +{"train_loss": 0.005709114018827677, "global_step": 21444, "epoch": 180, "lr": 7.996872021629256e-05} +{"train_loss": 0.008028252981603146, "global_step": 21445, "epoch": 180, "lr": 7.996694674050626e-05} +{"train_loss": 0.00617393059656024, "global_step": 21446, "epoch": 180, "lr": 7.996517320588308e-05} +{"train_loss": 0.005357502028346062, "global_step": 21447, "epoch": 180, "lr": 7.996339961242649e-05} +{"train_loss": 0.0043104905635118484, "global_step": 21448, "epoch": 180, "lr": 7.996162596013995e-05} +{"train_loss": 0.004305518697947264, "global_step": 21449, "epoch": 180, "lr": 7.995985224902696e-05} +{"train_loss": 0.006285893265157938, "global_step": 21450, "epoch": 180, "lr": 7.9958078479091e-05} +{"train_loss": 0.0040332176722586155, "global_step": 21451, "epoch": 180, "lr": 7.995630465033556e-05} +{"train_loss": 0.00330968271009624, "global_step": 21452, "epoch": 180, "lr": 7.995453076276412e-05} +{"train_loss": 0.004313326440751553, "global_step": 21453, "epoch": 180, "lr": 7.995275681638015e-05} +{"train_loss": 0.0068871742114424706, "global_step": 21454, "epoch": 180, "lr": 7.995098281118715e-05} +{"train_loss": 0.0067308866418898106, "global_step": 21455, "epoch": 180, "lr": 7.994920874718859e-05} +{"train_loss": 0.004572741687297821, "global_step": 21456, "epoch": 180, "lr": 7.994743462438795e-05} +{"train_loss": 0.005157055798918009, "global_step": 21457, "epoch": 180, "lr": 7.994566044278872e-05} +{"train_loss": 0.005811263341456652, "global_step": 21458, "epoch": 180, "lr": 7.99438862023944e-05} +{"train_loss": 0.003916967194527388, "global_step": 21459, "epoch": 180, "lr": 7.994211190320846e-05} +{"train_loss": 0.004564153496176004, "global_step": 21460, "epoch": 180, "lr": 7.994033754523437e-05} +{"train_loss": 0.005340443458408117, "global_step": 21461, "epoch": 180, "lr": 7.993856312847563e-05} +{"train_loss": 0.0050162761472165585, "global_step": 21462, "epoch": 180, "lr": 7.993678865293572e-05} +{"train_loss": 0.0063248747028410435, "global_step": 21463, "epoch": 180, "lr": 7.993501411861813e-05} +{"train_loss": 0.005560645367950201, "global_step": 21464, "epoch": 180, "lr": 7.993323952552632e-05} +{"train_loss": 0.007575128227472305, "global_step": 21465, "epoch": 180, "lr": 7.99314648736638e-05} +{"train_loss": 0.0040519945323467255, "global_step": 21466, "epoch": 180, "lr": 7.992969016303405e-05} +{"train_loss": 0.005268507171422243, "global_step": 21467, "epoch": 180, "lr": 7.992791539364058e-05} +{"train_loss": 0.004242440219968557, "global_step": 21468, "epoch": 180, "lr": 7.99261405654868e-05} +{"train_loss": 0.00413942476734519, "global_step": 21469, "epoch": 180, "lr": 7.992436567857626e-05} +{"train_loss": 0.004318585619330406, "global_step": 21470, "epoch": 180, "lr": 7.992259073291241e-05} +{"train_loss": 0.0048432257026433945, "global_step": 21471, "epoch": 180, "lr": 7.992081572849877e-05} +{"train_loss": 0.006215645000338554, "global_step": 21472, "epoch": 180, "lr": 7.991904066533879e-05} +{"train_loss": 0.004658942576497793, "global_step": 21473, "epoch": 180, "lr": 7.9917265543436e-05} +{"train_loss": 0.007154080085456371, "global_step": 21474, "epoch": 180, "lr": 7.991549036279382e-05} +{"train_loss": 0.004859266337007284, "global_step": 21475, "epoch": 180, "lr": 7.991371512341577e-05} +{"train_loss": 0.005050250329077244, "global_step": 21476, "epoch": 180, "lr": 7.991193982530536e-05} +{"train_loss": 0.006588870193809271, "global_step": 21477, "epoch": 180, "lr": 7.991016446846604e-05} +{"train_loss": 0.004857398569583893, "global_step": 21478, "epoch": 180, "lr": 7.99083890529013e-05} +{"train_loss": 0.006345784291625023, "global_step": 21479, "epoch": 180, "lr": 7.990661357861464e-05} +{"train_loss": 0.005273195914924145, "global_step": 21480, "epoch": 180, "lr": 7.990483804560955e-05} +{"train_loss": 0.003742919070646167, "global_step": 21481, "epoch": 180, "lr": 7.99030624538895e-05} +{"train_loss": 0.004740940872579813, "global_step": 21482, "epoch": 180, "lr": 7.990128680345797e-05} +{"train_loss": 0.005707716569304466, "global_step": 21483, "epoch": 180, "lr": 7.989951109431845e-05} +{"train_loss": 0.00645302003249526, "global_step": 21484, "epoch": 180, "lr": 7.989773532647447e-05} +{"train_loss": 0.005936709698289633, "global_step": 21485, "epoch": 180, "lr": 7.989595949992945e-05} +{"train_loss": 0.004314480349421501, "global_step": 21486, "epoch": 180, "lr": 7.989418361468692e-05} +{"train_loss": 0.0037154678720980883, "global_step": 21487, "epoch": 180, "lr": 7.989240767075035e-05} +{"train_loss": 0.0032856385223567486, "global_step": 21488, "epoch": 180, "lr": 7.989063166812323e-05} +{"train_loss": 0.0034796474501490593, "global_step": 21489, "epoch": 180, "lr": 7.988885560680905e-05} +{"train_loss": 0.006919442676007748, "global_step": 21490, "epoch": 180, "lr": 7.98870794868113e-05} +{"train_loss": 0.006748401094228029, "global_step": 21491, "epoch": 180, "lr": 7.988530330813346e-05} +{"train_loss": 0.0027082255110144615, "global_step": 21492, "epoch": 180, "lr": 7.988352707077902e-05} +{"train_loss": 0.008289437741041183, "global_step": 21493, "epoch": 180, "lr": 7.988175077475147e-05} +{"train_loss": 0.009558111429214478, "global_step": 21494, "epoch": 180, "lr": 7.987997442005429e-05} +{"train_loss": 0.004024181514978409, "global_step": 21495, "epoch": 180, "lr": 7.987819800669097e-05} +{"train_loss": 0.004718468990176916, "global_step": 21496, "epoch": 180, "lr": 7.987642153466501e-05} +{"train_loss": 0.009865514002740383, "global_step": 21497, "epoch": 180, "lr": 7.987464500397987e-05} +{"train_loss": 0.004433457739651203, "global_step": 21498, "epoch": 180, "lr": 7.987286841463908e-05} +{"train_loss": 0.007508451119065285, "global_step": 21499, "epoch": 180, "lr": 7.987109176664609e-05} +{"train_loss": 0.00695387739688158, "global_step": 21500, "epoch": 180, "lr": 7.98693150600044e-05} +{"train_loss": 0.006397600751370192, "global_step": 21501, "epoch": 180, "lr": 7.98675382947175e-05} +{"train_loss": 0.007231323514133692, "global_step": 21502, "epoch": 180, "lr": 7.986576147078888e-05} +{"train_loss": 0.006408517248928547, "global_step": 21503, "epoch": 180, "lr": 7.986398458822205e-05} +{"train_loss": 0.005072539672255516, "global_step": 21504, "epoch": 180, "lr": 7.986220764702046e-05} +{"train_loss": 0.003250520909205079, "global_step": 21505, "epoch": 180, "lr": 7.98604306471876e-05} +{"train_loss": 0.00544667849317193, "global_step": 21506, "epoch": 180, "lr": 7.9858653588727e-05} +{"train_loss": 0.007853766903281212, "global_step": 21507, "epoch": 180, "lr": 7.98568764716421e-05} +{"train_loss": 0.00749655207619071, "global_step": 21508, "epoch": 180, "lr": 7.985509929593644e-05} +{"train_loss": 0.0071408795192837715, "global_step": 21509, "epoch": 180, "lr": 7.985332206161347e-05} +{"train_loss": 0.004932669922709465, "global_step": 21510, "epoch": 180, "lr": 7.985154476867668e-05} +{"train_loss": 0.0055642081424593925, "global_step": 21511, "epoch": 180, "lr": 7.984976741712959e-05} +{"train_loss": 0.0037513759452849627, "global_step": 21512, "epoch": 180, "lr": 7.984799000697565e-05} +{"train_loss": 0.005416105967015028, "global_step": 21513, "epoch": 180, "lr": 7.984621253821838e-05} +{"train_loss": 0.007516232319176197, "global_step": 21514, "epoch": 180, "lr": 7.984443501086127e-05} +{"train_loss": 0.0049145701341331005, "global_step": 21515, "epoch": 180, "lr": 7.984265742490778e-05} +{"train_loss": 0.007543869782239199, "global_step": 21516, "epoch": 180, "lr": 7.984087978036143e-05} +{"train_loss": 0.004176761489361525, "global_step": 21517, "epoch": 180, "lr": 7.983910207722572e-05} +{"train_loss": 0.00651503074914217, "global_step": 21518, "epoch": 180, "lr": 7.98373243155041e-05} +{"train_loss": 0.004397702869027853, "global_step": 21519, "epoch": 180, "lr": 7.983554649520008e-05} +{"train_loss": 0.006236738990992308, "global_step": 21520, "epoch": 180, "lr": 7.983376861631716e-05} +{"train_loss": 0.0032664297614246607, "global_step": 21521, "epoch": 180, "lr": 7.983199067885883e-05} +{"train_loss": 0.005359564907848835, "global_step": 21522, "epoch": 180, "lr": 7.983021268282856e-05} +{"train_loss": 0.0043799602426588535, "global_step": 21523, "epoch": 180, "lr": 7.982843462822986e-05} +{"train_loss": 0.009166846051812172, "global_step": 21524, "epoch": 180, "lr": 7.98266565150662e-05} +{"train_loss": 0.005597310606390238, "global_step": 21525, "epoch": 180, "lr": 7.982487834334111e-05} +{"train_loss": 0.006423824466764927, "global_step": 21526, "epoch": 180, "lr": 7.982310011305805e-05} +{"train_loss": 0.007158936001360416, "global_step": 21527, "epoch": 180, "lr": 7.98213218242205e-05} +{"train_loss": 0.0055190627463161945, "global_step": 21528, "epoch": 180, "lr": 7.9819543476832e-05} +{"train_loss": 0.005821638274937868, "global_step": 21529, "epoch": 180, "lr": 7.981776507089598e-05} +{"train_loss": 0.004175025969743729, "global_step": 21530, "epoch": 180, "lr": 7.9815986606416e-05} +{"train_loss": 0.00569142447784543, "global_step": 21531, "epoch": 180, "lr": 7.981420808339549e-05} +{"train_loss": 0.006999673787504435, "global_step": 21532, "epoch": 180, "lr": 7.981242950183799e-05} +{"train_loss": 0.004193195607513189, "global_step": 21533, "epoch": 180, "lr": 7.981065086174694e-05} +{"train_loss": 0.003957109525799751, "global_step": 21534, "epoch": 180, "lr": 7.980887216312586e-05} +{"train_loss": 0.00723242899402976, "global_step": 21535, "epoch": 180, "lr": 7.980709340597827e-05} +{"train_loss": 0.008720452897250652, "global_step": 21536, "epoch": 180, "lr": 7.980531459030765e-05} +{"train_loss": 0.005140750203281641, "global_step": 21537, "epoch": 180, "lr": 7.980353571611744e-05} +{"train_loss": 0.005517400642700431, "global_step": 21538, "epoch": 180, "lr": 7.98017567834112e-05, "val_loss": 0.0194688867777586, "train_action_mse_error": 0.00011580241698538885} +{"train_loss": 0.006348820403218269, "global_step": 21539, "epoch": 181, "lr": 7.979997779219237e-05} +{"train_loss": 0.004695633891969919, "global_step": 21540, "epoch": 181, "lr": 7.979819874246449e-05} +{"train_loss": 0.0034747133031487465, "global_step": 21541, "epoch": 181, "lr": 7.979641963423102e-05} +{"train_loss": 0.004602732602506876, "global_step": 21542, "epoch": 181, "lr": 7.979464046749547e-05} +{"train_loss": 0.006952672265470028, "global_step": 21543, "epoch": 181, "lr": 7.97928612422613e-05} +{"train_loss": 0.003878046525642276, "global_step": 21544, "epoch": 181, "lr": 7.979108195853207e-05} +{"train_loss": 0.0054675801657140255, "global_step": 21545, "epoch": 181, "lr": 7.978930261631122e-05} +{"train_loss": 0.006076707039028406, "global_step": 21546, "epoch": 181, "lr": 7.978752321560223e-05} +{"train_loss": 0.005613685119897127, "global_step": 21547, "epoch": 181, "lr": 7.978574375640864e-05} +{"train_loss": 0.004681122489273548, "global_step": 21548, "epoch": 181, "lr": 7.978396423873393e-05} +{"train_loss": 0.0042418912053108215, "global_step": 21549, "epoch": 181, "lr": 7.978218466258159e-05} +{"train_loss": 0.0038401768542826176, "global_step": 21550, "epoch": 181, "lr": 7.97804050279551e-05} +{"train_loss": 0.005648619029670954, "global_step": 21551, "epoch": 181, "lr": 7.977862533485797e-05} +{"train_loss": 0.006848860532045364, "global_step": 21552, "epoch": 181, "lr": 7.97768455832937e-05} +{"train_loss": 0.004039842169731855, "global_step": 21553, "epoch": 181, "lr": 7.977506577326577e-05} +{"train_loss": 0.00463456055149436, "global_step": 21554, "epoch": 181, "lr": 7.977328590477766e-05} +{"train_loss": 0.00423216400668025, "global_step": 21555, "epoch": 181, "lr": 7.977150597783292e-05} +{"train_loss": 0.004088353365659714, "global_step": 21556, "epoch": 181, "lr": 7.976972599243498e-05} +{"train_loss": 0.004857962019741535, "global_step": 21557, "epoch": 181, "lr": 7.976794594858736e-05} +{"train_loss": 0.003825183492153883, "global_step": 21558, "epoch": 181, "lr": 7.976616584629358e-05} +{"train_loss": 0.004575119819492102, "global_step": 21559, "epoch": 181, "lr": 7.97643856855571e-05} +{"train_loss": 0.00361894303932786, "global_step": 21560, "epoch": 181, "lr": 7.976260546638143e-05} +{"train_loss": 0.00511398259550333, "global_step": 21561, "epoch": 181, "lr": 7.976082518877008e-05} +{"train_loss": 0.003887471044436097, "global_step": 21562, "epoch": 181, "lr": 7.975904485272652e-05} +{"train_loss": 0.0025767141487449408, "global_step": 21563, "epoch": 181, "lr": 7.975726445825425e-05} +{"train_loss": 0.004034444224089384, "global_step": 21564, "epoch": 181, "lr": 7.975548400535676e-05} +{"train_loss": 0.003105360548943281, "global_step": 21565, "epoch": 181, "lr": 7.975370349403757e-05} +{"train_loss": 0.0035652141086757183, "global_step": 21566, "epoch": 181, "lr": 7.975192292430016e-05} +{"train_loss": 0.005337755661457777, "global_step": 21567, "epoch": 181, "lr": 7.975014229614804e-05} +{"train_loss": 0.0038035293109714985, "global_step": 21568, "epoch": 181, "lr": 7.974836160958468e-05} +{"train_loss": 0.0023042901884764433, "global_step": 21569, "epoch": 181, "lr": 7.974658086461358e-05} +{"train_loss": 0.004323254339396954, "global_step": 21570, "epoch": 181, "lr": 7.974480006123826e-05} +{"train_loss": 0.006068195682018995, "global_step": 21571, "epoch": 181, "lr": 7.974301919946218e-05} +{"train_loss": 0.003779737977311015, "global_step": 21572, "epoch": 181, "lr": 7.974123827928889e-05} +{"train_loss": 0.006580546963959932, "global_step": 21573, "epoch": 181, "lr": 7.973945730072186e-05} +{"train_loss": 0.0029485919512808323, "global_step": 21574, "epoch": 181, "lr": 7.973767626376456e-05} +{"train_loss": 0.006299658678472042, "global_step": 21575, "epoch": 181, "lr": 7.973589516842052e-05} +{"train_loss": 0.003924179822206497, "global_step": 21576, "epoch": 181, "lr": 7.973411401469321e-05} +{"train_loss": 0.0028833637479692698, "global_step": 21577, "epoch": 181, "lr": 7.973233280258616e-05} +{"train_loss": 0.004698868840932846, "global_step": 21578, "epoch": 181, "lr": 7.973055153210285e-05} +{"train_loss": 0.005310681648552418, "global_step": 21579, "epoch": 181, "lr": 7.972877020324678e-05} +{"train_loss": 0.003679285291582346, "global_step": 21580, "epoch": 181, "lr": 7.972698881602146e-05} +{"train_loss": 0.004019865300506353, "global_step": 21581, "epoch": 181, "lr": 7.972520737043034e-05} +{"train_loss": 0.003341659437865019, "global_step": 21582, "epoch": 181, "lr": 7.972342586647697e-05} +{"train_loss": 0.003906900994479656, "global_step": 21583, "epoch": 181, "lr": 7.972164430416482e-05} +{"train_loss": 0.004626448731869459, "global_step": 21584, "epoch": 181, "lr": 7.97198626834974e-05} +{"train_loss": 0.003332041669636965, "global_step": 21585, "epoch": 181, "lr": 7.971808100447822e-05} +{"train_loss": 0.005251054652035236, "global_step": 21586, "epoch": 181, "lr": 7.971629926711075e-05} +{"train_loss": 0.004502254072576761, "global_step": 21587, "epoch": 181, "lr": 7.971451747139851e-05} +{"train_loss": 0.004191237967461348, "global_step": 21588, "epoch": 181, "lr": 7.971273561734496e-05} +{"train_loss": 0.0033736727200448513, "global_step": 21589, "epoch": 181, "lr": 7.971095370495367e-05} +{"train_loss": 0.004525899421423674, "global_step": 21590, "epoch": 181, "lr": 7.970917173422807e-05} +{"train_loss": 0.0037467540241777897, "global_step": 21591, "epoch": 181, "lr": 7.970738970517168e-05} +{"train_loss": 0.0031051908154040575, "global_step": 21592, "epoch": 181, "lr": 7.970560761778803e-05} +{"train_loss": 0.0022713299840688705, "global_step": 21593, "epoch": 181, "lr": 7.970382547208057e-05} +{"train_loss": 0.003629065118730068, "global_step": 21594, "epoch": 181, "lr": 7.970204326805284e-05} +{"train_loss": 0.004774716682732105, "global_step": 21595, "epoch": 181, "lr": 7.97002610057083e-05} +{"train_loss": 0.004666192922741175, "global_step": 21596, "epoch": 181, "lr": 7.969847868505048e-05} +{"train_loss": 0.004759274423122406, "global_step": 21597, "epoch": 181, "lr": 7.969669630608288e-05} +{"train_loss": 0.005362937226891518, "global_step": 21598, "epoch": 181, "lr": 7.969491386880898e-05} +{"train_loss": 0.0036782000679522753, "global_step": 21599, "epoch": 181, "lr": 7.969313137323229e-05} +{"train_loss": 0.005770537536591291, "global_step": 21600, "epoch": 181, "lr": 7.969134881935631e-05} +{"train_loss": 0.004825394134968519, "global_step": 21601, "epoch": 181, "lr": 7.968956620718453e-05} +{"train_loss": 0.0068482328206300735, "global_step": 21602, "epoch": 181, "lr": 7.968778353672048e-05} +{"train_loss": 0.0027102967724204063, "global_step": 21603, "epoch": 181, "lr": 7.968600080796762e-05} +{"train_loss": 0.0042922040447592735, "global_step": 21604, "epoch": 181, "lr": 7.968421802092947e-05} +{"train_loss": 0.004973056260496378, "global_step": 21605, "epoch": 181, "lr": 7.968243517560954e-05} +{"train_loss": 0.004299781285226345, "global_step": 21606, "epoch": 181, "lr": 7.968065227201132e-05} +{"train_loss": 0.003659859299659729, "global_step": 21607, "epoch": 181, "lr": 7.96788693101383e-05} +{"train_loss": 0.0028694630600512028, "global_step": 21608, "epoch": 181, "lr": 7.967708628999398e-05} +{"train_loss": 0.0031250540632754564, "global_step": 21609, "epoch": 181, "lr": 7.967530321158189e-05} +{"train_loss": 0.004350547678768635, "global_step": 21610, "epoch": 181, "lr": 7.96735200749055e-05} +{"train_loss": 0.005280403885990381, "global_step": 21611, "epoch": 181, "lr": 7.967173687996834e-05} +{"train_loss": 0.005407894961535931, "global_step": 21612, "epoch": 181, "lr": 7.966995362677389e-05} +{"train_loss": 0.006240649148821831, "global_step": 21613, "epoch": 181, "lr": 7.966817031532566e-05} +{"train_loss": 0.0039046905003488064, "global_step": 21614, "epoch": 181, "lr": 7.966638694562713e-05} +{"train_loss": 0.003085603704676032, "global_step": 21615, "epoch": 181, "lr": 7.966460351768182e-05} +{"train_loss": 0.004648572765290737, "global_step": 21616, "epoch": 181, "lr": 7.966282003149324e-05} +{"train_loss": 0.004050499759614468, "global_step": 21617, "epoch": 181, "lr": 7.966103648706488e-05} +{"train_loss": 0.004552498459815979, "global_step": 21618, "epoch": 181, "lr": 7.965925288440025e-05} +{"train_loss": 0.005550004076212645, "global_step": 21619, "epoch": 181, "lr": 7.965746922350284e-05} +{"train_loss": 0.005284271202981472, "global_step": 21620, "epoch": 181, "lr": 7.965568550437615e-05} +{"train_loss": 0.00693663302809, "global_step": 21621, "epoch": 181, "lr": 7.965390172702369e-05} +{"train_loss": 0.005425053648650646, "global_step": 21622, "epoch": 181, "lr": 7.965211789144898e-05} +{"train_loss": 0.00607336824759841, "global_step": 21623, "epoch": 181, "lr": 7.965033399765549e-05} +{"train_loss": 0.004338787868618965, "global_step": 21624, "epoch": 181, "lr": 7.964855004564675e-05} +{"train_loss": 0.004594487138092518, "global_step": 21625, "epoch": 181, "lr": 7.964676603542623e-05} +{"train_loss": 0.004578186199069023, "global_step": 21626, "epoch": 181, "lr": 7.964498196699746e-05} +{"train_loss": 0.005750635173171759, "global_step": 21627, "epoch": 181, "lr": 7.964319784036393e-05} +{"train_loss": 0.004498627968132496, "global_step": 21628, "epoch": 181, "lr": 7.964141365552915e-05} +{"train_loss": 0.00498180091381073, "global_step": 21629, "epoch": 181, "lr": 7.963962941249662e-05} +{"train_loss": 0.0025435113348066807, "global_step": 21630, "epoch": 181, "lr": 7.963784511126986e-05} +{"train_loss": 0.0040647052228450775, "global_step": 21631, "epoch": 181, "lr": 7.963606075185234e-05} +{"train_loss": 0.0065050022676587105, "global_step": 21632, "epoch": 181, "lr": 7.96342763342476e-05} +{"train_loss": 0.0039331647567451, "global_step": 21633, "epoch": 181, "lr": 7.963249185845911e-05} +{"train_loss": 0.0035699475556612015, "global_step": 21634, "epoch": 181, "lr": 7.963070732449038e-05} +{"train_loss": 0.002852236619219184, "global_step": 21635, "epoch": 181, "lr": 7.962892273234495e-05} +{"train_loss": 0.00601011561229825, "global_step": 21636, "epoch": 181, "lr": 7.962713808202627e-05} +{"train_loss": 0.004704607184976339, "global_step": 21637, "epoch": 181, "lr": 7.962535337353787e-05} +{"train_loss": 0.004614139441400766, "global_step": 21638, "epoch": 181, "lr": 7.962356860688326e-05} +{"train_loss": 0.004435176495462656, "global_step": 21639, "epoch": 181, "lr": 7.962178378206594e-05} +{"train_loss": 0.004658252000808716, "global_step": 21640, "epoch": 181, "lr": 7.961999889908942e-05} +{"train_loss": 0.003952053841203451, "global_step": 21641, "epoch": 181, "lr": 7.961821395795718e-05} +{"train_loss": 0.0068903397768735886, "global_step": 21642, "epoch": 181, "lr": 7.961642895867276e-05} +{"train_loss": 0.005536729469895363, "global_step": 21643, "epoch": 181, "lr": 7.961464390123963e-05} +{"train_loss": 0.0032902408856898546, "global_step": 21644, "epoch": 181, "lr": 7.961285878566131e-05} +{"train_loss": 0.004207542631775141, "global_step": 21645, "epoch": 181, "lr": 7.961107361194131e-05} +{"train_loss": 0.005567831452935934, "global_step": 21646, "epoch": 181, "lr": 7.960928838008312e-05} +{"train_loss": 0.005357649642974138, "global_step": 21647, "epoch": 181, "lr": 7.960750309009027e-05} +{"train_loss": 0.0034328727051615715, "global_step": 21648, "epoch": 181, "lr": 7.960571774196625e-05} +{"train_loss": 0.003824330400675535, "global_step": 21649, "epoch": 181, "lr": 7.960393233571458e-05} +{"train_loss": 0.0038442430086433887, "global_step": 21650, "epoch": 181, "lr": 7.960214687133873e-05} +{"train_loss": 0.004799742251634598, "global_step": 21651, "epoch": 181, "lr": 7.960036134884223e-05} +{"train_loss": 0.0038493138272315264, "global_step": 21652, "epoch": 181, "lr": 7.959857576822858e-05} +{"train_loss": 0.006947660818696022, "global_step": 21653, "epoch": 181, "lr": 7.95967901295013e-05} +{"train_loss": 0.006114358082413673, "global_step": 21654, "epoch": 181, "lr": 7.959500443266387e-05} +{"train_loss": 0.00748881371691823, "global_step": 21655, "epoch": 181, "lr": 7.959321867771982e-05} +{"train_loss": 0.0021847737953066826, "global_step": 21656, "epoch": 181, "lr": 7.959143286467264e-05} +{"train_loss": 0.004541901474380318, "global_step": 21657, "epoch": 181, "lr": 7.958964699352585e-05, "val_loss": 0.01291142962872982} +{"train_loss": 0.005159859545528889, "global_step": 21658, "epoch": 182, "lr": 7.958786106428295e-05} +{"train_loss": 0.003323107259348035, "global_step": 21659, "epoch": 182, "lr": 7.958607507694745e-05} +{"train_loss": 0.003658680245280266, "global_step": 21660, "epoch": 182, "lr": 7.958428903152284e-05} +{"train_loss": 0.003882254008203745, "global_step": 21661, "epoch": 182, "lr": 7.958250292801264e-05} +{"train_loss": 0.005156929139047861, "global_step": 21662, "epoch": 182, "lr": 7.958071676642037e-05} +{"train_loss": 0.004226953722536564, "global_step": 21663, "epoch": 182, "lr": 7.95789305467495e-05} +{"train_loss": 0.004875180311501026, "global_step": 21664, "epoch": 182, "lr": 7.957714426900358e-05} +{"train_loss": 0.006140580400824547, "global_step": 21665, "epoch": 182, "lr": 7.957535793318608e-05} +{"train_loss": 0.00538651505485177, "global_step": 21666, "epoch": 182, "lr": 7.957357153930054e-05} +{"train_loss": 0.0037956596352159977, "global_step": 21667, "epoch": 182, "lr": 7.957178508735046e-05} +{"train_loss": 0.005679070483893156, "global_step": 21668, "epoch": 182, "lr": 7.956999857733932e-05} +{"train_loss": 0.00523662893101573, "global_step": 21669, "epoch": 182, "lr": 7.956821200927065e-05} +{"train_loss": 0.0033201624173671007, "global_step": 21670, "epoch": 182, "lr": 7.956642538314795e-05} +{"train_loss": 0.006957721430808306, "global_step": 21671, "epoch": 182, "lr": 7.956463869897474e-05} +{"train_loss": 0.004261239897459745, "global_step": 21672, "epoch": 182, "lr": 7.956285195675453e-05} +{"train_loss": 0.004145015962421894, "global_step": 21673, "epoch": 182, "lr": 7.95610651564908e-05} +{"train_loss": 0.003549088491126895, "global_step": 21674, "epoch": 182, "lr": 7.95592782981871e-05} +{"train_loss": 0.003456302685663104, "global_step": 21675, "epoch": 182, "lr": 7.95574913818469e-05} +{"train_loss": 0.004477617330849171, "global_step": 21676, "epoch": 182, "lr": 7.955570440747371e-05} +{"train_loss": 0.004228303208947182, "global_step": 21677, "epoch": 182, "lr": 7.955391737507108e-05} +{"train_loss": 0.0034554325975477695, "global_step": 21678, "epoch": 182, "lr": 7.955213028464246e-05} +{"train_loss": 0.0030392692424356937, "global_step": 21679, "epoch": 182, "lr": 7.955034313619141e-05} +{"train_loss": 0.002412785543128848, "global_step": 21680, "epoch": 182, "lr": 7.954855592972141e-05} +{"train_loss": 0.0064083850011229515, "global_step": 21681, "epoch": 182, "lr": 7.954676866523598e-05} +{"train_loss": 0.0030284137465059757, "global_step": 21682, "epoch": 182, "lr": 7.954498134273863e-05} +{"train_loss": 0.0038895842153578997, "global_step": 21683, "epoch": 182, "lr": 7.954319396223287e-05} +{"train_loss": 0.00526438420638442, "global_step": 21684, "epoch": 182, "lr": 7.95414065237222e-05} +{"train_loss": 0.003880108706653118, "global_step": 21685, "epoch": 182, "lr": 7.953961902721012e-05} +{"train_loss": 0.006960052996873856, "global_step": 21686, "epoch": 182, "lr": 7.953783147270017e-05} +{"train_loss": 0.005264793988317251, "global_step": 21687, "epoch": 182, "lr": 7.953604386019584e-05} +{"train_loss": 0.003607379272580147, "global_step": 21688, "epoch": 182, "lr": 7.953425618970065e-05} +{"train_loss": 0.004912605509161949, "global_step": 21689, "epoch": 182, "lr": 7.95324684612181e-05} +{"train_loss": 0.00467255525290966, "global_step": 21690, "epoch": 182, "lr": 7.953068067475169e-05} +{"train_loss": 0.0026102864649146795, "global_step": 21691, "epoch": 182, "lr": 7.952889283030496e-05} +{"train_loss": 0.007362594828009605, "global_step": 21692, "epoch": 182, "lr": 7.95271049278814e-05} +{"train_loss": 0.004100223071873188, "global_step": 21693, "epoch": 182, "lr": 7.952531696748451e-05} +{"train_loss": 0.003983506001532078, "global_step": 21694, "epoch": 182, "lr": 7.952352894911783e-05} +{"train_loss": 0.003689990844577551, "global_step": 21695, "epoch": 182, "lr": 7.952174087278485e-05} +{"train_loss": 0.006417067721486092, "global_step": 21696, "epoch": 182, "lr": 7.951995273848908e-05} +{"train_loss": 0.005302544217556715, "global_step": 21697, "epoch": 182, "lr": 7.951816454623404e-05} +{"train_loss": 0.004486780613660812, "global_step": 21698, "epoch": 182, "lr": 7.951637629602325e-05} +{"train_loss": 0.005124197807163, "global_step": 21699, "epoch": 182, "lr": 7.95145879878602e-05} +{"train_loss": 0.00458255410194397, "global_step": 21700, "epoch": 182, "lr": 7.95127996217484e-05} +{"train_loss": 0.003963458351790905, "global_step": 21701, "epoch": 182, "lr": 7.951101119769138e-05} +{"train_loss": 0.003186787012964487, "global_step": 21702, "epoch": 182, "lr": 7.950922271569265e-05} +{"train_loss": 0.004923576954752207, "global_step": 21703, "epoch": 182, "lr": 7.95074341757557e-05} +{"train_loss": 0.0044105444103479385, "global_step": 21704, "epoch": 182, "lr": 7.950564557788404e-05} +{"train_loss": 0.003994747996330261, "global_step": 21705, "epoch": 182, "lr": 7.950385692208124e-05} +{"train_loss": 0.003859175369143486, "global_step": 21706, "epoch": 182, "lr": 7.950206820835075e-05} +{"train_loss": 0.006687439512461424, "global_step": 21707, "epoch": 182, "lr": 7.95002794366961e-05} +{"train_loss": 0.004069210961461067, "global_step": 21708, "epoch": 182, "lr": 7.94984906071208e-05} +{"train_loss": 0.0034743810538202524, "global_step": 21709, "epoch": 182, "lr": 7.949670171962835e-05} +{"train_loss": 0.0033392184413969517, "global_step": 21710, "epoch": 182, "lr": 7.94949127742223e-05} +{"train_loss": 0.005510625895112753, "global_step": 21711, "epoch": 182, "lr": 7.949312377090613e-05} +{"train_loss": 0.005500307772308588, "global_step": 21712, "epoch": 182, "lr": 7.949133470968337e-05} +{"train_loss": 0.0028257318772375584, "global_step": 21713, "epoch": 182, "lr": 7.948954559055751e-05} +{"train_loss": 0.00465863011777401, "global_step": 21714, "epoch": 182, "lr": 7.948775641353209e-05} +{"train_loss": 0.0037646018899977207, "global_step": 21715, "epoch": 182, "lr": 7.948596717861061e-05} +{"train_loss": 0.0035022078081965446, "global_step": 21716, "epoch": 182, "lr": 7.948417788579659e-05} +{"train_loss": 0.0032462526578456163, "global_step": 21717, "epoch": 182, "lr": 7.948238853509353e-05} +{"train_loss": 0.005798459518700838, "global_step": 21718, "epoch": 182, "lr": 7.948059912650494e-05} +{"train_loss": 0.00550386356189847, "global_step": 21719, "epoch": 182, "lr": 7.947880966003434e-05} +{"train_loss": 0.004652149043977261, "global_step": 21720, "epoch": 182, "lr": 7.947702013568526e-05} +{"train_loss": 0.005119344685226679, "global_step": 21721, "epoch": 182, "lr": 7.94752305534612e-05} +{"train_loss": 0.004492354579269886, "global_step": 21722, "epoch": 182, "lr": 7.947344091336568e-05} +{"train_loss": 0.005716727580875158, "global_step": 21723, "epoch": 182, "lr": 7.947165121540219e-05} +{"train_loss": 0.005365313030779362, "global_step": 21724, "epoch": 182, "lr": 7.946986145957428e-05} +{"train_loss": 0.005106290802359581, "global_step": 21725, "epoch": 182, "lr": 7.946807164588544e-05} +{"train_loss": 0.003444382920861244, "global_step": 21726, "epoch": 182, "lr": 7.946628177433919e-05} +{"train_loss": 0.004276003688573837, "global_step": 21727, "epoch": 182, "lr": 7.946449184493903e-05} +{"train_loss": 0.003564965445548296, "global_step": 21728, "epoch": 182, "lr": 7.94627018576885e-05} +{"train_loss": 0.004884741269052029, "global_step": 21729, "epoch": 182, "lr": 7.94609118125911e-05} +{"train_loss": 0.005306745879352093, "global_step": 21730, "epoch": 182, "lr": 7.945912170965035e-05} +{"train_loss": 0.008677711710333824, "global_step": 21731, "epoch": 182, "lr": 7.945733154886976e-05} +{"train_loss": 0.004089612979441881, "global_step": 21732, "epoch": 182, "lr": 7.945554133025283e-05} +{"train_loss": 0.004131302237510681, "global_step": 21733, "epoch": 182, "lr": 7.945375105380312e-05} +{"train_loss": 0.004304501228034496, "global_step": 21734, "epoch": 182, "lr": 7.94519607195241e-05} +{"train_loss": 0.004006051458418369, "global_step": 21735, "epoch": 182, "lr": 7.94501703274193e-05} +{"train_loss": 0.00499136233702302, "global_step": 21736, "epoch": 182, "lr": 7.944837987749226e-05} +{"train_loss": 0.006406264845281839, "global_step": 21737, "epoch": 182, "lr": 7.944658936974645e-05} +{"train_loss": 0.004569839686155319, "global_step": 21738, "epoch": 182, "lr": 7.94447988041854e-05} +{"train_loss": 0.007377278991043568, "global_step": 21739, "epoch": 182, "lr": 7.944300818081265e-05} +{"train_loss": 0.004558430518954992, "global_step": 21740, "epoch": 182, "lr": 7.94412174996317e-05} +{"train_loss": 0.0053298817947506905, "global_step": 21741, "epoch": 182, "lr": 7.943942676064605e-05} +{"train_loss": 0.004312403034418821, "global_step": 21742, "epoch": 182, "lr": 7.943763596385924e-05} +{"train_loss": 0.004580327775329351, "global_step": 21743, "epoch": 182, "lr": 7.943584510927477e-05} +{"train_loss": 0.007390993181616068, "global_step": 21744, "epoch": 182, "lr": 7.943405419689618e-05} +{"train_loss": 0.00783741194754839, "global_step": 21745, "epoch": 182, "lr": 7.943226322672695e-05} +{"train_loss": 0.0019303127191960812, "global_step": 21746, "epoch": 182, "lr": 7.943047219877062e-05} +{"train_loss": 0.003419822081923485, "global_step": 21747, "epoch": 182, "lr": 7.942868111303071e-05} +{"train_loss": 0.005046497564762831, "global_step": 21748, "epoch": 182, "lr": 7.942688996951073e-05} +{"train_loss": 0.002822326263412833, "global_step": 21749, "epoch": 182, "lr": 7.94250987682142e-05} +{"train_loss": 0.0036416947841644287, "global_step": 21750, "epoch": 182, "lr": 7.942330750914461e-05} +{"train_loss": 0.0028639202937483788, "global_step": 21751, "epoch": 182, "lr": 7.942151619230552e-05} +{"train_loss": 0.004687632899731398, "global_step": 21752, "epoch": 182, "lr": 7.941972481770041e-05} +{"train_loss": 0.0034226931165903807, "global_step": 21753, "epoch": 182, "lr": 7.941793338533281e-05} +{"train_loss": 0.007363848853856325, "global_step": 21754, "epoch": 182, "lr": 7.941614189520625e-05} +{"train_loss": 0.005617816932499409, "global_step": 21755, "epoch": 182, "lr": 7.941435034732425e-05} +{"train_loss": 0.007354347966611385, "global_step": 21756, "epoch": 182, "lr": 7.941255874169032e-05} +{"train_loss": 0.004805901553481817, "global_step": 21757, "epoch": 182, "lr": 7.941076707830795e-05} +{"train_loss": 0.0025128701236099005, "global_step": 21758, "epoch": 182, "lr": 7.940897535718068e-05} +{"train_loss": 0.00490095280110836, "global_step": 21759, "epoch": 182, "lr": 7.940718357831205e-05} +{"train_loss": 0.003947138320654631, "global_step": 21760, "epoch": 182, "lr": 7.940539174170554e-05} +{"train_loss": 0.0064071835950016975, "global_step": 21761, "epoch": 182, "lr": 7.940359984736469e-05} +{"train_loss": 0.003931510262191296, "global_step": 21762, "epoch": 182, "lr": 7.940180789529302e-05} +{"train_loss": 0.004517014604061842, "global_step": 21763, "epoch": 182, "lr": 7.940001588549402e-05} +{"train_loss": 0.004927096888422966, "global_step": 21764, "epoch": 182, "lr": 7.939822381797124e-05} +{"train_loss": 0.007208854425698519, "global_step": 21765, "epoch": 182, "lr": 7.939643169272819e-05} +{"train_loss": 0.0037241242825984955, "global_step": 21766, "epoch": 182, "lr": 7.93946395097684e-05} +{"train_loss": 0.006666562519967556, "global_step": 21767, "epoch": 182, "lr": 7.939284726909535e-05} +{"train_loss": 0.005058884620666504, "global_step": 21768, "epoch": 182, "lr": 7.93910549707126e-05} +{"train_loss": 0.005668445490300655, "global_step": 21769, "epoch": 182, "lr": 7.938926261462366e-05} +{"train_loss": 0.004840393550693989, "global_step": 21770, "epoch": 182, "lr": 7.938747020083204e-05} +{"train_loss": 0.0055197374895215034, "global_step": 21771, "epoch": 182, "lr": 7.938567772934125e-05} +{"train_loss": 0.0036560746375471354, "global_step": 21772, "epoch": 182, "lr": 7.938388520015483e-05} +{"train_loss": 0.005307526793330908, "global_step": 21773, "epoch": 182, "lr": 7.93820926132763e-05} +{"train_loss": 0.007141873240470886, "global_step": 21774, "epoch": 182, "lr": 7.938029996870915e-05} +{"train_loss": 0.003969206009060144, "global_step": 21775, "epoch": 182, "lr": 7.937850726645692e-05} +{"train_loss": 0.004693979434590756, "global_step": 21776, "epoch": 182, "lr": 7.937671450652315e-05, "val_loss": 0.028901059180498123} +{"train_loss": 0.003522556973621249, "global_step": 21777, "epoch": 183, "lr": 7.937492168891133e-05} +{"train_loss": 0.005343679804354906, "global_step": 21778, "epoch": 183, "lr": 7.937312881362497e-05} +{"train_loss": 0.0027818724047392607, "global_step": 21779, "epoch": 183, "lr": 7.937133588066764e-05} +{"train_loss": 0.004056243225932121, "global_step": 21780, "epoch": 183, "lr": 7.936954289004281e-05} +{"train_loss": 0.003718045074492693, "global_step": 21781, "epoch": 183, "lr": 7.936774984175404e-05} +{"train_loss": 0.004304016008973122, "global_step": 21782, "epoch": 183, "lr": 7.936595673580481e-05} +{"train_loss": 0.0031364646274596453, "global_step": 21783, "epoch": 183, "lr": 7.936416357219867e-05} +{"train_loss": 0.004721710924059153, "global_step": 21784, "epoch": 183, "lr": 7.936237035093913e-05} +{"train_loss": 0.00559249660000205, "global_step": 21785, "epoch": 183, "lr": 7.93605770720297e-05} +{"train_loss": 0.00468537537381053, "global_step": 21786, "epoch": 183, "lr": 7.935878373547393e-05} +{"train_loss": 0.006346023641526699, "global_step": 21787, "epoch": 183, "lr": 7.935699034127533e-05} +{"train_loss": 0.0026567308232188225, "global_step": 21788, "epoch": 183, "lr": 7.935519688943741e-05} +{"train_loss": 0.004371998831629753, "global_step": 21789, "epoch": 183, "lr": 7.935340337996369e-05} +{"train_loss": 0.004455015063285828, "global_step": 21790, "epoch": 183, "lr": 7.935160981285771e-05} +{"train_loss": 0.0063391393050551414, "global_step": 21791, "epoch": 183, "lr": 7.934981618812298e-05} +{"train_loss": 0.0035927214194089174, "global_step": 21792, "epoch": 183, "lr": 7.934802250576301e-05} +{"train_loss": 0.004503083415329456, "global_step": 21793, "epoch": 183, "lr": 7.934622876578132e-05} +{"train_loss": 0.0044663636945188046, "global_step": 21794, "epoch": 183, "lr": 7.934443496818147e-05} +{"train_loss": 0.004092861898243427, "global_step": 21795, "epoch": 183, "lr": 7.934264111296696e-05} +{"train_loss": 0.002880295505747199, "global_step": 21796, "epoch": 183, "lr": 7.93408472001413e-05} +{"train_loss": 0.006077443715184927, "global_step": 21797, "epoch": 183, "lr": 7.9339053229708e-05} +{"train_loss": 0.005937977693974972, "global_step": 21798, "epoch": 183, "lr": 7.933725920167063e-05} +{"train_loss": 0.0024084686301648617, "global_step": 21799, "epoch": 183, "lr": 7.93354651160327e-05} +{"train_loss": 0.008960891515016556, "global_step": 21800, "epoch": 183, "lr": 7.933367097279769e-05} +{"train_loss": 0.003718801774084568, "global_step": 21801, "epoch": 183, "lr": 7.933187677196914e-05} +{"train_loss": 0.004494761116802692, "global_step": 21802, "epoch": 183, "lr": 7.933008251355061e-05} +{"train_loss": 0.0064621432684361935, "global_step": 21803, "epoch": 183, "lr": 7.932828819754559e-05} +{"train_loss": 0.0034468446392565966, "global_step": 21804, "epoch": 183, "lr": 7.93264938239576e-05} +{"train_loss": 0.003189732553437352, "global_step": 21805, "epoch": 183, "lr": 7.93246993927902e-05} +{"train_loss": 0.005191098432987928, "global_step": 21806, "epoch": 183, "lr": 7.932290490404686e-05} +{"train_loss": 0.003354409709572792, "global_step": 21807, "epoch": 183, "lr": 7.932111035773113e-05} +{"train_loss": 0.00504220649600029, "global_step": 21808, "epoch": 183, "lr": 7.931931575384654e-05} +{"train_loss": 0.0046273949556052685, "global_step": 21809, "epoch": 183, "lr": 7.93175210923966e-05} +{"train_loss": 0.0030197554733604193, "global_step": 21810, "epoch": 183, "lr": 7.931572637338484e-05} +{"train_loss": 0.004711911082267761, "global_step": 21811, "epoch": 183, "lr": 7.931393159681479e-05} +{"train_loss": 0.002566116861999035, "global_step": 21812, "epoch": 183, "lr": 7.931213676268996e-05} +{"train_loss": 0.006244422867894173, "global_step": 21813, "epoch": 183, "lr": 7.931034187101388e-05} +{"train_loss": 0.00422392413020134, "global_step": 21814, "epoch": 183, "lr": 7.930854692179008e-05} +{"train_loss": 0.006383778993040323, "global_step": 21815, "epoch": 183, "lr": 7.930675191502208e-05} +{"train_loss": 0.005876663140952587, "global_step": 21816, "epoch": 183, "lr": 7.93049568507134e-05} +{"train_loss": 0.004405065439641476, "global_step": 21817, "epoch": 183, "lr": 7.930316172886756e-05} +{"train_loss": 0.003945731557905674, "global_step": 21818, "epoch": 183, "lr": 7.930136654948811e-05} +{"train_loss": 0.006441317964345217, "global_step": 21819, "epoch": 183, "lr": 7.929957131257855e-05} +{"train_loss": 0.004817477427423, "global_step": 21820, "epoch": 183, "lr": 7.929777601814242e-05} +{"train_loss": 0.005020282231271267, "global_step": 21821, "epoch": 183, "lr": 7.929598066618322e-05} +{"train_loss": 0.00580156734213233, "global_step": 21822, "epoch": 183, "lr": 7.929418525670448e-05} +{"train_loss": 0.003549039363861084, "global_step": 21823, "epoch": 183, "lr": 7.929238978970976e-05} +{"train_loss": 0.006547513883560896, "global_step": 21824, "epoch": 183, "lr": 7.929059426520258e-05} +{"train_loss": 0.006452609319239855, "global_step": 21825, "epoch": 183, "lr": 7.928879868318642e-05} +{"train_loss": 0.005966112948954105, "global_step": 21826, "epoch": 183, "lr": 7.928700304366484e-05} +{"train_loss": 0.004106905311346054, "global_step": 21827, "epoch": 183, "lr": 7.928520734664136e-05} +{"train_loss": 0.006080180872231722, "global_step": 21828, "epoch": 183, "lr": 7.92834115921195e-05} +{"train_loss": 0.0032726910430938005, "global_step": 21829, "epoch": 183, "lr": 7.928161578010279e-05} +{"train_loss": 0.0038371800910681486, "global_step": 21830, "epoch": 183, "lr": 7.927981991059475e-05} +{"train_loss": 0.006963691208511591, "global_step": 21831, "epoch": 183, "lr": 7.927802398359892e-05} +{"train_loss": 0.003312178887426853, "global_step": 21832, "epoch": 183, "lr": 7.927622799911883e-05} +{"train_loss": 0.004345322027802467, "global_step": 21833, "epoch": 183, "lr": 7.927443195715796e-05} +{"train_loss": 0.005776363890618086, "global_step": 21834, "epoch": 183, "lr": 7.92726358577199e-05} +{"train_loss": 0.003961327951401472, "global_step": 21835, "epoch": 183, "lr": 7.927083970080813e-05} +{"train_loss": 0.005186518654227257, "global_step": 21836, "epoch": 183, "lr": 7.92690434864262e-05} +{"train_loss": 0.006740535143762827, "global_step": 21837, "epoch": 183, "lr": 7.926724721457764e-05} +{"train_loss": 0.0032695068512111902, "global_step": 21838, "epoch": 183, "lr": 7.926545088526595e-05} +{"train_loss": 0.005200833082199097, "global_step": 21839, "epoch": 183, "lr": 7.926365449849468e-05} +{"train_loss": 0.00443741399794817, "global_step": 21840, "epoch": 183, "lr": 7.926185805426735e-05} +{"train_loss": 0.0040401858277618885, "global_step": 21841, "epoch": 183, "lr": 7.92600615525875e-05} +{"train_loss": 0.004436028189957142, "global_step": 21842, "epoch": 183, "lr": 7.925826499345863e-05} +{"train_loss": 0.0037868323270231485, "global_step": 21843, "epoch": 183, "lr": 7.92564683768843e-05} +{"train_loss": 0.0043851155787706375, "global_step": 21844, "epoch": 183, "lr": 7.925467170286799e-05} +{"train_loss": 0.006453053560107946, "global_step": 21845, "epoch": 183, "lr": 7.925287497141327e-05} +{"train_loss": 0.002902474720031023, "global_step": 21846, "epoch": 183, "lr": 7.925107818252366e-05} +{"train_loss": 0.003569805296137929, "global_step": 21847, "epoch": 183, "lr": 7.924928133620268e-05} +{"train_loss": 0.005507981404662132, "global_step": 21848, "epoch": 183, "lr": 7.924748443245386e-05} +{"train_loss": 0.005186344031244516, "global_step": 21849, "epoch": 183, "lr": 7.924568747128077e-05} +{"train_loss": 0.0030986785423010588, "global_step": 21850, "epoch": 183, "lr": 7.924389045268685e-05} +{"train_loss": 0.0037818264681845903, "global_step": 21851, "epoch": 183, "lr": 7.924209337667568e-05} +{"train_loss": 0.005178704857826233, "global_step": 21852, "epoch": 183, "lr": 7.924029624325078e-05} +{"train_loss": 0.0036953974049538374, "global_step": 21853, "epoch": 183, "lr": 7.923849905241569e-05} +{"train_loss": 0.007040244992822409, "global_step": 21854, "epoch": 183, "lr": 7.923670180417392e-05} +{"train_loss": 0.005739256273955107, "global_step": 21855, "epoch": 183, "lr": 7.923490449852903e-05} +{"train_loss": 0.004855255130678415, "global_step": 21856, "epoch": 183, "lr": 7.923310713548453e-05} +{"train_loss": 0.0027207599487155676, "global_step": 21857, "epoch": 183, "lr": 7.923130971504394e-05} +{"train_loss": 0.003387806937098503, "global_step": 21858, "epoch": 183, "lr": 7.922951223721079e-05} +{"train_loss": 0.0035511229652911425, "global_step": 21859, "epoch": 183, "lr": 7.922771470198862e-05} +{"train_loss": 0.003546615596860647, "global_step": 21860, "epoch": 183, "lr": 7.922591710938095e-05} +{"train_loss": 0.003849474713206291, "global_step": 21861, "epoch": 183, "lr": 7.922411945939133e-05} +{"train_loss": 0.003923626150935888, "global_step": 21862, "epoch": 183, "lr": 7.922232175202325e-05} +{"train_loss": 0.004537608474493027, "global_step": 21863, "epoch": 183, "lr": 7.922052398728029e-05} +{"train_loss": 0.005917235277593136, "global_step": 21864, "epoch": 183, "lr": 7.921872616516592e-05} +{"train_loss": 0.004097254015505314, "global_step": 21865, "epoch": 183, "lr": 7.921692828568372e-05} +{"train_loss": 0.005538809113204479, "global_step": 21866, "epoch": 183, "lr": 7.921513034883721e-05} +{"train_loss": 0.004960270132869482, "global_step": 21867, "epoch": 183, "lr": 7.92133323546299e-05} +{"train_loss": 0.0057342504151165485, "global_step": 21868, "epoch": 183, "lr": 7.921153430306534e-05} +{"train_loss": 0.004262974020093679, "global_step": 21869, "epoch": 183, "lr": 7.920973619414706e-05} +{"train_loss": 0.002017109887674451, "global_step": 21870, "epoch": 183, "lr": 7.920793802787856e-05} +{"train_loss": 0.005215035285800695, "global_step": 21871, "epoch": 183, "lr": 7.920613980426341e-05} +{"train_loss": 0.004403103142976761, "global_step": 21872, "epoch": 183, "lr": 7.920434152330513e-05} +{"train_loss": 0.0029938980005681515, "global_step": 21873, "epoch": 183, "lr": 7.920254318500723e-05} +{"train_loss": 0.002259476576000452, "global_step": 21874, "epoch": 183, "lr": 7.920074478937327e-05} +{"train_loss": 0.004150237422436476, "global_step": 21875, "epoch": 183, "lr": 7.919894633640676e-05} +{"train_loss": 0.006657003425061703, "global_step": 21876, "epoch": 183, "lr": 7.919714782611125e-05} +{"train_loss": 0.0022044831421226263, "global_step": 21877, "epoch": 183, "lr": 7.919534925849024e-05} +{"train_loss": 0.005397779867053032, "global_step": 21878, "epoch": 183, "lr": 7.91935506335473e-05} +{"train_loss": 0.002581668319180608, "global_step": 21879, "epoch": 183, "lr": 7.919175195128593e-05} +{"train_loss": 0.003567693755030632, "global_step": 21880, "epoch": 183, "lr": 7.918995321170968e-05} +{"train_loss": 0.004019463434815407, "global_step": 21881, "epoch": 183, "lr": 7.918815441482208e-05} +{"train_loss": 0.0046881381422281265, "global_step": 21882, "epoch": 183, "lr": 7.918635556062665e-05} +{"train_loss": 0.003241633763536811, "global_step": 21883, "epoch": 183, "lr": 7.918455664912693e-05} +{"train_loss": 0.004881420638412237, "global_step": 21884, "epoch": 183, "lr": 7.918275768032644e-05} +{"train_loss": 0.0042556775733828545, "global_step": 21885, "epoch": 183, "lr": 7.918095865422874e-05} +{"train_loss": 0.0034876838326454163, "global_step": 21886, "epoch": 183, "lr": 7.917915957083732e-05} +{"train_loss": 0.006534409709274769, "global_step": 21887, "epoch": 183, "lr": 7.917736043015578e-05} +{"train_loss": 0.0035458747297525406, "global_step": 21888, "epoch": 183, "lr": 7.917556123218758e-05} +{"train_loss": 0.004587240517139435, "global_step": 21889, "epoch": 183, "lr": 7.91737619769363e-05} +{"train_loss": 0.005728681106120348, "global_step": 21890, "epoch": 183, "lr": 7.917196266440543e-05} +{"train_loss": 0.0032632392831146717, "global_step": 21891, "epoch": 183, "lr": 7.917016329459855e-05} +{"train_loss": 0.003206272143870592, "global_step": 21892, "epoch": 183, "lr": 7.916836386751915e-05} +{"train_loss": 0.004166417755186558, "global_step": 21893, "epoch": 183, "lr": 7.916656438317081e-05} +{"train_loss": 0.004474678076803684, "global_step": 21894, "epoch": 183, "lr": 7.916476484155702e-05} +{"train_loss": 0.004506778605908406, "global_step": 21895, "epoch": 183, "lr": 7.916296524268131e-05, "val_loss": 0.014187414199113846} +{"train_loss": 0.004785503726452589, "global_step": 21896, "epoch": 184, "lr": 7.916116558654726e-05} +{"train_loss": 0.003495934419333935, "global_step": 21897, "epoch": 184, "lr": 7.915936587315838e-05} +{"train_loss": 0.00340548949316144, "global_step": 21898, "epoch": 184, "lr": 7.915756610251819e-05} +{"train_loss": 0.005133803468197584, "global_step": 21899, "epoch": 184, "lr": 7.915576627463024e-05} +{"train_loss": 0.0036231924314051867, "global_step": 21900, "epoch": 184, "lr": 7.915396638949805e-05} +{"train_loss": 0.004598556086421013, "global_step": 21901, "epoch": 184, "lr": 7.915216644712517e-05} +{"train_loss": 0.0030198919121176004, "global_step": 21902, "epoch": 184, "lr": 7.915036644751513e-05} +{"train_loss": 0.00873639713972807, "global_step": 21903, "epoch": 184, "lr": 7.914856639067145e-05} +{"train_loss": 0.0028162049129605293, "global_step": 21904, "epoch": 184, "lr": 7.914676627659767e-05} +{"train_loss": 0.003978615626692772, "global_step": 21905, "epoch": 184, "lr": 7.914496610529734e-05} +{"train_loss": 0.0035981745459139347, "global_step": 21906, "epoch": 184, "lr": 7.914316587677397e-05} +{"train_loss": 0.005768527276813984, "global_step": 21907, "epoch": 184, "lr": 7.914136559103112e-05} +{"train_loss": 0.003937921952456236, "global_step": 21908, "epoch": 184, "lr": 7.91395652480723e-05} +{"train_loss": 0.005221105646342039, "global_step": 21909, "epoch": 184, "lr": 7.913776484790105e-05} +{"train_loss": 0.0041722264140844345, "global_step": 21910, "epoch": 184, "lr": 7.913596439052094e-05} +{"train_loss": 0.0067325071431696415, "global_step": 21911, "epoch": 184, "lr": 7.913416387593544e-05} +{"train_loss": 0.005143306218087673, "global_step": 21912, "epoch": 184, "lr": 7.913236330414816e-05} +{"train_loss": 0.005325102712959051, "global_step": 21913, "epoch": 184, "lr": 7.913056267516258e-05} +{"train_loss": 0.0042489576153457165, "global_step": 21914, "epoch": 184, "lr": 7.912876198898225e-05} +{"train_loss": 0.006042175460606813, "global_step": 21915, "epoch": 184, "lr": 7.912696124561071e-05} +{"train_loss": 0.006804355885833502, "global_step": 21916, "epoch": 184, "lr": 7.912516044505149e-05} +{"train_loss": 0.0050207884050905704, "global_step": 21917, "epoch": 184, "lr": 7.912335958730813e-05} +{"train_loss": 0.004309384617954493, "global_step": 21918, "epoch": 184, "lr": 7.912155867238418e-05} +{"train_loss": 0.005324794910848141, "global_step": 21919, "epoch": 184, "lr": 7.911975770028313e-05} +{"train_loss": 0.004308296367526054, "global_step": 21920, "epoch": 184, "lr": 7.911795667100856e-05} +{"train_loss": 0.005906360689550638, "global_step": 21921, "epoch": 184, "lr": 7.9116155584564e-05} +{"train_loss": 0.002269741613417864, "global_step": 21922, "epoch": 184, "lr": 7.911435444095299e-05} +{"train_loss": 0.005769788753241301, "global_step": 21923, "epoch": 184, "lr": 7.911255324017904e-05} +{"train_loss": 0.0040749553591012955, "global_step": 21924, "epoch": 184, "lr": 7.91107519822457e-05} +{"train_loss": 0.005948052741587162, "global_step": 21925, "epoch": 184, "lr": 7.910895066715652e-05} +{"train_loss": 0.0032835830934345722, "global_step": 21926, "epoch": 184, "lr": 7.9107149294915e-05} +{"train_loss": 0.0074314638040959835, "global_step": 21927, "epoch": 184, "lr": 7.910534786552473e-05} +{"train_loss": 0.0033289280254393816, "global_step": 21928, "epoch": 184, "lr": 7.91035463789892e-05} +{"train_loss": 0.006226490251719952, "global_step": 21929, "epoch": 184, "lr": 7.910174483531199e-05} +{"train_loss": 0.002710179891437292, "global_step": 21930, "epoch": 184, "lr": 7.909994323449658e-05} +{"train_loss": 0.0056212907657027245, "global_step": 21931, "epoch": 184, "lr": 7.909814157654657e-05} +{"train_loss": 0.005368911195546389, "global_step": 21932, "epoch": 184, "lr": 7.909633986146546e-05} +{"train_loss": 0.006506363861262798, "global_step": 21933, "epoch": 184, "lr": 7.909453808925678e-05} +{"train_loss": 0.004758778493851423, "global_step": 21934, "epoch": 184, "lr": 7.909273625992409e-05} +{"train_loss": 0.005680363159626722, "global_step": 21935, "epoch": 184, "lr": 7.909093437347093e-05} +{"train_loss": 0.0062662893906235695, "global_step": 21936, "epoch": 184, "lr": 7.908913242990081e-05} +{"train_loss": 0.004812969826161861, "global_step": 21937, "epoch": 184, "lr": 7.908733042921731e-05} +{"train_loss": 0.0029747439548373222, "global_step": 21938, "epoch": 184, "lr": 7.908552837142393e-05} +{"train_loss": 0.004770869854837656, "global_step": 21939, "epoch": 184, "lr": 7.908372625652423e-05} +{"train_loss": 0.0032377729658037424, "global_step": 21940, "epoch": 184, "lr": 7.908192408452174e-05} +{"train_loss": 0.006014214362949133, "global_step": 21941, "epoch": 184, "lr": 7.908012185541998e-05} +{"train_loss": 0.0040416656993329525, "global_step": 21942, "epoch": 184, "lr": 7.907831956922253e-05} +{"train_loss": 0.0044629271142184734, "global_step": 21943, "epoch": 184, "lr": 7.90765172259329e-05} +{"train_loss": 0.003469740506261587, "global_step": 21944, "epoch": 184, "lr": 7.907471482555463e-05} +{"train_loss": 0.006057522725313902, "global_step": 21945, "epoch": 184, "lr": 7.907291236809127e-05} +{"train_loss": 0.004112160298973322, "global_step": 21946, "epoch": 184, "lr": 7.907110985354635e-05} +{"train_loss": 0.0028194249607622623, "global_step": 21947, "epoch": 184, "lr": 7.906930728192341e-05} +{"train_loss": 0.006051533855497837, "global_step": 21948, "epoch": 184, "lr": 7.9067504653226e-05} +{"train_loss": 0.004882009234279394, "global_step": 21949, "epoch": 184, "lr": 7.906570196745763e-05} +{"train_loss": 0.004246178548783064, "global_step": 21950, "epoch": 184, "lr": 7.906389922462187e-05} +{"train_loss": 0.002852745819836855, "global_step": 21951, "epoch": 184, "lr": 7.906209642472225e-05} +{"train_loss": 0.003968462813645601, "global_step": 21952, "epoch": 184, "lr": 7.90602935677623e-05} +{"train_loss": 0.0026438359636813402, "global_step": 21953, "epoch": 184, "lr": 7.905849065374558e-05} +{"train_loss": 0.006722604390233755, "global_step": 21954, "epoch": 184, "lr": 7.905668768267561e-05} +{"train_loss": 0.006509874481707811, "global_step": 21955, "epoch": 184, "lr": 7.905488465455596e-05} +{"train_loss": 0.0037260171957314014, "global_step": 21956, "epoch": 184, "lr": 7.905308156939013e-05} +{"train_loss": 0.003210510592907667, "global_step": 21957, "epoch": 184, "lr": 7.905127842718167e-05} +{"train_loss": 0.004484509117901325, "global_step": 21958, "epoch": 184, "lr": 7.904947522793413e-05} +{"train_loss": 0.0034723624121397734, "global_step": 21959, "epoch": 184, "lr": 7.904767197165106e-05} +{"train_loss": 0.0035501651000231504, "global_step": 21960, "epoch": 184, "lr": 7.904586865833599e-05} +{"train_loss": 0.0041635665111243725, "global_step": 21961, "epoch": 184, "lr": 7.904406528799244e-05} +{"train_loss": 0.0043725864961743355, "global_step": 21962, "epoch": 184, "lr": 7.9042261860624e-05} +{"train_loss": 0.0051539004780352116, "global_step": 21963, "epoch": 184, "lr": 7.904045837623417e-05} +{"train_loss": 0.0063692377880215645, "global_step": 21964, "epoch": 184, "lr": 7.90386548348265e-05} +{"train_loss": 0.0031236191280186176, "global_step": 21965, "epoch": 184, "lr": 7.903685123640453e-05} +{"train_loss": 0.003905202727764845, "global_step": 21966, "epoch": 184, "lr": 7.90350475809718e-05} +{"train_loss": 0.005830890499055386, "global_step": 21967, "epoch": 184, "lr": 7.903324386853187e-05} +{"train_loss": 0.0047087459824979305, "global_step": 21968, "epoch": 184, "lr": 7.903144009908827e-05} +{"train_loss": 0.007147334981709719, "global_step": 21969, "epoch": 184, "lr": 7.902963627264452e-05} +{"train_loss": 0.004234354943037033, "global_step": 21970, "epoch": 184, "lr": 7.90278323892042e-05} +{"train_loss": 0.0035541623365134, "global_step": 21971, "epoch": 184, "lr": 7.902602844877082e-05} +{"train_loss": 0.004181336145848036, "global_step": 21972, "epoch": 184, "lr": 7.902422445134794e-05} +{"train_loss": 0.002286142436787486, "global_step": 21973, "epoch": 184, "lr": 7.902242039693908e-05} +{"train_loss": 0.004225187469273806, "global_step": 21974, "epoch": 184, "lr": 7.902061628554782e-05} +{"train_loss": 0.002938361605629325, "global_step": 21975, "epoch": 184, "lr": 7.901881211717767e-05} +{"train_loss": 0.005433508660644293, "global_step": 21976, "epoch": 184, "lr": 7.901700789183219e-05} +{"train_loss": 0.00508127361536026, "global_step": 21977, "epoch": 184, "lr": 7.901520360951491e-05} +{"train_loss": 0.003912320826202631, "global_step": 21978, "epoch": 184, "lr": 7.901339927022937e-05} +{"train_loss": 0.004633232951164246, "global_step": 21979, "epoch": 184, "lr": 7.901159487397913e-05} +{"train_loss": 0.005464473739266396, "global_step": 21980, "epoch": 184, "lr": 7.900979042076771e-05} +{"train_loss": 0.0034139773342758417, "global_step": 21981, "epoch": 184, "lr": 7.90079859105987e-05} +{"train_loss": 0.003943189512938261, "global_step": 21982, "epoch": 184, "lr": 7.900618134347558e-05} +{"train_loss": 0.008515851572155952, "global_step": 21983, "epoch": 184, "lr": 7.900437671940192e-05} +{"train_loss": 0.003997243009507656, "global_step": 21984, "epoch": 184, "lr": 7.900257203838126e-05} +{"train_loss": 0.004412409849464893, "global_step": 21985, "epoch": 184, "lr": 7.900076730041717e-05} +{"train_loss": 0.004007503390312195, "global_step": 21986, "epoch": 184, "lr": 7.899896250551315e-05} +{"train_loss": 0.004278155975043774, "global_step": 21987, "epoch": 184, "lr": 7.89971576536728e-05} +{"train_loss": 0.004549016244709492, "global_step": 21988, "epoch": 184, "lr": 7.89953527448996e-05} +{"train_loss": 0.0031567751429975033, "global_step": 21989, "epoch": 184, "lr": 7.899354777919712e-05} +{"train_loss": 0.0027012815698981285, "global_step": 21990, "epoch": 184, "lr": 7.899174275656891e-05} +{"train_loss": 0.005433674436062574, "global_step": 21991, "epoch": 184, "lr": 7.898993767701852e-05} +{"train_loss": 0.0070460145361721516, "global_step": 21992, "epoch": 184, "lr": 7.898813254054948e-05} +{"train_loss": 0.0039445990696549416, "global_step": 21993, "epoch": 184, "lr": 7.898632734716533e-05} +{"train_loss": 0.005724302958697081, "global_step": 21994, "epoch": 184, "lr": 7.898452209686964e-05} +{"train_loss": 0.006851254962384701, "global_step": 21995, "epoch": 184, "lr": 7.898271678966594e-05} +{"train_loss": 0.003401372581720352, "global_step": 21996, "epoch": 184, "lr": 7.898091142555774e-05} +{"train_loss": 0.004372413735836744, "global_step": 21997, "epoch": 184, "lr": 7.897910600454864e-05} +{"train_loss": 0.0036888804752379656, "global_step": 21998, "epoch": 184, "lr": 7.897730052664216e-05} +{"train_loss": 0.004970435984432697, "global_step": 21999, "epoch": 184, "lr": 7.897549499184185e-05} +{"train_loss": 0.00468283798545599, "global_step": 22000, "epoch": 184, "lr": 7.897368940015124e-05} +{"train_loss": 0.006024654489010572, "global_step": 22001, "epoch": 184, "lr": 7.897188375157389e-05} +{"train_loss": 0.0030127495992928743, "global_step": 22002, "epoch": 184, "lr": 7.897007804611335e-05} +{"train_loss": 0.0058336155489087105, "global_step": 22003, "epoch": 184, "lr": 7.896827228377314e-05} +{"train_loss": 0.0033967981580644846, "global_step": 22004, "epoch": 184, "lr": 7.896646646455683e-05} +{"train_loss": 0.0042905183508992195, "global_step": 22005, "epoch": 184, "lr": 7.896466058846796e-05} +{"train_loss": 0.0063051930628716946, "global_step": 22006, "epoch": 184, "lr": 7.89628546555101e-05} +{"train_loss": 0.005306849256157875, "global_step": 22007, "epoch": 184, "lr": 7.896104866568672e-05} +{"train_loss": 0.006133401300758123, "global_step": 22008, "epoch": 184, "lr": 7.895924261900146e-05} +{"train_loss": 0.0029921894893050194, "global_step": 22009, "epoch": 184, "lr": 7.895743651545778e-05} +{"train_loss": 0.004786905832588673, "global_step": 22010, "epoch": 184, "lr": 7.895563035505928e-05} +{"train_loss": 0.004231993108987808, "global_step": 22011, "epoch": 184, "lr": 7.89538241378095e-05} +{"train_loss": 0.006124267820268869, "global_step": 22012, "epoch": 184, "lr": 7.895201786371199e-05} +{"train_loss": 0.003988110926002264, "global_step": 22013, "epoch": 184, "lr": 7.895021153277027e-05} +{"train_loss": 0.004679298439227483, "global_step": 22014, "epoch": 184, "lr": 7.894840514498792e-05, "val_loss": 0.015256635844707489} +{"train_loss": 0.006103473715484142, "global_step": 22015, "epoch": 185, "lr": 7.894659870036844e-05} +{"train_loss": 0.004270242992788553, "global_step": 22016, "epoch": 185, "lr": 7.894479219891542e-05} +{"train_loss": 0.0069400230422616005, "global_step": 22017, "epoch": 185, "lr": 7.89429856406324e-05} +{"train_loss": 0.0065910061821341515, "global_step": 22018, "epoch": 185, "lr": 7.894117902552291e-05} +{"train_loss": 0.0041351295076310635, "global_step": 22019, "epoch": 185, "lr": 7.893937235359052e-05} +{"train_loss": 0.004417176358401775, "global_step": 22020, "epoch": 185, "lr": 7.893756562483875e-05} +{"train_loss": 0.00344920065253973, "global_step": 22021, "epoch": 185, "lr": 7.893575883927117e-05} +{"train_loss": 0.006820103153586388, "global_step": 22022, "epoch": 185, "lr": 7.893395199689131e-05} +{"train_loss": 0.0034109551925212145, "global_step": 22023, "epoch": 185, "lr": 7.893214509770273e-05} +{"train_loss": 0.004729652777314186, "global_step": 22024, "epoch": 185, "lr": 7.893033814170899e-05} +{"train_loss": 0.007825942710042, "global_step": 22025, "epoch": 185, "lr": 7.892853112891361e-05} +{"train_loss": 0.003495355136692524, "global_step": 22026, "epoch": 185, "lr": 7.892672405932013e-05} +{"train_loss": 0.007081635762006044, "global_step": 22027, "epoch": 185, "lr": 7.892491693293213e-05} +{"train_loss": 0.004453124478459358, "global_step": 22028, "epoch": 185, "lr": 7.892310974975317e-05} +{"train_loss": 0.005333613138645887, "global_step": 22029, "epoch": 185, "lr": 7.892130250978675e-05} +{"train_loss": 0.004261163529008627, "global_step": 22030, "epoch": 185, "lr": 7.891949521303644e-05} +{"train_loss": 0.004840104840695858, "global_step": 22031, "epoch": 185, "lr": 7.891768785950581e-05} +{"train_loss": 0.007476304192095995, "global_step": 22032, "epoch": 185, "lr": 7.891588044919837e-05} +{"train_loss": 0.003644796321168542, "global_step": 22033, "epoch": 185, "lr": 7.89140729821177e-05} +{"train_loss": 0.0034558065235614777, "global_step": 22034, "epoch": 185, "lr": 7.891226545826733e-05} +{"train_loss": 0.006383330095559359, "global_step": 22035, "epoch": 185, "lr": 7.891045787765081e-05} +{"train_loss": 0.0030416795052587986, "global_step": 22036, "epoch": 185, "lr": 7.89086502402717e-05} +{"train_loss": 0.004474469926208258, "global_step": 22037, "epoch": 185, "lr": 7.890684254613356e-05} +{"train_loss": 0.007462134584784508, "global_step": 22038, "epoch": 185, "lr": 7.890503479523991e-05} +{"train_loss": 0.0039930096827447414, "global_step": 22039, "epoch": 185, "lr": 7.890322698759432e-05} +{"train_loss": 0.004852575249969959, "global_step": 22040, "epoch": 185, "lr": 7.890141912320031e-05} +{"train_loss": 0.007111661601811647, "global_step": 22041, "epoch": 185, "lr": 7.889961120206146e-05} +{"train_loss": 0.003837469033896923, "global_step": 22042, "epoch": 185, "lr": 7.889780322418131e-05} +{"train_loss": 0.005435220431536436, "global_step": 22043, "epoch": 185, "lr": 7.889599518956343e-05} +{"train_loss": 0.005241339094936848, "global_step": 22044, "epoch": 185, "lr": 7.889418709821132e-05} +{"train_loss": 0.004080669023096561, "global_step": 22045, "epoch": 185, "lr": 7.889237895012859e-05} +{"train_loss": 0.006336727179586887, "global_step": 22046, "epoch": 185, "lr": 7.889057074531874e-05} +{"train_loss": 0.004738545045256615, "global_step": 22047, "epoch": 185, "lr": 7.888876248378535e-05} +{"train_loss": 0.005448868498206139, "global_step": 22048, "epoch": 185, "lr": 7.888695416553196e-05} +{"train_loss": 0.006347237154841423, "global_step": 22049, "epoch": 185, "lr": 7.888514579056212e-05} +{"train_loss": 0.00494332006201148, "global_step": 22050, "epoch": 185, "lr": 7.888333735887938e-05} +{"train_loss": 0.004707674961537123, "global_step": 22051, "epoch": 185, "lr": 7.88815288704873e-05} +{"train_loss": 0.0035841204226017, "global_step": 22052, "epoch": 185, "lr": 7.887972032538941e-05} +{"train_loss": 0.007944922894239426, "global_step": 22053, "epoch": 185, "lr": 7.88779117235893e-05} +{"train_loss": 0.002748810686171055, "global_step": 22054, "epoch": 185, "lr": 7.887610306509047e-05} +{"train_loss": 0.004023538436740637, "global_step": 22055, "epoch": 185, "lr": 7.88742943498965e-05} +{"train_loss": 0.004101157654076815, "global_step": 22056, "epoch": 185, "lr": 7.887248557801095e-05} +{"train_loss": 0.0034314501099288464, "global_step": 22057, "epoch": 185, "lr": 7.887067674943735e-05} +{"train_loss": 0.0036239721812307835, "global_step": 22058, "epoch": 185, "lr": 7.886886786417926e-05} +{"train_loss": 0.005612628068774939, "global_step": 22059, "epoch": 185, "lr": 7.886705892224024e-05} +{"train_loss": 0.006784075405448675, "global_step": 22060, "epoch": 185, "lr": 7.886524992362383e-05} +{"train_loss": 0.0032239696010947227, "global_step": 22061, "epoch": 185, "lr": 7.886344086833359e-05} +{"train_loss": 0.005496323574334383, "global_step": 22062, "epoch": 185, "lr": 7.886163175637306e-05} +{"train_loss": 0.0053852628916502, "global_step": 22063, "epoch": 185, "lr": 7.88598225877458e-05} +{"train_loss": 0.004818703513592482, "global_step": 22064, "epoch": 185, "lr": 7.885801336245537e-05} +{"train_loss": 0.0038812225684523582, "global_step": 22065, "epoch": 185, "lr": 7.885620408050531e-05} +{"train_loss": 0.005754454527050257, "global_step": 22066, "epoch": 185, "lr": 7.885439474189916e-05} +{"train_loss": 0.004407581407576799, "global_step": 22067, "epoch": 185, "lr": 7.885258534664051e-05} +{"train_loss": 0.00483450572937727, "global_step": 22068, "epoch": 185, "lr": 7.885077589473288e-05} +{"train_loss": 0.005713936407119036, "global_step": 22069, "epoch": 185, "lr": 7.884896638617985e-05} +{"train_loss": 0.005263762082904577, "global_step": 22070, "epoch": 185, "lr": 7.884715682098494e-05} +{"train_loss": 0.004347453825175762, "global_step": 22071, "epoch": 185, "lr": 7.884534719915171e-05} +{"train_loss": 0.0034320096019655466, "global_step": 22072, "epoch": 185, "lr": 7.884353752068374e-05} +{"train_loss": 0.0032640001736581326, "global_step": 22073, "epoch": 185, "lr": 7.884172778558456e-05} +{"train_loss": 0.005442844238132238, "global_step": 22074, "epoch": 185, "lr": 7.883991799385772e-05} +{"train_loss": 0.004323022440075874, "global_step": 22075, "epoch": 185, "lr": 7.883810814550681e-05} +{"train_loss": 0.0033389630261808634, "global_step": 22076, "epoch": 185, "lr": 7.883629824053534e-05} +{"train_loss": 0.0033507170155644417, "global_step": 22077, "epoch": 185, "lr": 7.883448827894685e-05} +{"train_loss": 0.005166483577340841, "global_step": 22078, "epoch": 185, "lr": 7.883267826074497e-05} +{"train_loss": 0.004517910536378622, "global_step": 22079, "epoch": 185, "lr": 7.883086818593317e-05} +{"train_loss": 0.0044217295944690704, "global_step": 22080, "epoch": 185, "lr": 7.882905805451505e-05} +{"train_loss": 0.005967236589640379, "global_step": 22081, "epoch": 185, "lr": 7.882724786649418e-05} +{"train_loss": 0.0035481334198266268, "global_step": 22082, "epoch": 185, "lr": 7.882543762187406e-05} +{"train_loss": 0.005089835729449987, "global_step": 22083, "epoch": 185, "lr": 7.882362732065828e-05} +{"train_loss": 0.00446438929066062, "global_step": 22084, "epoch": 185, "lr": 7.882181696285041e-05} +{"train_loss": 0.004988287575542927, "global_step": 22085, "epoch": 185, "lr": 7.882000654845394e-05} +{"train_loss": 0.00384135777130723, "global_step": 22086, "epoch": 185, "lr": 7.88181960774725e-05} +{"train_loss": 0.00293728313408792, "global_step": 22087, "epoch": 185, "lr": 7.88163855499096e-05} +{"train_loss": 0.005002274643629789, "global_step": 22088, "epoch": 185, "lr": 7.881457496576881e-05} +{"train_loss": 0.002123534679412842, "global_step": 22089, "epoch": 185, "lr": 7.881276432505366e-05} +{"train_loss": 0.004525589291006327, "global_step": 22090, "epoch": 185, "lr": 7.881095362776773e-05} +{"train_loss": 0.0016465592198073864, "global_step": 22091, "epoch": 185, "lr": 7.880914287391459e-05} +{"train_loss": 0.003911558538675308, "global_step": 22092, "epoch": 185, "lr": 7.880733206349776e-05} +{"train_loss": 0.004224611911922693, "global_step": 22093, "epoch": 185, "lr": 7.880552119652083e-05} +{"train_loss": 0.003984247334301472, "global_step": 22094, "epoch": 185, "lr": 7.880371027298731e-05} +{"train_loss": 0.005059330724179745, "global_step": 22095, "epoch": 185, "lr": 7.88018992929008e-05} +{"train_loss": 0.005635723937302828, "global_step": 22096, "epoch": 185, "lr": 7.880008825626484e-05} +{"train_loss": 0.003874541725963354, "global_step": 22097, "epoch": 185, "lr": 7.879827716308297e-05} +{"train_loss": 0.0033250332344323397, "global_step": 22098, "epoch": 185, "lr": 7.879646601335876e-05} +{"train_loss": 0.004787979647517204, "global_step": 22099, "epoch": 185, "lr": 7.879465480709577e-05} +{"train_loss": 0.004498726222664118, "global_step": 22100, "epoch": 185, "lr": 7.879284354429755e-05} +{"train_loss": 0.0028362039010971785, "global_step": 22101, "epoch": 185, "lr": 7.879103222496766e-05} +{"train_loss": 0.0031271488405764103, "global_step": 22102, "epoch": 185, "lr": 7.878922084910966e-05} +{"train_loss": 0.0032553267665207386, "global_step": 22103, "epoch": 185, "lr": 7.878740941672709e-05} +{"train_loss": 0.005432053469121456, "global_step": 22104, "epoch": 185, "lr": 7.878559792782352e-05} +{"train_loss": 0.003812559647485614, "global_step": 22105, "epoch": 185, "lr": 7.878378638240251e-05} +{"train_loss": 0.004648835863918066, "global_step": 22106, "epoch": 185, "lr": 7.878197478046761e-05} +{"train_loss": 0.0033555645495653152, "global_step": 22107, "epoch": 185, "lr": 7.878016312202236e-05} +{"train_loss": 0.003624646458774805, "global_step": 22108, "epoch": 185, "lr": 7.877835140707036e-05} +{"train_loss": 0.004105789586901665, "global_step": 22109, "epoch": 185, "lr": 7.877653963561513e-05} +{"train_loss": 0.004625509958714247, "global_step": 22110, "epoch": 185, "lr": 7.877472780766024e-05} +{"train_loss": 0.0046757059171795845, "global_step": 22111, "epoch": 185, "lr": 7.877291592320924e-05} +{"train_loss": 0.00421041389927268, "global_step": 22112, "epoch": 185, "lr": 7.87711039822657e-05} +{"train_loss": 0.004548986442387104, "global_step": 22113, "epoch": 185, "lr": 7.876929198483318e-05} +{"train_loss": 0.00455690361559391, "global_step": 22114, "epoch": 185, "lr": 7.876747993091521e-05} +{"train_loss": 0.005095405504107475, "global_step": 22115, "epoch": 185, "lr": 7.876566782051538e-05} +{"train_loss": 0.003990295808762312, "global_step": 22116, "epoch": 185, "lr": 7.876385565363722e-05} +{"train_loss": 0.00489009078592062, "global_step": 22117, "epoch": 185, "lr": 7.87620434302843e-05} +{"train_loss": 0.005482963286340237, "global_step": 22118, "epoch": 185, "lr": 7.876023115046021e-05} +{"train_loss": 0.0048499503172934055, "global_step": 22119, "epoch": 185, "lr": 7.875841881416845e-05} +{"train_loss": 0.0036149139050394297, "global_step": 22120, "epoch": 185, "lr": 7.875660642141263e-05} +{"train_loss": 0.004958042409271002, "global_step": 22121, "epoch": 185, "lr": 7.875479397219627e-05} +{"train_loss": 0.006292718928307295, "global_step": 22122, "epoch": 185, "lr": 7.875298146652294e-05} +{"train_loss": 0.0021315044723451138, "global_step": 22123, "epoch": 185, "lr": 7.875116890439623e-05} +{"train_loss": 0.0039551290683448315, "global_step": 22124, "epoch": 185, "lr": 7.874935628581963e-05} +{"train_loss": 0.006570335943251848, "global_step": 22125, "epoch": 185, "lr": 7.874754361079677e-05} +{"train_loss": 0.0032949461601674557, "global_step": 22126, "epoch": 185, "lr": 7.874573087933117e-05} +{"train_loss": 0.0053847371600568295, "global_step": 22127, "epoch": 185, "lr": 7.874391809142641e-05} +{"train_loss": 0.008520929142832756, "global_step": 22128, "epoch": 185, "lr": 7.8742105247086e-05} +{"train_loss": 0.004842172376811504, "global_step": 22129, "epoch": 185, "lr": 7.874029234631357e-05} +{"train_loss": 0.002905128290876746, "global_step": 22130, "epoch": 185, "lr": 7.873847938911265e-05} +{"train_loss": 0.0033047019969671965, "global_step": 22131, "epoch": 185, "lr": 7.873666637548677e-05} +{"train_loss": 0.006555980071425438, "global_step": 22132, "epoch": 185, "lr": 7.873485330543955e-05} +{"train_loss": 0.0046867715085254, "global_step": 22133, "epoch": 185, "lr": 7.87330401789745e-05, "val_loss": 0.013004012405872345, "train_action_mse_error": 0.00011173846723977476} +{"train_loss": 0.005274343769997358, "global_step": 22134, "epoch": 186, "lr": 7.873122699609518e-05} +{"train_loss": 0.004647252149879932, "global_step": 22135, "epoch": 186, "lr": 7.872941375680518e-05} +{"train_loss": 0.005912656895816326, "global_step": 22136, "epoch": 186, "lr": 7.872760046110805e-05} +{"train_loss": 0.005539899691939354, "global_step": 22137, "epoch": 186, "lr": 7.872578710900734e-05} +{"train_loss": 0.0049313269555568695, "global_step": 22138, "epoch": 186, "lr": 7.872397370050661e-05} +{"train_loss": 0.009398473426699638, "global_step": 22139, "epoch": 186, "lr": 7.872216023560943e-05} +{"train_loss": 0.004439763259142637, "global_step": 22140, "epoch": 186, "lr": 7.872034671431936e-05} +{"train_loss": 0.0063683330081403255, "global_step": 22141, "epoch": 186, "lr": 7.871853313663995e-05} +{"train_loss": 0.004420801531523466, "global_step": 22142, "epoch": 186, "lr": 7.871671950257477e-05} +{"train_loss": 0.006133641581982374, "global_step": 22143, "epoch": 186, "lr": 7.871490581212739e-05} +{"train_loss": 0.004892401397228241, "global_step": 22144, "epoch": 186, "lr": 7.871309206530135e-05} +{"train_loss": 0.006166078615933657, "global_step": 22145, "epoch": 186, "lr": 7.871127826210022e-05} +{"train_loss": 0.004735294263809919, "global_step": 22146, "epoch": 186, "lr": 7.870946440252758e-05} +{"train_loss": 0.0026953830383718014, "global_step": 22147, "epoch": 186, "lr": 7.870765048658696e-05} +{"train_loss": 0.0042784735560417175, "global_step": 22148, "epoch": 186, "lr": 7.870583651428194e-05} +{"train_loss": 0.00767291896045208, "global_step": 22149, "epoch": 186, "lr": 7.870402248561607e-05} +{"train_loss": 0.00583243602886796, "global_step": 22150, "epoch": 186, "lr": 7.870220840059293e-05} +{"train_loss": 0.005157608073204756, "global_step": 22151, "epoch": 186, "lr": 7.870039425921604e-05} +{"train_loss": 0.004728458821773529, "global_step": 22152, "epoch": 186, "lr": 7.869858006148902e-05} +{"train_loss": 0.006026716437190771, "global_step": 22153, "epoch": 186, "lr": 7.869676580741541e-05} +{"train_loss": 0.008434567600488663, "global_step": 22154, "epoch": 186, "lr": 7.869495149699875e-05} +{"train_loss": 0.0035990255419164896, "global_step": 22155, "epoch": 186, "lr": 7.869313713024263e-05} +{"train_loss": 0.0027680681087076664, "global_step": 22156, "epoch": 186, "lr": 7.869132270715059e-05} +{"train_loss": 0.007639592979103327, "global_step": 22157, "epoch": 186, "lr": 7.868950822772621e-05} +{"train_loss": 0.0051761651411652565, "global_step": 22158, "epoch": 186, "lr": 7.868769369197303e-05} +{"train_loss": 0.003845613682642579, "global_step": 22159, "epoch": 186, "lr": 7.868587909989464e-05} +{"train_loss": 0.003822592319920659, "global_step": 22160, "epoch": 186, "lr": 7.868406445149459e-05} +{"train_loss": 0.0026621457654982805, "global_step": 22161, "epoch": 186, "lr": 7.868224974677643e-05} +{"train_loss": 0.00691039115190506, "global_step": 22162, "epoch": 186, "lr": 7.868043498574377e-05} +{"train_loss": 0.004668381996452808, "global_step": 22163, "epoch": 186, "lr": 7.867862016840012e-05} +{"train_loss": 0.005535578355193138, "global_step": 22164, "epoch": 186, "lr": 7.867680529474906e-05} +{"train_loss": 0.005891032051295042, "global_step": 22165, "epoch": 186, "lr": 7.867499036479416e-05} +{"train_loss": 0.004374940879642963, "global_step": 22166, "epoch": 186, "lr": 7.867317537853897e-05} +{"train_loss": 0.0065213581547141075, "global_step": 22167, "epoch": 186, "lr": 7.867136033598707e-05} +{"train_loss": 0.004575950559228659, "global_step": 22168, "epoch": 186, "lr": 7.866954523714203e-05} +{"train_loss": 0.0024323598481714725, "global_step": 22169, "epoch": 186, "lr": 7.866773008200741e-05} +{"train_loss": 0.00653865048661828, "global_step": 22170, "epoch": 186, "lr": 7.866591487058674e-05} +{"train_loss": 0.005119791254401207, "global_step": 22171, "epoch": 186, "lr": 7.866409960288362e-05} +{"train_loss": 0.005122601054608822, "global_step": 22172, "epoch": 186, "lr": 7.86622842789016e-05} +{"train_loss": 0.002105278894305229, "global_step": 22173, "epoch": 186, "lr": 7.866046889864423e-05} +{"train_loss": 0.00533717917278409, "global_step": 22174, "epoch": 186, "lr": 7.865865346211511e-05} +{"train_loss": 0.003976155072450638, "global_step": 22175, "epoch": 186, "lr": 7.865683796931778e-05} +{"train_loss": 0.006867267191410065, "global_step": 22176, "epoch": 186, "lr": 7.865502242025582e-05} +{"train_loss": 0.006469587329775095, "global_step": 22177, "epoch": 186, "lr": 7.865320681493278e-05} +{"train_loss": 0.004939892329275608, "global_step": 22178, "epoch": 186, "lr": 7.865139115335222e-05} +{"train_loss": 0.0029739062301814556, "global_step": 22179, "epoch": 186, "lr": 7.864957543551772e-05} +{"train_loss": 0.00593921635299921, "global_step": 22180, "epoch": 186, "lr": 7.864775966143285e-05} +{"train_loss": 0.008319281972944736, "global_step": 22181, "epoch": 186, "lr": 7.864594383110115e-05} +{"train_loss": 0.004572005942463875, "global_step": 22182, "epoch": 186, "lr": 7.86441279445262e-05} +{"train_loss": 0.005726607050746679, "global_step": 22183, "epoch": 186, "lr": 7.864231200171157e-05} +{"train_loss": 0.0033420277759432793, "global_step": 22184, "epoch": 186, "lr": 7.864049600266081e-05} +{"train_loss": 0.005761841777712107, "global_step": 22185, "epoch": 186, "lr": 7.863867994737751e-05} +{"train_loss": 0.004088816232979298, "global_step": 22186, "epoch": 186, "lr": 7.863686383586521e-05} +{"train_loss": 0.0038267909549176693, "global_step": 22187, "epoch": 186, "lr": 7.863504766812751e-05} +{"train_loss": 0.004609163384884596, "global_step": 22188, "epoch": 186, "lr": 7.863323144416794e-05} +{"train_loss": 0.005491952411830425, "global_step": 22189, "epoch": 186, "lr": 7.863141516399007e-05} +{"train_loss": 0.005057999864220619, "global_step": 22190, "epoch": 186, "lr": 7.862959882759749e-05} +{"train_loss": 0.003071305574849248, "global_step": 22191, "epoch": 186, "lr": 7.862778243499374e-05} +{"train_loss": 0.005645164754241705, "global_step": 22192, "epoch": 186, "lr": 7.862596598618239e-05} +{"train_loss": 0.005409047473222017, "global_step": 22193, "epoch": 186, "lr": 7.862414948116703e-05} +{"train_loss": 0.005144866649061441, "global_step": 22194, "epoch": 186, "lr": 7.862233291995122e-05} +{"train_loss": 0.0020638294517993927, "global_step": 22195, "epoch": 186, "lr": 7.86205163025385e-05} +{"train_loss": 0.00279694190248847, "global_step": 22196, "epoch": 186, "lr": 7.861869962893245e-05} +{"train_loss": 0.007117138709872961, "global_step": 22197, "epoch": 186, "lr": 7.861688289913665e-05} +{"train_loss": 0.006008297670632601, "global_step": 22198, "epoch": 186, "lr": 7.861506611315466e-05} +{"train_loss": 0.006165718659758568, "global_step": 22199, "epoch": 186, "lr": 7.861324927099003e-05} +{"train_loss": 0.005126404110342264, "global_step": 22200, "epoch": 186, "lr": 7.861143237264635e-05} +{"train_loss": 0.00691860169172287, "global_step": 22201, "epoch": 186, "lr": 7.860961541812719e-05} +{"train_loss": 0.0052956948056817055, "global_step": 22202, "epoch": 186, "lr": 7.860779840743609e-05} +{"train_loss": 0.00521513307467103, "global_step": 22203, "epoch": 186, "lr": 7.860598134057664e-05} +{"train_loss": 0.004261113237589598, "global_step": 22204, "epoch": 186, "lr": 7.86041642175524e-05} +{"train_loss": 0.006138477008789778, "global_step": 22205, "epoch": 186, "lr": 7.860234703836695e-05} +{"train_loss": 0.003613031469285488, "global_step": 22206, "epoch": 186, "lr": 7.860052980302384e-05} +{"train_loss": 0.00411980040371418, "global_step": 22207, "epoch": 186, "lr": 7.859871251152664e-05} +{"train_loss": 0.0049178143963217735, "global_step": 22208, "epoch": 186, "lr": 7.859689516387894e-05} +{"train_loss": 0.007350195199251175, "global_step": 22209, "epoch": 186, "lr": 7.859507776008426e-05} +{"train_loss": 0.0037170567084103823, "global_step": 22210, "epoch": 186, "lr": 7.859326030014622e-05} +{"train_loss": 0.0035972644109278917, "global_step": 22211, "epoch": 186, "lr": 7.859144278406838e-05} +{"train_loss": 0.005550195463001728, "global_step": 22212, "epoch": 186, "lr": 7.85896252118543e-05} +{"train_loss": 0.00427577830851078, "global_step": 22213, "epoch": 186, "lr": 7.858780758350751e-05} +{"train_loss": 0.006656016688793898, "global_step": 22214, "epoch": 186, "lr": 7.858598989903164e-05} +{"train_loss": 0.005375517066568136, "global_step": 22215, "epoch": 186, "lr": 7.858417215843022e-05} +{"train_loss": 0.0059580677188932896, "global_step": 22216, "epoch": 186, "lr": 7.858235436170685e-05} +{"train_loss": 0.0029816224705427885, "global_step": 22217, "epoch": 186, "lr": 7.858053650886505e-05} +{"train_loss": 0.005179675295948982, "global_step": 22218, "epoch": 186, "lr": 7.857871859990844e-05} +{"train_loss": 0.00508809182792902, "global_step": 22219, "epoch": 186, "lr": 7.857690063484058e-05} +{"train_loss": 0.0049468036741018295, "global_step": 22220, "epoch": 186, "lr": 7.857508261366501e-05} +{"train_loss": 0.0052927713841199875, "global_step": 22221, "epoch": 186, "lr": 7.857326453638533e-05} +{"train_loss": 0.005097389221191406, "global_step": 22222, "epoch": 186, "lr": 7.857144640300509e-05} +{"train_loss": 0.004100756719708443, "global_step": 22223, "epoch": 186, "lr": 7.856962821352787e-05} +{"train_loss": 0.005215518642216921, "global_step": 22224, "epoch": 186, "lr": 7.856780996795723e-05} +{"train_loss": 0.005656376946717501, "global_step": 22225, "epoch": 186, "lr": 7.856599166629677e-05} +{"train_loss": 0.006069994531571865, "global_step": 22226, "epoch": 186, "lr": 7.856417330855002e-05} +{"train_loss": 0.0050820233300328255, "global_step": 22227, "epoch": 186, "lr": 7.856235489472057e-05} +{"train_loss": 0.002495069522410631, "global_step": 22228, "epoch": 186, "lr": 7.856053642481198e-05} +{"train_loss": 0.0034571054857224226, "global_step": 22229, "epoch": 186, "lr": 7.855871789882783e-05} +{"train_loss": 0.004219751339405775, "global_step": 22230, "epoch": 186, "lr": 7.85568993167717e-05} +{"train_loss": 0.00561597989872098, "global_step": 22231, "epoch": 186, "lr": 7.855508067864714e-05} +{"train_loss": 0.003926664125174284, "global_step": 22232, "epoch": 186, "lr": 7.855326198445773e-05} +{"train_loss": 0.0036042670253664255, "global_step": 22233, "epoch": 186, "lr": 7.855144323420704e-05} +{"train_loss": 0.006600880529731512, "global_step": 22234, "epoch": 186, "lr": 7.854962442789865e-05} +{"train_loss": 0.003821337828412652, "global_step": 22235, "epoch": 186, "lr": 7.854780556553612e-05} +{"train_loss": 0.0043142796494066715, "global_step": 22236, "epoch": 186, "lr": 7.8545986647123e-05} +{"train_loss": 0.003082070965319872, "global_step": 22237, "epoch": 186, "lr": 7.854416767266292e-05} +{"train_loss": 0.006091749295592308, "global_step": 22238, "epoch": 186, "lr": 7.854234864215941e-05} +{"train_loss": 0.004093606024980545, "global_step": 22239, "epoch": 186, "lr": 7.854052955561602e-05} +{"train_loss": 0.005026098340749741, "global_step": 22240, "epoch": 186, "lr": 7.853871041303638e-05} +{"train_loss": 0.003947889897972345, "global_step": 22241, "epoch": 186, "lr": 7.853689121442402e-05} +{"train_loss": 0.006542189046740532, "global_step": 22242, "epoch": 186, "lr": 7.853507195978251e-05} +{"train_loss": 0.004791794344782829, "global_step": 22243, "epoch": 186, "lr": 7.853325264911546e-05} +{"train_loss": 0.0032209146302193403, "global_step": 22244, "epoch": 186, "lr": 7.85314332824264e-05} +{"train_loss": 0.007044636644423008, "global_step": 22245, "epoch": 186, "lr": 7.852961385971894e-05} +{"train_loss": 0.003918493632227182, "global_step": 22246, "epoch": 186, "lr": 7.85277943809966e-05} +{"train_loss": 0.004371319897472858, "global_step": 22247, "epoch": 186, "lr": 7.8525974846263e-05} +{"train_loss": 0.005098068621009588, "global_step": 22248, "epoch": 186, "lr": 7.852415525552168e-05} +{"train_loss": 0.005985790863633156, "global_step": 22249, "epoch": 186, "lr": 7.852233560877625e-05} +{"train_loss": 0.006240042392164469, "global_step": 22250, "epoch": 186, "lr": 7.852051590603024e-05} +{"train_loss": 0.0028788214549422264, "global_step": 22251, "epoch": 186, "lr": 7.851869614728726e-05} +{"train_loss": 0.004996543161242324, "global_step": 22252, "epoch": 186, "lr": 7.851687633255087e-05, "val_loss": 0.02434059977531433} +{"train_loss": 0.006052873563021421, "global_step": 22253, "epoch": 187, "lr": 7.851505646182463e-05} +{"train_loss": 0.0036435225047171116, "global_step": 22254, "epoch": 187, "lr": 7.851323653511213e-05} +{"train_loss": 0.0031541166827082634, "global_step": 22255, "epoch": 187, "lr": 7.851141655241693e-05} +{"train_loss": 0.0034827925264835358, "global_step": 22256, "epoch": 187, "lr": 7.85095965137426e-05} +{"train_loss": 0.006310494150966406, "global_step": 22257, "epoch": 187, "lr": 7.850777641909275e-05} +{"train_loss": 0.002804693067446351, "global_step": 22258, "epoch": 187, "lr": 7.85059562684709e-05} +{"train_loss": 0.0048103961162269115, "global_step": 22259, "epoch": 187, "lr": 7.850413606188067e-05} +{"train_loss": 0.003660210408270359, "global_step": 22260, "epoch": 187, "lr": 7.850231579932562e-05} +{"train_loss": 0.004167174454778433, "global_step": 22261, "epoch": 187, "lr": 7.850049548080929e-05} +{"train_loss": 0.004701456055045128, "global_step": 22262, "epoch": 187, "lr": 7.849867510633529e-05} +{"train_loss": 0.003629625542089343, "global_step": 22263, "epoch": 187, "lr": 7.84968546759072e-05} +{"train_loss": 0.0044687362387776375, "global_step": 22264, "epoch": 187, "lr": 7.849503418952857e-05} +{"train_loss": 0.004468646831810474, "global_step": 22265, "epoch": 187, "lr": 7.849321364720299e-05} +{"train_loss": 0.0048300353810191154, "global_step": 22266, "epoch": 187, "lr": 7.849139304893402e-05} +{"train_loss": 0.003900244366377592, "global_step": 22267, "epoch": 187, "lr": 7.848957239472525e-05} +{"train_loss": 0.005285808350890875, "global_step": 22268, "epoch": 187, "lr": 7.848775168458024e-05} +{"train_loss": 0.0033677201718091965, "global_step": 22269, "epoch": 187, "lr": 7.848593091850261e-05} +{"train_loss": 0.005295826122164726, "global_step": 22270, "epoch": 187, "lr": 7.848411009649586e-05} +{"train_loss": 0.004213459324091673, "global_step": 22271, "epoch": 187, "lr": 7.84822892185636e-05} +{"train_loss": 0.0034894519485533237, "global_step": 22272, "epoch": 187, "lr": 7.848046828470942e-05} +{"train_loss": 0.005289970897138119, "global_step": 22273, "epoch": 187, "lr": 7.847864729493688e-05} +{"train_loss": 0.004838842432945967, "global_step": 22274, "epoch": 187, "lr": 7.847682624924957e-05} +{"train_loss": 0.0048776972107589245, "global_step": 22275, "epoch": 187, "lr": 7.847500514765105e-05} +{"train_loss": 0.002248841803520918, "global_step": 22276, "epoch": 187, "lr": 7.847318399014489e-05} +{"train_loss": 0.009848715737462044, "global_step": 22277, "epoch": 187, "lr": 7.847136277673468e-05} +{"train_loss": 0.006817671004682779, "global_step": 22278, "epoch": 187, "lr": 7.8469541507424e-05} +{"train_loss": 0.004583006724715233, "global_step": 22279, "epoch": 187, "lr": 7.84677201822164e-05} +{"train_loss": 0.005684407893568277, "global_step": 22280, "epoch": 187, "lr": 7.846589880111547e-05} +{"train_loss": 0.005154780577868223, "global_step": 22281, "epoch": 187, "lr": 7.846407736412482e-05} +{"train_loss": 0.007323784753680229, "global_step": 22282, "epoch": 187, "lr": 7.846225587124797e-05} +{"train_loss": 0.0036836066283285618, "global_step": 22283, "epoch": 187, "lr": 7.846043432248853e-05} +{"train_loss": 0.004320920445024967, "global_step": 22284, "epoch": 187, "lr": 7.845861271785005e-05} +{"train_loss": 0.003912848886102438, "global_step": 22285, "epoch": 187, "lr": 7.845679105733614e-05} +{"train_loss": 0.007440661080181599, "global_step": 22286, "epoch": 187, "lr": 7.845496934095035e-05} +{"train_loss": 0.003142715198919177, "global_step": 22287, "epoch": 187, "lr": 7.845314756869628e-05} +{"train_loss": 0.004805335309356451, "global_step": 22288, "epoch": 187, "lr": 7.84513257405775e-05} +{"train_loss": 0.003365000244230032, "global_step": 22289, "epoch": 187, "lr": 7.844950385659758e-05} +{"train_loss": 0.003700074041262269, "global_step": 22290, "epoch": 187, "lr": 7.844768191676008e-05} +{"train_loss": 0.006747061852365732, "global_step": 22291, "epoch": 187, "lr": 7.844585992106861e-05} +{"train_loss": 0.00429815798997879, "global_step": 22292, "epoch": 187, "lr": 7.844403786952672e-05} +{"train_loss": 0.005224945489317179, "global_step": 22293, "epoch": 187, "lr": 7.844221576213802e-05} +{"train_loss": 0.004366460256278515, "global_step": 22294, "epoch": 187, "lr": 7.844039359890607e-05} +{"train_loss": 0.004402671009302139, "global_step": 22295, "epoch": 187, "lr": 7.843857137983443e-05} +{"train_loss": 0.004273100756108761, "global_step": 22296, "epoch": 187, "lr": 7.843674910492668e-05} +{"train_loss": 0.006157431285828352, "global_step": 22297, "epoch": 187, "lr": 7.843492677418643e-05} +{"train_loss": 0.0057373023591935635, "global_step": 22298, "epoch": 187, "lr": 7.843310438761724e-05} +{"train_loss": 0.005046514328569174, "global_step": 22299, "epoch": 187, "lr": 7.843128194522268e-05} +{"train_loss": 0.005631315056234598, "global_step": 22300, "epoch": 187, "lr": 7.842945944700635e-05} +{"train_loss": 0.0037178760394454002, "global_step": 22301, "epoch": 187, "lr": 7.84276368929718e-05} +{"train_loss": 0.003433341160416603, "global_step": 22302, "epoch": 187, "lr": 7.842581428312263e-05} +{"train_loss": 0.003710078075528145, "global_step": 22303, "epoch": 187, "lr": 7.842399161746241e-05} +{"train_loss": 0.004883124493062496, "global_step": 22304, "epoch": 187, "lr": 7.842216889599471e-05} +{"train_loss": 0.003705621464177966, "global_step": 22305, "epoch": 187, "lr": 7.842034611872313e-05} +{"train_loss": 0.006161664146929979, "global_step": 22306, "epoch": 187, "lr": 7.841852328565123e-05} +{"train_loss": 0.0025702768471091986, "global_step": 22307, "epoch": 187, "lr": 7.84167003967826e-05} +{"train_loss": 0.00464105699211359, "global_step": 22308, "epoch": 187, "lr": 7.84148774521208e-05} +{"train_loss": 0.0028388877399265766, "global_step": 22309, "epoch": 187, "lr": 7.841305445166943e-05} +{"train_loss": 0.007801858242601156, "global_step": 22310, "epoch": 187, "lr": 7.841123139543208e-05} +{"train_loss": 0.00790273118764162, "global_step": 22311, "epoch": 187, "lr": 7.840940828341229e-05} +{"train_loss": 0.004849820863455534, "global_step": 22312, "epoch": 187, "lr": 7.840758511561367e-05} +{"train_loss": 0.006988902110606432, "global_step": 22313, "epoch": 187, "lr": 7.840576189203979e-05} +{"train_loss": 0.0050233714282512665, "global_step": 22314, "epoch": 187, "lr": 7.840393861269424e-05} +{"train_loss": 0.006882817950099707, "global_step": 22315, "epoch": 187, "lr": 7.840211527758058e-05} +{"train_loss": 0.007090642116963863, "global_step": 22316, "epoch": 187, "lr": 7.84002918867024e-05} +{"train_loss": 0.00616431562229991, "global_step": 22317, "epoch": 187, "lr": 7.839846844006329e-05} +{"train_loss": 0.004818664398044348, "global_step": 22318, "epoch": 187, "lr": 7.839664493766682e-05} +{"train_loss": 0.006067832000553608, "global_step": 22319, "epoch": 187, "lr": 7.839482137951658e-05} +{"train_loss": 0.00417852308601141, "global_step": 22320, "epoch": 187, "lr": 7.839299776561613e-05} +{"train_loss": 0.004979758523404598, "global_step": 22321, "epoch": 187, "lr": 7.839117409596906e-05} +{"train_loss": 0.0052672866731882095, "global_step": 22322, "epoch": 187, "lr": 7.838935037057896e-05} +{"train_loss": 0.0039046911988407373, "global_step": 22323, "epoch": 187, "lr": 7.83875265894494e-05} +{"train_loss": 0.005696549080312252, "global_step": 22324, "epoch": 187, "lr": 7.838570275258395e-05} +{"train_loss": 0.007065881043672562, "global_step": 22325, "epoch": 187, "lr": 7.838387885998624e-05} +{"train_loss": 0.004322161432355642, "global_step": 22326, "epoch": 187, "lr": 7.838205491165978e-05} +{"train_loss": 0.005224515683948994, "global_step": 22327, "epoch": 187, "lr": 7.838023090760821e-05} +{"train_loss": 0.0060926806181669235, "global_step": 22328, "epoch": 187, "lr": 7.837840684783509e-05} +{"train_loss": 0.004555040970444679, "global_step": 22329, "epoch": 187, "lr": 7.837658273234398e-05} +{"train_loss": 0.0032674751710146666, "global_step": 22330, "epoch": 187, "lr": 7.83747585611385e-05} +{"train_loss": 0.00480902474373579, "global_step": 22331, "epoch": 187, "lr": 7.837293433422219e-05} +{"train_loss": 0.0027125095948576927, "global_step": 22332, "epoch": 187, "lr": 7.837111005159868e-05} +{"train_loss": 0.004338672384619713, "global_step": 22333, "epoch": 187, "lr": 7.836928571327152e-05} +{"train_loss": 0.005623542238026857, "global_step": 22334, "epoch": 187, "lr": 7.836746131924428e-05} +{"train_loss": 0.005299883428961039, "global_step": 22335, "epoch": 187, "lr": 7.836563686952058e-05} +{"train_loss": 0.004148383624851704, "global_step": 22336, "epoch": 187, "lr": 7.836381236410399e-05} +{"train_loss": 0.00441461568698287, "global_step": 22337, "epoch": 187, "lr": 7.836198780299807e-05} +{"train_loss": 0.008419244550168514, "global_step": 22338, "epoch": 187, "lr": 7.836016318620641e-05} +{"train_loss": 0.005105958320200443, "global_step": 22339, "epoch": 187, "lr": 7.835833851373263e-05} +{"train_loss": 0.0032322858460247517, "global_step": 22340, "epoch": 187, "lr": 7.835651378558025e-05} +{"train_loss": 0.005784699693322182, "global_step": 22341, "epoch": 187, "lr": 7.835468900175288e-05} +{"train_loss": 0.004795087967067957, "global_step": 22342, "epoch": 187, "lr": 7.835286416225414e-05} +{"train_loss": 0.007150000426918268, "global_step": 22343, "epoch": 187, "lr": 7.835103926708756e-05} +{"train_loss": 0.004320238251239061, "global_step": 22344, "epoch": 187, "lr": 7.834921431625675e-05} +{"train_loss": 0.0046228147111833096, "global_step": 22345, "epoch": 187, "lr": 7.834738930976528e-05} +{"train_loss": 0.007396729197353125, "global_step": 22346, "epoch": 187, "lr": 7.834556424761674e-05} +{"train_loss": 0.005221525672823191, "global_step": 22347, "epoch": 187, "lr": 7.834373912981472e-05} +{"train_loss": 0.009463137947022915, "global_step": 22348, "epoch": 187, "lr": 7.83419139563628e-05} +{"train_loss": 0.005935494787991047, "global_step": 22349, "epoch": 187, "lr": 7.834008872726452e-05} +{"train_loss": 0.004181249532848597, "global_step": 22350, "epoch": 187, "lr": 7.833826344252355e-05} +{"train_loss": 0.0037349064368754625, "global_step": 22351, "epoch": 187, "lr": 7.833643810214342e-05} +{"train_loss": 0.0035139317624270916, "global_step": 22352, "epoch": 187, "lr": 7.833461270612771e-05} +{"train_loss": 0.005977680906653404, "global_step": 22353, "epoch": 187, "lr": 7.833278725448001e-05} +{"train_loss": 0.005934505723416805, "global_step": 22354, "epoch": 187, "lr": 7.833096174720392e-05} +{"train_loss": 0.003244934370741248, "global_step": 22355, "epoch": 187, "lr": 7.832913618430303e-05} +{"train_loss": 0.0072321780025959015, "global_step": 22356, "epoch": 187, "lr": 7.832731056578087e-05} +{"train_loss": 0.004558532498776913, "global_step": 22357, "epoch": 187, "lr": 7.832548489164109e-05} +{"train_loss": 0.004001014865934849, "global_step": 22358, "epoch": 187, "lr": 7.832365916188723e-05} +{"train_loss": 0.005875398870557547, "global_step": 22359, "epoch": 187, "lr": 7.83218333765229e-05} +{"train_loss": 0.005232919938862324, "global_step": 22360, "epoch": 187, "lr": 7.832000753555166e-05} +{"train_loss": 0.003422415116801858, "global_step": 22361, "epoch": 187, "lr": 7.831818163897713e-05} +{"train_loss": 0.003607438877224922, "global_step": 22362, "epoch": 187, "lr": 7.831635568680287e-05} +{"train_loss": 0.00611797533929348, "global_step": 22363, "epoch": 187, "lr": 7.831452967903248e-05} +{"train_loss": 0.006246720440685749, "global_step": 22364, "epoch": 187, "lr": 7.831270361566953e-05} +{"train_loss": 0.004496200941503048, "global_step": 22365, "epoch": 187, "lr": 7.831087749671761e-05} +{"train_loss": 0.006128287874162197, "global_step": 22366, "epoch": 187, "lr": 7.83090513221803e-05} +{"train_loss": 0.004920031409710646, "global_step": 22367, "epoch": 187, "lr": 7.830722509206118e-05} +{"train_loss": 0.005058208014816046, "global_step": 22368, "epoch": 187, "lr": 7.830539880636387e-05} +{"train_loss": 0.004585994873195887, "global_step": 22369, "epoch": 187, "lr": 7.830357246509194e-05} +{"train_loss": 0.0035728509537875652, "global_step": 22370, "epoch": 187, "lr": 7.830174606824896e-05} +{"train_loss": 0.004977468888377066, "global_step": 22371, "epoch": 187, "lr": 7.829991961583851e-05, "val_loss": 0.010466177016496658} +{"train_loss": 0.004660754930227995, "global_step": 22372, "epoch": 188, "lr": 7.829809310786421e-05} +{"train_loss": 0.0048751188442111015, "global_step": 22373, "epoch": 188, "lr": 7.829626654432963e-05} +{"train_loss": 0.004778103902935982, "global_step": 22374, "epoch": 188, "lr": 7.829443992523833e-05} +{"train_loss": 0.00761078204959631, "global_step": 22375, "epoch": 188, "lr": 7.829261325059394e-05} +{"train_loss": 0.0037525100633502007, "global_step": 22376, "epoch": 188, "lr": 7.829078652040002e-05} +{"train_loss": 0.00474420515820384, "global_step": 22377, "epoch": 188, "lr": 7.828895973466017e-05} +{"train_loss": 0.005656196270138025, "global_step": 22378, "epoch": 188, "lr": 7.828713289337797e-05} +{"train_loss": 0.004204995930194855, "global_step": 22379, "epoch": 188, "lr": 7.828530599655699e-05} +{"train_loss": 0.007026632782071829, "global_step": 22380, "epoch": 188, "lr": 7.828347904420084e-05} +{"train_loss": 0.005761757958680391, "global_step": 22381, "epoch": 188, "lr": 7.82816520363131e-05} +{"train_loss": 0.005087763071060181, "global_step": 22382, "epoch": 188, "lr": 7.827982497289738e-05} +{"train_loss": 0.005006785504519939, "global_step": 22383, "epoch": 188, "lr": 7.827799785395723e-05} +{"train_loss": 0.004272197373211384, "global_step": 22384, "epoch": 188, "lr": 7.827617067949625e-05} +{"train_loss": 0.0030357602518051863, "global_step": 22385, "epoch": 188, "lr": 7.827434344951803e-05} +{"train_loss": 0.003873453475534916, "global_step": 22386, "epoch": 188, "lr": 7.827251616402615e-05} +{"train_loss": 0.0038864295929670334, "global_step": 22387, "epoch": 188, "lr": 7.827068882302422e-05} +{"train_loss": 0.003796475473791361, "global_step": 22388, "epoch": 188, "lr": 7.826886142651579e-05} +{"train_loss": 0.004609403200447559, "global_step": 22389, "epoch": 188, "lr": 7.82670339745045e-05} +{"train_loss": 0.003916955552995205, "global_step": 22390, "epoch": 188, "lr": 7.826520646699389e-05} +{"train_loss": 0.007210018578916788, "global_step": 22391, "epoch": 188, "lr": 7.826337890398756e-05} +{"train_loss": 0.0028834950644522905, "global_step": 22392, "epoch": 188, "lr": 7.826155128548912e-05} +{"train_loss": 0.0048754857853055, "global_step": 22393, "epoch": 188, "lr": 7.825972361150214e-05} +{"train_loss": 0.004645291715860367, "global_step": 22394, "epoch": 188, "lr": 7.825789588203022e-05} +{"train_loss": 0.00548746669664979, "global_step": 22395, "epoch": 188, "lr": 7.825606809707693e-05} +{"train_loss": 0.00655097421258688, "global_step": 22396, "epoch": 188, "lr": 7.825424025664588e-05} +{"train_loss": 0.006652916315943003, "global_step": 22397, "epoch": 188, "lr": 7.825241236074063e-05} +{"train_loss": 0.005321749020367861, "global_step": 22398, "epoch": 188, "lr": 7.825058440936479e-05} +{"train_loss": 0.005803059320896864, "global_step": 22399, "epoch": 188, "lr": 7.824875640252194e-05} +{"train_loss": 0.003612311091274023, "global_step": 22400, "epoch": 188, "lr": 7.824692834021569e-05} +{"train_loss": 0.004542199894785881, "global_step": 22401, "epoch": 188, "lr": 7.824510022244962e-05} +{"train_loss": 0.004194024950265884, "global_step": 22402, "epoch": 188, "lr": 7.82432720492273e-05} +{"train_loss": 0.004547779448330402, "global_step": 22403, "epoch": 188, "lr": 7.824144382055234e-05} +{"train_loss": 0.004754168912768364, "global_step": 22404, "epoch": 188, "lr": 7.823961553642831e-05} +{"train_loss": 0.003354056738317013, "global_step": 22405, "epoch": 188, "lr": 7.823778719685881e-05} +{"train_loss": 0.0044094473123550415, "global_step": 22406, "epoch": 188, "lr": 7.823595880184745e-05} +{"train_loss": 0.008139079436659813, "global_step": 22407, "epoch": 188, "lr": 7.823413035139779e-05} +{"train_loss": 0.004591973964124918, "global_step": 22408, "epoch": 188, "lr": 7.823230184551345e-05} +{"train_loss": 0.003904653713107109, "global_step": 22409, "epoch": 188, "lr": 7.823047328419797e-05} +{"train_loss": 0.006408128421753645, "global_step": 22410, "epoch": 188, "lr": 7.822864466745498e-05} +{"train_loss": 0.0052704173140227795, "global_step": 22411, "epoch": 188, "lr": 7.822681599528807e-05} +{"train_loss": 0.005611091386526823, "global_step": 22412, "epoch": 188, "lr": 7.822498726770082e-05} +{"train_loss": 0.0037925620563328266, "global_step": 22413, "epoch": 188, "lr": 7.822315848469683e-05} +{"train_loss": 0.005551828071475029, "global_step": 22414, "epoch": 188, "lr": 7.822132964627968e-05} +{"train_loss": 0.005135464482009411, "global_step": 22415, "epoch": 188, "lr": 7.821950075245296e-05} +{"train_loss": 0.002431292785331607, "global_step": 22416, "epoch": 188, "lr": 7.821767180322026e-05} +{"train_loss": 0.00269130477681756, "global_step": 22417, "epoch": 188, "lr": 7.821584279858518e-05} +{"train_loss": 0.004117080010473728, "global_step": 22418, "epoch": 188, "lr": 7.821401373855132e-05} +{"train_loss": 0.006020651664584875, "global_step": 22419, "epoch": 188, "lr": 7.821218462312225e-05} +{"train_loss": 0.00525269890204072, "global_step": 22420, "epoch": 188, "lr": 7.821035545230157e-05} +{"train_loss": 0.0026049804873764515, "global_step": 22421, "epoch": 188, "lr": 7.820852622609287e-05} +{"train_loss": 0.0023476288188248873, "global_step": 22422, "epoch": 188, "lr": 7.820669694449974e-05} +{"train_loss": 0.0026579841505736113, "global_step": 22423, "epoch": 188, "lr": 7.820486760752577e-05} +{"train_loss": 0.0032499029766768217, "global_step": 22424, "epoch": 188, "lr": 7.820303821517457e-05} +{"train_loss": 0.004112640395760536, "global_step": 22425, "epoch": 188, "lr": 7.82012087674497e-05} +{"train_loss": 0.004777497611939907, "global_step": 22426, "epoch": 188, "lr": 7.819937926435479e-05} +{"train_loss": 0.003897036425769329, "global_step": 22427, "epoch": 188, "lr": 7.819754970589339e-05} +{"train_loss": 0.0033868462778627872, "global_step": 22428, "epoch": 188, "lr": 7.819572009206912e-05} +{"train_loss": 0.005039101000875235, "global_step": 22429, "epoch": 188, "lr": 7.819389042288556e-05} +{"train_loss": 0.0025505758821964264, "global_step": 22430, "epoch": 188, "lr": 7.819206069834632e-05} +{"train_loss": 0.0026684158947318792, "global_step": 22431, "epoch": 188, "lr": 7.8190230918455e-05} +{"train_loss": 0.003862254787236452, "global_step": 22432, "epoch": 188, "lr": 7.818840108321515e-05} +{"train_loss": 0.005069340579211712, "global_step": 22433, "epoch": 188, "lr": 7.818657119263037e-05} +{"train_loss": 0.005866262596100569, "global_step": 22434, "epoch": 188, "lr": 7.81847412467043e-05} +{"train_loss": 0.005210799165070057, "global_step": 22435, "epoch": 188, "lr": 7.818291124544048e-05} +{"train_loss": 0.005704915151000023, "global_step": 22436, "epoch": 188, "lr": 7.818108118884253e-05} +{"train_loss": 0.0077531831339001656, "global_step": 22437, "epoch": 188, "lr": 7.817925107691405e-05} +{"train_loss": 0.005586699116975069, "global_step": 22438, "epoch": 188, "lr": 7.81774209096586e-05} +{"train_loss": 0.004127449356019497, "global_step": 22439, "epoch": 188, "lr": 7.81755906870798e-05} +{"train_loss": 0.005450321361422539, "global_step": 22440, "epoch": 188, "lr": 7.817376040918124e-05} +{"train_loss": 0.002449869178235531, "global_step": 22441, "epoch": 188, "lr": 7.817193007596653e-05} +{"train_loss": 0.004272910766303539, "global_step": 22442, "epoch": 188, "lr": 7.817009968743923e-05} +{"train_loss": 0.006827673874795437, "global_step": 22443, "epoch": 188, "lr": 7.816826924360295e-05} +{"train_loss": 0.005937246605753899, "global_step": 22444, "epoch": 188, "lr": 7.816643874446126e-05} +{"train_loss": 0.004056616220623255, "global_step": 22445, "epoch": 188, "lr": 7.81646081900178e-05} +{"train_loss": 0.0049321623519063, "global_step": 22446, "epoch": 188, "lr": 7.816277758027614e-05} +{"train_loss": 0.00565399369224906, "global_step": 22447, "epoch": 188, "lr": 7.816094691523987e-05} +{"train_loss": 0.0052991872653365135, "global_step": 22448, "epoch": 188, "lr": 7.81591161949126e-05} +{"train_loss": 0.0034793750382959843, "global_step": 22449, "epoch": 188, "lr": 7.81572854192979e-05} +{"train_loss": 0.005201659165322781, "global_step": 22450, "epoch": 188, "lr": 7.81554545883994e-05} +{"train_loss": 0.005578174255788326, "global_step": 22451, "epoch": 188, "lr": 7.815362370222066e-05} +{"train_loss": 0.0032168372999876738, "global_step": 22452, "epoch": 188, "lr": 7.815179276076527e-05} +{"train_loss": 0.0028724507428705692, "global_step": 22453, "epoch": 188, "lr": 7.814996176403686e-05} +{"train_loss": 0.005380262620747089, "global_step": 22454, "epoch": 188, "lr": 7.814813071203901e-05} +{"train_loss": 0.004333776421844959, "global_step": 22455, "epoch": 188, "lr": 7.81462996047753e-05} +{"train_loss": 0.004887694027274847, "global_step": 22456, "epoch": 188, "lr": 7.814446844224934e-05} +{"train_loss": 0.0041542742401361465, "global_step": 22457, "epoch": 188, "lr": 7.814263722446473e-05} +{"train_loss": 0.0032345345243811607, "global_step": 22458, "epoch": 188, "lr": 7.814080595142507e-05} +{"train_loss": 0.0048941681161522865, "global_step": 22459, "epoch": 188, "lr": 7.813897462313394e-05} +{"train_loss": 0.005028542131185532, "global_step": 22460, "epoch": 188, "lr": 7.813714323959491e-05} +{"train_loss": 0.005444271489977837, "global_step": 22461, "epoch": 188, "lr": 7.813531180081163e-05} +{"train_loss": 0.0036532902158796787, "global_step": 22462, "epoch": 188, "lr": 7.813348030678766e-05} +{"train_loss": 0.005414173472672701, "global_step": 22463, "epoch": 188, "lr": 7.813164875752662e-05} +{"train_loss": 0.005097759887576103, "global_step": 22464, "epoch": 188, "lr": 7.812981715303209e-05} +{"train_loss": 0.008381116203963757, "global_step": 22465, "epoch": 188, "lr": 7.812798549330767e-05} +{"train_loss": 0.0046529145911335945, "global_step": 22466, "epoch": 188, "lr": 7.812615377835694e-05} +{"train_loss": 0.005946244578808546, "global_step": 22467, "epoch": 188, "lr": 7.812432200818352e-05} +{"train_loss": 0.004025585018098354, "global_step": 22468, "epoch": 188, "lr": 7.812249018279101e-05} +{"train_loss": 0.004908285103738308, "global_step": 22469, "epoch": 188, "lr": 7.812065830218298e-05} +{"train_loss": 0.0069312346167862415, "global_step": 22470, "epoch": 188, "lr": 7.811882636636305e-05} +{"train_loss": 0.005052493419498205, "global_step": 22471, "epoch": 188, "lr": 7.811699437533481e-05} +{"train_loss": 0.0038674662355333567, "global_step": 22472, "epoch": 188, "lr": 7.811516232910185e-05} +{"train_loss": 0.003628062317147851, "global_step": 22473, "epoch": 188, "lr": 7.811333022766776e-05} +{"train_loss": 0.004455544054508209, "global_step": 22474, "epoch": 188, "lr": 7.811149807103617e-05} +{"train_loss": 0.0030486686155200005, "global_step": 22475, "epoch": 188, "lr": 7.810966585921066e-05} +{"train_loss": 0.007877733558416367, "global_step": 22476, "epoch": 188, "lr": 7.810783359219483e-05} +{"train_loss": 0.004728267900645733, "global_step": 22477, "epoch": 188, "lr": 7.810600126999224e-05} +{"train_loss": 0.0030651530250906944, "global_step": 22478, "epoch": 188, "lr": 7.810416889260653e-05} +{"train_loss": 0.004580446518957615, "global_step": 22479, "epoch": 188, "lr": 7.81023364600413e-05} +{"train_loss": 0.0031933088321238756, "global_step": 22480, "epoch": 188, "lr": 7.810050397230012e-05} +{"train_loss": 0.00413249246776104, "global_step": 22481, "epoch": 188, "lr": 7.80986714293866e-05} +{"train_loss": 0.006322699133306742, "global_step": 22482, "epoch": 188, "lr": 7.809683883130436e-05} +{"train_loss": 0.003589082043617964, "global_step": 22483, "epoch": 188, "lr": 7.809500617805698e-05} +{"train_loss": 0.004747751168906689, "global_step": 22484, "epoch": 188, "lr": 7.809317346964804e-05} +{"train_loss": 0.005890784785151482, "global_step": 22485, "epoch": 188, "lr": 7.809134070608117e-05} +{"train_loss": 0.003073246916756034, "global_step": 22486, "epoch": 188, "lr": 7.808950788735994e-05} +{"train_loss": 0.004248259589076042, "global_step": 22487, "epoch": 188, "lr": 7.808767501348798e-05} +{"train_loss": 0.003876354079693556, "global_step": 22488, "epoch": 188, "lr": 7.808584208446885e-05} +{"train_loss": 0.003966272808611393, "global_step": 22489, "epoch": 188, "lr": 7.808400910030618e-05} +{"train_loss": 0.004679340010258455, "global_step": 22490, "epoch": 188, "lr": 7.808217606100355e-05, "val_loss": 0.017079301178455353} +{"train_loss": 0.0050130621530115604, "global_step": 22491, "epoch": 189, "lr": 7.808034296656457e-05} +{"train_loss": 0.006807616446167231, "global_step": 22492, "epoch": 189, "lr": 7.807850981699284e-05} +{"train_loss": 0.0030437116511166096, "global_step": 22493, "epoch": 189, "lr": 7.807667661229195e-05} +{"train_loss": 0.005697275977581739, "global_step": 22494, "epoch": 189, "lr": 7.807484335246551e-05} +{"train_loss": 0.004191579297184944, "global_step": 22495, "epoch": 189, "lr": 7.807301003751712e-05} +{"train_loss": 0.0050920844078063965, "global_step": 22496, "epoch": 189, "lr": 7.807117666745037e-05} +{"train_loss": 0.007150691002607346, "global_step": 22497, "epoch": 189, "lr": 7.806934324226886e-05} +{"train_loss": 0.004686082247644663, "global_step": 22498, "epoch": 189, "lr": 7.806750976197618e-05} +{"train_loss": 0.005087822675704956, "global_step": 22499, "epoch": 189, "lr": 7.806567622657596e-05} +{"train_loss": 0.005153348669409752, "global_step": 22500, "epoch": 189, "lr": 7.80638426360718e-05} +{"train_loss": 0.0042087542824447155, "global_step": 22501, "epoch": 189, "lr": 7.806200899046728e-05} +{"train_loss": 0.0026061893440783024, "global_step": 22502, "epoch": 189, "lr": 7.806017528976597e-05} +{"train_loss": 0.0044186776503920555, "global_step": 22503, "epoch": 189, "lr": 7.805834153397152e-05} +{"train_loss": 0.0028574890457093716, "global_step": 22504, "epoch": 189, "lr": 7.805650772308753e-05} +{"train_loss": 0.004120406694710255, "global_step": 22505, "epoch": 189, "lr": 7.805467385711756e-05} +{"train_loss": 0.003709483193233609, "global_step": 22506, "epoch": 189, "lr": 7.805283993606524e-05} +{"train_loss": 0.004102950915694237, "global_step": 22507, "epoch": 189, "lr": 7.805100595993418e-05} +{"train_loss": 0.0035484919790178537, "global_step": 22508, "epoch": 189, "lr": 7.804917192872797e-05} +{"train_loss": 0.005079898051917553, "global_step": 22509, "epoch": 189, "lr": 7.804733784245019e-05} +{"train_loss": 0.004806116223335266, "global_step": 22510, "epoch": 189, "lr": 7.804550370110446e-05} +{"train_loss": 0.006263855379074812, "global_step": 22511, "epoch": 189, "lr": 7.804366950469438e-05} +{"train_loss": 0.0058370353654026985, "global_step": 22512, "epoch": 189, "lr": 7.804183525322355e-05} +{"train_loss": 0.00546064879745245, "global_step": 22513, "epoch": 189, "lr": 7.80400009466956e-05} +{"train_loss": 0.004700920544564724, "global_step": 22514, "epoch": 189, "lr": 7.803816658511407e-05} +{"train_loss": 0.0061836084350943565, "global_step": 22515, "epoch": 189, "lr": 7.80363321684826e-05} +{"train_loss": 0.006894637830555439, "global_step": 22516, "epoch": 189, "lr": 7.80344976968048e-05} +{"train_loss": 0.003945301752537489, "global_step": 22517, "epoch": 189, "lr": 7.803266317008424e-05} +{"train_loss": 0.003939395304769278, "global_step": 22518, "epoch": 189, "lr": 7.803082858832455e-05} +{"train_loss": 0.004031162243336439, "global_step": 22519, "epoch": 189, "lr": 7.802899395152934e-05} +{"train_loss": 0.004422694910317659, "global_step": 22520, "epoch": 189, "lr": 7.802715925970218e-05} +{"train_loss": 0.00504954531788826, "global_step": 22521, "epoch": 189, "lr": 7.802532451284667e-05} +{"train_loss": 0.005027904640883207, "global_step": 22522, "epoch": 189, "lr": 7.802348971096646e-05} +{"train_loss": 0.004195025656372309, "global_step": 22523, "epoch": 189, "lr": 7.80216548540651e-05} +{"train_loss": 0.006586231756955385, "global_step": 22524, "epoch": 189, "lr": 7.801981994214622e-05} +{"train_loss": 0.0046971458941698074, "global_step": 22525, "epoch": 189, "lr": 7.801798497521342e-05} +{"train_loss": 0.0029323885682970285, "global_step": 22526, "epoch": 189, "lr": 7.801614995327031e-05} +{"train_loss": 0.004053670912981033, "global_step": 22527, "epoch": 189, "lr": 7.801431487632047e-05} +{"train_loss": 0.0042673079296946526, "global_step": 22528, "epoch": 189, "lr": 7.801247974436752e-05} +{"train_loss": 0.006001846864819527, "global_step": 22529, "epoch": 189, "lr": 7.801064455741506e-05} +{"train_loss": 0.0044153896160423756, "global_step": 22530, "epoch": 189, "lr": 7.800880931546668e-05} +{"train_loss": 0.005585820879787207, "global_step": 22531, "epoch": 189, "lr": 7.800697401852602e-05} +{"train_loss": 0.003337046829983592, "global_step": 22532, "epoch": 189, "lr": 7.800513866659665e-05} +{"train_loss": 0.0038697838317602873, "global_step": 22533, "epoch": 189, "lr": 7.800330325968217e-05} +{"train_loss": 0.006379405036568642, "global_step": 22534, "epoch": 189, "lr": 7.800146779778619e-05} +{"train_loss": 0.005101480986922979, "global_step": 22535, "epoch": 189, "lr": 7.799963228091234e-05} +{"train_loss": 0.004056099336594343, "global_step": 22536, "epoch": 189, "lr": 7.799779670906419e-05} +{"train_loss": 0.004481173120439053, "global_step": 22537, "epoch": 189, "lr": 7.799596108224535e-05} +{"train_loss": 0.004346827510744333, "global_step": 22538, "epoch": 189, "lr": 7.799412540045945e-05} +{"train_loss": 0.004611085634678602, "global_step": 22539, "epoch": 189, "lr": 7.799228966371006e-05} +{"train_loss": 0.006059331353753805, "global_step": 22540, "epoch": 189, "lr": 7.799045387200082e-05} +{"train_loss": 0.005636480636894703, "global_step": 22541, "epoch": 189, "lr": 7.79886180253353e-05} +{"train_loss": 0.005720402579754591, "global_step": 22542, "epoch": 189, "lr": 7.79867821237171e-05} +{"train_loss": 0.003967981319874525, "global_step": 22543, "epoch": 189, "lr": 7.798494616714987e-05} +{"train_loss": 0.00595602672547102, "global_step": 22544, "epoch": 189, "lr": 7.798311015563719e-05} +{"train_loss": 0.005169984884560108, "global_step": 22545, "epoch": 189, "lr": 7.798127408918265e-05} +{"train_loss": 0.004794907756149769, "global_step": 22546, "epoch": 189, "lr": 7.797943796778988e-05} +{"train_loss": 0.0036673578433692455, "global_step": 22547, "epoch": 189, "lr": 7.797760179146245e-05} +{"train_loss": 0.005173295736312866, "global_step": 22548, "epoch": 189, "lr": 7.7975765560204e-05} +{"train_loss": 0.002597588114440441, "global_step": 22549, "epoch": 189, "lr": 7.797392927401813e-05} +{"train_loss": 0.0037167994305491447, "global_step": 22550, "epoch": 189, "lr": 7.797209293290843e-05} +{"train_loss": 0.005798394326120615, "global_step": 22551, "epoch": 189, "lr": 7.797025653687853e-05} +{"train_loss": 0.002629059599712491, "global_step": 22552, "epoch": 189, "lr": 7.7968420085932e-05} +{"train_loss": 0.004677946679294109, "global_step": 22553, "epoch": 189, "lr": 7.796658358007247e-05} +{"train_loss": 0.004973000846803188, "global_step": 22554, "epoch": 189, "lr": 7.796474701930354e-05} +{"train_loss": 0.007107183802872896, "global_step": 22555, "epoch": 189, "lr": 7.796291040362882e-05} +{"train_loss": 0.0037301587872207165, "global_step": 22556, "epoch": 189, "lr": 7.796107373305193e-05} +{"train_loss": 0.0061685857363045216, "global_step": 22557, "epoch": 189, "lr": 7.795923700757644e-05} +{"train_loss": 0.0048342738300561905, "global_step": 22558, "epoch": 189, "lr": 7.795740022720596e-05} +{"train_loss": 0.007984859868884087, "global_step": 22559, "epoch": 189, "lr": 7.795556339194414e-05} +{"train_loss": 0.0038590694312006235, "global_step": 22560, "epoch": 189, "lr": 7.795372650179456e-05} +{"train_loss": 0.009250144474208355, "global_step": 22561, "epoch": 189, "lr": 7.79518895567608e-05} +{"train_loss": 0.0037937774322927, "global_step": 22562, "epoch": 189, "lr": 7.795005255684649e-05} +{"train_loss": 0.003251082729548216, "global_step": 22563, "epoch": 189, "lr": 7.794821550205527e-05} +{"train_loss": 0.003477547550573945, "global_step": 22564, "epoch": 189, "lr": 7.794637839239068e-05} +{"train_loss": 0.0040413811802864075, "global_step": 22565, "epoch": 189, "lr": 7.794454122785638e-05} +{"train_loss": 0.007661206182092428, "global_step": 22566, "epoch": 189, "lr": 7.794270400845596e-05} +{"train_loss": 0.003917308058589697, "global_step": 22567, "epoch": 189, "lr": 7.7940866734193e-05} +{"train_loss": 0.0034250628668814898, "global_step": 22568, "epoch": 189, "lr": 7.793902940507117e-05} +{"train_loss": 0.005696526262909174, "global_step": 22569, "epoch": 189, "lr": 7.793719202109402e-05} +{"train_loss": 0.0038735545240342617, "global_step": 22570, "epoch": 189, "lr": 7.793535458226518e-05} +{"train_loss": 0.0068028829991817474, "global_step": 22571, "epoch": 189, "lr": 7.793351708858827e-05} +{"train_loss": 0.005191081669181585, "global_step": 22572, "epoch": 189, "lr": 7.793167954006686e-05} +{"train_loss": 0.004226330202072859, "global_step": 22573, "epoch": 189, "lr": 7.79298419367046e-05} +{"train_loss": 0.002630826784297824, "global_step": 22574, "epoch": 189, "lr": 7.792800427850506e-05} +{"train_loss": 0.006645352579653263, "global_step": 22575, "epoch": 189, "lr": 7.792616656547189e-05} +{"train_loss": 0.0052650184370577335, "global_step": 22576, "epoch": 189, "lr": 7.792432879760867e-05} +{"train_loss": 0.006310339085757732, "global_step": 22577, "epoch": 189, "lr": 7.792249097491901e-05} +{"train_loss": 0.004928918555378914, "global_step": 22578, "epoch": 189, "lr": 7.792065309740652e-05} +{"train_loss": 0.0037065159995108843, "global_step": 22579, "epoch": 189, "lr": 7.79188151650748e-05} +{"train_loss": 0.005329036619514227, "global_step": 22580, "epoch": 189, "lr": 7.791697717792749e-05} +{"train_loss": 0.003607897087931633, "global_step": 22581, "epoch": 189, "lr": 7.791513913596816e-05} +{"train_loss": 0.0032421457581222057, "global_step": 22582, "epoch": 189, "lr": 7.791330103920044e-05} +{"train_loss": 0.0029243549797683954, "global_step": 22583, "epoch": 189, "lr": 7.791146288762796e-05} +{"train_loss": 0.004948070738464594, "global_step": 22584, "epoch": 189, "lr": 7.790962468125428e-05} +{"train_loss": 0.0050270697101950645, "global_step": 22585, "epoch": 189, "lr": 7.790778642008302e-05} +{"train_loss": 0.003520884783938527, "global_step": 22586, "epoch": 189, "lr": 7.790594810411783e-05} +{"train_loss": 0.0037484965287148952, "global_step": 22587, "epoch": 189, "lr": 7.790410973336228e-05} +{"train_loss": 0.005321631208062172, "global_step": 22588, "epoch": 189, "lr": 7.790227130782e-05} +{"train_loss": 0.004461641889065504, "global_step": 22589, "epoch": 189, "lr": 7.79004328274946e-05} +{"train_loss": 0.005322596989572048, "global_step": 22590, "epoch": 189, "lr": 7.789859429238966e-05} +{"train_loss": 0.0042850421741604805, "global_step": 22591, "epoch": 189, "lr": 7.789675570250882e-05} +{"train_loss": 0.004529117606580257, "global_step": 22592, "epoch": 189, "lr": 7.789491705785568e-05} +{"train_loss": 0.005060418508946896, "global_step": 22593, "epoch": 189, "lr": 7.789307835843384e-05} +{"train_loss": 0.004284655209630728, "global_step": 22594, "epoch": 189, "lr": 7.789123960424693e-05} +{"train_loss": 0.004135684575885534, "global_step": 22595, "epoch": 189, "lr": 7.788940079529856e-05} +{"train_loss": 0.0053734006360173225, "global_step": 22596, "epoch": 189, "lr": 7.788756193159232e-05} +{"train_loss": 0.0028899896424263716, "global_step": 22597, "epoch": 189, "lr": 7.788572301313183e-05} +{"train_loss": 0.004869304597377777, "global_step": 22598, "epoch": 189, "lr": 7.788388403992071e-05} +{"train_loss": 0.0072296797297894955, "global_step": 22599, "epoch": 189, "lr": 7.788204501196255e-05} +{"train_loss": 0.004134393762797117, "global_step": 22600, "epoch": 189, "lr": 7.788020592926097e-05} +{"train_loss": 0.00670787924900651, "global_step": 22601, "epoch": 189, "lr": 7.787836679181962e-05} +{"train_loss": 0.0031704024877399206, "global_step": 22602, "epoch": 189, "lr": 7.787652759964203e-05} +{"train_loss": 0.00344715709798038, "global_step": 22603, "epoch": 189, "lr": 7.787468835273188e-05} +{"train_loss": 0.005670040380209684, "global_step": 22604, "epoch": 189, "lr": 7.787284905109275e-05} +{"train_loss": 0.005472284741699696, "global_step": 22605, "epoch": 189, "lr": 7.787100969472827e-05} +{"train_loss": 0.0033825787249952555, "global_step": 22606, "epoch": 189, "lr": 7.786917028364203e-05} +{"train_loss": 0.004471729043871164, "global_step": 22607, "epoch": 189, "lr": 7.786733081783766e-05} +{"train_loss": 0.004023940768092871, "global_step": 22608, "epoch": 189, "lr": 7.786549129731875e-05} +{"train_loss": 0.004748250563245486, "global_step": 22609, "epoch": 189, "lr": 7.786365172208894e-05, "val_loss": 0.017175547778606415} +{"train_loss": 0.00496054720133543, "global_step": 22610, "epoch": 190, "lr": 7.78618120921518e-05} +{"train_loss": 0.003691118210554123, "global_step": 22611, "epoch": 190, "lr": 7.7859972407511e-05} +{"train_loss": 0.00455823540687561, "global_step": 22612, "epoch": 190, "lr": 7.785813266817011e-05} +{"train_loss": 0.0035498817451298237, "global_step": 22613, "epoch": 190, "lr": 7.785629287413275e-05} +{"train_loss": 0.005221004132181406, "global_step": 22614, "epoch": 190, "lr": 7.785445302540253e-05} +{"train_loss": 0.004714174196124077, "global_step": 22615, "epoch": 190, "lr": 7.785261312198307e-05} +{"train_loss": 0.0031003893818706274, "global_step": 22616, "epoch": 190, "lr": 7.7850773163878e-05} +{"train_loss": 0.003956548869609833, "global_step": 22617, "epoch": 190, "lr": 7.784893315109088e-05} +{"train_loss": 0.004314483143389225, "global_step": 22618, "epoch": 190, "lr": 7.784709308362536e-05} +{"train_loss": 0.004673911724239588, "global_step": 22619, "epoch": 190, "lr": 7.784525296148508e-05} +{"train_loss": 0.0056462069042027, "global_step": 22620, "epoch": 190, "lr": 7.78434127846736e-05} +{"train_loss": 0.004947200417518616, "global_step": 22621, "epoch": 190, "lr": 7.784157255319454e-05} +{"train_loss": 0.0038932079914957285, "global_step": 22622, "epoch": 190, "lr": 7.783973226705155e-05} +{"train_loss": 0.004577989690005779, "global_step": 22623, "epoch": 190, "lr": 7.78378919262482e-05} +{"train_loss": 0.005097946152091026, "global_step": 22624, "epoch": 190, "lr": 7.783605153078812e-05} +{"train_loss": 0.002998688956722617, "global_step": 22625, "epoch": 190, "lr": 7.783421108067494e-05} +{"train_loss": 0.004488085396587849, "global_step": 22626, "epoch": 190, "lr": 7.783237057591226e-05} +{"train_loss": 0.003416196210309863, "global_step": 22627, "epoch": 190, "lr": 7.78305300165037e-05} +{"train_loss": 0.003536087926477194, "global_step": 22628, "epoch": 190, "lr": 7.782868940245286e-05} +{"train_loss": 0.005822227336466312, "global_step": 22629, "epoch": 190, "lr": 7.782684873376336e-05} +{"train_loss": 0.0036691175773739815, "global_step": 22630, "epoch": 190, "lr": 7.782500801043881e-05} +{"train_loss": 0.0032587614841759205, "global_step": 22631, "epoch": 190, "lr": 7.782316723248284e-05} +{"train_loss": 0.0030533235985785723, "global_step": 22632, "epoch": 190, "lr": 7.782132639989905e-05} +{"train_loss": 0.0037070242688059807, "global_step": 22633, "epoch": 190, "lr": 7.781948551269107e-05} +{"train_loss": 0.0057299016043543816, "global_step": 22634, "epoch": 190, "lr": 7.781764457086248e-05} +{"train_loss": 0.002999025397002697, "global_step": 22635, "epoch": 190, "lr": 7.781580357441693e-05} +{"train_loss": 0.006319828797131777, "global_step": 22636, "epoch": 190, "lr": 7.781396252335802e-05} +{"train_loss": 0.004167507402598858, "global_step": 22637, "epoch": 190, "lr": 7.781212141768936e-05} +{"train_loss": 0.00584929995238781, "global_step": 22638, "epoch": 190, "lr": 7.781028025741457e-05} +{"train_loss": 0.0026511098258197308, "global_step": 22639, "epoch": 190, "lr": 7.780843904253727e-05} +{"train_loss": 0.005432761739939451, "global_step": 22640, "epoch": 190, "lr": 7.780659777306108e-05} +{"train_loss": 0.005894613452255726, "global_step": 22641, "epoch": 190, "lr": 7.780475644898959e-05} +{"train_loss": 0.007281616795808077, "global_step": 22642, "epoch": 190, "lr": 7.780291507032645e-05} +{"train_loss": 0.002984162885695696, "global_step": 22643, "epoch": 190, "lr": 7.780107363707523e-05} +{"train_loss": 0.004748533945530653, "global_step": 22644, "epoch": 190, "lr": 7.779923214923959e-05} +{"train_loss": 0.0031942480709403753, "global_step": 22645, "epoch": 190, "lr": 7.779739060682315e-05} +{"train_loss": 0.0032097711227834225, "global_step": 22646, "epoch": 190, "lr": 7.779554900982946e-05} +{"train_loss": 0.005088187288492918, "global_step": 22647, "epoch": 190, "lr": 7.779370735826219e-05} +{"train_loss": 0.004445447586476803, "global_step": 22648, "epoch": 190, "lr": 7.779186565212495e-05} +{"train_loss": 0.0034338952973484993, "global_step": 22649, "epoch": 190, "lr": 7.779002389142137e-05} +{"train_loss": 0.004384415689855814, "global_step": 22650, "epoch": 190, "lr": 7.778818207615501e-05} +{"train_loss": 0.00407025869935751, "global_step": 22651, "epoch": 190, "lr": 7.778634020632956e-05} +{"train_loss": 0.0038242756854742765, "global_step": 22652, "epoch": 190, "lr": 7.778449828194858e-05} +{"train_loss": 0.0037447651848196983, "global_step": 22653, "epoch": 190, "lr": 7.778265630301571e-05} +{"train_loss": 0.00530640734359622, "global_step": 22654, "epoch": 190, "lr": 7.778081426953456e-05} +{"train_loss": 0.0022275166120380163, "global_step": 22655, "epoch": 190, "lr": 7.777897218150874e-05} +{"train_loss": 0.004700162447988987, "global_step": 22656, "epoch": 190, "lr": 7.777713003894189e-05} +{"train_loss": 0.004833859391510487, "global_step": 22657, "epoch": 190, "lr": 7.777528784183762e-05} +{"train_loss": 0.006025646813213825, "global_step": 22658, "epoch": 190, "lr": 7.777344559019952e-05} +{"train_loss": 0.0036346842534840107, "global_step": 22659, "epoch": 190, "lr": 7.777160328403124e-05} +{"train_loss": 0.0032203332521021366, "global_step": 22660, "epoch": 190, "lr": 7.776976092333638e-05} +{"train_loss": 0.0029497186187654734, "global_step": 22661, "epoch": 190, "lr": 7.776791850811855e-05} +{"train_loss": 0.007392226718366146, "global_step": 22662, "epoch": 190, "lr": 7.77660760383814e-05} +{"train_loss": 0.0037588346749544144, "global_step": 22663, "epoch": 190, "lr": 7.776423351412852e-05} +{"train_loss": 0.004641054198145866, "global_step": 22664, "epoch": 190, "lr": 7.776239093536353e-05} +{"train_loss": 0.006370568182319403, "global_step": 22665, "epoch": 190, "lr": 7.776054830209004e-05} +{"train_loss": 0.006701735779643059, "global_step": 22666, "epoch": 190, "lr": 7.775870561431169e-05} +{"train_loss": 0.0027258964255452156, "global_step": 22667, "epoch": 190, "lr": 7.775686287203209e-05} +{"train_loss": 0.007410077378153801, "global_step": 22668, "epoch": 190, "lr": 7.775502007525484e-05} +{"train_loss": 0.003665025345981121, "global_step": 22669, "epoch": 190, "lr": 7.775317722398359e-05} +{"train_loss": 0.0035945517010986805, "global_step": 22670, "epoch": 190, "lr": 7.775133431822195e-05} +{"train_loss": 0.003804455976933241, "global_step": 22671, "epoch": 190, "lr": 7.774949135797352e-05} +{"train_loss": 0.003891656408086419, "global_step": 22672, "epoch": 190, "lr": 7.774764834324191e-05} +{"train_loss": 0.004875997081398964, "global_step": 22673, "epoch": 190, "lr": 7.774580527403077e-05} +{"train_loss": 0.0029141991399228573, "global_step": 22674, "epoch": 190, "lr": 7.774396215034371e-05} +{"train_loss": 0.0036029743496328592, "global_step": 22675, "epoch": 190, "lr": 7.774211897218435e-05} +{"train_loss": 0.005950403865426779, "global_step": 22676, "epoch": 190, "lr": 7.77402757395563e-05} +{"train_loss": 0.003233372699469328, "global_step": 22677, "epoch": 190, "lr": 7.773843245246316e-05} +{"train_loss": 0.0038030878640711308, "global_step": 22678, "epoch": 190, "lr": 7.77365891109086e-05} +{"train_loss": 0.003089927602559328, "global_step": 22679, "epoch": 190, "lr": 7.773474571489619e-05} +{"train_loss": 0.0043766130693256855, "global_step": 22680, "epoch": 190, "lr": 7.773290226442957e-05} +{"train_loss": 0.004121801350265741, "global_step": 22681, "epoch": 190, "lr": 7.773105875951237e-05} +{"train_loss": 0.004847116302698851, "global_step": 22682, "epoch": 190, "lr": 7.77292152001482e-05} +{"train_loss": 0.00400569336488843, "global_step": 22683, "epoch": 190, "lr": 7.772737158634067e-05} +{"train_loss": 0.00317809684202075, "global_step": 22684, "epoch": 190, "lr": 7.772552791809343e-05} +{"train_loss": 0.005286707542836666, "global_step": 22685, "epoch": 190, "lr": 7.772368419541005e-05} +{"train_loss": 0.004416330251842737, "global_step": 22686, "epoch": 190, "lr": 7.772184041829418e-05} +{"train_loss": 0.004573143552988768, "global_step": 22687, "epoch": 190, "lr": 7.771999658674945e-05} +{"train_loss": 0.0049296109937131405, "global_step": 22688, "epoch": 190, "lr": 7.771815270077946e-05} +{"train_loss": 0.003827905748039484, "global_step": 22689, "epoch": 190, "lr": 7.771630876038786e-05} +{"train_loss": 0.0044233831577003, "global_step": 22690, "epoch": 190, "lr": 7.771446476557823e-05} +{"train_loss": 0.005265051499009132, "global_step": 22691, "epoch": 190, "lr": 7.771262071635422e-05} +{"train_loss": 0.005276987329125404, "global_step": 22692, "epoch": 190, "lr": 7.771077661271942e-05} +{"train_loss": 0.0035382756032049656, "global_step": 22693, "epoch": 190, "lr": 7.770893245467747e-05} +{"train_loss": 0.003958453889936209, "global_step": 22694, "epoch": 190, "lr": 7.770708824223201e-05} +{"train_loss": 0.0031626643612980843, "global_step": 22695, "epoch": 190, "lr": 7.770524397538665e-05} +{"train_loss": 0.005764724221080542, "global_step": 22696, "epoch": 190, "lr": 7.770339965414498e-05} +{"train_loss": 0.00391226215288043, "global_step": 22697, "epoch": 190, "lr": 7.770155527851065e-05} +{"train_loss": 0.002653862815350294, "global_step": 22698, "epoch": 190, "lr": 7.769971084848728e-05} +{"train_loss": 0.004428392741829157, "global_step": 22699, "epoch": 190, "lr": 7.769786636407849e-05} +{"train_loss": 0.003671309445053339, "global_step": 22700, "epoch": 190, "lr": 7.769602182528788e-05} +{"train_loss": 0.002939582569524646, "global_step": 22701, "epoch": 190, "lr": 7.769417723211911e-05} +{"train_loss": 0.0038952261675149202, "global_step": 22702, "epoch": 190, "lr": 7.769233258457578e-05} +{"train_loss": 0.0040342919528484344, "global_step": 22703, "epoch": 190, "lr": 7.769048788266151e-05} +{"train_loss": 0.004482837859541178, "global_step": 22704, "epoch": 190, "lr": 7.768864312637993e-05} +{"train_loss": 0.003952726721763611, "global_step": 22705, "epoch": 190, "lr": 7.768679831573465e-05} +{"train_loss": 0.004224951379001141, "global_step": 22706, "epoch": 190, "lr": 7.768495345072931e-05} +{"train_loss": 0.005422665271908045, "global_step": 22707, "epoch": 190, "lr": 7.768310853136751e-05} +{"train_loss": 0.004499746952205896, "global_step": 22708, "epoch": 190, "lr": 7.768126355765288e-05} +{"train_loss": 0.004193026106804609, "global_step": 22709, "epoch": 190, "lr": 7.767941852958905e-05} +{"train_loss": 0.005580392200499773, "global_step": 22710, "epoch": 190, "lr": 7.767757344717966e-05} +{"train_loss": 0.004335395060479641, "global_step": 22711, "epoch": 190, "lr": 7.767572831042829e-05} +{"train_loss": 0.003810462774708867, "global_step": 22712, "epoch": 190, "lr": 7.767388311933858e-05} +{"train_loss": 0.004343860782682896, "global_step": 22713, "epoch": 190, "lr": 7.767203787391417e-05} +{"train_loss": 0.002746755722910166, "global_step": 22714, "epoch": 190, "lr": 7.767019257415867e-05} +{"train_loss": 0.0035064788535237312, "global_step": 22715, "epoch": 190, "lr": 7.76683472200757e-05} +{"train_loss": 0.005278864409774542, "global_step": 22716, "epoch": 190, "lr": 7.766650181166888e-05} +{"train_loss": 0.0032631526701152325, "global_step": 22717, "epoch": 190, "lr": 7.766465634894184e-05} +{"train_loss": 0.0035352197010070086, "global_step": 22718, "epoch": 190, "lr": 7.766281083189821e-05} +{"train_loss": 0.004604133311659098, "global_step": 22719, "epoch": 190, "lr": 7.766096526054158e-05} +{"train_loss": 0.003843862796202302, "global_step": 22720, "epoch": 190, "lr": 7.765911963487564e-05} +{"train_loss": 0.007189804222434759, "global_step": 22721, "epoch": 190, "lr": 7.765727395490396e-05} +{"train_loss": 0.0037657511420547962, "global_step": 22722, "epoch": 190, "lr": 7.765542822063017e-05} +{"train_loss": 0.002161004114896059, "global_step": 22723, "epoch": 190, "lr": 7.76535824320579e-05} +{"train_loss": 0.004599662031978369, "global_step": 22724, "epoch": 190, "lr": 7.765173658919078e-05} +{"train_loss": 0.005203080363571644, "global_step": 22725, "epoch": 190, "lr": 7.764989069203243e-05} +{"train_loss": 0.00253470940515399, "global_step": 22726, "epoch": 190, "lr": 7.764804474058648e-05} +{"train_loss": 0.0041286214254796505, "global_step": 22727, "epoch": 190, "lr": 7.764619873485653e-05} +{"train_loss": 0.004295975768140384, "global_step": 22728, "epoch": 190, "lr": 7.764435267484624e-05, "val_loss": 0.014957055449485779, "train_action_mse_error": 9.29059024201706e-05} +{"train_loss": 0.0045715998858213425, "global_step": 22729, "epoch": 191, "lr": 7.76425065605592e-05} +{"train_loss": 0.004125475883483887, "global_step": 22730, "epoch": 191, "lr": 7.764066039199907e-05} +{"train_loss": 0.004305458627641201, "global_step": 22731, "epoch": 191, "lr": 7.763881416916945e-05} +{"train_loss": 0.00409701419994235, "global_step": 22732, "epoch": 191, "lr": 7.763696789207397e-05} +{"train_loss": 0.0034628671128302813, "global_step": 22733, "epoch": 191, "lr": 7.763512156071626e-05} +{"train_loss": 0.006057631690055132, "global_step": 22734, "epoch": 191, "lr": 7.763327517509993e-05} +{"train_loss": 0.0038651854265481234, "global_step": 22735, "epoch": 191, "lr": 7.763142873522862e-05} +{"train_loss": 0.0033968195784837008, "global_step": 22736, "epoch": 191, "lr": 7.762958224110595e-05} +{"train_loss": 0.006321236956864595, "global_step": 22737, "epoch": 191, "lr": 7.762773569273555e-05} +{"train_loss": 0.003433272708207369, "global_step": 22738, "epoch": 191, "lr": 7.762588909012105e-05} +{"train_loss": 0.004187337122857571, "global_step": 22739, "epoch": 191, "lr": 7.762404243326606e-05} +{"train_loss": 0.0047109066508710384, "global_step": 22740, "epoch": 191, "lr": 7.762219572217422e-05} +{"train_loss": 0.0032944015692919493, "global_step": 22741, "epoch": 191, "lr": 7.762034895684914e-05} +{"train_loss": 0.0036423923447728157, "global_step": 22742, "epoch": 191, "lr": 7.761850213729447e-05} +{"train_loss": 0.007135105784982443, "global_step": 22743, "epoch": 191, "lr": 7.76166552635138e-05} +{"train_loss": 0.006347132381051779, "global_step": 22744, "epoch": 191, "lr": 7.76148083355108e-05} +{"train_loss": 0.0035864440724253654, "global_step": 22745, "epoch": 191, "lr": 7.761296135328906e-05} +{"train_loss": 0.004079865291714668, "global_step": 22746, "epoch": 191, "lr": 7.761111431685223e-05} +{"train_loss": 0.003143300535157323, "global_step": 22747, "epoch": 191, "lr": 7.760926722620391e-05} +{"train_loss": 0.0055147092789411545, "global_step": 22748, "epoch": 191, "lr": 7.760742008134776e-05} +{"train_loss": 0.002024995628744364, "global_step": 22749, "epoch": 191, "lr": 7.76055728822874e-05} +{"train_loss": 0.004664046689867973, "global_step": 22750, "epoch": 191, "lr": 7.760372562902642e-05} +{"train_loss": 0.004516264423727989, "global_step": 22751, "epoch": 191, "lr": 7.760187832156849e-05} +{"train_loss": 0.005662242416292429, "global_step": 22752, "epoch": 191, "lr": 7.760003095991721e-05} +{"train_loss": 0.007329350337386131, "global_step": 22753, "epoch": 191, "lr": 7.759818354407623e-05} +{"train_loss": 0.0029191134963184595, "global_step": 22754, "epoch": 191, "lr": 7.759633607404916e-05} +{"train_loss": 0.004588054958730936, "global_step": 22755, "epoch": 191, "lr": 7.759448854983962e-05} +{"train_loss": 0.006558672990649939, "global_step": 22756, "epoch": 191, "lr": 7.759264097145127e-05} +{"train_loss": 0.004373249597847462, "global_step": 22757, "epoch": 191, "lr": 7.75907933388877e-05} +{"train_loss": 0.005320505239069462, "global_step": 22758, "epoch": 191, "lr": 7.758894565215258e-05} +{"train_loss": 0.004115068353712559, "global_step": 22759, "epoch": 191, "lr": 7.758709791124949e-05} +{"train_loss": 0.004919663071632385, "global_step": 22760, "epoch": 191, "lr": 7.758525011618209e-05} +{"train_loss": 0.004098290111869574, "global_step": 22761, "epoch": 191, "lr": 7.758340226695399e-05} +{"train_loss": 0.007933598011732101, "global_step": 22762, "epoch": 191, "lr": 7.758155436356885e-05} +{"train_loss": 0.0049269795417785645, "global_step": 22763, "epoch": 191, "lr": 7.757970640603024e-05} +{"train_loss": 0.003427107585594058, "global_step": 22764, "epoch": 191, "lr": 7.757785839434185e-05} +{"train_loss": 0.003922032658010721, "global_step": 22765, "epoch": 191, "lr": 7.757601032850727e-05} +{"train_loss": 0.0030845212750136852, "global_step": 22766, "epoch": 191, "lr": 7.757416220853014e-05} +{"train_loss": 0.005481000058352947, "global_step": 22767, "epoch": 191, "lr": 7.757231403441408e-05} +{"train_loss": 0.004461114760488272, "global_step": 22768, "epoch": 191, "lr": 7.757046580616274e-05} +{"train_loss": 0.003110668621957302, "global_step": 22769, "epoch": 191, "lr": 7.756861752377972e-05} +{"train_loss": 0.004335543606430292, "global_step": 22770, "epoch": 191, "lr": 7.75667691872687e-05} +{"train_loss": 0.00467199319973588, "global_step": 22771, "epoch": 191, "lr": 7.756492079663324e-05} +{"train_loss": 0.004666367545723915, "global_step": 22772, "epoch": 191, "lr": 7.756307235187701e-05} +{"train_loss": 0.0058558424934744835, "global_step": 22773, "epoch": 191, "lr": 7.756122385300364e-05} +{"train_loss": 0.004254637286067009, "global_step": 22774, "epoch": 191, "lr": 7.755937530001675e-05} +{"train_loss": 0.005323321092873812, "global_step": 22775, "epoch": 191, "lr": 7.755752669291997e-05} +{"train_loss": 0.004245025105774403, "global_step": 22776, "epoch": 191, "lr": 7.755567803171693e-05} +{"train_loss": 0.0065190051682293415, "global_step": 22777, "epoch": 191, "lr": 7.755382931641125e-05} +{"train_loss": 0.006863257847726345, "global_step": 22778, "epoch": 191, "lr": 7.755198054700659e-05} +{"train_loss": 0.00452407356351614, "global_step": 22779, "epoch": 191, "lr": 7.755013172350653e-05} +{"train_loss": 0.004411264322698116, "global_step": 22780, "epoch": 191, "lr": 7.754828284591475e-05} +{"train_loss": 0.003951521590352058, "global_step": 22781, "epoch": 191, "lr": 7.754643391423486e-05} +{"train_loss": 0.004658447112888098, "global_step": 22782, "epoch": 191, "lr": 7.754458492847049e-05} +{"train_loss": 0.0036903738509863615, "global_step": 22783, "epoch": 191, "lr": 7.754273588862527e-05} +{"train_loss": 0.0053275884129107, "global_step": 22784, "epoch": 191, "lr": 7.754088679470282e-05} +{"train_loss": 0.0074739595875144005, "global_step": 22785, "epoch": 191, "lr": 7.75390376467068e-05} +{"train_loss": 0.004509748890995979, "global_step": 22786, "epoch": 191, "lr": 7.75371884446408e-05} +{"train_loss": 0.00528295524418354, "global_step": 22787, "epoch": 191, "lr": 7.753533918850848e-05} +{"train_loss": 0.0050394185818731785, "global_step": 22788, "epoch": 191, "lr": 7.753348987831348e-05} +{"train_loss": 0.006110598333179951, "global_step": 22789, "epoch": 191, "lr": 7.753164051405941e-05} +{"train_loss": 0.007808090187609196, "global_step": 22790, "epoch": 191, "lr": 7.75297910957499e-05} +{"train_loss": 0.00482204370200634, "global_step": 22791, "epoch": 191, "lr": 7.752794162338856e-05} +{"train_loss": 0.004109145142138004, "global_step": 22792, "epoch": 191, "lr": 7.752609209697908e-05} +{"train_loss": 0.004273438826203346, "global_step": 22793, "epoch": 191, "lr": 7.752424251652504e-05} +{"train_loss": 0.007983279414474964, "global_step": 22794, "epoch": 191, "lr": 7.75223928820301e-05} +{"train_loss": 0.004726733081042767, "global_step": 22795, "epoch": 191, "lr": 7.752054319349789e-05} +{"train_loss": 0.006419508717954159, "global_step": 22796, "epoch": 191, "lr": 7.751869345093202e-05} +{"train_loss": 0.0036574378609657288, "global_step": 22797, "epoch": 191, "lr": 7.751684365433614e-05} +{"train_loss": 0.005893411580473185, "global_step": 22798, "epoch": 191, "lr": 7.751499380371387e-05} +{"train_loss": 0.003957373555749655, "global_step": 22799, "epoch": 191, "lr": 7.751314389906886e-05} +{"train_loss": 0.005444405600428581, "global_step": 22800, "epoch": 191, "lr": 7.751129394040473e-05} +{"train_loss": 0.0027526647318154573, "global_step": 22801, "epoch": 191, "lr": 7.750944392772511e-05} +{"train_loss": 0.006650341674685478, "global_step": 22802, "epoch": 191, "lr": 7.750759386103363e-05} +{"train_loss": 0.006420621182769537, "global_step": 22803, "epoch": 191, "lr": 7.750574374033395e-05} +{"train_loss": 0.0037408913485705853, "global_step": 22804, "epoch": 191, "lr": 7.750389356562966e-05} +{"train_loss": 0.003975483123213053, "global_step": 22805, "epoch": 191, "lr": 7.750204333692441e-05} +{"train_loss": 0.0055538685992360115, "global_step": 22806, "epoch": 191, "lr": 7.750019305422185e-05} +{"train_loss": 0.004288641735911369, "global_step": 22807, "epoch": 191, "lr": 7.749834271752559e-05} +{"train_loss": 0.004852568730711937, "global_step": 22808, "epoch": 191, "lr": 7.749649232683928e-05} +{"train_loss": 0.0032777918968349695, "global_step": 22809, "epoch": 191, "lr": 7.749464188216655e-05} +{"train_loss": 0.0047840699553489685, "global_step": 22810, "epoch": 191, "lr": 7.7492791383511e-05} +{"train_loss": 0.0042601777240633965, "global_step": 22811, "epoch": 191, "lr": 7.749094083087632e-05} +{"train_loss": 0.006155785638839006, "global_step": 22812, "epoch": 191, "lr": 7.74890902242661e-05} +{"train_loss": 0.006125225685536861, "global_step": 22813, "epoch": 191, "lr": 7.7487239563684e-05} +{"train_loss": 0.005140330176800489, "global_step": 22814, "epoch": 191, "lr": 7.748538884913363e-05} +{"train_loss": 0.005481482017785311, "global_step": 22815, "epoch": 191, "lr": 7.748353808061865e-05} +{"train_loss": 0.005777949001640081, "global_step": 22816, "epoch": 191, "lr": 7.748168725814266e-05} +{"train_loss": 0.0029075532220304012, "global_step": 22817, "epoch": 191, "lr": 7.747983638170933e-05} +{"train_loss": 0.005257418379187584, "global_step": 22818, "epoch": 191, "lr": 7.747798545132226e-05} +{"train_loss": 0.005339405499398708, "global_step": 22819, "epoch": 191, "lr": 7.747613446698511e-05} +{"train_loss": 0.004668745677918196, "global_step": 22820, "epoch": 191, "lr": 7.747428342870151e-05} +{"train_loss": 0.005364938639104366, "global_step": 22821, "epoch": 191, "lr": 7.74724323364751e-05} +{"train_loss": 0.005349704995751381, "global_step": 22822, "epoch": 191, "lr": 7.747058119030948e-05} +{"train_loss": 0.006397987250238657, "global_step": 22823, "epoch": 191, "lr": 7.746872999020831e-05} +{"train_loss": 0.005263456143438816, "global_step": 22824, "epoch": 191, "lr": 7.746687873617524e-05} +{"train_loss": 0.0028750270139425993, "global_step": 22825, "epoch": 191, "lr": 7.746502742821388e-05} +{"train_loss": 0.0062614320777356625, "global_step": 22826, "epoch": 191, "lr": 7.746317606632787e-05} +{"train_loss": 0.005985344294458628, "global_step": 22827, "epoch": 191, "lr": 7.746132465052084e-05} +{"train_loss": 0.004656690638512373, "global_step": 22828, "epoch": 191, "lr": 7.745947318079644e-05} +{"train_loss": 0.003918736707419157, "global_step": 22829, "epoch": 191, "lr": 7.745762165715831e-05} +{"train_loss": 0.0035520929377526045, "global_step": 22830, "epoch": 191, "lr": 7.745577007961007e-05} +{"train_loss": 0.004150012042373419, "global_step": 22831, "epoch": 191, "lr": 7.745391844815534e-05} +{"train_loss": 0.004070165567100048, "global_step": 22832, "epoch": 191, "lr": 7.74520667627978e-05} +{"train_loss": 0.005471635144203901, "global_step": 22833, "epoch": 191, "lr": 7.745021502354104e-05} +{"train_loss": 0.005699648056179285, "global_step": 22834, "epoch": 191, "lr": 7.744836323038873e-05} +{"train_loss": 0.004521859344094992, "global_step": 22835, "epoch": 191, "lr": 7.744651138334447e-05} +{"train_loss": 0.005267223808914423, "global_step": 22836, "epoch": 191, "lr": 7.744465948241193e-05} +{"train_loss": 0.0025720116682350636, "global_step": 22837, "epoch": 191, "lr": 7.744280752759474e-05} +{"train_loss": 0.008274050429463387, "global_step": 22838, "epoch": 191, "lr": 7.744095551889651e-05} +{"train_loss": 0.0041252668015658855, "global_step": 22839, "epoch": 191, "lr": 7.743910345632093e-05} +{"train_loss": 0.004304044879972935, "global_step": 22840, "epoch": 191, "lr": 7.743725133987157e-05} +{"train_loss": 0.007146781776100397, "global_step": 22841, "epoch": 191, "lr": 7.743539916955211e-05} +{"train_loss": 0.004635663703083992, "global_step": 22842, "epoch": 191, "lr": 7.743354694536617e-05} +{"train_loss": 0.006489624734967947, "global_step": 22843, "epoch": 191, "lr": 7.74316946673174e-05} +{"train_loss": 0.0038984029088169336, "global_step": 22844, "epoch": 191, "lr": 7.742984233540942e-05} +{"train_loss": 0.0028119636699557304, "global_step": 22845, "epoch": 191, "lr": 7.742798994964589e-05} +{"train_loss": 0.008793632499873638, "global_step": 22846, "epoch": 191, "lr": 7.742613751003042e-05} +{"train_loss": 0.004875877361447245, "global_step": 22847, "epoch": 191, "lr": 7.742428501656666e-05, "val_loss": 0.009408722631633282} +{"train_loss": 0.004789367318153381, "global_step": 22848, "epoch": 192, "lr": 7.742243246925825e-05} +{"train_loss": 0.00532962242141366, "global_step": 22849, "epoch": 192, "lr": 7.74205798681088e-05} +{"train_loss": 0.0066908253356814384, "global_step": 22850, "epoch": 192, "lr": 7.7418727213122e-05} +{"train_loss": 0.004412271082401276, "global_step": 22851, "epoch": 192, "lr": 7.741687450430144e-05} +{"train_loss": 0.004752093460410833, "global_step": 22852, "epoch": 192, "lr": 7.741502174165079e-05} +{"train_loss": 0.0029131791088730097, "global_step": 22853, "epoch": 192, "lr": 7.741316892517367e-05} +{"train_loss": 0.005502425599843264, "global_step": 22854, "epoch": 192, "lr": 7.74113160548737e-05} +{"train_loss": 0.003964800387620926, "global_step": 22855, "epoch": 192, "lr": 7.740946313075456e-05} +{"train_loss": 0.00539062824100256, "global_step": 22856, "epoch": 192, "lr": 7.740761015281987e-05} +{"train_loss": 0.0064398725517094135, "global_step": 22857, "epoch": 192, "lr": 7.740575712107327e-05} +{"train_loss": 0.004913114942610264, "global_step": 22858, "epoch": 192, "lr": 7.740390403551838e-05} +{"train_loss": 0.007282937411218882, "global_step": 22859, "epoch": 192, "lr": 7.740205089615886e-05} +{"train_loss": 0.0053533934988081455, "global_step": 22860, "epoch": 192, "lr": 7.740019770299834e-05} +{"train_loss": 0.004352254793047905, "global_step": 22861, "epoch": 192, "lr": 7.739834445604047e-05} +{"train_loss": 0.003839575918391347, "global_step": 22862, "epoch": 192, "lr": 7.739649115528885e-05} +{"train_loss": 0.004443216137588024, "global_step": 22863, "epoch": 192, "lr": 7.739463780074716e-05} +{"train_loss": 0.007030203007161617, "global_step": 22864, "epoch": 192, "lr": 7.739278439241904e-05} +{"train_loss": 0.0030001269187778234, "global_step": 22865, "epoch": 192, "lr": 7.739093093030809e-05} +{"train_loss": 0.0024501970037817955, "global_step": 22866, "epoch": 192, "lr": 7.738907741441799e-05} +{"train_loss": 0.004319837316870689, "global_step": 22867, "epoch": 192, "lr": 7.738722384475234e-05} +{"train_loss": 0.005235669203102589, "global_step": 22868, "epoch": 192, "lr": 7.738537022131482e-05} +{"train_loss": 0.003742384724318981, "global_step": 22869, "epoch": 192, "lr": 7.738351654410904e-05} +{"train_loss": 0.003944900818169117, "global_step": 22870, "epoch": 192, "lr": 7.738166281313868e-05} +{"train_loss": 0.004999781493097544, "global_step": 22871, "epoch": 192, "lr": 7.737980902840733e-05} +{"train_loss": 0.0040329755283892155, "global_step": 22872, "epoch": 192, "lr": 7.737795518991866e-05} +{"train_loss": 0.0032405985984951258, "global_step": 22873, "epoch": 192, "lr": 7.737610129767629e-05} +{"train_loss": 0.0028478307649493217, "global_step": 22874, "epoch": 192, "lr": 7.737424735168386e-05} +{"train_loss": 0.0040794480592012405, "global_step": 22875, "epoch": 192, "lr": 7.737239335194504e-05} +{"train_loss": 0.003310582134872675, "global_step": 22876, "epoch": 192, "lr": 7.737053929846343e-05} +{"train_loss": 0.003736632177606225, "global_step": 22877, "epoch": 192, "lr": 7.73686851912427e-05} +{"train_loss": 0.003797107143327594, "global_step": 22878, "epoch": 192, "lr": 7.736683103028647e-05} +{"train_loss": 0.003588056191802025, "global_step": 22879, "epoch": 192, "lr": 7.736497681559842e-05} +{"train_loss": 0.004095550626516342, "global_step": 22880, "epoch": 192, "lr": 7.736312254718214e-05} +{"train_loss": 0.004974039737135172, "global_step": 22881, "epoch": 192, "lr": 7.736126822504129e-05} +{"train_loss": 0.005171698983758688, "global_step": 22882, "epoch": 192, "lr": 7.735941384917952e-05} +{"train_loss": 0.004086803644895554, "global_step": 22883, "epoch": 192, "lr": 7.735755941960047e-05} +{"train_loss": 0.0023646398913115263, "global_step": 22884, "epoch": 192, "lr": 7.735570493630777e-05} +{"train_loss": 0.006681641563773155, "global_step": 22885, "epoch": 192, "lr": 7.735385039930505e-05} +{"train_loss": 0.003921946510672569, "global_step": 22886, "epoch": 192, "lr": 7.7351995808596e-05} +{"train_loss": 0.0035900718066841364, "global_step": 22887, "epoch": 192, "lr": 7.735014116418419e-05} +{"train_loss": 0.006079043727368116, "global_step": 22888, "epoch": 192, "lr": 7.734828646607332e-05} +{"train_loss": 0.004254558123648167, "global_step": 22889, "epoch": 192, "lr": 7.734643171426702e-05} +{"train_loss": 0.0036480589769780636, "global_step": 22890, "epoch": 192, "lr": 7.734457690876891e-05} +{"train_loss": 0.003737532766535878, "global_step": 22891, "epoch": 192, "lr": 7.734272204958265e-05} +{"train_loss": 0.005365482531487942, "global_step": 22892, "epoch": 192, "lr": 7.734086713671187e-05} +{"train_loss": 0.005662140902131796, "global_step": 22893, "epoch": 192, "lr": 7.733901217016022e-05} +{"train_loss": 0.003929055295884609, "global_step": 22894, "epoch": 192, "lr": 7.733715714993135e-05} +{"train_loss": 0.0032641447614878416, "global_step": 22895, "epoch": 192, "lr": 7.733530207602888e-05} +{"train_loss": 0.0026218248531222343, "global_step": 22896, "epoch": 192, "lr": 7.733344694845648e-05} +{"train_loss": 0.004532046616077423, "global_step": 22897, "epoch": 192, "lr": 7.733159176721776e-05} +{"train_loss": 0.00701477937400341, "global_step": 22898, "epoch": 192, "lr": 7.732973653231638e-05} +{"train_loss": 0.004022588022053242, "global_step": 22899, "epoch": 192, "lr": 7.7327881243756e-05} +{"train_loss": 0.0033267501275986433, "global_step": 22900, "epoch": 192, "lr": 7.732602590154023e-05} +{"train_loss": 0.004502600058913231, "global_step": 22901, "epoch": 192, "lr": 7.732417050567273e-05} +{"train_loss": 0.005107968579977751, "global_step": 22902, "epoch": 192, "lr": 7.732231505615715e-05} +{"train_loss": 0.005616158712655306, "global_step": 22903, "epoch": 192, "lr": 7.732045955299711e-05} +{"train_loss": 0.004961864557117224, "global_step": 22904, "epoch": 192, "lr": 7.731860399619626e-05} +{"train_loss": 0.004685806576162577, "global_step": 22905, "epoch": 192, "lr": 7.731674838575826e-05} +{"train_loss": 0.0019069850677624345, "global_step": 22906, "epoch": 192, "lr": 7.731489272168675e-05} +{"train_loss": 0.006555304396897554, "global_step": 22907, "epoch": 192, "lr": 7.731303700398536e-05} +{"train_loss": 0.0062531582079827785, "global_step": 22908, "epoch": 192, "lr": 7.731118123265774e-05} +{"train_loss": 0.003113273996859789, "global_step": 22909, "epoch": 192, "lr": 7.730932540770752e-05} +{"train_loss": 0.003017986658960581, "global_step": 22910, "epoch": 192, "lr": 7.730746952913837e-05} +{"train_loss": 0.00548388110473752, "global_step": 22911, "epoch": 192, "lr": 7.730561359695393e-05} +{"train_loss": 0.004107447806745768, "global_step": 22912, "epoch": 192, "lr": 7.730375761115782e-05} +{"train_loss": 0.0035547076258808374, "global_step": 22913, "epoch": 192, "lr": 7.73019015717537e-05} +{"train_loss": 0.003956866450607777, "global_step": 22914, "epoch": 192, "lr": 7.730004547874524e-05} +{"train_loss": 0.006305140908807516, "global_step": 22915, "epoch": 192, "lr": 7.729818933213602e-05} +{"train_loss": 0.0053772395476698875, "global_step": 22916, "epoch": 192, "lr": 7.729633313192974e-05} +{"train_loss": 0.005011554341763258, "global_step": 22917, "epoch": 192, "lr": 7.729447687813002e-05} +{"train_loss": 0.004383016377687454, "global_step": 22918, "epoch": 192, "lr": 7.729262057074051e-05} +{"train_loss": 0.00634743319824338, "global_step": 22919, "epoch": 192, "lr": 7.729076420976486e-05} +{"train_loss": 0.004324393346905708, "global_step": 22920, "epoch": 192, "lr": 7.728890779520672e-05} +{"train_loss": 0.004029699135571718, "global_step": 22921, "epoch": 192, "lr": 7.72870513270697e-05} +{"train_loss": 0.005680480506271124, "global_step": 22922, "epoch": 192, "lr": 7.72851948053575e-05} +{"train_loss": 0.005084475036710501, "global_step": 22923, "epoch": 192, "lr": 7.728333823007371e-05} +{"train_loss": 0.003453474026173353, "global_step": 22924, "epoch": 192, "lr": 7.7281481601222e-05} +{"train_loss": 0.005383801180869341, "global_step": 22925, "epoch": 192, "lr": 7.727962491880602e-05} +{"train_loss": 0.003449697745963931, "global_step": 22926, "epoch": 192, "lr": 7.727776818282943e-05} +{"train_loss": 0.004788153804838657, "global_step": 22927, "epoch": 192, "lr": 7.727591139329584e-05} +{"train_loss": 0.004452666733413935, "global_step": 22928, "epoch": 192, "lr": 7.72740545502089e-05} +{"train_loss": 0.005199159029871225, "global_step": 22929, "epoch": 192, "lr": 7.72721976535723e-05} +{"train_loss": 0.004850552882999182, "global_step": 22930, "epoch": 192, "lr": 7.727034070338964e-05} +{"train_loss": 0.006263198796659708, "global_step": 22931, "epoch": 192, "lr": 7.726848369966456e-05} +{"train_loss": 0.005474775098264217, "global_step": 22932, "epoch": 192, "lr": 7.726662664240075e-05} +{"train_loss": 0.0038492518942803144, "global_step": 22933, "epoch": 192, "lr": 7.726476953160182e-05} +{"train_loss": 0.0031563551165163517, "global_step": 22934, "epoch": 192, "lr": 7.726291236727142e-05} +{"train_loss": 0.005346708465367556, "global_step": 22935, "epoch": 192, "lr": 7.726105514941323e-05} +{"train_loss": 0.007291587069630623, "global_step": 22936, "epoch": 192, "lr": 7.725919787803084e-05} +{"train_loss": 0.004233849234879017, "global_step": 22937, "epoch": 192, "lr": 7.725734055312794e-05} +{"train_loss": 0.0029815935995429754, "global_step": 22938, "epoch": 192, "lr": 7.725548317470816e-05} +{"train_loss": 0.006214733701199293, "global_step": 22939, "epoch": 192, "lr": 7.725362574277516e-05} +{"train_loss": 0.005693951155990362, "global_step": 22940, "epoch": 192, "lr": 7.725176825733258e-05} +{"train_loss": 0.003356918692588806, "global_step": 22941, "epoch": 192, "lr": 7.724991071838405e-05} +{"train_loss": 0.004185662139207125, "global_step": 22942, "epoch": 192, "lr": 7.724805312593323e-05} +{"train_loss": 0.0032598685938864946, "global_step": 22943, "epoch": 192, "lr": 7.724619547998379e-05} +{"train_loss": 0.003961978014558554, "global_step": 22944, "epoch": 192, "lr": 7.724433778053933e-05} +{"train_loss": 0.007137828506529331, "global_step": 22945, "epoch": 192, "lr": 7.724248002760355e-05} +{"train_loss": 0.0027330094017088413, "global_step": 22946, "epoch": 192, "lr": 7.724062222118006e-05} +{"train_loss": 0.0036501598078757524, "global_step": 22947, "epoch": 192, "lr": 7.723876436127251e-05} +{"train_loss": 0.00876244343817234, "global_step": 22948, "epoch": 192, "lr": 7.723690644788457e-05} +{"train_loss": 0.003177535953000188, "global_step": 22949, "epoch": 192, "lr": 7.723504848101986e-05} +{"train_loss": 0.005765536334365606, "global_step": 22950, "epoch": 192, "lr": 7.723319046068205e-05} +{"train_loss": 0.005822767503559589, "global_step": 22951, "epoch": 192, "lr": 7.723133238687477e-05} +{"train_loss": 0.003157744649797678, "global_step": 22952, "epoch": 192, "lr": 7.72294742596017e-05} +{"train_loss": 0.0037060840986669064, "global_step": 22953, "epoch": 192, "lr": 7.722761607886645e-05} +{"train_loss": 0.004784026648849249, "global_step": 22954, "epoch": 192, "lr": 7.722575784467268e-05} +{"train_loss": 0.00587724382057786, "global_step": 22955, "epoch": 192, "lr": 7.722389955702405e-05} +{"train_loss": 0.003779958002269268, "global_step": 22956, "epoch": 192, "lr": 7.72220412159242e-05} +{"train_loss": 0.004664594307541847, "global_step": 22957, "epoch": 192, "lr": 7.72201828213768e-05} +{"train_loss": 0.003601968288421631, "global_step": 22958, "epoch": 192, "lr": 7.721832437338546e-05} +{"train_loss": 0.00452440558001399, "global_step": 22959, "epoch": 192, "lr": 7.721646587195383e-05} +{"train_loss": 0.003721611574292183, "global_step": 22960, "epoch": 192, "lr": 7.72146073170856e-05} +{"train_loss": 0.005450052209198475, "global_step": 22961, "epoch": 192, "lr": 7.72127487087844e-05} +{"train_loss": 0.006365648005157709, "global_step": 22962, "epoch": 192, "lr": 7.721089004705387e-05} +{"train_loss": 0.0030336349736899137, "global_step": 22963, "epoch": 192, "lr": 7.720903133189765e-05} +{"train_loss": 0.005796648096293211, "global_step": 22964, "epoch": 192, "lr": 7.720717256331944e-05} +{"train_loss": 0.0044340649619698524, "global_step": 22965, "epoch": 192, "lr": 7.720531374132282e-05} +{"train_loss": 0.004598397193202639, "global_step": 22966, "epoch": 192, "lr": 7.720345486591147e-05, "val_loss": 0.015622884035110474} +{"train_loss": 0.00662922253832221, "global_step": 22967, "epoch": 193, "lr": 7.720159593708907e-05} +{"train_loss": 0.004356316290795803, "global_step": 22968, "epoch": 193, "lr": 7.719973695485923e-05} +{"train_loss": 0.005714176222681999, "global_step": 22969, "epoch": 193, "lr": 7.71978779192256e-05} +{"train_loss": 0.0031197848729789257, "global_step": 22970, "epoch": 193, "lr": 7.719601883019185e-05} +{"train_loss": 0.0067758415825665, "global_step": 22971, "epoch": 193, "lr": 7.719415968776162e-05} +{"train_loss": 0.0060548242181539536, "global_step": 22972, "epoch": 193, "lr": 7.719230049193857e-05} +{"train_loss": 0.00299456506036222, "global_step": 22973, "epoch": 193, "lr": 7.719044124272634e-05} +{"train_loss": 0.0036932628136128187, "global_step": 22974, "epoch": 193, "lr": 7.718858194012859e-05} +{"train_loss": 0.003271038644015789, "global_step": 22975, "epoch": 193, "lr": 7.718672258414896e-05} +{"train_loss": 0.004787802696228027, "global_step": 22976, "epoch": 193, "lr": 7.71848631747911e-05} +{"train_loss": 0.004995936062186956, "global_step": 22977, "epoch": 193, "lr": 7.718300371205866e-05} +{"train_loss": 0.005217309575527906, "global_step": 22978, "epoch": 193, "lr": 7.718114419595531e-05} +{"train_loss": 0.0038172362837940454, "global_step": 22979, "epoch": 193, "lr": 7.717928462648468e-05} +{"train_loss": 0.005705041810870171, "global_step": 22980, "epoch": 193, "lr": 7.717742500365043e-05} +{"train_loss": 0.005572149530053139, "global_step": 22981, "epoch": 193, "lr": 7.717556532745621e-05} +{"train_loss": 0.004551899619400501, "global_step": 22982, "epoch": 193, "lr": 7.717370559790567e-05} +{"train_loss": 0.005291398148983717, "global_step": 22983, "epoch": 193, "lr": 7.717184581500248e-05} +{"train_loss": 0.004469027742743492, "global_step": 22984, "epoch": 193, "lr": 7.716998597875024e-05} +{"train_loss": 0.002609355142340064, "global_step": 22985, "epoch": 193, "lr": 7.716812608915265e-05} +{"train_loss": 0.004434257745742798, "global_step": 22986, "epoch": 193, "lr": 7.716626614621336e-05} +{"train_loss": 0.0043843407183885574, "global_step": 22987, "epoch": 193, "lr": 7.716440614993598e-05} +{"train_loss": 0.004297708161175251, "global_step": 22988, "epoch": 193, "lr": 7.716254610032421e-05} +{"train_loss": 0.004256023094058037, "global_step": 22989, "epoch": 193, "lr": 7.716068599738169e-05} +{"train_loss": 0.004595532082021236, "global_step": 22990, "epoch": 193, "lr": 7.715882584111204e-05} +{"train_loss": 0.0026635604444891214, "global_step": 22991, "epoch": 193, "lr": 7.715696563151895e-05} +{"train_loss": 0.00389291625469923, "global_step": 22992, "epoch": 193, "lr": 7.715510536860607e-05} +{"train_loss": 0.004048189148306847, "global_step": 22993, "epoch": 193, "lr": 7.715324505237703e-05} +{"train_loss": 0.0031302706338465214, "global_step": 22994, "epoch": 193, "lr": 7.715138468283549e-05} +{"train_loss": 0.007007403299212456, "global_step": 22995, "epoch": 193, "lr": 7.714952425998512e-05} +{"train_loss": 0.003263721475377679, "global_step": 22996, "epoch": 193, "lr": 7.714766378382956e-05} +{"train_loss": 0.00271785375662148, "global_step": 22997, "epoch": 193, "lr": 7.714580325437245e-05} +{"train_loss": 0.002881614724174142, "global_step": 22998, "epoch": 193, "lr": 7.714394267161746e-05} +{"train_loss": 0.003991665318608284, "global_step": 22999, "epoch": 193, "lr": 7.714208203556824e-05} +{"train_loss": 0.005378409754484892, "global_step": 23000, "epoch": 193, "lr": 7.714022134622845e-05} +{"train_loss": 0.004311834461987019, "global_step": 23001, "epoch": 193, "lr": 7.713836060360171e-05} +{"train_loss": 0.007657077629119158, "global_step": 23002, "epoch": 193, "lr": 7.713649980769174e-05} +{"train_loss": 0.003633924527093768, "global_step": 23003, "epoch": 193, "lr": 7.713463895850211e-05} +{"train_loss": 0.005136646330356598, "global_step": 23004, "epoch": 193, "lr": 7.713277805603654e-05} +{"train_loss": 0.00487293116748333, "global_step": 23005, "epoch": 193, "lr": 7.713091710029865e-05} +{"train_loss": 0.004187276121228933, "global_step": 23006, "epoch": 193, "lr": 7.712905609129209e-05} +{"train_loss": 0.00450008874759078, "global_step": 23007, "epoch": 193, "lr": 7.712719502902054e-05} +{"train_loss": 0.005613102577626705, "global_step": 23008, "epoch": 193, "lr": 7.712533391348766e-05} +{"train_loss": 0.006652000825852156, "global_step": 23009, "epoch": 193, "lr": 7.712347274469705e-05} +{"train_loss": 0.003940485883504152, "global_step": 23010, "epoch": 193, "lr": 7.712161152265243e-05} +{"train_loss": 0.006394061725586653, "global_step": 23011, "epoch": 193, "lr": 7.711975024735741e-05} +{"train_loss": 0.004833756014704704, "global_step": 23012, "epoch": 193, "lr": 7.711788891881564e-05} +{"train_loss": 0.004656639881432056, "global_step": 23013, "epoch": 193, "lr": 7.71160275370308e-05} +{"train_loss": 0.005090536084026098, "global_step": 23014, "epoch": 193, "lr": 7.711416610200656e-05} +{"train_loss": 0.005788100883364677, "global_step": 23015, "epoch": 193, "lr": 7.711230461374652e-05} +{"train_loss": 0.004752943757921457, "global_step": 23016, "epoch": 193, "lr": 7.71104430722544e-05} +{"train_loss": 0.0036481949500739574, "global_step": 23017, "epoch": 193, "lr": 7.710858147753379e-05} +{"train_loss": 0.003125221701338887, "global_step": 23018, "epoch": 193, "lr": 7.71067198295884e-05} +{"train_loss": 0.002925681648775935, "global_step": 23019, "epoch": 193, "lr": 7.710485812842185e-05} +{"train_loss": 0.004350610077381134, "global_step": 23020, "epoch": 193, "lr": 7.71029963740378e-05} +{"train_loss": 0.004416074603796005, "global_step": 23021, "epoch": 193, "lr": 7.710113456643992e-05} +{"train_loss": 0.0036708826664835215, "global_step": 23022, "epoch": 193, "lr": 7.709927270563187e-05} +{"train_loss": 0.0047449073754251, "global_step": 23023, "epoch": 193, "lr": 7.709741079161727e-05} +{"train_loss": 0.00567189184948802, "global_step": 23024, "epoch": 193, "lr": 7.709554882439982e-05} +{"train_loss": 0.005116939544677734, "global_step": 23025, "epoch": 193, "lr": 7.709368680398314e-05} +{"train_loss": 0.004704912658780813, "global_step": 23026, "epoch": 193, "lr": 7.709182473037091e-05} +{"train_loss": 0.002686804858967662, "global_step": 23027, "epoch": 193, "lr": 7.708996260356678e-05} +{"train_loss": 0.004256607033312321, "global_step": 23028, "epoch": 193, "lr": 7.70881004235744e-05} +{"train_loss": 0.005203736014664173, "global_step": 23029, "epoch": 193, "lr": 7.70862381903974e-05} +{"train_loss": 0.005253341980278492, "global_step": 23030, "epoch": 193, "lr": 7.70843759040395e-05} +{"train_loss": 0.002849592361599207, "global_step": 23031, "epoch": 193, "lr": 7.708251356450431e-05} +{"train_loss": 0.004664394538849592, "global_step": 23032, "epoch": 193, "lr": 7.70806511717955e-05} +{"train_loss": 0.0048115449026227, "global_step": 23033, "epoch": 193, "lr": 7.707878872591671e-05} +{"train_loss": 0.005193221382796764, "global_step": 23034, "epoch": 193, "lr": 7.707692622687164e-05} +{"train_loss": 0.0049386946484446526, "global_step": 23035, "epoch": 193, "lr": 7.707506367466389e-05} +{"train_loss": 0.006691514514386654, "global_step": 23036, "epoch": 193, "lr": 7.707320106929716e-05} +{"train_loss": 0.0038540104869753122, "global_step": 23037, "epoch": 193, "lr": 7.707133841077508e-05} +{"train_loss": 0.006420921068638563, "global_step": 23038, "epoch": 193, "lr": 7.706947569910133e-05} +{"train_loss": 0.0061544268392026424, "global_step": 23039, "epoch": 193, "lr": 7.706761293427956e-05} +{"train_loss": 0.004158116411417723, "global_step": 23040, "epoch": 193, "lr": 7.706575011631342e-05} +{"train_loss": 0.005958193447440863, "global_step": 23041, "epoch": 193, "lr": 7.706388724520656e-05} +{"train_loss": 0.0048335543833673, "global_step": 23042, "epoch": 193, "lr": 7.706202432096266e-05} +{"train_loss": 0.003911894746124744, "global_step": 23043, "epoch": 193, "lr": 7.706016134358537e-05} +{"train_loss": 0.003944693598896265, "global_step": 23044, "epoch": 193, "lr": 7.705829831307833e-05} +{"train_loss": 0.0035293065011501312, "global_step": 23045, "epoch": 193, "lr": 7.705643522944522e-05} +{"train_loss": 0.006311587058007717, "global_step": 23046, "epoch": 193, "lr": 7.705457209268969e-05} +{"train_loss": 0.004530447069555521, "global_step": 23047, "epoch": 193, "lr": 7.70527089028154e-05} +{"train_loss": 0.0046752095222473145, "global_step": 23048, "epoch": 193, "lr": 7.705084565982601e-05} +{"train_loss": 0.004609973635524511, "global_step": 23049, "epoch": 193, "lr": 7.704898236372518e-05} +{"train_loss": 0.0029616341926157475, "global_step": 23050, "epoch": 193, "lr": 7.704711901451653e-05} +{"train_loss": 0.003954010549932718, "global_step": 23051, "epoch": 193, "lr": 7.704525561220379e-05} +{"train_loss": 0.004080628044903278, "global_step": 23052, "epoch": 193, "lr": 7.704339215679056e-05} +{"train_loss": 0.005679533816874027, "global_step": 23053, "epoch": 193, "lr": 7.704152864828053e-05} +{"train_loss": 0.00508243078365922, "global_step": 23054, "epoch": 193, "lr": 7.703966508667732e-05} +{"train_loss": 0.006189520005136728, "global_step": 23055, "epoch": 193, "lr": 7.703780147198465e-05} +{"train_loss": 0.003824374405667186, "global_step": 23056, "epoch": 193, "lr": 7.703593780420613e-05} +{"train_loss": 0.003931751474738121, "global_step": 23057, "epoch": 193, "lr": 7.703407408334544e-05} +{"train_loss": 0.0053757489658892155, "global_step": 23058, "epoch": 193, "lr": 7.703221030940623e-05} +{"train_loss": 0.006121567916125059, "global_step": 23059, "epoch": 193, "lr": 7.703034648239216e-05} +{"train_loss": 0.0031930969562381506, "global_step": 23060, "epoch": 193, "lr": 7.70284826023069e-05} +{"train_loss": 0.005213561002165079, "global_step": 23061, "epoch": 193, "lr": 7.702661866915408e-05} +{"train_loss": 0.0045610773377120495, "global_step": 23062, "epoch": 193, "lr": 7.70247546829374e-05} +{"train_loss": 0.005684496834874153, "global_step": 23063, "epoch": 193, "lr": 7.70228906436605e-05} +{"train_loss": 0.0052138944156467915, "global_step": 23064, "epoch": 193, "lr": 7.702102655132705e-05} +{"train_loss": 0.0033370826859027147, "global_step": 23065, "epoch": 193, "lr": 7.70191624059407e-05} +{"train_loss": 0.004150742664933205, "global_step": 23066, "epoch": 193, "lr": 7.70172982075051e-05} +{"train_loss": 0.003621035488322377, "global_step": 23067, "epoch": 193, "lr": 7.701543395602391e-05} +{"train_loss": 0.0035446947440505028, "global_step": 23068, "epoch": 193, "lr": 7.701356965150083e-05} +{"train_loss": 0.004619871266186237, "global_step": 23069, "epoch": 193, "lr": 7.701170529393946e-05} +{"train_loss": 0.004448217339813709, "global_step": 23070, "epoch": 193, "lr": 7.700984088334351e-05} +{"train_loss": 0.005007988773286343, "global_step": 23071, "epoch": 193, "lr": 7.700797641971665e-05} +{"train_loss": 0.005068653728812933, "global_step": 23072, "epoch": 193, "lr": 7.700611190306249e-05} +{"train_loss": 0.003895637346431613, "global_step": 23073, "epoch": 193, "lr": 7.70042473333847e-05} +{"train_loss": 0.004310435149818659, "global_step": 23074, "epoch": 193, "lr": 7.700238271068696e-05} +{"train_loss": 0.005497343372553587, "global_step": 23075, "epoch": 193, "lr": 7.700051803497294e-05} +{"train_loss": 0.004687688313424587, "global_step": 23076, "epoch": 193, "lr": 7.699865330624627e-05} +{"train_loss": 0.005161796696484089, "global_step": 23077, "epoch": 193, "lr": 7.699678852451065e-05} +{"train_loss": 0.004411762580275536, "global_step": 23078, "epoch": 193, "lr": 7.699492368976972e-05} +{"train_loss": 0.00557528343051672, "global_step": 23079, "epoch": 193, "lr": 7.699305880202712e-05} +{"train_loss": 0.003168833674862981, "global_step": 23080, "epoch": 193, "lr": 7.699119386128654e-05} +{"train_loss": 0.005185170564800501, "global_step": 23081, "epoch": 193, "lr": 7.698932886755164e-05} +{"train_loss": 0.005662033800035715, "global_step": 23082, "epoch": 193, "lr": 7.698746382082608e-05} +{"train_loss": 0.004091784358024597, "global_step": 23083, "epoch": 193, "lr": 7.698559872111351e-05} +{"train_loss": 0.003931572660803795, "global_step": 23084, "epoch": 193, "lr": 7.698373356841759e-05} +{"train_loss": 0.004629953294804617, "global_step": 23085, "epoch": 193, "lr": 7.698186836274201e-05, "val_loss": 0.019549699500203133} +{"train_loss": 0.004196824971586466, "global_step": 23086, "epoch": 194, "lr": 7.698000310409041e-05} +{"train_loss": 0.0033597450237721205, "global_step": 23087, "epoch": 194, "lr": 7.697813779246645e-05} +{"train_loss": 0.003964572679251432, "global_step": 23088, "epoch": 194, "lr": 7.69762724278738e-05} +{"train_loss": 0.0060415249317884445, "global_step": 23089, "epoch": 194, "lr": 7.697440701031613e-05} +{"train_loss": 0.00406996626406908, "global_step": 23090, "epoch": 194, "lr": 7.697254153979709e-05} +{"train_loss": 0.0023500581737607718, "global_step": 23091, "epoch": 194, "lr": 7.697067601632036e-05} +{"train_loss": 0.0031466151122003794, "global_step": 23092, "epoch": 194, "lr": 7.696881043988955e-05} +{"train_loss": 0.005871293134987354, "global_step": 23093, "epoch": 194, "lr": 7.696694481050839e-05} +{"train_loss": 0.004326612688601017, "global_step": 23094, "epoch": 194, "lr": 7.696507912818052e-05} +{"train_loss": 0.003989275079220533, "global_step": 23095, "epoch": 194, "lr": 7.696321339290959e-05} +{"train_loss": 0.0046965256333351135, "global_step": 23096, "epoch": 194, "lr": 7.696134760469927e-05} +{"train_loss": 0.0028382563032209873, "global_step": 23097, "epoch": 194, "lr": 7.695948176355322e-05} +{"train_loss": 0.007125443778932095, "global_step": 23098, "epoch": 194, "lr": 7.695761586947512e-05} +{"train_loss": 0.004242902621626854, "global_step": 23099, "epoch": 194, "lr": 7.69557499224686e-05} +{"train_loss": 0.0033529673237353563, "global_step": 23100, "epoch": 194, "lr": 7.695388392253734e-05} +{"train_loss": 0.0059776571579277515, "global_step": 23101, "epoch": 194, "lr": 7.695201786968504e-05} +{"train_loss": 0.0038801981136202812, "global_step": 23102, "epoch": 194, "lr": 7.695015176391532e-05} +{"train_loss": 0.004266826435923576, "global_step": 23103, "epoch": 194, "lr": 7.694828560523186e-05} +{"train_loss": 0.004088833462446928, "global_step": 23104, "epoch": 194, "lr": 7.694641939363831e-05} +{"train_loss": 0.005271658767014742, "global_step": 23105, "epoch": 194, "lr": 7.694455312913836e-05} +{"train_loss": 0.004036485217511654, "global_step": 23106, "epoch": 194, "lr": 7.694268681173563e-05} +{"train_loss": 0.002738548908382654, "global_step": 23107, "epoch": 194, "lr": 7.694082044143383e-05} +{"train_loss": 0.0037076943553984165, "global_step": 23108, "epoch": 194, "lr": 7.69389540182366e-05} +{"train_loss": 0.0037097022868692875, "global_step": 23109, "epoch": 194, "lr": 7.693708754214763e-05} +{"train_loss": 0.0038088918663561344, "global_step": 23110, "epoch": 194, "lr": 7.693522101317057e-05} +{"train_loss": 0.0033668808173388243, "global_step": 23111, "epoch": 194, "lr": 7.693335443130905e-05} +{"train_loss": 0.0051203882321715355, "global_step": 23112, "epoch": 194, "lr": 7.693148779656678e-05} +{"train_loss": 0.0030434594955295324, "global_step": 23113, "epoch": 194, "lr": 7.692962110894742e-05} +{"train_loss": 0.0035803532227873802, "global_step": 23114, "epoch": 194, "lr": 7.692775436845462e-05} +{"train_loss": 0.006837003398686647, "global_step": 23115, "epoch": 194, "lr": 7.692588757509206e-05} +{"train_loss": 0.0037478385493159294, "global_step": 23116, "epoch": 194, "lr": 7.692402072886338e-05} +{"train_loss": 0.004580857697874308, "global_step": 23117, "epoch": 194, "lr": 7.692215382977226e-05} +{"train_loss": 0.002950109774246812, "global_step": 23118, "epoch": 194, "lr": 7.692028687782238e-05} +{"train_loss": 0.00216852268204093, "global_step": 23119, "epoch": 194, "lr": 7.691841987301737e-05} +{"train_loss": 0.003179228398948908, "global_step": 23120, "epoch": 194, "lr": 7.691655281536095e-05} +{"train_loss": 0.004479946102946997, "global_step": 23121, "epoch": 194, "lr": 7.691468570485675e-05} +{"train_loss": 0.004123942460864782, "global_step": 23122, "epoch": 194, "lr": 7.691281854150843e-05} +{"train_loss": 0.002666409593075514, "global_step": 23123, "epoch": 194, "lr": 7.691095132531968e-05} +{"train_loss": 0.0027045938186347485, "global_step": 23124, "epoch": 194, "lr": 7.690908405629412e-05} +{"train_loss": 0.0030070559587329626, "global_step": 23125, "epoch": 194, "lr": 7.690721673443547e-05} +{"train_loss": 0.005125991068780422, "global_step": 23126, "epoch": 194, "lr": 7.690534935974737e-05} +{"train_loss": 0.0028350853826850653, "global_step": 23127, "epoch": 194, "lr": 7.69034819322335e-05} +{"train_loss": 0.005955603905022144, "global_step": 23128, "epoch": 194, "lr": 7.690161445189751e-05} +{"train_loss": 0.004350116476416588, "global_step": 23129, "epoch": 194, "lr": 7.689974691874308e-05} +{"train_loss": 0.00487346900627017, "global_step": 23130, "epoch": 194, "lr": 7.689787933277386e-05} +{"train_loss": 0.003195785218849778, "global_step": 23131, "epoch": 194, "lr": 7.689601169399353e-05} +{"train_loss": 0.006164741236716509, "global_step": 23132, "epoch": 194, "lr": 7.689414400240576e-05} +{"train_loss": 0.004819472320377827, "global_step": 23133, "epoch": 194, "lr": 7.689227625801421e-05} +{"train_loss": 0.004611679818481207, "global_step": 23134, "epoch": 194, "lr": 7.689040846082254e-05} +{"train_loss": 0.006075951270759106, "global_step": 23135, "epoch": 194, "lr": 7.688854061083443e-05} +{"train_loss": 0.003818838857114315, "global_step": 23136, "epoch": 194, "lr": 7.688667270805355e-05} +{"train_loss": 0.00347142550162971, "global_step": 23137, "epoch": 194, "lr": 7.688480475248357e-05} +{"train_loss": 0.0032234112732112408, "global_step": 23138, "epoch": 194, "lr": 7.688293674412812e-05} +{"train_loss": 0.004489357583224773, "global_step": 23139, "epoch": 194, "lr": 7.68810686829909e-05} +{"train_loss": 0.004772490356117487, "global_step": 23140, "epoch": 194, "lr": 7.687920056907561e-05} +{"train_loss": 0.004977894015610218, "global_step": 23141, "epoch": 194, "lr": 7.687733240238585e-05} +{"train_loss": 0.004413030110299587, "global_step": 23142, "epoch": 194, "lr": 7.687546418292533e-05} +{"train_loss": 0.007388892583549023, "global_step": 23143, "epoch": 194, "lr": 7.68735959106977e-05} +{"train_loss": 0.003963743802160025, "global_step": 23144, "epoch": 194, "lr": 7.687172758570663e-05} +{"train_loss": 0.0027132073882967234, "global_step": 23145, "epoch": 194, "lr": 7.68698592079558e-05} +{"train_loss": 0.005571643356233835, "global_step": 23146, "epoch": 194, "lr": 7.686799077744889e-05} +{"train_loss": 0.0041292826645076275, "global_step": 23147, "epoch": 194, "lr": 7.686612229418952e-05} +{"train_loss": 0.0037066868972033262, "global_step": 23148, "epoch": 194, "lr": 7.686425375818141e-05} +{"train_loss": 0.005264846608042717, "global_step": 23149, "epoch": 194, "lr": 7.686238516942818e-05} +{"train_loss": 0.006056944373995066, "global_step": 23150, "epoch": 194, "lr": 7.686051652793356e-05} +{"train_loss": 0.003760069841518998, "global_step": 23151, "epoch": 194, "lr": 7.685864783370117e-05} +{"train_loss": 0.002317513804882765, "global_step": 23152, "epoch": 194, "lr": 7.68567790867347e-05} +{"train_loss": 0.004231021739542484, "global_step": 23153, "epoch": 194, "lr": 7.685491028703781e-05} +{"train_loss": 0.005189772229641676, "global_step": 23154, "epoch": 194, "lr": 7.685304143461417e-05} +{"train_loss": 0.00371762178838253, "global_step": 23155, "epoch": 194, "lr": 7.685117252946745e-05} +{"train_loss": 0.0051914993673563, "global_step": 23156, "epoch": 194, "lr": 7.684930357160132e-05} +{"train_loss": 0.0040953075513243675, "global_step": 23157, "epoch": 194, "lr": 7.684743456101946e-05} +{"train_loss": 0.0037968161050230265, "global_step": 23158, "epoch": 194, "lr": 7.684556549772552e-05} +{"train_loss": 0.0033478359691798687, "global_step": 23159, "epoch": 194, "lr": 7.684369638172321e-05} +{"train_loss": 0.004009864758700132, "global_step": 23160, "epoch": 194, "lr": 7.684182721301614e-05} +{"train_loss": 0.005234824493527412, "global_step": 23161, "epoch": 194, "lr": 7.683995799160801e-05} +{"train_loss": 0.00553097715601325, "global_step": 23162, "epoch": 194, "lr": 7.683808871750251e-05} +{"train_loss": 0.005480469670146704, "global_step": 23163, "epoch": 194, "lr": 7.683621939070327e-05} +{"train_loss": 0.004162698518484831, "global_step": 23164, "epoch": 194, "lr": 7.6834350011214e-05} +{"train_loss": 0.003317887894809246, "global_step": 23165, "epoch": 194, "lr": 7.683248057903834e-05} +{"train_loss": 0.005311200860887766, "global_step": 23166, "epoch": 194, "lr": 7.683061109417997e-05} +{"train_loss": 0.004231791477650404, "global_step": 23167, "epoch": 194, "lr": 7.682874155664255e-05} +{"train_loss": 0.003891264321282506, "global_step": 23168, "epoch": 194, "lr": 7.682687196642976e-05} +{"train_loss": 0.004916657693684101, "global_step": 23169, "epoch": 194, "lr": 7.68250023235453e-05} +{"train_loss": 0.0023904358968138695, "global_step": 23170, "epoch": 194, "lr": 7.682313262799278e-05} +{"train_loss": 0.00396067276597023, "global_step": 23171, "epoch": 194, "lr": 7.682126287977595e-05} +{"train_loss": 0.00669911177828908, "global_step": 23172, "epoch": 194, "lr": 7.681939307889841e-05} +{"train_loss": 0.0034068338572978973, "global_step": 23173, "epoch": 194, "lr": 7.681752322536385e-05} +{"train_loss": 0.004212029278278351, "global_step": 23174, "epoch": 194, "lr": 7.681565331917596e-05} +{"train_loss": 0.002573749516159296, "global_step": 23175, "epoch": 194, "lr": 7.68137833603384e-05} +{"train_loss": 0.004025639500468969, "global_step": 23176, "epoch": 194, "lr": 7.681191334885482e-05} +{"train_loss": 0.006732664071023464, "global_step": 23177, "epoch": 194, "lr": 7.681004328472894e-05} +{"train_loss": 0.004956644959747791, "global_step": 23178, "epoch": 194, "lr": 7.68081731679644e-05} +{"train_loss": 0.004057419952005148, "global_step": 23179, "epoch": 194, "lr": 7.680630299856486e-05} +{"train_loss": 0.0033271899446845055, "global_step": 23180, "epoch": 194, "lr": 7.680443277653402e-05} +{"train_loss": 0.004900708794593811, "global_step": 23181, "epoch": 194, "lr": 7.680256250187554e-05} +{"train_loss": 0.005696958862245083, "global_step": 23182, "epoch": 194, "lr": 7.68006921745931e-05} +{"train_loss": 0.003960084170103073, "global_step": 23183, "epoch": 194, "lr": 7.679882179469034e-05} +{"train_loss": 0.003744344227015972, "global_step": 23184, "epoch": 194, "lr": 7.679695136217097e-05} +{"train_loss": 0.0037186723202466965, "global_step": 23185, "epoch": 194, "lr": 7.679508087703864e-05} +{"train_loss": 0.006791604682803154, "global_step": 23186, "epoch": 194, "lr": 7.679321033929704e-05} +{"train_loss": 0.0034804914612323046, "global_step": 23187, "epoch": 194, "lr": 7.679133974894983e-05} +{"train_loss": 0.0058118118904531, "global_step": 23188, "epoch": 194, "lr": 7.67894691060007e-05} +{"train_loss": 0.004239703994244337, "global_step": 23189, "epoch": 194, "lr": 7.678759841045329e-05} +{"train_loss": 0.002845713635906577, "global_step": 23190, "epoch": 194, "lr": 7.678572766231131e-05} +{"train_loss": 0.006770036183297634, "global_step": 23191, "epoch": 194, "lr": 7.678385686157841e-05} +{"train_loss": 0.004845961928367615, "global_step": 23192, "epoch": 194, "lr": 7.678198600825826e-05} +{"train_loss": 0.0032377669122070074, "global_step": 23193, "epoch": 194, "lr": 7.678011510235455e-05} +{"train_loss": 0.003469915362074971, "global_step": 23194, "epoch": 194, "lr": 7.677824414387093e-05} +{"train_loss": 0.004167589358985424, "global_step": 23195, "epoch": 194, "lr": 7.67763731328111e-05} +{"train_loss": 0.006631695199757814, "global_step": 23196, "epoch": 194, "lr": 7.677450206917873e-05} +{"train_loss": 0.0033524795435369015, "global_step": 23197, "epoch": 194, "lr": 7.677263095297749e-05} +{"train_loss": 0.005996441002935171, "global_step": 23198, "epoch": 194, "lr": 7.677075978421104e-05} +{"train_loss": 0.005159951746463776, "global_step": 23199, "epoch": 194, "lr": 7.676888856288306e-05} +{"train_loss": 0.00640055350959301, "global_step": 23200, "epoch": 194, "lr": 7.676701728899723e-05} +{"train_loss": 0.004403471481055021, "global_step": 23201, "epoch": 194, "lr": 7.676514596255721e-05} +{"train_loss": 0.003940116614103317, "global_step": 23202, "epoch": 194, "lr": 7.67632745835667e-05} +{"train_loss": 0.004356738645583391, "global_step": 23203, "epoch": 194, "lr": 7.676140315202936e-05} +{"train_loss": 0.004340021902335291, "global_step": 23204, "epoch": 194, "lr": 7.675953166794884e-05, "val_loss": 0.02756979689002037} +{"train_loss": 0.006735236383974552, "global_step": 23205, "epoch": 195, "lr": 7.675766013132886e-05} +{"train_loss": 0.002643461339175701, "global_step": 23206, "epoch": 195, "lr": 7.675578854217307e-05} +{"train_loss": 0.0030847652815282345, "global_step": 23207, "epoch": 195, "lr": 7.675391690048515e-05} +{"train_loss": 0.003766200039535761, "global_step": 23208, "epoch": 195, "lr": 7.675204520626877e-05} +{"train_loss": 0.006803000811487436, "global_step": 23209, "epoch": 195, "lr": 7.675017345952761e-05} +{"train_loss": 0.00595398573204875, "global_step": 23210, "epoch": 195, "lr": 7.674830166026535e-05} +{"train_loss": 0.0035241625737398863, "global_step": 23211, "epoch": 195, "lr": 7.674642980848564e-05} +{"train_loss": 0.00440378999337554, "global_step": 23212, "epoch": 195, "lr": 7.674455790419217e-05} +{"train_loss": 0.0037627615965902805, "global_step": 23213, "epoch": 195, "lr": 7.674268594738863e-05} +{"train_loss": 0.004419098608195782, "global_step": 23214, "epoch": 195, "lr": 7.674081393807868e-05} +{"train_loss": 0.0033671900164335966, "global_step": 23215, "epoch": 195, "lr": 7.6738941876266e-05} +{"train_loss": 0.0026275389827787876, "global_step": 23216, "epoch": 195, "lr": 7.673706976195425e-05} +{"train_loss": 0.003376214299350977, "global_step": 23217, "epoch": 195, "lr": 7.673519759514713e-05} +{"train_loss": 0.0028465869836509228, "global_step": 23218, "epoch": 195, "lr": 7.673332537584832e-05} +{"train_loss": 0.007291043642908335, "global_step": 23219, "epoch": 195, "lr": 7.673145310406147e-05} +{"train_loss": 0.0035466570407152176, "global_step": 23220, "epoch": 195, "lr": 7.672958077979027e-05} +{"train_loss": 0.003336680121719837, "global_step": 23221, "epoch": 195, "lr": 7.672770840303839e-05} +{"train_loss": 0.004448315128684044, "global_step": 23222, "epoch": 195, "lr": 7.672583597380951e-05} +{"train_loss": 0.0032857051119208336, "global_step": 23223, "epoch": 195, "lr": 7.672396349210731e-05} +{"train_loss": 0.004792097024619579, "global_step": 23224, "epoch": 195, "lr": 7.672209095793545e-05} +{"train_loss": 0.004566492512822151, "global_step": 23225, "epoch": 195, "lr": 7.672021837129763e-05} +{"train_loss": 0.004140980541706085, "global_step": 23226, "epoch": 195, "lr": 7.671834573219752e-05} +{"train_loss": 0.004751765169203281, "global_step": 23227, "epoch": 195, "lr": 7.671647304063881e-05} +{"train_loss": 0.004263830371201038, "global_step": 23228, "epoch": 195, "lr": 7.671460029662512e-05} +{"train_loss": 0.005247074645012617, "global_step": 23229, "epoch": 195, "lr": 7.671272750016019e-05} +{"train_loss": 0.004632684867829084, "global_step": 23230, "epoch": 195, "lr": 7.671085465124767e-05} +{"train_loss": 0.0033112510573118925, "global_step": 23231, "epoch": 195, "lr": 7.670898174989123e-05} +{"train_loss": 0.004297698847949505, "global_step": 23232, "epoch": 195, "lr": 7.670710879609458e-05} +{"train_loss": 0.0050675999373197556, "global_step": 23233, "epoch": 195, "lr": 7.670523578986136e-05} +{"train_loss": 0.0040904502384364605, "global_step": 23234, "epoch": 195, "lr": 7.670336273119525e-05} +{"train_loss": 0.0058215027675032616, "global_step": 23235, "epoch": 195, "lr": 7.670148962009995e-05} +{"train_loss": 0.0055870735086500645, "global_step": 23236, "epoch": 195, "lr": 7.669961645657912e-05} +{"train_loss": 0.0031919965986162424, "global_step": 23237, "epoch": 195, "lr": 7.669774324063646e-05} +{"train_loss": 0.0024820039980113506, "global_step": 23238, "epoch": 195, "lr": 7.669586997227564e-05} +{"train_loss": 0.00392047967761755, "global_step": 23239, "epoch": 195, "lr": 7.669399665150032e-05} +{"train_loss": 0.004823942668735981, "global_step": 23240, "epoch": 195, "lr": 7.66921232783142e-05} +{"train_loss": 0.0038368713576346636, "global_step": 23241, "epoch": 195, "lr": 7.669024985272094e-05} +{"train_loss": 0.00453561544418335, "global_step": 23242, "epoch": 195, "lr": 7.668837637472421e-05} +{"train_loss": 0.005669513717293739, "global_step": 23243, "epoch": 195, "lr": 7.668650284432772e-05} +{"train_loss": 0.003775110002607107, "global_step": 23244, "epoch": 195, "lr": 7.668462926153513e-05} +{"train_loss": 0.0034344433806836605, "global_step": 23245, "epoch": 195, "lr": 7.668275562635013e-05} +{"train_loss": 0.0026805850211530924, "global_step": 23246, "epoch": 195, "lr": 7.668088193877638e-05} +{"train_loss": 0.002295977668836713, "global_step": 23247, "epoch": 195, "lr": 7.667900819881758e-05} +{"train_loss": 0.0030930170323699713, "global_step": 23248, "epoch": 195, "lr": 7.667713440647739e-05} +{"train_loss": 0.0030155284330248833, "global_step": 23249, "epoch": 195, "lr": 7.667526056175949e-05} +{"train_loss": 0.002758346265181899, "global_step": 23250, "epoch": 195, "lr": 7.667338666466757e-05} +{"train_loss": 0.00342859560623765, "global_step": 23251, "epoch": 195, "lr": 7.667151271520529e-05} +{"train_loss": 0.0036926057655364275, "global_step": 23252, "epoch": 195, "lr": 7.666963871337637e-05} +{"train_loss": 0.0031270182225853205, "global_step": 23253, "epoch": 195, "lr": 7.666776465918446e-05} +{"train_loss": 0.001874708803370595, "global_step": 23254, "epoch": 195, "lr": 7.666589055263324e-05} +{"train_loss": 0.0030589851085096598, "global_step": 23255, "epoch": 195, "lr": 7.666401639372638e-05} +{"train_loss": 0.003172348253428936, "global_step": 23256, "epoch": 195, "lr": 7.666214218246759e-05} +{"train_loss": 0.002222074894234538, "global_step": 23257, "epoch": 195, "lr": 7.666026791886052e-05} +{"train_loss": 0.0032681527081876993, "global_step": 23258, "epoch": 195, "lr": 7.665839360290888e-05} +{"train_loss": 0.0026095996145159006, "global_step": 23259, "epoch": 195, "lr": 7.665651923461631e-05} +{"train_loss": 0.0037455102428793907, "global_step": 23260, "epoch": 195, "lr": 7.665464481398652e-05} +{"train_loss": 0.0035310157109051943, "global_step": 23261, "epoch": 195, "lr": 7.665277034102319e-05} +{"train_loss": 0.0054292818531394005, "global_step": 23262, "epoch": 195, "lr": 7.665089581572998e-05} +{"train_loss": 0.0014273200649768114, "global_step": 23263, "epoch": 195, "lr": 7.66490212381106e-05} +{"train_loss": 0.004635837860405445, "global_step": 23264, "epoch": 195, "lr": 7.664714660816869e-05} +{"train_loss": 0.00340637331828475, "global_step": 23265, "epoch": 195, "lr": 7.664527192590797e-05} +{"train_loss": 0.0055281552486121655, "global_step": 23266, "epoch": 195, "lr": 7.664339719133212e-05} +{"train_loss": 0.003286610823124647, "global_step": 23267, "epoch": 195, "lr": 7.664152240444478e-05} +{"train_loss": 0.0027980210725218058, "global_step": 23268, "epoch": 195, "lr": 7.663964756524966e-05} +{"train_loss": 0.003495866898447275, "global_step": 23269, "epoch": 195, "lr": 7.663777267375044e-05} +{"train_loss": 0.002535790903493762, "global_step": 23270, "epoch": 195, "lr": 7.663589772995082e-05} +{"train_loss": 0.0020750758703798056, "global_step": 23271, "epoch": 195, "lr": 7.663402273385444e-05} +{"train_loss": 0.005186745896935463, "global_step": 23272, "epoch": 195, "lr": 7.663214768546501e-05} +{"train_loss": 0.004410171415656805, "global_step": 23273, "epoch": 195, "lr": 7.66302725847862e-05} +{"train_loss": 0.00305645982734859, "global_step": 23274, "epoch": 195, "lr": 7.662839743182169e-05} +{"train_loss": 0.002923299791291356, "global_step": 23275, "epoch": 195, "lr": 7.662652222657516e-05} +{"train_loss": 0.0064222621731460094, "global_step": 23276, "epoch": 195, "lr": 7.662464696905032e-05} +{"train_loss": 0.0034867911599576473, "global_step": 23277, "epoch": 195, "lr": 7.66227716592508e-05} +{"train_loss": 0.005140033550560474, "global_step": 23278, "epoch": 195, "lr": 7.662089629718035e-05} +{"train_loss": 0.003049357095733285, "global_step": 23279, "epoch": 195, "lr": 7.661902088284258e-05} +{"train_loss": 0.005794481839984655, "global_step": 23280, "epoch": 195, "lr": 7.661714541624124e-05} +{"train_loss": 0.0025958239566534758, "global_step": 23281, "epoch": 195, "lr": 7.661526989737996e-05} +{"train_loss": 0.004504708107560873, "global_step": 23282, "epoch": 195, "lr": 7.661339432626243e-05} +{"train_loss": 0.004316105507314205, "global_step": 23283, "epoch": 195, "lr": 7.661151870289235e-05} +{"train_loss": 0.005102825816720724, "global_step": 23284, "epoch": 195, "lr": 7.660964302727341e-05} +{"train_loss": 0.00309099187143147, "global_step": 23285, "epoch": 195, "lr": 7.660776729940927e-05} +{"train_loss": 0.003982867114245892, "global_step": 23286, "epoch": 195, "lr": 7.660589151930361e-05} +{"train_loss": 0.003273541806265712, "global_step": 23287, "epoch": 195, "lr": 7.660401568696014e-05} +{"train_loss": 0.0037895168643444777, "global_step": 23288, "epoch": 195, "lr": 7.660213980238252e-05} +{"train_loss": 0.0060052210465073586, "global_step": 23289, "epoch": 195, "lr": 7.660026386557444e-05} +{"train_loss": 0.0054529220797121525, "global_step": 23290, "epoch": 195, "lr": 7.659838787653959e-05} +{"train_loss": 0.004430846311151981, "global_step": 23291, "epoch": 195, "lr": 7.659651183528165e-05} +{"train_loss": 0.004194500390440226, "global_step": 23292, "epoch": 195, "lr": 7.659463574180428e-05} +{"train_loss": 0.0033258278854191303, "global_step": 23293, "epoch": 195, "lr": 7.65927595961112e-05} +{"train_loss": 0.006734312977641821, "global_step": 23294, "epoch": 195, "lr": 7.659088339820608e-05} +{"train_loss": 0.0037123020738363266, "global_step": 23295, "epoch": 195, "lr": 7.65890071480926e-05} +{"train_loss": 0.006896199192851782, "global_step": 23296, "epoch": 195, "lr": 7.658713084577445e-05} +{"train_loss": 0.004922483116388321, "global_step": 23297, "epoch": 195, "lr": 7.65852544912553e-05} +{"train_loss": 0.008462375961244106, "global_step": 23298, "epoch": 195, "lr": 7.658337808453884e-05} +{"train_loss": 0.004172551445662975, "global_step": 23299, "epoch": 195, "lr": 7.658150162562876e-05} +{"train_loss": 0.0036131837405264378, "global_step": 23300, "epoch": 195, "lr": 7.657962511452874e-05} +{"train_loss": 0.006877783685922623, "global_step": 23301, "epoch": 195, "lr": 7.657774855124247e-05} +{"train_loss": 0.007333802990615368, "global_step": 23302, "epoch": 195, "lr": 7.657587193577363e-05} +{"train_loss": 0.007063628174364567, "global_step": 23303, "epoch": 195, "lr": 7.65739952681259e-05} +{"train_loss": 0.0036049848422408104, "global_step": 23304, "epoch": 195, "lr": 7.657211854830297e-05} +{"train_loss": 0.008329823613166809, "global_step": 23305, "epoch": 195, "lr": 7.657024177630852e-05} +{"train_loss": 0.004665621556341648, "global_step": 23306, "epoch": 195, "lr": 7.656836495214625e-05} +{"train_loss": 0.004485422279685736, "global_step": 23307, "epoch": 195, "lr": 7.656648807581983e-05} +{"train_loss": 0.00704443734139204, "global_step": 23308, "epoch": 195, "lr": 7.656461114733296e-05} +{"train_loss": 0.007937189191579819, "global_step": 23309, "epoch": 195, "lr": 7.656273416668929e-05} +{"train_loss": 0.006492179352790117, "global_step": 23310, "epoch": 195, "lr": 7.656085713389255e-05} +{"train_loss": 0.0041709900833666325, "global_step": 23311, "epoch": 195, "lr": 7.65589800489464e-05} +{"train_loss": 0.004854160826653242, "global_step": 23312, "epoch": 195, "lr": 7.655710291185451e-05} +{"train_loss": 0.003640144132077694, "global_step": 23313, "epoch": 195, "lr": 7.655522572262061e-05} +{"train_loss": 0.005169325973838568, "global_step": 23314, "epoch": 195, "lr": 7.655334848124836e-05} +{"train_loss": 0.0051620700396597385, "global_step": 23315, "epoch": 195, "lr": 7.655147118774143e-05} +{"train_loss": 0.007215694058686495, "global_step": 23316, "epoch": 195, "lr": 7.654959384210354e-05} +{"train_loss": 0.006631716154515743, "global_step": 23317, "epoch": 195, "lr": 7.654771644433834e-05} +{"train_loss": 0.003989444579929113, "global_step": 23318, "epoch": 195, "lr": 7.654583899444955e-05} +{"train_loss": 0.0035185799933969975, "global_step": 23319, "epoch": 195, "lr": 7.654396149244083e-05} +{"train_loss": 0.005460755433887243, "global_step": 23320, "epoch": 195, "lr": 7.654208393831589e-05} +{"train_loss": 0.0030041621066629887, "global_step": 23321, "epoch": 195, "lr": 7.654020633207841e-05} +{"train_loss": 0.009691326878964901, "global_step": 23322, "epoch": 195, "lr": 7.653832867373205e-05} +{"train_loss": 0.0043807176231336195, "global_step": 23323, "epoch": 195, "lr": 7.653645096328053e-05, "val_loss": 0.021672483533620834, "train_action_mse_error": 0.00010188441228820011} +{"train_loss": 0.0037463887128978968, "global_step": 23324, "epoch": 196, "lr": 7.653457320072752e-05} +{"train_loss": 0.0060924505814909935, "global_step": 23325, "epoch": 196, "lr": 7.65326953860767e-05} +{"train_loss": 0.004960572812706232, "global_step": 23326, "epoch": 196, "lr": 7.653081751933179e-05} +{"train_loss": 0.0053001451306045055, "global_step": 23327, "epoch": 196, "lr": 7.652893960049643e-05} +{"train_loss": 0.00509722251445055, "global_step": 23328, "epoch": 196, "lr": 7.652706162957436e-05} +{"train_loss": 0.004344356246292591, "global_step": 23329, "epoch": 196, "lr": 7.652518360656922e-05} +{"train_loss": 0.0037416736595332623, "global_step": 23330, "epoch": 196, "lr": 7.652330553148471e-05} +{"train_loss": 0.005997954402118921, "global_step": 23331, "epoch": 196, "lr": 7.652142740432453e-05} +{"train_loss": 0.005180410575121641, "global_step": 23332, "epoch": 196, "lr": 7.651954922509237e-05} +{"train_loss": 0.006943915970623493, "global_step": 23333, "epoch": 196, "lr": 7.651767099379189e-05} +{"train_loss": 0.003193834563717246, "global_step": 23334, "epoch": 196, "lr": 7.651579271042681e-05} +{"train_loss": 0.002998956246301532, "global_step": 23335, "epoch": 196, "lr": 7.65139143750008e-05} +{"train_loss": 0.005646970588713884, "global_step": 23336, "epoch": 196, "lr": 7.651203598751755e-05} +{"train_loss": 0.005487588234245777, "global_step": 23337, "epoch": 196, "lr": 7.651015754798075e-05} +{"train_loss": 0.005491520278155804, "global_step": 23338, "epoch": 196, "lr": 7.650827905639409e-05} +{"train_loss": 0.005204526241868734, "global_step": 23339, "epoch": 196, "lr": 7.650640051276125e-05} +{"train_loss": 0.002349499147385359, "global_step": 23340, "epoch": 196, "lr": 7.650452191708592e-05} +{"train_loss": 0.006738346070051193, "global_step": 23341, "epoch": 196, "lr": 7.650264326937182e-05} +{"train_loss": 0.008408649824559689, "global_step": 23342, "epoch": 196, "lr": 7.650076456962258e-05} +{"train_loss": 0.003927137702703476, "global_step": 23343, "epoch": 196, "lr": 7.649888581784194e-05} +{"train_loss": 0.0040897466242313385, "global_step": 23344, "epoch": 196, "lr": 7.649700701403356e-05} +{"train_loss": 0.003239438636228442, "global_step": 23345, "epoch": 196, "lr": 7.649512815820114e-05} +{"train_loss": 0.003647296689450741, "global_step": 23346, "epoch": 196, "lr": 7.649324925034835e-05} +{"train_loss": 0.004049211274832487, "global_step": 23347, "epoch": 196, "lr": 7.649137029047893e-05} +{"train_loss": 0.003784097032621503, "global_step": 23348, "epoch": 196, "lr": 7.64894912785965e-05} +{"train_loss": 0.004172077868133783, "global_step": 23349, "epoch": 196, "lr": 7.648761221470481e-05} +{"train_loss": 0.00376711692661047, "global_step": 23350, "epoch": 196, "lr": 7.648573309880751e-05} +{"train_loss": 0.006405868101865053, "global_step": 23351, "epoch": 196, "lr": 7.64838539309083e-05} +{"train_loss": 0.004821354523301125, "global_step": 23352, "epoch": 196, "lr": 7.648197471101088e-05} +{"train_loss": 0.0032196284737437963, "global_step": 23353, "epoch": 196, "lr": 7.648009543911894e-05} +{"train_loss": 0.0042890217155218124, "global_step": 23354, "epoch": 196, "lr": 7.647821611523615e-05} +{"train_loss": 0.004057527519762516, "global_step": 23355, "epoch": 196, "lr": 7.64763367393662e-05} +{"train_loss": 0.005185360554605722, "global_step": 23356, "epoch": 196, "lr": 7.647445731151281e-05} +{"train_loss": 0.004415122792124748, "global_step": 23357, "epoch": 196, "lr": 7.647257783167965e-05} +{"train_loss": 0.00505400775000453, "global_step": 23358, "epoch": 196, "lr": 7.647069829987039e-05} +{"train_loss": 0.004542679991573095, "global_step": 23359, "epoch": 196, "lr": 7.646881871608878e-05} +{"train_loss": 0.004619590938091278, "global_step": 23360, "epoch": 196, "lr": 7.646693908033844e-05} +{"train_loss": 0.0026086559519171715, "global_step": 23361, "epoch": 196, "lr": 7.646505939262312e-05} +{"train_loss": 0.0045827338472008705, "global_step": 23362, "epoch": 196, "lr": 7.646317965294645e-05} +{"train_loss": 0.005728506948798895, "global_step": 23363, "epoch": 196, "lr": 7.646129986131217e-05} +{"train_loss": 0.003788028145208955, "global_step": 23364, "epoch": 196, "lr": 7.645942001772396e-05} +{"train_loss": 0.00578034482896328, "global_step": 23365, "epoch": 196, "lr": 7.64575401221855e-05} +{"train_loss": 0.006149927619844675, "global_step": 23366, "epoch": 196, "lr": 7.64556601747005e-05} +{"train_loss": 0.006190208718180656, "global_step": 23367, "epoch": 196, "lr": 7.64537801752726e-05} +{"train_loss": 0.0035387584939599037, "global_step": 23368, "epoch": 196, "lr": 7.645190012390556e-05} +{"train_loss": 0.0062161595560610294, "global_step": 23369, "epoch": 196, "lr": 7.645002002060304e-05} +{"train_loss": 0.004297106992453337, "global_step": 23370, "epoch": 196, "lr": 7.644813986536871e-05} +{"train_loss": 0.005491128657013178, "global_step": 23371, "epoch": 196, "lr": 7.64462596582063e-05} +{"train_loss": 0.005482227075845003, "global_step": 23372, "epoch": 196, "lr": 7.64443793991195e-05} +{"train_loss": 0.0034248060546815395, "global_step": 23373, "epoch": 196, "lr": 7.644249908811197e-05} +{"train_loss": 0.0038075088523328304, "global_step": 23374, "epoch": 196, "lr": 7.644061872518742e-05} +{"train_loss": 0.0031482770573347807, "global_step": 23375, "epoch": 196, "lr": 7.643873831034953e-05} +{"train_loss": 0.00448183435946703, "global_step": 23376, "epoch": 196, "lr": 7.643685784360202e-05} +{"train_loss": 0.0048718927428126335, "global_step": 23377, "epoch": 196, "lr": 7.643497732494854e-05} +{"train_loss": 0.004295734688639641, "global_step": 23378, "epoch": 196, "lr": 7.643309675439283e-05} +{"train_loss": 0.004391827154904604, "global_step": 23379, "epoch": 196, "lr": 7.643121613193856e-05} +{"train_loss": 0.0030419998802244663, "global_step": 23380, "epoch": 196, "lr": 7.64293354575894e-05} +{"train_loss": 0.003930241800844669, "global_step": 23381, "epoch": 196, "lr": 7.642745473134907e-05} +{"train_loss": 0.003809890244156122, "global_step": 23382, "epoch": 196, "lr": 7.642557395322125e-05} +{"train_loss": 0.004021746106445789, "global_step": 23383, "epoch": 196, "lr": 7.642369312320964e-05} +{"train_loss": 0.0041165538132190704, "global_step": 23384, "epoch": 196, "lr": 7.642181224131795e-05} +{"train_loss": 0.002798787783831358, "global_step": 23385, "epoch": 196, "lr": 7.641993130754982e-05} +{"train_loss": 0.0034745479933917522, "global_step": 23386, "epoch": 196, "lr": 7.641805032190902e-05} +{"train_loss": 0.0046976711601018906, "global_step": 23387, "epoch": 196, "lr": 7.641616928439917e-05} +{"train_loss": 0.004594686906784773, "global_step": 23388, "epoch": 196, "lr": 7.641428819502402e-05} +{"train_loss": 0.00227111647836864, "global_step": 23389, "epoch": 196, "lr": 7.64124070537872e-05} +{"train_loss": 0.0033341748639941216, "global_step": 23390, "epoch": 196, "lr": 7.641052586069248e-05} +{"train_loss": 0.004765370395034552, "global_step": 23391, "epoch": 196, "lr": 7.640864461574349e-05} +{"train_loss": 0.0029650358483195305, "global_step": 23392, "epoch": 196, "lr": 7.640676331894397e-05} +{"train_loss": 0.0034425135236233473, "global_step": 23393, "epoch": 196, "lr": 7.640488197029756e-05} +{"train_loss": 0.002742149168625474, "global_step": 23394, "epoch": 196, "lr": 7.6403000569808e-05} +{"train_loss": 0.004634613636881113, "global_step": 23395, "epoch": 196, "lr": 7.640111911747897e-05} +{"train_loss": 0.003554871305823326, "global_step": 23396, "epoch": 196, "lr": 7.639923761331415e-05} +{"train_loss": 0.002389226108789444, "global_step": 23397, "epoch": 196, "lr": 7.639735605731728e-05} +{"train_loss": 0.004610851407051086, "global_step": 23398, "epoch": 196, "lr": 7.6395474449492e-05} +{"train_loss": 0.005130457226186991, "global_step": 23399, "epoch": 196, "lr": 7.639359278984202e-05} +{"train_loss": 0.00449376879259944, "global_step": 23400, "epoch": 196, "lr": 7.639171107837104e-05} +{"train_loss": 0.004504677839577198, "global_step": 23401, "epoch": 196, "lr": 7.638982931508276e-05} +{"train_loss": 0.005007001105695963, "global_step": 23402, "epoch": 196, "lr": 7.638794749998089e-05} +{"train_loss": 0.004851142875850201, "global_step": 23403, "epoch": 196, "lr": 7.638606563306909e-05} +{"train_loss": 0.002774630906060338, "global_step": 23404, "epoch": 196, "lr": 7.638418371435106e-05} +{"train_loss": 0.0065301223658025265, "global_step": 23405, "epoch": 196, "lr": 7.63823017438305e-05} +{"train_loss": 0.0034416927956044674, "global_step": 23406, "epoch": 196, "lr": 7.638041972151112e-05} +{"train_loss": 0.0034902619663625956, "global_step": 23407, "epoch": 196, "lr": 7.63785376473966e-05} +{"train_loss": 0.0035321288742125034, "global_step": 23408, "epoch": 196, "lr": 7.637665552149065e-05} +{"train_loss": 0.0054404097609221935, "global_step": 23409, "epoch": 196, "lr": 7.637477334379694e-05} +{"train_loss": 0.0022062230855226517, "global_step": 23410, "epoch": 196, "lr": 7.63728911143192e-05} +{"train_loss": 0.004673670046031475, "global_step": 23411, "epoch": 196, "lr": 7.637100883306109e-05} +{"train_loss": 0.004419674631208181, "global_step": 23412, "epoch": 196, "lr": 7.636912650002633e-05} +{"train_loss": 0.003697257023304701, "global_step": 23413, "epoch": 196, "lr": 7.636724411521858e-05} +{"train_loss": 0.003888780251145363, "global_step": 23414, "epoch": 196, "lr": 7.636536167864159e-05} +{"train_loss": 0.003927720710635185, "global_step": 23415, "epoch": 196, "lr": 7.636347919029903e-05} +{"train_loss": 0.003896509064361453, "global_step": 23416, "epoch": 196, "lr": 7.636159665019458e-05} +{"train_loss": 0.0055563910864293575, "global_step": 23417, "epoch": 196, "lr": 7.635971405833196e-05} +{"train_loss": 0.005669896956533194, "global_step": 23418, "epoch": 196, "lr": 7.635783141471487e-05} +{"train_loss": 0.005215407349169254, "global_step": 23419, "epoch": 196, "lr": 7.635594871934698e-05} +{"train_loss": 0.003542824648320675, "global_step": 23420, "epoch": 196, "lr": 7.6354065972232e-05} +{"train_loss": 0.0037134159356355667, "global_step": 23421, "epoch": 196, "lr": 7.635218317337362e-05} +{"train_loss": 0.006197021808475256, "global_step": 23422, "epoch": 196, "lr": 7.635030032277556e-05} +{"train_loss": 0.0035794521681964397, "global_step": 23423, "epoch": 196, "lr": 7.63484174204415e-05} +{"train_loss": 0.003494818229228258, "global_step": 23424, "epoch": 196, "lr": 7.634653446637512e-05} +{"train_loss": 0.007282448932528496, "global_step": 23425, "epoch": 196, "lr": 7.634465146058014e-05} +{"train_loss": 0.005864442326128483, "global_step": 23426, "epoch": 196, "lr": 7.634276840306026e-05} +{"train_loss": 0.0027874326333403587, "global_step": 23427, "epoch": 196, "lr": 7.634088529381916e-05} +{"train_loss": 0.004708494525402784, "global_step": 23428, "epoch": 196, "lr": 7.633900213286055e-05} +{"train_loss": 0.004739629570394754, "global_step": 23429, "epoch": 196, "lr": 7.633711892018813e-05} +{"train_loss": 0.0038183073047548532, "global_step": 23430, "epoch": 196, "lr": 7.633523565580559e-05} +{"train_loss": 0.0027706618420779705, "global_step": 23431, "epoch": 196, "lr": 7.633335233971661e-05} +{"train_loss": 0.004268313758075237, "global_step": 23432, "epoch": 196, "lr": 7.633146897192492e-05} +{"train_loss": 0.004016730468720198, "global_step": 23433, "epoch": 196, "lr": 7.632958555243418e-05} +{"train_loss": 0.0051923468708992004, "global_step": 23434, "epoch": 196, "lr": 7.632770208124815e-05} +{"train_loss": 0.003426947630941868, "global_step": 23435, "epoch": 196, "lr": 7.632581855837048e-05} +{"train_loss": 0.00563355116173625, "global_step": 23436, "epoch": 196, "lr": 7.632393498380488e-05} +{"train_loss": 0.003831676207482815, "global_step": 23437, "epoch": 196, "lr": 7.632205135755504e-05} +{"train_loss": 0.007665122393518686, "global_step": 23438, "epoch": 196, "lr": 7.632016767962465e-05} +{"train_loss": 0.002105420920997858, "global_step": 23439, "epoch": 196, "lr": 7.631828395001743e-05} +{"train_loss": 0.004796176217496395, "global_step": 23440, "epoch": 196, "lr": 7.631640016873709e-05} +{"train_loss": 0.002685375278815627, "global_step": 23441, "epoch": 196, "lr": 7.63145163357873e-05} +{"train_loss": 0.004406427753259654, "global_step": 23442, "epoch": 196, "lr": 7.631263245117175e-05, "val_loss": 0.012346221134066582} +{"train_loss": 0.0061662583611905575, "global_step": 23443, "epoch": 197, "lr": 7.631074851489417e-05} +{"train_loss": 0.004282367881387472, "global_step": 23444, "epoch": 197, "lr": 7.630886452695824e-05} +{"train_loss": 0.0033448277972638607, "global_step": 23445, "epoch": 197, "lr": 7.630698048736769e-05} +{"train_loss": 0.0043397205881774426, "global_step": 23446, "epoch": 197, "lr": 7.630509639612617e-05} +{"train_loss": 0.003859293181449175, "global_step": 23447, "epoch": 197, "lr": 7.630321225323741e-05} +{"train_loss": 0.006035515572875738, "global_step": 23448, "epoch": 197, "lr": 7.63013280587051e-05} +{"train_loss": 0.0024659540504217148, "global_step": 23449, "epoch": 197, "lr": 7.629944381253294e-05} +{"train_loss": 0.007392966654151678, "global_step": 23450, "epoch": 197, "lr": 7.629755951472464e-05} +{"train_loss": 0.002797727705910802, "global_step": 23451, "epoch": 197, "lr": 7.629567516528388e-05} +{"train_loss": 0.004498585127294064, "global_step": 23452, "epoch": 197, "lr": 7.629379076421439e-05} +{"train_loss": 0.005607227329164743, "global_step": 23453, "epoch": 197, "lr": 7.629190631151984e-05} +{"train_loss": 0.006667474750429392, "global_step": 23454, "epoch": 197, "lr": 7.629002180720395e-05} +{"train_loss": 0.004882397595793009, "global_step": 23455, "epoch": 197, "lr": 7.628813725127039e-05} +{"train_loss": 0.003434868762269616, "global_step": 23456, "epoch": 197, "lr": 7.62862526437229e-05} +{"train_loss": 0.003388763405382633, "global_step": 23457, "epoch": 197, "lr": 7.628436798456516e-05} +{"train_loss": 0.0037975553423166275, "global_step": 23458, "epoch": 197, "lr": 7.628248327380086e-05} +{"train_loss": 0.00685920612886548, "global_step": 23459, "epoch": 197, "lr": 7.628059851143373e-05} +{"train_loss": 0.005472307093441486, "global_step": 23460, "epoch": 197, "lr": 7.627871369746743e-05} +{"train_loss": 0.0054079280234873295, "global_step": 23461, "epoch": 197, "lr": 7.62768288319057e-05} +{"train_loss": 0.004379902500659227, "global_step": 23462, "epoch": 197, "lr": 7.627494391475221e-05} +{"train_loss": 0.005998854525387287, "global_step": 23463, "epoch": 197, "lr": 7.627305894601069e-05} +{"train_loss": 0.0034838698338717222, "global_step": 23464, "epoch": 197, "lr": 7.627117392568481e-05} +{"train_loss": 0.006634269841015339, "global_step": 23465, "epoch": 197, "lr": 7.626928885377828e-05} +{"train_loss": 0.004953010007739067, "global_step": 23466, "epoch": 197, "lr": 7.626740373029484e-05} +{"train_loss": 0.0023153163492679596, "global_step": 23467, "epoch": 197, "lr": 7.626551855523814e-05} +{"train_loss": 0.003562993835657835, "global_step": 23468, "epoch": 197, "lr": 7.62636333286119e-05} +{"train_loss": 0.007526740897446871, "global_step": 23469, "epoch": 197, "lr": 7.62617480504198e-05} +{"train_loss": 0.004830487072467804, "global_step": 23470, "epoch": 197, "lr": 7.62598627206656e-05} +{"train_loss": 0.0036199491005390882, "global_step": 23471, "epoch": 197, "lr": 7.625797733935295e-05} +{"train_loss": 0.004515525884926319, "global_step": 23472, "epoch": 197, "lr": 7.625609190648557e-05} +{"train_loss": 0.006829278077930212, "global_step": 23473, "epoch": 197, "lr": 7.625420642206716e-05} +{"train_loss": 0.0036733972374349833, "global_step": 23474, "epoch": 197, "lr": 7.625232088610141e-05} +{"train_loss": 0.0016965559916570783, "global_step": 23475, "epoch": 197, "lr": 7.625043529859205e-05} +{"train_loss": 0.007120118476450443, "global_step": 23476, "epoch": 197, "lr": 7.624854965954275e-05} +{"train_loss": 0.005869580898433924, "global_step": 23477, "epoch": 197, "lr": 7.624666396895724e-05} +{"train_loss": 0.007925396785140038, "global_step": 23478, "epoch": 197, "lr": 7.62447782268392e-05} +{"train_loss": 0.004557223524898291, "global_step": 23479, "epoch": 197, "lr": 7.624289243319235e-05} +{"train_loss": 0.0036293715238571167, "global_step": 23480, "epoch": 197, "lr": 7.624100658802038e-05} +{"train_loss": 0.005714557133615017, "global_step": 23481, "epoch": 197, "lr": 7.623912069132697e-05} +{"train_loss": 0.005818777251988649, "global_step": 23482, "epoch": 197, "lr": 7.623723474311588e-05} +{"train_loss": 0.0034537643659859896, "global_step": 23483, "epoch": 197, "lr": 7.623534874339078e-05} +{"train_loss": 0.006063972134143114, "global_step": 23484, "epoch": 197, "lr": 7.623346269215537e-05} +{"train_loss": 0.0075975931249558926, "global_step": 23485, "epoch": 197, "lr": 7.623157658941335e-05} +{"train_loss": 0.004498069640249014, "global_step": 23486, "epoch": 197, "lr": 7.622969043516846e-05} +{"train_loss": 0.003529082518070936, "global_step": 23487, "epoch": 197, "lr": 7.622780422942435e-05} +{"train_loss": 0.008327452465891838, "global_step": 23488, "epoch": 197, "lr": 7.622591797218475e-05} +{"train_loss": 0.0062109739519655704, "global_step": 23489, "epoch": 197, "lr": 7.622403166345337e-05} +{"train_loss": 0.0035049859434366226, "global_step": 23490, "epoch": 197, "lr": 7.62221453032339e-05} +{"train_loss": 0.004549700301140547, "global_step": 23491, "epoch": 197, "lr": 7.622025889153007e-05} +{"train_loss": 0.005471575073897839, "global_step": 23492, "epoch": 197, "lr": 7.621837242834554e-05} +{"train_loss": 0.005594130139797926, "global_step": 23493, "epoch": 197, "lr": 7.621648591368405e-05} +{"train_loss": 0.0032088274601846933, "global_step": 23494, "epoch": 197, "lr": 7.621459934754928e-05} +{"train_loss": 0.00487892422825098, "global_step": 23495, "epoch": 197, "lr": 7.621271272994495e-05} +{"train_loss": 0.0038296449929475784, "global_step": 23496, "epoch": 197, "lr": 7.621082606087475e-05} +{"train_loss": 0.005997749511152506, "global_step": 23497, "epoch": 197, "lr": 7.62089393403424e-05} +{"train_loss": 0.005040637217462063, "global_step": 23498, "epoch": 197, "lr": 7.620705256835159e-05} +{"train_loss": 0.002710743108764291, "global_step": 23499, "epoch": 197, "lr": 7.620516574490603e-05} +{"train_loss": 0.004441451746970415, "global_step": 23500, "epoch": 197, "lr": 7.620327887000944e-05} +{"train_loss": 0.005882891360670328, "global_step": 23501, "epoch": 197, "lr": 7.620139194366551e-05} +{"train_loss": 0.005169425159692764, "global_step": 23502, "epoch": 197, "lr": 7.619950496587796e-05} +{"train_loss": 0.003157608676701784, "global_step": 23503, "epoch": 197, "lr": 7.619761793665046e-05} +{"train_loss": 0.004206039942800999, "global_step": 23504, "epoch": 197, "lr": 7.619573085598674e-05} +{"train_loss": 0.003922963514924049, "global_step": 23505, "epoch": 197, "lr": 7.61938437238905e-05} +{"train_loss": 0.005066459067165852, "global_step": 23506, "epoch": 197, "lr": 7.619195654036545e-05} +{"train_loss": 0.00539980037137866, "global_step": 23507, "epoch": 197, "lr": 7.619006930541528e-05} +{"train_loss": 0.003964683506637812, "global_step": 23508, "epoch": 197, "lr": 7.618818201904371e-05} +{"train_loss": 0.004353957250714302, "global_step": 23509, "epoch": 197, "lr": 7.618629468125446e-05} +{"train_loss": 0.004859032575041056, "global_step": 23510, "epoch": 197, "lr": 7.618440729205122e-05} +{"train_loss": 0.0034206463024020195, "global_step": 23511, "epoch": 197, "lr": 7.618251985143768e-05} +{"train_loss": 0.0025569081772118807, "global_step": 23512, "epoch": 197, "lr": 7.618063235941755e-05} +{"train_loss": 0.00540607376024127, "global_step": 23513, "epoch": 197, "lr": 7.617874481599457e-05} +{"train_loss": 0.0039153024554252625, "global_step": 23514, "epoch": 197, "lr": 7.617685722117239e-05} +{"train_loss": 0.004559333901852369, "global_step": 23515, "epoch": 197, "lr": 7.617496957495477e-05} +{"train_loss": 0.003349044593051076, "global_step": 23516, "epoch": 197, "lr": 7.617308187734539e-05} +{"train_loss": 0.005799117963761091, "global_step": 23517, "epoch": 197, "lr": 7.617119412834795e-05} +{"train_loss": 0.005117795430123806, "global_step": 23518, "epoch": 197, "lr": 7.616930632796618e-05} +{"train_loss": 0.004049905575811863, "global_step": 23519, "epoch": 197, "lr": 7.616741847620377e-05} +{"train_loss": 0.005790744908154011, "global_step": 23520, "epoch": 197, "lr": 7.616553057306442e-05} +{"train_loss": 0.00557707529515028, "global_step": 23521, "epoch": 197, "lr": 7.616364261855185e-05} +{"train_loss": 0.002970280824229121, "global_step": 23522, "epoch": 197, "lr": 7.616175461266977e-05} +{"train_loss": 0.003384048119187355, "global_step": 23523, "epoch": 197, "lr": 7.615986655542187e-05} +{"train_loss": 0.0029520292300730944, "global_step": 23524, "epoch": 197, "lr": 7.615797844681188e-05} +{"train_loss": 0.0037190457805991173, "global_step": 23525, "epoch": 197, "lr": 7.615609028684348e-05} +{"train_loss": 0.004047171212732792, "global_step": 23526, "epoch": 197, "lr": 7.61542020755204e-05} +{"train_loss": 0.005794207565486431, "global_step": 23527, "epoch": 197, "lr": 7.615231381284633e-05} +{"train_loss": 0.003344007534906268, "global_step": 23528, "epoch": 197, "lr": 7.615042549882501e-05} +{"train_loss": 0.005045984871685505, "global_step": 23529, "epoch": 197, "lr": 7.614853713346008e-05} +{"train_loss": 0.004551182966679335, "global_step": 23530, "epoch": 197, "lr": 7.614664871675532e-05} +{"train_loss": 0.003935053013265133, "global_step": 23531, "epoch": 197, "lr": 7.61447602487144e-05} +{"train_loss": 0.00424529891461134, "global_step": 23532, "epoch": 197, "lr": 7.614287172934105e-05} +{"train_loss": 0.004396652802824974, "global_step": 23533, "epoch": 197, "lr": 7.614098315863895e-05} +{"train_loss": 0.005745479371398687, "global_step": 23534, "epoch": 197, "lr": 7.613909453661183e-05} +{"train_loss": 0.003074736101552844, "global_step": 23535, "epoch": 197, "lr": 7.613720586326339e-05} +{"train_loss": 0.003065201686695218, "global_step": 23536, "epoch": 197, "lr": 7.613531713859733e-05} +{"train_loss": 0.007141676731407642, "global_step": 23537, "epoch": 197, "lr": 7.613342836261736e-05} +{"train_loss": 0.004349223803728819, "global_step": 23538, "epoch": 197, "lr": 7.613153953532722e-05} +{"train_loss": 0.005500146187841892, "global_step": 23539, "epoch": 197, "lr": 7.612965065673058e-05} +{"train_loss": 0.0046617453917860985, "global_step": 23540, "epoch": 197, "lr": 7.612776172683116e-05} +{"train_loss": 0.005314620211720467, "global_step": 23541, "epoch": 197, "lr": 7.612587274563269e-05} +{"train_loss": 0.0028642506804317236, "global_step": 23542, "epoch": 197, "lr": 7.612398371313885e-05} +{"train_loss": 0.0033089234493672848, "global_step": 23543, "epoch": 197, "lr": 7.612209462935334e-05} +{"train_loss": 0.004603222012519836, "global_step": 23544, "epoch": 197, "lr": 7.61202054942799e-05} +{"train_loss": 0.006061274092644453, "global_step": 23545, "epoch": 197, "lr": 7.611831630792223e-05} +{"train_loss": 0.004828541539609432, "global_step": 23546, "epoch": 197, "lr": 7.611642707028403e-05} +{"train_loss": 0.0034588812850415707, "global_step": 23547, "epoch": 197, "lr": 7.611453778136903e-05} +{"train_loss": 0.004039272665977478, "global_step": 23548, "epoch": 197, "lr": 7.611264844118091e-05} +{"train_loss": 0.005259977653622627, "global_step": 23549, "epoch": 197, "lr": 7.61107590497234e-05} +{"train_loss": 0.0039047023747116327, "global_step": 23550, "epoch": 197, "lr": 7.610886960700022e-05} +{"train_loss": 0.004056312143802643, "global_step": 23551, "epoch": 197, "lr": 7.610698011301505e-05} +{"train_loss": 0.003248189575970173, "global_step": 23552, "epoch": 197, "lr": 7.61050905677716e-05} +{"train_loss": 0.005151150282472372, "global_step": 23553, "epoch": 197, "lr": 7.610320097127361e-05} +{"train_loss": 0.004555089399218559, "global_step": 23554, "epoch": 197, "lr": 7.610131132352478e-05} +{"train_loss": 0.003265268635004759, "global_step": 23555, "epoch": 197, "lr": 7.609942162452879e-05} +{"train_loss": 0.003682947251945734, "global_step": 23556, "epoch": 197, "lr": 7.609753187428939e-05} +{"train_loss": 0.0038102010730654, "global_step": 23557, "epoch": 197, "lr": 7.609564207281028e-05} +{"train_loss": 0.0038339965976774693, "global_step": 23558, "epoch": 197, "lr": 7.609375222009515e-05} +{"train_loss": 0.003417735919356346, "global_step": 23559, "epoch": 197, "lr": 7.609186231614773e-05} +{"train_loss": 0.0025938847102224827, "global_step": 23560, "epoch": 197, "lr": 7.608997236097173e-05} +{"train_loss": 0.004584616563721176, "global_step": 23561, "epoch": 197, "lr": 7.608808235457086e-05, "val_loss": 0.01518525555729866} +{"train_loss": 0.0031055393628776073, "global_step": 23562, "epoch": 198, "lr": 7.608619229694882e-05} +{"train_loss": 0.0040666088461875916, "global_step": 23563, "epoch": 198, "lr": 7.608430218810933e-05} +{"train_loss": 0.0029461162630468607, "global_step": 23564, "epoch": 198, "lr": 7.608241202805608e-05} +{"train_loss": 0.0032207004260271788, "global_step": 23565, "epoch": 198, "lr": 7.608052181679282e-05} +{"train_loss": 0.006731425877660513, "global_step": 23566, "epoch": 198, "lr": 7.607863155432326e-05} +{"train_loss": 0.0031715419609099627, "global_step": 23567, "epoch": 198, "lr": 7.607674124065107e-05} +{"train_loss": 0.0041378517635166645, "global_step": 23568, "epoch": 198, "lr": 7.607485087578e-05} +{"train_loss": 0.003868109779432416, "global_step": 23569, "epoch": 198, "lr": 7.607296045971373e-05} +{"train_loss": 0.005281656514853239, "global_step": 23570, "epoch": 198, "lr": 7.607106999245599e-05} +{"train_loss": 0.0028491991106420755, "global_step": 23571, "epoch": 198, "lr": 7.606917947401049e-05} +{"train_loss": 0.003655173582956195, "global_step": 23572, "epoch": 198, "lr": 7.606728890438096e-05} +{"train_loss": 0.0045410566963255405, "global_step": 23573, "epoch": 198, "lr": 7.606539828357107e-05} +{"train_loss": 0.005059871356934309, "global_step": 23574, "epoch": 198, "lr": 7.606350761158455e-05} +{"train_loss": 0.0034504986833781004, "global_step": 23575, "epoch": 198, "lr": 7.606161688842512e-05} +{"train_loss": 0.004866723902523518, "global_step": 23576, "epoch": 198, "lr": 7.605972611409651e-05} +{"train_loss": 0.005219705868512392, "global_step": 23577, "epoch": 198, "lr": 7.60578352886024e-05} +{"train_loss": 0.007612275425344706, "global_step": 23578, "epoch": 198, "lr": 7.60559444119465e-05} +{"train_loss": 0.0038909290451556444, "global_step": 23579, "epoch": 198, "lr": 7.605405348413256e-05} +{"train_loss": 0.007455829530954361, "global_step": 23580, "epoch": 198, "lr": 7.605216250516424e-05} +{"train_loss": 0.0029091888573020697, "global_step": 23581, "epoch": 198, "lr": 7.60502714750453e-05} +{"train_loss": 0.0056975847110152245, "global_step": 23582, "epoch": 198, "lr": 7.604838039377946e-05} +{"train_loss": 0.0059438166208565235, "global_step": 23583, "epoch": 198, "lr": 7.604648926137037e-05} +{"train_loss": 0.005174913909286261, "global_step": 23584, "epoch": 198, "lr": 7.604459807782181e-05} +{"train_loss": 0.003430840326473117, "global_step": 23585, "epoch": 198, "lr": 7.604270684313746e-05} +{"train_loss": 0.0030097540002316236, "global_step": 23586, "epoch": 198, "lr": 7.604081555732101e-05} +{"train_loss": 0.0031024308409541845, "global_step": 23587, "epoch": 198, "lr": 7.603892422037623e-05} +{"train_loss": 0.005932437721639872, "global_step": 23588, "epoch": 198, "lr": 7.603703283230678e-05} +{"train_loss": 0.005615635309368372, "global_step": 23589, "epoch": 198, "lr": 7.603514139311643e-05} +{"train_loss": 0.00333461188711226, "global_step": 23590, "epoch": 198, "lr": 7.603324990280882e-05} +{"train_loss": 0.003990127705037594, "global_step": 23591, "epoch": 198, "lr": 7.603135836138776e-05} +{"train_loss": 0.004931846167892218, "global_step": 23592, "epoch": 198, "lr": 7.602946676885686e-05} +{"train_loss": 0.0031115293968468904, "global_step": 23593, "epoch": 198, "lr": 7.602757512521989e-05} +{"train_loss": 0.0024692208971828222, "global_step": 23594, "epoch": 198, "lr": 7.602568343048057e-05} +{"train_loss": 0.005774056538939476, "global_step": 23595, "epoch": 198, "lr": 7.60237916846426e-05} +{"train_loss": 0.003405829193070531, "global_step": 23596, "epoch": 198, "lr": 7.602189988770969e-05} +{"train_loss": 0.004282308276742697, "global_step": 23597, "epoch": 198, "lr": 7.602000803968557e-05} +{"train_loss": 0.0034387516789138317, "global_step": 23598, "epoch": 198, "lr": 7.601811614057393e-05} +{"train_loss": 0.004449963103979826, "global_step": 23599, "epoch": 198, "lr": 7.60162241903785e-05} +{"train_loss": 0.004645893815904856, "global_step": 23600, "epoch": 198, "lr": 7.601433218910299e-05} +{"train_loss": 0.004904137458652258, "global_step": 23601, "epoch": 198, "lr": 7.601244013675113e-05} +{"train_loss": 0.003907080739736557, "global_step": 23602, "epoch": 198, "lr": 7.601054803332662e-05} +{"train_loss": 0.0034079470206052065, "global_step": 23603, "epoch": 198, "lr": 7.600865587883317e-05} +{"train_loss": 0.008632049895823002, "global_step": 23604, "epoch": 198, "lr": 7.600676367327452e-05} +{"train_loss": 0.003590057138353586, "global_step": 23605, "epoch": 198, "lr": 7.600487141665436e-05} +{"train_loss": 0.00346805970184505, "global_step": 23606, "epoch": 198, "lr": 7.60029791089764e-05} +{"train_loss": 0.0049217259511351585, "global_step": 23607, "epoch": 198, "lr": 7.600108675024438e-05} +{"train_loss": 0.0030443104915320873, "global_step": 23608, "epoch": 198, "lr": 7.599919434046199e-05} +{"train_loss": 0.004700234159827232, "global_step": 23609, "epoch": 198, "lr": 7.599730187963298e-05} +{"train_loss": 0.0024464407470077276, "global_step": 23610, "epoch": 198, "lr": 7.599540936776105e-05} +{"train_loss": 0.0046250722371041775, "global_step": 23611, "epoch": 198, "lr": 7.59935168048499e-05} +{"train_loss": 0.0071042375639081, "global_step": 23612, "epoch": 198, "lr": 7.599162419090324e-05} +{"train_loss": 0.0035974476486444473, "global_step": 23613, "epoch": 198, "lr": 7.598973152592482e-05} +{"train_loss": 0.004644758999347687, "global_step": 23614, "epoch": 198, "lr": 7.598783880991834e-05} +{"train_loss": 0.005064873956143856, "global_step": 23615, "epoch": 198, "lr": 7.59859460428875e-05} +{"train_loss": 0.0039053841028362513, "global_step": 23616, "epoch": 198, "lr": 7.598405322483605e-05} +{"train_loss": 0.003932738211005926, "global_step": 23617, "epoch": 198, "lr": 7.598216035576768e-05} +{"train_loss": 0.004268526565283537, "global_step": 23618, "epoch": 198, "lr": 7.598026743568612e-05} +{"train_loss": 0.0037368054036051035, "global_step": 23619, "epoch": 198, "lr": 7.597837446459506e-05} +{"train_loss": 0.0046283286064863205, "global_step": 23620, "epoch": 198, "lr": 7.597648144249825e-05} +{"train_loss": 0.002961651422083378, "global_step": 23621, "epoch": 198, "lr": 7.597458836939939e-05} +{"train_loss": 0.0056330361403524876, "global_step": 23622, "epoch": 198, "lr": 7.597269524530222e-05} +{"train_loss": 0.006249378900974989, "global_step": 23623, "epoch": 198, "lr": 7.597080207021043e-05} +{"train_loss": 0.00808118749409914, "global_step": 23624, "epoch": 198, "lr": 7.596890884412772e-05} +{"train_loss": 0.005467458162456751, "global_step": 23625, "epoch": 198, "lr": 7.596701556705787e-05} +{"train_loss": 0.006090547423809767, "global_step": 23626, "epoch": 198, "lr": 7.596512223900453e-05} +{"train_loss": 0.002051403047516942, "global_step": 23627, "epoch": 198, "lr": 7.596322885997145e-05} +{"train_loss": 0.003930370789021254, "global_step": 23628, "epoch": 198, "lr": 7.596133542996236e-05} +{"train_loss": 0.003937813453376293, "global_step": 23629, "epoch": 198, "lr": 7.595944194898095e-05} +{"train_loss": 0.00472797267138958, "global_step": 23630, "epoch": 198, "lr": 7.595754841703095e-05} +{"train_loss": 0.005309446714818478, "global_step": 23631, "epoch": 198, "lr": 7.595565483411606e-05} +{"train_loss": 0.0031699095852673054, "global_step": 23632, "epoch": 198, "lr": 7.595376120024004e-05} +{"train_loss": 0.002891338197514415, "global_step": 23633, "epoch": 198, "lr": 7.595186751540658e-05} +{"train_loss": 0.004358235746622086, "global_step": 23634, "epoch": 198, "lr": 7.594997377961939e-05} +{"train_loss": 0.007346799597144127, "global_step": 23635, "epoch": 198, "lr": 7.59480799928822e-05} +{"train_loss": 0.004138145595788956, "global_step": 23636, "epoch": 198, "lr": 7.594618615519873e-05} +{"train_loss": 0.0047242227010428905, "global_step": 23637, "epoch": 198, "lr": 7.594429226657271e-05} +{"train_loss": 0.006980923004448414, "global_step": 23638, "epoch": 198, "lr": 7.594239832700782e-05} +{"train_loss": 0.005634380504488945, "global_step": 23639, "epoch": 198, "lr": 7.594050433650781e-05} +{"train_loss": 0.005539481528103352, "global_step": 23640, "epoch": 198, "lr": 7.59386102950764e-05} +{"train_loss": 0.002537650056183338, "global_step": 23641, "epoch": 198, "lr": 7.593671620271729e-05} +{"train_loss": 0.004638769663870335, "global_step": 23642, "epoch": 198, "lr": 7.593482205943422e-05} +{"train_loss": 0.0030271033756434917, "global_step": 23643, "epoch": 198, "lr": 7.593292786523089e-05} +{"train_loss": 0.003931158222258091, "global_step": 23644, "epoch": 198, "lr": 7.593103362011102e-05} +{"train_loss": 0.004631809890270233, "global_step": 23645, "epoch": 198, "lr": 7.592913932407834e-05} +{"train_loss": 0.006602138746529818, "global_step": 23646, "epoch": 198, "lr": 7.592724497713656e-05} +{"train_loss": 0.003605618141591549, "global_step": 23647, "epoch": 198, "lr": 7.592535057928942e-05} +{"train_loss": 0.0049982513301074505, "global_step": 23648, "epoch": 198, "lr": 7.592345613054062e-05} +{"train_loss": 0.002927880035713315, "global_step": 23649, "epoch": 198, "lr": 7.592156163089387e-05} +{"train_loss": 0.006896662525832653, "global_step": 23650, "epoch": 198, "lr": 7.591966708035291e-05} +{"train_loss": 0.004805328790098429, "global_step": 23651, "epoch": 198, "lr": 7.591777247892146e-05} +{"train_loss": 0.0036416801158338785, "global_step": 23652, "epoch": 198, "lr": 7.591587782660322e-05} +{"train_loss": 0.003471004543825984, "global_step": 23653, "epoch": 198, "lr": 7.591398312340192e-05} +{"train_loss": 0.0041732327081263065, "global_step": 23654, "epoch": 198, "lr": 7.591208836932132e-05} +{"train_loss": 0.005532475188374519, "global_step": 23655, "epoch": 198, "lr": 7.591019356436507e-05} +{"train_loss": 0.006064446177333593, "global_step": 23656, "epoch": 198, "lr": 7.590829870853693e-05} +{"train_loss": 0.004933781921863556, "global_step": 23657, "epoch": 198, "lr": 7.59064038018406e-05} +{"train_loss": 0.0027291157748550177, "global_step": 23658, "epoch": 198, "lr": 7.590450884427982e-05} +{"train_loss": 0.006253032945096493, "global_step": 23659, "epoch": 198, "lr": 7.590261383585832e-05} +{"train_loss": 0.004442307632416487, "global_step": 23660, "epoch": 198, "lr": 7.59007187765798e-05} +{"train_loss": 0.006230033002793789, "global_step": 23661, "epoch": 198, "lr": 7.589882366644798e-05} +{"train_loss": 0.0028060998301953077, "global_step": 23662, "epoch": 198, "lr": 7.589692850546657e-05} +{"train_loss": 0.0044620586559176445, "global_step": 23663, "epoch": 198, "lr": 7.589503329363933e-05} +{"train_loss": 0.0030050433706492186, "global_step": 23664, "epoch": 198, "lr": 7.589313803096995e-05} +{"train_loss": 0.004875022452324629, "global_step": 23665, "epoch": 198, "lr": 7.589124271746216e-05} +{"train_loss": 0.0034174444153904915, "global_step": 23666, "epoch": 198, "lr": 7.58893473531197e-05} +{"train_loss": 0.005030169151723385, "global_step": 23667, "epoch": 198, "lr": 7.588745193794625e-05} +{"train_loss": 0.006270792800933123, "global_step": 23668, "epoch": 198, "lr": 7.588555647194556e-05} +{"train_loss": 0.005151594989001751, "global_step": 23669, "epoch": 198, "lr": 7.588366095512134e-05} +{"train_loss": 0.00286861858330667, "global_step": 23670, "epoch": 198, "lr": 7.588176538747733e-05} +{"train_loss": 0.0036463222932070494, "global_step": 23671, "epoch": 198, "lr": 7.587986976901722e-05} +{"train_loss": 0.003926265984773636, "global_step": 23672, "epoch": 198, "lr": 7.587797409974477e-05} +{"train_loss": 0.004903649911284447, "global_step": 23673, "epoch": 198, "lr": 7.587607837966368e-05} +{"train_loss": 0.003411963814869523, "global_step": 23674, "epoch": 198, "lr": 7.587418260877767e-05} +{"train_loss": 0.004081737715750933, "global_step": 23675, "epoch": 198, "lr": 7.587228678709046e-05} +{"train_loss": 0.003453570418059826, "global_step": 23676, "epoch": 198, "lr": 7.58703909146058e-05} +{"train_loss": 0.007026159670203924, "global_step": 23677, "epoch": 198, "lr": 7.586849499132736e-05} +{"train_loss": 0.0037325453013181686, "global_step": 23678, "epoch": 198, "lr": 7.586659901725891e-05} +{"train_loss": 0.003667698474600911, "global_step": 23679, "epoch": 198, "lr": 7.586470299240416e-05} +{"train_loss": 0.0044842065456753765, "global_step": 23680, "epoch": 198, "lr": 7.586280691676682e-05, "val_loss": 0.021975990384817123} +{"train_loss": 0.005643781740218401, "global_step": 23681, "epoch": 199, "lr": 7.586091079035063e-05} +{"train_loss": 0.00545078469440341, "global_step": 23682, "epoch": 199, "lr": 7.58590146131593e-05} +{"train_loss": 0.00482461741194129, "global_step": 23683, "epoch": 199, "lr": 7.585711838519656e-05} +{"train_loss": 0.0060516842640936375, "global_step": 23684, "epoch": 199, "lr": 7.585522210646611e-05} +{"train_loss": 0.004062567837536335, "global_step": 23685, "epoch": 199, "lr": 7.585332577697173e-05} +{"train_loss": 0.0029520648531615734, "global_step": 23686, "epoch": 199, "lr": 7.585142939671709e-05} +{"train_loss": 0.0048599159345030785, "global_step": 23687, "epoch": 199, "lr": 7.584953296570592e-05} +{"train_loss": 0.002828635973855853, "global_step": 23688, "epoch": 199, "lr": 7.584763648394197e-05} +{"train_loss": 0.004715869668871164, "global_step": 23689, "epoch": 199, "lr": 7.584573995142894e-05} +{"train_loss": 0.0020581420976668596, "global_step": 23690, "epoch": 199, "lr": 7.584384336817056e-05} +{"train_loss": 0.0037129102274775505, "global_step": 23691, "epoch": 199, "lr": 7.584194673417056e-05} +{"train_loss": 0.004845056217163801, "global_step": 23692, "epoch": 199, "lr": 7.584005004943265e-05} +{"train_loss": 0.005646683741360903, "global_step": 23693, "epoch": 199, "lr": 7.583815331396057e-05} +{"train_loss": 0.003872501663863659, "global_step": 23694, "epoch": 199, "lr": 7.583625652775803e-05} +{"train_loss": 0.0030869359616190195, "global_step": 23695, "epoch": 199, "lr": 7.583435969082878e-05} +{"train_loss": 0.004725313745439053, "global_step": 23696, "epoch": 199, "lr": 7.583246280317648e-05} +{"train_loss": 0.00733764236792922, "global_step": 23697, "epoch": 199, "lr": 7.583056586480493e-05} +{"train_loss": 0.0050711315125226974, "global_step": 23698, "epoch": 199, "lr": 7.582866887571783e-05} +{"train_loss": 0.004829544574022293, "global_step": 23699, "epoch": 199, "lr": 7.582677183591888e-05} +{"train_loss": 0.003611201886087656, "global_step": 23700, "epoch": 199, "lr": 7.582487474541183e-05} +{"train_loss": 0.003853049362078309, "global_step": 23701, "epoch": 199, "lr": 7.582297760420041e-05} +{"train_loss": 0.005021931137889624, "global_step": 23702, "epoch": 199, "lr": 7.582108041228831e-05} +{"train_loss": 0.0031698443926870823, "global_step": 23703, "epoch": 199, "lr": 7.581918316967928e-05} +{"train_loss": 0.004390094429254532, "global_step": 23704, "epoch": 199, "lr": 7.581728587637706e-05} +{"train_loss": 0.0030904700979590416, "global_step": 23705, "epoch": 199, "lr": 7.581538853238536e-05} +{"train_loss": 0.0044634691439569, "global_step": 23706, "epoch": 199, "lr": 7.581349113770788e-05} +{"train_loss": 0.003060980001464486, "global_step": 23707, "epoch": 199, "lr": 7.581159369234839e-05} +{"train_loss": 0.0049804882146418095, "global_step": 23708, "epoch": 199, "lr": 7.580969619631058e-05} +{"train_loss": 0.004551717080175877, "global_step": 23709, "epoch": 199, "lr": 7.580779864959818e-05} +{"train_loss": 0.006330490577965975, "global_step": 23710, "epoch": 199, "lr": 7.580590105221495e-05} +{"train_loss": 0.005170613527297974, "global_step": 23711, "epoch": 199, "lr": 7.580400340416456e-05} +{"train_loss": 0.0034066971857100725, "global_step": 23712, "epoch": 199, "lr": 7.580210570545078e-05} +{"train_loss": 0.0054854657500982285, "global_step": 23713, "epoch": 199, "lr": 7.580020795607731e-05} +{"train_loss": 0.004583870526403189, "global_step": 23714, "epoch": 199, "lr": 7.579831015604791e-05} +{"train_loss": 0.007627259939908981, "global_step": 23715, "epoch": 199, "lr": 7.579641230536627e-05} +{"train_loss": 0.004677537363022566, "global_step": 23716, "epoch": 199, "lr": 7.579451440403616e-05} +{"train_loss": 0.0032483928371220827, "global_step": 23717, "epoch": 199, "lr": 7.579261645206124e-05} +{"train_loss": 0.0031173357274383307, "global_step": 23718, "epoch": 199, "lr": 7.57907184494453e-05} +{"train_loss": 0.0036034772638231516, "global_step": 23719, "epoch": 199, "lr": 7.578882039619202e-05} +{"train_loss": 0.003414178267121315, "global_step": 23720, "epoch": 199, "lr": 7.578692229230515e-05} +{"train_loss": 0.0028271942865103483, "global_step": 23721, "epoch": 199, "lr": 7.578502413778841e-05} +{"train_loss": 0.0057694208808243275, "global_step": 23722, "epoch": 199, "lr": 7.578312593264554e-05} +{"train_loss": 0.004920510109513998, "global_step": 23723, "epoch": 199, "lr": 7.578122767688025e-05} +{"train_loss": 0.002978310454636812, "global_step": 23724, "epoch": 199, "lr": 7.577932937049627e-05} +{"train_loss": 0.00501225283369422, "global_step": 23725, "epoch": 199, "lr": 7.577743101349734e-05} +{"train_loss": 0.005173156503587961, "global_step": 23726, "epoch": 199, "lr": 7.577553260588717e-05} +{"train_loss": 0.0035051126033067703, "global_step": 23727, "epoch": 199, "lr": 7.57736341476695e-05} +{"train_loss": 0.0033466035965830088, "global_step": 23728, "epoch": 199, "lr": 7.577173563884804e-05} +{"train_loss": 0.003054544096812606, "global_step": 23729, "epoch": 199, "lr": 7.576983707942655e-05} +{"train_loss": 0.004426958970725536, "global_step": 23730, "epoch": 199, "lr": 7.576793846940873e-05} +{"train_loss": 0.004309663083404303, "global_step": 23731, "epoch": 199, "lr": 7.576603980879831e-05} +{"train_loss": 0.0030895217787474394, "global_step": 23732, "epoch": 199, "lr": 7.576414109759903e-05} +{"train_loss": 0.006054392084479332, "global_step": 23733, "epoch": 199, "lr": 7.576224233581462e-05} +{"train_loss": 0.0024602224584668875, "global_step": 23734, "epoch": 199, "lr": 7.576034352344879e-05} +{"train_loss": 0.0036425332073122263, "global_step": 23735, "epoch": 199, "lr": 7.575844466050528e-05} +{"train_loss": 0.005991027690470219, "global_step": 23736, "epoch": 199, "lr": 7.575654574698781e-05} +{"train_loss": 0.0045735836029052734, "global_step": 23737, "epoch": 199, "lr": 7.575464678290011e-05} +{"train_loss": 0.0030467042233794928, "global_step": 23738, "epoch": 199, "lr": 7.575274776824594e-05} +{"train_loss": 0.006419429089874029, "global_step": 23739, "epoch": 199, "lr": 7.575084870302898e-05} +{"train_loss": 0.00328933191485703, "global_step": 23740, "epoch": 199, "lr": 7.574894958725298e-05} +{"train_loss": 0.003014097921550274, "global_step": 23741, "epoch": 199, "lr": 7.574705042092167e-05} +{"train_loss": 0.004763366188853979, "global_step": 23742, "epoch": 199, "lr": 7.574515120403878e-05} +{"train_loss": 0.005171061959117651, "global_step": 23743, "epoch": 199, "lr": 7.574325193660803e-05} +{"train_loss": 0.0049578407779335976, "global_step": 23744, "epoch": 199, "lr": 7.574135261863315e-05} +{"train_loss": 0.005310020875185728, "global_step": 23745, "epoch": 199, "lr": 7.573945325011789e-05} +{"train_loss": 0.005310705862939358, "global_step": 23746, "epoch": 199, "lr": 7.573755383106595e-05} +{"train_loss": 0.004008439835160971, "global_step": 23747, "epoch": 199, "lr": 7.573565436148106e-05} +{"train_loss": 0.0038232370279729366, "global_step": 23748, "epoch": 199, "lr": 7.5733754841367e-05} +{"train_loss": 0.0026912232860922813, "global_step": 23749, "epoch": 199, "lr": 7.573185527072745e-05} +{"train_loss": 0.005752032622694969, "global_step": 23750, "epoch": 199, "lr": 7.572995564956613e-05} +{"train_loss": 0.0035962117835879326, "global_step": 23751, "epoch": 199, "lr": 7.572805597788681e-05} +{"train_loss": 0.004646200221031904, "global_step": 23752, "epoch": 199, "lr": 7.57261562556932e-05} +{"train_loss": 0.006495269481092691, "global_step": 23753, "epoch": 199, "lr": 7.572425648298902e-05} +{"train_loss": 0.0023846605326980352, "global_step": 23754, "epoch": 199, "lr": 7.572235665977802e-05} +{"train_loss": 0.006639084778726101, "global_step": 23755, "epoch": 199, "lr": 7.572045678606392e-05} +{"train_loss": 0.007732550147920847, "global_step": 23756, "epoch": 199, "lr": 7.571855686185045e-05} +{"train_loss": 0.0037316035013645887, "global_step": 23757, "epoch": 199, "lr": 7.571665688714134e-05} +{"train_loss": 0.0031677528750151396, "global_step": 23758, "epoch": 199, "lr": 7.571475686194032e-05} +{"train_loss": 0.004911520984023809, "global_step": 23759, "epoch": 199, "lr": 7.571285678625111e-05} +{"train_loss": 0.0032046025153249502, "global_step": 23760, "epoch": 199, "lr": 7.571095666007747e-05} +{"train_loss": 0.005274352617561817, "global_step": 23761, "epoch": 199, "lr": 7.57090564834231e-05} +{"train_loss": 0.005089753773063421, "global_step": 23762, "epoch": 199, "lr": 7.570715625629177e-05} +{"train_loss": 0.005162443500012159, "global_step": 23763, "epoch": 199, "lr": 7.570525597868716e-05} +{"train_loss": 0.004986319225281477, "global_step": 23764, "epoch": 199, "lr": 7.570335565061303e-05} +{"train_loss": 0.0033301906660199165, "global_step": 23765, "epoch": 199, "lr": 7.57014552720731e-05} +{"train_loss": 0.003635850502178073, "global_step": 23766, "epoch": 199, "lr": 7.569955484307114e-05} +{"train_loss": 0.003267139894887805, "global_step": 23767, "epoch": 199, "lr": 7.569765436361083e-05} +{"train_loss": 0.003867299063131213, "global_step": 23768, "epoch": 199, "lr": 7.569575383369592e-05} +{"train_loss": 0.003930846694856882, "global_step": 23769, "epoch": 199, "lr": 7.569385325333014e-05} +{"train_loss": 0.004974535200744867, "global_step": 23770, "epoch": 199, "lr": 7.569195262251722e-05} +{"train_loss": 0.0026443651877343655, "global_step": 23771, "epoch": 199, "lr": 7.56900519412609e-05} +{"train_loss": 0.004209491889923811, "global_step": 23772, "epoch": 199, "lr": 7.568815120956491e-05} +{"train_loss": 0.004336904268711805, "global_step": 23773, "epoch": 199, "lr": 7.5686250427433e-05} +{"train_loss": 0.0032143243588507175, "global_step": 23774, "epoch": 199, "lr": 7.568434959486886e-05} +{"train_loss": 0.004038155544549227, "global_step": 23775, "epoch": 199, "lr": 7.568244871187625e-05} +{"train_loss": 0.004636251367628574, "global_step": 23776, "epoch": 199, "lr": 7.568054777845887e-05} +{"train_loss": 0.0019526543328538537, "global_step": 23777, "epoch": 199, "lr": 7.567864679462051e-05} +{"train_loss": 0.004600523971021175, "global_step": 23778, "epoch": 199, "lr": 7.567674576036485e-05} +{"train_loss": 0.00579362828284502, "global_step": 23779, "epoch": 199, "lr": 7.567484467569566e-05} +{"train_loss": 0.005953413434326649, "global_step": 23780, "epoch": 199, "lr": 7.567294354061665e-05} +{"train_loss": 0.005021388176828623, "global_step": 23781, "epoch": 199, "lr": 7.567104235513156e-05} +{"train_loss": 0.002935594180598855, "global_step": 23782, "epoch": 199, "lr": 7.566914111924411e-05} +{"train_loss": 0.0038504351396113634, "global_step": 23783, "epoch": 199, "lr": 7.566723983295805e-05} +{"train_loss": 0.008120543323457241, "global_step": 23784, "epoch": 199, "lr": 7.566533849627711e-05} +{"train_loss": 0.0035881889052689075, "global_step": 23785, "epoch": 199, "lr": 7.566343710920503e-05} +{"train_loss": 0.0029669192153960466, "global_step": 23786, "epoch": 199, "lr": 7.56615356717455e-05} +{"train_loss": 0.006162751000374556, "global_step": 23787, "epoch": 199, "lr": 7.565963418390232e-05} +{"train_loss": 0.005191407632082701, "global_step": 23788, "epoch": 199, "lr": 7.565773264567918e-05} +{"train_loss": 0.004858188331127167, "global_step": 23789, "epoch": 199, "lr": 7.565583105707981e-05} +{"train_loss": 0.003799737896770239, "global_step": 23790, "epoch": 199, "lr": 7.565392941810796e-05} +{"train_loss": 0.0043752980418503284, "global_step": 23791, "epoch": 199, "lr": 7.565202772876739e-05} +{"train_loss": 0.0029033301398158073, "global_step": 23792, "epoch": 199, "lr": 7.565012598906176e-05} +{"train_loss": 0.003391435369849205, "global_step": 23793, "epoch": 199, "lr": 7.564822419899486e-05} +{"train_loss": 0.0032668153289705515, "global_step": 23794, "epoch": 199, "lr": 7.564632235857043e-05} +{"train_loss": 0.004849769175052643, "global_step": 23795, "epoch": 199, "lr": 7.564442046779217e-05} +{"train_loss": 0.004502353258430958, "global_step": 23796, "epoch": 199, "lr": 7.564251852666383e-05} +{"train_loss": 0.0043648649007081985, "global_step": 23797, "epoch": 199, "lr": 7.564061653518914e-05} +{"train_loss": 0.0047713578678667545, "global_step": 23798, "epoch": 199, "lr": 7.563871449337187e-05} +{"train_loss": 0.004360257586299935, "global_step": 23799, "epoch": 199, "lr": 7.56368124012157e-05, "val_loss": 0.017805948853492737} +{"train_loss": 0.005341766402125359, "global_step": 23800, "epoch": 200, "lr": 7.563491025872438e-05} +{"train_loss": 0.0034685395658016205, "global_step": 23801, "epoch": 200, "lr": 7.563300806590166e-05} +{"train_loss": 0.006437459494918585, "global_step": 23802, "epoch": 200, "lr": 7.563110582275129e-05} +{"train_loss": 0.0038659381680190563, "global_step": 23803, "epoch": 200, "lr": 7.562920352927693e-05} +{"train_loss": 0.0040706004947423935, "global_step": 23804, "epoch": 200, "lr": 7.562730118548242e-05} +{"train_loss": 0.005496670491993427, "global_step": 23805, "epoch": 200, "lr": 7.562539879137142e-05} +{"train_loss": 0.004981940612196922, "global_step": 23806, "epoch": 200, "lr": 7.562349634694769e-05} +{"train_loss": 0.004563218913972378, "global_step": 23807, "epoch": 200, "lr": 7.562159385221496e-05} +{"train_loss": 0.003955521155148745, "global_step": 23808, "epoch": 200, "lr": 7.561969130717697e-05} +{"train_loss": 0.005369225051254034, "global_step": 23809, "epoch": 200, "lr": 7.561778871183745e-05} +{"train_loss": 0.0041633835062384605, "global_step": 23810, "epoch": 200, "lr": 7.561588606620013e-05} +{"train_loss": 0.0038141701370477676, "global_step": 23811, "epoch": 200, "lr": 7.561398337026877e-05} +{"train_loss": 0.006236494053155184, "global_step": 23812, "epoch": 200, "lr": 7.561208062404708e-05} +{"train_loss": 0.004906888585537672, "global_step": 23813, "epoch": 200, "lr": 7.56101778275388e-05} +{"train_loss": 0.004808517172932625, "global_step": 23814, "epoch": 200, "lr": 7.560827498074768e-05} +{"train_loss": 0.003160219406709075, "global_step": 23815, "epoch": 200, "lr": 7.560637208367746e-05} +{"train_loss": 0.0022715453524142504, "global_step": 23816, "epoch": 200, "lr": 7.560446913633186e-05} +{"train_loss": 0.004316754173487425, "global_step": 23817, "epoch": 200, "lr": 7.560256613871462e-05} +{"train_loss": 0.0058715143240988255, "global_step": 23818, "epoch": 200, "lr": 7.560066309082946e-05} +{"train_loss": 0.006522009614855051, "global_step": 23819, "epoch": 200, "lr": 7.559875999268013e-05} +{"train_loss": 0.00255321292206645, "global_step": 23820, "epoch": 200, "lr": 7.55968568442704e-05} +{"train_loss": 0.003965162206441164, "global_step": 23821, "epoch": 200, "lr": 7.559495364560395e-05} +{"train_loss": 0.0045269327238202095, "global_step": 23822, "epoch": 200, "lr": 7.559305039668457e-05} +{"train_loss": 0.002952635521069169, "global_step": 23823, "epoch": 200, "lr": 7.559114709751595e-05} +{"train_loss": 0.00530929584056139, "global_step": 23824, "epoch": 200, "lr": 7.558924374810183e-05} +{"train_loss": 0.003203711239621043, "global_step": 23825, "epoch": 200, "lr": 7.5587340348446e-05} +{"train_loss": 0.004961017519235611, "global_step": 23826, "epoch": 200, "lr": 7.558543689855213e-05} +{"train_loss": 0.0038031665608286858, "global_step": 23827, "epoch": 200, "lr": 7.5583533398424e-05} +{"train_loss": 0.003877850715070963, "global_step": 23828, "epoch": 200, "lr": 7.558162984806534e-05} +{"train_loss": 0.0035851961001753807, "global_step": 23829, "epoch": 200, "lr": 7.557972624747988e-05} +{"train_loss": 0.005968139041215181, "global_step": 23830, "epoch": 200, "lr": 7.557782259667136e-05} +{"train_loss": 0.00420505041256547, "global_step": 23831, "epoch": 200, "lr": 7.557591889564352e-05} +{"train_loss": 0.0048327031545341015, "global_step": 23832, "epoch": 200, "lr": 7.557401514440009e-05} +{"train_loss": 0.0045704348012804985, "global_step": 23833, "epoch": 200, "lr": 7.557211134294482e-05} +{"train_loss": 0.0023841741494834423, "global_step": 23834, "epoch": 200, "lr": 7.557020749128144e-05} +{"train_loss": 0.004577990621328354, "global_step": 23835, "epoch": 200, "lr": 7.556830358941369e-05} +{"train_loss": 0.004033563192933798, "global_step": 23836, "epoch": 200, "lr": 7.556639963734531e-05} +{"train_loss": 0.004799370653927326, "global_step": 23837, "epoch": 200, "lr": 7.556449563508001e-05} +{"train_loss": 0.004832876846194267, "global_step": 23838, "epoch": 200, "lr": 7.556259158262157e-05} +{"train_loss": 0.004121121019124985, "global_step": 23839, "epoch": 200, "lr": 7.556068747997373e-05} +{"train_loss": 0.004633268341422081, "global_step": 23840, "epoch": 200, "lr": 7.55587833271402e-05} +{"train_loss": 0.004805443342775106, "global_step": 23841, "epoch": 200, "lr": 7.555687912412474e-05} +{"train_loss": 0.002900768769904971, "global_step": 23842, "epoch": 200, "lr": 7.555497487093107e-05} +{"train_loss": 0.0051513309590518475, "global_step": 23843, "epoch": 200, "lr": 7.555307056756291e-05} +{"train_loss": 0.005225385073572397, "global_step": 23844, "epoch": 200, "lr": 7.555116621402405e-05} +{"train_loss": 0.004570965655148029, "global_step": 23845, "epoch": 200, "lr": 7.554926181031821e-05} +{"train_loss": 0.003996401559561491, "global_step": 23846, "epoch": 200, "lr": 7.55473573564491e-05} +{"train_loss": 0.003636847250163555, "global_step": 23847, "epoch": 200, "lr": 7.55454528524205e-05} +{"train_loss": 0.004613763652741909, "global_step": 23848, "epoch": 200, "lr": 7.554354829823615e-05} +{"train_loss": 0.005466786213219166, "global_step": 23849, "epoch": 200, "lr": 7.554164369389975e-05} +{"train_loss": 0.00308590242639184, "global_step": 23850, "epoch": 200, "lr": 7.553973903941507e-05} +{"train_loss": 0.004198897164314985, "global_step": 23851, "epoch": 200, "lr": 7.553783433478582e-05} +{"train_loss": 0.004204561933875084, "global_step": 23852, "epoch": 200, "lr": 7.553592958001579e-05} +{"train_loss": 0.004319248255342245, "global_step": 23853, "epoch": 200, "lr": 7.553402477510867e-05} +{"train_loss": 0.0036497677210718393, "global_step": 23854, "epoch": 200, "lr": 7.553211992006824e-05} +{"train_loss": 0.004793956875801086, "global_step": 23855, "epoch": 200, "lr": 7.553021501489821e-05} +{"train_loss": 0.0021748910658061504, "global_step": 23856, "epoch": 200, "lr": 7.552831005960233e-05} +{"train_loss": 0.0019818858709186316, "global_step": 23857, "epoch": 200, "lr": 7.552640505418433e-05} +{"train_loss": 0.003768758149817586, "global_step": 23858, "epoch": 200, "lr": 7.552449999864797e-05} +{"train_loss": 0.004818724002689123, "global_step": 23859, "epoch": 200, "lr": 7.552259489299698e-05} +{"train_loss": 0.005662551149725914, "global_step": 23860, "epoch": 200, "lr": 7.552068973723511e-05} +{"train_loss": 0.003647233359515667, "global_step": 23861, "epoch": 200, "lr": 7.551878453136608e-05} +{"train_loss": 0.005583473015576601, "global_step": 23862, "epoch": 200, "lr": 7.551687927539365e-05} +{"train_loss": 0.005368412937968969, "global_step": 23863, "epoch": 200, "lr": 7.551497396932154e-05} +{"train_loss": 0.004037700593471527, "global_step": 23864, "epoch": 200, "lr": 7.551306861315352e-05} +{"train_loss": 0.0033339662477374077, "global_step": 23865, "epoch": 200, "lr": 7.551116320689332e-05} +{"train_loss": 0.0035664578899741173, "global_step": 23866, "epoch": 200, "lr": 7.550925775054466e-05} +{"train_loss": 0.004125307779759169, "global_step": 23867, "epoch": 200, "lr": 7.550735224411131e-05} +{"train_loss": 0.004409611690789461, "global_step": 23868, "epoch": 200, "lr": 7.5505446687597e-05} +{"train_loss": 0.001812517992220819, "global_step": 23869, "epoch": 200, "lr": 7.550354108100545e-05} +{"train_loss": 0.003437577746808529, "global_step": 23870, "epoch": 200, "lr": 7.550163542434046e-05} +{"train_loss": 0.004241946619004011, "global_step": 23871, "epoch": 200, "lr": 7.549972971760571e-05} +{"train_loss": 0.0031641435343772173, "global_step": 23872, "epoch": 200, "lr": 7.549782396080495e-05} +{"train_loss": 0.003820673795416951, "global_step": 23873, "epoch": 200, "lr": 7.549591815394196e-05} +{"train_loss": 0.0032558755483478308, "global_step": 23874, "epoch": 200, "lr": 7.549401229702045e-05} +{"train_loss": 0.0046512167900800705, "global_step": 23875, "epoch": 200, "lr": 7.549210639004417e-05} +{"train_loss": 0.005039537791162729, "global_step": 23876, "epoch": 200, "lr": 7.549020043301686e-05} +{"train_loss": 0.0038426558021456003, "global_step": 23877, "epoch": 200, "lr": 7.548829442594228e-05} +{"train_loss": 0.004848691169172525, "global_step": 23878, "epoch": 200, "lr": 7.548638836882412e-05} +{"train_loss": 0.0033939185086637735, "global_step": 23879, "epoch": 200, "lr": 7.54844822616662e-05} +{"train_loss": 0.007433382794260979, "global_step": 23880, "epoch": 200, "lr": 7.54825761044722e-05} +{"train_loss": 0.0022398275323212147, "global_step": 23881, "epoch": 200, "lr": 7.548066989724589e-05} +{"train_loss": 0.002793931169435382, "global_step": 23882, "epoch": 200, "lr": 7.5478763639991e-05} +{"train_loss": 0.0035129638854414225, "global_step": 23883, "epoch": 200, "lr": 7.547685733271129e-05} +{"train_loss": 0.004745009820908308, "global_step": 23884, "epoch": 200, "lr": 7.547495097541048e-05} +{"train_loss": 0.002882226835936308, "global_step": 23885, "epoch": 200, "lr": 7.547304456809234e-05} +{"train_loss": 0.0042229085229337215, "global_step": 23886, "epoch": 200, "lr": 7.54711381107606e-05} +{"train_loss": 0.003902237396687269, "global_step": 23887, "epoch": 200, "lr": 7.546923160341898e-05} +{"train_loss": 0.004011339042335749, "global_step": 23888, "epoch": 200, "lr": 7.546732504607128e-05} +{"train_loss": 0.004507133737206459, "global_step": 23889, "epoch": 200, "lr": 7.546541843872118e-05} +{"train_loss": 0.005528987850993872, "global_step": 23890, "epoch": 200, "lr": 7.546351178137245e-05} +{"train_loss": 0.004690233152359724, "global_step": 23891, "epoch": 200, "lr": 7.546160507402885e-05} +{"train_loss": 0.0031523301731795073, "global_step": 23892, "epoch": 200, "lr": 7.54596983166941e-05} +{"train_loss": 0.004817909561097622, "global_step": 23893, "epoch": 200, "lr": 7.545779150937195e-05} +{"train_loss": 0.0046872347593307495, "global_step": 23894, "epoch": 200, "lr": 7.545588465206615e-05} +{"train_loss": 0.004201734438538551, "global_step": 23895, "epoch": 200, "lr": 7.545397774478044e-05} +{"train_loss": 0.0051391273736953735, "global_step": 23896, "epoch": 200, "lr": 7.545207078751857e-05} +{"train_loss": 0.004505568649619818, "global_step": 23897, "epoch": 200, "lr": 7.545016378028426e-05} +{"train_loss": 0.004672493319958448, "global_step": 23898, "epoch": 200, "lr": 7.54482567230813e-05} +{"train_loss": 0.0039284988306462765, "global_step": 23899, "epoch": 200, "lr": 7.544634961591339e-05} +{"train_loss": 0.0034762010909616947, "global_step": 23900, "epoch": 200, "lr": 7.54444424587843e-05} +{"train_loss": 0.006305131129920483, "global_step": 23901, "epoch": 200, "lr": 7.544253525169776e-05} +{"train_loss": 0.0033203987404704094, "global_step": 23902, "epoch": 200, "lr": 7.54406279946575e-05} +{"train_loss": 0.006247868295758963, "global_step": 23903, "epoch": 200, "lr": 7.54387206876673e-05} +{"train_loss": 0.005591773893684149, "global_step": 23904, "epoch": 200, "lr": 7.543681333073092e-05} +{"train_loss": 0.004028446041047573, "global_step": 23905, "epoch": 200, "lr": 7.543490592385204e-05} +{"train_loss": 0.004121741745620966, "global_step": 23906, "epoch": 200, "lr": 7.543299846703444e-05} +{"train_loss": 0.0044955783523619175, "global_step": 23907, "epoch": 200, "lr": 7.543109096028187e-05} +{"train_loss": 0.0034494444262236357, "global_step": 23908, "epoch": 200, "lr": 7.542918340359808e-05} +{"train_loss": 0.004685809835791588, "global_step": 23909, "epoch": 200, "lr": 7.542727579698678e-05} +{"train_loss": 0.004183609504252672, "global_step": 23910, "epoch": 200, "lr": 7.542536814045177e-05} +{"train_loss": 0.0037826094776391983, "global_step": 23911, "epoch": 200, "lr": 7.542346043399676e-05} +{"train_loss": 0.006376040633767843, "global_step": 23912, "epoch": 200, "lr": 7.542155267762548e-05} +{"train_loss": 0.005270278546959162, "global_step": 23913, "epoch": 200, "lr": 7.541964487134171e-05} +{"train_loss": 0.004110765643417835, "global_step": 23914, "epoch": 200, "lr": 7.541773701514919e-05} +{"train_loss": 0.004012545105069876, "global_step": 23915, "epoch": 200, "lr": 7.541582910905165e-05} +{"train_loss": 0.004381460137665272, "global_step": 23916, "epoch": 200, "lr": 7.541392115305285e-05} +{"train_loss": 0.003284757724031806, "global_step": 23917, "epoch": 200, "lr": 7.541201314715653e-05} +{"train_loss": 0.004298893522525973, "global_step": 23918, "epoch": 200, "lr": 7.541010509136643e-05, "val_loss": 0.014795809052884579, "train_action_mse_error": 7.042320794425905e-05} +{"train_loss": 0.004212522879242897, "global_step": 23919, "epoch": 201, "lr": 7.540819698568631e-05} +{"train_loss": 0.004097840283066034, "global_step": 23920, "epoch": 201, "lr": 7.540628883011991e-05} +{"train_loss": 0.0028524112422019243, "global_step": 23921, "epoch": 201, "lr": 7.540438062467098e-05} +{"train_loss": 0.0038723857142031193, "global_step": 23922, "epoch": 201, "lr": 7.540247236934326e-05} +{"train_loss": 0.003550643101334572, "global_step": 23923, "epoch": 201, "lr": 7.54005640641405e-05} +{"train_loss": 0.004525999538600445, "global_step": 23924, "epoch": 201, "lr": 7.539865570906644e-05} +{"train_loss": 0.005970847327262163, "global_step": 23925, "epoch": 201, "lr": 7.539674730412485e-05} +{"train_loss": 0.003957177512347698, "global_step": 23926, "epoch": 201, "lr": 7.539483884931944e-05} +{"train_loss": 0.004328568931668997, "global_step": 23927, "epoch": 201, "lr": 7.539293034465398e-05} +{"train_loss": 0.004806009586900473, "global_step": 23928, "epoch": 201, "lr": 7.539102179013221e-05} +{"train_loss": 0.0044778259471058846, "global_step": 23929, "epoch": 201, "lr": 7.538911318575789e-05} +{"train_loss": 0.0056443228386342525, "global_step": 23930, "epoch": 201, "lr": 7.538720453153476e-05} +{"train_loss": 0.006247394252568483, "global_step": 23931, "epoch": 201, "lr": 7.538529582746657e-05} +{"train_loss": 0.004863074980676174, "global_step": 23932, "epoch": 201, "lr": 7.538338707355705e-05} +{"train_loss": 0.005058608949184418, "global_step": 23933, "epoch": 201, "lr": 7.538147826980997e-05} +{"train_loss": 0.005079843103885651, "global_step": 23934, "epoch": 201, "lr": 7.537956941622906e-05} +{"train_loss": 0.006507856771349907, "global_step": 23935, "epoch": 201, "lr": 7.53776605128181e-05} +{"train_loss": 0.004501061048358679, "global_step": 23936, "epoch": 201, "lr": 7.53757515595808e-05} +{"train_loss": 0.005918336100876331, "global_step": 23937, "epoch": 201, "lr": 7.537384255652092e-05} +{"train_loss": 0.0029307871591299772, "global_step": 23938, "epoch": 201, "lr": 7.53719335036422e-05} +{"train_loss": 0.004225072916597128, "global_step": 23939, "epoch": 201, "lr": 7.537002440094843e-05} +{"train_loss": 0.0031007465440779924, "global_step": 23940, "epoch": 201, "lr": 7.536811524844329e-05} +{"train_loss": 0.006862290669232607, "global_step": 23941, "epoch": 201, "lr": 7.53662060461306e-05} +{"train_loss": 0.004603510722517967, "global_step": 23942, "epoch": 201, "lr": 7.536429679401405e-05} +{"train_loss": 0.003501745406538248, "global_step": 23943, "epoch": 201, "lr": 7.536238749209742e-05} +{"train_loss": 0.005207243841141462, "global_step": 23944, "epoch": 201, "lr": 7.536047814038446e-05} +{"train_loss": 0.0053501552902162075, "global_step": 23945, "epoch": 201, "lr": 7.53585687388789e-05} +{"train_loss": 0.004929987248033285, "global_step": 23946, "epoch": 201, "lr": 7.53566592875845e-05} +{"train_loss": 0.004335725214332342, "global_step": 23947, "epoch": 201, "lr": 7.535474978650502e-05} +{"train_loss": 0.004424934275448322, "global_step": 23948, "epoch": 201, "lr": 7.53528402356442e-05} +{"train_loss": 0.005996451247483492, "global_step": 23949, "epoch": 201, "lr": 7.535093063500577e-05} +{"train_loss": 0.002845273120328784, "global_step": 23950, "epoch": 201, "lr": 7.534902098459351e-05} +{"train_loss": 0.006798925809562206, "global_step": 23951, "epoch": 201, "lr": 7.534711128441114e-05} +{"train_loss": 0.004284451715648174, "global_step": 23952, "epoch": 201, "lr": 7.534520153446244e-05} +{"train_loss": 0.00448695570230484, "global_step": 23953, "epoch": 201, "lr": 7.534329173475114e-05} +{"train_loss": 0.007677213288843632, "global_step": 23954, "epoch": 201, "lr": 7.534138188528099e-05} +{"train_loss": 0.0036213193088769913, "global_step": 23955, "epoch": 201, "lr": 7.533947198605575e-05} +{"train_loss": 0.005572138354182243, "global_step": 23956, "epoch": 201, "lr": 7.533756203707916e-05} +{"train_loss": 0.0029840071219950914, "global_step": 23957, "epoch": 201, "lr": 7.533565203835497e-05} +{"train_loss": 0.004274648614227772, "global_step": 23958, "epoch": 201, "lr": 7.533374198988694e-05} +{"train_loss": 0.0059400699101388454, "global_step": 23959, "epoch": 201, "lr": 7.533183189167882e-05} +{"train_loss": 0.005557929631322622, "global_step": 23960, "epoch": 201, "lr": 7.532992174373434e-05} +{"train_loss": 0.0048264628276228905, "global_step": 23961, "epoch": 201, "lr": 7.532801154605728e-05} +{"train_loss": 0.004549062345176935, "global_step": 23962, "epoch": 201, "lr": 7.532610129865137e-05} +{"train_loss": 0.0064408546313643456, "global_step": 23963, "epoch": 201, "lr": 7.532419100152034e-05} +{"train_loss": 0.003353926818817854, "global_step": 23964, "epoch": 201, "lr": 7.5322280654668e-05} +{"train_loss": 0.005046309437602758, "global_step": 23965, "epoch": 201, "lr": 7.532037025809806e-05} +{"train_loss": 0.005361715331673622, "global_step": 23966, "epoch": 201, "lr": 7.531845981181427e-05} +{"train_loss": 0.005735080223530531, "global_step": 23967, "epoch": 201, "lr": 7.531654931582039e-05} +{"train_loss": 0.004460996016860008, "global_step": 23968, "epoch": 201, "lr": 7.531463877012018e-05} +{"train_loss": 0.002964896848425269, "global_step": 23969, "epoch": 201, "lr": 7.531272817471737e-05} +{"train_loss": 0.0044390237890183926, "global_step": 23970, "epoch": 201, "lr": 7.531081752961572e-05} +{"train_loss": 0.004033179953694344, "global_step": 23971, "epoch": 201, "lr": 7.5308906834819e-05} +{"train_loss": 0.007620217744261026, "global_step": 23972, "epoch": 201, "lr": 7.530699609033093e-05} +{"train_loss": 0.0027862542774528265, "global_step": 23973, "epoch": 201, "lr": 7.53050852961553e-05} +{"train_loss": 0.003396029118448496, "global_step": 23974, "epoch": 201, "lr": 7.530317445229582e-05} +{"train_loss": 0.006417158525437117, "global_step": 23975, "epoch": 201, "lr": 7.530126355875626e-05} +{"train_loss": 0.004986586049199104, "global_step": 23976, "epoch": 201, "lr": 7.529935261554036e-05} +{"train_loss": 0.007459389045834541, "global_step": 23977, "epoch": 201, "lr": 7.529744162265191e-05} +{"train_loss": 0.003975174855440855, "global_step": 23978, "epoch": 201, "lr": 7.529553058009462e-05} +{"train_loss": 0.005363767966628075, "global_step": 23979, "epoch": 201, "lr": 7.529361948787227e-05} +{"train_loss": 0.004625724162906408, "global_step": 23980, "epoch": 201, "lr": 7.529170834598859e-05} +{"train_loss": 0.002538231434300542, "global_step": 23981, "epoch": 201, "lr": 7.528979715444735e-05} +{"train_loss": 0.004246070049703121, "global_step": 23982, "epoch": 201, "lr": 7.528788591325229e-05} +{"train_loss": 0.005912341643124819, "global_step": 23983, "epoch": 201, "lr": 7.528597462240716e-05} +{"train_loss": 0.003172317985445261, "global_step": 23984, "epoch": 201, "lr": 7.528406328191572e-05} +{"train_loss": 0.005602399352937937, "global_step": 23985, "epoch": 201, "lr": 7.528215189178173e-05} +{"train_loss": 0.005906702484935522, "global_step": 23986, "epoch": 201, "lr": 7.528024045200896e-05} +{"train_loss": 0.00608332734555006, "global_step": 23987, "epoch": 201, "lr": 7.52783289626011e-05} +{"train_loss": 0.003594778012484312, "global_step": 23988, "epoch": 201, "lr": 7.527641742356196e-05} +{"train_loss": 0.004934309981763363, "global_step": 23989, "epoch": 201, "lr": 7.527450583489528e-05} +{"train_loss": 0.003951913211494684, "global_step": 23990, "epoch": 201, "lr": 7.52725941966048e-05} +{"train_loss": 0.007868710905313492, "global_step": 23991, "epoch": 201, "lr": 7.527068250869427e-05} +{"train_loss": 0.003962891176342964, "global_step": 23992, "epoch": 201, "lr": 7.526877077116747e-05} +{"train_loss": 0.0052433558739721775, "global_step": 23993, "epoch": 201, "lr": 7.526685898402813e-05} +{"train_loss": 0.0036520028952509165, "global_step": 23994, "epoch": 201, "lr": 7.526494714728002e-05} +{"train_loss": 0.005613110493868589, "global_step": 23995, "epoch": 201, "lr": 7.526303526092688e-05} +{"train_loss": 0.006528803613036871, "global_step": 23996, "epoch": 201, "lr": 7.526112332497246e-05} +{"train_loss": 0.004745739512145519, "global_step": 23997, "epoch": 201, "lr": 7.525921133942054e-05} +{"train_loss": 0.003485009539872408, "global_step": 23998, "epoch": 201, "lr": 7.525729930427485e-05} +{"train_loss": 0.0026486669667065144, "global_step": 23999, "epoch": 201, "lr": 7.525538721953916e-05} +{"train_loss": 0.004359539598226547, "global_step": 24000, "epoch": 201, "lr": 7.525347508521721e-05} +{"train_loss": 0.006653620861470699, "global_step": 24001, "epoch": 201, "lr": 7.525156290131275e-05} +{"train_loss": 0.0029426414985209703, "global_step": 24002, "epoch": 201, "lr": 7.524965066782955e-05} +{"train_loss": 0.00463680736720562, "global_step": 24003, "epoch": 201, "lr": 7.524773838477136e-05} +{"train_loss": 0.005217964295297861, "global_step": 24004, "epoch": 201, "lr": 7.524582605214195e-05} +{"train_loss": 0.004163214471191168, "global_step": 24005, "epoch": 201, "lr": 7.524391366994504e-05} +{"train_loss": 0.005172590259462595, "global_step": 24006, "epoch": 201, "lr": 7.52420012381844e-05} +{"train_loss": 0.006073770113289356, "global_step": 24007, "epoch": 201, "lr": 7.524008875686377e-05} +{"train_loss": 0.005155051592737436, "global_step": 24008, "epoch": 201, "lr": 7.523817622598694e-05} +{"train_loss": 0.004809832666069269, "global_step": 24009, "epoch": 201, "lr": 7.523626364555765e-05} +{"train_loss": 0.003766498528420925, "global_step": 24010, "epoch": 201, "lr": 7.523435101557964e-05} +{"train_loss": 0.0036878103855997324, "global_step": 24011, "epoch": 201, "lr": 7.523243833605672e-05} +{"train_loss": 0.005641398020088673, "global_step": 24012, "epoch": 201, "lr": 7.523052560699255e-05} +{"train_loss": 0.0038569460157305002, "global_step": 24013, "epoch": 201, "lr": 7.522861282839097e-05} +{"train_loss": 0.007317522540688515, "global_step": 24014, "epoch": 201, "lr": 7.522670000025569e-05} +{"train_loss": 0.0038777601439505816, "global_step": 24015, "epoch": 201, "lr": 7.522478712259049e-05} +{"train_loss": 0.0057547674514353275, "global_step": 24016, "epoch": 201, "lr": 7.522287419539911e-05} +{"train_loss": 0.0038895991165190935, "global_step": 24017, "epoch": 201, "lr": 7.522096121868531e-05} +{"train_loss": 0.0052929287776350975, "global_step": 24018, "epoch": 201, "lr": 7.521904819245285e-05} +{"train_loss": 0.006098554935306311, "global_step": 24019, "epoch": 201, "lr": 7.521713511670547e-05} +{"train_loss": 0.004193289205431938, "global_step": 24020, "epoch": 201, "lr": 7.521522199144694e-05} +{"train_loss": 0.0028623908292502165, "global_step": 24021, "epoch": 201, "lr": 7.521330881668105e-05} +{"train_loss": 0.006648232229053974, "global_step": 24022, "epoch": 201, "lr": 7.521139559241148e-05} +{"train_loss": 0.004200272262096405, "global_step": 24023, "epoch": 201, "lr": 7.520948231864206e-05} +{"train_loss": 0.003190945601090789, "global_step": 24024, "epoch": 201, "lr": 7.52075689953765e-05} +{"train_loss": 0.00453362800180912, "global_step": 24025, "epoch": 201, "lr": 7.520565562261857e-05} +{"train_loss": 0.004785265773534775, "global_step": 24026, "epoch": 201, "lr": 7.520374220037203e-05} +{"train_loss": 0.004027937538921833, "global_step": 24027, "epoch": 201, "lr": 7.520182872864063e-05} +{"train_loss": 0.004815069492906332, "global_step": 24028, "epoch": 201, "lr": 7.519991520742812e-05} +{"train_loss": 0.004326550755649805, "global_step": 24029, "epoch": 201, "lr": 7.51980016367383e-05} +{"train_loss": 0.0022195209749042988, "global_step": 24030, "epoch": 201, "lr": 7.519608801657488e-05} +{"train_loss": 0.0029194694943726063, "global_step": 24031, "epoch": 201, "lr": 7.519417434694164e-05} +{"train_loss": 0.006287890020757914, "global_step": 24032, "epoch": 201, "lr": 7.519226062784233e-05} +{"train_loss": 0.004739660304039717, "global_step": 24033, "epoch": 201, "lr": 7.51903468592807e-05} +{"train_loss": 0.00376434950158, "global_step": 24034, "epoch": 201, "lr": 7.518843304126051e-05} +{"train_loss": 0.0053739603608846664, "global_step": 24035, "epoch": 201, "lr": 7.518651917378551e-05} +{"train_loss": 0.003293209010735154, "global_step": 24036, "epoch": 201, "lr": 7.518460525685951e-05} +{"train_loss": 0.004738292697926655, "global_step": 24037, "epoch": 201, "lr": 7.518269129048621e-05, "val_loss": 0.018118660897016525} +{"train_loss": 0.0038211203645914793, "global_step": 24038, "epoch": 202, "lr": 7.518077727466939e-05} +{"train_loss": 0.0031881306786090136, "global_step": 24039, "epoch": 202, "lr": 7.517886320941278e-05} +{"train_loss": 0.005943809170275927, "global_step": 24040, "epoch": 202, "lr": 7.51769490947202e-05} +{"train_loss": 0.006639253813773394, "global_step": 24041, "epoch": 202, "lr": 7.517503493059535e-05} +{"train_loss": 0.004594071768224239, "global_step": 24042, "epoch": 202, "lr": 7.517312071704199e-05} +{"train_loss": 0.003688092576339841, "global_step": 24043, "epoch": 202, "lr": 7.517120645406393e-05} +{"train_loss": 0.003678579581901431, "global_step": 24044, "epoch": 202, "lr": 7.516929214166487e-05} +{"train_loss": 0.0034544002264738083, "global_step": 24045, "epoch": 202, "lr": 7.516737777984862e-05} +{"train_loss": 0.004623860120773315, "global_step": 24046, "epoch": 202, "lr": 7.516546336861888e-05} +{"train_loss": 0.005666918121278286, "global_step": 24047, "epoch": 202, "lr": 7.516354890797945e-05} +{"train_loss": 0.002525885356590152, "global_step": 24048, "epoch": 202, "lr": 7.516163439793411e-05} +{"train_loss": 0.00416614580899477, "global_step": 24049, "epoch": 202, "lr": 7.515971983848656e-05} +{"train_loss": 0.005181525833904743, "global_step": 24050, "epoch": 202, "lr": 7.51578052296406e-05} +{"train_loss": 0.005374853033572435, "global_step": 24051, "epoch": 202, "lr": 7.515589057139997e-05} +{"train_loss": 0.005072189029306173, "global_step": 24052, "epoch": 202, "lr": 7.515397586376845e-05} +{"train_loss": 0.004154148977249861, "global_step": 24053, "epoch": 202, "lr": 7.515206110674976e-05} +{"train_loss": 0.0037170597352087498, "global_step": 24054, "epoch": 202, "lr": 7.51501463003477e-05} +{"train_loss": 0.004700045101344585, "global_step": 24055, "epoch": 202, "lr": 7.514823144456602e-05} +{"train_loss": 0.004063215106725693, "global_step": 24056, "epoch": 202, "lr": 7.514631653940847e-05} +{"train_loss": 0.004013598896563053, "global_step": 24057, "epoch": 202, "lr": 7.51444015848788e-05} +{"train_loss": 0.00583123741671443, "global_step": 24058, "epoch": 202, "lr": 7.514248658098081e-05} +{"train_loss": 0.0025653669144958258, "global_step": 24059, "epoch": 202, "lr": 7.514057152771822e-05} +{"train_loss": 0.0037371080834418535, "global_step": 24060, "epoch": 202, "lr": 7.513865642509479e-05} +{"train_loss": 0.004037849139422178, "global_step": 24061, "epoch": 202, "lr": 7.513674127311432e-05} +{"train_loss": 0.006094405427575111, "global_step": 24062, "epoch": 202, "lr": 7.513482607178054e-05} +{"train_loss": 0.004949965514242649, "global_step": 24063, "epoch": 202, "lr": 7.513291082109719e-05} +{"train_loss": 0.004763755481690168, "global_step": 24064, "epoch": 202, "lr": 7.513099552106807e-05} +{"train_loss": 0.0038394969888031483, "global_step": 24065, "epoch": 202, "lr": 7.512908017169694e-05} +{"train_loss": 0.004088849760591984, "global_step": 24066, "epoch": 202, "lr": 7.512716477298752e-05} +{"train_loss": 0.003074167063459754, "global_step": 24067, "epoch": 202, "lr": 7.512524932494361e-05} +{"train_loss": 0.004673383664339781, "global_step": 24068, "epoch": 202, "lr": 7.512333382756896e-05} +{"train_loss": 0.004395927302539349, "global_step": 24069, "epoch": 202, "lr": 7.512141828086731e-05} +{"train_loss": 0.004594644531607628, "global_step": 24070, "epoch": 202, "lr": 7.511950268484245e-05} +{"train_loss": 0.004558177199214697, "global_step": 24071, "epoch": 202, "lr": 7.511758703949814e-05} +{"train_loss": 0.005909211467951536, "global_step": 24072, "epoch": 202, "lr": 7.511567134483812e-05} +{"train_loss": 0.004914828576147556, "global_step": 24073, "epoch": 202, "lr": 7.511375560086617e-05} +{"train_loss": 0.003873926354572177, "global_step": 24074, "epoch": 202, "lr": 7.511183980758604e-05} +{"train_loss": 0.002720222342759371, "global_step": 24075, "epoch": 202, "lr": 7.510992396500149e-05} +{"train_loss": 0.0033709099516272545, "global_step": 24076, "epoch": 202, "lr": 7.510800807311629e-05} +{"train_loss": 0.0028012662660330534, "global_step": 24077, "epoch": 202, "lr": 7.51060921319342e-05} +{"train_loss": 0.005714822094887495, "global_step": 24078, "epoch": 202, "lr": 7.510417614145898e-05} +{"train_loss": 0.004225195851176977, "global_step": 24079, "epoch": 202, "lr": 7.510226010169439e-05} +{"train_loss": 0.0067170546390116215, "global_step": 24080, "epoch": 202, "lr": 7.510034401264421e-05} +{"train_loss": 0.005795726086944342, "global_step": 24081, "epoch": 202, "lr": 7.509842787431217e-05} +{"train_loss": 0.0030320065561681986, "global_step": 24082, "epoch": 202, "lr": 7.509651168670206e-05} +{"train_loss": 0.004397566895931959, "global_step": 24083, "epoch": 202, "lr": 7.509459544981761e-05} +{"train_loss": 0.004350969102233648, "global_step": 24084, "epoch": 202, "lr": 7.509267916366261e-05} +{"train_loss": 0.00358401145786047, "global_step": 24085, "epoch": 202, "lr": 7.509076282824083e-05} +{"train_loss": 0.004837432410567999, "global_step": 24086, "epoch": 202, "lr": 7.5088846443556e-05} +{"train_loss": 0.004898553714156151, "global_step": 24087, "epoch": 202, "lr": 7.508693000961192e-05} +{"train_loss": 0.003980543464422226, "global_step": 24088, "epoch": 202, "lr": 7.508501352641232e-05} +{"train_loss": 0.0033573266118764877, "global_step": 24089, "epoch": 202, "lr": 7.508309699396097e-05} +{"train_loss": 0.0049690380692481995, "global_step": 24090, "epoch": 202, "lr": 7.508118041226164e-05} +{"train_loss": 0.006604385562241077, "global_step": 24091, "epoch": 202, "lr": 7.507926378131811e-05} +{"train_loss": 0.001897594891488552, "global_step": 24092, "epoch": 202, "lr": 7.507734710113412e-05} +{"train_loss": 0.0033696715254336596, "global_step": 24093, "epoch": 202, "lr": 7.507543037171341e-05} +{"train_loss": 0.003691502148285508, "global_step": 24094, "epoch": 202, "lr": 7.50735135930598e-05} +{"train_loss": 0.003679670626297593, "global_step": 24095, "epoch": 202, "lr": 7.507159676517702e-05} +{"train_loss": 0.0032166920136660337, "global_step": 24096, "epoch": 202, "lr": 7.506967988806883e-05} +{"train_loss": 0.007586686871945858, "global_step": 24097, "epoch": 202, "lr": 7.506776296173901e-05} +{"train_loss": 0.0029487009160220623, "global_step": 24098, "epoch": 202, "lr": 7.506584598619131e-05} +{"train_loss": 0.004270584788173437, "global_step": 24099, "epoch": 202, "lr": 7.50639289614295e-05} +{"train_loss": 0.00491316756233573, "global_step": 24100, "epoch": 202, "lr": 7.506201188745735e-05} +{"train_loss": 0.0033316751942038536, "global_step": 24101, "epoch": 202, "lr": 7.506009476427861e-05} +{"train_loss": 0.004656163509935141, "global_step": 24102, "epoch": 202, "lr": 7.505817759189705e-05} +{"train_loss": 0.0039060255512595177, "global_step": 24103, "epoch": 202, "lr": 7.505626037031643e-05} +{"train_loss": 0.00650859484449029, "global_step": 24104, "epoch": 202, "lr": 7.505434309954054e-05} +{"train_loss": 0.004377027973532677, "global_step": 24105, "epoch": 202, "lr": 7.505242577957312e-05} +{"train_loss": 0.004435961600393057, "global_step": 24106, "epoch": 202, "lr": 7.505050841041791e-05} +{"train_loss": 0.0023544305004179478, "global_step": 24107, "epoch": 202, "lr": 7.504859099207874e-05} +{"train_loss": 0.007551733870059252, "global_step": 24108, "epoch": 202, "lr": 7.504667352455931e-05} +{"train_loss": 0.003371280850842595, "global_step": 24109, "epoch": 202, "lr": 7.504475600786343e-05} +{"train_loss": 0.006180991418659687, "global_step": 24110, "epoch": 202, "lr": 7.504283844199483e-05} +{"train_loss": 0.0032648106571286917, "global_step": 24111, "epoch": 202, "lr": 7.50409208269573e-05} +{"train_loss": 0.005379204172641039, "global_step": 24112, "epoch": 202, "lr": 7.50390031627546e-05} +{"train_loss": 0.004603898152709007, "global_step": 24113, "epoch": 202, "lr": 7.50370854493905e-05} +{"train_loss": 0.006080091465264559, "global_step": 24114, "epoch": 202, "lr": 7.503516768686876e-05} +{"train_loss": 0.0028717454988509417, "global_step": 24115, "epoch": 202, "lr": 7.503324987519313e-05} +{"train_loss": 0.004503978416323662, "global_step": 24116, "epoch": 202, "lr": 7.503133201436738e-05} +{"train_loss": 0.008525492623448372, "global_step": 24117, "epoch": 202, "lr": 7.50294141043953e-05} +{"train_loss": 0.005673413164913654, "global_step": 24118, "epoch": 202, "lr": 7.502749614528065e-05} +{"train_loss": 0.0063101863488554955, "global_step": 24119, "epoch": 202, "lr": 7.502557813702715e-05} +{"train_loss": 0.004168140236288309, "global_step": 24120, "epoch": 202, "lr": 7.502366007963863e-05} +{"train_loss": 0.00924825668334961, "global_step": 24121, "epoch": 202, "lr": 7.502174197311882e-05} +{"train_loss": 0.004259507637470961, "global_step": 24122, "epoch": 202, "lr": 7.501982381747148e-05} +{"train_loss": 0.0053697871044278145, "global_step": 24123, "epoch": 202, "lr": 7.501790561270041e-05} +{"train_loss": 0.006182060576975346, "global_step": 24124, "epoch": 202, "lr": 7.501598735880934e-05} +{"train_loss": 0.004171724896878004, "global_step": 24125, "epoch": 202, "lr": 7.501406905580205e-05} +{"train_loss": 0.00406083045527339, "global_step": 24126, "epoch": 202, "lr": 7.50121507036823e-05} +{"train_loss": 0.005284549668431282, "global_step": 24127, "epoch": 202, "lr": 7.501023230245389e-05} +{"train_loss": 0.002868028823286295, "global_step": 24128, "epoch": 202, "lr": 7.500831385212055e-05} +{"train_loss": 0.006239808164536953, "global_step": 24129, "epoch": 202, "lr": 7.500639535268605e-05} +{"train_loss": 0.0038365451619029045, "global_step": 24130, "epoch": 202, "lr": 7.500447680415417e-05} +{"train_loss": 0.0026328549720346928, "global_step": 24131, "epoch": 202, "lr": 7.500255820652869e-05} +{"train_loss": 0.004510947968810797, "global_step": 24132, "epoch": 202, "lr": 7.500063955981333e-05} +{"train_loss": 0.004244569689035416, "global_step": 24133, "epoch": 202, "lr": 7.499872086401189e-05} +{"train_loss": 0.004502726718783379, "global_step": 24134, "epoch": 202, "lr": 7.499680211912814e-05} +{"train_loss": 0.004209426697343588, "global_step": 24135, "epoch": 202, "lr": 7.499488332516583e-05} +{"train_loss": 0.005643815267831087, "global_step": 24136, "epoch": 202, "lr": 7.499296448212875e-05} +{"train_loss": 0.005632029380649328, "global_step": 24137, "epoch": 202, "lr": 7.499104559002065e-05} +{"train_loss": 0.004156522452831268, "global_step": 24138, "epoch": 202, "lr": 7.49891266488453e-05} +{"train_loss": 0.005006888881325722, "global_step": 24139, "epoch": 202, "lr": 7.498720765860646e-05} +{"train_loss": 0.00456432206556201, "global_step": 24140, "epoch": 202, "lr": 7.498528861930792e-05} +{"train_loss": 0.004559116438031197, "global_step": 24141, "epoch": 202, "lr": 7.498336953095343e-05} +{"train_loss": 0.005131728947162628, "global_step": 24142, "epoch": 202, "lr": 7.498145039354676e-05} +{"train_loss": 0.004277854226529598, "global_step": 24143, "epoch": 202, "lr": 7.497953120709169e-05} +{"train_loss": 0.005018509924411774, "global_step": 24144, "epoch": 202, "lr": 7.497761197159197e-05} +{"train_loss": 0.005286966450512409, "global_step": 24145, "epoch": 202, "lr": 7.497569268705137e-05} +{"train_loss": 0.00505549693480134, "global_step": 24146, "epoch": 202, "lr": 7.497377335347368e-05} +{"train_loss": 0.0028116763569414616, "global_step": 24147, "epoch": 202, "lr": 7.497185397086266e-05} +{"train_loss": 0.004686618689447641, "global_step": 24148, "epoch": 202, "lr": 7.496993453922207e-05} +{"train_loss": 0.0027490402571856976, "global_step": 24149, "epoch": 202, "lr": 7.496801505855567e-05} +{"train_loss": 0.008365867659449577, "global_step": 24150, "epoch": 202, "lr": 7.496609552886725e-05} +{"train_loss": 0.00410899892449379, "global_step": 24151, "epoch": 202, "lr": 7.496417595016057e-05} +{"train_loss": 0.00832541286945343, "global_step": 24152, "epoch": 202, "lr": 7.496225632243938e-05} +{"train_loss": 0.004614061675965786, "global_step": 24153, "epoch": 202, "lr": 7.496033664570747e-05} +{"train_loss": 0.0032945575658231974, "global_step": 24154, "epoch": 202, "lr": 7.495841691996862e-05} +{"train_loss": 0.005114133469760418, "global_step": 24155, "epoch": 202, "lr": 7.495649714522659e-05} +{"train_loss": 0.004601606819387369, "global_step": 24156, "epoch": 202, "lr": 7.495457732148513e-05, "val_loss": 0.013778980821371078} +{"train_loss": 0.006361141335219145, "global_step": 24157, "epoch": 203, "lr": 7.495265744874803e-05} +{"train_loss": 0.003279113909229636, "global_step": 24158, "epoch": 203, "lr": 7.495073752701904e-05} +{"train_loss": 0.003104271600022912, "global_step": 24159, "epoch": 203, "lr": 7.494881755630194e-05} +{"train_loss": 0.005379919894039631, "global_step": 24160, "epoch": 203, "lr": 7.494689753660051e-05} +{"train_loss": 0.005551617126911879, "global_step": 24161, "epoch": 203, "lr": 7.494497746791853e-05} +{"train_loss": 0.005933521781116724, "global_step": 24162, "epoch": 203, "lr": 7.494305735025973e-05} +{"train_loss": 0.004553226754069328, "global_step": 24163, "epoch": 203, "lr": 7.494113718362791e-05} +{"train_loss": 0.008912362158298492, "global_step": 24164, "epoch": 203, "lr": 7.493921696802683e-05} +{"train_loss": 0.0038765992503613234, "global_step": 24165, "epoch": 203, "lr": 7.493729670346025e-05} +{"train_loss": 0.004197500646114349, "global_step": 24166, "epoch": 203, "lr": 7.493537638993197e-05} +{"train_loss": 0.005341959185898304, "global_step": 24167, "epoch": 203, "lr": 7.493345602744574e-05} +{"train_loss": 0.0030782718677073717, "global_step": 24168, "epoch": 203, "lr": 7.493153561600534e-05} +{"train_loss": 0.002691013505682349, "global_step": 24169, "epoch": 203, "lr": 7.492961515561452e-05} +{"train_loss": 0.0024598867166787386, "global_step": 24170, "epoch": 203, "lr": 7.492769464627707e-05} +{"train_loss": 0.005907702725380659, "global_step": 24171, "epoch": 203, "lr": 7.492577408799675e-05} +{"train_loss": 0.0035902380477637053, "global_step": 24172, "epoch": 203, "lr": 7.492385348077733e-05} +{"train_loss": 0.005407909397035837, "global_step": 24173, "epoch": 203, "lr": 7.49219328246226e-05} +{"train_loss": 0.004063781350851059, "global_step": 24174, "epoch": 203, "lr": 7.492001211953631e-05} +{"train_loss": 0.0038474611937999725, "global_step": 24175, "epoch": 203, "lr": 7.491809136552223e-05} +{"train_loss": 0.005982957314699888, "global_step": 24176, "epoch": 203, "lr": 7.491617056258416e-05} +{"train_loss": 0.004423798993229866, "global_step": 24177, "epoch": 203, "lr": 7.491424971072582e-05} +{"train_loss": 0.00576526066288352, "global_step": 24178, "epoch": 203, "lr": 7.491232880995103e-05} +{"train_loss": 0.003471741685643792, "global_step": 24179, "epoch": 203, "lr": 7.491040786026356e-05} +{"train_loss": 0.005601567681878805, "global_step": 24180, "epoch": 203, "lr": 7.490848686166716e-05} +{"train_loss": 0.0023561615962535143, "global_step": 24181, "epoch": 203, "lr": 7.49065658141656e-05} +{"train_loss": 0.0029566234443336725, "global_step": 24182, "epoch": 203, "lr": 7.490464471776266e-05} +{"train_loss": 0.004361151251941919, "global_step": 24183, "epoch": 203, "lr": 7.49027235724621e-05} +{"train_loss": 0.004756435751914978, "global_step": 24184, "epoch": 203, "lr": 7.490080237826771e-05} +{"train_loss": 0.002935998374596238, "global_step": 24185, "epoch": 203, "lr": 7.489888113518325e-05} +{"train_loss": 0.003452312434092164, "global_step": 24186, "epoch": 203, "lr": 7.489695984321252e-05} +{"train_loss": 0.0056841010227799416, "global_step": 24187, "epoch": 203, "lr": 7.489503850235925e-05} +{"train_loss": 0.005289201159030199, "global_step": 24188, "epoch": 203, "lr": 7.489311711262723e-05} +{"train_loss": 0.003708776319399476, "global_step": 24189, "epoch": 203, "lr": 7.489119567402023e-05} +{"train_loss": 0.0040079206228256226, "global_step": 24190, "epoch": 203, "lr": 7.488927418654204e-05} +{"train_loss": 0.003755175741389394, "global_step": 24191, "epoch": 203, "lr": 7.48873526501964e-05} +{"train_loss": 0.002175494795665145, "global_step": 24192, "epoch": 203, "lr": 7.488543106498712e-05} +{"train_loss": 0.0031040043104439974, "global_step": 24193, "epoch": 203, "lr": 7.488350943091795e-05} +{"train_loss": 0.004460049327462912, "global_step": 24194, "epoch": 203, "lr": 7.488158774799268e-05} +{"train_loss": 0.005696197040379047, "global_step": 24195, "epoch": 203, "lr": 7.487966601621505e-05} +{"train_loss": 0.005124785006046295, "global_step": 24196, "epoch": 203, "lr": 7.487774423558887e-05} +{"train_loss": 0.004590216558426619, "global_step": 24197, "epoch": 203, "lr": 7.487582240611787e-05} +{"train_loss": 0.005003310739994049, "global_step": 24198, "epoch": 203, "lr": 7.487390052780588e-05} +{"train_loss": 0.004314780700951815, "global_step": 24199, "epoch": 203, "lr": 7.487197860065664e-05} +{"train_loss": 0.006124147679656744, "global_step": 24200, "epoch": 203, "lr": 7.487005662467392e-05} +{"train_loss": 0.0059731570072472095, "global_step": 24201, "epoch": 203, "lr": 7.486813459986149e-05} +{"train_loss": 0.003139193868264556, "global_step": 24202, "epoch": 203, "lr": 7.486621252622314e-05} +{"train_loss": 0.005268468987196684, "global_step": 24203, "epoch": 203, "lr": 7.486429040376266e-05} +{"train_loss": 0.007915115915238857, "global_step": 24204, "epoch": 203, "lr": 7.486236823248379e-05} +{"train_loss": 0.0041265892796218395, "global_step": 24205, "epoch": 203, "lr": 7.486044601239031e-05} +{"train_loss": 0.004635538440197706, "global_step": 24206, "epoch": 203, "lr": 7.485852374348599e-05} +{"train_loss": 0.0054535893723368645, "global_step": 24207, "epoch": 203, "lr": 7.485660142577462e-05} +{"train_loss": 0.006647717673331499, "global_step": 24208, "epoch": 203, "lr": 7.485467905925998e-05} +{"train_loss": 0.003790725953876972, "global_step": 24209, "epoch": 203, "lr": 7.485275664394583e-05} +{"train_loss": 0.004719350021332502, "global_step": 24210, "epoch": 203, "lr": 7.485083417983594e-05} +{"train_loss": 0.004502056632190943, "global_step": 24211, "epoch": 203, "lr": 7.484891166693411e-05} +{"train_loss": 0.004571387078613043, "global_step": 24212, "epoch": 203, "lr": 7.484698910524407e-05} +{"train_loss": 0.003961808048188686, "global_step": 24213, "epoch": 203, "lr": 7.484506649476964e-05} +{"train_loss": 0.0030129519291222095, "global_step": 24214, "epoch": 203, "lr": 7.484314383551459e-05} +{"train_loss": 0.004319522995501757, "global_step": 24215, "epoch": 203, "lr": 7.484122112748265e-05} +{"train_loss": 0.0041487193666398525, "global_step": 24216, "epoch": 203, "lr": 7.483929837067763e-05} +{"train_loss": 0.0031552878208458424, "global_step": 24217, "epoch": 203, "lr": 7.483737556510332e-05} +{"train_loss": 0.0040816655382514, "global_step": 24218, "epoch": 203, "lr": 7.483545271076347e-05} +{"train_loss": 0.00425743218511343, "global_step": 24219, "epoch": 203, "lr": 7.483352980766186e-05} +{"train_loss": 0.004364433698356152, "global_step": 24220, "epoch": 203, "lr": 7.483160685580227e-05} +{"train_loss": 0.0033521661534905434, "global_step": 24221, "epoch": 203, "lr": 7.482968385518847e-05} +{"train_loss": 0.005090856458991766, "global_step": 24222, "epoch": 203, "lr": 7.482776080582423e-05} +{"train_loss": 0.004214164800941944, "global_step": 24223, "epoch": 203, "lr": 7.482583770771334e-05} +{"train_loss": 0.004318742547184229, "global_step": 24224, "epoch": 203, "lr": 7.482391456085958e-05} +{"train_loss": 0.005436317529529333, "global_step": 24225, "epoch": 203, "lr": 7.48219913652667e-05} +{"train_loss": 0.003441540990024805, "global_step": 24226, "epoch": 203, "lr": 7.48200681209385e-05} +{"train_loss": 0.005222101230174303, "global_step": 24227, "epoch": 203, "lr": 7.481814482787875e-05} +{"train_loss": 0.0050490302965044975, "global_step": 24228, "epoch": 203, "lr": 7.481622148609122e-05} +{"train_loss": 0.005146577022969723, "global_step": 24229, "epoch": 203, "lr": 7.481429809557968e-05} +{"train_loss": 0.003388873767107725, "global_step": 24230, "epoch": 203, "lr": 7.481237465634794e-05} +{"train_loss": 0.004847751464694738, "global_step": 24231, "epoch": 203, "lr": 7.481045116839974e-05} +{"train_loss": 0.0031033300328999758, "global_step": 24232, "epoch": 203, "lr": 7.480852763173887e-05} +{"train_loss": 0.003867036895826459, "global_step": 24233, "epoch": 203, "lr": 7.48066040463691e-05} +{"train_loss": 0.0051782261580228806, "global_step": 24234, "epoch": 203, "lr": 7.480468041229423e-05} +{"train_loss": 0.0055317445658147335, "global_step": 24235, "epoch": 203, "lr": 7.4802756729518e-05} +{"train_loss": 0.004871053155511618, "global_step": 24236, "epoch": 203, "lr": 7.480083299804423e-05} +{"train_loss": 0.0029838376212865114, "global_step": 24237, "epoch": 203, "lr": 7.479890921787667e-05} +{"train_loss": 0.0049348571337759495, "global_step": 24238, "epoch": 203, "lr": 7.479698538901909e-05} +{"train_loss": 0.0030527084600180387, "global_step": 24239, "epoch": 203, "lr": 7.479506151147528e-05} +{"train_loss": 0.005232659634202719, "global_step": 24240, "epoch": 203, "lr": 7.479313758524902e-05} +{"train_loss": 0.003889300161972642, "global_step": 24241, "epoch": 203, "lr": 7.479121361034406e-05} +{"train_loss": 0.0034742956049740314, "global_step": 24242, "epoch": 203, "lr": 7.478928958676423e-05} +{"train_loss": 0.0033624290954321623, "global_step": 24243, "epoch": 203, "lr": 7.478736551451327e-05} +{"train_loss": 0.0037464455235749483, "global_step": 24244, "epoch": 203, "lr": 7.478544139359496e-05} +{"train_loss": 0.0026451738085597754, "global_step": 24245, "epoch": 203, "lr": 7.478351722401308e-05} +{"train_loss": 0.004874008242040873, "global_step": 24246, "epoch": 203, "lr": 7.478159300577143e-05} +{"train_loss": 0.0044252872467041016, "global_step": 24247, "epoch": 203, "lr": 7.477966873887376e-05} +{"train_loss": 0.003413035534322262, "global_step": 24248, "epoch": 203, "lr": 7.477774442332385e-05} +{"train_loss": 0.005277801770716906, "global_step": 24249, "epoch": 203, "lr": 7.47758200591255e-05} +{"train_loss": 0.0058004665188491344, "global_step": 24250, "epoch": 203, "lr": 7.477389564628248e-05} +{"train_loss": 0.004225102253258228, "global_step": 24251, "epoch": 203, "lr": 7.477197118479855e-05} +{"train_loss": 0.002413815353065729, "global_step": 24252, "epoch": 203, "lr": 7.47700466746775e-05} +{"train_loss": 0.00335415406152606, "global_step": 24253, "epoch": 203, "lr": 7.47681221159231e-05} +{"train_loss": 0.0033767076674848795, "global_step": 24254, "epoch": 203, "lr": 7.476619750853915e-05} +{"train_loss": 0.003933933563530445, "global_step": 24255, "epoch": 203, "lr": 7.476427285252942e-05} +{"train_loss": 0.004797703120857477, "global_step": 24256, "epoch": 203, "lr": 7.476234814789768e-05} +{"train_loss": 0.0057169902138412, "global_step": 24257, "epoch": 203, "lr": 7.476042339464772e-05} +{"train_loss": 0.005663447547703981, "global_step": 24258, "epoch": 203, "lr": 7.47584985927833e-05} +{"train_loss": 0.004180354531854391, "global_step": 24259, "epoch": 203, "lr": 7.475657374230822e-05} +{"train_loss": 0.0031203152611851692, "global_step": 24260, "epoch": 203, "lr": 7.475464884322625e-05} +{"train_loss": 0.0038888338021934032, "global_step": 24261, "epoch": 203, "lr": 7.47527238955412e-05} +{"train_loss": 0.004467981401830912, "global_step": 24262, "epoch": 203, "lr": 7.475079889925681e-05} +{"train_loss": 0.004539026878774166, "global_step": 24263, "epoch": 203, "lr": 7.474887385437685e-05} +{"train_loss": 0.0039153373800218105, "global_step": 24264, "epoch": 203, "lr": 7.474694876090513e-05} +{"train_loss": 0.004487173166126013, "global_step": 24265, "epoch": 203, "lr": 7.474502361884541e-05} +{"train_loss": 0.0051762014627456665, "global_step": 24266, "epoch": 203, "lr": 7.47430984282015e-05} +{"train_loss": 0.005914777982980013, "global_step": 24267, "epoch": 203, "lr": 7.474117318897714e-05} +{"train_loss": 0.004432477056980133, "global_step": 24268, "epoch": 203, "lr": 7.473924790117614e-05} +{"train_loss": 0.0024764337576925755, "global_step": 24269, "epoch": 203, "lr": 7.473732256480229e-05} +{"train_loss": 0.0066178641282022, "global_step": 24270, "epoch": 203, "lr": 7.473539717985931e-05} +{"train_loss": 0.004519317299127579, "global_step": 24271, "epoch": 203, "lr": 7.473347174635105e-05} +{"train_loss": 0.0047184620052576065, "global_step": 24272, "epoch": 203, "lr": 7.473154626428125e-05} +{"train_loss": 0.0032536627259105444, "global_step": 24273, "epoch": 203, "lr": 7.47296207336537e-05} +{"train_loss": 0.007051816210150719, "global_step": 24274, "epoch": 203, "lr": 7.472769515447217e-05} +{"train_loss": 0.004448585241579083, "global_step": 24275, "epoch": 203, "lr": 7.472576952674047e-05, "val_loss": 0.024256782606244087} +{"train_loss": 0.004172108136117458, "global_step": 24276, "epoch": 204, "lr": 7.472384385046236e-05} +{"train_loss": 0.0048918225802481174, "global_step": 24277, "epoch": 204, "lr": 7.472191812564163e-05} +{"train_loss": 0.0035582995042204857, "global_step": 24278, "epoch": 204, "lr": 7.471999235228203e-05} +{"train_loss": 0.005675144959241152, "global_step": 24279, "epoch": 204, "lr": 7.471806653038737e-05} +{"train_loss": 0.002628228161484003, "global_step": 24280, "epoch": 204, "lr": 7.471614065996147e-05} +{"train_loss": 0.00577242998406291, "global_step": 24281, "epoch": 204, "lr": 7.471421474100803e-05} +{"train_loss": 0.0046746633015573025, "global_step": 24282, "epoch": 204, "lr": 7.471228877353087e-05} +{"train_loss": 0.004348038230091333, "global_step": 24283, "epoch": 204, "lr": 7.471036275753378e-05} +{"train_loss": 0.004766099154949188, "global_step": 24284, "epoch": 204, "lr": 7.470843669302053e-05} +{"train_loss": 0.0036566839553415775, "global_step": 24285, "epoch": 204, "lr": 7.470651057999491e-05} +{"train_loss": 0.004430856090039015, "global_step": 24286, "epoch": 204, "lr": 7.47045844184607e-05} +{"train_loss": 0.003949278499931097, "global_step": 24287, "epoch": 204, "lr": 7.470265820842166e-05} +{"train_loss": 0.0040596285834908485, "global_step": 24288, "epoch": 204, "lr": 7.47007319498816e-05} +{"train_loss": 0.0038042583037167788, "global_step": 24289, "epoch": 204, "lr": 7.469880564284429e-05} +{"train_loss": 0.004998457618057728, "global_step": 24290, "epoch": 204, "lr": 7.469687928731351e-05} +{"train_loss": 0.007004117593169212, "global_step": 24291, "epoch": 204, "lr": 7.469495288329305e-05} +{"train_loss": 0.0035495541524142027, "global_step": 24292, "epoch": 204, "lr": 7.469302643078669e-05} +{"train_loss": 0.006125372368842363, "global_step": 24293, "epoch": 204, "lr": 7.469109992979821e-05} +{"train_loss": 0.005646639969199896, "global_step": 24294, "epoch": 204, "lr": 7.468917338033139e-05} +{"train_loss": 0.005530430004000664, "global_step": 24295, "epoch": 204, "lr": 7.468724678239001e-05} +{"train_loss": 0.003951238468289375, "global_step": 24296, "epoch": 204, "lr": 7.468532013597787e-05} +{"train_loss": 0.003909201826900244, "global_step": 24297, "epoch": 204, "lr": 7.468339344109875e-05} +{"train_loss": 0.0067753572948277, "global_step": 24298, "epoch": 204, "lr": 7.468146669775641e-05} +{"train_loss": 0.0034648398868739605, "global_step": 24299, "epoch": 204, "lr": 7.467953990595466e-05} +{"train_loss": 0.005115855019539595, "global_step": 24300, "epoch": 204, "lr": 7.467761306569725e-05} +{"train_loss": 0.004825415555387735, "global_step": 24301, "epoch": 204, "lr": 7.467568617698799e-05} +{"train_loss": 0.0033912346698343754, "global_step": 24302, "epoch": 204, "lr": 7.467375923983067e-05} +{"train_loss": 0.004448933061212301, "global_step": 24303, "epoch": 204, "lr": 7.467183225422904e-05} +{"train_loss": 0.006597842555493116, "global_step": 24304, "epoch": 204, "lr": 7.466990522018691e-05} +{"train_loss": 0.004627637565135956, "global_step": 24305, "epoch": 204, "lr": 7.466797813770805e-05} +{"train_loss": 0.0029393339063972235, "global_step": 24306, "epoch": 204, "lr": 7.466605100679627e-05} +{"train_loss": 0.004528453573584557, "global_step": 24307, "epoch": 204, "lr": 7.466412382745532e-05} +{"train_loss": 0.006694330833852291, "global_step": 24308, "epoch": 204, "lr": 7.4662196599689e-05} +{"train_loss": 0.0034645760897547007, "global_step": 24309, "epoch": 204, "lr": 7.466026932350109e-05} +{"train_loss": 0.00488336943089962, "global_step": 24310, "epoch": 204, "lr": 7.465834199889537e-05} +{"train_loss": 0.004039037507027388, "global_step": 24311, "epoch": 204, "lr": 7.465641462587565e-05} +{"train_loss": 0.004943695850670338, "global_step": 24312, "epoch": 204, "lr": 7.465448720444567e-05} +{"train_loss": 0.0037326058372855186, "global_step": 24313, "epoch": 204, "lr": 7.465255973460925e-05} +{"train_loss": 0.004737423732876778, "global_step": 24314, "epoch": 204, "lr": 7.465063221637017e-05} +{"train_loss": 0.0035488270223140717, "global_step": 24315, "epoch": 204, "lr": 7.46487046497322e-05} +{"train_loss": 0.0032068544533103704, "global_step": 24316, "epoch": 204, "lr": 7.464677703469913e-05} +{"train_loss": 0.0031170514412224293, "global_step": 24317, "epoch": 204, "lr": 7.464484937127474e-05} +{"train_loss": 0.004993547685444355, "global_step": 24318, "epoch": 204, "lr": 7.464292165946284e-05} +{"train_loss": 0.004129844252020121, "global_step": 24319, "epoch": 204, "lr": 7.464099389926719e-05} +{"train_loss": 0.004094042349606752, "global_step": 24320, "epoch": 204, "lr": 7.463906609069158e-05} +{"train_loss": 0.006537044420838356, "global_step": 24321, "epoch": 204, "lr": 7.463713823373979e-05} +{"train_loss": 0.002735958667472005, "global_step": 24322, "epoch": 204, "lr": 7.46352103284156e-05} +{"train_loss": 0.0045302510261535645, "global_step": 24323, "epoch": 204, "lr": 7.463328237472282e-05} +{"train_loss": 0.003936209715902805, "global_step": 24324, "epoch": 204, "lr": 7.463135437266522e-05} +{"train_loss": 0.0029517807997763157, "global_step": 24325, "epoch": 204, "lr": 7.462942632224658e-05} +{"train_loss": 0.0031272931955754757, "global_step": 24326, "epoch": 204, "lr": 7.462749822347071e-05} +{"train_loss": 0.003902277210727334, "global_step": 24327, "epoch": 204, "lr": 7.462557007634137e-05} +{"train_loss": 0.0053211236372590065, "global_step": 24328, "epoch": 204, "lr": 7.462364188086235e-05} +{"train_loss": 0.0031117091421037912, "global_step": 24329, "epoch": 204, "lr": 7.462171363703745e-05} +{"train_loss": 0.006226213648915291, "global_step": 24330, "epoch": 204, "lr": 7.461978534487045e-05} +{"train_loss": 0.001927339704707265, "global_step": 24331, "epoch": 204, "lr": 7.46178570043651e-05} +{"train_loss": 0.005617867223918438, "global_step": 24332, "epoch": 204, "lr": 7.461592861552526e-05} +{"train_loss": 0.005895886104553938, "global_step": 24333, "epoch": 204, "lr": 7.461400017835465e-05} +{"train_loss": 0.0024555244017392397, "global_step": 24334, "epoch": 204, "lr": 7.461207169285708e-05} +{"train_loss": 0.0034630587324500084, "global_step": 24335, "epoch": 204, "lr": 7.461014315903633e-05} +{"train_loss": 0.006729735992848873, "global_step": 24336, "epoch": 204, "lr": 7.460821457689622e-05} +{"train_loss": 0.0027376776561141014, "global_step": 24337, "epoch": 204, "lr": 7.460628594644049e-05} +{"train_loss": 0.003834836883470416, "global_step": 24338, "epoch": 204, "lr": 7.460435726767294e-05} +{"train_loss": 0.0038593467324972153, "global_step": 24339, "epoch": 204, "lr": 7.460242854059736e-05} +{"train_loss": 0.0037454618141055107, "global_step": 24340, "epoch": 204, "lr": 7.460049976521756e-05} +{"train_loss": 0.0036434177309274673, "global_step": 24341, "epoch": 204, "lr": 7.45985709415373e-05} +{"train_loss": 0.005031795706599951, "global_step": 24342, "epoch": 204, "lr": 7.459664206956036e-05} +{"train_loss": 0.0045876032672822475, "global_step": 24343, "epoch": 204, "lr": 7.459471314929057e-05} +{"train_loss": 0.00463689211755991, "global_step": 24344, "epoch": 204, "lr": 7.459278418073167e-05} +{"train_loss": 0.0028471671976149082, "global_step": 24345, "epoch": 204, "lr": 7.459085516388746e-05} +{"train_loss": 0.004647777881473303, "global_step": 24346, "epoch": 204, "lr": 7.458892609876175e-05} +{"train_loss": 0.004401239566504955, "global_step": 24347, "epoch": 204, "lr": 7.458699698535829e-05} +{"train_loss": 0.0036849058233201504, "global_step": 24348, "epoch": 204, "lr": 7.458506782368091e-05} +{"train_loss": 0.004796297755092382, "global_step": 24349, "epoch": 204, "lr": 7.458313861373337e-05} +{"train_loss": 0.003311583073809743, "global_step": 24350, "epoch": 204, "lr": 7.458120935551945e-05} +{"train_loss": 0.0037566276732832193, "global_step": 24351, "epoch": 204, "lr": 7.457928004904296e-05} +{"train_loss": 0.006243815179914236, "global_step": 24352, "epoch": 204, "lr": 7.457735069430767e-05} +{"train_loss": 0.0035054790787398815, "global_step": 24353, "epoch": 204, "lr": 7.457542129131741e-05} +{"train_loss": 0.005975565407425165, "global_step": 24354, "epoch": 204, "lr": 7.45734918400759e-05} +{"train_loss": 0.004219658672809601, "global_step": 24355, "epoch": 204, "lr": 7.457156234058698e-05} +{"train_loss": 0.006460865959525108, "global_step": 24356, "epoch": 204, "lr": 7.456963279285442e-05} +{"train_loss": 0.004924820736050606, "global_step": 24357, "epoch": 204, "lr": 7.456770319688201e-05} +{"train_loss": 0.0043587530963122845, "global_step": 24358, "epoch": 204, "lr": 7.456577355267354e-05} +{"train_loss": 0.004554382991045713, "global_step": 24359, "epoch": 204, "lr": 7.45638438602328e-05} +{"train_loss": 0.005423072259873152, "global_step": 24360, "epoch": 204, "lr": 7.456191411956357e-05} +{"train_loss": 0.007076284848153591, "global_step": 24361, "epoch": 204, "lr": 7.455998433066964e-05} +{"train_loss": 0.0033852499909698963, "global_step": 24362, "epoch": 204, "lr": 7.455805449355482e-05} +{"train_loss": 0.004627321846783161, "global_step": 24363, "epoch": 204, "lr": 7.455612460822289e-05} +{"train_loss": 0.0031846535857766867, "global_step": 24364, "epoch": 204, "lr": 7.455419467467761e-05} +{"train_loss": 0.0038025800604373217, "global_step": 24365, "epoch": 204, "lr": 7.455226469292281e-05} +{"train_loss": 0.005125780589878559, "global_step": 24366, "epoch": 204, "lr": 7.455033466296227e-05} +{"train_loss": 0.002043112413957715, "global_step": 24367, "epoch": 204, "lr": 7.454840458479975e-05} +{"train_loss": 0.0026217589620500803, "global_step": 24368, "epoch": 204, "lr": 7.454647445843906e-05} +{"train_loss": 0.005851937923580408, "global_step": 24369, "epoch": 204, "lr": 7.4544544283884e-05} +{"train_loss": 0.005077403970062733, "global_step": 24370, "epoch": 204, "lr": 7.454261406113834e-05} +{"train_loss": 0.00418081134557724, "global_step": 24371, "epoch": 204, "lr": 7.45406837902059e-05} +{"train_loss": 0.005776845384389162, "global_step": 24372, "epoch": 204, "lr": 7.453875347109042e-05} +{"train_loss": 0.008335410617291927, "global_step": 24373, "epoch": 204, "lr": 7.453682310379573e-05} +{"train_loss": 0.00454977061599493, "global_step": 24374, "epoch": 204, "lr": 7.45348926883256e-05} +{"train_loss": 0.00331208948045969, "global_step": 24375, "epoch": 204, "lr": 7.453296222468385e-05} +{"train_loss": 0.005085628014057875, "global_step": 24376, "epoch": 204, "lr": 7.453103171287424e-05} +{"train_loss": 0.003734010737389326, "global_step": 24377, "epoch": 204, "lr": 7.452910115290057e-05} +{"train_loss": 0.0058209761045873165, "global_step": 24378, "epoch": 204, "lr": 7.452717054476664e-05} +{"train_loss": 0.0025243815034627914, "global_step": 24379, "epoch": 204, "lr": 7.452523988847621e-05} +{"train_loss": 0.0035363654606044292, "global_step": 24380, "epoch": 204, "lr": 7.452330918403312e-05} +{"train_loss": 0.005311575718224049, "global_step": 24381, "epoch": 204, "lr": 7.452137843144112e-05} +{"train_loss": 0.0028914527501910925, "global_step": 24382, "epoch": 204, "lr": 7.4519447630704e-05} +{"train_loss": 0.0042650289833545685, "global_step": 24383, "epoch": 204, "lr": 7.451751678182558e-05} +{"train_loss": 0.003807587781921029, "global_step": 24384, "epoch": 204, "lr": 7.451558588480962e-05} +{"train_loss": 0.0033152454998344183, "global_step": 24385, "epoch": 204, "lr": 7.451365493965994e-05} +{"train_loss": 0.002982289297506213, "global_step": 24386, "epoch": 204, "lr": 7.45117239463803e-05} +{"train_loss": 0.003256659023463726, "global_step": 24387, "epoch": 204, "lr": 7.450979290497454e-05} +{"train_loss": 0.005918602459132671, "global_step": 24388, "epoch": 204, "lr": 7.450786181544638e-05} +{"train_loss": 0.0018893750384449959, "global_step": 24389, "epoch": 204, "lr": 7.450593067779968e-05} +{"train_loss": 0.004591537639498711, "global_step": 24390, "epoch": 204, "lr": 7.45039994920382e-05} +{"train_loss": 0.003648602170869708, "global_step": 24391, "epoch": 204, "lr": 7.450206825816572e-05} +{"train_loss": 0.002684801584109664, "global_step": 24392, "epoch": 204, "lr": 7.450013697618606e-05} +{"train_loss": 0.004632996395230293, "global_step": 24393, "epoch": 204, "lr": 7.449820564610302e-05} +{"train_loss": 0.004383173432717679, "global_step": 24394, "epoch": 204, "lr": 7.449627426792033e-05, "val_loss": 0.014100540429353714} +{"train_loss": 0.003943867515772581, "global_step": 24395, "epoch": 205, "lr": 7.449434284164184e-05} +{"train_loss": 0.004058475606143475, "global_step": 24396, "epoch": 205, "lr": 7.449241136727132e-05} +{"train_loss": 0.00628501595929265, "global_step": 24397, "epoch": 205, "lr": 7.449047984481257e-05} +{"train_loss": 0.005836261436343193, "global_step": 24398, "epoch": 205, "lr": 7.448854827426939e-05} +{"train_loss": 0.004486816935241222, "global_step": 24399, "epoch": 205, "lr": 7.448661665564556e-05} +{"train_loss": 0.004750736057758331, "global_step": 24400, "epoch": 205, "lr": 7.448468498894485e-05} +{"train_loss": 0.0052053057588636875, "global_step": 24401, "epoch": 205, "lr": 7.44827532741711e-05} +{"train_loss": 0.004064665641635656, "global_step": 24402, "epoch": 205, "lr": 7.448082151132807e-05} +{"train_loss": 0.002958275843411684, "global_step": 24403, "epoch": 205, "lr": 7.447888970041957e-05} +{"train_loss": 0.0025790720246732235, "global_step": 24404, "epoch": 205, "lr": 7.447695784144937e-05} +{"train_loss": 0.0036835395731031895, "global_step": 24405, "epoch": 205, "lr": 7.447502593442128e-05} +{"train_loss": 0.004817525390535593, "global_step": 24406, "epoch": 205, "lr": 7.44730939793391e-05} +{"train_loss": 0.004752960987389088, "global_step": 24407, "epoch": 205, "lr": 7.447116197620662e-05} +{"train_loss": 0.0031811052467674017, "global_step": 24408, "epoch": 205, "lr": 7.446922992502762e-05} +{"train_loss": 0.002134363166987896, "global_step": 24409, "epoch": 205, "lr": 7.44672978258059e-05} +{"train_loss": 0.004377754405140877, "global_step": 24410, "epoch": 205, "lr": 7.446536567854526e-05} +{"train_loss": 0.0047468142583966255, "global_step": 24411, "epoch": 205, "lr": 7.44634334832495e-05} +{"train_loss": 0.003921189345419407, "global_step": 24412, "epoch": 205, "lr": 7.446150123992239e-05} +{"train_loss": 0.0036858911626040936, "global_step": 24413, "epoch": 205, "lr": 7.445956894856773e-05} +{"train_loss": 0.003212104318663478, "global_step": 24414, "epoch": 205, "lr": 7.445763660918932e-05} +{"train_loss": 0.00565378600731492, "global_step": 24415, "epoch": 205, "lr": 7.445570422179095e-05} +{"train_loss": 0.003763208631426096, "global_step": 24416, "epoch": 205, "lr": 7.445377178637643e-05} +{"train_loss": 0.004212001338601112, "global_step": 24417, "epoch": 205, "lr": 7.445183930294952e-05} +{"train_loss": 0.003545436542481184, "global_step": 24418, "epoch": 205, "lr": 7.444990677151407e-05} +{"train_loss": 0.0051739695481956005, "global_step": 24419, "epoch": 205, "lr": 7.444797419207381e-05} +{"train_loss": 0.003993229009211063, "global_step": 24420, "epoch": 205, "lr": 7.444604156463258e-05} +{"train_loss": 0.0041037374176084995, "global_step": 24421, "epoch": 205, "lr": 7.444410888919415e-05} +{"train_loss": 0.004516996443271637, "global_step": 24422, "epoch": 205, "lr": 7.444217616576232e-05} +{"train_loss": 0.005656103137880564, "global_step": 24423, "epoch": 205, "lr": 7.444024339434091e-05} +{"train_loss": 0.005886894650757313, "global_step": 24424, "epoch": 205, "lr": 7.443831057493369e-05} +{"train_loss": 0.0039235129952430725, "global_step": 24425, "epoch": 205, "lr": 7.443637770754443e-05} +{"train_loss": 0.004411289002746344, "global_step": 24426, "epoch": 205, "lr": 7.443444479217697e-05} +{"train_loss": 0.00482129817828536, "global_step": 24427, "epoch": 205, "lr": 7.443251182883509e-05} +{"train_loss": 0.0039584459736943245, "global_step": 24428, "epoch": 205, "lr": 7.443057881752258e-05} +{"train_loss": 0.004072083625942469, "global_step": 24429, "epoch": 205, "lr": 7.442864575824324e-05} +{"train_loss": 0.0044852676801383495, "global_step": 24430, "epoch": 205, "lr": 7.442671265100087e-05} +{"train_loss": 0.0032651813235133886, "global_step": 24431, "epoch": 205, "lr": 7.442477949579925e-05} +{"train_loss": 0.0034917567390948534, "global_step": 24432, "epoch": 205, "lr": 7.44228462926422e-05} +{"train_loss": 0.004584689624607563, "global_step": 24433, "epoch": 205, "lr": 7.442091304153349e-05} +{"train_loss": 0.0041356212459504604, "global_step": 24434, "epoch": 205, "lr": 7.441897974247692e-05} +{"train_loss": 0.0028149650897830725, "global_step": 24435, "epoch": 205, "lr": 7.44170463954763e-05} +{"train_loss": 0.0038059535436332226, "global_step": 24436, "epoch": 205, "lr": 7.441511300053541e-05} +{"train_loss": 0.003269272856414318, "global_step": 24437, "epoch": 205, "lr": 7.441317955765807e-05} +{"train_loss": 0.003651035251095891, "global_step": 24438, "epoch": 205, "lr": 7.441124606684804e-05} +{"train_loss": 0.001989576034247875, "global_step": 24439, "epoch": 205, "lr": 7.440931252810914e-05} +{"train_loss": 0.003796003060415387, "global_step": 24440, "epoch": 205, "lr": 7.440737894144517e-05} +{"train_loss": 0.004219309892505407, "global_step": 24441, "epoch": 205, "lr": 7.440544530685993e-05} +{"train_loss": 0.0030193293932825327, "global_step": 24442, "epoch": 205, "lr": 7.440351162435718e-05} +{"train_loss": 0.003671925747767091, "global_step": 24443, "epoch": 205, "lr": 7.440157789394077e-05} +{"train_loss": 0.0033280120696872473, "global_step": 24444, "epoch": 205, "lr": 7.439964411561446e-05} +{"train_loss": 0.004693408962339163, "global_step": 24445, "epoch": 205, "lr": 7.439771028938204e-05} +{"train_loss": 0.003725821850821376, "global_step": 24446, "epoch": 205, "lr": 7.439577641524733e-05} +{"train_loss": 0.003963676746934652, "global_step": 24447, "epoch": 205, "lr": 7.439384249321411e-05} +{"train_loss": 0.003405793337151408, "global_step": 24448, "epoch": 205, "lr": 7.439190852328621e-05} +{"train_loss": 0.0025178201030939817, "global_step": 24449, "epoch": 205, "lr": 7.438997450546739e-05} +{"train_loss": 0.004186870064586401, "global_step": 24450, "epoch": 205, "lr": 7.438804043976146e-05} +{"train_loss": 0.0036893258802592754, "global_step": 24451, "epoch": 205, "lr": 7.438610632617222e-05} +{"train_loss": 0.005808022804558277, "global_step": 24452, "epoch": 205, "lr": 7.438417216470347e-05} +{"train_loss": 0.004225745797157288, "global_step": 24453, "epoch": 205, "lr": 7.4382237955359e-05} +{"train_loss": 0.002098479773849249, "global_step": 24454, "epoch": 205, "lr": 7.43803036981426e-05} +{"train_loss": 0.0024658620823174715, "global_step": 24455, "epoch": 205, "lr": 7.437836939305809e-05} +{"train_loss": 0.006123961880803108, "global_step": 24456, "epoch": 205, "lr": 7.437643504010925e-05} +{"train_loss": 0.00282731163315475, "global_step": 24457, "epoch": 205, "lr": 7.437450063929989e-05} +{"train_loss": 0.0031534333247691393, "global_step": 24458, "epoch": 205, "lr": 7.437256619063379e-05} +{"train_loss": 0.00400233268737793, "global_step": 24459, "epoch": 205, "lr": 7.437063169411478e-05} +{"train_loss": 0.003345342818647623, "global_step": 24460, "epoch": 205, "lr": 7.436869714974663e-05} +{"train_loss": 0.004982191603630781, "global_step": 24461, "epoch": 205, "lr": 7.436676255753315e-05} +{"train_loss": 0.0056976876221597195, "global_step": 24462, "epoch": 205, "lr": 7.436482791747813e-05} +{"train_loss": 0.0032712738029658794, "global_step": 24463, "epoch": 205, "lr": 7.436289322958537e-05} +{"train_loss": 0.005398670677095652, "global_step": 24464, "epoch": 205, "lr": 7.436095849385866e-05} +{"train_loss": 0.005197114311158657, "global_step": 24465, "epoch": 205, "lr": 7.435902371030184e-05} +{"train_loss": 0.005980695132166147, "global_step": 24466, "epoch": 205, "lr": 7.435708887891866e-05} +{"train_loss": 0.004024168476462364, "global_step": 24467, "epoch": 205, "lr": 7.435515399971294e-05} +{"train_loss": 0.003154362551867962, "global_step": 24468, "epoch": 205, "lr": 7.435321907268848e-05} +{"train_loss": 0.0027063493616878986, "global_step": 24469, "epoch": 205, "lr": 7.435128409784908e-05} +{"train_loss": 0.004673996940255165, "global_step": 24470, "epoch": 205, "lr": 7.434934907519853e-05} +{"train_loss": 0.004762133117765188, "global_step": 24471, "epoch": 205, "lr": 7.434741400474063e-05} +{"train_loss": 0.004954745061695576, "global_step": 24472, "epoch": 205, "lr": 7.43454788864792e-05} +{"train_loss": 0.0022231980692595243, "global_step": 24473, "epoch": 205, "lr": 7.4343543720418e-05} +{"train_loss": 0.004873507656157017, "global_step": 24474, "epoch": 205, "lr": 7.434160850656088e-05} +{"train_loss": 0.0035122870467603207, "global_step": 24475, "epoch": 205, "lr": 7.43396732449116e-05} +{"train_loss": 0.005701696500182152, "global_step": 24476, "epoch": 205, "lr": 7.433773793547396e-05} +{"train_loss": 0.0050670369528234005, "global_step": 24477, "epoch": 205, "lr": 7.433580257825178e-05} +{"train_loss": 0.0034679577220231295, "global_step": 24478, "epoch": 205, "lr": 7.433386717324885e-05} +{"train_loss": 0.003158573992550373, "global_step": 24479, "epoch": 205, "lr": 7.433193172046897e-05} +{"train_loss": 0.004791155457496643, "global_step": 24480, "epoch": 205, "lr": 7.432999621991594e-05} +{"train_loss": 0.00405696127563715, "global_step": 24481, "epoch": 205, "lr": 7.432806067159359e-05} +{"train_loss": 0.0027627248782664537, "global_step": 24482, "epoch": 205, "lr": 7.432612507550566e-05} +{"train_loss": 0.005510296206921339, "global_step": 24483, "epoch": 205, "lr": 7.4324189431656e-05} +{"train_loss": 0.002820082474499941, "global_step": 24484, "epoch": 205, "lr": 7.432225374004838e-05} +{"train_loss": 0.0056398105807602406, "global_step": 24485, "epoch": 205, "lr": 7.432031800068662e-05} +{"train_loss": 0.0048239221796393394, "global_step": 24486, "epoch": 205, "lr": 7.43183822135745e-05} +{"train_loss": 0.0025190559681504965, "global_step": 24487, "epoch": 205, "lr": 7.431644637871585e-05} +{"train_loss": 0.003800772363319993, "global_step": 24488, "epoch": 205, "lr": 7.431451049611444e-05} +{"train_loss": 0.005023261532187462, "global_step": 24489, "epoch": 205, "lr": 7.431257456577411e-05} +{"train_loss": 0.004603305831551552, "global_step": 24490, "epoch": 205, "lr": 7.431063858769863e-05} +{"train_loss": 0.0039020823314785957, "global_step": 24491, "epoch": 205, "lr": 7.43087025618918e-05} +{"train_loss": 0.002678089076653123, "global_step": 24492, "epoch": 205, "lr": 7.430676648835742e-05} +{"train_loss": 0.0028650767635554075, "global_step": 24493, "epoch": 205, "lr": 7.430483036709932e-05} +{"train_loss": 0.00441194511950016, "global_step": 24494, "epoch": 205, "lr": 7.430289419812128e-05} +{"train_loss": 0.005336259491741657, "global_step": 24495, "epoch": 205, "lr": 7.43009579814271e-05} +{"train_loss": 0.004493198357522488, "global_step": 24496, "epoch": 205, "lr": 7.429902171702058e-05} +{"train_loss": 0.0033728312700986862, "global_step": 24497, "epoch": 205, "lr": 7.429708540490553e-05} +{"train_loss": 0.004774771630764008, "global_step": 24498, "epoch": 205, "lr": 7.429514904508574e-05} +{"train_loss": 0.0023808167316019535, "global_step": 24499, "epoch": 205, "lr": 7.429321263756504e-05} +{"train_loss": 0.007184966001659632, "global_step": 24500, "epoch": 205, "lr": 7.429127618234721e-05} +{"train_loss": 0.005814285483211279, "global_step": 24501, "epoch": 205, "lr": 7.428933967943605e-05} +{"train_loss": 0.0031542156357318163, "global_step": 24502, "epoch": 205, "lr": 7.428740312883536e-05} +{"train_loss": 0.0039443764835596085, "global_step": 24503, "epoch": 205, "lr": 7.428546653054896e-05} +{"train_loss": 0.004963620565831661, "global_step": 24504, "epoch": 205, "lr": 7.428352988458062e-05} +{"train_loss": 0.0033479095436632633, "global_step": 24505, "epoch": 205, "lr": 7.428159319093417e-05} +{"train_loss": 0.005000121891498566, "global_step": 24506, "epoch": 205, "lr": 7.427965644961342e-05} +{"train_loss": 0.0038853874430060387, "global_step": 24507, "epoch": 205, "lr": 7.427771966062214e-05} +{"train_loss": 0.0038215615786612034, "global_step": 24508, "epoch": 205, "lr": 7.427578282396417e-05} +{"train_loss": 0.002824988914653659, "global_step": 24509, "epoch": 205, "lr": 7.427384593964328e-05} +{"train_loss": 0.004713697358965874, "global_step": 24510, "epoch": 205, "lr": 7.42719090076633e-05} +{"train_loss": 0.0026192546356469393, "global_step": 24511, "epoch": 205, "lr": 7.426997202802802e-05} +{"train_loss": 0.006082831881940365, "global_step": 24512, "epoch": 205, "lr": 7.426803500074123e-05} +{"train_loss": 0.0041029552592575045, "global_step": 24513, "epoch": 205, "lr": 7.426609792580674e-05, "val_loss": 0.014405353926122189, "train_action_mse_error": 9.377954847877845e-05} +{"train_loss": 0.002579932799562812, "global_step": 24514, "epoch": 206, "lr": 7.426416080322838e-05} +{"train_loss": 0.0017269139643758535, "global_step": 24515, "epoch": 206, "lr": 7.426222363300993e-05} +{"train_loss": 0.003450222546234727, "global_step": 24516, "epoch": 206, "lr": 7.426028641515518e-05} +{"train_loss": 0.005744355730712414, "global_step": 24517, "epoch": 206, "lr": 7.425834914966796e-05} +{"train_loss": 0.0030474935192614794, "global_step": 24518, "epoch": 206, "lr": 7.425641183655206e-05} +{"train_loss": 0.0031364918686449528, "global_step": 24519, "epoch": 206, "lr": 7.425447447581129e-05} +{"train_loss": 0.003721157554537058, "global_step": 24520, "epoch": 206, "lr": 7.425253706744944e-05} +{"train_loss": 0.005635725799947977, "global_step": 24521, "epoch": 206, "lr": 7.425059961147033e-05} +{"train_loss": 0.004131912253797054, "global_step": 24522, "epoch": 206, "lr": 7.424866210787776e-05} +{"train_loss": 0.004735926166176796, "global_step": 24523, "epoch": 206, "lr": 7.424672455667554e-05} +{"train_loss": 0.00618754280731082, "global_step": 24524, "epoch": 206, "lr": 7.424478695786746e-05} +{"train_loss": 0.0048887114971876144, "global_step": 24525, "epoch": 206, "lr": 7.424284931145733e-05} +{"train_loss": 0.005413846578449011, "global_step": 24526, "epoch": 206, "lr": 7.424091161744896e-05} +{"train_loss": 0.0016996636986732483, "global_step": 24527, "epoch": 206, "lr": 7.423897387584615e-05} +{"train_loss": 0.0037511512637138367, "global_step": 24528, "epoch": 206, "lr": 7.42370360866527e-05} +{"train_loss": 0.002631910378113389, "global_step": 24529, "epoch": 206, "lr": 7.423509824987241e-05} +{"train_loss": 0.0030392413027584553, "global_step": 24530, "epoch": 206, "lr": 7.423316036550911e-05} +{"train_loss": 0.004502910189330578, "global_step": 24531, "epoch": 206, "lr": 7.423122243356659e-05} +{"train_loss": 0.007676084525883198, "global_step": 24532, "epoch": 206, "lr": 7.422928445404864e-05} +{"train_loss": 0.0056418729946017265, "global_step": 24533, "epoch": 206, "lr": 7.422734642695909e-05} +{"train_loss": 0.002419249387457967, "global_step": 24534, "epoch": 206, "lr": 7.422540835230172e-05} +{"train_loss": 0.0033826983999460936, "global_step": 24535, "epoch": 206, "lr": 7.422347023008036e-05} +{"train_loss": 0.005062108859419823, "global_step": 24536, "epoch": 206, "lr": 7.42215320602988e-05} +{"train_loss": 0.004725212696939707, "global_step": 24537, "epoch": 206, "lr": 7.421959384296084e-05} +{"train_loss": 0.005094815976917744, "global_step": 24538, "epoch": 206, "lr": 7.421765557807032e-05} +{"train_loss": 0.003146903356537223, "global_step": 24539, "epoch": 206, "lr": 7.4215717265631e-05} +{"train_loss": 0.0030352298635989428, "global_step": 24540, "epoch": 206, "lr": 7.421377890564672e-05} +{"train_loss": 0.0035361002665013075, "global_step": 24541, "epoch": 206, "lr": 7.421184049812125e-05} +{"train_loss": 0.004077026154845953, "global_step": 24542, "epoch": 206, "lr": 7.420990204305843e-05} +{"train_loss": 0.0056785461492836475, "global_step": 24543, "epoch": 206, "lr": 7.420796354046206e-05} +{"train_loss": 0.004899274557828903, "global_step": 24544, "epoch": 206, "lr": 7.420602499033595e-05} +{"train_loss": 0.007906291633844376, "global_step": 24545, "epoch": 206, "lr": 7.420408639268388e-05} +{"train_loss": 0.003512590192258358, "global_step": 24546, "epoch": 206, "lr": 7.420214774750967e-05} +{"train_loss": 0.005647237412631512, "global_step": 24547, "epoch": 206, "lr": 7.420020905481713e-05} +{"train_loss": 0.007544296327978373, "global_step": 24548, "epoch": 206, "lr": 7.419827031461006e-05} +{"train_loss": 0.004257248714566231, "global_step": 24549, "epoch": 206, "lr": 7.419633152689229e-05} +{"train_loss": 0.003942443057894707, "global_step": 24550, "epoch": 206, "lr": 7.41943926916676e-05} +{"train_loss": 0.004958710633218288, "global_step": 24551, "epoch": 206, "lr": 7.41924538089398e-05} +{"train_loss": 0.004094427451491356, "global_step": 24552, "epoch": 206, "lr": 7.41905148787127e-05} +{"train_loss": 0.004188959952443838, "global_step": 24553, "epoch": 206, "lr": 7.41885759009901e-05} +{"train_loss": 0.003565607825294137, "global_step": 24554, "epoch": 206, "lr": 7.418663687577583e-05} +{"train_loss": 0.005649852100759745, "global_step": 24555, "epoch": 206, "lr": 7.418469780307367e-05} +{"train_loss": 0.005010536871850491, "global_step": 24556, "epoch": 206, "lr": 7.418275868288747e-05} +{"train_loss": 0.003542955033481121, "global_step": 24557, "epoch": 206, "lr": 7.418081951522098e-05} +{"train_loss": 0.004744004458189011, "global_step": 24558, "epoch": 206, "lr": 7.417888030007804e-05} +{"train_loss": 0.0027199082542210817, "global_step": 24559, "epoch": 206, "lr": 7.417694103746245e-05} +{"train_loss": 0.005009117536246777, "global_step": 24560, "epoch": 206, "lr": 7.4175001727378e-05} +{"train_loss": 0.005908707622438669, "global_step": 24561, "epoch": 206, "lr": 7.417306236982855e-05} +{"train_loss": 0.0037238423246890306, "global_step": 24562, "epoch": 206, "lr": 7.417112296481787e-05} +{"train_loss": 0.0032539719250053167, "global_step": 24563, "epoch": 206, "lr": 7.416918351234977e-05} +{"train_loss": 0.003491038689389825, "global_step": 24564, "epoch": 206, "lr": 7.416724401242804e-05} +{"train_loss": 0.005311133805662394, "global_step": 24565, "epoch": 206, "lr": 7.416530446505653e-05} +{"train_loss": 0.006669927854090929, "global_step": 24566, "epoch": 206, "lr": 7.416336487023902e-05} +{"train_loss": 0.002863642992451787, "global_step": 24567, "epoch": 206, "lr": 7.416142522797932e-05} +{"train_loss": 0.005360943730920553, "global_step": 24568, "epoch": 206, "lr": 7.415948553828126e-05} +{"train_loss": 0.007198849227279425, "global_step": 24569, "epoch": 206, "lr": 7.41575458011486e-05} +{"train_loss": 0.0037042181938886642, "global_step": 24570, "epoch": 206, "lr": 7.41556060165852e-05} +{"train_loss": 0.0039033780340105295, "global_step": 24571, "epoch": 206, "lr": 7.415366618459485e-05} +{"train_loss": 0.0033851624466478825, "global_step": 24572, "epoch": 206, "lr": 7.415172630518135e-05} +{"train_loss": 0.0027623490896075964, "global_step": 24573, "epoch": 206, "lr": 7.414978637834852e-05} +{"train_loss": 0.007187340408563614, "global_step": 24574, "epoch": 206, "lr": 7.414784640410015e-05} +{"train_loss": 0.0055909063667058945, "global_step": 24575, "epoch": 206, "lr": 7.414590638244009e-05} +{"train_loss": 0.0035326951183378696, "global_step": 24576, "epoch": 206, "lr": 7.41439663133721e-05} +{"train_loss": 0.0023211846128106117, "global_step": 24577, "epoch": 206, "lr": 7.414202619690003e-05} +{"train_loss": 0.003958513028919697, "global_step": 24578, "epoch": 206, "lr": 7.414008603302766e-05} +{"train_loss": 0.0024863416329026222, "global_step": 24579, "epoch": 206, "lr": 7.41381458217588e-05} +{"train_loss": 0.0038341879844665527, "global_step": 24580, "epoch": 206, "lr": 7.413620556309729e-05} +{"train_loss": 0.004312584642320871, "global_step": 24581, "epoch": 206, "lr": 7.413426525704692e-05} +{"train_loss": 0.0034673577174544334, "global_step": 24582, "epoch": 206, "lr": 7.413232490361149e-05} +{"train_loss": 0.0022846870124340057, "global_step": 24583, "epoch": 206, "lr": 7.413038450279481e-05} +{"train_loss": 0.004743953235447407, "global_step": 24584, "epoch": 206, "lr": 7.41284440546007e-05} +{"train_loss": 0.003240196732804179, "global_step": 24585, "epoch": 206, "lr": 7.412650355903296e-05} +{"train_loss": 0.0038133319467306137, "global_step": 24586, "epoch": 206, "lr": 7.412456301609543e-05} +{"train_loss": 0.005199967417865992, "global_step": 24587, "epoch": 206, "lr": 7.412262242579189e-05} +{"train_loss": 0.004058647435158491, "global_step": 24588, "epoch": 206, "lr": 7.412068178812616e-05} +{"train_loss": 0.0038664224557578564, "global_step": 24589, "epoch": 206, "lr": 7.411874110310203e-05} +{"train_loss": 0.002234941115602851, "global_step": 24590, "epoch": 206, "lr": 7.411680037072334e-05} +{"train_loss": 0.004679111763834953, "global_step": 24591, "epoch": 206, "lr": 7.411485959099389e-05} +{"train_loss": 0.004015099257230759, "global_step": 24592, "epoch": 206, "lr": 7.41129187639175e-05} +{"train_loss": 0.003438290674239397, "global_step": 24593, "epoch": 206, "lr": 7.411097788949797e-05} +{"train_loss": 0.004852747544646263, "global_step": 24594, "epoch": 206, "lr": 7.41090369677391e-05} +{"train_loss": 0.002992982277646661, "global_step": 24595, "epoch": 206, "lr": 7.410709599864472e-05} +{"train_loss": 0.004824254661798477, "global_step": 24596, "epoch": 206, "lr": 7.410515498221861e-05} +{"train_loss": 0.0029207831248641014, "global_step": 24597, "epoch": 206, "lr": 7.410321391846463e-05} +{"train_loss": 0.0027976795099675655, "global_step": 24598, "epoch": 206, "lr": 7.410127280738655e-05} +{"train_loss": 0.0036710412241518497, "global_step": 24599, "epoch": 206, "lr": 7.409933164898819e-05} +{"train_loss": 0.0044117821380496025, "global_step": 24600, "epoch": 206, "lr": 7.40973904432734e-05} +{"train_loss": 0.002774847438558936, "global_step": 24601, "epoch": 206, "lr": 7.409544919024593e-05} +{"train_loss": 0.003289713291451335, "global_step": 24602, "epoch": 206, "lr": 7.409350788990962e-05} +{"train_loss": 0.003387636039406061, "global_step": 24603, "epoch": 206, "lr": 7.409156654226828e-05} +{"train_loss": 0.00410864595323801, "global_step": 24604, "epoch": 206, "lr": 7.408962514732571e-05} +{"train_loss": 0.002277507446706295, "global_step": 24605, "epoch": 206, "lr": 7.408768370508576e-05} +{"train_loss": 0.0029573680367320776, "global_step": 24606, "epoch": 206, "lr": 7.408574221555222e-05} +{"train_loss": 0.003141500987112522, "global_step": 24607, "epoch": 206, "lr": 7.408380067872889e-05} +{"train_loss": 0.004976777359843254, "global_step": 24608, "epoch": 206, "lr": 7.408185909461959e-05} +{"train_loss": 0.004554609768092632, "global_step": 24609, "epoch": 206, "lr": 7.407991746322812e-05} +{"train_loss": 0.0034044329077005386, "global_step": 24610, "epoch": 206, "lr": 7.407797578455831e-05} +{"train_loss": 0.004598063416779041, "global_step": 24611, "epoch": 206, "lr": 7.407603405861399e-05} +{"train_loss": 0.0033504858147352934, "global_step": 24612, "epoch": 206, "lr": 7.407409228539894e-05} +{"train_loss": 0.0058482554741203785, "global_step": 24613, "epoch": 206, "lr": 7.407215046491695e-05} +{"train_loss": 0.0027597020380198956, "global_step": 24614, "epoch": 206, "lr": 7.40702085971719e-05} +{"train_loss": 0.0032701583113521338, "global_step": 24615, "epoch": 206, "lr": 7.406826668216756e-05} +{"train_loss": 0.004604298155754805, "global_step": 24616, "epoch": 206, "lr": 7.406632471990773e-05} +{"train_loss": 0.0033061469439417124, "global_step": 24617, "epoch": 206, "lr": 7.406438271039627e-05} +{"train_loss": 0.006136844400316477, "global_step": 24618, "epoch": 206, "lr": 7.406244065363695e-05} +{"train_loss": 0.0033959392458200455, "global_step": 24619, "epoch": 206, "lr": 7.406049854963359e-05} +{"train_loss": 0.0024114970583468676, "global_step": 24620, "epoch": 206, "lr": 7.405855639839002e-05} +{"train_loss": 0.004702328704297543, "global_step": 24621, "epoch": 206, "lr": 7.405661419991004e-05} +{"train_loss": 0.0028102314099669456, "global_step": 24622, "epoch": 206, "lr": 7.405467195419749e-05} +{"train_loss": 0.0030354817863553762, "global_step": 24623, "epoch": 206, "lr": 7.405272966125614e-05} +{"train_loss": 0.002208864316344261, "global_step": 24624, "epoch": 206, "lr": 7.405078732108983e-05} +{"train_loss": 0.0035793341230601072, "global_step": 24625, "epoch": 206, "lr": 7.404884493370238e-05} +{"train_loss": 0.004406636580824852, "global_step": 24626, "epoch": 206, "lr": 7.404690249909758e-05} +{"train_loss": 0.004531611688435078, "global_step": 24627, "epoch": 206, "lr": 7.404496001727925e-05} +{"train_loss": 0.003741783555597067, "global_step": 24628, "epoch": 206, "lr": 7.404301748825123e-05} +{"train_loss": 0.002598769497126341, "global_step": 24629, "epoch": 206, "lr": 7.40410749120173e-05} +{"train_loss": 0.0015946890925988555, "global_step": 24630, "epoch": 206, "lr": 7.403913228858128e-05} +{"train_loss": 0.004055113531649113, "global_step": 24631, "epoch": 206, "lr": 7.403718961794702e-05} +{"train_loss": 0.004058183932935177, "global_step": 24632, "epoch": 206, "lr": 7.403524690011829e-05, "val_loss": 0.017294803634285927} +{"train_loss": 0.0026636274997144938, "global_step": 24633, "epoch": 207, "lr": 7.40333041350989e-05} +{"train_loss": 0.005527236964553595, "global_step": 24634, "epoch": 207, "lr": 7.403136132289272e-05} +{"train_loss": 0.0034260423853993416, "global_step": 24635, "epoch": 207, "lr": 7.40294184635035e-05} +{"train_loss": 0.004451618529856205, "global_step": 24636, "epoch": 207, "lr": 7.40274755569351e-05} +{"train_loss": 0.0029228953644633293, "global_step": 24637, "epoch": 207, "lr": 7.402553260319131e-05} +{"train_loss": 0.0035392746794968843, "global_step": 24638, "epoch": 207, "lr": 7.402358960227596e-05} +{"train_loss": 0.0033217468298971653, "global_step": 24639, "epoch": 207, "lr": 7.402164655419286e-05} +{"train_loss": 0.0022744806483387947, "global_step": 24640, "epoch": 207, "lr": 7.401970345894582e-05} +{"train_loss": 0.004730773624032736, "global_step": 24641, "epoch": 207, "lr": 7.401776031653866e-05} +{"train_loss": 0.00452353386208415, "global_step": 24642, "epoch": 207, "lr": 7.401581712697519e-05} +{"train_loss": 0.0029427295085042715, "global_step": 24643, "epoch": 207, "lr": 7.401387389025924e-05} +{"train_loss": 0.004360474646091461, "global_step": 24644, "epoch": 207, "lr": 7.401193060639459e-05} +{"train_loss": 0.004679023288190365, "global_step": 24645, "epoch": 207, "lr": 7.40099872753851e-05} +{"train_loss": 0.0030369157902896404, "global_step": 24646, "epoch": 207, "lr": 7.400804389723458e-05} +{"train_loss": 0.004110574256628752, "global_step": 24647, "epoch": 207, "lr": 7.40061004719468e-05} +{"train_loss": 0.004078458994626999, "global_step": 24648, "epoch": 207, "lr": 7.400415699952561e-05} +{"train_loss": 0.0028257137164473534, "global_step": 24649, "epoch": 207, "lr": 7.400221347997483e-05} +{"train_loss": 0.0026095202192664146, "global_step": 24650, "epoch": 207, "lr": 7.400026991329826e-05} +{"train_loss": 0.0058915261179208755, "global_step": 24651, "epoch": 207, "lr": 7.399832629949974e-05} +{"train_loss": 0.0037269992753863335, "global_step": 24652, "epoch": 207, "lr": 7.399638263858306e-05} +{"train_loss": 0.004166046157479286, "global_step": 24653, "epoch": 207, "lr": 7.399443893055204e-05} +{"train_loss": 0.0043977973982691765, "global_step": 24654, "epoch": 207, "lr": 7.399249517541051e-05} +{"train_loss": 0.0046150595881044865, "global_step": 24655, "epoch": 207, "lr": 7.399055137316228e-05} +{"train_loss": 0.003328643972054124, "global_step": 24656, "epoch": 207, "lr": 7.398860752381118e-05} +{"train_loss": 0.003267850959673524, "global_step": 24657, "epoch": 207, "lr": 7.398666362736098e-05} +{"train_loss": 0.003483640495687723, "global_step": 24658, "epoch": 207, "lr": 7.398471968381555e-05} +{"train_loss": 0.004031555727124214, "global_step": 24659, "epoch": 207, "lr": 7.398277569317869e-05} +{"train_loss": 0.004825142212212086, "global_step": 24660, "epoch": 207, "lr": 7.39808316554542e-05} +{"train_loss": 0.0033757544588297606, "global_step": 24661, "epoch": 207, "lr": 7.39788875706459e-05} +{"train_loss": 0.004448084160685539, "global_step": 24662, "epoch": 207, "lr": 7.397694343875764e-05} +{"train_loss": 0.004330539144575596, "global_step": 24663, "epoch": 207, "lr": 7.39749992597932e-05} +{"train_loss": 0.004029493313282728, "global_step": 24664, "epoch": 207, "lr": 7.39730550337564e-05} +{"train_loss": 0.0049714320339262486, "global_step": 24665, "epoch": 207, "lr": 7.397111076065109e-05} +{"train_loss": 0.004301004111766815, "global_step": 24666, "epoch": 207, "lr": 7.396916644048105e-05} +{"train_loss": 0.002709368709474802, "global_step": 24667, "epoch": 207, "lr": 7.396722207325012e-05} +{"train_loss": 0.0029512092005461454, "global_step": 24668, "epoch": 207, "lr": 7.396527765896211e-05} +{"train_loss": 0.0038657691329717636, "global_step": 24669, "epoch": 207, "lr": 7.396333319762083e-05} +{"train_loss": 0.004451199434697628, "global_step": 24670, "epoch": 207, "lr": 7.39613886892301e-05} +{"train_loss": 0.0037129907868802547, "global_step": 24671, "epoch": 207, "lr": 7.395944413379375e-05} +{"train_loss": 0.0044665890745818615, "global_step": 24672, "epoch": 207, "lr": 7.39574995313156e-05} +{"train_loss": 0.001952423364855349, "global_step": 24673, "epoch": 207, "lr": 7.395555488179945e-05} +{"train_loss": 0.0032834920566529036, "global_step": 24674, "epoch": 207, "lr": 7.395361018524913e-05} +{"train_loss": 0.003088489407673478, "global_step": 24675, "epoch": 207, "lr": 7.395166544166847e-05} +{"train_loss": 0.005424425937235355, "global_step": 24676, "epoch": 207, "lr": 7.394972065106125e-05} +{"train_loss": 0.003499248530715704, "global_step": 24677, "epoch": 207, "lr": 7.394777581343132e-05} +{"train_loss": 0.0031942897476255894, "global_step": 24678, "epoch": 207, "lr": 7.394583092878248e-05} +{"train_loss": 0.0037050643004477024, "global_step": 24679, "epoch": 207, "lr": 7.394388599711859e-05} +{"train_loss": 0.002862286986783147, "global_step": 24680, "epoch": 207, "lr": 7.39419410184434e-05} +{"train_loss": 0.0028476067818701267, "global_step": 24681, "epoch": 207, "lr": 7.39399959927608e-05} +{"train_loss": 0.004901637323200703, "global_step": 24682, "epoch": 207, "lr": 7.393805092007456e-05} +{"train_loss": 0.0046491133980453014, "global_step": 24683, "epoch": 207, "lr": 7.393610580038852e-05} +{"train_loss": 0.005040905438363552, "global_step": 24684, "epoch": 207, "lr": 7.393416063370648e-05} +{"train_loss": 0.004762457683682442, "global_step": 24685, "epoch": 207, "lr": 7.393221542003229e-05} +{"train_loss": 0.004110444337129593, "global_step": 24686, "epoch": 207, "lr": 7.393027015936975e-05} +{"train_loss": 0.0034528481774032116, "global_step": 24687, "epoch": 207, "lr": 7.392832485172266e-05} +{"train_loss": 0.004836168140172958, "global_step": 24688, "epoch": 207, "lr": 7.392637949709488e-05} +{"train_loss": 0.00465907109901309, "global_step": 24689, "epoch": 207, "lr": 7.39244340954902e-05} +{"train_loss": 0.0031434064731001854, "global_step": 24690, "epoch": 207, "lr": 7.392248864691246e-05} +{"train_loss": 0.004429062362760305, "global_step": 24691, "epoch": 207, "lr": 7.392054315136546e-05} +{"train_loss": 0.004749155603349209, "global_step": 24692, "epoch": 207, "lr": 7.391859760885303e-05} +{"train_loss": 0.004804821219295263, "global_step": 24693, "epoch": 207, "lr": 7.3916652019379e-05} +{"train_loss": 0.006015514489263296, "global_step": 24694, "epoch": 207, "lr": 7.391470638294717e-05} +{"train_loss": 0.003400072455406189, "global_step": 24695, "epoch": 207, "lr": 7.391276069956137e-05} +{"train_loss": 0.0018531540408730507, "global_step": 24696, "epoch": 207, "lr": 7.391081496922542e-05} +{"train_loss": 0.003740689717233181, "global_step": 24697, "epoch": 207, "lr": 7.390886919194314e-05} +{"train_loss": 0.003060702932998538, "global_step": 24698, "epoch": 207, "lr": 7.390692336771834e-05} +{"train_loss": 0.0033690803684294224, "global_step": 24699, "epoch": 207, "lr": 7.390497749655487e-05} +{"train_loss": 0.007323660887777805, "global_step": 24700, "epoch": 207, "lr": 7.390303157845651e-05} +{"train_loss": 0.002278188243508339, "global_step": 24701, "epoch": 207, "lr": 7.39010856134271e-05} +{"train_loss": 0.004531013313680887, "global_step": 24702, "epoch": 207, "lr": 7.389913960147048e-05} +{"train_loss": 0.0024110637605190277, "global_step": 24703, "epoch": 207, "lr": 7.389719354259044e-05} +{"train_loss": 0.005135995801538229, "global_step": 24704, "epoch": 207, "lr": 7.389524743679082e-05} +{"train_loss": 0.006876533851027489, "global_step": 24705, "epoch": 207, "lr": 7.389330128407543e-05} +{"train_loss": 0.004418334923684597, "global_step": 24706, "epoch": 207, "lr": 7.389135508444809e-05} +{"train_loss": 0.003133969847112894, "global_step": 24707, "epoch": 207, "lr": 7.388940883791264e-05} +{"train_loss": 0.003588904393836856, "global_step": 24708, "epoch": 207, "lr": 7.388746254447289e-05} +{"train_loss": 0.0060790120624005795, "global_step": 24709, "epoch": 207, "lr": 7.388551620413265e-05} +{"train_loss": 0.003372564446181059, "global_step": 24710, "epoch": 207, "lr": 7.388356981689575e-05} +{"train_loss": 0.004760397598147392, "global_step": 24711, "epoch": 207, "lr": 7.388162338276601e-05} +{"train_loss": 0.003364222589880228, "global_step": 24712, "epoch": 207, "lr": 7.387967690174726e-05} +{"train_loss": 0.0036215565633028746, "global_step": 24713, "epoch": 207, "lr": 7.387773037384333e-05} +{"train_loss": 0.0029345767106860876, "global_step": 24714, "epoch": 207, "lr": 7.3875783799058e-05} +{"train_loss": 0.006673295982182026, "global_step": 24715, "epoch": 207, "lr": 7.387383717739513e-05} +{"train_loss": 0.004579905420541763, "global_step": 24716, "epoch": 207, "lr": 7.387189050885853e-05} +{"train_loss": 0.004595614969730377, "global_step": 24717, "epoch": 207, "lr": 7.386994379345202e-05} +{"train_loss": 0.005753146950155497, "global_step": 24718, "epoch": 207, "lr": 7.386799703117944e-05} +{"train_loss": 0.004374167416244745, "global_step": 24719, "epoch": 207, "lr": 7.386605022204458e-05} +{"train_loss": 0.0034394545946270227, "global_step": 24720, "epoch": 207, "lr": 7.38641033660513e-05} +{"train_loss": 0.006932773161679506, "global_step": 24721, "epoch": 207, "lr": 7.386215646320337e-05} +{"train_loss": 0.005987162236124277, "global_step": 24722, "epoch": 207, "lr": 7.386020951350468e-05} +{"train_loss": 0.004205862991511822, "global_step": 24723, "epoch": 207, "lr": 7.3858262516959e-05} +{"train_loss": 0.007031966000795364, "global_step": 24724, "epoch": 207, "lr": 7.385631547357017e-05} +{"train_loss": 0.002622575731948018, "global_step": 24725, "epoch": 207, "lr": 7.385436838334203e-05} +{"train_loss": 0.0038435838650912046, "global_step": 24726, "epoch": 207, "lr": 7.385242124627838e-05} +{"train_loss": 0.004730864427983761, "global_step": 24727, "epoch": 207, "lr": 7.385047406238304e-05} +{"train_loss": 0.0033727383706718683, "global_step": 24728, "epoch": 207, "lr": 7.384852683165984e-05} +{"train_loss": 0.004502087831497192, "global_step": 24729, "epoch": 207, "lr": 7.384657955411261e-05} +{"train_loss": 0.005091737490147352, "global_step": 24730, "epoch": 207, "lr": 7.384463222974515e-05} +{"train_loss": 0.0035779739264398813, "global_step": 24731, "epoch": 207, "lr": 7.384268485856134e-05} +{"train_loss": 0.004704361315816641, "global_step": 24732, "epoch": 207, "lr": 7.384073744056495e-05} +{"train_loss": 0.007531388662755489, "global_step": 24733, "epoch": 207, "lr": 7.383878997575981e-05} +{"train_loss": 0.0023330484982579947, "global_step": 24734, "epoch": 207, "lr": 7.383684246414975e-05} +{"train_loss": 0.0035629826597869396, "global_step": 24735, "epoch": 207, "lr": 7.383489490573862e-05} +{"train_loss": 0.004930336959660053, "global_step": 24736, "epoch": 207, "lr": 7.383294730053018e-05} +{"train_loss": 0.005358174908906221, "global_step": 24737, "epoch": 207, "lr": 7.383099964852833e-05} +{"train_loss": 0.004108477383852005, "global_step": 24738, "epoch": 207, "lr": 7.382905194973684e-05} +{"train_loss": 0.005635297857224941, "global_step": 24739, "epoch": 207, "lr": 7.382710420415957e-05} +{"train_loss": 0.00554839801043272, "global_step": 24740, "epoch": 207, "lr": 7.382515641180032e-05} +{"train_loss": 0.002922763815149665, "global_step": 24741, "epoch": 207, "lr": 7.382320857266291e-05} +{"train_loss": 0.003918585367500782, "global_step": 24742, "epoch": 207, "lr": 7.382126068675118e-05} +{"train_loss": 0.003744741901755333, "global_step": 24743, "epoch": 207, "lr": 7.381931275406895e-05} +{"train_loss": 0.005135508254170418, "global_step": 24744, "epoch": 207, "lr": 7.381736477462006e-05} +{"train_loss": 0.0044190241023898125, "global_step": 24745, "epoch": 207, "lr": 7.381541674840831e-05} +{"train_loss": 0.0027587292715907097, "global_step": 24746, "epoch": 207, "lr": 7.381346867543752e-05} +{"train_loss": 0.004205770790576935, "global_step": 24747, "epoch": 207, "lr": 7.381152055571153e-05} +{"train_loss": 0.003617984475567937, "global_step": 24748, "epoch": 207, "lr": 7.380957238923417e-05} +{"train_loss": 0.004480175673961639, "global_step": 24749, "epoch": 207, "lr": 7.380762417600927e-05} +{"train_loss": 0.004185056313872337, "global_step": 24750, "epoch": 207, "lr": 7.380567591604062e-05} +{"train_loss": 0.004122672018501125, "global_step": 24751, "epoch": 207, "lr": 7.380372760933208e-05, "val_loss": 0.012248670682311058} +{"train_loss": 0.0035040262155234814, "global_step": 24752, "epoch": 208, "lr": 7.380177925588746e-05} +{"train_loss": 0.004603980109095573, "global_step": 24753, "epoch": 208, "lr": 7.37998308557106e-05} +{"train_loss": 0.0035928713623434305, "global_step": 24754, "epoch": 208, "lr": 7.37978824088053e-05} +{"train_loss": 0.005305551923811436, "global_step": 24755, "epoch": 208, "lr": 7.379593391517541e-05} +{"train_loss": 0.0037708948366343975, "global_step": 24756, "epoch": 208, "lr": 7.379398537482475e-05} +{"train_loss": 0.004509433638304472, "global_step": 24757, "epoch": 208, "lr": 7.379203678775714e-05} +{"train_loss": 0.0035086541902273893, "global_step": 24758, "epoch": 208, "lr": 7.379008815397638e-05} +{"train_loss": 0.005219537299126387, "global_step": 24759, "epoch": 208, "lr": 7.378813947348637e-05} +{"train_loss": 0.0031221939716488123, "global_step": 24760, "epoch": 208, "lr": 7.378619074629085e-05} +{"train_loss": 0.004438017960637808, "global_step": 24761, "epoch": 208, "lr": 7.378424197239371e-05} +{"train_loss": 0.0022944749798625708, "global_step": 24762, "epoch": 208, "lr": 7.378229315179874e-05} +{"train_loss": 0.005726618692278862, "global_step": 24763, "epoch": 208, "lr": 7.37803442845098e-05} +{"train_loss": 0.0022126499097794294, "global_step": 24764, "epoch": 208, "lr": 7.377839537053066e-05} +{"train_loss": 0.004580020438879728, "global_step": 24765, "epoch": 208, "lr": 7.37764464098652e-05} +{"train_loss": 0.0021881824359297752, "global_step": 24766, "epoch": 208, "lr": 7.377449740251723e-05} +{"train_loss": 0.0035575884394347668, "global_step": 24767, "epoch": 208, "lr": 7.377254834849057e-05} +{"train_loss": 0.0061713093891739845, "global_step": 24768, "epoch": 208, "lr": 7.377059924778904e-05} +{"train_loss": 0.0030884849838912487, "global_step": 24769, "epoch": 208, "lr": 7.37686501004165e-05} +{"train_loss": 0.0022242784034460783, "global_step": 24770, "epoch": 208, "lr": 7.376670090637675e-05} +{"train_loss": 0.0036301587242633104, "global_step": 24771, "epoch": 208, "lr": 7.37647516656736e-05} +{"train_loss": 0.003952271770685911, "global_step": 24772, "epoch": 208, "lr": 7.376280237831092e-05} +{"train_loss": 0.00448396522551775, "global_step": 24773, "epoch": 208, "lr": 7.37608530442925e-05} +{"train_loss": 0.0015989405801519752, "global_step": 24774, "epoch": 208, "lr": 7.37589036636222e-05} +{"train_loss": 0.005132175981998444, "global_step": 24775, "epoch": 208, "lr": 7.375695423630381e-05} +{"train_loss": 0.004008189775049686, "global_step": 24776, "epoch": 208, "lr": 7.375500476234121e-05} +{"train_loss": 0.004847563803195953, "global_step": 24777, "epoch": 208, "lr": 7.375305524173818e-05} +{"train_loss": 0.0032012644223868847, "global_step": 24778, "epoch": 208, "lr": 7.375110567449855e-05} +{"train_loss": 0.004341623745858669, "global_step": 24779, "epoch": 208, "lr": 7.374915606062617e-05} +{"train_loss": 0.003857564879581332, "global_step": 24780, "epoch": 208, "lr": 7.374720640012487e-05} +{"train_loss": 0.004589879885315895, "global_step": 24781, "epoch": 208, "lr": 7.374525669299847e-05} +{"train_loss": 0.004033513832837343, "global_step": 24782, "epoch": 208, "lr": 7.374330693925079e-05} +{"train_loss": 0.0033213046845048666, "global_step": 24783, "epoch": 208, "lr": 7.374135713888566e-05} +{"train_loss": 0.002812915248796344, "global_step": 24784, "epoch": 208, "lr": 7.37394072919069e-05} +{"train_loss": 0.0037342391442507505, "global_step": 24785, "epoch": 208, "lr": 7.373745739831836e-05} +{"train_loss": 0.0037729674950242043, "global_step": 24786, "epoch": 208, "lr": 7.373550745812386e-05} +{"train_loss": 0.0035234722308814526, "global_step": 24787, "epoch": 208, "lr": 7.373355747132722e-05} +{"train_loss": 0.0028027244843542576, "global_step": 24788, "epoch": 208, "lr": 7.373160743793229e-05} +{"train_loss": 0.0030879448167979717, "global_step": 24789, "epoch": 208, "lr": 7.372965735794288e-05} +{"train_loss": 0.002414523856714368, "global_step": 24790, "epoch": 208, "lr": 7.372770723136282e-05} +{"train_loss": 0.005178089719265699, "global_step": 24791, "epoch": 208, "lr": 7.372575705819593e-05} +{"train_loss": 0.0062147327698767185, "global_step": 24792, "epoch": 208, "lr": 7.372380683844607e-05} +{"train_loss": 0.00429656682536006, "global_step": 24793, "epoch": 208, "lr": 7.372185657211704e-05} +{"train_loss": 0.002789233112707734, "global_step": 24794, "epoch": 208, "lr": 7.371990625921268e-05} +{"train_loss": 0.004082608036696911, "global_step": 24795, "epoch": 208, "lr": 7.371795589973682e-05} +{"train_loss": 0.004162735305726528, "global_step": 24796, "epoch": 208, "lr": 7.371600549369328e-05} +{"train_loss": 0.007065167650580406, "global_step": 24797, "epoch": 208, "lr": 7.37140550410859e-05} +{"train_loss": 0.004020058549940586, "global_step": 24798, "epoch": 208, "lr": 7.371210454191851e-05} +{"train_loss": 0.002711788285523653, "global_step": 24799, "epoch": 208, "lr": 7.371015399619494e-05} +{"train_loss": 0.003444806905463338, "global_step": 24800, "epoch": 208, "lr": 7.370820340391901e-05} +{"train_loss": 0.004590487107634544, "global_step": 24801, "epoch": 208, "lr": 7.370625276509456e-05} +{"train_loss": 0.0056737130507826805, "global_step": 24802, "epoch": 208, "lr": 7.370430207972541e-05} +{"train_loss": 0.0024675391614437103, "global_step": 24803, "epoch": 208, "lr": 7.370235134781539e-05} +{"train_loss": 0.0018358377274125814, "global_step": 24804, "epoch": 208, "lr": 7.370040056936834e-05} +{"train_loss": 0.0038474402390420437, "global_step": 24805, "epoch": 208, "lr": 7.369844974438809e-05} +{"train_loss": 0.005994400009512901, "global_step": 24806, "epoch": 208, "lr": 7.369649887287847e-05} +{"train_loss": 0.00465814396739006, "global_step": 24807, "epoch": 208, "lr": 7.36945479548433e-05} +{"train_loss": 0.0032822792418301105, "global_step": 24808, "epoch": 208, "lr": 7.369259699028641e-05} +{"train_loss": 0.0033618530724197626, "global_step": 24809, "epoch": 208, "lr": 7.369064597921164e-05} +{"train_loss": 0.0042347777634859085, "global_step": 24810, "epoch": 208, "lr": 7.368869492162283e-05} +{"train_loss": 0.0055591207928955555, "global_step": 24811, "epoch": 208, "lr": 7.368674381752378e-05} +{"train_loss": 0.005179365165531635, "global_step": 24812, "epoch": 208, "lr": 7.368479266691834e-05} +{"train_loss": 0.003699543420225382, "global_step": 24813, "epoch": 208, "lr": 7.368284146981037e-05} +{"train_loss": 0.005426014773547649, "global_step": 24814, "epoch": 208, "lr": 7.368089022620365e-05} +{"train_loss": 0.003651695791631937, "global_step": 24815, "epoch": 208, "lr": 7.367893893610203e-05} +{"train_loss": 0.006031797733157873, "global_step": 24816, "epoch": 208, "lr": 7.367698759950934e-05} +{"train_loss": 0.0024089873768389225, "global_step": 24817, "epoch": 208, "lr": 7.367503621642942e-05} +{"train_loss": 0.004446685314178467, "global_step": 24818, "epoch": 208, "lr": 7.367308478686608e-05} +{"train_loss": 0.0032458172645419836, "global_step": 24819, "epoch": 208, "lr": 7.367113331082318e-05} +{"train_loss": 0.0041135153733193874, "global_step": 24820, "epoch": 208, "lr": 7.366918178830455e-05} +{"train_loss": 0.0027351530734449625, "global_step": 24821, "epoch": 208, "lr": 7.366723021931399e-05} +{"train_loss": 0.002607652684673667, "global_step": 24822, "epoch": 208, "lr": 7.366527860385537e-05} +{"train_loss": 0.0043227835558354855, "global_step": 24823, "epoch": 208, "lr": 7.366332694193249e-05} +{"train_loss": 0.00477979239076376, "global_step": 24824, "epoch": 208, "lr": 7.36613752335492e-05} +{"train_loss": 0.0030426920857280493, "global_step": 24825, "epoch": 208, "lr": 7.365942347870933e-05} +{"train_loss": 0.00324059696868062, "global_step": 24826, "epoch": 208, "lr": 7.36574716774167e-05} +{"train_loss": 0.0030064599122852087, "global_step": 24827, "epoch": 208, "lr": 7.365551982967518e-05} +{"train_loss": 0.004398735240101814, "global_step": 24828, "epoch": 208, "lr": 7.365356793548855e-05} +{"train_loss": 0.005438464228063822, "global_step": 24829, "epoch": 208, "lr": 7.365161599486067e-05} +{"train_loss": 0.0022518369369208813, "global_step": 24830, "epoch": 208, "lr": 7.364966400779536e-05} +{"train_loss": 0.0033910158090293407, "global_step": 24831, "epoch": 208, "lr": 7.364771197429649e-05} +{"train_loss": 0.006121787708252668, "global_step": 24832, "epoch": 208, "lr": 7.364575989436784e-05} +{"train_loss": 0.003911973908543587, "global_step": 24833, "epoch": 208, "lr": 7.364380776801327e-05} +{"train_loss": 0.003449636045843363, "global_step": 24834, "epoch": 208, "lr": 7.36418555952366e-05} +{"train_loss": 0.0038930962327867746, "global_step": 24835, "epoch": 208, "lr": 7.363990337604167e-05} +{"train_loss": 0.003448428586125374, "global_step": 24836, "epoch": 208, "lr": 7.363795111043233e-05} +{"train_loss": 0.0047644744627177715, "global_step": 24837, "epoch": 208, "lr": 7.36359987984124e-05} +{"train_loss": 0.003603840246796608, "global_step": 24838, "epoch": 208, "lr": 7.363404643998572e-05} +{"train_loss": 0.0035427375696599483, "global_step": 24839, "epoch": 208, "lr": 7.36320940351561e-05} +{"train_loss": 0.003718009917065501, "global_step": 24840, "epoch": 208, "lr": 7.363014158392739e-05} +{"train_loss": 0.00275323330424726, "global_step": 24841, "epoch": 208, "lr": 7.362818908630343e-05} +{"train_loss": 0.004289119970053434, "global_step": 24842, "epoch": 208, "lr": 7.362623654228802e-05} +{"train_loss": 0.0030835368670523167, "global_step": 24843, "epoch": 208, "lr": 7.362428395188505e-05} +{"train_loss": 0.0030106999911367893, "global_step": 24844, "epoch": 208, "lr": 7.36223313150983e-05} +{"train_loss": 0.0035391580313444138, "global_step": 24845, "epoch": 208, "lr": 7.362037863193164e-05} +{"train_loss": 0.0031038334127515554, "global_step": 24846, "epoch": 208, "lr": 7.361842590238889e-05} +{"train_loss": 0.00311831827275455, "global_step": 24847, "epoch": 208, "lr": 7.361647312647388e-05} +{"train_loss": 0.002304930705577135, "global_step": 24848, "epoch": 208, "lr": 7.361452030419044e-05} +{"train_loss": 0.0044045234099030495, "global_step": 24849, "epoch": 208, "lr": 7.361256743554241e-05} +{"train_loss": 0.0022363297175616026, "global_step": 24850, "epoch": 208, "lr": 7.361061452053364e-05} +{"train_loss": 0.003638649359345436, "global_step": 24851, "epoch": 208, "lr": 7.360866155916795e-05} +{"train_loss": 0.004498446825891733, "global_step": 24852, "epoch": 208, "lr": 7.360670855144916e-05} +{"train_loss": 0.004811441525816917, "global_step": 24853, "epoch": 208, "lr": 7.360475549738114e-05} +{"train_loss": 0.004698770586401224, "global_step": 24854, "epoch": 208, "lr": 7.360280239696768e-05} +{"train_loss": 0.003525643376633525, "global_step": 24855, "epoch": 208, "lr": 7.360084925021266e-05} +{"train_loss": 0.0027196079026907682, "global_step": 24856, "epoch": 208, "lr": 7.35988960571199e-05} +{"train_loss": 0.0020720772445201874, "global_step": 24857, "epoch": 208, "lr": 7.359694281769321e-05} +{"train_loss": 0.002457672031596303, "global_step": 24858, "epoch": 208, "lr": 7.359498953193647e-05} +{"train_loss": 0.005618006456643343, "global_step": 24859, "epoch": 208, "lr": 7.359303619985346e-05} +{"train_loss": 0.0030955683905631304, "global_step": 24860, "epoch": 208, "lr": 7.359108282144806e-05} +{"train_loss": 0.004285313654690981, "global_step": 24861, "epoch": 208, "lr": 7.358912939672407e-05} +{"train_loss": 0.001983404392376542, "global_step": 24862, "epoch": 208, "lr": 7.358717592568535e-05} +{"train_loss": 0.0033012977801263332, "global_step": 24863, "epoch": 208, "lr": 7.358522240833575e-05} +{"train_loss": 0.002023599809035659, "global_step": 24864, "epoch": 208, "lr": 7.358326884467908e-05} +{"train_loss": 0.0022919396869838238, "global_step": 24865, "epoch": 208, "lr": 7.358131523471917e-05} +{"train_loss": 0.004168829880654812, "global_step": 24866, "epoch": 208, "lr": 7.357936157845988e-05} +{"train_loss": 0.00604258943349123, "global_step": 24867, "epoch": 208, "lr": 7.357740787590501e-05} +{"train_loss": 0.002746485872194171, "global_step": 24868, "epoch": 208, "lr": 7.357545412705843e-05} +{"train_loss": 0.001963680610060692, "global_step": 24869, "epoch": 208, "lr": 7.357350033192397e-05} +{"train_loss": 0.0037904537230057, "global_step": 24870, "epoch": 208, "lr": 7.357154649050545e-05, "val_loss": 0.01586897298693657} +{"train_loss": 0.0033574579283595085, "global_step": 24871, "epoch": 209, "lr": 7.356959260280672e-05} +{"train_loss": 0.004342182073742151, "global_step": 24872, "epoch": 209, "lr": 7.356763866883163e-05} +{"train_loss": 0.0037821652367711067, "global_step": 24873, "epoch": 209, "lr": 7.356568468858398e-05} +{"train_loss": 0.004802453797310591, "global_step": 24874, "epoch": 209, "lr": 7.356373066206763e-05} +{"train_loss": 0.0031863576732575893, "global_step": 24875, "epoch": 209, "lr": 7.356177658928643e-05} +{"train_loss": 0.004198934882879257, "global_step": 24876, "epoch": 209, "lr": 7.355982247024418e-05} +{"train_loss": 0.004444416146725416, "global_step": 24877, "epoch": 209, "lr": 7.355786830494474e-05} +{"train_loss": 0.005150325130671263, "global_step": 24878, "epoch": 209, "lr": 7.355591409339193e-05} +{"train_loss": 0.005024473648518324, "global_step": 24879, "epoch": 209, "lr": 7.355395983558961e-05} +{"train_loss": 0.0038391114212572575, "global_step": 24880, "epoch": 209, "lr": 7.35520055315416e-05} +{"train_loss": 0.004973402246832848, "global_step": 24881, "epoch": 209, "lr": 7.355005118125175e-05} +{"train_loss": 0.003722366178408265, "global_step": 24882, "epoch": 209, "lr": 7.35480967847239e-05} +{"train_loss": 0.0030711607541888952, "global_step": 24883, "epoch": 209, "lr": 7.354614234196187e-05} +{"train_loss": 0.005179624073207378, "global_step": 24884, "epoch": 209, "lr": 7.35441878529695e-05} +{"train_loss": 0.00458905752748251, "global_step": 24885, "epoch": 209, "lr": 7.354223331775063e-05} +{"train_loss": 0.0030181994661688805, "global_step": 24886, "epoch": 209, "lr": 7.35402787363091e-05} +{"train_loss": 0.003020408097654581, "global_step": 24887, "epoch": 209, "lr": 7.353832410864876e-05} +{"train_loss": 0.004588100593537092, "global_step": 24888, "epoch": 209, "lr": 7.353636943477343e-05} +{"train_loss": 0.004042016342282295, "global_step": 24889, "epoch": 209, "lr": 7.353441471468695e-05} +{"train_loss": 0.0030794176273047924, "global_step": 24890, "epoch": 209, "lr": 7.353245994839316e-05} +{"train_loss": 0.003257466945797205, "global_step": 24891, "epoch": 209, "lr": 7.35305051358959e-05} +{"train_loss": 0.0031738774850964546, "global_step": 24892, "epoch": 209, "lr": 7.3528550277199e-05} +{"train_loss": 0.002932718489319086, "global_step": 24893, "epoch": 209, "lr": 7.352659537230633e-05} +{"train_loss": 0.004734170623123646, "global_step": 24894, "epoch": 209, "lr": 7.352464042122169e-05} +{"train_loss": 0.005898569710552692, "global_step": 24895, "epoch": 209, "lr": 7.352268542394893e-05} +{"train_loss": 0.002974043833091855, "global_step": 24896, "epoch": 209, "lr": 7.352073038049189e-05} +{"train_loss": 0.00443278718739748, "global_step": 24897, "epoch": 209, "lr": 7.351877529085441e-05} +{"train_loss": 0.004963114857673645, "global_step": 24898, "epoch": 209, "lr": 7.351682015504031e-05} +{"train_loss": 0.006173601374030113, "global_step": 24899, "epoch": 209, "lr": 7.351486497305347e-05} +{"train_loss": 0.0040071564726531506, "global_step": 24900, "epoch": 209, "lr": 7.351290974489768e-05} +{"train_loss": 0.00420471653342247, "global_step": 24901, "epoch": 209, "lr": 7.351095447057683e-05} +{"train_loss": 0.002705428283661604, "global_step": 24902, "epoch": 209, "lr": 7.350899915009472e-05} +{"train_loss": 0.0034464807249605656, "global_step": 24903, "epoch": 209, "lr": 7.35070437834552e-05} +{"train_loss": 0.0034538679756224155, "global_step": 24904, "epoch": 209, "lr": 7.350508837066213e-05} +{"train_loss": 0.0020619758870452642, "global_step": 24905, "epoch": 209, "lr": 7.35031329117193e-05} +{"train_loss": 0.005354094784706831, "global_step": 24906, "epoch": 209, "lr": 7.350117740663059e-05} +{"train_loss": 0.004990261048078537, "global_step": 24907, "epoch": 209, "lr": 7.349922185539985e-05} +{"train_loss": 0.0040491013787686825, "global_step": 24908, "epoch": 209, "lr": 7.349726625803087e-05} +{"train_loss": 0.0043776677921414375, "global_step": 24909, "epoch": 209, "lr": 7.349531061452753e-05} +{"train_loss": 0.006307498086243868, "global_step": 24910, "epoch": 209, "lr": 7.349335492489367e-05} +{"train_loss": 0.004871897399425507, "global_step": 24911, "epoch": 209, "lr": 7.349139918913309e-05} +{"train_loss": 0.005460946820676327, "global_step": 24912, "epoch": 209, "lr": 7.348944340724968e-05} +{"train_loss": 0.004256001673638821, "global_step": 24913, "epoch": 209, "lr": 7.348748757924726e-05} +{"train_loss": 0.004604110028594732, "global_step": 24914, "epoch": 209, "lr": 7.348553170512965e-05} +{"train_loss": 0.004169005900621414, "global_step": 24915, "epoch": 209, "lr": 7.348357578490072e-05} +{"train_loss": 0.005303064826875925, "global_step": 24916, "epoch": 209, "lr": 7.348161981856428e-05} +{"train_loss": 0.003386326367035508, "global_step": 24917, "epoch": 209, "lr": 7.347966380612421e-05} +{"train_loss": 0.006157758180052042, "global_step": 24918, "epoch": 209, "lr": 7.34777077475843e-05} +{"train_loss": 0.003483760403469205, "global_step": 24919, "epoch": 209, "lr": 7.347575164294845e-05} +{"train_loss": 0.003849914763122797, "global_step": 24920, "epoch": 209, "lr": 7.347379549222047e-05} +{"train_loss": 0.003850021865218878, "global_step": 24921, "epoch": 209, "lr": 7.347183929540417e-05} +{"train_loss": 0.002038436708971858, "global_step": 24922, "epoch": 209, "lr": 7.346988305250345e-05} +{"train_loss": 0.0030781705863773823, "global_step": 24923, "epoch": 209, "lr": 7.34679267635221e-05} +{"train_loss": 0.006218730937689543, "global_step": 24924, "epoch": 209, "lr": 7.346597042846399e-05} +{"train_loss": 0.0035924569237977266, "global_step": 24925, "epoch": 209, "lr": 7.346401404733297e-05} +{"train_loss": 0.003110563848167658, "global_step": 24926, "epoch": 209, "lr": 7.346205762013285e-05} +{"train_loss": 0.0030591520480811596, "global_step": 24927, "epoch": 209, "lr": 7.34601011468675e-05} +{"train_loss": 0.004203794524073601, "global_step": 24928, "epoch": 209, "lr": 7.345814462754074e-05} +{"train_loss": 0.0048524364829063416, "global_step": 24929, "epoch": 209, "lr": 7.34561880621564e-05} +{"train_loss": 0.004133114591240883, "global_step": 24930, "epoch": 209, "lr": 7.345423145071836e-05} +{"train_loss": 0.003227504435926676, "global_step": 24931, "epoch": 209, "lr": 7.345227479323045e-05} +{"train_loss": 0.004093494266271591, "global_step": 24932, "epoch": 209, "lr": 7.345031808969649e-05} +{"train_loss": 0.0038434797897934914, "global_step": 24933, "epoch": 209, "lr": 7.344836134012035e-05} +{"train_loss": 0.003799786791205406, "global_step": 24934, "epoch": 209, "lr": 7.344640454450583e-05} +{"train_loss": 0.0048935264348983765, "global_step": 24935, "epoch": 209, "lr": 7.344444770285681e-05} +{"train_loss": 0.00407306058332324, "global_step": 24936, "epoch": 209, "lr": 7.344249081517714e-05} +{"train_loss": 0.0019931625574827194, "global_step": 24937, "epoch": 209, "lr": 7.344053388147064e-05} +{"train_loss": 0.0034007953945547342, "global_step": 24938, "epoch": 209, "lr": 7.343857690174114e-05} +{"train_loss": 0.007123423740267754, "global_step": 24939, "epoch": 209, "lr": 7.34366198759925e-05} +{"train_loss": 0.004354072734713554, "global_step": 24940, "epoch": 209, "lr": 7.343466280422858e-05} +{"train_loss": 0.003395993961021304, "global_step": 24941, "epoch": 209, "lr": 7.343270568645319e-05} +{"train_loss": 0.003952141385525465, "global_step": 24942, "epoch": 209, "lr": 7.343074852267018e-05} +{"train_loss": 0.004699161276221275, "global_step": 24943, "epoch": 209, "lr": 7.34287913128834e-05} +{"train_loss": 0.0029246045742183924, "global_step": 24944, "epoch": 209, "lr": 7.34268340570967e-05} +{"train_loss": 0.002446977188810706, "global_step": 24945, "epoch": 209, "lr": 7.34248767553139e-05} +{"train_loss": 0.003514273790642619, "global_step": 24946, "epoch": 209, "lr": 7.342291940753889e-05} +{"train_loss": 0.0032125888392329216, "global_step": 24947, "epoch": 209, "lr": 7.342096201377544e-05} +{"train_loss": 0.00361016602255404, "global_step": 24948, "epoch": 209, "lr": 7.341900457402746e-05} +{"train_loss": 0.004135785158723593, "global_step": 24949, "epoch": 209, "lr": 7.341704708829875e-05} +{"train_loss": 0.0024772854521870613, "global_step": 24950, "epoch": 209, "lr": 7.341508955659318e-05} +{"train_loss": 0.004397350363433361, "global_step": 24951, "epoch": 209, "lr": 7.341313197891457e-05} +{"train_loss": 0.003655961947515607, "global_step": 24952, "epoch": 209, "lr": 7.341117435526679e-05} +{"train_loss": 0.0023813950829207897, "global_step": 24953, "epoch": 209, "lr": 7.340921668565367e-05} +{"train_loss": 0.0029457653872668743, "global_step": 24954, "epoch": 209, "lr": 7.340725897007905e-05} +{"train_loss": 0.004907786380499601, "global_step": 24955, "epoch": 209, "lr": 7.340530120854677e-05} +{"train_loss": 0.00468473369255662, "global_step": 24956, "epoch": 209, "lr": 7.34033434010607e-05} +{"train_loss": 0.003519403748214245, "global_step": 24957, "epoch": 209, "lr": 7.340138554762465e-05} +{"train_loss": 0.002180134877562523, "global_step": 24958, "epoch": 209, "lr": 7.33994276482425e-05} +{"train_loss": 0.003089194418862462, "global_step": 24959, "epoch": 209, "lr": 7.339746970291806e-05} +{"train_loss": 0.0036006569862365723, "global_step": 24960, "epoch": 209, "lr": 7.339551171165517e-05} +{"train_loss": 0.0036210189573466778, "global_step": 24961, "epoch": 209, "lr": 7.339355367445772e-05} +{"train_loss": 0.0035294287372380495, "global_step": 24962, "epoch": 209, "lr": 7.339159559132951e-05} +{"train_loss": 0.0034642061218619347, "global_step": 24963, "epoch": 209, "lr": 7.338963746227441e-05} +{"train_loss": 0.0024298238568007946, "global_step": 24964, "epoch": 209, "lr": 7.338767928729625e-05} +{"train_loss": 0.0024164323695003986, "global_step": 24965, "epoch": 209, "lr": 7.338572106639888e-05} +{"train_loss": 0.005403823219239712, "global_step": 24966, "epoch": 209, "lr": 7.338376279958614e-05} +{"train_loss": 0.005114329047501087, "global_step": 24967, "epoch": 209, "lr": 7.338180448686189e-05} +{"train_loss": 0.0016626202268525958, "global_step": 24968, "epoch": 209, "lr": 7.337984612822996e-05} +{"train_loss": 0.006126134656369686, "global_step": 24969, "epoch": 209, "lr": 7.337788772369421e-05} +{"train_loss": 0.0024443534202873707, "global_step": 24970, "epoch": 209, "lr": 7.337592927325848e-05} +{"train_loss": 0.0033253622241318226, "global_step": 24971, "epoch": 209, "lr": 7.337397077692658e-05} +{"train_loss": 0.0031704094726592302, "global_step": 24972, "epoch": 209, "lr": 7.33720122347024e-05} +{"train_loss": 0.005824731197208166, "global_step": 24973, "epoch": 209, "lr": 7.337005364658977e-05} +{"train_loss": 0.0032815805170685053, "global_step": 24974, "epoch": 209, "lr": 7.336809501259254e-05} +{"train_loss": 0.003712332807481289, "global_step": 24975, "epoch": 209, "lr": 7.336613633271456e-05} +{"train_loss": 0.003925041761249304, "global_step": 24976, "epoch": 209, "lr": 7.336417760695965e-05} +{"train_loss": 0.0028056513983756304, "global_step": 24977, "epoch": 209, "lr": 7.33622188353317e-05} +{"train_loss": 0.0019126455299556255, "global_step": 24978, "epoch": 209, "lr": 7.336026001783451e-05} +{"train_loss": 0.0045307897962629795, "global_step": 24979, "epoch": 209, "lr": 7.335830115447194e-05} +{"train_loss": 0.005510968156158924, "global_step": 24980, "epoch": 209, "lr": 7.335634224524786e-05} +{"train_loss": 0.0034500877372920513, "global_step": 24981, "epoch": 209, "lr": 7.335438329016607e-05} +{"train_loss": 0.00604181457310915, "global_step": 24982, "epoch": 209, "lr": 7.335242428923046e-05} +{"train_loss": 0.002096667420119047, "global_step": 24983, "epoch": 209, "lr": 7.335046524244486e-05} +{"train_loss": 0.0027497343253344297, "global_step": 24984, "epoch": 209, "lr": 7.334850614981312e-05} +{"train_loss": 0.0025924674700945616, "global_step": 24985, "epoch": 209, "lr": 7.334654701133907e-05} +{"train_loss": 0.004332107957452536, "global_step": 24986, "epoch": 209, "lr": 7.334458782702658e-05} +{"train_loss": 0.00329687655903399, "global_step": 24987, "epoch": 209, "lr": 7.334262859687948e-05} +{"train_loss": 0.004049520939588547, "global_step": 24988, "epoch": 209, "lr": 7.334066932090164e-05} +{"train_loss": 0.003906669033526936, "global_step": 24989, "epoch": 209, "lr": 7.333870999909686e-05, "val_loss": 0.020298093557357788} +{"train_loss": 0.005271194502711296, "global_step": 24990, "epoch": 210, "lr": 7.333675063146904e-05} +{"train_loss": 0.0034212698228657246, "global_step": 24991, "epoch": 210, "lr": 7.3334791218022e-05} +{"train_loss": 0.0022549526765942574, "global_step": 24992, "epoch": 210, "lr": 7.333283175875957e-05} +{"train_loss": 0.004978138022124767, "global_step": 24993, "epoch": 210, "lr": 7.333087225368564e-05} +{"train_loss": 0.002880455693230033, "global_step": 24994, "epoch": 210, "lr": 7.332891270280403e-05} +{"train_loss": 0.00560937263071537, "global_step": 24995, "epoch": 210, "lr": 7.332695310611859e-05} +{"train_loss": 0.003047446720302105, "global_step": 24996, "epoch": 210, "lr": 7.332499346363317e-05} +{"train_loss": 0.006008737254887819, "global_step": 24997, "epoch": 210, "lr": 7.332303377535162e-05} +{"train_loss": 0.00386275677010417, "global_step": 24998, "epoch": 210, "lr": 7.332107404127777e-05} +{"train_loss": 0.0047196573577821255, "global_step": 24999, "epoch": 210, "lr": 7.33191142614155e-05} +{"train_loss": 0.003178210696205497, "global_step": 25000, "epoch": 210, "lr": 7.331715443576863e-05} +{"train_loss": 0.005454261787235737, "global_step": 25001, "epoch": 210, "lr": 7.331519456434102e-05} +{"train_loss": 0.007181193679571152, "global_step": 25002, "epoch": 210, "lr": 7.331323464713651e-05} +{"train_loss": 0.004649731796234846, "global_step": 25003, "epoch": 210, "lr": 7.331127468415897e-05} +{"train_loss": 0.004142552148550749, "global_step": 25004, "epoch": 210, "lr": 7.330931467541222e-05} +{"train_loss": 0.0035154272336512804, "global_step": 25005, "epoch": 210, "lr": 7.330735462090013e-05} +{"train_loss": 0.004293282516300678, "global_step": 25006, "epoch": 210, "lr": 7.330539452062654e-05} +{"train_loss": 0.003803327912464738, "global_step": 25007, "epoch": 210, "lr": 7.33034343745953e-05} +{"train_loss": 0.002506229095160961, "global_step": 25008, "epoch": 210, "lr": 7.330147418281025e-05} +{"train_loss": 0.0034995065070688725, "global_step": 25009, "epoch": 210, "lr": 7.329951394527524e-05} +{"train_loss": 0.0042502256110310555, "global_step": 25010, "epoch": 210, "lr": 7.329755366199414e-05} +{"train_loss": 0.005692328792065382, "global_step": 25011, "epoch": 210, "lr": 7.329559333297076e-05} +{"train_loss": 0.0051540182903409, "global_step": 25012, "epoch": 210, "lr": 7.329363295820898e-05} +{"train_loss": 0.004333277232944965, "global_step": 25013, "epoch": 210, "lr": 7.329167253771265e-05} +{"train_loss": 0.0035219474229961634, "global_step": 25014, "epoch": 210, "lr": 7.32897120714856e-05} +{"train_loss": 0.0041058119386434555, "global_step": 25015, "epoch": 210, "lr": 7.328775155953168e-05} +{"train_loss": 0.002437953371554613, "global_step": 25016, "epoch": 210, "lr": 7.328579100185476e-05} +{"train_loss": 0.0023574659135192633, "global_step": 25017, "epoch": 210, "lr": 7.328383039845868e-05} +{"train_loss": 0.004006709437817335, "global_step": 25018, "epoch": 210, "lr": 7.328186974934728e-05} +{"train_loss": 0.003212209325283766, "global_step": 25019, "epoch": 210, "lr": 7.327990905452442e-05} +{"train_loss": 0.006262725219130516, "global_step": 25020, "epoch": 210, "lr": 7.327794831399394e-05} +{"train_loss": 0.007070486433804035, "global_step": 25021, "epoch": 210, "lr": 7.32759875277597e-05} +{"train_loss": 0.0033907301258295774, "global_step": 25022, "epoch": 210, "lr": 7.327402669582554e-05} +{"train_loss": 0.00425936421379447, "global_step": 25023, "epoch": 210, "lr": 7.327206581819532e-05} +{"train_loss": 0.005279855336993933, "global_step": 25024, "epoch": 210, "lr": 7.327010489487288e-05} +{"train_loss": 0.0035761548206210136, "global_step": 25025, "epoch": 210, "lr": 7.326814392586208e-05} +{"train_loss": 0.0033405537251383066, "global_step": 25026, "epoch": 210, "lr": 7.326618291116678e-05} +{"train_loss": 0.007551582995802164, "global_step": 25027, "epoch": 210, "lr": 7.32642218507908e-05} +{"train_loss": 0.00436015147715807, "global_step": 25028, "epoch": 210, "lr": 7.3262260744738e-05} +{"train_loss": 0.005342225544154644, "global_step": 25029, "epoch": 210, "lr": 7.326029959301224e-05} +{"train_loss": 0.0065458184108138084, "global_step": 25030, "epoch": 210, "lr": 7.325833839561736e-05} +{"train_loss": 0.0059767113998532295, "global_step": 25031, "epoch": 210, "lr": 7.325637715255722e-05} +{"train_loss": 0.004548666067421436, "global_step": 25032, "epoch": 210, "lr": 7.325441586383568e-05} +{"train_loss": 0.003363176714628935, "global_step": 25033, "epoch": 210, "lr": 7.325245452945658e-05} +{"train_loss": 0.0027830111794173717, "global_step": 25034, "epoch": 210, "lr": 7.325049314942375e-05} +{"train_loss": 0.006995579693466425, "global_step": 25035, "epoch": 210, "lr": 7.324853172374107e-05} +{"train_loss": 0.0039542424492537975, "global_step": 25036, "epoch": 210, "lr": 7.324657025241239e-05} +{"train_loss": 0.009010327979922295, "global_step": 25037, "epoch": 210, "lr": 7.324460873544155e-05} +{"train_loss": 0.003943499177694321, "global_step": 25038, "epoch": 210, "lr": 7.32426471728324e-05} +{"train_loss": 0.005696149077266455, "global_step": 25039, "epoch": 210, "lr": 7.324068556458879e-05} +{"train_loss": 0.002457454800605774, "global_step": 25040, "epoch": 210, "lr": 7.32387239107146e-05} +{"train_loss": 0.003358451183885336, "global_step": 25041, "epoch": 210, "lr": 7.323676221121362e-05} +{"train_loss": 0.006970780901610851, "global_step": 25042, "epoch": 210, "lr": 7.323480046608977e-05} +{"train_loss": 0.004068585112690926, "global_step": 25043, "epoch": 210, "lr": 7.323283867534687e-05} +{"train_loss": 0.005906539037823677, "global_step": 25044, "epoch": 210, "lr": 7.323087683898878e-05} +{"train_loss": 0.003554439637809992, "global_step": 25045, "epoch": 210, "lr": 7.322891495701933e-05} +{"train_loss": 0.0019678703974932432, "global_step": 25046, "epoch": 210, "lr": 7.322695302944238e-05} +{"train_loss": 0.005268463399261236, "global_step": 25047, "epoch": 210, "lr": 7.32249910562618e-05} +{"train_loss": 0.0037516597658395767, "global_step": 25048, "epoch": 210, "lr": 7.322302903748143e-05} +{"train_loss": 0.0037977430038154125, "global_step": 25049, "epoch": 210, "lr": 7.322106697310512e-05} +{"train_loss": 0.007868953049182892, "global_step": 25050, "epoch": 210, "lr": 7.32191048631367e-05} +{"train_loss": 0.005026771686971188, "global_step": 25051, "epoch": 210, "lr": 7.32171427075801e-05} +{"train_loss": 0.00439680740237236, "global_step": 25052, "epoch": 210, "lr": 7.32151805064391e-05} +{"train_loss": 0.005502599757164717, "global_step": 25053, "epoch": 210, "lr": 7.321321825971757e-05} +{"train_loss": 0.0061379605904221535, "global_step": 25054, "epoch": 210, "lr": 7.321125596741935e-05} +{"train_loss": 0.005424830596894026, "global_step": 25055, "epoch": 210, "lr": 7.320929362954834e-05} +{"train_loss": 0.004999321885406971, "global_step": 25056, "epoch": 210, "lr": 7.320733124610835e-05} +{"train_loss": 0.003943846095353365, "global_step": 25057, "epoch": 210, "lr": 7.320536881710324e-05} +{"train_loss": 0.002669883193448186, "global_step": 25058, "epoch": 210, "lr": 7.320340634253687e-05} +{"train_loss": 0.0032138903625309467, "global_step": 25059, "epoch": 210, "lr": 7.320144382241309e-05} +{"train_loss": 0.0038250964134931564, "global_step": 25060, "epoch": 210, "lr": 7.319948125673574e-05} +{"train_loss": 0.003938769455999136, "global_step": 25061, "epoch": 210, "lr": 7.319751864550871e-05} +{"train_loss": 0.0028291130438447, "global_step": 25062, "epoch": 210, "lr": 7.319555598873582e-05} +{"train_loss": 0.0046173036098480225, "global_step": 25063, "epoch": 210, "lr": 7.319359328642094e-05} +{"train_loss": 0.0044606272131204605, "global_step": 25064, "epoch": 210, "lr": 7.31916305385679e-05} +{"train_loss": 0.004137901589274406, "global_step": 25065, "epoch": 210, "lr": 7.31896677451806e-05} +{"train_loss": 0.005537340417504311, "global_step": 25066, "epoch": 210, "lr": 7.318770490626284e-05} +{"train_loss": 0.0035294604022055864, "global_step": 25067, "epoch": 210, "lr": 7.31857420218185e-05} +{"train_loss": 0.0033867310266941786, "global_step": 25068, "epoch": 210, "lr": 7.318377909185144e-05} +{"train_loss": 0.007531492039561272, "global_step": 25069, "epoch": 210, "lr": 7.31818161163655e-05} +{"train_loss": 0.003359951311722398, "global_step": 25070, "epoch": 210, "lr": 7.317985309536456e-05} +{"train_loss": 0.002137946430593729, "global_step": 25071, "epoch": 210, "lr": 7.317789002885244e-05} +{"train_loss": 0.005872513633221388, "global_step": 25072, "epoch": 210, "lr": 7.3175926916833e-05} +{"train_loss": 0.002355564385652542, "global_step": 25073, "epoch": 210, "lr": 7.317396375931012e-05} +{"train_loss": 0.00563292670994997, "global_step": 25074, "epoch": 210, "lr": 7.317200055628764e-05} +{"train_loss": 0.00674474285915494, "global_step": 25075, "epoch": 210, "lr": 7.317003730776939e-05} +{"train_loss": 0.0022873966954648495, "global_step": 25076, "epoch": 210, "lr": 7.316807401375927e-05} +{"train_loss": 0.0031544731464236975, "global_step": 25077, "epoch": 210, "lr": 7.316611067426111e-05} +{"train_loss": 0.004066568333655596, "global_step": 25078, "epoch": 210, "lr": 7.316414728927875e-05} +{"train_loss": 0.005072506610304117, "global_step": 25079, "epoch": 210, "lr": 7.316218385881607e-05} +{"train_loss": 0.004121797624975443, "global_step": 25080, "epoch": 210, "lr": 7.316022038287692e-05} +{"train_loss": 0.00509331189095974, "global_step": 25081, "epoch": 210, "lr": 7.315825686146514e-05} +{"train_loss": 0.004001175984740257, "global_step": 25082, "epoch": 210, "lr": 7.315629329458461e-05} +{"train_loss": 0.004935281816869974, "global_step": 25083, "epoch": 210, "lr": 7.315432968223916e-05} +{"train_loss": 0.004887023940682411, "global_step": 25084, "epoch": 210, "lr": 7.315236602443267e-05} +{"train_loss": 0.004428834188729525, "global_step": 25085, "epoch": 210, "lr": 7.315040232116899e-05} +{"train_loss": 0.0035770947579294443, "global_step": 25086, "epoch": 210, "lr": 7.314843857245195e-05} +{"train_loss": 0.0063154990784823895, "global_step": 25087, "epoch": 210, "lr": 7.314647477828542e-05} +{"train_loss": 0.005583429709076881, "global_step": 25088, "epoch": 210, "lr": 7.314451093867328e-05} +{"train_loss": 0.004369640722870827, "global_step": 25089, "epoch": 210, "lr": 7.314254705361936e-05} +{"train_loss": 0.00383473327383399, "global_step": 25090, "epoch": 210, "lr": 7.314058312312751e-05} +{"train_loss": 0.0029530569445341825, "global_step": 25091, "epoch": 210, "lr": 7.31386191472016e-05} +{"train_loss": 0.004540521651506424, "global_step": 25092, "epoch": 210, "lr": 7.313665512584548e-05} +{"train_loss": 0.0046887993812561035, "global_step": 25093, "epoch": 210, "lr": 7.313469105906304e-05} +{"train_loss": 0.00471622496843338, "global_step": 25094, "epoch": 210, "lr": 7.313272694685806e-05} +{"train_loss": 0.004601148888468742, "global_step": 25095, "epoch": 210, "lr": 7.313076278923449e-05} +{"train_loss": 0.006424422841519117, "global_step": 25096, "epoch": 210, "lr": 7.31287985861961e-05} +{"train_loss": 0.003705509239807725, "global_step": 25097, "epoch": 210, "lr": 7.31268343377468e-05} +{"train_loss": 0.004734208341687918, "global_step": 25098, "epoch": 210, "lr": 7.312487004389043e-05} +{"train_loss": 0.0037943185307085514, "global_step": 25099, "epoch": 210, "lr": 7.312290570463084e-05} +{"train_loss": 0.004309019539505243, "global_step": 25100, "epoch": 210, "lr": 7.312094131997189e-05} +{"train_loss": 0.0037110066041350365, "global_step": 25101, "epoch": 210, "lr": 7.311897688991747e-05} +{"train_loss": 0.004348103888332844, "global_step": 25102, "epoch": 210, "lr": 7.31170124144714e-05} +{"train_loss": 0.005262560211122036, "global_step": 25103, "epoch": 210, "lr": 7.311504789363754e-05} +{"train_loss": 0.0030258905608206987, "global_step": 25104, "epoch": 210, "lr": 7.311308332741974e-05} +{"train_loss": 0.0028510293923318386, "global_step": 25105, "epoch": 210, "lr": 7.311111871582188e-05} +{"train_loss": 0.002748085418716073, "global_step": 25106, "epoch": 210, "lr": 7.310915405884781e-05} +{"train_loss": 0.004855690058320761, "global_step": 25107, "epoch": 210, "lr": 7.310718935650139e-05} +{"train_loss": 0.0044226919656948135, "global_step": 25108, "epoch": 210, "lr": 7.310522460878647e-05, "val_loss": 0.023002969101071358, "train_action_mse_error": 9.281963866669685e-05} +{"train_loss": 0.005356871988624334, "global_step": 25109, "epoch": 211, "lr": 7.310325981570691e-05} +{"train_loss": 0.005113980732858181, "global_step": 25110, "epoch": 211, "lr": 7.310129497726656e-05} +{"train_loss": 0.003516351105645299, "global_step": 25111, "epoch": 211, "lr": 7.309933009346928e-05} +{"train_loss": 0.0035657091066241264, "global_step": 25112, "epoch": 211, "lr": 7.309736516431896e-05} +{"train_loss": 0.0031502980273216963, "global_step": 25113, "epoch": 211, "lr": 7.30954001898194e-05} +{"train_loss": 0.0034174490720033646, "global_step": 25114, "epoch": 211, "lr": 7.30934351699745e-05} +{"train_loss": 0.003748163115233183, "global_step": 25115, "epoch": 211, "lr": 7.309147010478811e-05} +{"train_loss": 0.00589267211034894, "global_step": 25116, "epoch": 211, "lr": 7.308950499426407e-05} +{"train_loss": 0.0038340261671692133, "global_step": 25117, "epoch": 211, "lr": 7.308753983840628e-05} +{"train_loss": 0.002783494535833597, "global_step": 25118, "epoch": 211, "lr": 7.308557463721857e-05} +{"train_loss": 0.003122440306469798, "global_step": 25119, "epoch": 211, "lr": 7.308360939070479e-05} +{"train_loss": 0.003438397077843547, "global_step": 25120, "epoch": 211, "lr": 7.308164409886882e-05} +{"train_loss": 0.0035439389757812023, "global_step": 25121, "epoch": 211, "lr": 7.307967876171449e-05} +{"train_loss": 0.00567222572863102, "global_step": 25122, "epoch": 211, "lr": 7.307771337924568e-05} +{"train_loss": 0.003007245948538184, "global_step": 25123, "epoch": 211, "lr": 7.307574795146625e-05} +{"train_loss": 0.004327541217207909, "global_step": 25124, "epoch": 211, "lr": 7.307378247838006e-05} +{"train_loss": 0.006938904523849487, "global_step": 25125, "epoch": 211, "lr": 7.307181695999095e-05} +{"train_loss": 0.0034549471456557512, "global_step": 25126, "epoch": 211, "lr": 7.306985139630281e-05} +{"train_loss": 0.0033218590542674065, "global_step": 25127, "epoch": 211, "lr": 7.306788578731947e-05} +{"train_loss": 0.004576236009597778, "global_step": 25128, "epoch": 211, "lr": 7.306592013304481e-05} +{"train_loss": 0.004829154349863529, "global_step": 25129, "epoch": 211, "lr": 7.306395443348266e-05} +{"train_loss": 0.005942036397755146, "global_step": 25130, "epoch": 211, "lr": 7.306198868863691e-05} +{"train_loss": 0.0031539457850158215, "global_step": 25131, "epoch": 211, "lr": 7.306002289851141e-05} +{"train_loss": 0.005933205131441355, "global_step": 25132, "epoch": 211, "lr": 7.305805706311002e-05} +{"train_loss": 0.003190572140738368, "global_step": 25133, "epoch": 211, "lr": 7.30560911824366e-05} +{"train_loss": 0.005289018619805574, "global_step": 25134, "epoch": 211, "lr": 7.3054125256495e-05} +{"train_loss": 0.005074303597211838, "global_step": 25135, "epoch": 211, "lr": 7.30521592852891e-05} +{"train_loss": 0.005401282571256161, "global_step": 25136, "epoch": 211, "lr": 7.305019326882274e-05} +{"train_loss": 0.0027046434115618467, "global_step": 25137, "epoch": 211, "lr": 7.304822720709978e-05} +{"train_loss": 0.00390000082552433, "global_step": 25138, "epoch": 211, "lr": 7.304626110012411e-05} +{"train_loss": 0.002816187683492899, "global_step": 25139, "epoch": 211, "lr": 7.304429494789956e-05} +{"train_loss": 0.0037262984551489353, "global_step": 25140, "epoch": 211, "lr": 7.304232875042999e-05} +{"train_loss": 0.002511372324079275, "global_step": 25141, "epoch": 211, "lr": 7.304036250771927e-05} +{"train_loss": 0.0047874148003757, "global_step": 25142, "epoch": 211, "lr": 7.303839621977127e-05} +{"train_loss": 0.004602345172315836, "global_step": 25143, "epoch": 211, "lr": 7.303642988658984e-05} +{"train_loss": 0.004565717186778784, "global_step": 25144, "epoch": 211, "lr": 7.303446350817883e-05} +{"train_loss": 0.0022727474570274353, "global_step": 25145, "epoch": 211, "lr": 7.303249708454212e-05} +{"train_loss": 0.004814308136701584, "global_step": 25146, "epoch": 211, "lr": 7.303053061568356e-05} +{"train_loss": 0.0030294458847492933, "global_step": 25147, "epoch": 211, "lr": 7.302856410160701e-05} +{"train_loss": 0.004636459052562714, "global_step": 25148, "epoch": 211, "lr": 7.302659754231633e-05} +{"train_loss": 0.003006340702995658, "global_step": 25149, "epoch": 211, "lr": 7.302463093781539e-05} +{"train_loss": 0.004476884845644236, "global_step": 25150, "epoch": 211, "lr": 7.302266428810806e-05} +{"train_loss": 0.0037269582971930504, "global_step": 25151, "epoch": 211, "lr": 7.302069759319819e-05} +{"train_loss": 0.0042884559370577335, "global_step": 25152, "epoch": 211, "lr": 7.301873085308962e-05} +{"train_loss": 0.006544487085193396, "global_step": 25153, "epoch": 211, "lr": 7.301676406778623e-05} +{"train_loss": 0.004968944471329451, "global_step": 25154, "epoch": 211, "lr": 7.301479723729189e-05} +{"train_loss": 0.005983658600598574, "global_step": 25155, "epoch": 211, "lr": 7.301283036161046e-05} +{"train_loss": 0.0039006576407700777, "global_step": 25156, "epoch": 211, "lr": 7.301086344074579e-05} +{"train_loss": 0.004313215147703886, "global_step": 25157, "epoch": 211, "lr": 7.300889647470177e-05} +{"train_loss": 0.0032163735013455153, "global_step": 25158, "epoch": 211, "lr": 7.300692946348223e-05} +{"train_loss": 0.007561790756881237, "global_step": 25159, "epoch": 211, "lr": 7.300496240709101e-05} +{"train_loss": 0.0038809534162282944, "global_step": 25160, "epoch": 211, "lr": 7.300299530553203e-05} +{"train_loss": 0.0031530556734651327, "global_step": 25161, "epoch": 211, "lr": 7.300102815880912e-05} +{"train_loss": 0.005294735077768564, "global_step": 25162, "epoch": 211, "lr": 7.299906096692615e-05} +{"train_loss": 0.00375362578779459, "global_step": 25163, "epoch": 211, "lr": 7.299709372988699e-05} +{"train_loss": 0.004405190236866474, "global_step": 25164, "epoch": 211, "lr": 7.299512644769548e-05} +{"train_loss": 0.004440534394234419, "global_step": 25165, "epoch": 211, "lr": 7.29931591203555e-05} +{"train_loss": 0.0044359443709254265, "global_step": 25166, "epoch": 211, "lr": 7.299119174787091e-05} +{"train_loss": 0.004565490409731865, "global_step": 25167, "epoch": 211, "lr": 7.298922433024557e-05} +{"train_loss": 0.004958875477313995, "global_step": 25168, "epoch": 211, "lr": 7.298725686748335e-05} +{"train_loss": 0.004261855036020279, "global_step": 25169, "epoch": 211, "lr": 7.298528935958811e-05} +{"train_loss": 0.0037609334103763103, "global_step": 25170, "epoch": 211, "lr": 7.298332180656371e-05} +{"train_loss": 0.003717961721122265, "global_step": 25171, "epoch": 211, "lr": 7.2981354208414e-05} +{"train_loss": 0.004947898909449577, "global_step": 25172, "epoch": 211, "lr": 7.297938656514286e-05} +{"train_loss": 0.003407035954296589, "global_step": 25173, "epoch": 211, "lr": 7.297741887675415e-05} +{"train_loss": 0.004235033877193928, "global_step": 25174, "epoch": 211, "lr": 7.297545114325173e-05} +{"train_loss": 0.00311340787447989, "global_step": 25175, "epoch": 211, "lr": 7.297348336463947e-05} +{"train_loss": 0.006240622606128454, "global_step": 25176, "epoch": 211, "lr": 7.297151554092125e-05} +{"train_loss": 0.004103595856577158, "global_step": 25177, "epoch": 211, "lr": 7.296954767210088e-05} +{"train_loss": 0.006483785342425108, "global_step": 25178, "epoch": 211, "lr": 7.296757975818227e-05} +{"train_loss": 0.003406965173780918, "global_step": 25179, "epoch": 211, "lr": 7.296561179916927e-05} +{"train_loss": 0.005338524002581835, "global_step": 25180, "epoch": 211, "lr": 7.296364379506575e-05} +{"train_loss": 0.003190875519067049, "global_step": 25181, "epoch": 211, "lr": 7.296167574587555e-05} +{"train_loss": 0.004579587373882532, "global_step": 25182, "epoch": 211, "lr": 7.295970765160258e-05} +{"train_loss": 0.0054359836503863335, "global_step": 25183, "epoch": 211, "lr": 7.295773951225067e-05} +{"train_loss": 0.0037863613106310368, "global_step": 25184, "epoch": 211, "lr": 7.295577132782367e-05} +{"train_loss": 0.004062858410179615, "global_step": 25185, "epoch": 211, "lr": 7.295380309832549e-05} +{"train_loss": 0.004044156055897474, "global_step": 25186, "epoch": 211, "lr": 7.295183482375995e-05} +{"train_loss": 0.005617182236164808, "global_step": 25187, "epoch": 211, "lr": 7.294986650413095e-05} +{"train_loss": 0.0037685923743993044, "global_step": 25188, "epoch": 211, "lr": 7.294789813944234e-05} +{"train_loss": 0.004847473464906216, "global_step": 25189, "epoch": 211, "lr": 7.294592972969799e-05} +{"train_loss": 0.004310415592044592, "global_step": 25190, "epoch": 211, "lr": 7.294396127490174e-05} +{"train_loss": 0.003997868858277798, "global_step": 25191, "epoch": 211, "lr": 7.294199277505748e-05} +{"train_loss": 0.003973348066210747, "global_step": 25192, "epoch": 211, "lr": 7.294002423016906e-05} +{"train_loss": 0.0034637844655662775, "global_step": 25193, "epoch": 211, "lr": 7.293805564024037e-05} +{"train_loss": 0.004518991336226463, "global_step": 25194, "epoch": 211, "lr": 7.293608700527524e-05} +{"train_loss": 0.006073851604014635, "global_step": 25195, "epoch": 211, "lr": 7.293411832527757e-05} +{"train_loss": 0.005401098169386387, "global_step": 25196, "epoch": 211, "lr": 7.293214960025119e-05} +{"train_loss": 0.003945232834666967, "global_step": 25197, "epoch": 211, "lr": 7.29301808302e-05} +{"train_loss": 0.0030426764860749245, "global_step": 25198, "epoch": 211, "lr": 7.292821201512784e-05} +{"train_loss": 0.005379734560847282, "global_step": 25199, "epoch": 211, "lr": 7.29262431550386e-05} +{"train_loss": 0.0024074031971395016, "global_step": 25200, "epoch": 211, "lr": 7.292427424993611e-05} +{"train_loss": 0.0056471023708581924, "global_step": 25201, "epoch": 211, "lr": 7.292230529982428e-05} +{"train_loss": 0.004290313925594091, "global_step": 25202, "epoch": 211, "lr": 7.292033630470694e-05} +{"train_loss": 0.0034644503612071276, "global_step": 25203, "epoch": 211, "lr": 7.291836726458796e-05} +{"train_loss": 0.004820041358470917, "global_step": 25204, "epoch": 211, "lr": 7.291639817947122e-05} +{"train_loss": 0.0036110698711127043, "global_step": 25205, "epoch": 211, "lr": 7.291442904936059e-05} +{"train_loss": 0.004652101080864668, "global_step": 25206, "epoch": 211, "lr": 7.291245987425992e-05} +{"train_loss": 0.0027178709860891104, "global_step": 25207, "epoch": 211, "lr": 7.291049065417308e-05} +{"train_loss": 0.006414675619453192, "global_step": 25208, "epoch": 211, "lr": 7.290852138910396e-05} +{"train_loss": 0.0025327166076749563, "global_step": 25209, "epoch": 211, "lr": 7.290655207905639e-05} +{"train_loss": 0.00420259777456522, "global_step": 25210, "epoch": 211, "lr": 7.290458272403425e-05} +{"train_loss": 0.004530608654022217, "global_step": 25211, "epoch": 211, "lr": 7.29026133240414e-05} +{"train_loss": 0.0025837491266429424, "global_step": 25212, "epoch": 211, "lr": 7.290064387908172e-05} +{"train_loss": 0.006704979110509157, "global_step": 25213, "epoch": 211, "lr": 7.289867438915908e-05} +{"train_loss": 0.003142264671623707, "global_step": 25214, "epoch": 211, "lr": 7.289670485427734e-05} +{"train_loss": 0.0030720618087798357, "global_step": 25215, "epoch": 211, "lr": 7.289473527444036e-05} +{"train_loss": 0.004097737371921539, "global_step": 25216, "epoch": 211, "lr": 7.289276564965202e-05} +{"train_loss": 0.0029422955121845007, "global_step": 25217, "epoch": 211, "lr": 7.289079597991618e-05} +{"train_loss": 0.0049305204302072525, "global_step": 25218, "epoch": 211, "lr": 7.288882626523669e-05} +{"train_loss": 0.0031068038661032915, "global_step": 25219, "epoch": 211, "lr": 7.288685650561744e-05} +{"train_loss": 0.005046968348324299, "global_step": 25220, "epoch": 211, "lr": 7.288488670106232e-05} +{"train_loss": 0.004387463442981243, "global_step": 25221, "epoch": 211, "lr": 7.288291685157514e-05} +{"train_loss": 0.0035448167473077774, "global_step": 25222, "epoch": 211, "lr": 7.288094695715982e-05} +{"train_loss": 0.004279581364244223, "global_step": 25223, "epoch": 211, "lr": 7.287897701782018e-05} +{"train_loss": 0.0037399730645120144, "global_step": 25224, "epoch": 211, "lr": 7.287700703356014e-05} +{"train_loss": 0.004649297334253788, "global_step": 25225, "epoch": 211, "lr": 7.287503700438352e-05} +{"train_loss": 0.0036943433806300163, "global_step": 25226, "epoch": 211, "lr": 7.287306693029422e-05} +{"train_loss": 0.004252993396068571, "global_step": 25227, "epoch": 211, "lr": 7.28710968112961e-05, "val_loss": 0.04221075400710106} +{"train_loss": 0.0013733032392337918, "global_step": 25228, "epoch": 212, "lr": 7.286912664739301e-05} +{"train_loss": 0.005107910837978125, "global_step": 25229, "epoch": 212, "lr": 7.286715643858884e-05} +{"train_loss": 0.007369956932961941, "global_step": 25230, "epoch": 212, "lr": 7.286518618488744e-05} +{"train_loss": 0.002345422748476267, "global_step": 25231, "epoch": 212, "lr": 7.28632158862927e-05} +{"train_loss": 0.004980625584721565, "global_step": 25232, "epoch": 212, "lr": 7.286124554280849e-05} +{"train_loss": 0.004148859065026045, "global_step": 25233, "epoch": 212, "lr": 7.285927515443865e-05} +{"train_loss": 0.0042864419519901276, "global_step": 25234, "epoch": 212, "lr": 7.285730472118707e-05} +{"train_loss": 0.0045790174044668674, "global_step": 25235, "epoch": 212, "lr": 7.285533424305762e-05} +{"train_loss": 0.004913290962576866, "global_step": 25236, "epoch": 212, "lr": 7.285336372005416e-05} +{"train_loss": 0.004811498802155256, "global_step": 25237, "epoch": 212, "lr": 7.285139315218054e-05} +{"train_loss": 0.00405656173825264, "global_step": 25238, "epoch": 212, "lr": 7.284942253944069e-05} +{"train_loss": 0.004044807981699705, "global_step": 25239, "epoch": 212, "lr": 7.284745188183843e-05} +{"train_loss": 0.002839685883373022, "global_step": 25240, "epoch": 212, "lr": 7.284548117937762e-05} +{"train_loss": 0.004952374380081892, "global_step": 25241, "epoch": 212, "lr": 7.284351043206217e-05} +{"train_loss": 0.002098191762343049, "global_step": 25242, "epoch": 212, "lr": 7.284153963989591e-05} +{"train_loss": 0.005365333985537291, "global_step": 25243, "epoch": 212, "lr": 7.283956880288274e-05} +{"train_loss": 0.006470121908932924, "global_step": 25244, "epoch": 212, "lr": 7.28375979210265e-05} +{"train_loss": 0.002773323329165578, "global_step": 25245, "epoch": 212, "lr": 7.283562699433109e-05} +{"train_loss": 0.00476225558668375, "global_step": 25246, "epoch": 212, "lr": 7.283365602280036e-05} +{"train_loss": 0.004113524686545134, "global_step": 25247, "epoch": 212, "lr": 7.283168500643818e-05} +{"train_loss": 0.0036901591811329126, "global_step": 25248, "epoch": 212, "lr": 7.282971394524844e-05} +{"train_loss": 0.0035125501453876495, "global_step": 25249, "epoch": 212, "lr": 7.282774283923499e-05} +{"train_loss": 0.00483236787840724, "global_step": 25250, "epoch": 212, "lr": 7.28257716884017e-05} +{"train_loss": 0.0032602634746581316, "global_step": 25251, "epoch": 212, "lr": 7.282380049275246e-05} +{"train_loss": 0.0019761540461331606, "global_step": 25252, "epoch": 212, "lr": 7.282182925229112e-05} +{"train_loss": 0.002823186805471778, "global_step": 25253, "epoch": 212, "lr": 7.281985796702156e-05} +{"train_loss": 0.003653808729723096, "global_step": 25254, "epoch": 212, "lr": 7.281788663694764e-05} +{"train_loss": 0.0024060613941401243, "global_step": 25255, "epoch": 212, "lr": 7.281591526207323e-05} +{"train_loss": 0.004530265461653471, "global_step": 25256, "epoch": 212, "lr": 7.28139438424022e-05} +{"train_loss": 0.0037046708166599274, "global_step": 25257, "epoch": 212, "lr": 7.281197237793847e-05} +{"train_loss": 0.004084172658622265, "global_step": 25258, "epoch": 212, "lr": 7.281000086868584e-05} +{"train_loss": 0.006305166985839605, "global_step": 25259, "epoch": 212, "lr": 7.280802931464821e-05} +{"train_loss": 0.0036556844133883715, "global_step": 25260, "epoch": 212, "lr": 7.280605771582945e-05} +{"train_loss": 0.004129457753151655, "global_step": 25261, "epoch": 212, "lr": 7.280408607223345e-05} +{"train_loss": 0.0023975723888725042, "global_step": 25262, "epoch": 212, "lr": 7.280211438386405e-05} +{"train_loss": 0.004859849810600281, "global_step": 25263, "epoch": 212, "lr": 7.280014265072513e-05} +{"train_loss": 0.003914134576916695, "global_step": 25264, "epoch": 212, "lr": 7.279817087282058e-05} +{"train_loss": 0.0022223456762731075, "global_step": 25265, "epoch": 212, "lr": 7.279619905015423e-05} +{"train_loss": 0.0038263651076704264, "global_step": 25266, "epoch": 212, "lr": 7.279422718273e-05} +{"train_loss": 0.005349988117814064, "global_step": 25267, "epoch": 212, "lr": 7.279225527055173e-05} +{"train_loss": 0.0042921691201627254, "global_step": 25268, "epoch": 212, "lr": 7.279028331362331e-05} +{"train_loss": 0.005042197648435831, "global_step": 25269, "epoch": 212, "lr": 7.278831131194861e-05} +{"train_loss": 0.0044894590973854065, "global_step": 25270, "epoch": 212, "lr": 7.278633926553148e-05} +{"train_loss": 0.003655278356745839, "global_step": 25271, "epoch": 212, "lr": 7.278436717437582e-05} +{"train_loss": 0.002929981332272291, "global_step": 25272, "epoch": 212, "lr": 7.278239503848548e-05} +{"train_loss": 0.006358062848448753, "global_step": 25273, "epoch": 212, "lr": 7.278042285786436e-05} +{"train_loss": 0.0031991852447390556, "global_step": 25274, "epoch": 212, "lr": 7.277845063251629e-05} +{"train_loss": 0.0032501642126590014, "global_step": 25275, "epoch": 212, "lr": 7.277647836244516e-05} +{"train_loss": 0.003255414078012109, "global_step": 25276, "epoch": 212, "lr": 7.277450604765488e-05} +{"train_loss": 0.005245661828666925, "global_step": 25277, "epoch": 212, "lr": 7.277253368814927e-05} +{"train_loss": 0.0031822246965020895, "global_step": 25278, "epoch": 212, "lr": 7.277056128393222e-05} +{"train_loss": 0.0048708803951740265, "global_step": 25279, "epoch": 212, "lr": 7.276858883500761e-05} +{"train_loss": 0.0037914335262030363, "global_step": 25280, "epoch": 212, "lr": 7.276661634137932e-05} +{"train_loss": 0.004949457943439484, "global_step": 25281, "epoch": 212, "lr": 7.276464380305119e-05} +{"train_loss": 0.003775373101234436, "global_step": 25282, "epoch": 212, "lr": 7.276267122002712e-05} +{"train_loss": 0.0045129950158298016, "global_step": 25283, "epoch": 212, "lr": 7.276069859231098e-05} +{"train_loss": 0.004723517689853907, "global_step": 25284, "epoch": 212, "lr": 7.275872591990665e-05} +{"train_loss": 0.0038394650910049677, "global_step": 25285, "epoch": 212, "lr": 7.275675320281798e-05} +{"train_loss": 0.003553831484168768, "global_step": 25286, "epoch": 212, "lr": 7.275478044104887e-05} +{"train_loss": 0.005735547281801701, "global_step": 25287, "epoch": 212, "lr": 7.275280763460315e-05} +{"train_loss": 0.00438270065933466, "global_step": 25288, "epoch": 212, "lr": 7.275083478348476e-05} +{"train_loss": 0.005390515550971031, "global_step": 25289, "epoch": 212, "lr": 7.274886188769751e-05} +{"train_loss": 0.005633252207189798, "global_step": 25290, "epoch": 212, "lr": 7.274688894724532e-05} +{"train_loss": 0.007669608108699322, "global_step": 25291, "epoch": 212, "lr": 7.274491596213204e-05} +{"train_loss": 0.004214500077068806, "global_step": 25292, "epoch": 212, "lr": 7.274294293236153e-05} +{"train_loss": 0.003724901471287012, "global_step": 25293, "epoch": 212, "lr": 7.27409698579377e-05} +{"train_loss": 0.00519416481256485, "global_step": 25294, "epoch": 212, "lr": 7.27389967388644e-05} +{"train_loss": 0.004979236051440239, "global_step": 25295, "epoch": 212, "lr": 7.273702357514549e-05} +{"train_loss": 0.005844390485435724, "global_step": 25296, "epoch": 212, "lr": 7.273505036678488e-05} +{"train_loss": 0.0036656123120337725, "global_step": 25297, "epoch": 212, "lr": 7.273307711378644e-05} +{"train_loss": 0.005931006278842688, "global_step": 25298, "epoch": 212, "lr": 7.273110381615402e-05} +{"train_loss": 0.00437223631888628, "global_step": 25299, "epoch": 212, "lr": 7.27291304738915e-05} +{"train_loss": 0.00561636732891202, "global_step": 25300, "epoch": 212, "lr": 7.272715708700276e-05} +{"train_loss": 0.0062080551870167255, "global_step": 25301, "epoch": 212, "lr": 7.272518365549169e-05} +{"train_loss": 0.004966226406395435, "global_step": 25302, "epoch": 212, "lr": 7.272321017936214e-05} +{"train_loss": 0.006172981578856707, "global_step": 25303, "epoch": 212, "lr": 7.272123665861799e-05} +{"train_loss": 0.003945635166019201, "global_step": 25304, "epoch": 212, "lr": 7.271926309326312e-05} +{"train_loss": 0.00378641439601779, "global_step": 25305, "epoch": 212, "lr": 7.271728948330141e-05} +{"train_loss": 0.0021295109763741493, "global_step": 25306, "epoch": 212, "lr": 7.271531582873672e-05} +{"train_loss": 0.005105762742459774, "global_step": 25307, "epoch": 212, "lr": 7.271334212957294e-05} +{"train_loss": 0.0037373327650129795, "global_step": 25308, "epoch": 212, "lr": 7.271136838581396e-05} +{"train_loss": 0.0036733285523951054, "global_step": 25309, "epoch": 212, "lr": 7.270939459746362e-05} +{"train_loss": 0.0031807138584554195, "global_step": 25310, "epoch": 212, "lr": 7.270742076452581e-05} +{"train_loss": 0.005254786927253008, "global_step": 25311, "epoch": 212, "lr": 7.270544688700439e-05} +{"train_loss": 0.00420392444357276, "global_step": 25312, "epoch": 212, "lr": 7.270347296490326e-05} +{"train_loss": 0.003398934844881296, "global_step": 25313, "epoch": 212, "lr": 7.270149899822629e-05} +{"train_loss": 0.007313036359846592, "global_step": 25314, "epoch": 212, "lr": 7.269952498697734e-05} +{"train_loss": 0.003518933430314064, "global_step": 25315, "epoch": 212, "lr": 7.269755093116031e-05} +{"train_loss": 0.0032687161583453417, "global_step": 25316, "epoch": 212, "lr": 7.269557683077906e-05} +{"train_loss": 0.004018133040517569, "global_step": 25317, "epoch": 212, "lr": 7.269360268583746e-05} +{"train_loss": 0.006463396828621626, "global_step": 25318, "epoch": 212, "lr": 7.269162849633942e-05} +{"train_loss": 0.0035990416072309017, "global_step": 25319, "epoch": 212, "lr": 7.268965426228878e-05} +{"train_loss": 0.004746398888528347, "global_step": 25320, "epoch": 212, "lr": 7.268767998368942e-05} +{"train_loss": 0.00424246396869421, "global_step": 25321, "epoch": 212, "lr": 7.268570566054523e-05} +{"train_loss": 0.0029675480909645557, "global_step": 25322, "epoch": 212, "lr": 7.268373129286008e-05} +{"train_loss": 0.005286307539790869, "global_step": 25323, "epoch": 212, "lr": 7.268175688063785e-05} +{"train_loss": 0.00354190357029438, "global_step": 25324, "epoch": 212, "lr": 7.267978242388241e-05} +{"train_loss": 0.004959366284310818, "global_step": 25325, "epoch": 212, "lr": 7.267780792259763e-05} +{"train_loss": 0.002543788403272629, "global_step": 25326, "epoch": 212, "lr": 7.267583337678742e-05} +{"train_loss": 0.005166737362742424, "global_step": 25327, "epoch": 212, "lr": 7.267385878645563e-05} +{"train_loss": 0.0022678598761558533, "global_step": 25328, "epoch": 212, "lr": 7.267188415160613e-05} +{"train_loss": 0.00327878980897367, "global_step": 25329, "epoch": 212, "lr": 7.26699094722428e-05} +{"train_loss": 0.005173377692699432, "global_step": 25330, "epoch": 212, "lr": 7.266793474836954e-05} +{"train_loss": 0.0038120339158922434, "global_step": 25331, "epoch": 212, "lr": 7.26659599799902e-05} +{"train_loss": 0.0071595776826143265, "global_step": 25332, "epoch": 212, "lr": 7.266398516710868e-05} +{"train_loss": 0.002434560563415289, "global_step": 25333, "epoch": 212, "lr": 7.266201030972885e-05} +{"train_loss": 0.00533002894371748, "global_step": 25334, "epoch": 212, "lr": 7.266003540785457e-05} +{"train_loss": 0.00218054186552763, "global_step": 25335, "epoch": 212, "lr": 7.265806046148975e-05} +{"train_loss": 0.004357147961854935, "global_step": 25336, "epoch": 212, "lr": 7.265608547063822e-05} +{"train_loss": 0.003481182735413313, "global_step": 25337, "epoch": 212, "lr": 7.26541104353039e-05} +{"train_loss": 0.0027769464068114758, "global_step": 25338, "epoch": 212, "lr": 7.265213535549066e-05} +{"train_loss": 0.002694106660783291, "global_step": 25339, "epoch": 212, "lr": 7.265016023120237e-05} +{"train_loss": 0.003505165223032236, "global_step": 25340, "epoch": 212, "lr": 7.264818506244292e-05} +{"train_loss": 0.0037887785583734512, "global_step": 25341, "epoch": 212, "lr": 7.264620984921616e-05} +{"train_loss": 0.003327776212245226, "global_step": 25342, "epoch": 212, "lr": 7.2644234591526e-05} +{"train_loss": 0.0032230434007942677, "global_step": 25343, "epoch": 212, "lr": 7.264225928937629e-05} +{"train_loss": 0.004787461366504431, "global_step": 25344, "epoch": 212, "lr": 7.264028394277094e-05} +{"train_loss": 0.0038431943394243717, "global_step": 25345, "epoch": 212, "lr": 7.263830855171379e-05} +{"train_loss": 0.004205987658625578, "global_step": 25346, "epoch": 212, "lr": 7.263633311620877e-05, "val_loss": 0.011947942897677422} +{"train_loss": 0.0032521476969122887, "global_step": 25347, "epoch": 213, "lr": 7.26343576362597e-05} +{"train_loss": 0.003814354771748185, "global_step": 25348, "epoch": 213, "lr": 7.26323821118705e-05} +{"train_loss": 0.003658812493085861, "global_step": 25349, "epoch": 213, "lr": 7.263040654304502e-05} +{"train_loss": 0.006310449447482824, "global_step": 25350, "epoch": 213, "lr": 7.262843092978717e-05} +{"train_loss": 0.00402590399608016, "global_step": 25351, "epoch": 213, "lr": 7.262645527210083e-05} +{"train_loss": 0.003590454114601016, "global_step": 25352, "epoch": 213, "lr": 7.262447956998983e-05} +{"train_loss": 0.005377182271331549, "global_step": 25353, "epoch": 213, "lr": 7.26225038234581e-05} +{"train_loss": 0.0035640287678688765, "global_step": 25354, "epoch": 213, "lr": 7.262052803250949e-05} +{"train_loss": 0.003559528384357691, "global_step": 25355, "epoch": 213, "lr": 7.26185521971479e-05} +{"train_loss": 0.0037044761702418327, "global_step": 25356, "epoch": 213, "lr": 7.26165763173772e-05} +{"train_loss": 0.005188626237213612, "global_step": 25357, "epoch": 213, "lr": 7.261460039320125e-05} +{"train_loss": 0.005874048452824354, "global_step": 25358, "epoch": 213, "lr": 7.261262442462397e-05} +{"train_loss": 0.004295450635254383, "global_step": 25359, "epoch": 213, "lr": 7.261064841164921e-05} +{"train_loss": 0.0033582181204110384, "global_step": 25360, "epoch": 213, "lr": 7.260867235428086e-05} +{"train_loss": 0.0030552006792277098, "global_step": 25361, "epoch": 213, "lr": 7.26066962525228e-05} +{"train_loss": 0.004026318900287151, "global_step": 25362, "epoch": 213, "lr": 7.26047201063789e-05} +{"train_loss": 0.0040963441133499146, "global_step": 25363, "epoch": 213, "lr": 7.260274391585304e-05} +{"train_loss": 0.003814034629613161, "global_step": 25364, "epoch": 213, "lr": 7.260076768094913e-05} +{"train_loss": 0.004100908525288105, "global_step": 25365, "epoch": 213, "lr": 7.2598791401671e-05} +{"train_loss": 0.0037915899883955717, "global_step": 25366, "epoch": 213, "lr": 7.259681507802257e-05} +{"train_loss": 0.0037609031423926353, "global_step": 25367, "epoch": 213, "lr": 7.259483871000771e-05} +{"train_loss": 0.002772147301584482, "global_step": 25368, "epoch": 213, "lr": 7.25928622976303e-05} +{"train_loss": 0.004754315596073866, "global_step": 25369, "epoch": 213, "lr": 7.259088584089419e-05} +{"train_loss": 0.004953013267368078, "global_step": 25370, "epoch": 213, "lr": 7.258890933980333e-05} +{"train_loss": 0.0025155963376164436, "global_step": 25371, "epoch": 213, "lr": 7.258693279436155e-05} +{"train_loss": 0.0030961281154304743, "global_step": 25372, "epoch": 213, "lr": 7.258495620457272e-05} +{"train_loss": 0.004558509681373835, "global_step": 25373, "epoch": 213, "lr": 7.258297957044076e-05} +{"train_loss": 0.004113830626010895, "global_step": 25374, "epoch": 213, "lr": 7.258100289196953e-05} +{"train_loss": 0.003015699330717325, "global_step": 25375, "epoch": 213, "lr": 7.257902616916292e-05} +{"train_loss": 0.003277695272117853, "global_step": 25376, "epoch": 213, "lr": 7.257704940202478e-05} +{"train_loss": 0.0024869374465197325, "global_step": 25377, "epoch": 213, "lr": 7.257507259055904e-05} +{"train_loss": 0.004210987128317356, "global_step": 25378, "epoch": 213, "lr": 7.257309573476954e-05} +{"train_loss": 0.004367493558675051, "global_step": 25379, "epoch": 213, "lr": 7.257111883466018e-05} +{"train_loss": 0.004600089974701405, "global_step": 25380, "epoch": 213, "lr": 7.256914189023485e-05} +{"train_loss": 0.0031084460206329823, "global_step": 25381, "epoch": 213, "lr": 7.25671649014974e-05} +{"train_loss": 0.0031849981751292944, "global_step": 25382, "epoch": 213, "lr": 7.256518786845176e-05} +{"train_loss": 0.0066963001154363155, "global_step": 25383, "epoch": 213, "lr": 7.256321079110178e-05} +{"train_loss": 0.003308660816401243, "global_step": 25384, "epoch": 213, "lr": 7.256123366945134e-05} +{"train_loss": 0.005220451857894659, "global_step": 25385, "epoch": 213, "lr": 7.255925650350433e-05} +{"train_loss": 0.0054724980145692825, "global_step": 25386, "epoch": 213, "lr": 7.255727929326461e-05} +{"train_loss": 0.004237412475049496, "global_step": 25387, "epoch": 213, "lr": 7.25553020387361e-05} +{"train_loss": 0.003266872139647603, "global_step": 25388, "epoch": 213, "lr": 7.255332473992266e-05} +{"train_loss": 0.00633222283795476, "global_step": 25389, "epoch": 213, "lr": 7.25513473968282e-05} +{"train_loss": 0.003583441488444805, "global_step": 25390, "epoch": 213, "lr": 7.254937000945656e-05} +{"train_loss": 0.007119821850210428, "global_step": 25391, "epoch": 213, "lr": 7.254739257781163e-05} +{"train_loss": 0.004500438924878836, "global_step": 25392, "epoch": 213, "lr": 7.25454151018973e-05} +{"train_loss": 0.0038425964303314686, "global_step": 25393, "epoch": 213, "lr": 7.254343758171748e-05} +{"train_loss": 0.0051324693486094475, "global_step": 25394, "epoch": 213, "lr": 7.254146001727602e-05} +{"train_loss": 0.0033594558481127024, "global_step": 25395, "epoch": 213, "lr": 7.25394824085768e-05} +{"train_loss": 0.004212229512631893, "global_step": 25396, "epoch": 213, "lr": 7.253750475562372e-05} +{"train_loss": 0.0039046399760991335, "global_step": 25397, "epoch": 213, "lr": 7.253552705842067e-05} +{"train_loss": 0.005376164801418781, "global_step": 25398, "epoch": 213, "lr": 7.25335493169715e-05} +{"train_loss": 0.005414916202425957, "global_step": 25399, "epoch": 213, "lr": 7.253157153128012e-05} +{"train_loss": 0.004026731010526419, "global_step": 25400, "epoch": 213, "lr": 7.252959370135042e-05} +{"train_loss": 0.005964423064142466, "global_step": 25401, "epoch": 213, "lr": 7.252761582718626e-05} +{"train_loss": 0.0056107197888195515, "global_step": 25402, "epoch": 213, "lr": 7.252563790879153e-05} +{"train_loss": 0.006275226827710867, "global_step": 25403, "epoch": 213, "lr": 7.252365994617012e-05} +{"train_loss": 0.0031142556108534336, "global_step": 25404, "epoch": 213, "lr": 7.252168193932591e-05} +{"train_loss": 0.004010483156889677, "global_step": 25405, "epoch": 213, "lr": 7.251970388826278e-05} +{"train_loss": 0.0032977203372865915, "global_step": 25406, "epoch": 213, "lr": 7.251772579298462e-05} +{"train_loss": 0.004641285631805658, "global_step": 25407, "epoch": 213, "lr": 7.251574765349531e-05} +{"train_loss": 0.004015217535197735, "global_step": 25408, "epoch": 213, "lr": 7.251376946979874e-05} +{"train_loss": 0.006352790165692568, "global_step": 25409, "epoch": 213, "lr": 7.25117912418988e-05} +{"train_loss": 0.004517237655818462, "global_step": 25410, "epoch": 213, "lr": 7.250981296979934e-05} +{"train_loss": 0.004213299602270126, "global_step": 25411, "epoch": 213, "lr": 7.250783465350427e-05} +{"train_loss": 0.004966428503394127, "global_step": 25412, "epoch": 213, "lr": 7.250585629301747e-05} +{"train_loss": 0.005034583620727062, "global_step": 25413, "epoch": 213, "lr": 7.250387788834282e-05} +{"train_loss": 0.0052619557827711105, "global_step": 25414, "epoch": 213, "lr": 7.250189943948424e-05} +{"train_loss": 0.004480214789509773, "global_step": 25415, "epoch": 213, "lr": 7.249992094644557e-05} +{"train_loss": 0.0035893339663743973, "global_step": 25416, "epoch": 213, "lr": 7.249794240923068e-05} +{"train_loss": 0.004738651216030121, "global_step": 25417, "epoch": 213, "lr": 7.249596382784352e-05} +{"train_loss": 0.00540090911090374, "global_step": 25418, "epoch": 213, "lr": 7.249398520228793e-05} +{"train_loss": 0.0040634493343532085, "global_step": 25419, "epoch": 213, "lr": 7.24920065325678e-05} +{"train_loss": 0.0019808891229331493, "global_step": 25420, "epoch": 213, "lr": 7.249002781868703e-05} +{"train_loss": 0.003787495195865631, "global_step": 25421, "epoch": 213, "lr": 7.248804906064948e-05} +{"train_loss": 0.0031198712531477213, "global_step": 25422, "epoch": 213, "lr": 7.248607025845905e-05} +{"train_loss": 0.005112398415803909, "global_step": 25423, "epoch": 213, "lr": 7.248409141211962e-05} +{"train_loss": 0.004809146281331778, "global_step": 25424, "epoch": 213, "lr": 7.248211252163508e-05} +{"train_loss": 0.00420845951884985, "global_step": 25425, "epoch": 213, "lr": 7.248013358700932e-05} +{"train_loss": 0.004351217299699783, "global_step": 25426, "epoch": 213, "lr": 7.24781546082462e-05} +{"train_loss": 0.0034533182624727488, "global_step": 25427, "epoch": 213, "lr": 7.247617558534965e-05} +{"train_loss": 0.004864714574068785, "global_step": 25428, "epoch": 213, "lr": 7.247419651832352e-05} +{"train_loss": 0.0025884658098220825, "global_step": 25429, "epoch": 213, "lr": 7.24722174071717e-05} +{"train_loss": 0.004248037934303284, "global_step": 25430, "epoch": 213, "lr": 7.24702382518981e-05} +{"train_loss": 0.003456812584772706, "global_step": 25431, "epoch": 213, "lr": 7.246825905250656e-05} +{"train_loss": 0.004165558610111475, "global_step": 25432, "epoch": 213, "lr": 7.246627980900101e-05} +{"train_loss": 0.005813647992908955, "global_step": 25433, "epoch": 213, "lr": 7.246430052138533e-05} +{"train_loss": 0.002935097087174654, "global_step": 25434, "epoch": 213, "lr": 7.246232118966338e-05} +{"train_loss": 0.004080836195498705, "global_step": 25435, "epoch": 213, "lr": 7.246034181383907e-05} +{"train_loss": 0.004313929472118616, "global_step": 25436, "epoch": 213, "lr": 7.245836239391628e-05} +{"train_loss": 0.006898725870996714, "global_step": 25437, "epoch": 213, "lr": 7.245638292989889e-05} +{"train_loss": 0.006010627374053001, "global_step": 25438, "epoch": 213, "lr": 7.245440342179079e-05} +{"train_loss": 0.005240665748715401, "global_step": 25439, "epoch": 213, "lr": 7.245242386959588e-05} +{"train_loss": 0.003592235269024968, "global_step": 25440, "epoch": 213, "lr": 7.245044427331802e-05} +{"train_loss": 0.0018730885349214077, "global_step": 25441, "epoch": 213, "lr": 7.244846463296112e-05} +{"train_loss": 0.004372869618237019, "global_step": 25442, "epoch": 213, "lr": 7.244648494852905e-05} +{"train_loss": 0.0021257877815514803, "global_step": 25443, "epoch": 213, "lr": 7.24445052200257e-05} +{"train_loss": 0.0017765031661838293, "global_step": 25444, "epoch": 213, "lr": 7.244252544745496e-05} +{"train_loss": 0.0066109346225857735, "global_step": 25445, "epoch": 213, "lr": 7.244054563082075e-05} +{"train_loss": 0.00395103357732296, "global_step": 25446, "epoch": 213, "lr": 7.243856577012689e-05} +{"train_loss": 0.006724645383656025, "global_step": 25447, "epoch": 213, "lr": 7.243658586537731e-05} +{"train_loss": 0.004070522263646126, "global_step": 25448, "epoch": 213, "lr": 7.243460591657591e-05} +{"train_loss": 0.005079540889710188, "global_step": 25449, "epoch": 213, "lr": 7.243262592372655e-05} +{"train_loss": 0.002747011138126254, "global_step": 25450, "epoch": 213, "lr": 7.243064588683312e-05} +{"train_loss": 0.0049577015452086926, "global_step": 25451, "epoch": 213, "lr": 7.242866580589951e-05} +{"train_loss": 0.003540750127285719, "global_step": 25452, "epoch": 213, "lr": 7.242668568092962e-05} +{"train_loss": 0.0026516427751630545, "global_step": 25453, "epoch": 213, "lr": 7.242470551192733e-05} +{"train_loss": 0.003264484228566289, "global_step": 25454, "epoch": 213, "lr": 7.242272529889652e-05} +{"train_loss": 0.005169016309082508, "global_step": 25455, "epoch": 213, "lr": 7.242074504184109e-05} +{"train_loss": 0.003821047954261303, "global_step": 25456, "epoch": 213, "lr": 7.24187647407649e-05} +{"train_loss": 0.0047014011070132256, "global_step": 25457, "epoch": 213, "lr": 7.241678439567189e-05} +{"train_loss": 0.002985841827467084, "global_step": 25458, "epoch": 213, "lr": 7.241480400656592e-05} +{"train_loss": 0.004555881023406982, "global_step": 25459, "epoch": 213, "lr": 7.241282357345086e-05} +{"train_loss": 0.0030948154162615538, "global_step": 25460, "epoch": 213, "lr": 7.241084309633062e-05} +{"train_loss": 0.003830991219729185, "global_step": 25461, "epoch": 213, "lr": 7.240886257520908e-05} +{"train_loss": 0.005308231338858604, "global_step": 25462, "epoch": 213, "lr": 7.240688201009012e-05} +{"train_loss": 0.0032873901072889566, "global_step": 25463, "epoch": 213, "lr": 7.240490140097767e-05} +{"train_loss": 0.0031699752435088158, "global_step": 25464, "epoch": 213, "lr": 7.240292074787558e-05} +{"train_loss": 0.00421460354974603, "global_step": 25465, "epoch": 213, "lr": 7.240094005078775e-05, "val_loss": 0.02681771293282509} +{"train_loss": 0.005034479778259993, "global_step": 25466, "epoch": 214, "lr": 7.239895930971805e-05} +{"train_loss": 0.005451311357319355, "global_step": 25467, "epoch": 214, "lr": 7.23969785246704e-05} +{"train_loss": 0.004452172201126814, "global_step": 25468, "epoch": 214, "lr": 7.239499769564868e-05} +{"train_loss": 0.005458686966449022, "global_step": 25469, "epoch": 214, "lr": 7.239301682265676e-05} +{"train_loss": 0.0021861332934349775, "global_step": 25470, "epoch": 214, "lr": 7.239103590569856e-05} +{"train_loss": 0.005186554975807667, "global_step": 25471, "epoch": 214, "lr": 7.238905494477795e-05} +{"train_loss": 0.004427875857800245, "global_step": 25472, "epoch": 214, "lr": 7.238707393989882e-05} +{"train_loss": 0.0033849943429231644, "global_step": 25473, "epoch": 214, "lr": 7.238509289106506e-05} +{"train_loss": 0.00474317604675889, "global_step": 25474, "epoch": 214, "lr": 7.238311179828055e-05} +{"train_loss": 0.0024896818213164806, "global_step": 25475, "epoch": 214, "lr": 7.238113066154922e-05} +{"train_loss": 0.0037040356546640396, "global_step": 25476, "epoch": 214, "lr": 7.237914948087491e-05} +{"train_loss": 0.0035921346861869097, "global_step": 25477, "epoch": 214, "lr": 7.237716825626153e-05} +{"train_loss": 0.004107004962861538, "global_step": 25478, "epoch": 214, "lr": 7.237518698771298e-05} +{"train_loss": 0.0031310373451560736, "global_step": 25479, "epoch": 214, "lr": 7.237320567523313e-05} +{"train_loss": 0.0037825184408575296, "global_step": 25480, "epoch": 214, "lr": 7.237122431882589e-05} +{"train_loss": 0.0052423859015107155, "global_step": 25481, "epoch": 214, "lr": 7.236924291849514e-05} +{"train_loss": 0.004218844696879387, "global_step": 25482, "epoch": 214, "lr": 7.236726147424477e-05} +{"train_loss": 0.005510916467756033, "global_step": 25483, "epoch": 214, "lr": 7.236527998607868e-05} +{"train_loss": 0.0024259823840111494, "global_step": 25484, "epoch": 214, "lr": 7.236329845400074e-05} +{"train_loss": 0.0050544217228889465, "global_step": 25485, "epoch": 214, "lr": 7.236131687801486e-05} +{"train_loss": 0.0058636534959077835, "global_step": 25486, "epoch": 214, "lr": 7.235933525812492e-05} +{"train_loss": 0.0045079682022333145, "global_step": 25487, "epoch": 214, "lr": 7.235735359433481e-05} +{"train_loss": 0.004578724037855864, "global_step": 25488, "epoch": 214, "lr": 7.235537188664842e-05} +{"train_loss": 0.004997822921723127, "global_step": 25489, "epoch": 214, "lr": 7.235339013506967e-05} +{"train_loss": 0.003497338853776455, "global_step": 25490, "epoch": 214, "lr": 7.23514083396024e-05} +{"train_loss": 0.002353786490857601, "global_step": 25491, "epoch": 214, "lr": 7.234942650025054e-05} +{"train_loss": 0.004261862952262163, "global_step": 25492, "epoch": 214, "lr": 7.234744461701797e-05} +{"train_loss": 0.0035577742382884026, "global_step": 25493, "epoch": 214, "lr": 7.234546268990859e-05} +{"train_loss": 0.0026751598343253136, "global_step": 25494, "epoch": 214, "lr": 7.234348071892625e-05} +{"train_loss": 0.0030108275823295116, "global_step": 25495, "epoch": 214, "lr": 7.23414987040749e-05} +{"train_loss": 0.004869513213634491, "global_step": 25496, "epoch": 214, "lr": 7.233951664535838e-05} +{"train_loss": 0.0050373803824186325, "global_step": 25497, "epoch": 214, "lr": 7.233753454278063e-05} +{"train_loss": 0.003524893894791603, "global_step": 25498, "epoch": 214, "lr": 7.233555239634551e-05} +{"train_loss": 0.0035523385740816593, "global_step": 25499, "epoch": 214, "lr": 7.23335702060569e-05} +{"train_loss": 0.004015709273517132, "global_step": 25500, "epoch": 214, "lr": 7.233158797191875e-05} +{"train_loss": 0.005014410708099604, "global_step": 25501, "epoch": 214, "lr": 7.232960569393487e-05} +{"train_loss": 0.002618083031848073, "global_step": 25502, "epoch": 214, "lr": 7.232762337210924e-05} +{"train_loss": 0.001484459382481873, "global_step": 25503, "epoch": 214, "lr": 7.232564100644567e-05} +{"train_loss": 0.0033153654076159, "global_step": 25504, "epoch": 214, "lr": 7.23236585969481e-05} +{"train_loss": 0.0034057695884257555, "global_step": 25505, "epoch": 214, "lr": 7.232167614362042e-05} +{"train_loss": 0.0035812302958220243, "global_step": 25506, "epoch": 214, "lr": 7.23196936464665e-05} +{"train_loss": 0.0036397301591932774, "global_step": 25507, "epoch": 214, "lr": 7.231771110549027e-05} +{"train_loss": 0.0043418495915830135, "global_step": 25508, "epoch": 214, "lr": 7.231572852069557e-05} +{"train_loss": 0.0030617634765803814, "global_step": 25509, "epoch": 214, "lr": 7.231374589208633e-05} +{"train_loss": 0.0034424203913658857, "global_step": 25510, "epoch": 214, "lr": 7.231176321966643e-05} +{"train_loss": 0.003027027938514948, "global_step": 25511, "epoch": 214, "lr": 7.230978050343977e-05} +{"train_loss": 0.005956798326224089, "global_step": 25512, "epoch": 214, "lr": 7.230779774341024e-05} +{"train_loss": 0.0036044216249138117, "global_step": 25513, "epoch": 214, "lr": 7.230581493958174e-05} +{"train_loss": 0.0017780696507543325, "global_step": 25514, "epoch": 214, "lr": 7.230383209195815e-05} +{"train_loss": 0.003348149824887514, "global_step": 25515, "epoch": 214, "lr": 7.230184920054336e-05} +{"train_loss": 0.0050255246460437775, "global_step": 25516, "epoch": 214, "lr": 7.229986626534129e-05} +{"train_loss": 0.0030124871991574764, "global_step": 25517, "epoch": 214, "lr": 7.22978832863558e-05} +{"train_loss": 0.0032399320043623447, "global_step": 25518, "epoch": 214, "lr": 7.22959002635908e-05} +{"train_loss": 0.004072617273777723, "global_step": 25519, "epoch": 214, "lr": 7.22939171970502e-05} +{"train_loss": 0.003975699655711651, "global_step": 25520, "epoch": 214, "lr": 7.229193408673785e-05} +{"train_loss": 0.007426347583532333, "global_step": 25521, "epoch": 214, "lr": 7.228995093265769e-05} +{"train_loss": 0.0040897708386182785, "global_step": 25522, "epoch": 214, "lr": 7.228796773481358e-05} +{"train_loss": 0.0029894234612584114, "global_step": 25523, "epoch": 214, "lr": 7.228598449320944e-05} +{"train_loss": 0.004394217859953642, "global_step": 25524, "epoch": 214, "lr": 7.228400120784913e-05} +{"train_loss": 0.002687356900423765, "global_step": 25525, "epoch": 214, "lr": 7.228201787873657e-05} +{"train_loss": 0.004572057165205479, "global_step": 25526, "epoch": 214, "lr": 7.228003450587565e-05} +{"train_loss": 0.0028970749117434025, "global_step": 25527, "epoch": 214, "lr": 7.227805108927025e-05} +{"train_loss": 0.004315240774303675, "global_step": 25528, "epoch": 214, "lr": 7.227606762892431e-05} +{"train_loss": 0.003603691700845957, "global_step": 25529, "epoch": 214, "lr": 7.227408412484166e-05} +{"train_loss": 0.003988619428128004, "global_step": 25530, "epoch": 214, "lr": 7.227210057702624e-05} +{"train_loss": 0.0031982013024389744, "global_step": 25531, "epoch": 214, "lr": 7.227011698548193e-05} +{"train_loss": 0.003500264836475253, "global_step": 25532, "epoch": 214, "lr": 7.226813335021262e-05} +{"train_loss": 0.004469811450690031, "global_step": 25533, "epoch": 214, "lr": 7.226614967122222e-05} +{"train_loss": 0.005915503483265638, "global_step": 25534, "epoch": 214, "lr": 7.226416594851461e-05} +{"train_loss": 0.0047296034172177315, "global_step": 25535, "epoch": 214, "lr": 7.226218218209368e-05} +{"train_loss": 0.003486325265839696, "global_step": 25536, "epoch": 214, "lr": 7.226019837196334e-05} +{"train_loss": 0.0026323285419493914, "global_step": 25537, "epoch": 214, "lr": 7.225821451812746e-05} +{"train_loss": 0.00390975084155798, "global_step": 25538, "epoch": 214, "lr": 7.225623062058999e-05} +{"train_loss": 0.00223839795216918, "global_step": 25539, "epoch": 214, "lr": 7.225424667935476e-05} +{"train_loss": 0.0038928391877561808, "global_step": 25540, "epoch": 214, "lr": 7.225226269442571e-05} +{"train_loss": 0.004234713967889547, "global_step": 25541, "epoch": 214, "lr": 7.225027866580672e-05} +{"train_loss": 0.0033016775269061327, "global_step": 25542, "epoch": 214, "lr": 7.224829459350167e-05} +{"train_loss": 0.0030009339097887278, "global_step": 25543, "epoch": 214, "lr": 7.224631047751447e-05} +{"train_loss": 0.004765127785503864, "global_step": 25544, "epoch": 214, "lr": 7.224432631784903e-05} +{"train_loss": 0.003264625323936343, "global_step": 25545, "epoch": 214, "lr": 7.224234211450922e-05} +{"train_loss": 0.004995911382138729, "global_step": 25546, "epoch": 214, "lr": 7.224035786749895e-05} +{"train_loss": 0.004358732141554356, "global_step": 25547, "epoch": 214, "lr": 7.223837357682211e-05} +{"train_loss": 0.0031328375916928053, "global_step": 25548, "epoch": 214, "lr": 7.223638924248261e-05} +{"train_loss": 0.003837894182652235, "global_step": 25549, "epoch": 214, "lr": 7.223440486448433e-05} +{"train_loss": 0.005713441409170628, "global_step": 25550, "epoch": 214, "lr": 7.223242044283117e-05} +{"train_loss": 0.004179754294455051, "global_step": 25551, "epoch": 214, "lr": 7.223043597752703e-05} +{"train_loss": 0.006187645718455315, "global_step": 25552, "epoch": 214, "lr": 7.222845146857582e-05} +{"train_loss": 0.002654331037774682, "global_step": 25553, "epoch": 214, "lr": 7.222646691598139e-05} +{"train_loss": 0.005446762312203646, "global_step": 25554, "epoch": 214, "lr": 7.222448231974769e-05} +{"train_loss": 0.003102326299995184, "global_step": 25555, "epoch": 214, "lr": 7.222249767987859e-05} +{"train_loss": 0.005724180024117231, "global_step": 25556, "epoch": 214, "lr": 7.222051299637797e-05} +{"train_loss": 0.0025860394816845655, "global_step": 25557, "epoch": 214, "lr": 7.221852826924976e-05} +{"train_loss": 0.0028275528457015753, "global_step": 25558, "epoch": 214, "lr": 7.221654349849786e-05} +{"train_loss": 0.003168699098750949, "global_step": 25559, "epoch": 214, "lr": 7.221455868412613e-05} +{"train_loss": 0.0044838301837444305, "global_step": 25560, "epoch": 214, "lr": 7.221257382613848e-05} +{"train_loss": 0.0029655052348971367, "global_step": 25561, "epoch": 214, "lr": 7.221058892453883e-05} +{"train_loss": 0.0050813909620046616, "global_step": 25562, "epoch": 214, "lr": 7.220860397933106e-05} +{"train_loss": 0.003563414793461561, "global_step": 25563, "epoch": 214, "lr": 7.220661899051906e-05} +{"train_loss": 0.005798477213829756, "global_step": 25564, "epoch": 214, "lr": 7.220463395810674e-05} +{"train_loss": 0.002642542589455843, "global_step": 25565, "epoch": 214, "lr": 7.220264888209801e-05} +{"train_loss": 0.00352918216958642, "global_step": 25566, "epoch": 214, "lr": 7.220066376249673e-05} +{"train_loss": 0.004994540475308895, "global_step": 25567, "epoch": 214, "lr": 7.219867859930682e-05} +{"train_loss": 0.0020581886637955904, "global_step": 25568, "epoch": 214, "lr": 7.219669339253219e-05} +{"train_loss": 0.00327706360258162, "global_step": 25569, "epoch": 214, "lr": 7.219470814217671e-05} +{"train_loss": 0.005750253330916166, "global_step": 25570, "epoch": 214, "lr": 7.21927228482443e-05} +{"train_loss": 0.002324737375602126, "global_step": 25571, "epoch": 214, "lr": 7.219073751073887e-05} +{"train_loss": 0.004709531553089619, "global_step": 25572, "epoch": 214, "lr": 7.218875212966426e-05} +{"train_loss": 0.004730260465294123, "global_step": 25573, "epoch": 214, "lr": 7.218676670502442e-05} +{"train_loss": 0.0036577440332621336, "global_step": 25574, "epoch": 214, "lr": 7.218478123682322e-05} +{"train_loss": 0.005168506875634193, "global_step": 25575, "epoch": 214, "lr": 7.21827957250646e-05} +{"train_loss": 0.004313555546104908, "global_step": 25576, "epoch": 214, "lr": 7.218081016975242e-05} +{"train_loss": 0.004402167163789272, "global_step": 25577, "epoch": 214, "lr": 7.217882457089058e-05} +{"train_loss": 0.0064790076576173306, "global_step": 25578, "epoch": 214, "lr": 7.217683892848299e-05} +{"train_loss": 0.005124709568917751, "global_step": 25579, "epoch": 214, "lr": 7.217485324253354e-05} +{"train_loss": 0.0029571426566690207, "global_step": 25580, "epoch": 214, "lr": 7.217286751304615e-05} +{"train_loss": 0.0040118801407516, "global_step": 25581, "epoch": 214, "lr": 7.21708817400247e-05} +{"train_loss": 0.0035001325886696577, "global_step": 25582, "epoch": 214, "lr": 7.21688959234731e-05} +{"train_loss": 0.002145135309547186, "global_step": 25583, "epoch": 214, "lr": 7.216691006339522e-05} +{"train_loss": 0.003948360962300178, "global_step": 25584, "epoch": 214, "lr": 7.216492415979499e-05, "val_loss": 0.01820703037083149} +{"train_loss": 0.003800897393375635, "global_step": 25585, "epoch": 215, "lr": 7.21629382126763e-05} +{"train_loss": 0.004163715057075024, "global_step": 25586, "epoch": 215, "lr": 7.216095222204305e-05} +{"train_loss": 0.0058159660547971725, "global_step": 25587, "epoch": 215, "lr": 7.215896618789913e-05} +{"train_loss": 0.003101650159806013, "global_step": 25588, "epoch": 215, "lr": 7.215698011024846e-05} +{"train_loss": 0.00399499898776412, "global_step": 25589, "epoch": 215, "lr": 7.215499398909492e-05} +{"train_loss": 0.0020899653900414705, "global_step": 25590, "epoch": 215, "lr": 7.215300782444243e-05} +{"train_loss": 0.002156190574169159, "global_step": 25591, "epoch": 215, "lr": 7.215102161629486e-05} +{"train_loss": 0.0031183618120849133, "global_step": 25592, "epoch": 215, "lr": 7.214903536465613e-05} +{"train_loss": 0.00439756503328681, "global_step": 25593, "epoch": 215, "lr": 7.214704906953012e-05} +{"train_loss": 0.00561877153813839, "global_step": 25594, "epoch": 215, "lr": 7.214506273092075e-05} +{"train_loss": 0.0026050424203276634, "global_step": 25595, "epoch": 215, "lr": 7.214307634883192e-05} +{"train_loss": 0.004741334822028875, "global_step": 25596, "epoch": 215, "lr": 7.214108992326755e-05} +{"train_loss": 0.004268520977348089, "global_step": 25597, "epoch": 215, "lr": 7.213910345423149e-05} +{"train_loss": 0.0028037463780492544, "global_step": 25598, "epoch": 215, "lr": 7.213711694172767e-05} +{"train_loss": 0.004271848127245903, "global_step": 25599, "epoch": 215, "lr": 7.213513038575998e-05} +{"train_loss": 0.004074407275766134, "global_step": 25600, "epoch": 215, "lr": 7.213314378633234e-05} +{"train_loss": 0.0042841993272304535, "global_step": 25601, "epoch": 215, "lr": 7.213115714344862e-05} +{"train_loss": 0.006465057842433453, "global_step": 25602, "epoch": 215, "lr": 7.212917045711277e-05} +{"train_loss": 0.0032764198258519173, "global_step": 25603, "epoch": 215, "lr": 7.212718372732863e-05} +{"train_loss": 0.003021609503775835, "global_step": 25604, "epoch": 215, "lr": 7.212519695410013e-05} +{"train_loss": 0.006100477185100317, "global_step": 25605, "epoch": 215, "lr": 7.212321013743118e-05} +{"train_loss": 0.00459684431552887, "global_step": 25606, "epoch": 215, "lr": 7.212122327732565e-05} +{"train_loss": 0.004762685392051935, "global_step": 25607, "epoch": 215, "lr": 7.211923637378748e-05} +{"train_loss": 0.00388171779923141, "global_step": 25608, "epoch": 215, "lr": 7.211724942682055e-05} +{"train_loss": 0.003220949089154601, "global_step": 25609, "epoch": 215, "lr": 7.211526243642875e-05} +{"train_loss": 0.0017786768730729818, "global_step": 25610, "epoch": 215, "lr": 7.211327540261601e-05} +{"train_loss": 0.005655661690980196, "global_step": 25611, "epoch": 215, "lr": 7.21112883253862e-05} +{"train_loss": 0.004313239827752113, "global_step": 25612, "epoch": 215, "lr": 7.210930120474325e-05} +{"train_loss": 0.00409350311383605, "global_step": 25613, "epoch": 215, "lr": 7.210731404069105e-05} +{"train_loss": 0.005198413971811533, "global_step": 25614, "epoch": 215, "lr": 7.210532683323349e-05} +{"train_loss": 0.003855697112157941, "global_step": 25615, "epoch": 215, "lr": 7.21033395823745e-05} +{"train_loss": 0.004726053215563297, "global_step": 25616, "epoch": 215, "lr": 7.210135228811797e-05} +{"train_loss": 0.004369314294308424, "global_step": 25617, "epoch": 215, "lr": 7.209936495046777e-05} +{"train_loss": 0.00514263054355979, "global_step": 25618, "epoch": 215, "lr": 7.209737756942784e-05} +{"train_loss": 0.0029160769190639257, "global_step": 25619, "epoch": 215, "lr": 7.209539014500207e-05} +{"train_loss": 0.0038286081980913877, "global_step": 25620, "epoch": 215, "lr": 7.209340267719435e-05} +{"train_loss": 0.0034241576213389635, "global_step": 25621, "epoch": 215, "lr": 7.209141516600863e-05} +{"train_loss": 0.0033901415299624205, "global_step": 25622, "epoch": 215, "lr": 7.208942761144874e-05} +{"train_loss": 0.003620594972744584, "global_step": 25623, "epoch": 215, "lr": 7.208744001351864e-05} +{"train_loss": 0.003506684908643365, "global_step": 25624, "epoch": 215, "lr": 7.20854523722222e-05} +{"train_loss": 0.0035163091961294413, "global_step": 25625, "epoch": 215, "lr": 7.208346468756332e-05} +{"train_loss": 0.003467810107395053, "global_step": 25626, "epoch": 215, "lr": 7.208147695954594e-05} +{"train_loss": 0.003488359274342656, "global_step": 25627, "epoch": 215, "lr": 7.207948918817394e-05} +{"train_loss": 0.004707128740847111, "global_step": 25628, "epoch": 215, "lr": 7.20775013734512e-05} +{"train_loss": 0.002749514998868108, "global_step": 25629, "epoch": 215, "lr": 7.207551351538167e-05} +{"train_loss": 0.003466634312644601, "global_step": 25630, "epoch": 215, "lr": 7.20735256139692e-05} +{"train_loss": 0.0038886102847754955, "global_step": 25631, "epoch": 215, "lr": 7.207153766921774e-05} +{"train_loss": 0.004417894873768091, "global_step": 25632, "epoch": 215, "lr": 7.206954968113118e-05} +{"train_loss": 0.00482341879978776, "global_step": 25633, "epoch": 215, "lr": 7.20675616497134e-05} +{"train_loss": 0.003208455629646778, "global_step": 25634, "epoch": 215, "lr": 7.206557357496833e-05} +{"train_loss": 0.005116893444210291, "global_step": 25635, "epoch": 215, "lr": 7.206358545689986e-05} +{"train_loss": 0.0021376372314989567, "global_step": 25636, "epoch": 215, "lr": 7.206159729551189e-05} +{"train_loss": 0.003495520446449518, "global_step": 25637, "epoch": 215, "lr": 7.205960909080834e-05} +{"train_loss": 0.004325586836785078, "global_step": 25638, "epoch": 215, "lr": 7.20576208427931e-05} +{"train_loss": 0.004278971813619137, "global_step": 25639, "epoch": 215, "lr": 7.205563255147009e-05} +{"train_loss": 0.004141594748944044, "global_step": 25640, "epoch": 215, "lr": 7.20536442168432e-05} +{"train_loss": 0.0035755683202296495, "global_step": 25641, "epoch": 215, "lr": 7.205165583891632e-05} +{"train_loss": 0.002916610799729824, "global_step": 25642, "epoch": 215, "lr": 7.204966741769338e-05} +{"train_loss": 0.0035873092710971832, "global_step": 25643, "epoch": 215, "lr": 7.204767895317826e-05} +{"train_loss": 0.0033008030150085688, "global_step": 25644, "epoch": 215, "lr": 7.20456904453749e-05} +{"train_loss": 0.003510075621306896, "global_step": 25645, "epoch": 215, "lr": 7.204370189428716e-05} +{"train_loss": 0.0040183356031775475, "global_step": 25646, "epoch": 215, "lr": 7.204171329991899e-05} +{"train_loss": 0.002574056386947632, "global_step": 25647, "epoch": 215, "lr": 7.203972466227426e-05} +{"train_loss": 0.004098143428564072, "global_step": 25648, "epoch": 215, "lr": 7.203773598135687e-05} +{"train_loss": 0.0022979951463639736, "global_step": 25649, "epoch": 215, "lr": 7.203574725717076e-05} +{"train_loss": 0.0033741858787834644, "global_step": 25650, "epoch": 215, "lr": 7.203375848971981e-05} +{"train_loss": 0.002986769424751401, "global_step": 25651, "epoch": 215, "lr": 7.203176967900792e-05} +{"train_loss": 0.0032016769982874393, "global_step": 25652, "epoch": 215, "lr": 7.202978082503902e-05} +{"train_loss": 0.004101394675672054, "global_step": 25653, "epoch": 215, "lr": 7.202779192781699e-05} +{"train_loss": 0.0034525375813245773, "global_step": 25654, "epoch": 215, "lr": 7.202580298734575e-05} +{"train_loss": 0.00400101114064455, "global_step": 25655, "epoch": 215, "lr": 7.202381400362919e-05} +{"train_loss": 0.004833909682929516, "global_step": 25656, "epoch": 215, "lr": 7.202182497667123e-05} +{"train_loss": 0.005089612677693367, "global_step": 25657, "epoch": 215, "lr": 7.201983590647575e-05} +{"train_loss": 0.003225765423849225, "global_step": 25658, "epoch": 215, "lr": 7.201784679304669e-05} +{"train_loss": 0.0028934692963957787, "global_step": 25659, "epoch": 215, "lr": 7.201585763638794e-05} +{"train_loss": 0.004906481131911278, "global_step": 25660, "epoch": 215, "lr": 7.201386843650342e-05} +{"train_loss": 0.0027365079149603844, "global_step": 25661, "epoch": 215, "lr": 7.2011879193397e-05} +{"train_loss": 0.003934258595108986, "global_step": 25662, "epoch": 215, "lr": 7.200988990707261e-05} +{"train_loss": 0.0054081459529697895, "global_step": 25663, "epoch": 215, "lr": 7.200790057753415e-05} +{"train_loss": 0.003277287818491459, "global_step": 25664, "epoch": 215, "lr": 7.200591120478555e-05} +{"train_loss": 0.0036963466554880142, "global_step": 25665, "epoch": 215, "lr": 7.200392178883069e-05} +{"train_loss": 0.003006456885486841, "global_step": 25666, "epoch": 215, "lr": 7.200193232967346e-05} +{"train_loss": 0.004586072638630867, "global_step": 25667, "epoch": 215, "lr": 7.199994282731779e-05} +{"train_loss": 0.005252179689705372, "global_step": 25668, "epoch": 215, "lr": 7.199795328176759e-05} +{"train_loss": 0.003032197942957282, "global_step": 25669, "epoch": 215, "lr": 7.199596369302676e-05} +{"train_loss": 0.0036345080006867647, "global_step": 25670, "epoch": 215, "lr": 7.19939740610992e-05} +{"train_loss": 0.0038531646132469177, "global_step": 25671, "epoch": 215, "lr": 7.199198438598884e-05} +{"train_loss": 0.003577398369088769, "global_step": 25672, "epoch": 215, "lr": 7.198999466769954e-05} +{"train_loss": 0.004713209345936775, "global_step": 25673, "epoch": 215, "lr": 7.198800490623525e-05} +{"train_loss": 0.004460514988750219, "global_step": 25674, "epoch": 215, "lr": 7.198601510159986e-05} +{"train_loss": 0.0037018191069364548, "global_step": 25675, "epoch": 215, "lr": 7.198402525379728e-05} +{"train_loss": 0.006153724156320095, "global_step": 25676, "epoch": 215, "lr": 7.198203536283141e-05} +{"train_loss": 0.005721531342715025, "global_step": 25677, "epoch": 215, "lr": 7.198004542870616e-05} +{"train_loss": 0.0034477696754038334, "global_step": 25678, "epoch": 215, "lr": 7.197805545142544e-05} +{"train_loss": 0.0041062901727855206, "global_step": 25679, "epoch": 215, "lr": 7.197606543099317e-05} +{"train_loss": 0.0023251639213413, "global_step": 25680, "epoch": 215, "lr": 7.197407536741322e-05} +{"train_loss": 0.005272692069411278, "global_step": 25681, "epoch": 215, "lr": 7.197208526068954e-05} +{"train_loss": 0.0051582083106040955, "global_step": 25682, "epoch": 215, "lr": 7.197009511082601e-05} +{"train_loss": 0.0037024598568677902, "global_step": 25683, "epoch": 215, "lr": 7.196810491782656e-05} +{"train_loss": 0.003971772268414497, "global_step": 25684, "epoch": 215, "lr": 7.196611468169506e-05} +{"train_loss": 0.005639887880533934, "global_step": 25685, "epoch": 215, "lr": 7.196412440243545e-05} +{"train_loss": 0.004985007457435131, "global_step": 25686, "epoch": 215, "lr": 7.196213408005164e-05} +{"train_loss": 0.004882355220615864, "global_step": 25687, "epoch": 215, "lr": 7.196014371454751e-05} +{"train_loss": 0.002747617894783616, "global_step": 25688, "epoch": 215, "lr": 7.195815330592699e-05} +{"train_loss": 0.00556202745065093, "global_step": 25689, "epoch": 215, "lr": 7.195616285419397e-05} +{"train_loss": 0.0024342474061995745, "global_step": 25690, "epoch": 215, "lr": 7.195417235935239e-05} +{"train_loss": 0.00515817990526557, "global_step": 25691, "epoch": 215, "lr": 7.195218182140613e-05} +{"train_loss": 0.004617555532604456, "global_step": 25692, "epoch": 215, "lr": 7.19501912403591e-05} +{"train_loss": 0.0038735985290259123, "global_step": 25693, "epoch": 215, "lr": 7.19482006162152e-05} +{"train_loss": 0.003539211116731167, "global_step": 25694, "epoch": 215, "lr": 7.194620994897839e-05} +{"train_loss": 0.005550697911530733, "global_step": 25695, "epoch": 215, "lr": 7.194421923865252e-05} +{"train_loss": 0.0041634379886090755, "global_step": 25696, "epoch": 215, "lr": 7.194222848524152e-05} +{"train_loss": 0.0054682400077581406, "global_step": 25697, "epoch": 215, "lr": 7.194023768874932e-05} +{"train_loss": 0.003994138911366463, "global_step": 25698, "epoch": 215, "lr": 7.193824684917978e-05} +{"train_loss": 0.005690612364560366, "global_step": 25699, "epoch": 215, "lr": 7.193625596653684e-05} +{"train_loss": 0.004393295384943485, "global_step": 25700, "epoch": 215, "lr": 7.193426504082442e-05} +{"train_loss": 0.0033175195567309856, "global_step": 25701, "epoch": 215, "lr": 7.193227407204639e-05} +{"train_loss": 0.004151072818785906, "global_step": 25702, "epoch": 215, "lr": 7.19302830602067e-05} +{"train_loss": 0.003998885279474389, "global_step": 25703, "epoch": 215, "lr": 7.192829200530925e-05, "val_loss": 0.019361326470971107, "train_action_mse_error": 0.00010039295739261433} +{"train_loss": 0.00473277922719717, "global_step": 25704, "epoch": 216, "lr": 7.192630090735793e-05} +{"train_loss": 0.004292624071240425, "global_step": 25705, "epoch": 216, "lr": 7.192430976635666e-05} +{"train_loss": 0.004335856065154076, "global_step": 25706, "epoch": 216, "lr": 7.192231858230934e-05} +{"train_loss": 0.0025371627416461706, "global_step": 25707, "epoch": 216, "lr": 7.19203273552199e-05} +{"train_loss": 0.004131285008043051, "global_step": 25708, "epoch": 216, "lr": 7.191833608509224e-05} +{"train_loss": 0.0035740286111831665, "global_step": 25709, "epoch": 216, "lr": 7.191634477193028e-05} +{"train_loss": 0.0027276005130261183, "global_step": 25710, "epoch": 216, "lr": 7.19143534157379e-05} +{"train_loss": 0.003368957433849573, "global_step": 25711, "epoch": 216, "lr": 7.191236201651903e-05} +{"train_loss": 0.004038945306092501, "global_step": 25712, "epoch": 216, "lr": 7.191037057427758e-05} +{"train_loss": 0.0025607673451304436, "global_step": 25713, "epoch": 216, "lr": 7.190837908901746e-05} +{"train_loss": 0.003657134249806404, "global_step": 25714, "epoch": 216, "lr": 7.190638756074258e-05} +{"train_loss": 0.0021129180677235126, "global_step": 25715, "epoch": 216, "lr": 7.190439598945686e-05} +{"train_loss": 0.0032447597477585077, "global_step": 25716, "epoch": 216, "lr": 7.190240437516419e-05} +{"train_loss": 0.004831286147236824, "global_step": 25717, "epoch": 216, "lr": 7.190041271786848e-05} +{"train_loss": 0.0026294835843145847, "global_step": 25718, "epoch": 216, "lr": 7.189842101757366e-05} +{"train_loss": 0.004207249730825424, "global_step": 25719, "epoch": 216, "lr": 7.189642927428362e-05} +{"train_loss": 0.005555708892643452, "global_step": 25720, "epoch": 216, "lr": 7.189443748800229e-05} +{"train_loss": 0.003481025341898203, "global_step": 25721, "epoch": 216, "lr": 7.189244565873357e-05} +{"train_loss": 0.0034450131934136152, "global_step": 25722, "epoch": 216, "lr": 7.189045378648138e-05} +{"train_loss": 0.0021013792138546705, "global_step": 25723, "epoch": 216, "lr": 7.188846187124961e-05} +{"train_loss": 0.003931073006242514, "global_step": 25724, "epoch": 216, "lr": 7.188646991304218e-05} +{"train_loss": 0.0026134198997169733, "global_step": 25725, "epoch": 216, "lr": 7.1884477911863e-05} +{"train_loss": 0.002961826277896762, "global_step": 25726, "epoch": 216, "lr": 7.1882485867716e-05} +{"train_loss": 0.0035227718763053417, "global_step": 25727, "epoch": 216, "lr": 7.188049378060506e-05} +{"train_loss": 0.005033636000007391, "global_step": 25728, "epoch": 216, "lr": 7.187850165053412e-05} +{"train_loss": 0.004392958711832762, "global_step": 25729, "epoch": 216, "lr": 7.187650947750709e-05} +{"train_loss": 0.0032224117312580347, "global_step": 25730, "epoch": 216, "lr": 7.187451726152785e-05} +{"train_loss": 0.0027350843884050846, "global_step": 25731, "epoch": 216, "lr": 7.187252500260035e-05} +{"train_loss": 0.005166295450180769, "global_step": 25732, "epoch": 216, "lr": 7.187053270072846e-05} +{"train_loss": 0.002900684019550681, "global_step": 25733, "epoch": 216, "lr": 7.186854035591614e-05} +{"train_loss": 0.005052819848060608, "global_step": 25734, "epoch": 216, "lr": 7.186654796816728e-05} +{"train_loss": 0.003545928280800581, "global_step": 25735, "epoch": 216, "lr": 7.186455553748577e-05} +{"train_loss": 0.0028890713583678007, "global_step": 25736, "epoch": 216, "lr": 7.186256306387555e-05} +{"train_loss": 0.0055076247081160545, "global_step": 25737, "epoch": 216, "lr": 7.186057054734053e-05} +{"train_loss": 0.00412067212164402, "global_step": 25738, "epoch": 216, "lr": 7.18585779878846e-05} +{"train_loss": 0.003276323201134801, "global_step": 25739, "epoch": 216, "lr": 7.185658538551168e-05} +{"train_loss": 0.0023842588998377323, "global_step": 25740, "epoch": 216, "lr": 7.185459274022572e-05} +{"train_loss": 0.0033737379126250744, "global_step": 25741, "epoch": 216, "lr": 7.185260005203058e-05} +{"train_loss": 0.004825678654015064, "global_step": 25742, "epoch": 216, "lr": 7.18506073209302e-05} +{"train_loss": 0.003029886167496443, "global_step": 25743, "epoch": 216, "lr": 7.184861454692849e-05} +{"train_loss": 0.004154715687036514, "global_step": 25744, "epoch": 216, "lr": 7.184662173002935e-05} +{"train_loss": 0.0033494431991130114, "global_step": 25745, "epoch": 216, "lr": 7.184462887023671e-05} +{"train_loss": 0.0022439658641815186, "global_step": 25746, "epoch": 216, "lr": 7.184263596755448e-05} +{"train_loss": 0.002457774942740798, "global_step": 25747, "epoch": 216, "lr": 7.184064302198656e-05} +{"train_loss": 0.002769522136077285, "global_step": 25748, "epoch": 216, "lr": 7.183865003353687e-05} +{"train_loss": 0.00288693280890584, "global_step": 25749, "epoch": 216, "lr": 7.183665700220933e-05} +{"train_loss": 0.004460692405700684, "global_step": 25750, "epoch": 216, "lr": 7.183466392800784e-05} +{"train_loss": 0.003389958990737796, "global_step": 25751, "epoch": 216, "lr": 7.183267081093633e-05} +{"train_loss": 0.004471451044082642, "global_step": 25752, "epoch": 216, "lr": 7.18306776509987e-05} +{"train_loss": 0.0028158959466964006, "global_step": 25753, "epoch": 216, "lr": 7.182868444819887e-05} +{"train_loss": 0.004671559669077396, "global_step": 25754, "epoch": 216, "lr": 7.182669120254075e-05} +{"train_loss": 0.004887521266937256, "global_step": 25755, "epoch": 216, "lr": 7.182469791402824e-05} +{"train_loss": 0.0025663175620138645, "global_step": 25756, "epoch": 216, "lr": 7.182270458266527e-05} +{"train_loss": 0.002650936832651496, "global_step": 25757, "epoch": 216, "lr": 7.182071120845575e-05} +{"train_loss": 0.0026185731403529644, "global_step": 25758, "epoch": 216, "lr": 7.18187177914036e-05} +{"train_loss": 0.003848510328680277, "global_step": 25759, "epoch": 216, "lr": 7.181672433151273e-05} +{"train_loss": 0.004660121630877256, "global_step": 25760, "epoch": 216, "lr": 7.181473082878704e-05} +{"train_loss": 0.0053996858187019825, "global_step": 25761, "epoch": 216, "lr": 7.181273728323048e-05} +{"train_loss": 0.00292436545714736, "global_step": 25762, "epoch": 216, "lr": 7.181074369484692e-05} +{"train_loss": 0.0038706997875124216, "global_step": 25763, "epoch": 216, "lr": 7.180875006364031e-05} +{"train_loss": 0.003341727890074253, "global_step": 25764, "epoch": 216, "lr": 7.180675638961454e-05} +{"train_loss": 0.0036593135446310043, "global_step": 25765, "epoch": 216, "lr": 7.180476267277353e-05} +{"train_loss": 0.0037536558229476213, "global_step": 25766, "epoch": 216, "lr": 7.180276891312122e-05} +{"train_loss": 0.003897432703524828, "global_step": 25767, "epoch": 216, "lr": 7.180077511066148e-05} +{"train_loss": 0.0035858892370015383, "global_step": 25768, "epoch": 216, "lr": 7.179878126539825e-05} +{"train_loss": 0.0046857502311468124, "global_step": 25769, "epoch": 216, "lr": 7.179678737733545e-05} +{"train_loss": 0.0030920582357794046, "global_step": 25770, "epoch": 216, "lr": 7.179479344647699e-05} +{"train_loss": 0.00392776308581233, "global_step": 25771, "epoch": 216, "lr": 7.179279947282677e-05} +{"train_loss": 0.004312485922127962, "global_step": 25772, "epoch": 216, "lr": 7.179080545638872e-05} +{"train_loss": 0.0036627959925681353, "global_step": 25773, "epoch": 216, "lr": 7.178881139716675e-05} +{"train_loss": 0.004490702413022518, "global_step": 25774, "epoch": 216, "lr": 7.17868172951648e-05} +{"train_loss": 0.004665684886276722, "global_step": 25775, "epoch": 216, "lr": 7.178482315038672e-05} +{"train_loss": 0.0029543181881308556, "global_step": 25776, "epoch": 216, "lr": 7.178282896283648e-05} +{"train_loss": 0.003093921346589923, "global_step": 25777, "epoch": 216, "lr": 7.178083473251799e-05} +{"train_loss": 0.0038004093803465366, "global_step": 25778, "epoch": 216, "lr": 7.177884045943516e-05} +{"train_loss": 0.0024566599167883396, "global_step": 25779, "epoch": 216, "lr": 7.17768461435919e-05} +{"train_loss": 0.00298405927605927, "global_step": 25780, "epoch": 216, "lr": 7.177485178499214e-05} +{"train_loss": 0.0036241381894797087, "global_step": 25781, "epoch": 216, "lr": 7.177285738363977e-05} +{"train_loss": 0.005674459505826235, "global_step": 25782, "epoch": 216, "lr": 7.177086293953873e-05} +{"train_loss": 0.0033257226459681988, "global_step": 25783, "epoch": 216, "lr": 7.176886845269292e-05} +{"train_loss": 0.0028821879532188177, "global_step": 25784, "epoch": 216, "lr": 7.176687392310628e-05} +{"train_loss": 0.0031201171223074198, "global_step": 25785, "epoch": 216, "lr": 7.176487935078269e-05} +{"train_loss": 0.003320224117487669, "global_step": 25786, "epoch": 216, "lr": 7.176288473572608e-05} +{"train_loss": 0.004668890498578548, "global_step": 25787, "epoch": 216, "lr": 7.176089007794038e-05} +{"train_loss": 0.0028969268314540386, "global_step": 25788, "epoch": 216, "lr": 7.17588953774295e-05} +{"train_loss": 0.0018757699290290475, "global_step": 25789, "epoch": 216, "lr": 7.175690063419734e-05} +{"train_loss": 0.002367233159020543, "global_step": 25790, "epoch": 216, "lr": 7.175490584824784e-05} +{"train_loss": 0.00351967616006732, "global_step": 25791, "epoch": 216, "lr": 7.17529110195849e-05} +{"train_loss": 0.002534610917791724, "global_step": 25792, "epoch": 216, "lr": 7.175091614821245e-05} +{"train_loss": 0.00324842007830739, "global_step": 25793, "epoch": 216, "lr": 7.17489212341344e-05} +{"train_loss": 0.0029663562308996916, "global_step": 25794, "epoch": 216, "lr": 7.174692627735466e-05} +{"train_loss": 0.005174805410206318, "global_step": 25795, "epoch": 216, "lr": 7.174493127787717e-05} +{"train_loss": 0.0036388004664331675, "global_step": 25796, "epoch": 216, "lr": 7.174293623570583e-05} +{"train_loss": 0.002847807016223669, "global_step": 25797, "epoch": 216, "lr": 7.174094115084454e-05} +{"train_loss": 0.001745802816003561, "global_step": 25798, "epoch": 216, "lr": 7.173894602329725e-05} +{"train_loss": 0.006207694299519062, "global_step": 25799, "epoch": 216, "lr": 7.173695085306784e-05} +{"train_loss": 0.004275410436093807, "global_step": 25800, "epoch": 216, "lr": 7.173495564016027e-05} +{"train_loss": 0.003864640835672617, "global_step": 25801, "epoch": 216, "lr": 7.173296038457843e-05} +{"train_loss": 0.005024618469178677, "global_step": 25802, "epoch": 216, "lr": 7.173096508632624e-05} +{"train_loss": 0.004906818270683289, "global_step": 25803, "epoch": 216, "lr": 7.172896974540763e-05} +{"train_loss": 0.0029169158078730106, "global_step": 25804, "epoch": 216, "lr": 7.172697436182652e-05} +{"train_loss": 0.004727340769022703, "global_step": 25805, "epoch": 216, "lr": 7.172497893558679e-05} +{"train_loss": 0.0023802854120731354, "global_step": 25806, "epoch": 216, "lr": 7.172298346669239e-05} +{"train_loss": 0.0023037209175527096, "global_step": 25807, "epoch": 216, "lr": 7.172098795514724e-05} +{"train_loss": 0.0036137085407972336, "global_step": 25808, "epoch": 216, "lr": 7.171899240095526e-05} +{"train_loss": 0.0053341505117714405, "global_step": 25809, "epoch": 216, "lr": 7.171699680412034e-05} +{"train_loss": 0.003967342432588339, "global_step": 25810, "epoch": 216, "lr": 7.171500116464642e-05} +{"train_loss": 0.0033336139749735594, "global_step": 25811, "epoch": 216, "lr": 7.171300548253743e-05} +{"train_loss": 0.004895027261227369, "global_step": 25812, "epoch": 216, "lr": 7.171100975779726e-05} +{"train_loss": 0.0026905506383627653, "global_step": 25813, "epoch": 216, "lr": 7.170901399042984e-05} +{"train_loss": 0.0049900212325155735, "global_step": 25814, "epoch": 216, "lr": 7.17070181804391e-05} +{"train_loss": 0.006052297540009022, "global_step": 25815, "epoch": 216, "lr": 7.170502232782896e-05} +{"train_loss": 0.004307888448238373, "global_step": 25816, "epoch": 216, "lr": 7.170302643260331e-05} +{"train_loss": 0.0028310632333159447, "global_step": 25817, "epoch": 216, "lr": 7.170103049476609e-05} +{"train_loss": 0.004225042648613453, "global_step": 25818, "epoch": 216, "lr": 7.16990345143212e-05} +{"train_loss": 0.003609594888985157, "global_step": 25819, "epoch": 216, "lr": 7.16970384912726e-05} +{"train_loss": 0.004894934594631195, "global_step": 25820, "epoch": 216, "lr": 7.169504242562417e-05} +{"train_loss": 0.005462197121232748, "global_step": 25821, "epoch": 216, "lr": 7.169304631737986e-05} +{"train_loss": 0.00370113187989987, "global_step": 25822, "epoch": 216, "lr": 7.169105016654354e-05, "val_loss": 0.013201978988945484} +{"train_loss": 0.0041722701862454414, "global_step": 25823, "epoch": 217, "lr": 7.168905397311918e-05} +{"train_loss": 0.002110344124957919, "global_step": 25824, "epoch": 217, "lr": 7.168705773711066e-05} +{"train_loss": 0.002876922721043229, "global_step": 25825, "epoch": 217, "lr": 7.168506145852194e-05} +{"train_loss": 0.005427439697086811, "global_step": 25826, "epoch": 217, "lr": 7.16830651373569e-05} +{"train_loss": 0.0037053143605589867, "global_step": 25827, "epoch": 217, "lr": 7.16810687736195e-05} +{"train_loss": 0.002385296393185854, "global_step": 25828, "epoch": 217, "lr": 7.167907236731363e-05} +{"train_loss": 0.0022069180849939585, "global_step": 25829, "epoch": 217, "lr": 7.167707591844322e-05} +{"train_loss": 0.004756329581141472, "global_step": 25830, "epoch": 217, "lr": 7.167507942701218e-05} +{"train_loss": 0.004892116878181696, "global_step": 25831, "epoch": 217, "lr": 7.167308289302444e-05} +{"train_loss": 0.003211771370843053, "global_step": 25832, "epoch": 217, "lr": 7.167108631648392e-05} +{"train_loss": 0.006911766715347767, "global_step": 25833, "epoch": 217, "lr": 7.166908969739453e-05} +{"train_loss": 0.0035412770230323076, "global_step": 25834, "epoch": 217, "lr": 7.16670930357602e-05} +{"train_loss": 0.004370079375803471, "global_step": 25835, "epoch": 217, "lr": 7.166509633158485e-05} +{"train_loss": 0.0048097362741827965, "global_step": 25836, "epoch": 217, "lr": 7.16630995848724e-05} +{"train_loss": 0.0035006229300051928, "global_step": 25837, "epoch": 217, "lr": 7.166110279562676e-05} +{"train_loss": 0.0046860044822096825, "global_step": 25838, "epoch": 217, "lr": 7.165910596385187e-05} +{"train_loss": 0.002527539851143956, "global_step": 25839, "epoch": 217, "lr": 7.165710908955164e-05} +{"train_loss": 0.0024634019937366247, "global_step": 25840, "epoch": 217, "lr": 7.165511217272997e-05} +{"train_loss": 0.004309231415390968, "global_step": 25841, "epoch": 217, "lr": 7.165311521339082e-05} +{"train_loss": 0.0058543747290968895, "global_step": 25842, "epoch": 217, "lr": 7.165111821153809e-05} +{"train_loss": 0.0028955910820513964, "global_step": 25843, "epoch": 217, "lr": 7.164912116717568e-05} +{"train_loss": 0.0033217708114534616, "global_step": 25844, "epoch": 217, "lr": 7.164712408030757e-05} +{"train_loss": 0.004294543527066708, "global_step": 25845, "epoch": 217, "lr": 7.164512695093762e-05} +{"train_loss": 0.0029739798046648502, "global_step": 25846, "epoch": 217, "lr": 7.164312977906978e-05} +{"train_loss": 0.004944026470184326, "global_step": 25847, "epoch": 217, "lr": 7.164113256470796e-05} +{"train_loss": 0.00433043297380209, "global_step": 25848, "epoch": 217, "lr": 7.16391353078561e-05} +{"train_loss": 0.008635341189801693, "global_step": 25849, "epoch": 217, "lr": 7.163713800851811e-05} +{"train_loss": 0.00512490002438426, "global_step": 25850, "epoch": 217, "lr": 7.163514066669791e-05} +{"train_loss": 0.003383242292329669, "global_step": 25851, "epoch": 217, "lr": 7.163314328239942e-05} +{"train_loss": 0.002476076828315854, "global_step": 25852, "epoch": 217, "lr": 7.163114585562656e-05} +{"train_loss": 0.003278065240010619, "global_step": 25853, "epoch": 217, "lr": 7.162914838638327e-05} +{"train_loss": 0.004450903739780188, "global_step": 25854, "epoch": 217, "lr": 7.162715087467346e-05} +{"train_loss": 0.00489734997972846, "global_step": 25855, "epoch": 217, "lr": 7.162515332050102e-05} +{"train_loss": 0.007445088122040033, "global_step": 25856, "epoch": 217, "lr": 7.162315572386993e-05} +{"train_loss": 0.002822580048814416, "global_step": 25857, "epoch": 217, "lr": 7.162115808478407e-05} +{"train_loss": 0.006144179962575436, "global_step": 25858, "epoch": 217, "lr": 7.161916040324737e-05} +{"train_loss": 0.003841989440843463, "global_step": 25859, "epoch": 217, "lr": 7.161716267926377e-05} +{"train_loss": 0.006831165868788958, "global_step": 25860, "epoch": 217, "lr": 7.161516491283718e-05} +{"train_loss": 0.00688449339941144, "global_step": 25861, "epoch": 217, "lr": 7.161316710397152e-05} +{"train_loss": 0.005650732200592756, "global_step": 25862, "epoch": 217, "lr": 7.161116925267073e-05} +{"train_loss": 0.004162275232374668, "global_step": 25863, "epoch": 217, "lr": 7.16091713589387e-05} +{"train_loss": 0.00436755595728755, "global_step": 25864, "epoch": 217, "lr": 7.160717342277937e-05} +{"train_loss": 0.006797532085329294, "global_step": 25865, "epoch": 217, "lr": 7.160517544419668e-05} +{"train_loss": 0.0033633909188210964, "global_step": 25866, "epoch": 217, "lr": 7.160317742319453e-05} +{"train_loss": 0.007691127713769674, "global_step": 25867, "epoch": 217, "lr": 7.160117935977684e-05} +{"train_loss": 0.004579818807542324, "global_step": 25868, "epoch": 217, "lr": 7.159918125394755e-05} +{"train_loss": 0.004754839465022087, "global_step": 25869, "epoch": 217, "lr": 7.159718310571057e-05} +{"train_loss": 0.004991599824279547, "global_step": 25870, "epoch": 217, "lr": 7.159518491506982e-05} +{"train_loss": 0.005786953493952751, "global_step": 25871, "epoch": 217, "lr": 7.159318668202925e-05} +{"train_loss": 0.004497826099395752, "global_step": 25872, "epoch": 217, "lr": 7.159118840659276e-05} +{"train_loss": 0.004505244083702564, "global_step": 25873, "epoch": 217, "lr": 7.158919008876426e-05} +{"train_loss": 0.0022863070480525494, "global_step": 25874, "epoch": 217, "lr": 7.158719172854772e-05} +{"train_loss": 0.0047276075929403305, "global_step": 25875, "epoch": 217, "lr": 7.158519332594701e-05} +{"train_loss": 0.004534037783741951, "global_step": 25876, "epoch": 217, "lr": 7.158319488096608e-05} +{"train_loss": 0.0034582894295454025, "global_step": 25877, "epoch": 217, "lr": 7.158119639360887e-05} +{"train_loss": 0.005857763811945915, "global_step": 25878, "epoch": 217, "lr": 7.15791978638793e-05} +{"train_loss": 0.0038362035993486643, "global_step": 25879, "epoch": 217, "lr": 7.157719929178125e-05} +{"train_loss": 0.003532168222591281, "global_step": 25880, "epoch": 217, "lr": 7.15752006773187e-05} +{"train_loss": 0.003811738919466734, "global_step": 25881, "epoch": 217, "lr": 7.157320202049551e-05} +{"train_loss": 0.00393403135240078, "global_step": 25882, "epoch": 217, "lr": 7.157120332131567e-05} +{"train_loss": 0.007515814155340195, "global_step": 25883, "epoch": 217, "lr": 7.156920457978306e-05} +{"train_loss": 0.0033035383094102144, "global_step": 25884, "epoch": 217, "lr": 7.156720579590164e-05} +{"train_loss": 0.0022636980284005404, "global_step": 25885, "epoch": 217, "lr": 7.156520696967532e-05} +{"train_loss": 0.004534110426902771, "global_step": 25886, "epoch": 217, "lr": 7.156320810110801e-05} +{"train_loss": 0.004678039345890284, "global_step": 25887, "epoch": 217, "lr": 7.156120919020364e-05} +{"train_loss": 0.004506603814661503, "global_step": 25888, "epoch": 217, "lr": 7.155921023696614e-05} +{"train_loss": 0.0042396592907607555, "global_step": 25889, "epoch": 217, "lr": 7.155721124139943e-05} +{"train_loss": 0.0027810479514300823, "global_step": 25890, "epoch": 217, "lr": 7.155521220350745e-05} +{"train_loss": 0.0045206486247479916, "global_step": 25891, "epoch": 217, "lr": 7.15532131232941e-05} +{"train_loss": 0.004713120404630899, "global_step": 25892, "epoch": 217, "lr": 7.155121400076335e-05} +{"train_loss": 0.005000412464141846, "global_step": 25893, "epoch": 217, "lr": 7.154921483591905e-05} +{"train_loss": 0.003854114096611738, "global_step": 25894, "epoch": 217, "lr": 7.15472156287652e-05} +{"train_loss": 0.003615931374952197, "global_step": 25895, "epoch": 217, "lr": 7.154521637930567e-05} +{"train_loss": 0.004357687663286924, "global_step": 25896, "epoch": 217, "lr": 7.154321708754444e-05} +{"train_loss": 0.0047500221990048885, "global_step": 25897, "epoch": 217, "lr": 7.15412177534854e-05} +{"train_loss": 0.0037483705673366785, "global_step": 25898, "epoch": 217, "lr": 7.153921837713247e-05} +{"train_loss": 0.002428618958219886, "global_step": 25899, "epoch": 217, "lr": 7.153721895848957e-05} +{"train_loss": 0.005143971648067236, "global_step": 25900, "epoch": 217, "lr": 7.153521949756066e-05} +{"train_loss": 0.005509892012923956, "global_step": 25901, "epoch": 217, "lr": 7.153321999434965e-05} +{"train_loss": 0.003800874575972557, "global_step": 25902, "epoch": 217, "lr": 7.153122044886045e-05} +{"train_loss": 0.003899717703461647, "global_step": 25903, "epoch": 217, "lr": 7.152922086109702e-05} +{"train_loss": 0.003898180555552244, "global_step": 25904, "epoch": 217, "lr": 7.152722123106325e-05} +{"train_loss": 0.0030153270345181227, "global_step": 25905, "epoch": 217, "lr": 7.152522155876307e-05} +{"train_loss": 0.0035979552194476128, "global_step": 25906, "epoch": 217, "lr": 7.152322184420043e-05} +{"train_loss": 0.003047382226213813, "global_step": 25907, "epoch": 217, "lr": 7.152122208737923e-05} +{"train_loss": 0.004987041931599379, "global_step": 25908, "epoch": 217, "lr": 7.151922228830342e-05} +{"train_loss": 0.0033903911244124174, "global_step": 25909, "epoch": 217, "lr": 7.151722244697692e-05} +{"train_loss": 0.004259866196662188, "global_step": 25910, "epoch": 217, "lr": 7.151522256340366e-05} +{"train_loss": 0.005081953946501017, "global_step": 25911, "epoch": 217, "lr": 7.151322263758756e-05} +{"train_loss": 0.003977495711296797, "global_step": 25912, "epoch": 217, "lr": 7.151122266953251e-05} +{"train_loss": 0.004292648751288652, "global_step": 25913, "epoch": 217, "lr": 7.150922265924251e-05} +{"train_loss": 0.0032559139654040337, "global_step": 25914, "epoch": 217, "lr": 7.150722260672142e-05} +{"train_loss": 0.0025795279070734978, "global_step": 25915, "epoch": 217, "lr": 7.150522251197323e-05} +{"train_loss": 0.0033745865803211927, "global_step": 25916, "epoch": 217, "lr": 7.150322237500182e-05} +{"train_loss": 0.006055185105651617, "global_step": 25917, "epoch": 217, "lr": 7.150122219581113e-05} +{"train_loss": 0.0026706522330641747, "global_step": 25918, "epoch": 217, "lr": 7.149922197440507e-05} +{"train_loss": 0.0024881043937057257, "global_step": 25919, "epoch": 217, "lr": 7.14972217107876e-05} +{"train_loss": 0.005118336528539658, "global_step": 25920, "epoch": 217, "lr": 7.149522140496263e-05} +{"train_loss": 0.00458166329190135, "global_step": 25921, "epoch": 217, "lr": 7.149322105693408e-05} +{"train_loss": 0.005086633376777172, "global_step": 25922, "epoch": 217, "lr": 7.14912206667059e-05} +{"train_loss": 0.0038595946971327066, "global_step": 25923, "epoch": 217, "lr": 7.148922023428199e-05} +{"train_loss": 0.0033417819067835808, "global_step": 25924, "epoch": 217, "lr": 7.148721975966632e-05} +{"train_loss": 0.0038900866638869047, "global_step": 25925, "epoch": 217, "lr": 7.148521924286275e-05} +{"train_loss": 0.002766174031421542, "global_step": 25926, "epoch": 217, "lr": 7.148321868387527e-05} +{"train_loss": 0.004524988122284412, "global_step": 25927, "epoch": 217, "lr": 7.148121808270779e-05} +{"train_loss": 0.005048293154686689, "global_step": 25928, "epoch": 217, "lr": 7.147921743936423e-05} +{"train_loss": 0.004026986658573151, "global_step": 25929, "epoch": 217, "lr": 7.147721675384852e-05} +{"train_loss": 0.0038938571233302355, "global_step": 25930, "epoch": 217, "lr": 7.147521602616458e-05} +{"train_loss": 0.0046274540945887566, "global_step": 25931, "epoch": 217, "lr": 7.147321525631636e-05} +{"train_loss": 0.004528974648565054, "global_step": 25932, "epoch": 217, "lr": 7.147121444430778e-05} +{"train_loss": 0.0031820281874388456, "global_step": 25933, "epoch": 217, "lr": 7.146921359014274e-05} +{"train_loss": 0.0031387540511786938, "global_step": 25934, "epoch": 217, "lr": 7.146721269382522e-05} +{"train_loss": 0.004635287448763847, "global_step": 25935, "epoch": 217, "lr": 7.146521175535912e-05} +{"train_loss": 0.0032689457293599844, "global_step": 25936, "epoch": 217, "lr": 7.146321077474835e-05} +{"train_loss": 0.0025657631922513247, "global_step": 25937, "epoch": 217, "lr": 7.146120975199687e-05} +{"train_loss": 0.0025216839276254177, "global_step": 25938, "epoch": 217, "lr": 7.145920868710859e-05} +{"train_loss": 0.0030553697142750025, "global_step": 25939, "epoch": 217, "lr": 7.145720758008745e-05} +{"train_loss": 0.0024008851032704115, "global_step": 25940, "epoch": 217, "lr": 7.145520643093738e-05} +{"train_loss": 0.004192636078301848, "global_step": 25941, "epoch": 217, "lr": 7.14532052396623e-05, "val_loss": 0.012756680138409138} +{"train_loss": 0.0032168335746973753, "global_step": 25942, "epoch": 218, "lr": 7.145120400626615e-05} +{"train_loss": 0.005608865525573492, "global_step": 25943, "epoch": 218, "lr": 7.144920273075284e-05} +{"train_loss": 0.004536307416856289, "global_step": 25944, "epoch": 218, "lr": 7.144720141312633e-05} +{"train_loss": 0.0019528188277035952, "global_step": 25945, "epoch": 218, "lr": 7.14452000533905e-05} +{"train_loss": 0.003422050504013896, "global_step": 25946, "epoch": 218, "lr": 7.144319865154934e-05} +{"train_loss": 0.005903002806007862, "global_step": 25947, "epoch": 218, "lr": 7.144119720760675e-05} +{"train_loss": 0.005231388844549656, "global_step": 25948, "epoch": 218, "lr": 7.143919572156666e-05} +{"train_loss": 0.003610251471400261, "global_step": 25949, "epoch": 218, "lr": 7.143719419343298e-05} +{"train_loss": 0.002045957837253809, "global_step": 25950, "epoch": 218, "lr": 7.143519262320967e-05} +{"train_loss": 0.003455301746726036, "global_step": 25951, "epoch": 218, "lr": 7.143319101090065e-05} +{"train_loss": 0.002502649324014783, "global_step": 25952, "epoch": 218, "lr": 7.143118935650986e-05} +{"train_loss": 0.003534486051648855, "global_step": 25953, "epoch": 218, "lr": 7.14291876600412e-05} +{"train_loss": 0.003636446548625827, "global_step": 25954, "epoch": 218, "lr": 7.142718592149863e-05} +{"train_loss": 0.0023988126777112484, "global_step": 25955, "epoch": 218, "lr": 7.142518414088607e-05} +{"train_loss": 0.0025134868919849396, "global_step": 25956, "epoch": 218, "lr": 7.142318231820744e-05} +{"train_loss": 0.005590478423982859, "global_step": 25957, "epoch": 218, "lr": 7.142118045346668e-05} +{"train_loss": 0.004892304539680481, "global_step": 25958, "epoch": 218, "lr": 7.141917854666773e-05} +{"train_loss": 0.002291099401190877, "global_step": 25959, "epoch": 218, "lr": 7.141717659781452e-05} +{"train_loss": 0.0019085198873654008, "global_step": 25960, "epoch": 218, "lr": 7.141517460691097e-05} +{"train_loss": 0.0035637770779430866, "global_step": 25961, "epoch": 218, "lr": 7.1413172573961e-05} +{"train_loss": 0.004018425941467285, "global_step": 25962, "epoch": 218, "lr": 7.141117049896855e-05} +{"train_loss": 0.0021774894557893276, "global_step": 25963, "epoch": 218, "lr": 7.140916838193756e-05} +{"train_loss": 0.0033826581202447414, "global_step": 25964, "epoch": 218, "lr": 7.140716622287196e-05} +{"train_loss": 0.00473802862688899, "global_step": 25965, "epoch": 218, "lr": 7.140516402177568e-05} +{"train_loss": 0.003932304680347443, "global_step": 25966, "epoch": 218, "lr": 7.140316177865264e-05} +{"train_loss": 0.0046163140796124935, "global_step": 25967, "epoch": 218, "lr": 7.140115949350677e-05} +{"train_loss": 0.002428296720609069, "global_step": 25968, "epoch": 218, "lr": 7.139915716634202e-05} +{"train_loss": 0.004891417920589447, "global_step": 25969, "epoch": 218, "lr": 7.139715479716232e-05} +{"train_loss": 0.001622901065275073, "global_step": 25970, "epoch": 218, "lr": 7.139515238597156e-05} +{"train_loss": 0.0033119141589850187, "global_step": 25971, "epoch": 218, "lr": 7.139314993277373e-05} +{"train_loss": 0.0030408245511353016, "global_step": 25972, "epoch": 218, "lr": 7.139114743757274e-05} +{"train_loss": 0.003975235857069492, "global_step": 25973, "epoch": 218, "lr": 7.13891449003725e-05} +{"train_loss": 0.0031837881542742252, "global_step": 25974, "epoch": 218, "lr": 7.138714232117696e-05} +{"train_loss": 0.0029625752940773964, "global_step": 25975, "epoch": 218, "lr": 7.138513969999007e-05} +{"train_loss": 0.004884313326328993, "global_step": 25976, "epoch": 218, "lr": 7.138313703681572e-05} +{"train_loss": 0.004130996763706207, "global_step": 25977, "epoch": 218, "lr": 7.138113433165788e-05} +{"train_loss": 0.004236364271491766, "global_step": 25978, "epoch": 218, "lr": 7.137913158452047e-05} +{"train_loss": 0.0028323198202997446, "global_step": 25979, "epoch": 218, "lr": 7.137712879540741e-05} +{"train_loss": 0.004764265846461058, "global_step": 25980, "epoch": 218, "lr": 7.137512596432266e-05} +{"train_loss": 0.0034961053170263767, "global_step": 25981, "epoch": 218, "lr": 7.137312309127011e-05} +{"train_loss": 0.0027451091445982456, "global_step": 25982, "epoch": 218, "lr": 7.137112017625372e-05} +{"train_loss": 0.0030673618894070387, "global_step": 25983, "epoch": 218, "lr": 7.136911721927742e-05} +{"train_loss": 0.0032264133915305138, "global_step": 25984, "epoch": 218, "lr": 7.136711422034516e-05} +{"train_loss": 0.0030351222958415747, "global_step": 25985, "epoch": 218, "lr": 7.136511117946083e-05} +{"train_loss": 0.0025687599554657936, "global_step": 25986, "epoch": 218, "lr": 7.13631080966284e-05} +{"train_loss": 0.00371335307136178, "global_step": 25987, "epoch": 218, "lr": 7.136110497185178e-05} +{"train_loss": 0.004021761938929558, "global_step": 25988, "epoch": 218, "lr": 7.135910180513493e-05} +{"train_loss": 0.002668843837454915, "global_step": 25989, "epoch": 218, "lr": 7.135709859648174e-05} +{"train_loss": 0.006418550852686167, "global_step": 25990, "epoch": 218, "lr": 7.135509534589617e-05} +{"train_loss": 0.003123026806861162, "global_step": 25991, "epoch": 218, "lr": 7.135309205338216e-05} +{"train_loss": 0.001817347016185522, "global_step": 25992, "epoch": 218, "lr": 7.135108871894365e-05} +{"train_loss": 0.004518656060099602, "global_step": 25993, "epoch": 218, "lr": 7.134908534258453e-05} +{"train_loss": 0.005279695149511099, "global_step": 25994, "epoch": 218, "lr": 7.134708192430879e-05} +{"train_loss": 0.002421686192974448, "global_step": 25995, "epoch": 218, "lr": 7.134507846412032e-05} +{"train_loss": 0.0027901926077902317, "global_step": 25996, "epoch": 218, "lr": 7.134307496202308e-05} +{"train_loss": 0.0017110889311879873, "global_step": 25997, "epoch": 218, "lr": 7.134107141802097e-05} +{"train_loss": 0.0036244697403162718, "global_step": 25998, "epoch": 218, "lr": 7.133906783211796e-05} +{"train_loss": 0.00653594546020031, "global_step": 25999, "epoch": 218, "lr": 7.133706420431798e-05} +{"train_loss": 0.0034577972255647182, "global_step": 26000, "epoch": 218, "lr": 7.133506053462494e-05} +{"train_loss": 0.003160404972732067, "global_step": 26001, "epoch": 218, "lr": 7.133305682304279e-05} +{"train_loss": 0.0021140894386917353, "global_step": 26002, "epoch": 218, "lr": 7.133105306957547e-05} +{"train_loss": 0.0027757894713431597, "global_step": 26003, "epoch": 218, "lr": 7.13290492742269e-05} +{"train_loss": 0.004799104295670986, "global_step": 26004, "epoch": 218, "lr": 7.132704543700102e-05} +{"train_loss": 0.004836713429540396, "global_step": 26005, "epoch": 218, "lr": 7.132504155790177e-05} +{"train_loss": 0.002734111389145255, "global_step": 26006, "epoch": 218, "lr": 7.132303763693306e-05} +{"train_loss": 0.004128803964704275, "global_step": 26007, "epoch": 218, "lr": 7.132103367409886e-05} +{"train_loss": 0.002474697306752205, "global_step": 26008, "epoch": 218, "lr": 7.13190296694031e-05} +{"train_loss": 0.004252249840646982, "global_step": 26009, "epoch": 218, "lr": 7.131702562284969e-05} +{"train_loss": 0.004877755418419838, "global_step": 26010, "epoch": 218, "lr": 7.131502153444257e-05} +{"train_loss": 0.003916139714419842, "global_step": 26011, "epoch": 218, "lr": 7.131301740418569e-05} +{"train_loss": 0.006595062091946602, "global_step": 26012, "epoch": 218, "lr": 7.131101323208297e-05} +{"train_loss": 0.003244286635890603, "global_step": 26013, "epoch": 218, "lr": 7.130900901813837e-05} +{"train_loss": 0.0026796269230544567, "global_step": 26014, "epoch": 218, "lr": 7.130700476235579e-05} +{"train_loss": 0.003685439471155405, "global_step": 26015, "epoch": 218, "lr": 7.130500046473919e-05} +{"train_loss": 0.0051981802098453045, "global_step": 26016, "epoch": 218, "lr": 7.130299612529251e-05} +{"train_loss": 0.0038491785526275635, "global_step": 26017, "epoch": 218, "lr": 7.130099174401966e-05} +{"train_loss": 0.0034126511309295893, "global_step": 26018, "epoch": 218, "lr": 7.129898732092458e-05} +{"train_loss": 0.003165690926834941, "global_step": 26019, "epoch": 218, "lr": 7.129698285601122e-05} +{"train_loss": 0.004340201150625944, "global_step": 26020, "epoch": 218, "lr": 7.129497834928352e-05} +{"train_loss": 0.0030336775816977024, "global_step": 26021, "epoch": 218, "lr": 7.129297380074538e-05} +{"train_loss": 0.00581831531599164, "global_step": 26022, "epoch": 218, "lr": 7.129096921040078e-05} +{"train_loss": 0.003244789782911539, "global_step": 26023, "epoch": 218, "lr": 7.128896457825364e-05} +{"train_loss": 0.004722100682556629, "global_step": 26024, "epoch": 218, "lr": 7.128695990430788e-05} +{"train_loss": 0.005873784888535738, "global_step": 26025, "epoch": 218, "lr": 7.128495518856746e-05} +{"train_loss": 0.004164264537394047, "global_step": 26026, "epoch": 218, "lr": 7.12829504310363e-05} +{"train_loss": 0.002914229640737176, "global_step": 26027, "epoch": 218, "lr": 7.128094563171834e-05} +{"train_loss": 0.005596236791461706, "global_step": 26028, "epoch": 218, "lr": 7.127894079061752e-05} +{"train_loss": 0.004311654716730118, "global_step": 26029, "epoch": 218, "lr": 7.127693590773776e-05} +{"train_loss": 0.0026898582000285387, "global_step": 26030, "epoch": 218, "lr": 7.127493098308302e-05} +{"train_loss": 0.0037611783482134342, "global_step": 26031, "epoch": 218, "lr": 7.127292601665723e-05} +{"train_loss": 0.004278271459043026, "global_step": 26032, "epoch": 218, "lr": 7.12709210084643e-05} +{"train_loss": 0.0050674546509981155, "global_step": 26033, "epoch": 218, "lr": 7.126891595850821e-05} +{"train_loss": 0.004116588272154331, "global_step": 26034, "epoch": 218, "lr": 7.126691086679289e-05} +{"train_loss": 0.0020009346771985292, "global_step": 26035, "epoch": 218, "lr": 7.126490573332225e-05} +{"train_loss": 0.0033939986024051905, "global_step": 26036, "epoch": 218, "lr": 7.126290055810022e-05} +{"train_loss": 0.002437807619571686, "global_step": 26037, "epoch": 218, "lr": 7.126089534113078e-05} +{"train_loss": 0.0041159032844007015, "global_step": 26038, "epoch": 218, "lr": 7.125889008241783e-05} +{"train_loss": 0.0024833695497363806, "global_step": 26039, "epoch": 218, "lr": 7.125688478196531e-05} +{"train_loss": 0.0036222010385245085, "global_step": 26040, "epoch": 218, "lr": 7.125487943977719e-05} +{"train_loss": 0.0032862999942153692, "global_step": 26041, "epoch": 218, "lr": 7.125287405585738e-05} +{"train_loss": 0.003049749182537198, "global_step": 26042, "epoch": 218, "lr": 7.12508686302098e-05} +{"train_loss": 0.003243293846026063, "global_step": 26043, "epoch": 218, "lr": 7.124886316283844e-05} +{"train_loss": 0.0037699383683502674, "global_step": 26044, "epoch": 218, "lr": 7.12468576537472e-05} +{"train_loss": 0.0031999244820326567, "global_step": 26045, "epoch": 218, "lr": 7.124485210294002e-05} +{"train_loss": 0.006511016748845577, "global_step": 26046, "epoch": 218, "lr": 7.124284651042084e-05} +{"train_loss": 0.005290286149829626, "global_step": 26047, "epoch": 218, "lr": 7.124084087619362e-05} +{"train_loss": 0.006119112484157085, "global_step": 26048, "epoch": 218, "lr": 7.123883520026226e-05} +{"train_loss": 0.005487305577844381, "global_step": 26049, "epoch": 218, "lr": 7.12368294826307e-05} +{"train_loss": 0.004060141742229462, "global_step": 26050, "epoch": 218, "lr": 7.123482372330292e-05} +{"train_loss": 0.003164969151839614, "global_step": 26051, "epoch": 218, "lr": 7.123281792228283e-05} +{"train_loss": 0.0038694841787219048, "global_step": 26052, "epoch": 218, "lr": 7.123081207957436e-05} +{"train_loss": 0.0043160878121852875, "global_step": 26053, "epoch": 218, "lr": 7.122880619518147e-05} +{"train_loss": 0.005133324768394232, "global_step": 26054, "epoch": 218, "lr": 7.122680026910807e-05} +{"train_loss": 0.0032186461612582207, "global_step": 26055, "epoch": 218, "lr": 7.122479430135813e-05} +{"train_loss": 0.003935923334211111, "global_step": 26056, "epoch": 218, "lr": 7.122278829193557e-05} +{"train_loss": 0.0050827437080442905, "global_step": 26057, "epoch": 218, "lr": 7.122078224084434e-05} +{"train_loss": 0.003103397088125348, "global_step": 26058, "epoch": 218, "lr": 7.121877614808835e-05} +{"train_loss": 0.002612668089568615, "global_step": 26059, "epoch": 218, "lr": 7.121677001367159e-05} +{"train_loss": 0.003765403333182658, "global_step": 26060, "epoch": 218, "lr": 7.121476383759795e-05, "val_loss": 0.024028073996305466} +{"train_loss": 0.003950792830437422, "global_step": 26061, "epoch": 219, "lr": 7.121275761987139e-05} +{"train_loss": 0.005201749503612518, "global_step": 26062, "epoch": 219, "lr": 7.121075136049584e-05} +{"train_loss": 0.0036117734853178263, "global_step": 26063, "epoch": 219, "lr": 7.120874505947526e-05} +{"train_loss": 0.002010203432291746, "global_step": 26064, "epoch": 219, "lr": 7.120673871681356e-05} +{"train_loss": 0.00603058747947216, "global_step": 26065, "epoch": 219, "lr": 7.12047323325147e-05} +{"train_loss": 0.003162259701639414, "global_step": 26066, "epoch": 219, "lr": 7.120272590658262e-05} +{"train_loss": 0.0035385950468480587, "global_step": 26067, "epoch": 219, "lr": 7.120071943902125e-05} +{"train_loss": 0.0031120642088353634, "global_step": 26068, "epoch": 219, "lr": 7.119871292983453e-05} +{"train_loss": 0.0037809594068676233, "global_step": 26069, "epoch": 219, "lr": 7.11967063790264e-05} +{"train_loss": 0.004575212486088276, "global_step": 26070, "epoch": 219, "lr": 7.11946997866008e-05} +{"train_loss": 0.002986727049574256, "global_step": 26071, "epoch": 219, "lr": 7.119269315256168e-05} +{"train_loss": 0.003643640549853444, "global_step": 26072, "epoch": 219, "lr": 7.119068647691295e-05} +{"train_loss": 0.005399117711931467, "global_step": 26073, "epoch": 219, "lr": 7.118867975965859e-05} +{"train_loss": 0.0019599273800849915, "global_step": 26074, "epoch": 219, "lr": 7.118667300080253e-05} +{"train_loss": 0.002561328699812293, "global_step": 26075, "epoch": 219, "lr": 7.118466620034869e-05} +{"train_loss": 0.004387470427900553, "global_step": 26076, "epoch": 219, "lr": 7.118265935830101e-05} +{"train_loss": 0.005825872998684645, "global_step": 26077, "epoch": 219, "lr": 7.118065247466346e-05} +{"train_loss": 0.0028551709838211536, "global_step": 26078, "epoch": 219, "lr": 7.117864554943996e-05} +{"train_loss": 0.0025037347804754972, "global_step": 26079, "epoch": 219, "lr": 7.117663858263444e-05} +{"train_loss": 0.002583696274086833, "global_step": 26080, "epoch": 219, "lr": 7.117463157425086e-05} +{"train_loss": 0.0050704083405435085, "global_step": 26081, "epoch": 219, "lr": 7.117262452429314e-05} +{"train_loss": 0.0022170289885252714, "global_step": 26082, "epoch": 219, "lr": 7.117061743276525e-05} +{"train_loss": 0.005419617053121328, "global_step": 26083, "epoch": 219, "lr": 7.116861029967112e-05} +{"train_loss": 0.003662847215309739, "global_step": 26084, "epoch": 219, "lr": 7.116660312501467e-05} +{"train_loss": 0.006403443403542042, "global_step": 26085, "epoch": 219, "lr": 7.116459590879987e-05} +{"train_loss": 0.0035207357723265886, "global_step": 26086, "epoch": 219, "lr": 7.116258865103062e-05} +{"train_loss": 0.00439878785982728, "global_step": 26087, "epoch": 219, "lr": 7.116058135171091e-05} +{"train_loss": 0.005165919661521912, "global_step": 26088, "epoch": 219, "lr": 7.115857401084466e-05} +{"train_loss": 0.003554216120392084, "global_step": 26089, "epoch": 219, "lr": 7.115656662843579e-05} +{"train_loss": 0.0024501567240804434, "global_step": 26090, "epoch": 219, "lr": 7.115455920448827e-05} +{"train_loss": 0.003375845029950142, "global_step": 26091, "epoch": 219, "lr": 7.115255173900606e-05} +{"train_loss": 0.0031564508099108934, "global_step": 26092, "epoch": 219, "lr": 7.115054423199306e-05} +{"train_loss": 0.004097125492990017, "global_step": 26093, "epoch": 219, "lr": 7.11485366834532e-05} +{"train_loss": 0.0025966670364141464, "global_step": 26094, "epoch": 219, "lr": 7.114652909339048e-05} +{"train_loss": 0.0039954958483576775, "global_step": 26095, "epoch": 219, "lr": 7.114452146180879e-05} +{"train_loss": 0.003085772041231394, "global_step": 26096, "epoch": 219, "lr": 7.11425137887121e-05} +{"train_loss": 0.005363487638533115, "global_step": 26097, "epoch": 219, "lr": 7.114050607410435e-05} +{"train_loss": 0.0016274222871288657, "global_step": 26098, "epoch": 219, "lr": 7.113849831798946e-05} +{"train_loss": 0.004623908083885908, "global_step": 26099, "epoch": 219, "lr": 7.11364905203714e-05} +{"train_loss": 0.003790986957028508, "global_step": 26100, "epoch": 219, "lr": 7.113448268125408e-05} +{"train_loss": 0.005586238577961922, "global_step": 26101, "epoch": 219, "lr": 7.113247480064148e-05} +{"train_loss": 0.0023174146190285683, "global_step": 26102, "epoch": 219, "lr": 7.113046687853752e-05} +{"train_loss": 0.002972617046907544, "global_step": 26103, "epoch": 219, "lr": 7.112845891494614e-05} +{"train_loss": 0.0019928920082747936, "global_step": 26104, "epoch": 219, "lr": 7.112645090987129e-05} +{"train_loss": 0.0034177135676145554, "global_step": 26105, "epoch": 219, "lr": 7.112444286331689e-05} +{"train_loss": 0.002068624831736088, "global_step": 26106, "epoch": 219, "lr": 7.112243477528694e-05} +{"train_loss": 0.0026809528935700655, "global_step": 26107, "epoch": 219, "lr": 7.112042664578533e-05} +{"train_loss": 0.005066980607807636, "global_step": 26108, "epoch": 219, "lr": 7.111841847481602e-05} +{"train_loss": 0.004584203939884901, "global_step": 26109, "epoch": 219, "lr": 7.111641026238293e-05} +{"train_loss": 0.004277790896594524, "global_step": 26110, "epoch": 219, "lr": 7.111440200849007e-05} +{"train_loss": 0.003832680406048894, "global_step": 26111, "epoch": 219, "lr": 7.11123937131413e-05} +{"train_loss": 0.0027096932753920555, "global_step": 26112, "epoch": 219, "lr": 7.111038537634062e-05} +{"train_loss": 0.0026708568911999464, "global_step": 26113, "epoch": 219, "lr": 7.110837699809194e-05} +{"train_loss": 0.0026648463681340218, "global_step": 26114, "epoch": 219, "lr": 7.110636857839923e-05} +{"train_loss": 0.003014822956174612, "global_step": 26115, "epoch": 219, "lr": 7.110436011726641e-05} +{"train_loss": 0.002689415356144309, "global_step": 26116, "epoch": 219, "lr": 7.110235161469745e-05} +{"train_loss": 0.0030506865587085485, "global_step": 26117, "epoch": 219, "lr": 7.110034307069626e-05} +{"train_loss": 0.00399923836812377, "global_step": 26118, "epoch": 219, "lr": 7.10983344852668e-05} +{"train_loss": 0.0027457247488200665, "global_step": 26119, "epoch": 219, "lr": 7.109632585841302e-05} +{"train_loss": 0.0037104440852999687, "global_step": 26120, "epoch": 219, "lr": 7.109431719013885e-05} +{"train_loss": 0.003088607219979167, "global_step": 26121, "epoch": 219, "lr": 7.109230848044826e-05} +{"train_loss": 0.003214955562725663, "global_step": 26122, "epoch": 219, "lr": 7.109029972934516e-05} +{"train_loss": 0.00391981890425086, "global_step": 26123, "epoch": 219, "lr": 7.108829093683351e-05} +{"train_loss": 0.003095057560130954, "global_step": 26124, "epoch": 219, "lr": 7.108628210291726e-05} +{"train_loss": 0.0035172190982848406, "global_step": 26125, "epoch": 219, "lr": 7.108427322760033e-05} +{"train_loss": 0.0056903790682554245, "global_step": 26126, "epoch": 219, "lr": 7.10822643108867e-05} +{"train_loss": 0.002763758646324277, "global_step": 26127, "epoch": 219, "lr": 7.10802553527803e-05} +{"train_loss": 0.0030128376092761755, "global_step": 26128, "epoch": 219, "lr": 7.107824635328507e-05} +{"train_loss": 0.005537974648177624, "global_step": 26129, "epoch": 219, "lr": 7.107623731240497e-05} +{"train_loss": 0.0037805300671607256, "global_step": 26130, "epoch": 219, "lr": 7.10742282301439e-05} +{"train_loss": 0.003455334110185504, "global_step": 26131, "epoch": 219, "lr": 7.107221910650583e-05} +{"train_loss": 0.0030713933520019054, "global_step": 26132, "epoch": 219, "lr": 7.107020994149473e-05} +{"train_loss": 0.005209208000451326, "global_step": 26133, "epoch": 219, "lr": 7.106820073511452e-05} +{"train_loss": 0.002819273853674531, "global_step": 26134, "epoch": 219, "lr": 7.106619148736913e-05} +{"train_loss": 0.003894059220328927, "global_step": 26135, "epoch": 219, "lr": 7.106418219826255e-05} +{"train_loss": 0.0024625472724437714, "global_step": 26136, "epoch": 219, "lr": 7.106217286779868e-05} +{"train_loss": 0.0036138431169092655, "global_step": 26137, "epoch": 219, "lr": 7.10601634959815e-05} +{"train_loss": 0.0034002535976469517, "global_step": 26138, "epoch": 219, "lr": 7.105815408281492e-05} +{"train_loss": 0.005869246553629637, "global_step": 26139, "epoch": 219, "lr": 7.105614462830291e-05} +{"train_loss": 0.003761458210647106, "global_step": 26140, "epoch": 219, "lr": 7.105413513244942e-05} +{"train_loss": 0.0046378616243600845, "global_step": 26141, "epoch": 219, "lr": 7.105212559525838e-05} +{"train_loss": 0.002921204548329115, "global_step": 26142, "epoch": 219, "lr": 7.105011601673374e-05} +{"train_loss": 0.0025127967819571495, "global_step": 26143, "epoch": 219, "lr": 7.104810639687944e-05} +{"train_loss": 0.0031520077027380466, "global_step": 26144, "epoch": 219, "lr": 7.104609673569944e-05} +{"train_loss": 0.003086184849962592, "global_step": 26145, "epoch": 219, "lr": 7.104408703319767e-05} +{"train_loss": 0.002382757607847452, "global_step": 26146, "epoch": 219, "lr": 7.104207728937808e-05} +{"train_loss": 0.002252759877592325, "global_step": 26147, "epoch": 219, "lr": 7.104006750424465e-05} +{"train_loss": 0.003606767626479268, "global_step": 26148, "epoch": 219, "lr": 7.103805767780128e-05} +{"train_loss": 0.0028903901111334562, "global_step": 26149, "epoch": 219, "lr": 7.103604781005191e-05} +{"train_loss": 0.004153807647526264, "global_step": 26150, "epoch": 219, "lr": 7.103403790100052e-05} +{"train_loss": 0.0026369085535407066, "global_step": 26151, "epoch": 219, "lr": 7.103202795065105e-05} +{"train_loss": 0.0037190921138972044, "global_step": 26152, "epoch": 219, "lr": 7.103001795900744e-05} +{"train_loss": 0.0046615018509328365, "global_step": 26153, "epoch": 219, "lr": 7.102800792607363e-05} +{"train_loss": 0.0027472495567053556, "global_step": 26154, "epoch": 219, "lr": 7.102599785185356e-05} +{"train_loss": 0.0039058516267687082, "global_step": 26155, "epoch": 219, "lr": 7.102398773635121e-05} +{"train_loss": 0.0031667358707636595, "global_step": 26156, "epoch": 219, "lr": 7.10219775795705e-05} +{"train_loss": 0.003889474319294095, "global_step": 26157, "epoch": 219, "lr": 7.101996738151537e-05} +{"train_loss": 0.006214333698153496, "global_step": 26158, "epoch": 219, "lr": 7.10179571421898e-05} +{"train_loss": 0.0030676706228405237, "global_step": 26159, "epoch": 219, "lr": 7.101594686159771e-05} +{"train_loss": 0.002633193973451853, "global_step": 26160, "epoch": 219, "lr": 7.101393653974306e-05} +{"train_loss": 0.0028315528761595488, "global_step": 26161, "epoch": 219, "lr": 7.101192617662979e-05} +{"train_loss": 0.0045204078778624535, "global_step": 26162, "epoch": 219, "lr": 7.100991577226184e-05} +{"train_loss": 0.0035081137903034687, "global_step": 26163, "epoch": 219, "lr": 7.100790532664315e-05} +{"train_loss": 0.004010101314634085, "global_step": 26164, "epoch": 219, "lr": 7.10058948397777e-05} +{"train_loss": 0.002245883923023939, "global_step": 26165, "epoch": 219, "lr": 7.100388431166942e-05} +{"train_loss": 0.004046767950057983, "global_step": 26166, "epoch": 219, "lr": 7.100187374232226e-05} +{"train_loss": 0.005003714468330145, "global_step": 26167, "epoch": 219, "lr": 7.099986313174017e-05} +{"train_loss": 0.0029733891133219004, "global_step": 26168, "epoch": 219, "lr": 7.099785247992707e-05} +{"train_loss": 0.005642701871693134, "global_step": 26169, "epoch": 219, "lr": 7.099584178688693e-05} +{"train_loss": 0.003401709022000432, "global_step": 26170, "epoch": 219, "lr": 7.099383105262373e-05} +{"train_loss": 0.005388243123888969, "global_step": 26171, "epoch": 219, "lr": 7.099182027714136e-05} +{"train_loss": 0.003192615695297718, "global_step": 26172, "epoch": 219, "lr": 7.09898094604438e-05} +{"train_loss": 0.002794936764985323, "global_step": 26173, "epoch": 219, "lr": 7.098779860253499e-05} +{"train_loss": 0.0070120589807629585, "global_step": 26174, "epoch": 219, "lr": 7.098578770341889e-05} +{"train_loss": 0.0033062968868762255, "global_step": 26175, "epoch": 219, "lr": 7.098377676309942e-05} +{"train_loss": 0.002414209069684148, "global_step": 26176, "epoch": 219, "lr": 7.098176578158054e-05} +{"train_loss": 0.0028046935331076384, "global_step": 26177, "epoch": 219, "lr": 7.097975475886622e-05} +{"train_loss": 0.00637022964656353, "global_step": 26178, "epoch": 219, "lr": 7.09777436949604e-05} +{"train_loss": 0.003660410260116415, "global_step": 26179, "epoch": 219, "lr": 7.097573258986702e-05, "val_loss": 0.028310241177678108} +{"train_loss": 0.002900415565818548, "global_step": 26180, "epoch": 220, "lr": 7.097372144359002e-05} +{"train_loss": 0.00405036611482501, "global_step": 26181, "epoch": 220, "lr": 7.097171025613336e-05} +{"train_loss": 0.002615655306726694, "global_step": 26182, "epoch": 220, "lr": 7.0969699027501e-05} +{"train_loss": 0.002345879329368472, "global_step": 26183, "epoch": 220, "lr": 7.096768775769685e-05} +{"train_loss": 0.0029056216590106487, "global_step": 26184, "epoch": 220, "lr": 7.09656764467249e-05} +{"train_loss": 0.0038130490574985743, "global_step": 26185, "epoch": 220, "lr": 7.09636650945891e-05} +{"train_loss": 0.0039634318090975285, "global_step": 26186, "epoch": 220, "lr": 7.096165370129336e-05} +{"train_loss": 0.0017419314244762063, "global_step": 26187, "epoch": 220, "lr": 7.095964226684164e-05} +{"train_loss": 0.003758157603442669, "global_step": 26188, "epoch": 220, "lr": 7.095763079123793e-05} +{"train_loss": 0.005481356289237738, "global_step": 26189, "epoch": 220, "lr": 7.095561927448614e-05} +{"train_loss": 0.004323760513216257, "global_step": 26190, "epoch": 220, "lr": 7.095360771659024e-05} +{"train_loss": 0.004062403924763203, "global_step": 26191, "epoch": 220, "lr": 7.095159611755417e-05} +{"train_loss": 0.004182804375886917, "global_step": 26192, "epoch": 220, "lr": 7.094958447738187e-05} +{"train_loss": 0.003916937392205, "global_step": 26193, "epoch": 220, "lr": 7.094757279607729e-05} +{"train_loss": 0.005276781041175127, "global_step": 26194, "epoch": 220, "lr": 7.09455610736444e-05} +{"train_loss": 0.005143944174051285, "global_step": 26195, "epoch": 220, "lr": 7.094354931008714e-05} +{"train_loss": 0.002583406399935484, "global_step": 26196, "epoch": 220, "lr": 7.094153750540945e-05} +{"train_loss": 0.00502169132232666, "global_step": 26197, "epoch": 220, "lr": 7.093952565961532e-05} +{"train_loss": 0.0038222428411245346, "global_step": 26198, "epoch": 220, "lr": 7.093751377270862e-05} +{"train_loss": 0.005095270462334156, "global_step": 26199, "epoch": 220, "lr": 7.093550184469339e-05} +{"train_loss": 0.0021614183206111193, "global_step": 26200, "epoch": 220, "lr": 7.093348987557352e-05} +{"train_loss": 0.003984416369348764, "global_step": 26201, "epoch": 220, "lr": 7.093147786535296e-05} +{"train_loss": 0.0032404491212219, "global_step": 26202, "epoch": 220, "lr": 7.092946581403571e-05} +{"train_loss": 0.0033829028252512217, "global_step": 26203, "epoch": 220, "lr": 7.092745372162568e-05} +{"train_loss": 0.0037749321199953556, "global_step": 26204, "epoch": 220, "lr": 7.092544158812683e-05} +{"train_loss": 0.0027936669066548347, "global_step": 26205, "epoch": 220, "lr": 7.09234294135431e-05} +{"train_loss": 0.0042304182425141335, "global_step": 26206, "epoch": 220, "lr": 7.092141719787847e-05} +{"train_loss": 0.004502873867750168, "global_step": 26207, "epoch": 220, "lr": 7.091940494113687e-05} +{"train_loss": 0.0031878312584012747, "global_step": 26208, "epoch": 220, "lr": 7.091739264332225e-05} +{"train_loss": 0.003065240802243352, "global_step": 26209, "epoch": 220, "lr": 7.091538030443856e-05} +{"train_loss": 0.0025199116207659245, "global_step": 26210, "epoch": 220, "lr": 7.091336792448976e-05} +{"train_loss": 0.008282061666250229, "global_step": 26211, "epoch": 220, "lr": 7.091135550347979e-05} +{"train_loss": 0.0035981580149382353, "global_step": 26212, "epoch": 220, "lr": 7.090934304141261e-05} +{"train_loss": 0.0032433008309453726, "global_step": 26213, "epoch": 220, "lr": 7.090733053829218e-05} +{"train_loss": 0.004679704084992409, "global_step": 26214, "epoch": 220, "lr": 7.090531799412242e-05} +{"train_loss": 0.0034310773480683565, "global_step": 26215, "epoch": 220, "lr": 7.09033054089073e-05} +{"train_loss": 0.0037735947407782078, "global_step": 26216, "epoch": 220, "lr": 7.09012927826508e-05} +{"train_loss": 0.0038831226993352175, "global_step": 26217, "epoch": 220, "lr": 7.089928011535683e-05} +{"train_loss": 0.002983289770781994, "global_step": 26218, "epoch": 220, "lr": 7.089726740702935e-05} +{"train_loss": 0.002980278106406331, "global_step": 26219, "epoch": 220, "lr": 7.089525465767233e-05} +{"train_loss": 0.0034104855731129646, "global_step": 26220, "epoch": 220, "lr": 7.089324186728969e-05} +{"train_loss": 0.0024988327641040087, "global_step": 26221, "epoch": 220, "lr": 7.089122903588543e-05} +{"train_loss": 0.004437964875251055, "global_step": 26222, "epoch": 220, "lr": 7.088921616346346e-05} +{"train_loss": 0.0033695604652166367, "global_step": 26223, "epoch": 220, "lr": 7.088720325002773e-05} +{"train_loss": 0.004305245820432901, "global_step": 26224, "epoch": 220, "lr": 7.088519029558223e-05} +{"train_loss": 0.0030090815853327513, "global_step": 26225, "epoch": 220, "lr": 7.088317730013088e-05} +{"train_loss": 0.0027872927021235228, "global_step": 26226, "epoch": 220, "lr": 7.088116426367765e-05} +{"train_loss": 0.003170841606333852, "global_step": 26227, "epoch": 220, "lr": 7.087915118622647e-05} +{"train_loss": 0.0032681594602763653, "global_step": 26228, "epoch": 220, "lr": 7.087713806778131e-05} +{"train_loss": 0.0039093708619475365, "global_step": 26229, "epoch": 220, "lr": 7.087512490834615e-05} +{"train_loss": 0.004637344740331173, "global_step": 26230, "epoch": 220, "lr": 7.087311170792488e-05} +{"train_loss": 0.0031436055433005095, "global_step": 26231, "epoch": 220, "lr": 7.08710984665215e-05} +{"train_loss": 0.004569082520902157, "global_step": 26232, "epoch": 220, "lr": 7.086908518413994e-05} +{"train_loss": 0.004114728420972824, "global_step": 26233, "epoch": 220, "lr": 7.086707186078417e-05} +{"train_loss": 0.0021479518618434668, "global_step": 26234, "epoch": 220, "lr": 7.086505849645812e-05} +{"train_loss": 0.004574193619191647, "global_step": 26235, "epoch": 220, "lr": 7.086304509116578e-05} +{"train_loss": 0.0023826421238482, "global_step": 26236, "epoch": 220, "lr": 7.086103164491104e-05} +{"train_loss": 0.0058613126166164875, "global_step": 26237, "epoch": 220, "lr": 7.085901815769791e-05} +{"train_loss": 0.004848651587963104, "global_step": 26238, "epoch": 220, "lr": 7.085700462953034e-05} +{"train_loss": 0.0024652795400470495, "global_step": 26239, "epoch": 220, "lr": 7.085499106041225e-05} +{"train_loss": 0.003452862845733762, "global_step": 26240, "epoch": 220, "lr": 7.085297745034764e-05} +{"train_loss": 0.00436370586976409, "global_step": 26241, "epoch": 220, "lr": 7.085096379934041e-05} +{"train_loss": 0.0028788773342967033, "global_step": 26242, "epoch": 220, "lr": 7.084895010739456e-05} +{"train_loss": 0.003236685646697879, "global_step": 26243, "epoch": 220, "lr": 7.084693637451401e-05} +{"train_loss": 0.0030479980632662773, "global_step": 26244, "epoch": 220, "lr": 7.084492260070275e-05} +{"train_loss": 0.0030660650227218866, "global_step": 26245, "epoch": 220, "lr": 7.084290878596469e-05} +{"train_loss": 0.002670403104275465, "global_step": 26246, "epoch": 220, "lr": 7.08408949303038e-05} +{"train_loss": 0.004805970471352339, "global_step": 26247, "epoch": 220, "lr": 7.083888103372407e-05} +{"train_loss": 0.00409455131739378, "global_step": 26248, "epoch": 220, "lr": 7.08368670962294e-05} +{"train_loss": 0.00263252598233521, "global_step": 26249, "epoch": 220, "lr": 7.083485311782376e-05} +{"train_loss": 0.0028626362327486277, "global_step": 26250, "epoch": 220, "lr": 7.083283909851112e-05} +{"train_loss": 0.0035786861553788185, "global_step": 26251, "epoch": 220, "lr": 7.083082503829544e-05} +{"train_loss": 0.0036288700066506863, "global_step": 26252, "epoch": 220, "lr": 7.082881093718064e-05} +{"train_loss": 0.003216092474758625, "global_step": 26253, "epoch": 220, "lr": 7.08267967951707e-05} +{"train_loss": 0.0022814576514065266, "global_step": 26254, "epoch": 220, "lr": 7.082478261226958e-05} +{"train_loss": 0.003665443742647767, "global_step": 26255, "epoch": 220, "lr": 7.082276838848121e-05} +{"train_loss": 0.0033262246288359165, "global_step": 26256, "epoch": 220, "lr": 7.082075412380957e-05} +{"train_loss": 0.0020222871098667383, "global_step": 26257, "epoch": 220, "lr": 7.08187398182586e-05} +{"train_loss": 0.0024288545828312635, "global_step": 26258, "epoch": 220, "lr": 7.081672547183226e-05} +{"train_loss": 0.004339325707405806, "global_step": 26259, "epoch": 220, "lr": 7.08147110845345e-05} +{"train_loss": 0.003936649300158024, "global_step": 26260, "epoch": 220, "lr": 7.08126966563693e-05} +{"train_loss": 0.0036131558008491993, "global_step": 26261, "epoch": 220, "lr": 7.081068218734056e-05} +{"train_loss": 0.0043769050389528275, "global_step": 26262, "epoch": 220, "lr": 7.080866767745228e-05} +{"train_loss": 0.004513570573180914, "global_step": 26263, "epoch": 220, "lr": 7.080665312670841e-05} +{"train_loss": 0.004245175048708916, "global_step": 26264, "epoch": 220, "lr": 7.08046385351129e-05} +{"train_loss": 0.004740952514111996, "global_step": 26265, "epoch": 220, "lr": 7.08026239026697e-05} +{"train_loss": 0.0035253993701189756, "global_step": 26266, "epoch": 220, "lr": 7.080060922938278e-05} +{"train_loss": 0.0029259503353387117, "global_step": 26267, "epoch": 220, "lr": 7.079859451525607e-05} +{"train_loss": 0.0038539643865078688, "global_step": 26268, "epoch": 220, "lr": 7.079657976029354e-05} +{"train_loss": 0.003415032522752881, "global_step": 26269, "epoch": 220, "lr": 7.079456496449916e-05} +{"train_loss": 0.005460804328322411, "global_step": 26270, "epoch": 220, "lr": 7.079255012787688e-05} +{"train_loss": 0.00279027852229774, "global_step": 26271, "epoch": 220, "lr": 7.079053525043063e-05} +{"train_loss": 0.002631708513945341, "global_step": 26272, "epoch": 220, "lr": 7.07885203321644e-05} +{"train_loss": 0.004890613257884979, "global_step": 26273, "epoch": 220, "lr": 7.078650537308212e-05} +{"train_loss": 0.004415501840412617, "global_step": 26274, "epoch": 220, "lr": 7.078449037318777e-05} +{"train_loss": 0.004332507960498333, "global_step": 26275, "epoch": 220, "lr": 7.078247533248527e-05} +{"train_loss": 0.0025998237542808056, "global_step": 26276, "epoch": 220, "lr": 7.078046025097863e-05} +{"train_loss": 0.0031544051598757505, "global_step": 26277, "epoch": 220, "lr": 7.077844512867176e-05} +{"train_loss": 0.005656029097735882, "global_step": 26278, "epoch": 220, "lr": 7.077642996556863e-05} +{"train_loss": 0.0037687518633902073, "global_step": 26279, "epoch": 220, "lr": 7.077441476167322e-05} +{"train_loss": 0.0019808169454336166, "global_step": 26280, "epoch": 220, "lr": 7.077239951698946e-05} +{"train_loss": 0.002458657370880246, "global_step": 26281, "epoch": 220, "lr": 7.077038423152129e-05} +{"train_loss": 0.0027616184670478106, "global_step": 26282, "epoch": 220, "lr": 7.076836890527271e-05} +{"train_loss": 0.003010363318026066, "global_step": 26283, "epoch": 220, "lr": 7.076635353824765e-05} +{"train_loss": 0.002458300208672881, "global_step": 26284, "epoch": 220, "lr": 7.076433813045007e-05} +{"train_loss": 0.005220103543251753, "global_step": 26285, "epoch": 220, "lr": 7.076232268188392e-05} +{"train_loss": 0.0037757446989417076, "global_step": 26286, "epoch": 220, "lr": 7.07603071925532e-05} +{"train_loss": 0.0032921608071774244, "global_step": 26287, "epoch": 220, "lr": 7.07582916624618e-05} +{"train_loss": 0.0023531548213213682, "global_step": 26288, "epoch": 220, "lr": 7.075627609161373e-05} +{"train_loss": 0.003990811295807362, "global_step": 26289, "epoch": 220, "lr": 7.075426048001293e-05} +{"train_loss": 0.004972724709659815, "global_step": 26290, "epoch": 220, "lr": 7.075224482766337e-05} +{"train_loss": 0.003954925574362278, "global_step": 26291, "epoch": 220, "lr": 7.075022913456897e-05} +{"train_loss": 0.0031028026714920998, "global_step": 26292, "epoch": 220, "lr": 7.074821340073372e-05} +{"train_loss": 0.003549494780600071, "global_step": 26293, "epoch": 220, "lr": 7.074619762616157e-05} +{"train_loss": 0.003140257205814123, "global_step": 26294, "epoch": 220, "lr": 7.074418181085648e-05} +{"train_loss": 0.0021486743353307247, "global_step": 26295, "epoch": 220, "lr": 7.07421659548224e-05} +{"train_loss": 0.0024637661408632994, "global_step": 26296, "epoch": 220, "lr": 7.07401500580633e-05} +{"train_loss": 0.003465757705271244, "global_step": 26297, "epoch": 220, "lr": 7.073813412058311e-05} +{"train_loss": 0.003633295521414017, "global_step": 26298, "epoch": 220, "lr": 7.073611814238586e-05, "val_loss": 0.011828463524580002, "train_action_mse_error": 7.625568105140701e-05} +{"train_loss": 0.004786915611475706, "global_step": 26299, "epoch": 221, "lr": 7.073410212347541e-05} +{"train_loss": 0.004003047943115234, "global_step": 26300, "epoch": 221, "lr": 7.073208606385578e-05} +{"train_loss": 0.0030988205689936876, "global_step": 26301, "epoch": 221, "lr": 7.073006996353091e-05} +{"train_loss": 0.006825776770710945, "global_step": 26302, "epoch": 221, "lr": 7.072805382250477e-05} +{"train_loss": 0.0025880392640829086, "global_step": 26303, "epoch": 221, "lr": 7.07260376407813e-05} +{"train_loss": 0.0026809298433363438, "global_step": 26304, "epoch": 221, "lr": 7.072402141836447e-05} +{"train_loss": 0.0054206084460020065, "global_step": 26305, "epoch": 221, "lr": 7.072200515525824e-05} +{"train_loss": 0.002989837434142828, "global_step": 26306, "epoch": 221, "lr": 7.071998885146658e-05} +{"train_loss": 0.005812571384012699, "global_step": 26307, "epoch": 221, "lr": 7.071797250699343e-05} +{"train_loss": 0.003387146396562457, "global_step": 26308, "epoch": 221, "lr": 7.071595612184274e-05} +{"train_loss": 0.004079420119524002, "global_step": 26309, "epoch": 221, "lr": 7.071393969601849e-05} +{"train_loss": 0.003804693231359124, "global_step": 26310, "epoch": 221, "lr": 7.071192322952464e-05} +{"train_loss": 0.003539350815117359, "global_step": 26311, "epoch": 221, "lr": 7.070990672236515e-05} +{"train_loss": 0.005127040669322014, "global_step": 26312, "epoch": 221, "lr": 7.070789017454395e-05} +{"train_loss": 0.003660662565380335, "global_step": 26313, "epoch": 221, "lr": 7.070587358606503e-05} +{"train_loss": 0.005135332699865103, "global_step": 26314, "epoch": 221, "lr": 7.070385695693234e-05} +{"train_loss": 0.002189374528825283, "global_step": 26315, "epoch": 221, "lr": 7.070184028714984e-05} +{"train_loss": 0.004375221207737923, "global_step": 26316, "epoch": 221, "lr": 7.069982357672149e-05} +{"train_loss": 0.002650896552950144, "global_step": 26317, "epoch": 221, "lr": 7.069780682565124e-05} +{"train_loss": 0.004333834629505873, "global_step": 26318, "epoch": 221, "lr": 7.069579003394305e-05} +{"train_loss": 0.0018728837603703141, "global_step": 26319, "epoch": 221, "lr": 7.06937732016009e-05} +{"train_loss": 0.0036856275983154774, "global_step": 26320, "epoch": 221, "lr": 7.069175632862872e-05} +{"train_loss": 0.002155701396986842, "global_step": 26321, "epoch": 221, "lr": 7.068973941503049e-05} +{"train_loss": 0.0035114672500640154, "global_step": 26322, "epoch": 221, "lr": 7.06877224608102e-05} +{"train_loss": 0.00392031017690897, "global_step": 26323, "epoch": 221, "lr": 7.068570546597175e-05} +{"train_loss": 0.003317385446280241, "global_step": 26324, "epoch": 221, "lr": 7.068368843051913e-05} +{"train_loss": 0.005900127813220024, "global_step": 26325, "epoch": 221, "lr": 7.068167135445632e-05} +{"train_loss": 0.004745112266391516, "global_step": 26326, "epoch": 221, "lr": 7.067965423778721e-05} +{"train_loss": 0.004669119603931904, "global_step": 26327, "epoch": 221, "lr": 7.067763708051585e-05} +{"train_loss": 0.005504573695361614, "global_step": 26328, "epoch": 221, "lr": 7.067561988264615e-05} +{"train_loss": 0.0038262070156633854, "global_step": 26329, "epoch": 221, "lr": 7.067360264418208e-05} +{"train_loss": 0.004555799067020416, "global_step": 26330, "epoch": 221, "lr": 7.067158536512759e-05} +{"train_loss": 0.0032241838052868843, "global_step": 26331, "epoch": 221, "lr": 7.066956804548665e-05} +{"train_loss": 0.004508058074861765, "global_step": 26332, "epoch": 221, "lr": 7.066755068526322e-05} +{"train_loss": 0.004498129244893789, "global_step": 26333, "epoch": 221, "lr": 7.066553328446127e-05} +{"train_loss": 0.002137742703780532, "global_step": 26334, "epoch": 221, "lr": 7.066351584308474e-05} +{"train_loss": 0.0027746325358748436, "global_step": 26335, "epoch": 221, "lr": 7.066149836113763e-05} +{"train_loss": 0.0026747691445052624, "global_step": 26336, "epoch": 221, "lr": 7.065948083862386e-05} +{"train_loss": 0.005045333877205849, "global_step": 26337, "epoch": 221, "lr": 7.065746327554741e-05} +{"train_loss": 0.004208105616271496, "global_step": 26338, "epoch": 221, "lr": 7.065544567191222e-05} +{"train_loss": 0.004299904685467482, "global_step": 26339, "epoch": 221, "lr": 7.065342802772229e-05} +{"train_loss": 0.004133718088269234, "global_step": 26340, "epoch": 221, "lr": 7.065141034298156e-05} +{"train_loss": 0.002922439482063055, "global_step": 26341, "epoch": 221, "lr": 7.064939261769399e-05} +{"train_loss": 0.005515613127499819, "global_step": 26342, "epoch": 221, "lr": 7.064737485186354e-05} +{"train_loss": 0.004255414940416813, "global_step": 26343, "epoch": 221, "lr": 7.064535704549418e-05} +{"train_loss": 0.005909888539463282, "global_step": 26344, "epoch": 221, "lr": 7.064333919858985e-05} +{"train_loss": 0.0035197811666876078, "global_step": 26345, "epoch": 221, "lr": 7.064132131115455e-05} +{"train_loss": 0.00556869525462389, "global_step": 26346, "epoch": 221, "lr": 7.063930338319221e-05} +{"train_loss": 0.0035511204041540623, "global_step": 26347, "epoch": 221, "lr": 7.06372854147068e-05} +{"train_loss": 0.0033469824120402336, "global_step": 26348, "epoch": 221, "lr": 7.06352674057023e-05} +{"train_loss": 0.003851537825539708, "global_step": 26349, "epoch": 221, "lr": 7.063324935618265e-05} +{"train_loss": 0.003174216253682971, "global_step": 26350, "epoch": 221, "lr": 7.063123126615181e-05} +{"train_loss": 0.005304340738803148, "global_step": 26351, "epoch": 221, "lr": 7.062921313561376e-05} +{"train_loss": 0.00526368198916316, "global_step": 26352, "epoch": 221, "lr": 7.062719496457245e-05} +{"train_loss": 0.0045881071127951145, "global_step": 26353, "epoch": 221, "lr": 7.062517675303186e-05} +{"train_loss": 0.0036496887914836407, "global_step": 26354, "epoch": 221, "lr": 7.062315850099593e-05} +{"train_loss": 0.003098882269114256, "global_step": 26355, "epoch": 221, "lr": 7.062114020846861e-05} +{"train_loss": 0.004660620354115963, "global_step": 26356, "epoch": 221, "lr": 7.061912187545391e-05} +{"train_loss": 0.0032551025506109, "global_step": 26357, "epoch": 221, "lr": 7.061710350195576e-05} +{"train_loss": 0.0038999817334115505, "global_step": 26358, "epoch": 221, "lr": 7.061508508797813e-05} +{"train_loss": 0.004223390016704798, "global_step": 26359, "epoch": 221, "lr": 7.061306663352499e-05} +{"train_loss": 0.00322740594856441, "global_step": 26360, "epoch": 221, "lr": 7.061104813860029e-05} +{"train_loss": 0.003156383289024234, "global_step": 26361, "epoch": 221, "lr": 7.060902960320799e-05} +{"train_loss": 0.0032651207875460386, "global_step": 26362, "epoch": 221, "lr": 7.060701102735207e-05} +{"train_loss": 0.003596504218876362, "global_step": 26363, "epoch": 221, "lr": 7.060499241103649e-05} +{"train_loss": 0.00576822180300951, "global_step": 26364, "epoch": 221, "lr": 7.06029737542652e-05} +{"train_loss": 0.003033352317288518, "global_step": 26365, "epoch": 221, "lr": 7.060095505704217e-05} +{"train_loss": 0.003041913965716958, "global_step": 26366, "epoch": 221, "lr": 7.059893631937138e-05} +{"train_loss": 0.004467998631298542, "global_step": 26367, "epoch": 221, "lr": 7.059691754125677e-05} +{"train_loss": 0.0053500463254749775, "global_step": 26368, "epoch": 221, "lr": 7.05948987227023e-05} +{"train_loss": 0.0028273919597268105, "global_step": 26369, "epoch": 221, "lr": 7.059287986371196e-05} +{"train_loss": 0.0044850236736238, "global_step": 26370, "epoch": 221, "lr": 7.05908609642897e-05} +{"train_loss": 0.004432734102010727, "global_step": 26371, "epoch": 221, "lr": 7.058884202443948e-05} +{"train_loss": 0.003910824190825224, "global_step": 26372, "epoch": 221, "lr": 7.058682304416528e-05} +{"train_loss": 0.00456944340839982, "global_step": 26373, "epoch": 221, "lr": 7.058480402347105e-05} +{"train_loss": 0.0037088803946971893, "global_step": 26374, "epoch": 221, "lr": 7.058278496236075e-05} +{"train_loss": 0.0021399296820163727, "global_step": 26375, "epoch": 221, "lr": 7.058076586083835e-05} +{"train_loss": 0.0049635195173323154, "global_step": 26376, "epoch": 221, "lr": 7.057874671890783e-05} +{"train_loss": 0.0038285250775516033, "global_step": 26377, "epoch": 221, "lr": 7.057672753657311e-05} +{"train_loss": 0.0031679740641266108, "global_step": 26378, "epoch": 221, "lr": 7.057470831383821e-05} +{"train_loss": 0.002098226686939597, "global_step": 26379, "epoch": 221, "lr": 7.057268905070706e-05} +{"train_loss": 0.003651211503893137, "global_step": 26380, "epoch": 221, "lr": 7.057066974718364e-05} +{"train_loss": 0.004582948051393032, "global_step": 26381, "epoch": 221, "lr": 7.05686504032719e-05} +{"train_loss": 0.003434925340116024, "global_step": 26382, "epoch": 221, "lr": 7.05666310189758e-05} +{"train_loss": 0.0020767119713127613, "global_step": 26383, "epoch": 221, "lr": 7.056461159429933e-05} +{"train_loss": 0.003109396668151021, "global_step": 26384, "epoch": 221, "lr": 7.056259212924644e-05} +{"train_loss": 0.003441379638388753, "global_step": 26385, "epoch": 221, "lr": 7.05605726238211e-05} +{"train_loss": 0.006412990856915712, "global_step": 26386, "epoch": 221, "lr": 7.055855307802728e-05} +{"train_loss": 0.00380706530995667, "global_step": 26387, "epoch": 221, "lr": 7.055653349186892e-05} +{"train_loss": 0.002658835146576166, "global_step": 26388, "epoch": 221, "lr": 7.055451386535001e-05} +{"train_loss": 0.005353329703211784, "global_step": 26389, "epoch": 221, "lr": 7.05524941984745e-05} +{"train_loss": 0.002139527816325426, "global_step": 26390, "epoch": 221, "lr": 7.055047449124638e-05} +{"train_loss": 0.0026747281663119793, "global_step": 26391, "epoch": 221, "lr": 7.054845474366959e-05} +{"train_loss": 0.003955446183681488, "global_step": 26392, "epoch": 221, "lr": 7.054643495574811e-05} +{"train_loss": 0.0031913327984511852, "global_step": 26393, "epoch": 221, "lr": 7.05444151274859e-05} +{"train_loss": 0.004051712807267904, "global_step": 26394, "epoch": 221, "lr": 7.054239525888692e-05} +{"train_loss": 0.004955514334142208, "global_step": 26395, "epoch": 221, "lr": 7.054037534995514e-05} +{"train_loss": 0.006548748351633549, "global_step": 26396, "epoch": 221, "lr": 7.053835540069452e-05} +{"train_loss": 0.002956350101158023, "global_step": 26397, "epoch": 221, "lr": 7.053633541110905e-05} +{"train_loss": 0.003953470382839441, "global_step": 26398, "epoch": 221, "lr": 7.053431538120268e-05} +{"train_loss": 0.0027813303750008345, "global_step": 26399, "epoch": 221, "lr": 7.053229531097937e-05} +{"train_loss": 0.003029630519449711, "global_step": 26400, "epoch": 221, "lr": 7.053027520044309e-05} +{"train_loss": 0.002471926622092724, "global_step": 26401, "epoch": 221, "lr": 7.05282550495978e-05} +{"train_loss": 0.0033434657379984856, "global_step": 26402, "epoch": 221, "lr": 7.052623485844748e-05} +{"train_loss": 0.0034674396738409996, "global_step": 26403, "epoch": 221, "lr": 7.05242146269961e-05} +{"train_loss": 0.002873604418709874, "global_step": 26404, "epoch": 221, "lr": 7.052219435524761e-05} +{"train_loss": 0.004600583575665951, "global_step": 26405, "epoch": 221, "lr": 7.052017404320598e-05} +{"train_loss": 0.0023633278906345367, "global_step": 26406, "epoch": 221, "lr": 7.051815369087518e-05} +{"train_loss": 0.004638891201466322, "global_step": 26407, "epoch": 221, "lr": 7.051613329825919e-05} +{"train_loss": 0.0031114553567022085, "global_step": 26408, "epoch": 221, "lr": 7.051411286536195e-05} +{"train_loss": 0.001660699606873095, "global_step": 26409, "epoch": 221, "lr": 7.051209239218744e-05} +{"train_loss": 0.003957269713282585, "global_step": 26410, "epoch": 221, "lr": 7.051007187873964e-05} +{"train_loss": 0.0022240832913666964, "global_step": 26411, "epoch": 221, "lr": 7.05080513250225e-05} +{"train_loss": 0.006317845545709133, "global_step": 26412, "epoch": 221, "lr": 7.050603073103999e-05} +{"train_loss": 0.002511301776394248, "global_step": 26413, "epoch": 221, "lr": 7.05040100967961e-05} +{"train_loss": 0.004494617227464914, "global_step": 26414, "epoch": 221, "lr": 7.050198942229474e-05} +{"train_loss": 0.002191276755183935, "global_step": 26415, "epoch": 221, "lr": 7.049996870753994e-05} +{"train_loss": 0.0024093426764011383, "global_step": 26416, "epoch": 221, "lr": 7.049794795253564e-05} +{"train_loss": 0.0038372612687438226, "global_step": 26417, "epoch": 221, "lr": 7.04959271572858e-05, "val_loss": 0.021115096285939217} +{"train_loss": 0.005766018759459257, "global_step": 26418, "epoch": 222, "lr": 7.049390632179439e-05} +{"train_loss": 0.0031914717983454466, "global_step": 26419, "epoch": 222, "lr": 7.04918854460654e-05} +{"train_loss": 0.002337332349270582, "global_step": 26420, "epoch": 222, "lr": 7.048986453010276e-05} +{"train_loss": 0.002754087094217539, "global_step": 26421, "epoch": 222, "lr": 7.048784357391048e-05} +{"train_loss": 0.0043711974285542965, "global_step": 26422, "epoch": 222, "lr": 7.048582257749252e-05} +{"train_loss": 0.0030778239015489817, "global_step": 26423, "epoch": 222, "lr": 7.048380154085281e-05} +{"train_loss": 0.0030614587012678385, "global_step": 26424, "epoch": 222, "lr": 7.048178046399536e-05} +{"train_loss": 0.004001663997769356, "global_step": 26425, "epoch": 222, "lr": 7.047975934692413e-05} +{"train_loss": 0.005692091770470142, "global_step": 26426, "epoch": 222, "lr": 7.047773818964305e-05} +{"train_loss": 0.0061842468567192554, "global_step": 26427, "epoch": 222, "lr": 7.047571699215614e-05} +{"train_loss": 0.004843784961849451, "global_step": 26428, "epoch": 222, "lr": 7.047369575446735e-05} +{"train_loss": 0.004183599259704351, "global_step": 26429, "epoch": 222, "lr": 7.047167447658064e-05} +{"train_loss": 0.0028927677776664495, "global_step": 26430, "epoch": 222, "lr": 7.046965315849999e-05} +{"train_loss": 0.002149085281416774, "global_step": 26431, "epoch": 222, "lr": 7.046763180022935e-05} +{"train_loss": 0.0024280219804495573, "global_step": 26432, "epoch": 222, "lr": 7.04656104017727e-05} +{"train_loss": 0.0041639311239123344, "global_step": 26433, "epoch": 222, "lr": 7.046358896313402e-05} +{"train_loss": 0.0027421710547059774, "global_step": 26434, "epoch": 222, "lr": 7.046156748431726e-05} +{"train_loss": 0.0038220458664000034, "global_step": 26435, "epoch": 222, "lr": 7.04595459653264e-05} +{"train_loss": 0.0053182328119874, "global_step": 26436, "epoch": 222, "lr": 7.045752440616542e-05} +{"train_loss": 0.0019046771340072155, "global_step": 26437, "epoch": 222, "lr": 7.045550280683827e-05} +{"train_loss": 0.0060044764541089535, "global_step": 26438, "epoch": 222, "lr": 7.045348116734892e-05} +{"train_loss": 0.004546579904854298, "global_step": 26439, "epoch": 222, "lr": 7.045145948770135e-05} +{"train_loss": 0.0032261160667985678, "global_step": 26440, "epoch": 222, "lr": 7.044943776789952e-05} +{"train_loss": 0.0045587364584207535, "global_step": 26441, "epoch": 222, "lr": 7.044741600794741e-05} +{"train_loss": 0.0029863056261092424, "global_step": 26442, "epoch": 222, "lr": 7.044539420784899e-05} +{"train_loss": 0.0029757313895970583, "global_step": 26443, "epoch": 222, "lr": 7.044337236760821e-05} +{"train_loss": 0.0034105386584997177, "global_step": 26444, "epoch": 222, "lr": 7.044135048722905e-05} +{"train_loss": 0.003831475507467985, "global_step": 26445, "epoch": 222, "lr": 7.04393285667155e-05} +{"train_loss": 0.0025539721827954054, "global_step": 26446, "epoch": 222, "lr": 7.043730660607148e-05} +{"train_loss": 0.004344729240983725, "global_step": 26447, "epoch": 222, "lr": 7.043528460530102e-05} +{"train_loss": 0.0037122368812561035, "global_step": 26448, "epoch": 222, "lr": 7.043326256440806e-05} +{"train_loss": 0.004415004514157772, "global_step": 26449, "epoch": 222, "lr": 7.043124048339656e-05} +{"train_loss": 0.003623649710789323, "global_step": 26450, "epoch": 222, "lr": 7.042921836227051e-05} +{"train_loss": 0.004447549115866423, "global_step": 26451, "epoch": 222, "lr": 7.042719620103388e-05} +{"train_loss": 0.00461927056312561, "global_step": 26452, "epoch": 222, "lr": 7.04251739996906e-05} +{"train_loss": 0.0032536799553781748, "global_step": 26453, "epoch": 222, "lr": 7.04231517582447e-05} +{"train_loss": 0.003982397727668285, "global_step": 26454, "epoch": 222, "lr": 7.042112947670012e-05} +{"train_loss": 0.006205141078680754, "global_step": 26455, "epoch": 222, "lr": 7.041910715506084e-05} +{"train_loss": 0.00400970783084631, "global_step": 26456, "epoch": 222, "lr": 7.041708479333082e-05} +{"train_loss": 0.003909831866621971, "global_step": 26457, "epoch": 222, "lr": 7.041506239151402e-05} +{"train_loss": 0.0035965314600616693, "global_step": 26458, "epoch": 222, "lr": 7.041303994961444e-05} +{"train_loss": 0.0038015362806618214, "global_step": 26459, "epoch": 222, "lr": 7.041101746763604e-05} +{"train_loss": 0.002819216111674905, "global_step": 26460, "epoch": 222, "lr": 7.040899494558278e-05} +{"train_loss": 0.0036516059190034866, "global_step": 26461, "epoch": 222, "lr": 7.040697238345864e-05} +{"train_loss": 0.008214921690523624, "global_step": 26462, "epoch": 222, "lr": 7.040494978126759e-05} +{"train_loss": 0.0032137990929186344, "global_step": 26463, "epoch": 222, "lr": 7.040292713901361e-05} +{"train_loss": 0.002643684856593609, "global_step": 26464, "epoch": 222, "lr": 7.040090445670066e-05} +{"train_loss": 0.005256292410194874, "global_step": 26465, "epoch": 222, "lr": 7.03988817343327e-05} +{"train_loss": 0.006125027779489756, "global_step": 26466, "epoch": 222, "lr": 7.039685897191372e-05} +{"train_loss": 0.0038129391614347696, "global_step": 26467, "epoch": 222, "lr": 7.039483616944769e-05} +{"train_loss": 0.004390898160636425, "global_step": 26468, "epoch": 222, "lr": 7.03928133269386e-05} +{"train_loss": 0.004468314349651337, "global_step": 26469, "epoch": 222, "lr": 7.039079044439037e-05} +{"train_loss": 0.004187293350696564, "global_step": 26470, "epoch": 222, "lr": 7.038876752180699e-05} +{"train_loss": 0.004781718365848064, "global_step": 26471, "epoch": 222, "lr": 7.038674455919247e-05} +{"train_loss": 0.003417614381760359, "global_step": 26472, "epoch": 222, "lr": 7.038472155655075e-05} +{"train_loss": 0.005047081969678402, "global_step": 26473, "epoch": 222, "lr": 7.038269851388582e-05} +{"train_loss": 0.004141161218285561, "global_step": 26474, "epoch": 222, "lr": 7.038067543120161e-05} +{"train_loss": 0.003705833340063691, "global_step": 26475, "epoch": 222, "lr": 7.037865230850213e-05} +{"train_loss": 0.0026175782550126314, "global_step": 26476, "epoch": 222, "lr": 7.037662914579135e-05} +{"train_loss": 0.005161572247743607, "global_step": 26477, "epoch": 222, "lr": 7.037460594307324e-05} +{"train_loss": 0.004722321406006813, "global_step": 26478, "epoch": 222, "lr": 7.037258270035177e-05} +{"train_loss": 0.0026523652486503124, "global_step": 26479, "epoch": 222, "lr": 7.03705594176309e-05} +{"train_loss": 0.004184774123132229, "global_step": 26480, "epoch": 222, "lr": 7.036853609491461e-05} +{"train_loss": 0.004447250161319971, "global_step": 26481, "epoch": 222, "lr": 7.036651273220688e-05} +{"train_loss": 0.004201832693070173, "global_step": 26482, "epoch": 222, "lr": 7.036448932951168e-05} +{"train_loss": 0.0056653390638530254, "global_step": 26483, "epoch": 222, "lr": 7.036246588683298e-05} +{"train_loss": 0.004538669716566801, "global_step": 26484, "epoch": 222, "lr": 7.036044240417475e-05} +{"train_loss": 0.0020230163354426622, "global_step": 26485, "epoch": 222, "lr": 7.035841888154096e-05} +{"train_loss": 0.0026664086617529392, "global_step": 26486, "epoch": 222, "lr": 7.03563953189356e-05} +{"train_loss": 0.004506246652454138, "global_step": 26487, "epoch": 222, "lr": 7.035437171636263e-05} +{"train_loss": 0.005515307653695345, "global_step": 26488, "epoch": 222, "lr": 7.035234807382604e-05} +{"train_loss": 0.005163619760423899, "global_step": 26489, "epoch": 222, "lr": 7.035032439132977e-05} +{"train_loss": 0.002881463849917054, "global_step": 26490, "epoch": 222, "lr": 7.034830066887781e-05} +{"train_loss": 0.004208166152238846, "global_step": 26491, "epoch": 222, "lr": 7.034627690647416e-05} +{"train_loss": 0.0029782154597342014, "global_step": 26492, "epoch": 222, "lr": 7.034425310412275e-05} +{"train_loss": 0.0019116956973448396, "global_step": 26493, "epoch": 222, "lr": 7.034222926182758e-05} +{"train_loss": 0.0030124669428914785, "global_step": 26494, "epoch": 222, "lr": 7.03402053795926e-05} +{"train_loss": 0.007324104197323322, "global_step": 26495, "epoch": 222, "lr": 7.033818145742182e-05} +{"train_loss": 0.0030851690098643303, "global_step": 26496, "epoch": 222, "lr": 7.033615749531918e-05} +{"train_loss": 0.00362949725240469, "global_step": 26497, "epoch": 222, "lr": 7.033413349328867e-05} +{"train_loss": 0.003185857553035021, "global_step": 26498, "epoch": 222, "lr": 7.033210945133427e-05} +{"train_loss": 0.005169488023966551, "global_step": 26499, "epoch": 222, "lr": 7.033008536945994e-05} +{"train_loss": 0.0049294657073915005, "global_step": 26500, "epoch": 222, "lr": 7.032806124766965e-05} +{"train_loss": 0.0032461185473948717, "global_step": 26501, "epoch": 222, "lr": 7.032603708596738e-05} +{"train_loss": 0.002985255094245076, "global_step": 26502, "epoch": 222, "lr": 7.032401288435713e-05} +{"train_loss": 0.003997921943664551, "global_step": 26503, "epoch": 222, "lr": 7.032198864284282e-05} +{"train_loss": 0.003593516768887639, "global_step": 26504, "epoch": 222, "lr": 7.03199643614285e-05} +{"train_loss": 0.003371936036273837, "global_step": 26505, "epoch": 222, "lr": 7.031794004011808e-05} +{"train_loss": 0.003047399688512087, "global_step": 26506, "epoch": 222, "lr": 7.031591567891555e-05} +{"train_loss": 0.004418998956680298, "global_step": 26507, "epoch": 222, "lr": 7.031389127782489e-05} +{"train_loss": 0.0026807147078216076, "global_step": 26508, "epoch": 222, "lr": 7.031186683685009e-05} +{"train_loss": 0.0028675184585154057, "global_step": 26509, "epoch": 222, "lr": 7.030984235599509e-05} +{"train_loss": 0.003923631738871336, "global_step": 26510, "epoch": 222, "lr": 7.030781783526388e-05} +{"train_loss": 0.0018893713131546974, "global_step": 26511, "epoch": 222, "lr": 7.030579327466046e-05} +{"train_loss": 0.0037509165704250336, "global_step": 26512, "epoch": 222, "lr": 7.030376867418879e-05} +{"train_loss": 0.0027368038427084684, "global_step": 26513, "epoch": 222, "lr": 7.030174403385282e-05} +{"train_loss": 0.0028008962981402874, "global_step": 26514, "epoch": 222, "lr": 7.029971935365654e-05} +{"train_loss": 0.004716654308140278, "global_step": 26515, "epoch": 222, "lr": 7.029769463360394e-05} +{"train_loss": 0.003942382987588644, "global_step": 26516, "epoch": 222, "lr": 7.0295669873699e-05} +{"train_loss": 0.0023742164485156536, "global_step": 26517, "epoch": 222, "lr": 7.029364507394565e-05} +{"train_loss": 0.0033580707386136055, "global_step": 26518, "epoch": 222, "lr": 7.029162023434791e-05} +{"train_loss": 0.0018262004014104605, "global_step": 26519, "epoch": 222, "lr": 7.028959535490974e-05} +{"train_loss": 0.002909249858930707, "global_step": 26520, "epoch": 222, "lr": 7.028757043563512e-05} +{"train_loss": 0.003059349488466978, "global_step": 26521, "epoch": 222, "lr": 7.028554547652801e-05} +{"train_loss": 0.005439384374767542, "global_step": 26522, "epoch": 222, "lr": 7.028352047759243e-05} +{"train_loss": 0.002423669211566448, "global_step": 26523, "epoch": 222, "lr": 7.028149543883231e-05} +{"train_loss": 0.002325782086700201, "global_step": 26524, "epoch": 222, "lr": 7.027947036025162e-05} +{"train_loss": 0.0024114204570651054, "global_step": 26525, "epoch": 222, "lr": 7.027744524185438e-05} +{"train_loss": 0.005633768625557423, "global_step": 26526, "epoch": 222, "lr": 7.027542008364453e-05} +{"train_loss": 0.002776809735223651, "global_step": 26527, "epoch": 222, "lr": 7.027339488562607e-05} +{"train_loss": 0.0034726152662187815, "global_step": 26528, "epoch": 222, "lr": 7.027136964780296e-05} +{"train_loss": 0.003933848813176155, "global_step": 26529, "epoch": 222, "lr": 7.026934437017918e-05} +{"train_loss": 0.002699786564335227, "global_step": 26530, "epoch": 222, "lr": 7.026731905275872e-05} +{"train_loss": 0.0061654760502278805, "global_step": 26531, "epoch": 222, "lr": 7.026529369554552e-05} +{"train_loss": 0.0018063108436763287, "global_step": 26532, "epoch": 222, "lr": 7.02632682985436e-05} +{"train_loss": 0.003145905677229166, "global_step": 26533, "epoch": 222, "lr": 7.02612428617569e-05} +{"train_loss": 0.002163232769817114, "global_step": 26534, "epoch": 222, "lr": 7.025921738518942e-05} +{"train_loss": 0.00446266820654273, "global_step": 26535, "epoch": 222, "lr": 7.025719186884514e-05} +{"train_loss": 0.0038138156386968844, "global_step": 26536, "epoch": 222, "lr": 7.025516631272803e-05, "val_loss": 0.017493408173322678} +{"train_loss": 0.0050799660384655, "global_step": 26537, "epoch": 223, "lr": 7.025314071684206e-05} +{"train_loss": 0.003773254342377186, "global_step": 26538, "epoch": 223, "lr": 7.02511150811912e-05} +{"train_loss": 0.0022343834862113, "global_step": 26539, "epoch": 223, "lr": 7.024908940577945e-05} +{"train_loss": 0.0052292621694505215, "global_step": 26540, "epoch": 223, "lr": 7.024706369061078e-05} +{"train_loss": 0.0019815254490822554, "global_step": 26541, "epoch": 223, "lr": 7.024503793568915e-05} +{"train_loss": 0.0017412914894521236, "global_step": 26542, "epoch": 223, "lr": 7.024301214101858e-05} +{"train_loss": 0.002834279788658023, "global_step": 26543, "epoch": 223, "lr": 7.024098630660299e-05} +{"train_loss": 0.004036447964608669, "global_step": 26544, "epoch": 223, "lr": 7.02389604324464e-05} +{"train_loss": 0.003482008818536997, "global_step": 26545, "epoch": 223, "lr": 7.023693451855276e-05} +{"train_loss": 0.0054541281424462795, "global_step": 26546, "epoch": 223, "lr": 7.023490856492607e-05} +{"train_loss": 0.002607041737064719, "global_step": 26547, "epoch": 223, "lr": 7.02328825715703e-05} +{"train_loss": 0.0035118521191179752, "global_step": 26548, "epoch": 223, "lr": 7.023085653848944e-05} +{"train_loss": 0.004894486628472805, "global_step": 26549, "epoch": 223, "lr": 7.022883046568742e-05} +{"train_loss": 0.0030295562464743853, "global_step": 26550, "epoch": 223, "lr": 7.022680435316826e-05} +{"train_loss": 0.003044682089239359, "global_step": 26551, "epoch": 223, "lr": 7.022477820093595e-05} +{"train_loss": 0.002732188208028674, "global_step": 26552, "epoch": 223, "lr": 7.022275200899444e-05} +{"train_loss": 0.00430133193731308, "global_step": 26553, "epoch": 223, "lr": 7.022072577734771e-05} +{"train_loss": 0.005746669601649046, "global_step": 26554, "epoch": 223, "lr": 7.021869950599978e-05} +{"train_loss": 0.0026861215010285378, "global_step": 26555, "epoch": 223, "lr": 7.021667319495455e-05} +{"train_loss": 0.0035622850991785526, "global_step": 26556, "epoch": 223, "lr": 7.021464684421606e-05} +{"train_loss": 0.003820869605988264, "global_step": 26557, "epoch": 223, "lr": 7.021262045378827e-05} +{"train_loss": 0.0016178378136828542, "global_step": 26558, "epoch": 223, "lr": 7.021059402367516e-05} +{"train_loss": 0.0024244075175374746, "global_step": 26559, "epoch": 223, "lr": 7.02085675538807e-05} +{"train_loss": 0.003957787994295359, "global_step": 26560, "epoch": 223, "lr": 7.020654104440889e-05} +{"train_loss": 0.005748318042606115, "global_step": 26561, "epoch": 223, "lr": 7.020451449526369e-05} +{"train_loss": 0.002038233680650592, "global_step": 26562, "epoch": 223, "lr": 7.020248790644908e-05} +{"train_loss": 0.0029959462117403746, "global_step": 26563, "epoch": 223, "lr": 7.020046127796904e-05} +{"train_loss": 0.004094944801181555, "global_step": 26564, "epoch": 223, "lr": 7.019843460982756e-05} +{"train_loss": 0.0020942611154168844, "global_step": 26565, "epoch": 223, "lr": 7.019640790202862e-05} +{"train_loss": 0.006904686335474253, "global_step": 26566, "epoch": 223, "lr": 7.019438115457618e-05} +{"train_loss": 0.0028445147909224033, "global_step": 26567, "epoch": 223, "lr": 7.019235436747422e-05} +{"train_loss": 0.0034415144473314285, "global_step": 26568, "epoch": 223, "lr": 7.019032754072674e-05} +{"train_loss": 0.004435038194060326, "global_step": 26569, "epoch": 223, "lr": 7.018830067433771e-05} +{"train_loss": 0.0032267377246171236, "global_step": 26570, "epoch": 223, "lr": 7.01862737683111e-05} +{"train_loss": 0.003424470778554678, "global_step": 26571, "epoch": 223, "lr": 7.01842468226509e-05} +{"train_loss": 0.0037419856525957584, "global_step": 26572, "epoch": 223, "lr": 7.01822198373611e-05} +{"train_loss": 0.003980393987149, "global_step": 26573, "epoch": 223, "lr": 7.018019281244567e-05} +{"train_loss": 0.0028886275831609964, "global_step": 26574, "epoch": 223, "lr": 7.017816574790858e-05} +{"train_loss": 0.0030194048304110765, "global_step": 26575, "epoch": 223, "lr": 7.017613864375381e-05} +{"train_loss": 0.005098646506667137, "global_step": 26576, "epoch": 223, "lr": 7.017411149998533e-05} +{"train_loss": 0.003258641343563795, "global_step": 26577, "epoch": 223, "lr": 7.017208431660718e-05} +{"train_loss": 0.003409755416214466, "global_step": 26578, "epoch": 223, "lr": 7.017005709362327e-05} +{"train_loss": 0.0032899104990065098, "global_step": 26579, "epoch": 223, "lr": 7.016802983103763e-05} +{"train_loss": 0.003183916909620166, "global_step": 26580, "epoch": 223, "lr": 7.016600252885419e-05} +{"train_loss": 0.004486898425966501, "global_step": 26581, "epoch": 223, "lr": 7.016397518707698e-05} +{"train_loss": 0.003134401747956872, "global_step": 26582, "epoch": 223, "lr": 7.016194780570996e-05} +{"train_loss": 0.003490978851914406, "global_step": 26583, "epoch": 223, "lr": 7.015992038475709e-05} +{"train_loss": 0.0033959115389734507, "global_step": 26584, "epoch": 223, "lr": 7.015789292422237e-05} +{"train_loss": 0.002937918296083808, "global_step": 26585, "epoch": 223, "lr": 7.015586542410978e-05} +{"train_loss": 0.0031098625622689724, "global_step": 26586, "epoch": 223, "lr": 7.015383788442332e-05} +{"train_loss": 0.004579526372253895, "global_step": 26587, "epoch": 223, "lr": 7.015181030516696e-05} +{"train_loss": 0.0018503620522096753, "global_step": 26588, "epoch": 223, "lr": 7.014978268634465e-05} +{"train_loss": 0.002726478036493063, "global_step": 26589, "epoch": 223, "lr": 7.014775502796039e-05} +{"train_loss": 0.002570193959400058, "global_step": 26590, "epoch": 223, "lr": 7.014572733001818e-05} +{"train_loss": 0.0028252070769667625, "global_step": 26591, "epoch": 223, "lr": 7.014369959252198e-05} +{"train_loss": 0.004256135784089565, "global_step": 26592, "epoch": 223, "lr": 7.01416718154758e-05} +{"train_loss": 0.0038429873529821634, "global_step": 26593, "epoch": 223, "lr": 7.013964399888357e-05} +{"train_loss": 0.00547401187941432, "global_step": 26594, "epoch": 223, "lr": 7.013761614274931e-05} +{"train_loss": 0.003166200825944543, "global_step": 26595, "epoch": 223, "lr": 7.0135588247077e-05} +{"train_loss": 0.003333748783916235, "global_step": 26596, "epoch": 223, "lr": 7.01335603118706e-05} +{"train_loss": 0.004655321128666401, "global_step": 26597, "epoch": 223, "lr": 7.013153233713411e-05} +{"train_loss": 0.0022480932530015707, "global_step": 26598, "epoch": 223, "lr": 7.012950432287151e-05} +{"train_loss": 0.0029049308504909277, "global_step": 26599, "epoch": 223, "lr": 7.012747626908679e-05} +{"train_loss": 0.004433941096067429, "global_step": 26600, "epoch": 223, "lr": 7.01254481757839e-05} +{"train_loss": 0.0017374721355736256, "global_step": 26601, "epoch": 223, "lr": 7.012342004296686e-05} +{"train_loss": 0.0022584267426282167, "global_step": 26602, "epoch": 223, "lr": 7.012139187063962e-05} +{"train_loss": 0.002489620354026556, "global_step": 26603, "epoch": 223, "lr": 7.011936365880618e-05} +{"train_loss": 0.0024393878411501646, "global_step": 26604, "epoch": 223, "lr": 7.011733540747053e-05} +{"train_loss": 0.003921689465641975, "global_step": 26605, "epoch": 223, "lr": 7.011530711663664e-05} +{"train_loss": 0.002379844430834055, "global_step": 26606, "epoch": 223, "lr": 7.011327878630849e-05} +{"train_loss": 0.002506745047867298, "global_step": 26607, "epoch": 223, "lr": 7.011125041649005e-05} +{"train_loss": 0.0036407369188964367, "global_step": 26608, "epoch": 223, "lr": 7.010922200718534e-05} +{"train_loss": 0.0030201307963579893, "global_step": 26609, "epoch": 223, "lr": 7.010719355839831e-05} +{"train_loss": 0.002747380407527089, "global_step": 26610, "epoch": 223, "lr": 7.010516507013296e-05} +{"train_loss": 0.0030132506508380175, "global_step": 26611, "epoch": 223, "lr": 7.010313654239327e-05} +{"train_loss": 0.00202648201957345, "global_step": 26612, "epoch": 223, "lr": 7.010110797518321e-05} +{"train_loss": 0.004969590809196234, "global_step": 26613, "epoch": 223, "lr": 7.009907936850677e-05} +{"train_loss": 0.004246766213327646, "global_step": 26614, "epoch": 223, "lr": 7.009705072236795e-05} +{"train_loss": 0.003633651416748762, "global_step": 26615, "epoch": 223, "lr": 7.00950220367707e-05} +{"train_loss": 0.002999757183715701, "global_step": 26616, "epoch": 223, "lr": 7.009299331171902e-05} +{"train_loss": 0.0017747707897797227, "global_step": 26617, "epoch": 223, "lr": 7.009096454721689e-05} +{"train_loss": 0.002703380538150668, "global_step": 26618, "epoch": 223, "lr": 7.008893574326831e-05} +{"train_loss": 0.003820478217676282, "global_step": 26619, "epoch": 223, "lr": 7.008690689987726e-05} +{"train_loss": 0.005195974837988615, "global_step": 26620, "epoch": 223, "lr": 7.00848780170477e-05} +{"train_loss": 0.002120277378708124, "global_step": 26621, "epoch": 223, "lr": 7.008284909478363e-05} +{"train_loss": 0.0038562710396945477, "global_step": 26622, "epoch": 223, "lr": 7.008082013308902e-05} +{"train_loss": 0.004161134362220764, "global_step": 26623, "epoch": 223, "lr": 7.00787911319679e-05} +{"train_loss": 0.0035462502855807543, "global_step": 26624, "epoch": 223, "lr": 7.00767620914242e-05} +{"train_loss": 0.001709287753328681, "global_step": 26625, "epoch": 223, "lr": 7.00747330114619e-05} +{"train_loss": 0.0015129846287891269, "global_step": 26626, "epoch": 223, "lr": 7.007270389208503e-05} +{"train_loss": 0.0030032030772417784, "global_step": 26627, "epoch": 223, "lr": 7.007067473329755e-05} +{"train_loss": 0.004138217307627201, "global_step": 26628, "epoch": 223, "lr": 7.006864553510343e-05} +{"train_loss": 0.0039223176427185535, "global_step": 26629, "epoch": 223, "lr": 7.00666162975067e-05} +{"train_loss": 0.005640826653689146, "global_step": 26630, "epoch": 223, "lr": 7.006458702051129e-05} +{"train_loss": 0.0025680544786155224, "global_step": 26631, "epoch": 223, "lr": 7.006255770412121e-05} +{"train_loss": 0.002674740506336093, "global_step": 26632, "epoch": 223, "lr": 7.006052834834044e-05} +{"train_loss": 0.0029981110710650682, "global_step": 26633, "epoch": 223, "lr": 7.005849895317295e-05} +{"train_loss": 0.004015768878161907, "global_step": 26634, "epoch": 223, "lr": 7.005646951862276e-05} +{"train_loss": 0.004278466105461121, "global_step": 26635, "epoch": 223, "lr": 7.005444004469383e-05} +{"train_loss": 0.003420718712732196, "global_step": 26636, "epoch": 223, "lr": 7.005241053139016e-05} +{"train_loss": 0.0027204141952097416, "global_step": 26637, "epoch": 223, "lr": 7.005038097871572e-05} +{"train_loss": 0.0026464066468179226, "global_step": 26638, "epoch": 223, "lr": 7.004835138667448e-05} +{"train_loss": 0.003681698814034462, "global_step": 26639, "epoch": 223, "lr": 7.004632175527046e-05} +{"train_loss": 0.0035220198333263397, "global_step": 26640, "epoch": 223, "lr": 7.004429208450762e-05} +{"train_loss": 0.004690973088145256, "global_step": 26641, "epoch": 223, "lr": 7.004226237438996e-05} +{"train_loss": 0.002841467270627618, "global_step": 26642, "epoch": 223, "lr": 7.004023262492148e-05} +{"train_loss": 0.002488057129085064, "global_step": 26643, "epoch": 223, "lr": 7.003820283610612e-05} +{"train_loss": 0.004002789501100779, "global_step": 26644, "epoch": 223, "lr": 7.00361730079479e-05} +{"train_loss": 0.003560359124094248, "global_step": 26645, "epoch": 223, "lr": 7.003414314045077e-05} +{"train_loss": 0.0035825043451040983, "global_step": 26646, "epoch": 223, "lr": 7.003211323361875e-05} +{"train_loss": 0.0038362089544534683, "global_step": 26647, "epoch": 223, "lr": 7.003008328745584e-05} +{"train_loss": 0.002779454691335559, "global_step": 26648, "epoch": 223, "lr": 7.002805330196598e-05} +{"train_loss": 0.0043568797409534454, "global_step": 26649, "epoch": 223, "lr": 7.002602327715318e-05} +{"train_loss": 0.004578298423439264, "global_step": 26650, "epoch": 223, "lr": 7.002399321302142e-05} +{"train_loss": 0.003946381621062756, "global_step": 26651, "epoch": 223, "lr": 7.002196310957469e-05} +{"train_loss": 0.0044517116621136665, "global_step": 26652, "epoch": 223, "lr": 7.001993296681698e-05} +{"train_loss": 0.003053162945434451, "global_step": 26653, "epoch": 223, "lr": 7.001790278475226e-05} +{"train_loss": 0.0044126384891569614, "global_step": 26654, "epoch": 223, "lr": 7.001587256338454e-05} +{"train_loss": 0.0034495793956042338, "global_step": 26655, "epoch": 223, "lr": 7.00138423027178e-05, "val_loss": 0.023790739476680756} +{"train_loss": 0.00544504402205348, "global_step": 26656, "epoch": 224, "lr": 7.0011812002756e-05} +{"train_loss": 0.0022401604801416397, "global_step": 26657, "epoch": 224, "lr": 7.000978166350316e-05} +{"train_loss": 0.002874844940379262, "global_step": 26658, "epoch": 224, "lr": 7.000775128496325e-05} +{"train_loss": 0.0022749188356101513, "global_step": 26659, "epoch": 224, "lr": 7.000572086714024e-05} +{"train_loss": 0.0039747050032019615, "global_step": 26660, "epoch": 224, "lr": 7.000369041003814e-05} +{"train_loss": 0.002518139546737075, "global_step": 26661, "epoch": 224, "lr": 7.000165991366094e-05} +{"train_loss": 0.0040728929452598095, "global_step": 26662, "epoch": 224, "lr": 6.999962937801262e-05} +{"train_loss": 0.004054351709783077, "global_step": 26663, "epoch": 224, "lr": 6.999759880309716e-05} +{"train_loss": 0.0038976245559751987, "global_step": 26664, "epoch": 224, "lr": 6.999556818891855e-05} +{"train_loss": 0.0041259038262069225, "global_step": 26665, "epoch": 224, "lr": 6.999353753548077e-05} +{"train_loss": 0.002530932193621993, "global_step": 26666, "epoch": 224, "lr": 6.999150684278782e-05} +{"train_loss": 0.00252537801861763, "global_step": 26667, "epoch": 224, "lr": 6.998947611084369e-05} +{"train_loss": 0.0028679233510047197, "global_step": 26668, "epoch": 224, "lr": 6.998744533965234e-05} +{"train_loss": 0.0035200410056859255, "global_step": 26669, "epoch": 224, "lr": 6.99854145292178e-05} +{"train_loss": 0.003591751679778099, "global_step": 26670, "epoch": 224, "lr": 6.998338367954403e-05} +{"train_loss": 0.003227346809580922, "global_step": 26671, "epoch": 224, "lr": 6.9981352790635e-05} +{"train_loss": 0.0032913601025938988, "global_step": 26672, "epoch": 224, "lr": 6.997932186249473e-05} +{"train_loss": 0.003241474274545908, "global_step": 26673, "epoch": 224, "lr": 6.997729089512721e-05} +{"train_loss": 0.002718562725931406, "global_step": 26674, "epoch": 224, "lr": 6.99752598885364e-05} +{"train_loss": 0.003811394330114126, "global_step": 26675, "epoch": 224, "lr": 6.997322884272632e-05} +{"train_loss": 0.004428934305906296, "global_step": 26676, "epoch": 224, "lr": 6.997119775770092e-05} +{"train_loss": 0.002955275122076273, "global_step": 26677, "epoch": 224, "lr": 6.99691666334642e-05} +{"train_loss": 0.0037325615994632244, "global_step": 26678, "epoch": 224, "lr": 6.996713547002016e-05} +{"train_loss": 0.004287426825612783, "global_step": 26679, "epoch": 224, "lr": 6.99651042673728e-05} +{"train_loss": 0.004657267592847347, "global_step": 26680, "epoch": 224, "lr": 6.996307302552608e-05} +{"train_loss": 0.005923419259488583, "global_step": 26681, "epoch": 224, "lr": 6.996104174448398e-05} +{"train_loss": 0.004298959393054247, "global_step": 26682, "epoch": 224, "lr": 6.995901042425053e-05} +{"train_loss": 0.002627498470246792, "global_step": 26683, "epoch": 224, "lr": 6.995697906482969e-05} +{"train_loss": 0.0036142724566161633, "global_step": 26684, "epoch": 224, "lr": 6.995494766622544e-05} +{"train_loss": 0.001940157380886376, "global_step": 26685, "epoch": 224, "lr": 6.99529162284418e-05} +{"train_loss": 0.0020842356607317924, "global_step": 26686, "epoch": 224, "lr": 6.995088475148275e-05} +{"train_loss": 0.004210208542644978, "global_step": 26687, "epoch": 224, "lr": 6.994885323535225e-05} +{"train_loss": 0.0029272602405399084, "global_step": 26688, "epoch": 224, "lr": 6.99468216800543e-05} +{"train_loss": 0.0035621952265501022, "global_step": 26689, "epoch": 224, "lr": 6.994479008559293e-05} +{"train_loss": 0.0037010484375059605, "global_step": 26690, "epoch": 224, "lr": 6.994275845197207e-05} +{"train_loss": 0.00307781295850873, "global_step": 26691, "epoch": 224, "lr": 6.994072677919573e-05} +{"train_loss": 0.0031787280458956957, "global_step": 26692, "epoch": 224, "lr": 6.993869506726792e-05} +{"train_loss": 0.0031989298295229673, "global_step": 26693, "epoch": 224, "lr": 6.993666331619261e-05} +{"train_loss": 0.00395658053457737, "global_step": 26694, "epoch": 224, "lr": 6.99346315259738e-05} +{"train_loss": 0.003677132073789835, "global_step": 26695, "epoch": 224, "lr": 6.993259969661544e-05} +{"train_loss": 0.0033602940384298563, "global_step": 26696, "epoch": 224, "lr": 6.993056782812158e-05} +{"train_loss": 0.0034480802714824677, "global_step": 26697, "epoch": 224, "lr": 6.992853592049616e-05} +{"train_loss": 0.005903781391680241, "global_step": 26698, "epoch": 224, "lr": 6.992650397374318e-05} +{"train_loss": 0.0044657508842647076, "global_step": 26699, "epoch": 224, "lr": 6.992447198786665e-05} +{"train_loss": 0.0027021325659006834, "global_step": 26700, "epoch": 224, "lr": 6.992243996287055e-05} +{"train_loss": 0.004486876539885998, "global_step": 26701, "epoch": 224, "lr": 6.992040789875887e-05} +{"train_loss": 0.0028911989647895098, "global_step": 26702, "epoch": 224, "lr": 6.99183757955356e-05} +{"train_loss": 0.0038494134787470102, "global_step": 26703, "epoch": 224, "lr": 6.991634365320473e-05} +{"train_loss": 0.002810008591040969, "global_step": 26704, "epoch": 224, "lr": 6.991431147177023e-05} +{"train_loss": 0.005940005648881197, "global_step": 26705, "epoch": 224, "lr": 6.991227925123614e-05} +{"train_loss": 0.005974696483463049, "global_step": 26706, "epoch": 224, "lr": 6.99102469916064e-05} +{"train_loss": 0.004657444544136524, "global_step": 26707, "epoch": 224, "lr": 6.990821469288499e-05} +{"train_loss": 0.005195794627070427, "global_step": 26708, "epoch": 224, "lr": 6.990618235507595e-05} +{"train_loss": 0.0036832625046372414, "global_step": 26709, "epoch": 224, "lr": 6.990414997818325e-05} +{"train_loss": 0.0036461935378611088, "global_step": 26710, "epoch": 224, "lr": 6.990211756221088e-05} +{"train_loss": 0.0024035025853663683, "global_step": 26711, "epoch": 224, "lr": 6.990008510716283e-05} +{"train_loss": 0.004315750207751989, "global_step": 26712, "epoch": 224, "lr": 6.989805261304307e-05} +{"train_loss": 0.003343099495396018, "global_step": 26713, "epoch": 224, "lr": 6.989602007985563e-05} +{"train_loss": 0.002839842112734914, "global_step": 26714, "epoch": 224, "lr": 6.989398750760446e-05} +{"train_loss": 0.00359907653182745, "global_step": 26715, "epoch": 224, "lr": 6.989195489629359e-05} +{"train_loss": 0.003899743314832449, "global_step": 26716, "epoch": 224, "lr": 6.988992224592699e-05} +{"train_loss": 0.004047847352921963, "global_step": 26717, "epoch": 224, "lr": 6.988788955650863e-05} +{"train_loss": 0.0036551454104483128, "global_step": 26718, "epoch": 224, "lr": 6.988585682804254e-05} +{"train_loss": 0.0031118786428123713, "global_step": 26719, "epoch": 224, "lr": 6.98838240605327e-05} +{"train_loss": 0.00516534922644496, "global_step": 26720, "epoch": 224, "lr": 6.988179125398309e-05} +{"train_loss": 0.0052225892432034016, "global_step": 26721, "epoch": 224, "lr": 6.987975840839771e-05} +{"train_loss": 0.002557376865297556, "global_step": 26722, "epoch": 224, "lr": 6.987772552378053e-05} +{"train_loss": 0.002423597266897559, "global_step": 26723, "epoch": 224, "lr": 6.987569260013557e-05} +{"train_loss": 0.003957048524171114, "global_step": 26724, "epoch": 224, "lr": 6.987365963746684e-05} +{"train_loss": 0.003714001737535, "global_step": 26725, "epoch": 224, "lr": 6.987162663577827e-05} +{"train_loss": 0.004648993723094463, "global_step": 26726, "epoch": 224, "lr": 6.98695935950739e-05} +{"train_loss": 0.004246220923960209, "global_step": 26727, "epoch": 224, "lr": 6.98675605153577e-05} +{"train_loss": 0.0043258145451545715, "global_step": 26728, "epoch": 224, "lr": 6.986552739663366e-05} +{"train_loss": 0.0029065704438835382, "global_step": 26729, "epoch": 224, "lr": 6.986349423890579e-05} +{"train_loss": 0.00693932268768549, "global_step": 26730, "epoch": 224, "lr": 6.986146104217807e-05} +{"train_loss": 0.004997453652322292, "global_step": 26731, "epoch": 224, "lr": 6.985942780645448e-05} +{"train_loss": 0.0028762833680957556, "global_step": 26732, "epoch": 224, "lr": 6.985739453173903e-05} +{"train_loss": 0.0024855313822627068, "global_step": 26733, "epoch": 224, "lr": 6.985536121803571e-05} +{"train_loss": 0.0048269303515553474, "global_step": 26734, "epoch": 224, "lr": 6.985332786534851e-05} +{"train_loss": 0.0026756676379591227, "global_step": 26735, "epoch": 224, "lr": 6.985129447368143e-05} +{"train_loss": 0.0023581748828291893, "global_step": 26736, "epoch": 224, "lr": 6.984926104303845e-05} +{"train_loss": 0.0038599150720983744, "global_step": 26737, "epoch": 224, "lr": 6.984722757342356e-05} +{"train_loss": 0.0037896055728197098, "global_step": 26738, "epoch": 224, "lr": 6.984519406484077e-05} +{"train_loss": 0.004740473814308643, "global_step": 26739, "epoch": 224, "lr": 6.984316051729405e-05} +{"train_loss": 0.0034172004088759422, "global_step": 26740, "epoch": 224, "lr": 6.98411269307874e-05} +{"train_loss": 0.0033611971884965897, "global_step": 26741, "epoch": 224, "lr": 6.983909330532483e-05} +{"train_loss": 0.0028830335941165686, "global_step": 26742, "epoch": 224, "lr": 6.983705964091034e-05} +{"train_loss": 0.00407361751422286, "global_step": 26743, "epoch": 224, "lr": 6.983502593754786e-05} +{"train_loss": 0.005639023147523403, "global_step": 26744, "epoch": 224, "lr": 6.983299219524145e-05} +{"train_loss": 0.004407802596688271, "global_step": 26745, "epoch": 224, "lr": 6.983095841399507e-05} +{"train_loss": 0.004465674050152302, "global_step": 26746, "epoch": 224, "lr": 6.982892459381272e-05} +{"train_loss": 0.003190599847584963, "global_step": 26747, "epoch": 224, "lr": 6.982689073469841e-05} +{"train_loss": 0.005531547125428915, "global_step": 26748, "epoch": 224, "lr": 6.98248568366561e-05} +{"train_loss": 0.004734761081635952, "global_step": 26749, "epoch": 224, "lr": 6.98228228996898e-05} +{"train_loss": 0.004138553980737925, "global_step": 26750, "epoch": 224, "lr": 6.982078892380352e-05} +{"train_loss": 0.0037463069893419743, "global_step": 26751, "epoch": 224, "lr": 6.981875490900122e-05} +{"train_loss": 0.00438660616055131, "global_step": 26752, "epoch": 224, "lr": 6.981672085528693e-05} +{"train_loss": 0.0033553042449057102, "global_step": 26753, "epoch": 224, "lr": 6.981468676266462e-05} +{"train_loss": 0.0038619462866336107, "global_step": 26754, "epoch": 224, "lr": 6.981265263113829e-05} +{"train_loss": 0.003163796616718173, "global_step": 26755, "epoch": 224, "lr": 6.981061846071193e-05} +{"train_loss": 0.0040830690413713455, "global_step": 26756, "epoch": 224, "lr": 6.980858425138956e-05} +{"train_loss": 0.0030978803988546133, "global_step": 26757, "epoch": 224, "lr": 6.980655000317511e-05} +{"train_loss": 0.0026768394745886326, "global_step": 26758, "epoch": 224, "lr": 6.980451571607265e-05} +{"train_loss": 0.002881368389353156, "global_step": 26759, "epoch": 224, "lr": 6.980248139008611e-05} +{"train_loss": 0.003043553326278925, "global_step": 26760, "epoch": 224, "lr": 6.980044702521954e-05} +{"train_loss": 0.003234272124245763, "global_step": 26761, "epoch": 224, "lr": 6.97984126214769e-05} +{"train_loss": 0.0022740010172128677, "global_step": 26762, "epoch": 224, "lr": 6.979637817886219e-05} +{"train_loss": 0.0034066839143633842, "global_step": 26763, "epoch": 224, "lr": 6.979434369737941e-05} +{"train_loss": 0.0016188279259949923, "global_step": 26764, "epoch": 224, "lr": 6.979230917703254e-05} +{"train_loss": 0.0031154232565313578, "global_step": 26765, "epoch": 224, "lr": 6.979027461782558e-05} +{"train_loss": 0.0029109297320246696, "global_step": 26766, "epoch": 224, "lr": 6.978824001976255e-05} +{"train_loss": 0.004502793774008751, "global_step": 26767, "epoch": 224, "lr": 6.978620538284742e-05} +{"train_loss": 0.002212244551628828, "global_step": 26768, "epoch": 224, "lr": 6.978417070708418e-05} +{"train_loss": 0.00317987147718668, "global_step": 26769, "epoch": 224, "lr": 6.978213599247683e-05} +{"train_loss": 0.003950406797230244, "global_step": 26770, "epoch": 224, "lr": 6.978010123902938e-05} +{"train_loss": 0.004743534605950117, "global_step": 26771, "epoch": 224, "lr": 6.977806644674582e-05} +{"train_loss": 0.002791959559544921, "global_step": 26772, "epoch": 224, "lr": 6.977603161563013e-05} +{"train_loss": 0.004246846307069063, "global_step": 26773, "epoch": 224, "lr": 6.977399674568631e-05} +{"train_loss": 0.0036706567689103364, "global_step": 26774, "epoch": 224, "lr": 6.977196183691839e-05, "val_loss": 0.011662224307656288} +{"train_loss": 0.004688579589128494, "global_step": 26775, "epoch": 225, "lr": 6.97699268893303e-05} +{"train_loss": 0.00435355119407177, "global_step": 26776, "epoch": 225, "lr": 6.976789190292609e-05} +{"train_loss": 0.0034311104100197554, "global_step": 26777, "epoch": 225, "lr": 6.976585687770972e-05} +{"train_loss": 0.0032502547837793827, "global_step": 26778, "epoch": 225, "lr": 6.976382181368522e-05} +{"train_loss": 0.00286119501106441, "global_step": 26779, "epoch": 225, "lr": 6.976178671085656e-05} +{"train_loss": 0.0033681027125567198, "global_step": 26780, "epoch": 225, "lr": 6.975975156922773e-05} +{"train_loss": 0.003615226596593857, "global_step": 26781, "epoch": 225, "lr": 6.975771638880275e-05} +{"train_loss": 0.003391367383301258, "global_step": 26782, "epoch": 225, "lr": 6.97556811695856e-05} +{"train_loss": 0.003595074638724327, "global_step": 26783, "epoch": 225, "lr": 6.975364591158029e-05} +{"train_loss": 0.00307307462207973, "global_step": 26784, "epoch": 225, "lr": 6.97516106147908e-05} +{"train_loss": 0.004402255639433861, "global_step": 26785, "epoch": 225, "lr": 6.974957527922114e-05} +{"train_loss": 0.0060420711524784565, "global_step": 26786, "epoch": 225, "lr": 6.97475399048753e-05} +{"train_loss": 0.003957831766456366, "global_step": 26787, "epoch": 225, "lr": 6.974550449175728e-05} +{"train_loss": 0.003931417595595121, "global_step": 26788, "epoch": 225, "lr": 6.974346903987104e-05} +{"train_loss": 0.004429287277162075, "global_step": 26789, "epoch": 225, "lr": 6.974143354922064e-05} +{"train_loss": 0.004082064144313335, "global_step": 26790, "epoch": 225, "lr": 6.973939801981003e-05} +{"train_loss": 0.003357223467901349, "global_step": 26791, "epoch": 225, "lr": 6.973736245164322e-05} +{"train_loss": 0.004455752205103636, "global_step": 26792, "epoch": 225, "lr": 6.973532684472421e-05} +{"train_loss": 0.002538505010306835, "global_step": 26793, "epoch": 225, "lr": 6.9733291199057e-05} +{"train_loss": 0.0023051470052450895, "global_step": 26794, "epoch": 225, "lr": 6.973125551464557e-05} +{"train_loss": 0.002714135218411684, "global_step": 26795, "epoch": 225, "lr": 6.972921979149393e-05} +{"train_loss": 0.0021338954102247953, "global_step": 26796, "epoch": 225, "lr": 6.972718402960608e-05} +{"train_loss": 0.00469715241342783, "global_step": 26797, "epoch": 225, "lr": 6.972514822898601e-05} +{"train_loss": 0.004013805650174618, "global_step": 26798, "epoch": 225, "lr": 6.972311238963773e-05} +{"train_loss": 0.0037930086255073547, "global_step": 26799, "epoch": 225, "lr": 6.972107651156521e-05} +{"train_loss": 0.006513340398669243, "global_step": 26800, "epoch": 225, "lr": 6.971904059477247e-05} +{"train_loss": 0.0025928497780114412, "global_step": 26801, "epoch": 225, "lr": 6.97170046392635e-05} +{"train_loss": 0.002441120333969593, "global_step": 26802, "epoch": 225, "lr": 6.971496864504229e-05} +{"train_loss": 0.004706877749413252, "global_step": 26803, "epoch": 225, "lr": 6.971293261211285e-05} +{"train_loss": 0.0024835243821144104, "global_step": 26804, "epoch": 225, "lr": 6.971089654047918e-05} +{"train_loss": 0.002254168037325144, "global_step": 26805, "epoch": 225, "lr": 6.970886043014527e-05} +{"train_loss": 0.0020251935347914696, "global_step": 26806, "epoch": 225, "lr": 6.970682428111511e-05} +{"train_loss": 0.0051419660449028015, "global_step": 26807, "epoch": 225, "lr": 6.970478809339272e-05} +{"train_loss": 0.0027488628402352333, "global_step": 26808, "epoch": 225, "lr": 6.970275186698206e-05} +{"train_loss": 0.0028687980957329273, "global_step": 26809, "epoch": 225, "lr": 6.970071560188715e-05} +{"train_loss": 0.004879954736679792, "global_step": 26810, "epoch": 225, "lr": 6.969867929811202e-05} +{"train_loss": 0.00413671275600791, "global_step": 26811, "epoch": 225, "lr": 6.969664295566063e-05} +{"train_loss": 0.0024961819872260094, "global_step": 26812, "epoch": 225, "lr": 6.969460657453696e-05} +{"train_loss": 0.004869797267019749, "global_step": 26813, "epoch": 225, "lr": 6.969257015474507e-05} +{"train_loss": 0.002511340659111738, "global_step": 26814, "epoch": 225, "lr": 6.96905336962889e-05} +{"train_loss": 0.003466434311121702, "global_step": 26815, "epoch": 225, "lr": 6.968849719917246e-05} +{"train_loss": 0.0034735098015516996, "global_step": 26816, "epoch": 225, "lr": 6.968646066339977e-05} +{"train_loss": 0.0043728104792535305, "global_step": 26817, "epoch": 225, "lr": 6.968442408897483e-05} +{"train_loss": 0.0026152082718908787, "global_step": 26818, "epoch": 225, "lr": 6.968238747590163e-05} +{"train_loss": 0.002729591680690646, "global_step": 26819, "epoch": 225, "lr": 6.968035082418414e-05} +{"train_loss": 0.00382974767126143, "global_step": 26820, "epoch": 225, "lr": 6.967831413382639e-05} +{"train_loss": 0.0030426245648413897, "global_step": 26821, "epoch": 225, "lr": 6.967627740483238e-05} +{"train_loss": 0.0034207713324576616, "global_step": 26822, "epoch": 225, "lr": 6.96742406372061e-05} +{"train_loss": 0.003911557141691446, "global_step": 26823, "epoch": 225, "lr": 6.967220383095155e-05} +{"train_loss": 0.0026500134263187647, "global_step": 26824, "epoch": 225, "lr": 6.967016698607274e-05} +{"train_loss": 0.0020474563352763653, "global_step": 26825, "epoch": 225, "lr": 6.966813010257365e-05} +{"train_loss": 0.002687818603590131, "global_step": 26826, "epoch": 225, "lr": 6.96660931804583e-05} +{"train_loss": 0.0036565896589308977, "global_step": 26827, "epoch": 225, "lr": 6.966405621973064e-05} +{"train_loss": 0.0037820907309651375, "global_step": 26828, "epoch": 225, "lr": 6.966201922039474e-05} +{"train_loss": 0.0040503269992768764, "global_step": 26829, "epoch": 225, "lr": 6.965998218245455e-05} +{"train_loss": 0.00247110053896904, "global_step": 26830, "epoch": 225, "lr": 6.965794510591409e-05} +{"train_loss": 0.003083499614149332, "global_step": 26831, "epoch": 225, "lr": 6.965590799077736e-05} +{"train_loss": 0.003949528560042381, "global_step": 26832, "epoch": 225, "lr": 6.965387083704835e-05} +{"train_loss": 0.0021503842435777187, "global_step": 26833, "epoch": 225, "lr": 6.965183364473106e-05} +{"train_loss": 0.004130800254642963, "global_step": 26834, "epoch": 225, "lr": 6.96497964138295e-05} +{"train_loss": 0.0032801709603518248, "global_step": 26835, "epoch": 225, "lr": 6.964775914434766e-05} +{"train_loss": 0.0038447920233011246, "global_step": 26836, "epoch": 225, "lr": 6.964572183628955e-05} +{"train_loss": 0.002723312471061945, "global_step": 26837, "epoch": 225, "lr": 6.964368448965916e-05} +{"train_loss": 0.002017054706811905, "global_step": 26838, "epoch": 225, "lr": 6.96416471044605e-05} +{"train_loss": 0.0032348190434277058, "global_step": 26839, "epoch": 225, "lr": 6.963960968069756e-05} +{"train_loss": 0.002783654723316431, "global_step": 26840, "epoch": 225, "lr": 6.963757221837435e-05} +{"train_loss": 0.004242634400725365, "global_step": 26841, "epoch": 225, "lr": 6.963553471749486e-05} +{"train_loss": 0.005304063204675913, "global_step": 26842, "epoch": 225, "lr": 6.963349717806309e-05} +{"train_loss": 0.003691582242026925, "global_step": 26843, "epoch": 225, "lr": 6.963145960008306e-05} +{"train_loss": 0.0026302882470190525, "global_step": 26844, "epoch": 225, "lr": 6.962942198355874e-05} +{"train_loss": 0.0027161885518580675, "global_step": 26845, "epoch": 225, "lr": 6.962738432849415e-05} +{"train_loss": 0.00353699317201972, "global_step": 26846, "epoch": 225, "lr": 6.962534663489329e-05} +{"train_loss": 0.004609252326190472, "global_step": 26847, "epoch": 225, "lr": 6.962330890276016e-05} +{"train_loss": 0.0020772868301719427, "global_step": 26848, "epoch": 225, "lr": 6.962127113209875e-05} +{"train_loss": 0.003247619839385152, "global_step": 26849, "epoch": 225, "lr": 6.961923332291309e-05} +{"train_loss": 0.00435107946395874, "global_step": 26850, "epoch": 225, "lr": 6.961719547520716e-05} +{"train_loss": 0.0016907078679651022, "global_step": 26851, "epoch": 225, "lr": 6.961515758898494e-05} +{"train_loss": 0.0028845008928328753, "global_step": 26852, "epoch": 225, "lr": 6.961311966425046e-05} +{"train_loss": 0.0021966188214719296, "global_step": 26853, "epoch": 225, "lr": 6.961108170100773e-05} +{"train_loss": 0.0023517259396612644, "global_step": 26854, "epoch": 225, "lr": 6.960904369926073e-05} +{"train_loss": 0.0035442158114165068, "global_step": 26855, "epoch": 225, "lr": 6.960700565901347e-05} +{"train_loss": 0.0028873630799353123, "global_step": 26856, "epoch": 225, "lr": 6.960496758026994e-05} +{"train_loss": 0.002476949244737625, "global_step": 26857, "epoch": 225, "lr": 6.960292946303416e-05} +{"train_loss": 0.002722520614042878, "global_step": 26858, "epoch": 225, "lr": 6.960089130731011e-05} +{"train_loss": 0.0020467624999582767, "global_step": 26859, "epoch": 225, "lr": 6.959885311310182e-05} +{"train_loss": 0.0059806969948112965, "global_step": 26860, "epoch": 225, "lr": 6.959681488041326e-05} +{"train_loss": 0.003715124214068055, "global_step": 26861, "epoch": 225, "lr": 6.959477660924847e-05} +{"train_loss": 0.003844540100544691, "global_step": 26862, "epoch": 225, "lr": 6.959273829961141e-05} +{"train_loss": 0.002707200590521097, "global_step": 26863, "epoch": 225, "lr": 6.959069995150611e-05} +{"train_loss": 0.004396694712340832, "global_step": 26864, "epoch": 225, "lr": 6.958866156493654e-05} +{"train_loss": 0.002464079763740301, "global_step": 26865, "epoch": 225, "lr": 6.958662313990675e-05} +{"train_loss": 0.003656088374555111, "global_step": 26866, "epoch": 225, "lr": 6.958458467642071e-05} +{"train_loss": 0.0029166946187615395, "global_step": 26867, "epoch": 225, "lr": 6.958254617448243e-05} +{"train_loss": 0.003628523088991642, "global_step": 26868, "epoch": 225, "lr": 6.958050763409593e-05} +{"train_loss": 0.0019889650866389275, "global_step": 26869, "epoch": 225, "lr": 6.957846905526517e-05} +{"train_loss": 0.0026265692431479692, "global_step": 26870, "epoch": 225, "lr": 6.95764304379942e-05} +{"train_loss": 0.005253270734101534, "global_step": 26871, "epoch": 225, "lr": 6.957439178228699e-05} +{"train_loss": 0.003181013511493802, "global_step": 26872, "epoch": 225, "lr": 6.957235308814755e-05} +{"train_loss": 0.0025585198309272528, "global_step": 26873, "epoch": 225, "lr": 6.957031435557988e-05} +{"train_loss": 0.002355740638449788, "global_step": 26874, "epoch": 225, "lr": 6.956827558458801e-05} +{"train_loss": 0.004088093526661396, "global_step": 26875, "epoch": 225, "lr": 6.956623677517591e-05} +{"train_loss": 0.003980142995715141, "global_step": 26876, "epoch": 225, "lr": 6.956419792734758e-05} +{"train_loss": 0.0041020712815225124, "global_step": 26877, "epoch": 225, "lr": 6.956215904110706e-05} +{"train_loss": 0.002871627453714609, "global_step": 26878, "epoch": 225, "lr": 6.956012011645832e-05} +{"train_loss": 0.004243556410074234, "global_step": 26879, "epoch": 225, "lr": 6.955808115340538e-05} +{"train_loss": 0.004056422971189022, "global_step": 26880, "epoch": 225, "lr": 6.955604215195221e-05} +{"train_loss": 0.0024021673016250134, "global_step": 26881, "epoch": 225, "lr": 6.955400311210287e-05} +{"train_loss": 0.004652637988328934, "global_step": 26882, "epoch": 225, "lr": 6.955196403386132e-05} +{"train_loss": 0.003665271447971463, "global_step": 26883, "epoch": 225, "lr": 6.954992491723158e-05} +{"train_loss": 0.004148108419030905, "global_step": 26884, "epoch": 225, "lr": 6.954788576221767e-05} +{"train_loss": 0.0024089624639600515, "global_step": 26885, "epoch": 225, "lr": 6.954584656882355e-05} +{"train_loss": 0.0034341812133789062, "global_step": 26886, "epoch": 225, "lr": 6.954380733705326e-05} +{"train_loss": 0.0026930784806609154, "global_step": 26887, "epoch": 225, "lr": 6.954176806691079e-05} +{"train_loss": 0.002171336906030774, "global_step": 26888, "epoch": 225, "lr": 6.953972875840016e-05} +{"train_loss": 0.002328122965991497, "global_step": 26889, "epoch": 225, "lr": 6.953768941152534e-05} +{"train_loss": 0.003177735721692443, "global_step": 26890, "epoch": 225, "lr": 6.953565002629035e-05} +{"train_loss": 0.0024000711273401976, "global_step": 26891, "epoch": 225, "lr": 6.953361060269922e-05} +{"train_loss": 0.004054876510053873, "global_step": 26892, "epoch": 225, "lr": 6.953157114075591e-05} +{"train_loss": 0.0033918035083583425, "global_step": 26893, "epoch": 225, "lr": 6.952953164046447e-05, "val_loss": 0.023793162778019905, "train_action_mse_error": 6.224053504411131e-05} +{"train_loss": 0.003458644263446331, "global_step": 26894, "epoch": 226, "lr": 6.952749210182888e-05} +{"train_loss": 0.0042471326887607574, "global_step": 26895, "epoch": 226, "lr": 6.952545252485312e-05} +{"train_loss": 0.004370440728962421, "global_step": 26896, "epoch": 226, "lr": 6.952341290954123e-05} +{"train_loss": 0.003277745796367526, "global_step": 26897, "epoch": 226, "lr": 6.952137325589722e-05} +{"train_loss": 0.002722437959164381, "global_step": 26898, "epoch": 226, "lr": 6.951933356392505e-05} +{"train_loss": 0.0037423339672386646, "global_step": 26899, "epoch": 226, "lr": 6.951729383362878e-05} +{"train_loss": 0.002187318168580532, "global_step": 26900, "epoch": 226, "lr": 6.951525406501238e-05} +{"train_loss": 0.004279670305550098, "global_step": 26901, "epoch": 226, "lr": 6.951321425807986e-05} +{"train_loss": 0.0036238087341189384, "global_step": 26902, "epoch": 226, "lr": 6.951117441283523e-05} +{"train_loss": 0.0032613251823931932, "global_step": 26903, "epoch": 226, "lr": 6.950913452928249e-05} +{"train_loss": 0.004066644702106714, "global_step": 26904, "epoch": 226, "lr": 6.950709460742566e-05} +{"train_loss": 0.00194634054787457, "global_step": 26905, "epoch": 226, "lr": 6.950505464726874e-05} +{"train_loss": 0.0025142852682620287, "global_step": 26906, "epoch": 226, "lr": 6.950301464881572e-05} +{"train_loss": 0.003947829827666283, "global_step": 26907, "epoch": 226, "lr": 6.950097461207061e-05} +{"train_loss": 0.002713974332436919, "global_step": 26908, "epoch": 226, "lr": 6.949893453703741e-05} +{"train_loss": 0.002925050910562277, "global_step": 26909, "epoch": 226, "lr": 6.949689442372016e-05} +{"train_loss": 0.004258260130882263, "global_step": 26910, "epoch": 226, "lr": 6.949485427212282e-05} +{"train_loss": 0.0044647264294326305, "global_step": 26911, "epoch": 226, "lr": 6.949281408224942e-05} +{"train_loss": 0.0038240812718868256, "global_step": 26912, "epoch": 226, "lr": 6.949077385410397e-05} +{"train_loss": 0.004737425595521927, "global_step": 26913, "epoch": 226, "lr": 6.948873358769045e-05} +{"train_loss": 0.0032370134722441435, "global_step": 26914, "epoch": 226, "lr": 6.94866932830129e-05} +{"train_loss": 0.0021728824358433485, "global_step": 26915, "epoch": 226, "lr": 6.948465294007531e-05} +{"train_loss": 0.002118219854310155, "global_step": 26916, "epoch": 226, "lr": 6.94826125588817e-05} +{"train_loss": 0.0022240530233830214, "global_step": 26917, "epoch": 226, "lr": 6.948057213943603e-05} +{"train_loss": 0.0031564359087496996, "global_step": 26918, "epoch": 226, "lr": 6.947853168174235e-05} +{"train_loss": 0.0030122401658445597, "global_step": 26919, "epoch": 226, "lr": 6.947649118580466e-05} +{"train_loss": 0.0065589952282607555, "global_step": 26920, "epoch": 226, "lr": 6.947445065162696e-05} +{"train_loss": 0.004760961513966322, "global_step": 26921, "epoch": 226, "lr": 6.947241007921325e-05} +{"train_loss": 0.003005905309692025, "global_step": 26922, "epoch": 226, "lr": 6.947036946856754e-05} +{"train_loss": 0.0034967754036188126, "global_step": 26923, "epoch": 226, "lr": 6.946832881969385e-05} +{"train_loss": 0.002677203854545951, "global_step": 26924, "epoch": 226, "lr": 6.946628813259618e-05} +{"train_loss": 0.004461150150746107, "global_step": 26925, "epoch": 226, "lr": 6.946424740727853e-05} +{"train_loss": 0.002099445788189769, "global_step": 26926, "epoch": 226, "lr": 6.94622066437449e-05} +{"train_loss": 0.002876262180507183, "global_step": 26927, "epoch": 226, "lr": 6.94601658419993e-05} +{"train_loss": 0.004260251298546791, "global_step": 26928, "epoch": 226, "lr": 6.945812500204575e-05} +{"train_loss": 0.0028990888968110085, "global_step": 26929, "epoch": 226, "lr": 6.945608412388827e-05} +{"train_loss": 0.004304667003452778, "global_step": 26930, "epoch": 226, "lr": 6.945404320753082e-05} +{"train_loss": 0.0039149499498307705, "global_step": 26931, "epoch": 226, "lr": 6.945200225297745e-05} +{"train_loss": 0.0048014395870268345, "global_step": 26932, "epoch": 226, "lr": 6.944996126023214e-05} +{"train_loss": 0.002988687949255109, "global_step": 26933, "epoch": 226, "lr": 6.944792022929892e-05} +{"train_loss": 0.002264615846797824, "global_step": 26934, "epoch": 226, "lr": 6.944587916018179e-05} +{"train_loss": 0.004080111160874367, "global_step": 26935, "epoch": 226, "lr": 6.944383805288474e-05} +{"train_loss": 0.0034996068570762873, "global_step": 26936, "epoch": 226, "lr": 6.944179690741179e-05} +{"train_loss": 0.00363506143912673, "global_step": 26937, "epoch": 226, "lr": 6.943975572376697e-05} +{"train_loss": 0.003179850522428751, "global_step": 26938, "epoch": 226, "lr": 6.943771450195427e-05} +{"train_loss": 0.002197675406932831, "global_step": 26939, "epoch": 226, "lr": 6.943567324197766e-05} +{"train_loss": 0.00272709340788424, "global_step": 26940, "epoch": 226, "lr": 6.943363194384121e-05} +{"train_loss": 0.0029230783693492413, "global_step": 26941, "epoch": 226, "lr": 6.943159060754888e-05} +{"train_loss": 0.003752834163606167, "global_step": 26942, "epoch": 226, "lr": 6.94295492331047e-05} +{"train_loss": 0.005128440447151661, "global_step": 26943, "epoch": 226, "lr": 6.94275078205127e-05} +{"train_loss": 0.004039900843054056, "global_step": 26944, "epoch": 226, "lr": 6.942546636977684e-05} +{"train_loss": 0.002635024720802903, "global_step": 26945, "epoch": 226, "lr": 6.942342488090116e-05} +{"train_loss": 0.004634428303688765, "global_step": 26946, "epoch": 226, "lr": 6.942138335388967e-05} +{"train_loss": 0.0023923316039144993, "global_step": 26947, "epoch": 226, "lr": 6.941934178874635e-05} +{"train_loss": 0.007451132405549288, "global_step": 26948, "epoch": 226, "lr": 6.941730018547524e-05} +{"train_loss": 0.0028523006476461887, "global_step": 26949, "epoch": 226, "lr": 6.941525854408034e-05} +{"train_loss": 0.005321167875081301, "global_step": 26950, "epoch": 226, "lr": 6.941321686456563e-05} +{"train_loss": 0.004029258154332638, "global_step": 26951, "epoch": 226, "lr": 6.941117514693515e-05} +{"train_loss": 0.0055947573855519295, "global_step": 26952, "epoch": 226, "lr": 6.940913339119292e-05} +{"train_loss": 0.0026333460118621588, "global_step": 26953, "epoch": 226, "lr": 6.94070915973429e-05} +{"train_loss": 0.00394799280911684, "global_step": 26954, "epoch": 226, "lr": 6.940504976538916e-05} +{"train_loss": 0.006175165064632893, "global_step": 26955, "epoch": 226, "lr": 6.940300789533568e-05} +{"train_loss": 0.0035910431761294603, "global_step": 26956, "epoch": 226, "lr": 6.940096598718645e-05} +{"train_loss": 0.004211794584989548, "global_step": 26957, "epoch": 226, "lr": 6.93989240409455e-05} +{"train_loss": 0.005171554628759623, "global_step": 26958, "epoch": 226, "lr": 6.939688205661683e-05} +{"train_loss": 0.004985745996236801, "global_step": 26959, "epoch": 226, "lr": 6.939484003420446e-05} +{"train_loss": 0.002334383549168706, "global_step": 26960, "epoch": 226, "lr": 6.939279797371239e-05} +{"train_loss": 0.001961237285286188, "global_step": 26961, "epoch": 226, "lr": 6.939075587514463e-05} +{"train_loss": 0.004155782051384449, "global_step": 26962, "epoch": 226, "lr": 6.93887137385052e-05} +{"train_loss": 0.00680964533239603, "global_step": 26963, "epoch": 226, "lr": 6.93866715637981e-05} +{"train_loss": 0.004556295461952686, "global_step": 26964, "epoch": 226, "lr": 6.938462935102735e-05} +{"train_loss": 0.0027877555694431067, "global_step": 26965, "epoch": 226, "lr": 6.938258710019694e-05} +{"train_loss": 0.0031966327223926783, "global_step": 26966, "epoch": 226, "lr": 6.938054481131088e-05} +{"train_loss": 0.004462098702788353, "global_step": 26967, "epoch": 226, "lr": 6.937850248437321e-05} +{"train_loss": 0.0055756582878530025, "global_step": 26968, "epoch": 226, "lr": 6.937646011938792e-05} +{"train_loss": 0.005296655464917421, "global_step": 26969, "epoch": 226, "lr": 6.937441771635902e-05} +{"train_loss": 0.004171995911747217, "global_step": 26970, "epoch": 226, "lr": 6.937237527529051e-05} +{"train_loss": 0.005372543819248676, "global_step": 26971, "epoch": 226, "lr": 6.937033279618641e-05} +{"train_loss": 0.004319762345403433, "global_step": 26972, "epoch": 226, "lr": 6.936829027905075e-05} +{"train_loss": 0.0028790184296667576, "global_step": 26973, "epoch": 226, "lr": 6.93662477238875e-05} +{"train_loss": 0.0038255457766354084, "global_step": 26974, "epoch": 226, "lr": 6.936420513070071e-05} +{"train_loss": 0.005510193761438131, "global_step": 26975, "epoch": 226, "lr": 6.936216249949436e-05} +{"train_loss": 0.0020036636851727962, "global_step": 26976, "epoch": 226, "lr": 6.936011983027247e-05} +{"train_loss": 0.004746235441416502, "global_step": 26977, "epoch": 226, "lr": 6.935807712303907e-05} +{"train_loss": 0.0032830166164785624, "global_step": 26978, "epoch": 226, "lr": 6.935603437779814e-05} +{"train_loss": 0.004332325421273708, "global_step": 26979, "epoch": 226, "lr": 6.93539915945537e-05} +{"train_loss": 0.0024452009238302708, "global_step": 26980, "epoch": 226, "lr": 6.935194877330978e-05} +{"train_loss": 0.0058564962819218636, "global_step": 26981, "epoch": 226, "lr": 6.934990591407035e-05} +{"train_loss": 0.003956529777497053, "global_step": 26982, "epoch": 226, "lr": 6.934786301683947e-05} +{"train_loss": 0.0044505964033305645, "global_step": 26983, "epoch": 226, "lr": 6.934582008162112e-05} +{"train_loss": 0.002678899560123682, "global_step": 26984, "epoch": 226, "lr": 6.934377710841932e-05} +{"train_loss": 0.004039479419589043, "global_step": 26985, "epoch": 226, "lr": 6.934173409723807e-05} +{"train_loss": 0.004253539722412825, "global_step": 26986, "epoch": 226, "lr": 6.933969104808141e-05} +{"train_loss": 0.003956188913434744, "global_step": 26987, "epoch": 226, "lr": 6.933764796095334e-05} +{"train_loss": 0.0030481726862490177, "global_step": 26988, "epoch": 226, "lr": 6.933560483585784e-05} +{"train_loss": 0.003645458724349737, "global_step": 26989, "epoch": 226, "lr": 6.933356167279896e-05} +{"train_loss": 0.0034966901876032352, "global_step": 26990, "epoch": 226, "lr": 6.93315184717807e-05} +{"train_loss": 0.004582567606121302, "global_step": 26991, "epoch": 226, "lr": 6.932947523280705e-05} +{"train_loss": 0.003500767517834902, "global_step": 26992, "epoch": 226, "lr": 6.932743195588206e-05} +{"train_loss": 0.0026970498729497194, "global_step": 26993, "epoch": 226, "lr": 6.932538864100972e-05} +{"train_loss": 0.0024007156025618315, "global_step": 26994, "epoch": 226, "lr": 6.932334528819405e-05} +{"train_loss": 0.0027139922603964806, "global_step": 26995, "epoch": 226, "lr": 6.932130189743902e-05} +{"train_loss": 0.0036782517563551664, "global_step": 26996, "epoch": 226, "lr": 6.931925846874869e-05} +{"train_loss": 0.0038459240458905697, "global_step": 26997, "epoch": 226, "lr": 6.931721500212708e-05} +{"train_loss": 0.003042327705770731, "global_step": 26998, "epoch": 226, "lr": 6.931517149757818e-05} +{"train_loss": 0.004843293689191341, "global_step": 26999, "epoch": 226, "lr": 6.9313127955106e-05} +{"train_loss": 0.004055825527757406, "global_step": 27000, "epoch": 226, "lr": 6.931108437471455e-05} +{"train_loss": 0.004727160558104515, "global_step": 27001, "epoch": 226, "lr": 6.930904075640786e-05} +{"train_loss": 0.003176473779603839, "global_step": 27002, "epoch": 226, "lr": 6.930699710018992e-05} +{"train_loss": 0.0035722837783396244, "global_step": 27003, "epoch": 226, "lr": 6.930495340606475e-05} +{"train_loss": 0.004060560837388039, "global_step": 27004, "epoch": 226, "lr": 6.930290967403638e-05} +{"train_loss": 0.002714012051001191, "global_step": 27005, "epoch": 226, "lr": 6.930086590410881e-05} +{"train_loss": 0.002093914896249771, "global_step": 27006, "epoch": 226, "lr": 6.929882209628605e-05} +{"train_loss": 0.00438262103125453, "global_step": 27007, "epoch": 226, "lr": 6.929677825057211e-05} +{"train_loss": 0.004557433072477579, "global_step": 27008, "epoch": 226, "lr": 6.9294734366971e-05} +{"train_loss": 0.0027787305880337954, "global_step": 27009, "epoch": 226, "lr": 6.929269044548677e-05} +{"train_loss": 0.004030488897114992, "global_step": 27010, "epoch": 226, "lr": 6.929064648612336e-05} +{"train_loss": 0.002443123608827591, "global_step": 27011, "epoch": 226, "lr": 6.928860248888486e-05} +{"train_loss": 0.003737669314860421, "global_step": 27012, "epoch": 226, "lr": 6.928655845377523e-05, "val_loss": 0.011252593249082565} +{"train_loss": 0.002569539239630103, "global_step": 27013, "epoch": 227, "lr": 6.928451438079852e-05} +{"train_loss": 0.005086557939648628, "global_step": 27014, "epoch": 227, "lr": 6.928247026995871e-05} +{"train_loss": 0.002418301533907652, "global_step": 27015, "epoch": 227, "lr": 6.928042612125983e-05} +{"train_loss": 0.0032536874059587717, "global_step": 27016, "epoch": 227, "lr": 6.92783819347059e-05} +{"train_loss": 0.004344551358371973, "global_step": 27017, "epoch": 227, "lr": 6.927633771030093e-05} +{"train_loss": 0.004403682425618172, "global_step": 27018, "epoch": 227, "lr": 6.927429344804894e-05} +{"train_loss": 0.0034092036075890064, "global_step": 27019, "epoch": 227, "lr": 6.927224914795392e-05} +{"train_loss": 0.0028907523956149817, "global_step": 27020, "epoch": 227, "lr": 6.927020481001989e-05} +{"train_loss": 0.006721634417772293, "global_step": 27021, "epoch": 227, "lr": 6.926816043425089e-05} +{"train_loss": 0.004844031762331724, "global_step": 27022, "epoch": 227, "lr": 6.92661160206509e-05} +{"train_loss": 0.004635979421436787, "global_step": 27023, "epoch": 227, "lr": 6.926407156922396e-05} +{"train_loss": 0.0019925846718251705, "global_step": 27024, "epoch": 227, "lr": 6.926202707997406e-05} +{"train_loss": 0.004022462759166956, "global_step": 27025, "epoch": 227, "lr": 6.925998255290524e-05} +{"train_loss": 0.004430701024830341, "global_step": 27026, "epoch": 227, "lr": 6.92579379880215e-05} +{"train_loss": 0.003804093459621072, "global_step": 27027, "epoch": 227, "lr": 6.925589338532686e-05} +{"train_loss": 0.0034679234959185123, "global_step": 27028, "epoch": 227, "lr": 6.925384874482533e-05} +{"train_loss": 0.003610478714108467, "global_step": 27029, "epoch": 227, "lr": 6.925180406652092e-05} +{"train_loss": 0.004196509253233671, "global_step": 27030, "epoch": 227, "lr": 6.924975935041764e-05} +{"train_loss": 0.0029432715382426977, "global_step": 27031, "epoch": 227, "lr": 6.924771459651953e-05} +{"train_loss": 0.0021545947529375553, "global_step": 27032, "epoch": 227, "lr": 6.924566980483058e-05} +{"train_loss": 0.0035141941625624895, "global_step": 27033, "epoch": 227, "lr": 6.924362497535482e-05} +{"train_loss": 0.002584905130788684, "global_step": 27034, "epoch": 227, "lr": 6.924158010809625e-05} +{"train_loss": 0.004183610435575247, "global_step": 27035, "epoch": 227, "lr": 6.923953520305889e-05} +{"train_loss": 0.0029187416657805443, "global_step": 27036, "epoch": 227, "lr": 6.923749026024676e-05} +{"train_loss": 0.0033820816315710545, "global_step": 27037, "epoch": 227, "lr": 6.923544527966389e-05} +{"train_loss": 0.005726874340325594, "global_step": 27038, "epoch": 227, "lr": 6.923340026131427e-05} +{"train_loss": 0.0032279607839882374, "global_step": 27039, "epoch": 227, "lr": 6.923135520520192e-05} +{"train_loss": 0.002329108538106084, "global_step": 27040, "epoch": 227, "lr": 6.922931011133086e-05} +{"train_loss": 0.0024156891740858555, "global_step": 27041, "epoch": 227, "lr": 6.92272649797051e-05} +{"train_loss": 0.008400085382163525, "global_step": 27042, "epoch": 227, "lr": 6.922521981032866e-05} +{"train_loss": 0.002233481965959072, "global_step": 27043, "epoch": 227, "lr": 6.922317460320556e-05} +{"train_loss": 0.0023703647311776876, "global_step": 27044, "epoch": 227, "lr": 6.922112935833982e-05} +{"train_loss": 0.004248394165188074, "global_step": 27045, "epoch": 227, "lr": 6.92190840757354e-05} +{"train_loss": 0.005340619944036007, "global_step": 27046, "epoch": 227, "lr": 6.92170387553964e-05} +{"train_loss": 0.006229191552847624, "global_step": 27047, "epoch": 227, "lr": 6.92149933973268e-05} +{"train_loss": 0.0024681666400283575, "global_step": 27048, "epoch": 227, "lr": 6.92129480015306e-05} +{"train_loss": 0.0026797009631991386, "global_step": 27049, "epoch": 227, "lr": 6.921090256801183e-05} +{"train_loss": 0.003335776273161173, "global_step": 27050, "epoch": 227, "lr": 6.920885709677453e-05} +{"train_loss": 0.002893624594435096, "global_step": 27051, "epoch": 227, "lr": 6.920681158782266e-05} +{"train_loss": 0.003388614859431982, "global_step": 27052, "epoch": 227, "lr": 6.920476604116028e-05} +{"train_loss": 0.002757805399596691, "global_step": 27053, "epoch": 227, "lr": 6.920272045679139e-05} +{"train_loss": 0.005485898349434137, "global_step": 27054, "epoch": 227, "lr": 6.920067483472001e-05} +{"train_loss": 0.00581336161121726, "global_step": 27055, "epoch": 227, "lr": 6.919862917495016e-05} +{"train_loss": 0.004551060497760773, "global_step": 27056, "epoch": 227, "lr": 6.919658347748586e-05} +{"train_loss": 0.0036110731307417154, "global_step": 27057, "epoch": 227, "lr": 6.919453774233111e-05} +{"train_loss": 0.0041334317065775394, "global_step": 27058, "epoch": 227, "lr": 6.919249196948994e-05} +{"train_loss": 0.003625746350735426, "global_step": 27059, "epoch": 227, "lr": 6.919044615896635e-05} +{"train_loss": 0.004029429517686367, "global_step": 27060, "epoch": 227, "lr": 6.918840031076438e-05} +{"train_loss": 0.004427365027368069, "global_step": 27061, "epoch": 227, "lr": 6.918635442488804e-05} +{"train_loss": 0.00396931916475296, "global_step": 27062, "epoch": 227, "lr": 6.918430850134133e-05} +{"train_loss": 0.002599454950541258, "global_step": 27063, "epoch": 227, "lr": 6.918226254012827e-05} +{"train_loss": 0.002981256926432252, "global_step": 27064, "epoch": 227, "lr": 6.91802165412529e-05} +{"train_loss": 0.0022112883161753416, "global_step": 27065, "epoch": 227, "lr": 6.917817050471924e-05} +{"train_loss": 0.0021034670062363148, "global_step": 27066, "epoch": 227, "lr": 6.917612443053127e-05} +{"train_loss": 0.007639004848897457, "global_step": 27067, "epoch": 227, "lr": 6.917407831869304e-05} +{"train_loss": 0.005593443755060434, "global_step": 27068, "epoch": 227, "lr": 6.917203216920856e-05} +{"train_loss": 0.0025930339470505714, "global_step": 27069, "epoch": 227, "lr": 6.916998598208184e-05} +{"train_loss": 0.0035394805017858744, "global_step": 27070, "epoch": 227, "lr": 6.91679397573169e-05} +{"train_loss": 0.005473812110722065, "global_step": 27071, "epoch": 227, "lr": 6.916589349491775e-05} +{"train_loss": 0.004501787014305592, "global_step": 27072, "epoch": 227, "lr": 6.916384719488841e-05} +{"train_loss": 0.0021749238949269056, "global_step": 27073, "epoch": 227, "lr": 6.916180085723292e-05} +{"train_loss": 0.006132775451987982, "global_step": 27074, "epoch": 227, "lr": 6.915975448195527e-05} +{"train_loss": 0.0037059031892567873, "global_step": 27075, "epoch": 227, "lr": 6.91577080690595e-05} +{"train_loss": 0.0032015296164900064, "global_step": 27076, "epoch": 227, "lr": 6.91556616185496e-05} +{"train_loss": 0.002527044853195548, "global_step": 27077, "epoch": 227, "lr": 6.915361513042962e-05} +{"train_loss": 0.004404065664857626, "global_step": 27078, "epoch": 227, "lr": 6.915156860470355e-05} +{"train_loss": 0.0059937420301139355, "global_step": 27079, "epoch": 227, "lr": 6.914952204137543e-05} +{"train_loss": 0.004486719146370888, "global_step": 27080, "epoch": 227, "lr": 6.914747544044927e-05} +{"train_loss": 0.0030931709334254265, "global_step": 27081, "epoch": 227, "lr": 6.91454288019291e-05} +{"train_loss": 0.003278526710346341, "global_step": 27082, "epoch": 227, "lr": 6.91433821258189e-05} +{"train_loss": 0.0050887479446828365, "global_step": 27083, "epoch": 227, "lr": 6.914133541212273e-05} +{"train_loss": 0.004249510820955038, "global_step": 27084, "epoch": 227, "lr": 6.913928866084458e-05} +{"train_loss": 0.002791422652080655, "global_step": 27085, "epoch": 227, "lr": 6.913724187198849e-05} +{"train_loss": 0.0029536786023527384, "global_step": 27086, "epoch": 227, "lr": 6.913519504555846e-05} +{"train_loss": 0.004375974182039499, "global_step": 27087, "epoch": 227, "lr": 6.913314818155855e-05} +{"train_loss": 0.0036529400385916233, "global_step": 27088, "epoch": 227, "lr": 6.913110127999272e-05} +{"train_loss": 0.003966093063354492, "global_step": 27089, "epoch": 227, "lr": 6.912905434086503e-05} +{"train_loss": 0.004831473808735609, "global_step": 27090, "epoch": 227, "lr": 6.912700736417947e-05} +{"train_loss": 0.003174685640260577, "global_step": 27091, "epoch": 227, "lr": 6.912496034994009e-05} +{"train_loss": 0.0042706448584795, "global_step": 27092, "epoch": 227, "lr": 6.912291329815089e-05} +{"train_loss": 0.002464679768308997, "global_step": 27093, "epoch": 227, "lr": 6.912086620881589e-05} +{"train_loss": 0.0029590087942779064, "global_step": 27094, "epoch": 227, "lr": 6.91188190819391e-05} +{"train_loss": 0.006045951042324305, "global_step": 27095, "epoch": 227, "lr": 6.911677191752456e-05} +{"train_loss": 0.00271099922247231, "global_step": 27096, "epoch": 227, "lr": 6.911472471557629e-05} +{"train_loss": 0.004691156093031168, "global_step": 27097, "epoch": 227, "lr": 6.911267747609829e-05} +{"train_loss": 0.003738842438906431, "global_step": 27098, "epoch": 227, "lr": 6.911063019909459e-05} +{"train_loss": 0.0038226251490414143, "global_step": 27099, "epoch": 227, "lr": 6.91085828845692e-05} +{"train_loss": 0.0022219789680093527, "global_step": 27100, "epoch": 227, "lr": 6.910653553252617e-05} +{"train_loss": 0.003124191425740719, "global_step": 27101, "epoch": 227, "lr": 6.910448814296951e-05} +{"train_loss": 0.00440704170614481, "global_step": 27102, "epoch": 227, "lr": 6.910244071590319e-05} +{"train_loss": 0.005304396618157625, "global_step": 27103, "epoch": 227, "lr": 6.910039325133129e-05} +{"train_loss": 0.002821817295625806, "global_step": 27104, "epoch": 227, "lr": 6.90983457492578e-05} +{"train_loss": 0.0036528543569147587, "global_step": 27105, "epoch": 227, "lr": 6.909629820968677e-05} +{"train_loss": 0.00437879329547286, "global_step": 27106, "epoch": 227, "lr": 6.909425063262219e-05} +{"train_loss": 0.0035003835801035166, "global_step": 27107, "epoch": 227, "lr": 6.909220301806806e-05} +{"train_loss": 0.005425220355391502, "global_step": 27108, "epoch": 227, "lr": 6.909015536602845e-05} +{"train_loss": 0.0032117071095854044, "global_step": 27109, "epoch": 227, "lr": 6.908810767650737e-05} +{"train_loss": 0.002607452217489481, "global_step": 27110, "epoch": 227, "lr": 6.908605994950881e-05} +{"train_loss": 0.0023436876945197582, "global_step": 27111, "epoch": 227, "lr": 6.908401218503682e-05} +{"train_loss": 0.002782213967293501, "global_step": 27112, "epoch": 227, "lr": 6.908196438309542e-05} +{"train_loss": 0.005697433836758137, "global_step": 27113, "epoch": 227, "lr": 6.907991654368861e-05} +{"train_loss": 0.0031716988887637854, "global_step": 27114, "epoch": 227, "lr": 6.907786866682042e-05} +{"train_loss": 0.0023473724722862244, "global_step": 27115, "epoch": 227, "lr": 6.907582075249488e-05} +{"train_loss": 0.0028736544772982597, "global_step": 27116, "epoch": 227, "lr": 6.907377280071599e-05} +{"train_loss": 0.002051651244983077, "global_step": 27117, "epoch": 227, "lr": 6.907172481148781e-05} +{"train_loss": 0.0062523880042135715, "global_step": 27118, "epoch": 227, "lr": 6.906967678481433e-05} +{"train_loss": 0.0037972661666572094, "global_step": 27119, "epoch": 227, "lr": 6.906762872069956e-05} +{"train_loss": 0.005143459886312485, "global_step": 27120, "epoch": 227, "lr": 6.906558061914755e-05} +{"train_loss": 0.0020026671700179577, "global_step": 27121, "epoch": 227, "lr": 6.906353248016231e-05} +{"train_loss": 0.003955455031245947, "global_step": 27122, "epoch": 227, "lr": 6.906148430374786e-05} +{"train_loss": 0.004795460496097803, "global_step": 27123, "epoch": 227, "lr": 6.905943608990821e-05} +{"train_loss": 0.00295609375461936, "global_step": 27124, "epoch": 227, "lr": 6.90573878386474e-05} +{"train_loss": 0.0031804244499653578, "global_step": 27125, "epoch": 227, "lr": 6.905533954996945e-05} +{"train_loss": 0.0024911263026297092, "global_step": 27126, "epoch": 227, "lr": 6.905329122387838e-05} +{"train_loss": 0.003363213501870632, "global_step": 27127, "epoch": 227, "lr": 6.905124286037821e-05} +{"train_loss": 0.004804024938493967, "global_step": 27128, "epoch": 227, "lr": 6.904919445947295e-05} +{"train_loss": 0.0039391061291098595, "global_step": 27129, "epoch": 227, "lr": 6.904714602116663e-05} +{"train_loss": 0.002561231842264533, "global_step": 27130, "epoch": 227, "lr": 6.904509754546327e-05} +{"train_loss": 0.0037836426841642927, "global_step": 27131, "epoch": 227, "lr": 6.904304903236691e-05, "val_loss": 0.018641140311956406} +{"train_loss": 0.002216676250100136, "global_step": 27132, "epoch": 228, "lr": 6.904100048188155e-05} +{"train_loss": 0.0034732918720692396, "global_step": 27133, "epoch": 228, "lr": 6.903895189401122e-05} +{"train_loss": 0.002269483869895339, "global_step": 27134, "epoch": 228, "lr": 6.903690326875994e-05} +{"train_loss": 0.002189562888815999, "global_step": 27135, "epoch": 228, "lr": 6.903485460613174e-05} +{"train_loss": 0.0031746893655508757, "global_step": 27136, "epoch": 228, "lr": 6.903280590613062e-05} +{"train_loss": 0.001763824955560267, "global_step": 27137, "epoch": 228, "lr": 6.903075716876065e-05} +{"train_loss": 0.002029804978519678, "global_step": 27138, "epoch": 228, "lr": 6.90287083940258e-05} +{"train_loss": 0.005289923865348101, "global_step": 27139, "epoch": 228, "lr": 6.902665958193012e-05} +{"train_loss": 0.004513564519584179, "global_step": 27140, "epoch": 228, "lr": 6.902461073247762e-05} +{"train_loss": 0.002629048191010952, "global_step": 27141, "epoch": 228, "lr": 6.902256184567234e-05} +{"train_loss": 0.003123384667560458, "global_step": 27142, "epoch": 228, "lr": 6.902051292151827e-05} +{"train_loss": 0.0036492343060672283, "global_step": 27143, "epoch": 228, "lr": 6.901846396001949e-05} +{"train_loss": 0.00432257866486907, "global_step": 27144, "epoch": 228, "lr": 6.901641496117996e-05} +{"train_loss": 0.0024260245263576508, "global_step": 27145, "epoch": 228, "lr": 6.901436592500374e-05} +{"train_loss": 0.008618728257715702, "global_step": 27146, "epoch": 228, "lr": 6.901231685149484e-05} +{"train_loss": 0.0033824259880930185, "global_step": 27147, "epoch": 228, "lr": 6.901026774065729e-05} +{"train_loss": 0.00330175063572824, "global_step": 27148, "epoch": 228, "lr": 6.900821859249511e-05} +{"train_loss": 0.003507728222757578, "global_step": 27149, "epoch": 228, "lr": 6.900616940701233e-05} +{"train_loss": 0.003923323471099138, "global_step": 27150, "epoch": 228, "lr": 6.900412018421296e-05} +{"train_loss": 0.002110892441123724, "global_step": 27151, "epoch": 228, "lr": 6.900207092410104e-05} +{"train_loss": 0.003783550811931491, "global_step": 27152, "epoch": 228, "lr": 6.900002162668057e-05} +{"train_loss": 0.002572385361418128, "global_step": 27153, "epoch": 228, "lr": 6.89979722919556e-05} +{"train_loss": 0.003488060785457492, "global_step": 27154, "epoch": 228, "lr": 6.899592291993012e-05} +{"train_loss": 0.004277357365936041, "global_step": 27155, "epoch": 228, "lr": 6.89938735106082e-05} +{"train_loss": 0.003332120832055807, "global_step": 27156, "epoch": 228, "lr": 6.899182406399383e-05} +{"train_loss": 0.004738963209092617, "global_step": 27157, "epoch": 228, "lr": 6.898977458009104e-05} +{"train_loss": 0.003997589461505413, "global_step": 27158, "epoch": 228, "lr": 6.898772505890385e-05} +{"train_loss": 0.0027489641215652227, "global_step": 27159, "epoch": 228, "lr": 6.89856755004363e-05} +{"train_loss": 0.005682838149368763, "global_step": 27160, "epoch": 228, "lr": 6.89836259046924e-05} +{"train_loss": 0.0038725007325410843, "global_step": 27161, "epoch": 228, "lr": 6.898157627167618e-05} +{"train_loss": 0.002671991242095828, "global_step": 27162, "epoch": 228, "lr": 6.897952660139166e-05} +{"train_loss": 0.004276016727089882, "global_step": 27163, "epoch": 228, "lr": 6.897747689384286e-05} +{"train_loss": 0.003981146961450577, "global_step": 27164, "epoch": 228, "lr": 6.897542714903382e-05} +{"train_loss": 0.0041532451286911964, "global_step": 27165, "epoch": 228, "lr": 6.897337736696856e-05} +{"train_loss": 0.0037550556007772684, "global_step": 27166, "epoch": 228, "lr": 6.89713275476511e-05} +{"train_loss": 0.0028472740668803453, "global_step": 27167, "epoch": 228, "lr": 6.896927769108545e-05} +{"train_loss": 0.0033784210681915283, "global_step": 27168, "epoch": 228, "lr": 6.896722779727568e-05} +{"train_loss": 0.003039621515199542, "global_step": 27169, "epoch": 228, "lr": 6.896517786622578e-05} +{"train_loss": 0.00467307586222887, "global_step": 27170, "epoch": 228, "lr": 6.896312789793975e-05} +{"train_loss": 0.00388645613566041, "global_step": 27171, "epoch": 228, "lr": 6.896107789242167e-05} +{"train_loss": 0.0031455920543521643, "global_step": 27172, "epoch": 228, "lr": 6.895902784967552e-05} +{"train_loss": 0.004515114240348339, "global_step": 27173, "epoch": 228, "lr": 6.895697776970535e-05} +{"train_loss": 0.003568611340597272, "global_step": 27174, "epoch": 228, "lr": 6.895492765251519e-05} +{"train_loss": 0.0029478000942617655, "global_step": 27175, "epoch": 228, "lr": 6.895287749810906e-05} +{"train_loss": 0.0021523386240005493, "global_step": 27176, "epoch": 228, "lr": 6.895082730649096e-05} +{"train_loss": 0.0024088278878480196, "global_step": 27177, "epoch": 228, "lr": 6.894877707766496e-05} +{"train_loss": 0.00266186217777431, "global_step": 27178, "epoch": 228, "lr": 6.894672681163502e-05} +{"train_loss": 0.0034777673427015543, "global_step": 27179, "epoch": 228, "lr": 6.894467650840523e-05} +{"train_loss": 0.00449276203289628, "global_step": 27180, "epoch": 228, "lr": 6.894262616797959e-05} +{"train_loss": 0.004143285099416971, "global_step": 27181, "epoch": 228, "lr": 6.894057579036214e-05} +{"train_loss": 0.004682197701185942, "global_step": 27182, "epoch": 228, "lr": 6.893852537555687e-05} +{"train_loss": 0.0020422302186489105, "global_step": 27183, "epoch": 228, "lr": 6.893647492356784e-05} +{"train_loss": 0.003220980055630207, "global_step": 27184, "epoch": 228, "lr": 6.893442443439907e-05} +{"train_loss": 0.007539814803749323, "global_step": 27185, "epoch": 228, "lr": 6.893237390805458e-05} +{"train_loss": 0.004275434650480747, "global_step": 27186, "epoch": 228, "lr": 6.893032334453838e-05} +{"train_loss": 0.004272664897143841, "global_step": 27187, "epoch": 228, "lr": 6.892827274385453e-05} +{"train_loss": 0.003299620235338807, "global_step": 27188, "epoch": 228, "lr": 6.892622210600705e-05} +{"train_loss": 0.0030879455152899027, "global_step": 27189, "epoch": 228, "lr": 6.892417143099992e-05} +{"train_loss": 0.002246510237455368, "global_step": 27190, "epoch": 228, "lr": 6.892212071883722e-05} +{"train_loss": 0.005091297440230846, "global_step": 27191, "epoch": 228, "lr": 6.892006996952296e-05} +{"train_loss": 0.0035882177762687206, "global_step": 27192, "epoch": 228, "lr": 6.891801918306117e-05} +{"train_loss": 0.003951504826545715, "global_step": 27193, "epoch": 228, "lr": 6.891596835945585e-05} +{"train_loss": 0.003407510928809643, "global_step": 27194, "epoch": 228, "lr": 6.891391749871106e-05} +{"train_loss": 0.002564437221735716, "global_step": 27195, "epoch": 228, "lr": 6.891186660083081e-05} +{"train_loss": 0.00363391125574708, "global_step": 27196, "epoch": 228, "lr": 6.890981566581914e-05} +{"train_loss": 0.004124123603105545, "global_step": 27197, "epoch": 228, "lr": 6.890776469368005e-05} +{"train_loss": 0.0023991314228624105, "global_step": 27198, "epoch": 228, "lr": 6.89057136844176e-05} +{"train_loss": 0.0033697413746267557, "global_step": 27199, "epoch": 228, "lr": 6.890366263803578e-05} +{"train_loss": 0.0032520988024771214, "global_step": 27200, "epoch": 228, "lr": 6.890161155453867e-05} +{"train_loss": 0.004041297826915979, "global_step": 27201, "epoch": 228, "lr": 6.889956043393024e-05} +{"train_loss": 0.0030399716924875975, "global_step": 27202, "epoch": 228, "lr": 6.889750927621456e-05} +{"train_loss": 0.004509748425334692, "global_step": 27203, "epoch": 228, "lr": 6.889545808139562e-05} +{"train_loss": 0.002899028593674302, "global_step": 27204, "epoch": 228, "lr": 6.889340684947747e-05} +{"train_loss": 0.004521127324551344, "global_step": 27205, "epoch": 228, "lr": 6.889135558046415e-05} +{"train_loss": 0.004015456419438124, "global_step": 27206, "epoch": 228, "lr": 6.888930427435967e-05} +{"train_loss": 0.002349898684769869, "global_step": 27207, "epoch": 228, "lr": 6.888725293116804e-05} +{"train_loss": 0.0029781111516058445, "global_step": 27208, "epoch": 228, "lr": 6.888520155089331e-05} +{"train_loss": 0.004137635231018066, "global_step": 27209, "epoch": 228, "lr": 6.888315013353952e-05} +{"train_loss": 0.002739672316238284, "global_step": 27210, "epoch": 228, "lr": 6.888109867911068e-05} +{"train_loss": 0.0038541737012565136, "global_step": 27211, "epoch": 228, "lr": 6.88790471876108e-05} +{"train_loss": 0.0030228744726628065, "global_step": 27212, "epoch": 228, "lr": 6.887699565904394e-05} +{"train_loss": 0.003474093973636627, "global_step": 27213, "epoch": 228, "lr": 6.887494409341411e-05} +{"train_loss": 0.004046522080898285, "global_step": 27214, "epoch": 228, "lr": 6.887289249072535e-05} +{"train_loss": 0.0046699559316039085, "global_step": 27215, "epoch": 228, "lr": 6.88708408509817e-05} +{"train_loss": 0.0039994800463318825, "global_step": 27216, "epoch": 228, "lr": 6.886878917418715e-05} +{"train_loss": 0.004414320457726717, "global_step": 27217, "epoch": 228, "lr": 6.886673746034575e-05} +{"train_loss": 0.002388997934758663, "global_step": 27218, "epoch": 228, "lr": 6.886468570946151e-05} +{"train_loss": 0.002543845446780324, "global_step": 27219, "epoch": 228, "lr": 6.88626339215385e-05} +{"train_loss": 0.002173182088881731, "global_step": 27220, "epoch": 228, "lr": 6.886058209658072e-05} +{"train_loss": 0.0031004336196929216, "global_step": 27221, "epoch": 228, "lr": 6.88585302345922e-05} +{"train_loss": 0.004209436010569334, "global_step": 27222, "epoch": 228, "lr": 6.885647833557696e-05} +{"train_loss": 0.0021533009130507708, "global_step": 27223, "epoch": 228, "lr": 6.885442639953905e-05} +{"train_loss": 0.00572612788528204, "global_step": 27224, "epoch": 228, "lr": 6.885237442648249e-05} +{"train_loss": 0.003180830040946603, "global_step": 27225, "epoch": 228, "lr": 6.885032241641131e-05} +{"train_loss": 0.004102905746549368, "global_step": 27226, "epoch": 228, "lr": 6.884827036932952e-05} +{"train_loss": 0.0023360401391983032, "global_step": 27227, "epoch": 228, "lr": 6.884621828524117e-05} +{"train_loss": 0.0035441904328763485, "global_step": 27228, "epoch": 228, "lr": 6.884416616415029e-05} +{"train_loss": 0.0024336869828402996, "global_step": 27229, "epoch": 228, "lr": 6.88421140060609e-05} +{"train_loss": 0.002261015120893717, "global_step": 27230, "epoch": 228, "lr": 6.884006181097703e-05} +{"train_loss": 0.006362274754792452, "global_step": 27231, "epoch": 228, "lr": 6.883800957890271e-05} +{"train_loss": 0.003193874144926667, "global_step": 27232, "epoch": 228, "lr": 6.883595730984198e-05} +{"train_loss": 0.0030079723801463842, "global_step": 27233, "epoch": 228, "lr": 6.883390500379885e-05} +{"train_loss": 0.005630810745060444, "global_step": 27234, "epoch": 228, "lr": 6.883185266077737e-05} +{"train_loss": 0.0024793585762381554, "global_step": 27235, "epoch": 228, "lr": 6.882980028078156e-05} +{"train_loss": 0.005804410204291344, "global_step": 27236, "epoch": 228, "lr": 6.882774786381544e-05} +{"train_loss": 0.005216093733906746, "global_step": 27237, "epoch": 228, "lr": 6.882569540988306e-05} +{"train_loss": 0.0034403917379677296, "global_step": 27238, "epoch": 228, "lr": 6.882364291898843e-05} +{"train_loss": 0.0016552304150536656, "global_step": 27239, "epoch": 228, "lr": 6.882159039113558e-05} +{"train_loss": 0.002247690688818693, "global_step": 27240, "epoch": 228, "lr": 6.881953782632855e-05} +{"train_loss": 0.0037525598891079426, "global_step": 27241, "epoch": 228, "lr": 6.881748522457138e-05} +{"train_loss": 0.002933588344603777, "global_step": 27242, "epoch": 228, "lr": 6.881543258586808e-05} +{"train_loss": 0.004288451746106148, "global_step": 27243, "epoch": 228, "lr": 6.881337991022269e-05} +{"train_loss": 0.0019828341901302338, "global_step": 27244, "epoch": 228, "lr": 6.881132719763922e-05} +{"train_loss": 0.002110775327309966, "global_step": 27245, "epoch": 228, "lr": 6.880927444812175e-05} +{"train_loss": 0.003849450498819351, "global_step": 27246, "epoch": 228, "lr": 6.880722166167427e-05} +{"train_loss": 0.0042575811967253685, "global_step": 27247, "epoch": 228, "lr": 6.880516883830082e-05} +{"train_loss": 0.003763705026358366, "global_step": 27248, "epoch": 228, "lr": 6.880311597800542e-05} +{"train_loss": 0.0030405293218791485, "global_step": 27249, "epoch": 228, "lr": 6.88010630807921e-05} +{"train_loss": 0.0035532020529372103, "global_step": 27250, "epoch": 228, "lr": 6.879901014666494e-05, "val_loss": 0.018380772322416306} +{"train_loss": 0.003753075608983636, "global_step": 27251, "epoch": 229, "lr": 6.879695717562791e-05} +{"train_loss": 0.003936389926820993, "global_step": 27252, "epoch": 229, "lr": 6.879490416768506e-05} +{"train_loss": 0.004430308472365141, "global_step": 27253, "epoch": 229, "lr": 6.879285112284042e-05} +{"train_loss": 0.005164389964193106, "global_step": 27254, "epoch": 229, "lr": 6.879079804109803e-05} +{"train_loss": 0.0036747176200151443, "global_step": 27255, "epoch": 229, "lr": 6.878874492246191e-05} +{"train_loss": 0.0027488337364047766, "global_step": 27256, "epoch": 229, "lr": 6.878669176693612e-05} +{"train_loss": 0.0034785300958901644, "global_step": 27257, "epoch": 229, "lr": 6.878463857452464e-05} +{"train_loss": 0.003673620754852891, "global_step": 27258, "epoch": 229, "lr": 6.878258534523155e-05} +{"train_loss": 0.0034701479598879814, "global_step": 27259, "epoch": 229, "lr": 6.878053207906084e-05} +{"train_loss": 0.002954199444502592, "global_step": 27260, "epoch": 229, "lr": 6.877847877601658e-05} +{"train_loss": 0.003608640981838107, "global_step": 27261, "epoch": 229, "lr": 6.877642543610276e-05} +{"train_loss": 0.0030638857278972864, "global_step": 27262, "epoch": 229, "lr": 6.877437205932344e-05} +{"train_loss": 0.0025958879850804806, "global_step": 27263, "epoch": 229, "lr": 6.877231864568266e-05} +{"train_loss": 0.001680833869613707, "global_step": 27264, "epoch": 229, "lr": 6.877026519518444e-05} +{"train_loss": 0.0046133375726640224, "global_step": 27265, "epoch": 229, "lr": 6.87682117078328e-05} +{"train_loss": 0.003718010615557432, "global_step": 27266, "epoch": 229, "lr": 6.876615818363177e-05} +{"train_loss": 0.0023842703085392714, "global_step": 27267, "epoch": 229, "lr": 6.876410462258542e-05} +{"train_loss": 0.0036634437274187803, "global_step": 27268, "epoch": 229, "lr": 6.876205102469774e-05} +{"train_loss": 0.0031449594534933567, "global_step": 27269, "epoch": 229, "lr": 6.875999738997279e-05} +{"train_loss": 0.0036759458016604185, "global_step": 27270, "epoch": 229, "lr": 6.875794371841458e-05} +{"train_loss": 0.00623964611440897, "global_step": 27271, "epoch": 229, "lr": 6.875589001002714e-05} +{"train_loss": 0.0030093409586697817, "global_step": 27272, "epoch": 229, "lr": 6.875383626481453e-05} +{"train_loss": 0.002555384999141097, "global_step": 27273, "epoch": 229, "lr": 6.875178248278075e-05} +{"train_loss": 0.00417097844183445, "global_step": 27274, "epoch": 229, "lr": 6.874972866392986e-05} +{"train_loss": 0.006741966120898724, "global_step": 27275, "epoch": 229, "lr": 6.874767480826588e-05} +{"train_loss": 0.00347485882230103, "global_step": 27276, "epoch": 229, "lr": 6.874562091579284e-05} +{"train_loss": 0.003512660041451454, "global_step": 27277, "epoch": 229, "lr": 6.874356698651479e-05} +{"train_loss": 0.0025696882512420416, "global_step": 27278, "epoch": 229, "lr": 6.874151302043573e-05} +{"train_loss": 0.003239140845835209, "global_step": 27279, "epoch": 229, "lr": 6.873945901755971e-05} +{"train_loss": 0.0050309887155890465, "global_step": 27280, "epoch": 229, "lr": 6.873740497789078e-05} +{"train_loss": 0.0033279499039053917, "global_step": 27281, "epoch": 229, "lr": 6.873535090143296e-05} +{"train_loss": 0.0027888205368071795, "global_step": 27282, "epoch": 229, "lr": 6.873329678819028e-05} +{"train_loss": 0.006022904999554157, "global_step": 27283, "epoch": 229, "lr": 6.873124263816675e-05} +{"train_loss": 0.0042920359410345554, "global_step": 27284, "epoch": 229, "lr": 6.872918845136645e-05} +{"train_loss": 0.004429420456290245, "global_step": 27285, "epoch": 229, "lr": 6.872713422779337e-05} +{"train_loss": 0.0020892759785056114, "global_step": 27286, "epoch": 229, "lr": 6.872507996745157e-05} +{"train_loss": 0.0023020184598863125, "global_step": 27287, "epoch": 229, "lr": 6.872302567034508e-05} +{"train_loss": 0.004559505730867386, "global_step": 27288, "epoch": 229, "lr": 6.872097133647793e-05} +{"train_loss": 0.0030329686123877764, "global_step": 27289, "epoch": 229, "lr": 6.871891696585415e-05} +{"train_loss": 0.003985944669693708, "global_step": 27290, "epoch": 229, "lr": 6.871686255847778e-05} +{"train_loss": 0.004759030882269144, "global_step": 27291, "epoch": 229, "lr": 6.871480811435285e-05} +{"train_loss": 0.005042807199060917, "global_step": 27292, "epoch": 229, "lr": 6.871275363348338e-05} +{"train_loss": 0.005276814568787813, "global_step": 27293, "epoch": 229, "lr": 6.871069911587343e-05} +{"train_loss": 0.0027498516719788313, "global_step": 27294, "epoch": 229, "lr": 6.870864456152702e-05} +{"train_loss": 0.003124665003269911, "global_step": 27295, "epoch": 229, "lr": 6.870658997044818e-05} +{"train_loss": 0.004237085580825806, "global_step": 27296, "epoch": 229, "lr": 6.870453534264096e-05} +{"train_loss": 0.002665339969098568, "global_step": 27297, "epoch": 229, "lr": 6.870248067810936e-05} +{"train_loss": 0.0031764013692736626, "global_step": 27298, "epoch": 229, "lr": 6.870042597685747e-05} +{"train_loss": 0.0044487155973911285, "global_step": 27299, "epoch": 229, "lr": 6.869837123888926e-05} +{"train_loss": 0.004069707356393337, "global_step": 27300, "epoch": 229, "lr": 6.869631646420882e-05} +{"train_loss": 0.004014716949313879, "global_step": 27301, "epoch": 229, "lr": 6.869426165282014e-05} +{"train_loss": 0.0028522894717752934, "global_step": 27302, "epoch": 229, "lr": 6.86922068047273e-05} +{"train_loss": 0.00170292635448277, "global_step": 27303, "epoch": 229, "lr": 6.869015191993428e-05} +{"train_loss": 0.005837750155478716, "global_step": 27304, "epoch": 229, "lr": 6.868809699844517e-05} +{"train_loss": 0.0036120533477514982, "global_step": 27305, "epoch": 229, "lr": 6.868604204026396e-05} +{"train_loss": 0.004087317734956741, "global_step": 27306, "epoch": 229, "lr": 6.868398704539471e-05} +{"train_loss": 0.003061913186684251, "global_step": 27307, "epoch": 229, "lr": 6.868193201384146e-05} +{"train_loss": 0.005184544716030359, "global_step": 27308, "epoch": 229, "lr": 6.86798769456082e-05} +{"train_loss": 0.004409469198435545, "global_step": 27309, "epoch": 229, "lr": 6.867782184069902e-05} +{"train_loss": 0.0034432050306349993, "global_step": 27310, "epoch": 229, "lr": 6.867576669911792e-05} +{"train_loss": 0.005958183668553829, "global_step": 27311, "epoch": 229, "lr": 6.867371152086894e-05} +{"train_loss": 0.0036475793458521366, "global_step": 27312, "epoch": 229, "lr": 6.867165630595615e-05} +{"train_loss": 0.0043359845876693726, "global_step": 27313, "epoch": 229, "lr": 6.866960105438355e-05} +{"train_loss": 0.0061235069297254086, "global_step": 27314, "epoch": 229, "lr": 6.866754576615517e-05} +{"train_loss": 0.00412162346765399, "global_step": 27315, "epoch": 229, "lr": 6.866549044127507e-05} +{"train_loss": 0.0042093535885214806, "global_step": 27316, "epoch": 229, "lr": 6.866343507974726e-05} +{"train_loss": 0.0026823857333511114, "global_step": 27317, "epoch": 229, "lr": 6.866137968157581e-05} +{"train_loss": 0.005506397690623999, "global_step": 27318, "epoch": 229, "lr": 6.865932424676473e-05} +{"train_loss": 0.004189667291939259, "global_step": 27319, "epoch": 229, "lr": 6.865726877531805e-05} +{"train_loss": 0.0034470907412469387, "global_step": 27320, "epoch": 229, "lr": 6.865521326723983e-05} +{"train_loss": 0.0027839995454996824, "global_step": 27321, "epoch": 229, "lr": 6.865315772253407e-05} +{"train_loss": 0.004153993912041187, "global_step": 27322, "epoch": 229, "lr": 6.865110214120484e-05} +{"train_loss": 0.00441960571333766, "global_step": 27323, "epoch": 229, "lr": 6.864904652325617e-05} +{"train_loss": 0.0038344154600054026, "global_step": 27324, "epoch": 229, "lr": 6.864699086869208e-05} +{"train_loss": 0.00590426055714488, "global_step": 27325, "epoch": 229, "lr": 6.864493517751662e-05} +{"train_loss": 0.007027056999504566, "global_step": 27326, "epoch": 229, "lr": 6.864287944973379e-05} +{"train_loss": 0.0045059495605528355, "global_step": 27327, "epoch": 229, "lr": 6.86408236853477e-05} +{"train_loss": 0.002903902204707265, "global_step": 27328, "epoch": 229, "lr": 6.863876788436233e-05} +{"train_loss": 0.004200709983706474, "global_step": 27329, "epoch": 229, "lr": 6.863671204678174e-05} +{"train_loss": 0.003702619345858693, "global_step": 27330, "epoch": 229, "lr": 6.863465617260993e-05} +{"train_loss": 0.0025021452456712723, "global_step": 27331, "epoch": 229, "lr": 6.8632600261851e-05} +{"train_loss": 0.003556584008038044, "global_step": 27332, "epoch": 229, "lr": 6.863054431450892e-05} +{"train_loss": 0.00268719089217484, "global_step": 27333, "epoch": 229, "lr": 6.862848833058778e-05} +{"train_loss": 0.004757529124617577, "global_step": 27334, "epoch": 229, "lr": 6.862643231009158e-05} +{"train_loss": 0.0030473212245851755, "global_step": 27335, "epoch": 229, "lr": 6.862437625302437e-05} +{"train_loss": 0.008066749200224876, "global_step": 27336, "epoch": 229, "lr": 6.862232015939019e-05} +{"train_loss": 0.004142118152230978, "global_step": 27337, "epoch": 229, "lr": 6.862026402919307e-05} +{"train_loss": 0.005299422424286604, "global_step": 27338, "epoch": 229, "lr": 6.861820786243707e-05} +{"train_loss": 0.004675254225730896, "global_step": 27339, "epoch": 229, "lr": 6.861615165912618e-05} +{"train_loss": 0.0036773807369172573, "global_step": 27340, "epoch": 229, "lr": 6.86140954192645e-05} +{"train_loss": 0.004075432661920786, "global_step": 27341, "epoch": 229, "lr": 6.861203914285599e-05} +{"train_loss": 0.003772524418309331, "global_step": 27342, "epoch": 229, "lr": 6.860998282990475e-05} +{"train_loss": 0.008659039624035358, "global_step": 27343, "epoch": 229, "lr": 6.86079264804148e-05} +{"train_loss": 0.0030076908878982067, "global_step": 27344, "epoch": 229, "lr": 6.860587009439017e-05} +{"train_loss": 0.004919618368148804, "global_step": 27345, "epoch": 229, "lr": 6.86038136718349e-05} +{"train_loss": 0.0023683980107307434, "global_step": 27346, "epoch": 229, "lr": 6.860175721275302e-05} +{"train_loss": 0.002969005610793829, "global_step": 27347, "epoch": 229, "lr": 6.859970071714858e-05} +{"train_loss": 0.006520998198539019, "global_step": 27348, "epoch": 229, "lr": 6.859764418502563e-05} +{"train_loss": 0.00473241601139307, "global_step": 27349, "epoch": 229, "lr": 6.85955876163882e-05} +{"train_loss": 0.0031293025240302086, "global_step": 27350, "epoch": 229, "lr": 6.859353101124031e-05} +{"train_loss": 0.002896419959142804, "global_step": 27351, "epoch": 229, "lr": 6.859147436958599e-05} +{"train_loss": 0.0035409557167440653, "global_step": 27352, "epoch": 229, "lr": 6.858941769142931e-05} +{"train_loss": 0.0036540634464472532, "global_step": 27353, "epoch": 229, "lr": 6.85873609767743e-05} +{"train_loss": 0.004079979844391346, "global_step": 27354, "epoch": 229, "lr": 6.858530422562498e-05} +{"train_loss": 0.0033572441898286343, "global_step": 27355, "epoch": 229, "lr": 6.858324743798542e-05} +{"train_loss": 0.0019606887362897396, "global_step": 27356, "epoch": 229, "lr": 6.858119061385963e-05} +{"train_loss": 0.003940167371183634, "global_step": 27357, "epoch": 229, "lr": 6.857913375325165e-05} +{"train_loss": 0.0028552664443850517, "global_step": 27358, "epoch": 229, "lr": 6.857707685616552e-05} +{"train_loss": 0.007831085473299026, "global_step": 27359, "epoch": 229, "lr": 6.857501992260529e-05} +{"train_loss": 0.002476075431331992, "global_step": 27360, "epoch": 229, "lr": 6.8572962952575e-05} +{"train_loss": 0.006258155684918165, "global_step": 27361, "epoch": 229, "lr": 6.857090594607868e-05} +{"train_loss": 0.004405679646879435, "global_step": 27362, "epoch": 229, "lr": 6.856884890312036e-05} +{"train_loss": 0.002800420392304659, "global_step": 27363, "epoch": 229, "lr": 6.856679182370412e-05} +{"train_loss": 0.003118057968094945, "global_step": 27364, "epoch": 229, "lr": 6.856473470783394e-05} +{"train_loss": 0.004910244606435299, "global_step": 27365, "epoch": 229, "lr": 6.856267755551389e-05} +{"train_loss": 0.006619296036660671, "global_step": 27366, "epoch": 229, "lr": 6.8560620366748e-05} +{"train_loss": 0.0030859613325446844, "global_step": 27367, "epoch": 229, "lr": 6.855856314154032e-05} +{"train_loss": 0.006388324312865734, "global_step": 27368, "epoch": 229, "lr": 6.855650587989489e-05} +{"train_loss": 0.004012119800768041, "global_step": 27369, "epoch": 229, "lr": 6.855444858181574e-05, "val_loss": 0.014893101528286934} +{"train_loss": 0.0033160275779664516, "global_step": 27370, "epoch": 230, "lr": 6.855239124730692e-05} +{"train_loss": 0.004763502161949873, "global_step": 27371, "epoch": 230, "lr": 6.855033387637246e-05} +{"train_loss": 0.003974159248173237, "global_step": 27372, "epoch": 230, "lr": 6.854827646901638e-05} +{"train_loss": 0.004428774584084749, "global_step": 27373, "epoch": 230, "lr": 6.854621902524276e-05} +{"train_loss": 0.00230269692838192, "global_step": 27374, "epoch": 230, "lr": 6.854416154505561e-05} +{"train_loss": 0.0029159733094274998, "global_step": 27375, "epoch": 230, "lr": 6.854210402845899e-05} +{"train_loss": 0.0037724399007856846, "global_step": 27376, "epoch": 230, "lr": 6.854004647545694e-05} +{"train_loss": 0.002778403228148818, "global_step": 27377, "epoch": 230, "lr": 6.853798888605346e-05} +{"train_loss": 0.003637854242697358, "global_step": 27378, "epoch": 230, "lr": 6.853593126025264e-05} +{"train_loss": 0.004383017774671316, "global_step": 27379, "epoch": 230, "lr": 6.853387359805849e-05} +{"train_loss": 0.003124566050246358, "global_step": 27380, "epoch": 230, "lr": 6.853181589947506e-05} +{"train_loss": 0.006011916324496269, "global_step": 27381, "epoch": 230, "lr": 6.85297581645064e-05} +{"train_loss": 0.0029412962030619383, "global_step": 27382, "epoch": 230, "lr": 6.852770039315653e-05} +{"train_loss": 0.004114922136068344, "global_step": 27383, "epoch": 230, "lr": 6.85256425854295e-05} +{"train_loss": 0.002508737612515688, "global_step": 27384, "epoch": 230, "lr": 6.852358474132937e-05} +{"train_loss": 0.002758974675089121, "global_step": 27385, "epoch": 230, "lr": 6.852152686086013e-05} +{"train_loss": 0.0034710008185356855, "global_step": 27386, "epoch": 230, "lr": 6.851946894402585e-05} +{"train_loss": 0.0053516593761742115, "global_step": 27387, "epoch": 230, "lr": 6.85174109908306e-05} +{"train_loss": 0.003633375745266676, "global_step": 27388, "epoch": 230, "lr": 6.851535300127839e-05} +{"train_loss": 0.001936661428771913, "global_step": 27389, "epoch": 230, "lr": 6.851329497537323e-05} +{"train_loss": 0.0033547787461429834, "global_step": 27390, "epoch": 230, "lr": 6.851123691311922e-05} +{"train_loss": 0.0049805548042058945, "global_step": 27391, "epoch": 230, "lr": 6.850917881452036e-05} +{"train_loss": 0.0052479044534265995, "global_step": 27392, "epoch": 230, "lr": 6.850712067958072e-05} +{"train_loss": 0.005675749387592077, "global_step": 27393, "epoch": 230, "lr": 6.85050625083043e-05} +{"train_loss": 0.0035076909698545933, "global_step": 27394, "epoch": 230, "lr": 6.850300430069518e-05} +{"train_loss": 0.006866233889013529, "global_step": 27395, "epoch": 230, "lr": 6.85009460567574e-05} +{"train_loss": 0.002844165777787566, "global_step": 27396, "epoch": 230, "lr": 6.849888777649498e-05} +{"train_loss": 0.006222842261195183, "global_step": 27397, "epoch": 230, "lr": 6.849682945991196e-05} +{"train_loss": 0.0033304591197520494, "global_step": 27398, "epoch": 230, "lr": 6.84947711070124e-05} +{"train_loss": 0.0039167022332549095, "global_step": 27399, "epoch": 230, "lr": 6.849271271780034e-05} +{"train_loss": 0.003595400135964155, "global_step": 27400, "epoch": 230, "lr": 6.849065429227981e-05} +{"train_loss": 0.0036343089304864407, "global_step": 27401, "epoch": 230, "lr": 6.848859583045487e-05} +{"train_loss": 0.0028671782929450274, "global_step": 27402, "epoch": 230, "lr": 6.848653733232952e-05} +{"train_loss": 0.004465762060135603, "global_step": 27403, "epoch": 230, "lr": 6.848447879790783e-05} +{"train_loss": 0.008166788145899773, "global_step": 27404, "epoch": 230, "lr": 6.848242022719386e-05} +{"train_loss": 0.0028405420016497374, "global_step": 27405, "epoch": 230, "lr": 6.848036162019162e-05} +{"train_loss": 0.0040083336643874645, "global_step": 27406, "epoch": 230, "lr": 6.847830297690517e-05} +{"train_loss": 0.005641949828714132, "global_step": 27407, "epoch": 230, "lr": 6.847624429733854e-05} +{"train_loss": 0.005122085101902485, "global_step": 27408, "epoch": 230, "lr": 6.847418558149578e-05} +{"train_loss": 0.004508845042437315, "global_step": 27409, "epoch": 230, "lr": 6.847212682938093e-05} +{"train_loss": 0.003361167386174202, "global_step": 27410, "epoch": 230, "lr": 6.847006804099803e-05} +{"train_loss": 0.003032726002857089, "global_step": 27411, "epoch": 230, "lr": 6.846800921635112e-05} +{"train_loss": 0.0028647975996136665, "global_step": 27412, "epoch": 230, "lr": 6.846595035544426e-05} +{"train_loss": 0.0058321114629507065, "global_step": 27413, "epoch": 230, "lr": 6.846389145828149e-05} +{"train_loss": 0.004224799107760191, "global_step": 27414, "epoch": 230, "lr": 6.846183252486683e-05} +{"train_loss": 0.005184713285416365, "global_step": 27415, "epoch": 230, "lr": 6.845977355520434e-05} +{"train_loss": 0.004254388157278299, "global_step": 27416, "epoch": 230, "lr": 6.845771454929804e-05} +{"train_loss": 0.005073595326393843, "global_step": 27417, "epoch": 230, "lr": 6.8455655507152e-05} +{"train_loss": 0.005785741377621889, "global_step": 27418, "epoch": 230, "lr": 6.845359642877024e-05} +{"train_loss": 0.004287643823772669, "global_step": 27419, "epoch": 230, "lr": 6.845153731415683e-05} +{"train_loss": 0.005059282295405865, "global_step": 27420, "epoch": 230, "lr": 6.84494781633158e-05} +{"train_loss": 0.004338993225246668, "global_step": 27421, "epoch": 230, "lr": 6.844741897625117e-05} +{"train_loss": 0.002620765706524253, "global_step": 27422, "epoch": 230, "lr": 6.844535975296703e-05} +{"train_loss": 0.006068785209208727, "global_step": 27423, "epoch": 230, "lr": 6.844330049346737e-05} +{"train_loss": 0.0061621409840881824, "global_step": 27424, "epoch": 230, "lr": 6.844124119775628e-05} +{"train_loss": 0.0031530458945780993, "global_step": 27425, "epoch": 230, "lr": 6.843918186583778e-05} +{"train_loss": 0.004106590058654547, "global_step": 27426, "epoch": 230, "lr": 6.84371224977159e-05} +{"train_loss": 0.004291127901524305, "global_step": 27427, "epoch": 230, "lr": 6.843506309339472e-05} +{"train_loss": 0.003423156216740608, "global_step": 27428, "epoch": 230, "lr": 6.843300365287825e-05} +{"train_loss": 0.005162376444786787, "global_step": 27429, "epoch": 230, "lr": 6.843094417617055e-05} +{"train_loss": 0.006610256619751453, "global_step": 27430, "epoch": 230, "lr": 6.842888466327566e-05} +{"train_loss": 0.003696753177791834, "global_step": 27431, "epoch": 230, "lr": 6.842682511419763e-05} +{"train_loss": 0.006411661393940449, "global_step": 27432, "epoch": 230, "lr": 6.84247655289405e-05} +{"train_loss": 0.0030638319440186024, "global_step": 27433, "epoch": 230, "lr": 6.84227059075083e-05} +{"train_loss": 0.004446961916983128, "global_step": 27434, "epoch": 230, "lr": 6.84206462499051e-05} +{"train_loss": 0.0035839013289660215, "global_step": 27435, "epoch": 230, "lr": 6.841858655613492e-05} +{"train_loss": 0.00436297757551074, "global_step": 27436, "epoch": 230, "lr": 6.84165268262018e-05} +{"train_loss": 0.004920440725982189, "global_step": 27437, "epoch": 230, "lr": 6.841446706010981e-05} +{"train_loss": 0.003750718431547284, "global_step": 27438, "epoch": 230, "lr": 6.841240725786298e-05} +{"train_loss": 0.0042997365817427635, "global_step": 27439, "epoch": 230, "lr": 6.841034741946537e-05} +{"train_loss": 0.003819713369011879, "global_step": 27440, "epoch": 230, "lr": 6.840828754492099e-05} +{"train_loss": 0.003986682277172804, "global_step": 27441, "epoch": 230, "lr": 6.840622763423391e-05} +{"train_loss": 0.0024556266143918037, "global_step": 27442, "epoch": 230, "lr": 6.840416768740817e-05} +{"train_loss": 0.00354445306584239, "global_step": 27443, "epoch": 230, "lr": 6.840210770444779e-05} +{"train_loss": 0.003799028927460313, "global_step": 27444, "epoch": 230, "lr": 6.840004768535687e-05} +{"train_loss": 0.004640062339603901, "global_step": 27445, "epoch": 230, "lr": 6.839798763013942e-05} +{"train_loss": 0.004263537470251322, "global_step": 27446, "epoch": 230, "lr": 6.839592753879947e-05} +{"train_loss": 0.00545525411143899, "global_step": 27447, "epoch": 230, "lr": 6.839386741134109e-05} +{"train_loss": 0.002241747220978141, "global_step": 27448, "epoch": 230, "lr": 6.839180724776831e-05} +{"train_loss": 0.0027506838086992502, "global_step": 27449, "epoch": 230, "lr": 6.838974704808519e-05} +{"train_loss": 0.0034209724981337786, "global_step": 27450, "epoch": 230, "lr": 6.838768681229576e-05} +{"train_loss": 0.0031187578570097685, "global_step": 27451, "epoch": 230, "lr": 6.838562654040408e-05} +{"train_loss": 0.004278632812201977, "global_step": 27452, "epoch": 230, "lr": 6.838356623241417e-05} +{"train_loss": 0.0063901739194989204, "global_step": 27453, "epoch": 230, "lr": 6.838150588833011e-05} +{"train_loss": 0.00288011459633708, "global_step": 27454, "epoch": 230, "lr": 6.837944550815591e-05} +{"train_loss": 0.005753961391746998, "global_step": 27455, "epoch": 230, "lr": 6.837738509189565e-05} +{"train_loss": 0.004739781841635704, "global_step": 27456, "epoch": 230, "lr": 6.837532463955335e-05} +{"train_loss": 0.0029197665862739086, "global_step": 27457, "epoch": 230, "lr": 6.837326415113306e-05} +{"train_loss": 0.002978171454742551, "global_step": 27458, "epoch": 230, "lr": 6.837120362663884e-05} +{"train_loss": 0.00416173692792654, "global_step": 27459, "epoch": 230, "lr": 6.83691430660747e-05} +{"train_loss": 0.0045018065720796585, "global_step": 27460, "epoch": 230, "lr": 6.836708246944473e-05} +{"train_loss": 0.002810381120070815, "global_step": 27461, "epoch": 230, "lr": 6.836502183675295e-05} +{"train_loss": 0.004721739795058966, "global_step": 27462, "epoch": 230, "lr": 6.836296116800342e-05} +{"train_loss": 0.004595469683408737, "global_step": 27463, "epoch": 230, "lr": 6.836090046320017e-05} +{"train_loss": 0.00459341611713171, "global_step": 27464, "epoch": 230, "lr": 6.835883972234725e-05} +{"train_loss": 0.004075370263308287, "global_step": 27465, "epoch": 230, "lr": 6.835677894544872e-05} +{"train_loss": 0.004020243883132935, "global_step": 27466, "epoch": 230, "lr": 6.835471813250861e-05} +{"train_loss": 0.003437807084992528, "global_step": 27467, "epoch": 230, "lr": 6.835265728353097e-05} +{"train_loss": 0.002557117026299238, "global_step": 27468, "epoch": 230, "lr": 6.835059639851985e-05} +{"train_loss": 0.001638146466575563, "global_step": 27469, "epoch": 230, "lr": 6.83485354774793e-05} +{"train_loss": 0.0037807156331837177, "global_step": 27470, "epoch": 230, "lr": 6.834647452041336e-05} +{"train_loss": 0.0036236303858458996, "global_step": 27471, "epoch": 230, "lr": 6.834441352732606e-05} +{"train_loss": 0.002057329285889864, "global_step": 27472, "epoch": 230, "lr": 6.834235249822148e-05} +{"train_loss": 0.0021458533592522144, "global_step": 27473, "epoch": 230, "lr": 6.834029143310366e-05} +{"train_loss": 0.002254107967019081, "global_step": 27474, "epoch": 230, "lr": 6.833823033197662e-05} +{"train_loss": 0.0015088381478562951, "global_step": 27475, "epoch": 230, "lr": 6.833616919484442e-05} +{"train_loss": 0.00458418158814311, "global_step": 27476, "epoch": 230, "lr": 6.833410802171112e-05} +{"train_loss": 0.004411847330629826, "global_step": 27477, "epoch": 230, "lr": 6.833204681258076e-05} +{"train_loss": 0.002514827763661742, "global_step": 27478, "epoch": 230, "lr": 6.832998556745736e-05} +{"train_loss": 0.002854117890819907, "global_step": 27479, "epoch": 230, "lr": 6.832792428634502e-05} +{"train_loss": 0.0024695871397852898, "global_step": 27480, "epoch": 230, "lr": 6.832586296924775e-05} +{"train_loss": 0.0038916494231671095, "global_step": 27481, "epoch": 230, "lr": 6.83238016161696e-05} +{"train_loss": 0.003492813091725111, "global_step": 27482, "epoch": 230, "lr": 6.832174022711464e-05} +{"train_loss": 0.0037576230242848396, "global_step": 27483, "epoch": 230, "lr": 6.83196788020869e-05} +{"train_loss": 0.003543614875525236, "global_step": 27484, "epoch": 230, "lr": 6.831761734109041e-05} +{"train_loss": 0.002611343516036868, "global_step": 27485, "epoch": 230, "lr": 6.831555584412924e-05} +{"train_loss": 0.0052216374315321445, "global_step": 27486, "epoch": 230, "lr": 6.831349431120744e-05} +{"train_loss": 0.003570035332813859, "global_step": 27487, "epoch": 230, "lr": 6.831143274232903e-05} +{"train_loss": 0.003961764016783475, "global_step": 27488, "epoch": 230, "lr": 6.830937113749811e-05, "val_loss": 0.027682123705744743, "train_action_mse_error": 6.345228757709265e-05} +{"train_loss": 0.0025518820621073246, "global_step": 27489, "epoch": 231, "lr": 6.830730949671868e-05} +{"train_loss": 0.0018717010971158743, "global_step": 27490, "epoch": 231, "lr": 6.830524781999481e-05} +{"train_loss": 0.0039385161362588406, "global_step": 27491, "epoch": 231, "lr": 6.830318610733053e-05} +{"train_loss": 0.0027692934963852167, "global_step": 27492, "epoch": 231, "lr": 6.830112435872989e-05} +{"train_loss": 0.0029657878912985325, "global_step": 27493, "epoch": 231, "lr": 6.829906257419697e-05} +{"train_loss": 0.0030168304219841957, "global_step": 27494, "epoch": 231, "lr": 6.829700075373579e-05} +{"train_loss": 0.0017166199395433068, "global_step": 27495, "epoch": 231, "lr": 6.829493889735042e-05} +{"train_loss": 0.0027614901773631573, "global_step": 27496, "epoch": 231, "lr": 6.829287700504487e-05} +{"train_loss": 0.002801260445266962, "global_step": 27497, "epoch": 231, "lr": 6.82908150768232e-05} +{"train_loss": 0.0023358953185379505, "global_step": 27498, "epoch": 231, "lr": 6.828875311268949e-05} +{"train_loss": 0.0034828768111765385, "global_step": 27499, "epoch": 231, "lr": 6.828669111264776e-05} +{"train_loss": 0.002375513082370162, "global_step": 27500, "epoch": 231, "lr": 6.828462907670205e-05} +{"train_loss": 0.003979471977800131, "global_step": 27501, "epoch": 231, "lr": 6.828256700485646e-05} +{"train_loss": 0.002615711186081171, "global_step": 27502, "epoch": 231, "lr": 6.828050489711498e-05} +{"train_loss": 0.0033553866669535637, "global_step": 27503, "epoch": 231, "lr": 6.827844275348169e-05} +{"train_loss": 0.002160388510674238, "global_step": 27504, "epoch": 231, "lr": 6.827638057396062e-05} +{"train_loss": 0.003527125809341669, "global_step": 27505, "epoch": 231, "lr": 6.827431835855583e-05} +{"train_loss": 0.002120189368724823, "global_step": 27506, "epoch": 231, "lr": 6.827225610727138e-05} +{"train_loss": 0.0030872575007379055, "global_step": 27507, "epoch": 231, "lr": 6.82701938201113e-05} +{"train_loss": 0.003420973429456353, "global_step": 27508, "epoch": 231, "lr": 6.826813149707964e-05} +{"train_loss": 0.004411895759403706, "global_step": 27509, "epoch": 231, "lr": 6.826606913818045e-05} +{"train_loss": 0.006264365278184414, "global_step": 27510, "epoch": 231, "lr": 6.82640067434178e-05} +{"train_loss": 0.00277512869797647, "global_step": 27511, "epoch": 231, "lr": 6.826194431279573e-05} +{"train_loss": 0.004649017006158829, "global_step": 27512, "epoch": 231, "lr": 6.825988184631827e-05} +{"train_loss": 0.0029020546935498714, "global_step": 27513, "epoch": 231, "lr": 6.82578193439895e-05} +{"train_loss": 0.004544263239949942, "global_step": 27514, "epoch": 231, "lr": 6.825575680581343e-05} +{"train_loss": 0.00338528910651803, "global_step": 27515, "epoch": 231, "lr": 6.825369423179413e-05} +{"train_loss": 0.004225661512464285, "global_step": 27516, "epoch": 231, "lr": 6.825163162193567e-05} +{"train_loss": 0.0038084769621491432, "global_step": 27517, "epoch": 231, "lr": 6.824956897624207e-05} +{"train_loss": 0.0026648531202226877, "global_step": 27518, "epoch": 231, "lr": 6.824750629471739e-05} +{"train_loss": 0.005692600272595882, "global_step": 27519, "epoch": 231, "lr": 6.82454435773657e-05} +{"train_loss": 0.0026496904902160168, "global_step": 27520, "epoch": 231, "lr": 6.824338082419102e-05} +{"train_loss": 0.0018763199914246798, "global_step": 27521, "epoch": 231, "lr": 6.824131803519739e-05} +{"train_loss": 0.001842390513047576, "global_step": 27522, "epoch": 231, "lr": 6.823925521038891e-05} +{"train_loss": 0.002120153745636344, "global_step": 27523, "epoch": 231, "lr": 6.823719234976958e-05} +{"train_loss": 0.004237532150000334, "global_step": 27524, "epoch": 231, "lr": 6.823512945334348e-05} +{"train_loss": 0.004178881179541349, "global_step": 27525, "epoch": 231, "lr": 6.823306652111465e-05} +{"train_loss": 0.0023723531048744917, "global_step": 27526, "epoch": 231, "lr": 6.823100355308715e-05} +{"train_loss": 0.00447428971529007, "global_step": 27527, "epoch": 231, "lr": 6.8228940549265e-05} +{"train_loss": 0.003345467383041978, "global_step": 27528, "epoch": 231, "lr": 6.82268775096523e-05} +{"train_loss": 0.0023726054932922125, "global_step": 27529, "epoch": 231, "lr": 6.822481443425306e-05} +{"train_loss": 0.0037319310940802097, "global_step": 27530, "epoch": 231, "lr": 6.822275132307134e-05} +{"train_loss": 0.003170761978253722, "global_step": 27531, "epoch": 231, "lr": 6.82206881761112e-05} +{"train_loss": 0.0036088533233851194, "global_step": 27532, "epoch": 231, "lr": 6.821862499337669e-05} +{"train_loss": 0.0035256054252386093, "global_step": 27533, "epoch": 231, "lr": 6.821656177487186e-05} +{"train_loss": 0.003739802399650216, "global_step": 27534, "epoch": 231, "lr": 6.821449852060073e-05} +{"train_loss": 0.0030038042459636927, "global_step": 27535, "epoch": 231, "lr": 6.821243523056741e-05} +{"train_loss": 0.002809440018609166, "global_step": 27536, "epoch": 231, "lr": 6.821037190477591e-05} +{"train_loss": 0.0033329525031149387, "global_step": 27537, "epoch": 231, "lr": 6.820830854323027e-05} +{"train_loss": 0.003519821912050247, "global_step": 27538, "epoch": 231, "lr": 6.820624514593459e-05} +{"train_loss": 0.003195415250957012, "global_step": 27539, "epoch": 231, "lr": 6.820418171289287e-05} +{"train_loss": 0.0020127033349126577, "global_step": 27540, "epoch": 231, "lr": 6.820211824410919e-05} +{"train_loss": 0.004056165460497141, "global_step": 27541, "epoch": 231, "lr": 6.82000547395876e-05} +{"train_loss": 0.00387542974203825, "global_step": 27542, "epoch": 231, "lr": 6.819799119933215e-05} +{"train_loss": 0.003527960041537881, "global_step": 27543, "epoch": 231, "lr": 6.819592762334688e-05} +{"train_loss": 0.0028746449388563633, "global_step": 27544, "epoch": 231, "lr": 6.819386401163585e-05} +{"train_loss": 0.0030824739951640368, "global_step": 27545, "epoch": 231, "lr": 6.819180036420313e-05} +{"train_loss": 0.0023431070148944855, "global_step": 27546, "epoch": 231, "lr": 6.818973668105273e-05} +{"train_loss": 0.0022678428795188665, "global_step": 27547, "epoch": 231, "lr": 6.818767296218874e-05} +{"train_loss": 0.003039043629541993, "global_step": 27548, "epoch": 231, "lr": 6.818560920761519e-05} +{"train_loss": 0.004218015819787979, "global_step": 27549, "epoch": 231, "lr": 6.818354541733614e-05} +{"train_loss": 0.0034311627969145775, "global_step": 27550, "epoch": 231, "lr": 6.818148159135565e-05} +{"train_loss": 0.00448458781465888, "global_step": 27551, "epoch": 231, "lr": 6.817941772967777e-05} +{"train_loss": 0.006304947193711996, "global_step": 27552, "epoch": 231, "lr": 6.817735383230652e-05} +{"train_loss": 0.0027035819366574287, "global_step": 27553, "epoch": 231, "lr": 6.817528989924598e-05} +{"train_loss": 0.00528402766212821, "global_step": 27554, "epoch": 231, "lr": 6.817322593050022e-05} +{"train_loss": 0.0030066154431551695, "global_step": 27555, "epoch": 231, "lr": 6.817116192607325e-05} +{"train_loss": 0.0026840127538889647, "global_step": 27556, "epoch": 231, "lr": 6.816909788596916e-05} +{"train_loss": 0.004592616111040115, "global_step": 27557, "epoch": 231, "lr": 6.816703381019198e-05} +{"train_loss": 0.004238674882799387, "global_step": 27558, "epoch": 231, "lr": 6.816496969874577e-05} +{"train_loss": 0.003992016892880201, "global_step": 27559, "epoch": 231, "lr": 6.816290555163459e-05} +{"train_loss": 0.0021801567636430264, "global_step": 27560, "epoch": 231, "lr": 6.816084136886248e-05} +{"train_loss": 0.003407153533771634, "global_step": 27561, "epoch": 231, "lr": 6.81587771504335e-05} +{"train_loss": 0.003786772722378373, "global_step": 27562, "epoch": 231, "lr": 6.815671289635171e-05} +{"train_loss": 0.002038360573351383, "global_step": 27563, "epoch": 231, "lr": 6.815464860662116e-05} +{"train_loss": 0.004223861265927553, "global_step": 27564, "epoch": 231, "lr": 6.815258428124587e-05} +{"train_loss": 0.0031552589498460293, "global_step": 27565, "epoch": 231, "lr": 6.815051992022993e-05} +{"train_loss": 0.002338007790967822, "global_step": 27566, "epoch": 231, "lr": 6.814845552357738e-05} +{"train_loss": 0.002193417167291045, "global_step": 27567, "epoch": 231, "lr": 6.814639109129228e-05} +{"train_loss": 0.004342882428318262, "global_step": 27568, "epoch": 231, "lr": 6.814432662337868e-05} +{"train_loss": 0.003017040900886059, "global_step": 27569, "epoch": 231, "lr": 6.814226211984064e-05} +{"train_loss": 0.0027363444678485394, "global_step": 27570, "epoch": 231, "lr": 6.814019758068221e-05} +{"train_loss": 0.006352324970066547, "global_step": 27571, "epoch": 231, "lr": 6.813813300590744e-05} +{"train_loss": 0.0033594509586691856, "global_step": 27572, "epoch": 231, "lr": 6.813606839552037e-05} +{"train_loss": 0.003562367055565119, "global_step": 27573, "epoch": 231, "lr": 6.813400374952507e-05} +{"train_loss": 0.0021725506521761417, "global_step": 27574, "epoch": 231, "lr": 6.813193906792558e-05} +{"train_loss": 0.0016192973125725985, "global_step": 27575, "epoch": 231, "lr": 6.812987435072599e-05} +{"train_loss": 0.004886654205620289, "global_step": 27576, "epoch": 231, "lr": 6.812780959793032e-05} +{"train_loss": 0.004208913538604975, "global_step": 27577, "epoch": 231, "lr": 6.812574480954263e-05} +{"train_loss": 0.0037197726778686047, "global_step": 27578, "epoch": 231, "lr": 6.812367998556697e-05} +{"train_loss": 0.0042387694120407104, "global_step": 27579, "epoch": 231, "lr": 6.81216151260074e-05} +{"train_loss": 0.0024094190448522568, "global_step": 27580, "epoch": 231, "lr": 6.811955023086798e-05} +{"train_loss": 0.0026847636327147484, "global_step": 27581, "epoch": 231, "lr": 6.811748530015276e-05} +{"train_loss": 0.003376792185008526, "global_step": 27582, "epoch": 231, "lr": 6.81154203338658e-05} +{"train_loss": 0.004074502270668745, "global_step": 27583, "epoch": 231, "lr": 6.811335533201115e-05} +{"train_loss": 0.0032861591316759586, "global_step": 27584, "epoch": 231, "lr": 6.811129029459285e-05} +{"train_loss": 0.0041724517941474915, "global_step": 27585, "epoch": 231, "lr": 6.810922522161495e-05} +{"train_loss": 0.0032766552176326513, "global_step": 27586, "epoch": 231, "lr": 6.810716011308154e-05} +{"train_loss": 0.003623733762651682, "global_step": 27587, "epoch": 231, "lr": 6.810509496899667e-05} +{"train_loss": 0.00274973944760859, "global_step": 27588, "epoch": 231, "lr": 6.810302978936437e-05} +{"train_loss": 0.0027332871686667204, "global_step": 27589, "epoch": 231, "lr": 6.810096457418869e-05} +{"train_loss": 0.0047019412741065025, "global_step": 27590, "epoch": 231, "lr": 6.809889932347371e-05} +{"train_loss": 0.004043825902044773, "global_step": 27591, "epoch": 231, "lr": 6.809683403722346e-05} +{"train_loss": 0.0024728444404900074, "global_step": 27592, "epoch": 231, "lr": 6.809476871544204e-05} +{"train_loss": 0.0032716228161007166, "global_step": 27593, "epoch": 231, "lr": 6.809270335813345e-05} +{"train_loss": 0.004259821027517319, "global_step": 27594, "epoch": 231, "lr": 6.809063796530178e-05} +{"train_loss": 0.0035183909349143505, "global_step": 27595, "epoch": 231, "lr": 6.808857253695109e-05} +{"train_loss": 0.0034598824568092823, "global_step": 27596, "epoch": 231, "lr": 6.808650707308541e-05} +{"train_loss": 0.004559588618576527, "global_step": 27597, "epoch": 231, "lr": 6.808444157370879e-05} +{"train_loss": 0.00343025173060596, "global_step": 27598, "epoch": 231, "lr": 6.808237603882531e-05} +{"train_loss": 0.004609141498804092, "global_step": 27599, "epoch": 231, "lr": 6.808031046843902e-05} +{"train_loss": 0.002737055765464902, "global_step": 27600, "epoch": 231, "lr": 6.807824486255396e-05} +{"train_loss": 0.005324948113411665, "global_step": 27601, "epoch": 231, "lr": 6.807617922117421e-05} +{"train_loss": 0.0030987453646957874, "global_step": 27602, "epoch": 231, "lr": 6.807411354430381e-05} +{"train_loss": 0.003658914240077138, "global_step": 27603, "epoch": 231, "lr": 6.807204783194683e-05} +{"train_loss": 0.0038855308666825294, "global_step": 27604, "epoch": 231, "lr": 6.80699820841073e-05} +{"train_loss": 0.0023981393314898014, "global_step": 27605, "epoch": 231, "lr": 6.80679163007893e-05} +{"train_loss": 0.0033623897470533848, "global_step": 27606, "epoch": 231, "lr": 6.806585048199687e-05} +{"train_loss": 0.0033797825453802943, "global_step": 27607, "epoch": 231, "lr": 6.806378462773407e-05, "val_loss": 0.009418623521924019} +{"train_loss": 0.0028151574078947306, "global_step": 27608, "epoch": 232, "lr": 6.806171873800498e-05} +{"train_loss": 0.0026496502105146646, "global_step": 27609, "epoch": 232, "lr": 6.80596528128136e-05} +{"train_loss": 0.002095629461109638, "global_step": 27610, "epoch": 232, "lr": 6.805758685216405e-05} +{"train_loss": 0.002767655299976468, "global_step": 27611, "epoch": 232, "lr": 6.805552085606033e-05} +{"train_loss": 0.004099435172975063, "global_step": 27612, "epoch": 232, "lr": 6.805345482450654e-05} +{"train_loss": 0.0027610422112047672, "global_step": 27613, "epoch": 232, "lr": 6.805138875750674e-05} +{"train_loss": 0.0026939092203974724, "global_step": 27614, "epoch": 232, "lr": 6.804932265506494e-05} +{"train_loss": 0.00356620573438704, "global_step": 27615, "epoch": 232, "lr": 6.804725651718524e-05} +{"train_loss": 0.0033587440848350525, "global_step": 27616, "epoch": 232, "lr": 6.804519034387166e-05} +{"train_loss": 0.0021470333449542522, "global_step": 27617, "epoch": 232, "lr": 6.804312413512828e-05} +{"train_loss": 0.0029994144570082426, "global_step": 27618, "epoch": 232, "lr": 6.804105789095917e-05} +{"train_loss": 0.003073120955377817, "global_step": 27619, "epoch": 232, "lr": 6.803899161136836e-05} +{"train_loss": 0.0038480940274894238, "global_step": 27620, "epoch": 232, "lr": 6.803692529635992e-05} +{"train_loss": 0.0018677983898669481, "global_step": 27621, "epoch": 232, "lr": 6.80348589459379e-05} +{"train_loss": 0.003043792676180601, "global_step": 27622, "epoch": 232, "lr": 6.803279256010637e-05} +{"train_loss": 0.0022692058701068163, "global_step": 27623, "epoch": 232, "lr": 6.803072613886937e-05} +{"train_loss": 0.0024856063537299633, "global_step": 27624, "epoch": 232, "lr": 6.802865968223095e-05} +{"train_loss": 0.002310343086719513, "global_step": 27625, "epoch": 232, "lr": 6.802659319019521e-05} +{"train_loss": 0.0020900496747344732, "global_step": 27626, "epoch": 232, "lr": 6.802452666276617e-05} +{"train_loss": 0.004909194074571133, "global_step": 27627, "epoch": 232, "lr": 6.802246009994791e-05} +{"train_loss": 0.0031923719216138124, "global_step": 27628, "epoch": 232, "lr": 6.802039350174446e-05} +{"train_loss": 0.002956095850095153, "global_step": 27629, "epoch": 232, "lr": 6.801832686815988e-05} +{"train_loss": 0.00218314491212368, "global_step": 27630, "epoch": 232, "lr": 6.801626019919827e-05} +{"train_loss": 0.0034229899756610394, "global_step": 27631, "epoch": 232, "lr": 6.801419349486364e-05} +{"train_loss": 0.0035106968134641647, "global_step": 27632, "epoch": 232, "lr": 6.801212675516006e-05} +{"train_loss": 0.004140117205679417, "global_step": 27633, "epoch": 232, "lr": 6.801005998009161e-05} +{"train_loss": 0.0021463483572006226, "global_step": 27634, "epoch": 232, "lr": 6.800799316966233e-05} +{"train_loss": 0.0026252041570842266, "global_step": 27635, "epoch": 232, "lr": 6.800592632387627e-05} +{"train_loss": 0.002703665290027857, "global_step": 27636, "epoch": 232, "lr": 6.80038594427375e-05} +{"train_loss": 0.0028485534712672234, "global_step": 27637, "epoch": 232, "lr": 6.800179252625007e-05} +{"train_loss": 0.0027816626243293285, "global_step": 27638, "epoch": 232, "lr": 6.799972557441805e-05} +{"train_loss": 0.002691722707822919, "global_step": 27639, "epoch": 232, "lr": 6.79976585872455e-05} +{"train_loss": 0.002890627598389983, "global_step": 27640, "epoch": 232, "lr": 6.799559156473645e-05} +{"train_loss": 0.002308550523594022, "global_step": 27641, "epoch": 232, "lr": 6.799352450689499e-05} +{"train_loss": 0.002732587279751897, "global_step": 27642, "epoch": 232, "lr": 6.799145741372516e-05} +{"train_loss": 0.002983325393870473, "global_step": 27643, "epoch": 232, "lr": 6.798939028523104e-05} +{"train_loss": 0.0045862807892262936, "global_step": 27644, "epoch": 232, "lr": 6.798732312141665e-05} +{"train_loss": 0.0031849918887019157, "global_step": 27645, "epoch": 232, "lr": 6.798525592228611e-05} +{"train_loss": 0.0037912577390670776, "global_step": 27646, "epoch": 232, "lr": 6.798318868784342e-05} +{"train_loss": 0.0018704491667449474, "global_step": 27647, "epoch": 232, "lr": 6.798112141809265e-05} +{"train_loss": 0.002371980343014002, "global_step": 27648, "epoch": 232, "lr": 6.797905411303788e-05} +{"train_loss": 0.002192242071032524, "global_step": 27649, "epoch": 232, "lr": 6.797698677268316e-05} +{"train_loss": 0.0030848714523017406, "global_step": 27650, "epoch": 232, "lr": 6.797491939703254e-05} +{"train_loss": 0.003097748151049018, "global_step": 27651, "epoch": 232, "lr": 6.79728519860901e-05} +{"train_loss": 0.0027968341019004583, "global_step": 27652, "epoch": 232, "lr": 6.797078453985988e-05} +{"train_loss": 0.0025269880425184965, "global_step": 27653, "epoch": 232, "lr": 6.796871705834594e-05} +{"train_loss": 0.004411374218761921, "global_step": 27654, "epoch": 232, "lr": 6.796664954155235e-05} +{"train_loss": 0.003711610333994031, "global_step": 27655, "epoch": 232, "lr": 6.796458198948315e-05} +{"train_loss": 0.0020891788881272078, "global_step": 27656, "epoch": 232, "lr": 6.796251440214242e-05} +{"train_loss": 0.0019400141900405288, "global_step": 27657, "epoch": 232, "lr": 6.79604467795342e-05} +{"train_loss": 0.0017130175838246942, "global_step": 27658, "epoch": 232, "lr": 6.795837912166259e-05} +{"train_loss": 0.0036285356618463993, "global_step": 27659, "epoch": 232, "lr": 6.795631142853159e-05} +{"train_loss": 0.001801501726731658, "global_step": 27660, "epoch": 232, "lr": 6.79542437001453e-05} +{"train_loss": 0.0025535626336932182, "global_step": 27661, "epoch": 232, "lr": 6.795217593650778e-05} +{"train_loss": 0.004417201038450003, "global_step": 27662, "epoch": 232, "lr": 6.795010813762308e-05} +{"train_loss": 0.002071970608085394, "global_step": 27663, "epoch": 232, "lr": 6.794804030349526e-05} +{"train_loss": 0.004439212381839752, "global_step": 27664, "epoch": 232, "lr": 6.794597243412838e-05} +{"train_loss": 0.003583515528589487, "global_step": 27665, "epoch": 232, "lr": 6.79439045295265e-05} +{"train_loss": 0.0029504538979381323, "global_step": 27666, "epoch": 232, "lr": 6.794183658969367e-05} +{"train_loss": 0.0034939150791615248, "global_step": 27667, "epoch": 232, "lr": 6.793976861463396e-05} +{"train_loss": 0.0029287454672157764, "global_step": 27668, "epoch": 232, "lr": 6.793770060435145e-05} +{"train_loss": 0.003894631052389741, "global_step": 27669, "epoch": 232, "lr": 6.793563255885017e-05} +{"train_loss": 0.005698840599507093, "global_step": 27670, "epoch": 232, "lr": 6.79335644781342e-05} +{"train_loss": 0.0023128464818000793, "global_step": 27671, "epoch": 232, "lr": 6.793149636220759e-05} +{"train_loss": 0.0020056606736034155, "global_step": 27672, "epoch": 232, "lr": 6.792942821107438e-05} +{"train_loss": 0.0036027301102876663, "global_step": 27673, "epoch": 232, "lr": 6.792736002473867e-05} +{"train_loss": 0.0027922717854380608, "global_step": 27674, "epoch": 232, "lr": 6.792529180320451e-05} +{"train_loss": 0.0031398667488247156, "global_step": 27675, "epoch": 232, "lr": 6.792322354647593e-05} +{"train_loss": 0.0027597935404628515, "global_step": 27676, "epoch": 232, "lr": 6.792115525455704e-05} +{"train_loss": 0.00575830927118659, "global_step": 27677, "epoch": 232, "lr": 6.791908692745187e-05} +{"train_loss": 0.004308717325329781, "global_step": 27678, "epoch": 232, "lr": 6.79170185651645e-05} +{"train_loss": 0.004473129753023386, "global_step": 27679, "epoch": 232, "lr": 6.791495016769896e-05} +{"train_loss": 0.003498295322060585, "global_step": 27680, "epoch": 232, "lr": 6.791288173505932e-05} +{"train_loss": 0.0033223400823771954, "global_step": 27681, "epoch": 232, "lr": 6.791081326724968e-05} +{"train_loss": 0.002078816993162036, "global_step": 27682, "epoch": 232, "lr": 6.790874476427407e-05} +{"train_loss": 0.004034035373479128, "global_step": 27683, "epoch": 232, "lr": 6.790667622613654e-05} +{"train_loss": 0.0032265367917716503, "global_step": 27684, "epoch": 232, "lr": 6.790460765284115e-05} +{"train_loss": 0.003981352783739567, "global_step": 27685, "epoch": 232, "lr": 6.790253904439198e-05} +{"train_loss": 0.0027125088963657618, "global_step": 27686, "epoch": 232, "lr": 6.790047040079312e-05} +{"train_loss": 0.0038346059154719114, "global_step": 27687, "epoch": 232, "lr": 6.789840172204856e-05} +{"train_loss": 0.0025829956866800785, "global_step": 27688, "epoch": 232, "lr": 6.789633300816243e-05} +{"train_loss": 0.0050642299465835094, "global_step": 27689, "epoch": 232, "lr": 6.789426425913874e-05} +{"train_loss": 0.004555258899927139, "global_step": 27690, "epoch": 232, "lr": 6.789219547498159e-05} +{"train_loss": 0.0025355236139148474, "global_step": 27691, "epoch": 232, "lr": 6.789012665569501e-05} +{"train_loss": 0.004322484601289034, "global_step": 27692, "epoch": 232, "lr": 6.788805780128307e-05} +{"train_loss": 0.0024319193325936794, "global_step": 27693, "epoch": 232, "lr": 6.788598891174987e-05} +{"train_loss": 0.0029458084609359503, "global_step": 27694, "epoch": 232, "lr": 6.788391998709941e-05} +{"train_loss": 0.0032025573309510946, "global_step": 27695, "epoch": 232, "lr": 6.788185102733582e-05} +{"train_loss": 0.0032422186341136694, "global_step": 27696, "epoch": 232, "lr": 6.78797820324631e-05} +{"train_loss": 0.002045416971668601, "global_step": 27697, "epoch": 232, "lr": 6.787771300248534e-05} +{"train_loss": 0.002777128480374813, "global_step": 27698, "epoch": 232, "lr": 6.787564393740661e-05} +{"train_loss": 0.004885195754468441, "global_step": 27699, "epoch": 232, "lr": 6.787357483723096e-05} +{"train_loss": 0.0038676513358950615, "global_step": 27700, "epoch": 232, "lr": 6.787150570196244e-05} +{"train_loss": 0.003780860686674714, "global_step": 27701, "epoch": 232, "lr": 6.786943653160516e-05} +{"train_loss": 0.004275655373930931, "global_step": 27702, "epoch": 232, "lr": 6.786736732616312e-05} +{"train_loss": 0.004626152105629444, "global_step": 27703, "epoch": 232, "lr": 6.786529808564044e-05} +{"train_loss": 0.00425347127020359, "global_step": 27704, "epoch": 232, "lr": 6.786322881004113e-05} +{"train_loss": 0.0047922455705702305, "global_step": 27705, "epoch": 232, "lr": 6.786115949936928e-05} +{"train_loss": 0.0034584472887218, "global_step": 27706, "epoch": 232, "lr": 6.785909015362896e-05} +{"train_loss": 0.0020804801024496555, "global_step": 27707, "epoch": 232, "lr": 6.785702077282423e-05} +{"train_loss": 0.00676378607749939, "global_step": 27708, "epoch": 232, "lr": 6.785495135695914e-05} +{"train_loss": 0.0038267429918050766, "global_step": 27709, "epoch": 232, "lr": 6.785288190603777e-05} +{"train_loss": 0.0043451618403196335, "global_step": 27710, "epoch": 232, "lr": 6.785081242006416e-05} +{"train_loss": 0.0028330881614238024, "global_step": 27711, "epoch": 232, "lr": 6.784874289904239e-05} +{"train_loss": 0.002252322854474187, "global_step": 27712, "epoch": 232, "lr": 6.784667334297652e-05} +{"train_loss": 0.0033253533765673637, "global_step": 27713, "epoch": 232, "lr": 6.784460375187061e-05} +{"train_loss": 0.00527830608189106, "global_step": 27714, "epoch": 232, "lr": 6.784253412572875e-05} +{"train_loss": 0.0020560123957693577, "global_step": 27715, "epoch": 232, "lr": 6.784046446455497e-05} +{"train_loss": 0.003906623460352421, "global_step": 27716, "epoch": 232, "lr": 6.783839476835333e-05} +{"train_loss": 0.006932244170457125, "global_step": 27717, "epoch": 232, "lr": 6.783632503712792e-05} +{"train_loss": 0.005513580050319433, "global_step": 27718, "epoch": 232, "lr": 6.783425527088279e-05} +{"train_loss": 0.0030953739769756794, "global_step": 27719, "epoch": 232, "lr": 6.7832185469622e-05} +{"train_loss": 0.00313202035613358, "global_step": 27720, "epoch": 232, "lr": 6.783011563334962e-05} +{"train_loss": 0.0023212179075926542, "global_step": 27721, "epoch": 232, "lr": 6.782804576206971e-05} +{"train_loss": 0.0036485115997493267, "global_step": 27722, "epoch": 232, "lr": 6.782597585578634e-05} +{"train_loss": 0.005582099314779043, "global_step": 27723, "epoch": 232, "lr": 6.782390591450357e-05} +{"train_loss": 0.003936894237995148, "global_step": 27724, "epoch": 232, "lr": 6.782183593822546e-05} +{"train_loss": 0.004597207996994257, "global_step": 27725, "epoch": 232, "lr": 6.781976592695609e-05} +{"train_loss": 0.003319574921086681, "global_step": 27726, "epoch": 232, "lr": 6.781769588069952e-05, "val_loss": 0.01896153762936592} +{"train_loss": 0.0044578309170901775, "global_step": 27727, "epoch": 233, "lr": 6.781562579945979e-05} +{"train_loss": 0.0037448399234563112, "global_step": 27728, "epoch": 233, "lr": 6.7813555683241e-05} +{"train_loss": 0.003739854320883751, "global_step": 27729, "epoch": 233, "lr": 6.781148553204718e-05} +{"train_loss": 0.003793739015236497, "global_step": 27730, "epoch": 233, "lr": 6.78094153458824e-05} +{"train_loss": 0.003182410728186369, "global_step": 27731, "epoch": 233, "lr": 6.780734512475077e-05} +{"train_loss": 0.0028245062567293644, "global_step": 27732, "epoch": 233, "lr": 6.780527486865631e-05} +{"train_loss": 0.004473072476685047, "global_step": 27733, "epoch": 233, "lr": 6.780320457760308e-05} +{"train_loss": 0.0043609351851046085, "global_step": 27734, "epoch": 233, "lr": 6.780113425159516e-05} +{"train_loss": 0.003542743157595396, "global_step": 27735, "epoch": 233, "lr": 6.779906389063663e-05} +{"train_loss": 0.0025702305138111115, "global_step": 27736, "epoch": 233, "lr": 6.779699349473154e-05} +{"train_loss": 0.0023795724846422672, "global_step": 27737, "epoch": 233, "lr": 6.779492306388394e-05} +{"train_loss": 0.00218060240149498, "global_step": 27738, "epoch": 233, "lr": 6.779285259809791e-05} +{"train_loss": 0.0031256082002073526, "global_step": 27739, "epoch": 233, "lr": 6.779078209737753e-05} +{"train_loss": 0.0023224595934152603, "global_step": 27740, "epoch": 233, "lr": 6.778871156172683e-05} +{"train_loss": 0.002069528214633465, "global_step": 27741, "epoch": 233, "lr": 6.77866409911499e-05} +{"train_loss": 0.0027549369260668755, "global_step": 27742, "epoch": 233, "lr": 6.778457038565081e-05} +{"train_loss": 0.003841554746031761, "global_step": 27743, "epoch": 233, "lr": 6.778249974523361e-05} +{"train_loss": 0.003247898304834962, "global_step": 27744, "epoch": 233, "lr": 6.778042906990237e-05} +{"train_loss": 0.004219937138259411, "global_step": 27745, "epoch": 233, "lr": 6.777835835966117e-05} +{"train_loss": 0.0018880697898566723, "global_step": 27746, "epoch": 233, "lr": 6.777628761451406e-05} +{"train_loss": 0.003991496749222279, "global_step": 27747, "epoch": 233, "lr": 6.77742168344651e-05} +{"train_loss": 0.003919241484254599, "global_step": 27748, "epoch": 233, "lr": 6.777214601951835e-05} +{"train_loss": 0.0027718141209334135, "global_step": 27749, "epoch": 233, "lr": 6.777007516967792e-05} +{"train_loss": 0.004522776231169701, "global_step": 27750, "epoch": 233, "lr": 6.776800428494782e-05} +{"train_loss": 0.003489569528028369, "global_step": 27751, "epoch": 233, "lr": 6.776593336533217e-05} +{"train_loss": 0.002960652345791459, "global_step": 27752, "epoch": 233, "lr": 6.776386241083499e-05} +{"train_loss": 0.0027555269189178944, "global_step": 27753, "epoch": 233, "lr": 6.776179142146038e-05} +{"train_loss": 0.004186962731182575, "global_step": 27754, "epoch": 233, "lr": 6.775972039721237e-05} +{"train_loss": 0.0021634665317833424, "global_step": 27755, "epoch": 233, "lr": 6.775764933809505e-05} +{"train_loss": 0.004341045394539833, "global_step": 27756, "epoch": 233, "lr": 6.775557824411247e-05} +{"train_loss": 0.006126974709331989, "global_step": 27757, "epoch": 233, "lr": 6.775350711526874e-05} +{"train_loss": 0.0034970128908753395, "global_step": 27758, "epoch": 233, "lr": 6.775143595156786e-05} +{"train_loss": 0.005755960009992123, "global_step": 27759, "epoch": 233, "lr": 6.774936475301396e-05} +{"train_loss": 0.002483238000422716, "global_step": 27760, "epoch": 233, "lr": 6.774729351961107e-05} +{"train_loss": 0.0019463831558823586, "global_step": 27761, "epoch": 233, "lr": 6.774522225136326e-05} +{"train_loss": 0.0037021921016275883, "global_step": 27762, "epoch": 233, "lr": 6.774315094827461e-05} +{"train_loss": 0.003523646155372262, "global_step": 27763, "epoch": 233, "lr": 6.774107961034917e-05} +{"train_loss": 0.0033628810197114944, "global_step": 27764, "epoch": 233, "lr": 6.773900823759103e-05} +{"train_loss": 0.0030778071377426386, "global_step": 27765, "epoch": 233, "lr": 6.773693683000424e-05} +{"train_loss": 0.00457853963598609, "global_step": 27766, "epoch": 233, "lr": 6.773486538759286e-05} +{"train_loss": 0.004107884131371975, "global_step": 27767, "epoch": 233, "lr": 6.773279391036098e-05} +{"train_loss": 0.0028883509803563356, "global_step": 27768, "epoch": 233, "lr": 6.773072239831263e-05} +{"train_loss": 0.001766043365933001, "global_step": 27769, "epoch": 233, "lr": 6.772865085145192e-05} +{"train_loss": 0.005137393716722727, "global_step": 27770, "epoch": 233, "lr": 6.772657926978288e-05} +{"train_loss": 0.002962281694635749, "global_step": 27771, "epoch": 233, "lr": 6.772450765330961e-05} +{"train_loss": 0.003573694033548236, "global_step": 27772, "epoch": 233, "lr": 6.772243600203616e-05} +{"train_loss": 0.00277735129930079, "global_step": 27773, "epoch": 233, "lr": 6.77203643159666e-05} +{"train_loss": 0.0040135676972568035, "global_step": 27774, "epoch": 233, "lr": 6.7718292595105e-05} +{"train_loss": 0.0033782210666686296, "global_step": 27775, "epoch": 233, "lr": 6.771622083945542e-05} +{"train_loss": 0.002724638907238841, "global_step": 27776, "epoch": 233, "lr": 6.771414904902194e-05} +{"train_loss": 0.002973336260765791, "global_step": 27777, "epoch": 233, "lr": 6.771207722380862e-05} +{"train_loss": 0.0026871596928685904, "global_step": 27778, "epoch": 233, "lr": 6.771000536381952e-05} +{"train_loss": 0.0028776645194739103, "global_step": 27779, "epoch": 233, "lr": 6.770793346905873e-05} +{"train_loss": 0.003755889367312193, "global_step": 27780, "epoch": 233, "lr": 6.770586153953029e-05} +{"train_loss": 0.0026340619660913944, "global_step": 27781, "epoch": 233, "lr": 6.770378957523829e-05} +{"train_loss": 0.003945101983845234, "global_step": 27782, "epoch": 233, "lr": 6.77017175761868e-05} +{"train_loss": 0.004596843384206295, "global_step": 27783, "epoch": 233, "lr": 6.769964554237988e-05} +{"train_loss": 0.0043072085827589035, "global_step": 27784, "epoch": 233, "lr": 6.769757347382157e-05} +{"train_loss": 0.003980191890150309, "global_step": 27785, "epoch": 233, "lr": 6.7695501370516e-05} +{"train_loss": 0.0020289449021220207, "global_step": 27786, "epoch": 233, "lr": 6.769342923246717e-05} +{"train_loss": 0.0032911302987486124, "global_step": 27787, "epoch": 233, "lr": 6.76913570596792e-05} +{"train_loss": 0.0032501465175300837, "global_step": 27788, "epoch": 233, "lr": 6.768928485215613e-05} +{"train_loss": 0.002898769685998559, "global_step": 27789, "epoch": 233, "lr": 6.768721260990205e-05} +{"train_loss": 0.005175968632102013, "global_step": 27790, "epoch": 233, "lr": 6.768514033292101e-05} +{"train_loss": 0.0029915773775428534, "global_step": 27791, "epoch": 233, "lr": 6.768306802121709e-05} +{"train_loss": 0.0020891991443932056, "global_step": 27792, "epoch": 233, "lr": 6.768099567479435e-05} +{"train_loss": 0.002566184150055051, "global_step": 27793, "epoch": 233, "lr": 6.767892329365687e-05} +{"train_loss": 0.0034683155827224255, "global_step": 27794, "epoch": 233, "lr": 6.76768508778087e-05} +{"train_loss": 0.0030286710243672132, "global_step": 27795, "epoch": 233, "lr": 6.767477842725396e-05} +{"train_loss": 0.0023508816957473755, "global_step": 27796, "epoch": 233, "lr": 6.767270594199664e-05} +{"train_loss": 0.0025295668747276068, "global_step": 27797, "epoch": 233, "lr": 6.767063342204087e-05} +{"train_loss": 0.0018350897589698434, "global_step": 27798, "epoch": 233, "lr": 6.76685608673907e-05} +{"train_loss": 0.0027506384067237377, "global_step": 27799, "epoch": 233, "lr": 6.76664882780502e-05} +{"train_loss": 0.0029146363958716393, "global_step": 27800, "epoch": 233, "lr": 6.766441565402342e-05} +{"train_loss": 0.0038514065090566874, "global_step": 27801, "epoch": 233, "lr": 6.766234299531446e-05} +{"train_loss": 0.005133041646331549, "global_step": 27802, "epoch": 233, "lr": 6.766027030192738e-05} +{"train_loss": 0.0016608283622190356, "global_step": 27803, "epoch": 233, "lr": 6.765819757386624e-05} +{"train_loss": 0.0032104032579809427, "global_step": 27804, "epoch": 233, "lr": 6.76561248111351e-05} +{"train_loss": 0.006193863693624735, "global_step": 27805, "epoch": 233, "lr": 6.765405201373807e-05} +{"train_loss": 0.003932424355298281, "global_step": 27806, "epoch": 233, "lr": 6.765197918167916e-05} +{"train_loss": 0.002858896739780903, "global_step": 27807, "epoch": 233, "lr": 6.764990631496251e-05} +{"train_loss": 0.0026581392157822847, "global_step": 27808, "epoch": 233, "lr": 6.764783341359215e-05} +{"train_loss": 0.0036131395027041435, "global_step": 27809, "epoch": 233, "lr": 6.764576047757214e-05} +{"train_loss": 0.003735214937478304, "global_step": 27810, "epoch": 233, "lr": 6.764368750690658e-05} +{"train_loss": 0.0026193209923803806, "global_step": 27811, "epoch": 233, "lr": 6.764161450159952e-05} +{"train_loss": 0.0054757301695644855, "global_step": 27812, "epoch": 233, "lr": 6.763954146165503e-05} +{"train_loss": 0.002914176555350423, "global_step": 27813, "epoch": 233, "lr": 6.763746838707719e-05} +{"train_loss": 0.001754674594849348, "global_step": 27814, "epoch": 233, "lr": 6.763539527787006e-05} +{"train_loss": 0.004769563674926758, "global_step": 27815, "epoch": 233, "lr": 6.763332213403773e-05} +{"train_loss": 0.0034490569960325956, "global_step": 27816, "epoch": 233, "lr": 6.763124895558423e-05} +{"train_loss": 0.004282411187887192, "global_step": 27817, "epoch": 233, "lr": 6.762917574251367e-05} +{"train_loss": 0.004014925565570593, "global_step": 27818, "epoch": 233, "lr": 6.762710249483011e-05} +{"train_loss": 0.0030403980053961277, "global_step": 27819, "epoch": 233, "lr": 6.76250292125376e-05} +{"train_loss": 0.004642424173653126, "global_step": 27820, "epoch": 233, "lr": 6.762295589564025e-05} +{"train_loss": 0.0049948724918067455, "global_step": 27821, "epoch": 233, "lr": 6.762088254414209e-05} +{"train_loss": 0.002632620744407177, "global_step": 27822, "epoch": 233, "lr": 6.761880915804724e-05} +{"train_loss": 0.0034227180294692516, "global_step": 27823, "epoch": 233, "lr": 6.761673573735972e-05} +{"train_loss": 0.0030057798139750957, "global_step": 27824, "epoch": 233, "lr": 6.76146622820836e-05} +{"train_loss": 0.005074335262179375, "global_step": 27825, "epoch": 233, "lr": 6.761258879222301e-05} +{"train_loss": 0.0049063111655414104, "global_step": 27826, "epoch": 233, "lr": 6.761051526778197e-05} +{"train_loss": 0.003578199539333582, "global_step": 27827, "epoch": 233, "lr": 6.760844170876457e-05} +{"train_loss": 0.0027275672182440758, "global_step": 27828, "epoch": 233, "lr": 6.760636811517486e-05} +{"train_loss": 0.003969764802604914, "global_step": 27829, "epoch": 233, "lr": 6.760429448701694e-05} +{"train_loss": 0.004479111637920141, "global_step": 27830, "epoch": 233, "lr": 6.760222082429487e-05} +{"train_loss": 0.0027955889236181974, "global_step": 27831, "epoch": 233, "lr": 6.76001471270127e-05} +{"train_loss": 0.004732663277536631, "global_step": 27832, "epoch": 233, "lr": 6.759807339517454e-05} +{"train_loss": 0.0034436513669788837, "global_step": 27833, "epoch": 233, "lr": 6.759599962878444e-05} +{"train_loss": 0.0032228867057710886, "global_step": 27834, "epoch": 233, "lr": 6.759392582784648e-05} +{"train_loss": 0.003279286902397871, "global_step": 27835, "epoch": 233, "lr": 6.759185199236472e-05} +{"train_loss": 0.003363370429724455, "global_step": 27836, "epoch": 233, "lr": 6.758977812234324e-05} +{"train_loss": 0.003865648526698351, "global_step": 27837, "epoch": 233, "lr": 6.758770421778611e-05} +{"train_loss": 0.0036432109773159027, "global_step": 27838, "epoch": 233, "lr": 6.75856302786974e-05} +{"train_loss": 0.004206435289233923, "global_step": 27839, "epoch": 233, "lr": 6.758355630508118e-05} +{"train_loss": 0.00452265702188015, "global_step": 27840, "epoch": 233, "lr": 6.758148229694152e-05} +{"train_loss": 0.004158804193139076, "global_step": 27841, "epoch": 233, "lr": 6.757940825428251e-05} +{"train_loss": 0.005666686221957207, "global_step": 27842, "epoch": 233, "lr": 6.75773341771082e-05} +{"train_loss": 0.0036759674549102783, "global_step": 27843, "epoch": 233, "lr": 6.757526006542269e-05} +{"train_loss": 0.002375289797782898, "global_step": 27844, "epoch": 233, "lr": 6.757318591923002e-05} +{"train_loss": 0.0034914961360598437, "global_step": 27845, "epoch": 233, "lr": 6.757111173853429e-05, "val_loss": 0.016395974904298782} +{"train_loss": 0.0020717026200145483, "global_step": 27846, "epoch": 234, "lr": 6.756903752333954e-05} +{"train_loss": 0.0035845499951392412, "global_step": 27847, "epoch": 234, "lr": 6.756696327364987e-05} +{"train_loss": 0.0025633578188717365, "global_step": 27848, "epoch": 234, "lr": 6.756488898946935e-05} +{"train_loss": 0.0014818201307207346, "global_step": 27849, "epoch": 234, "lr": 6.756281467080204e-05} +{"train_loss": 0.0030034787487238646, "global_step": 27850, "epoch": 234, "lr": 6.756074031765203e-05} +{"train_loss": 0.003993689082562923, "global_step": 27851, "epoch": 234, "lr": 6.755866593002338e-05} +{"train_loss": 0.003664434887468815, "global_step": 27852, "epoch": 234, "lr": 6.755659150792015e-05} +{"train_loss": 0.003878482850268483, "global_step": 27853, "epoch": 234, "lr": 6.755451705134644e-05} +{"train_loss": 0.007335154339671135, "global_step": 27854, "epoch": 234, "lr": 6.75524425603063e-05} +{"train_loss": 0.0028174796607345343, "global_step": 27855, "epoch": 234, "lr": 6.755036803480382e-05} +{"train_loss": 0.0024128917139023542, "global_step": 27856, "epoch": 234, "lr": 6.754829347484307e-05} +{"train_loss": 0.004008648917078972, "global_step": 27857, "epoch": 234, "lr": 6.754621888042813e-05} +{"train_loss": 0.0029504357371479273, "global_step": 27858, "epoch": 234, "lr": 6.754414425156306e-05} +{"train_loss": 0.0034992615692317486, "global_step": 27859, "epoch": 234, "lr": 6.754206958825193e-05} +{"train_loss": 0.0036195656284689903, "global_step": 27860, "epoch": 234, "lr": 6.753999489049882e-05} +{"train_loss": 0.0038262743037194014, "global_step": 27861, "epoch": 234, "lr": 6.753792015830781e-05} +{"train_loss": 0.003770102048292756, "global_step": 27862, "epoch": 234, "lr": 6.753584539168296e-05} +{"train_loss": 0.004604906775057316, "global_step": 27863, "epoch": 234, "lr": 6.753377059062835e-05} +{"train_loss": 0.003314900677651167, "global_step": 27864, "epoch": 234, "lr": 6.753169575514808e-05} +{"train_loss": 0.0037302507553249598, "global_step": 27865, "epoch": 234, "lr": 6.752962088524617e-05} +{"train_loss": 0.002424319041892886, "global_step": 27866, "epoch": 234, "lr": 6.752754598092674e-05} +{"train_loss": 0.0028373440727591515, "global_step": 27867, "epoch": 234, "lr": 6.752547104219382e-05} +{"train_loss": 0.0023295849096029997, "global_step": 27868, "epoch": 234, "lr": 6.752339606905154e-05} +{"train_loss": 0.004331110045313835, "global_step": 27869, "epoch": 234, "lr": 6.752132106150393e-05} +{"train_loss": 0.005437977146357298, "global_step": 27870, "epoch": 234, "lr": 6.751924601955507e-05} +{"train_loss": 0.004691466689109802, "global_step": 27871, "epoch": 234, "lr": 6.751717094320905e-05} +{"train_loss": 0.0027060294523835182, "global_step": 27872, "epoch": 234, "lr": 6.751509583246994e-05} +{"train_loss": 0.0026815033052116632, "global_step": 27873, "epoch": 234, "lr": 6.75130206873418e-05} +{"train_loss": 0.0018150405958294868, "global_step": 27874, "epoch": 234, "lr": 6.751094550782872e-05} +{"train_loss": 0.0032868734560906887, "global_step": 27875, "epoch": 234, "lr": 6.750887029393478e-05} +{"train_loss": 0.0031578370835632086, "global_step": 27876, "epoch": 234, "lr": 6.750679504566404e-05} +{"train_loss": 0.0027861581183969975, "global_step": 27877, "epoch": 234, "lr": 6.750471976302057e-05} +{"train_loss": 0.004520362708717585, "global_step": 27878, "epoch": 234, "lr": 6.750264444600846e-05} +{"train_loss": 0.004418577998876572, "global_step": 27879, "epoch": 234, "lr": 6.750056909463177e-05} +{"train_loss": 0.005921343341469765, "global_step": 27880, "epoch": 234, "lr": 6.749849370889458e-05} +{"train_loss": 0.002587474649772048, "global_step": 27881, "epoch": 234, "lr": 6.749641828880098e-05} +{"train_loss": 0.0037405143957585096, "global_step": 27882, "epoch": 234, "lr": 6.749434283435502e-05} +{"train_loss": 0.0023949232418090105, "global_step": 27883, "epoch": 234, "lr": 6.74922673455608e-05} +{"train_loss": 0.003239345271140337, "global_step": 27884, "epoch": 234, "lr": 6.749019182242237e-05} +{"train_loss": 0.005819854326546192, "global_step": 27885, "epoch": 234, "lr": 6.748811626494383e-05} +{"train_loss": 0.0031359221320599318, "global_step": 27886, "epoch": 234, "lr": 6.748604067312922e-05} +{"train_loss": 0.0043533118441700935, "global_step": 27887, "epoch": 234, "lr": 6.748396504698265e-05} +{"train_loss": 0.003127709263935685, "global_step": 27888, "epoch": 234, "lr": 6.748188938650819e-05} +{"train_loss": 0.002913265721872449, "global_step": 27889, "epoch": 234, "lr": 6.747981369170989e-05} +{"train_loss": 0.002669993322342634, "global_step": 27890, "epoch": 234, "lr": 6.747773796259186e-05} +{"train_loss": 0.004084401298314333, "global_step": 27891, "epoch": 234, "lr": 6.747566219915815e-05} +{"train_loss": 0.002907478017732501, "global_step": 27892, "epoch": 234, "lr": 6.747358640141284e-05} +{"train_loss": 0.0025108575355261564, "global_step": 27893, "epoch": 234, "lr": 6.747151056936002e-05} +{"train_loss": 0.004607034381479025, "global_step": 27894, "epoch": 234, "lr": 6.746943470300375e-05} +{"train_loss": 0.004569097422063351, "global_step": 27895, "epoch": 234, "lr": 6.746735880234813e-05} +{"train_loss": 0.00392664410173893, "global_step": 27896, "epoch": 234, "lr": 6.74652828673972e-05} +{"train_loss": 0.0035192749928683043, "global_step": 27897, "epoch": 234, "lr": 6.746320689815504e-05} +{"train_loss": 0.0030808509327471256, "global_step": 27898, "epoch": 234, "lr": 6.746113089462576e-05} +{"train_loss": 0.0044507961720228195, "global_step": 27899, "epoch": 234, "lr": 6.74590548568134e-05} +{"train_loss": 0.0018345598364248872, "global_step": 27900, "epoch": 234, "lr": 6.745697878472205e-05} +{"train_loss": 0.002621605060994625, "global_step": 27901, "epoch": 234, "lr": 6.74549026783558e-05} +{"train_loss": 0.003243151120841503, "global_step": 27902, "epoch": 234, "lr": 6.745282653771871e-05} +{"train_loss": 0.0028237693477422, "global_step": 27903, "epoch": 234, "lr": 6.745075036281487e-05} +{"train_loss": 0.004042723681777716, "global_step": 27904, "epoch": 234, "lr": 6.744867415364833e-05} +{"train_loss": 0.002651605289429426, "global_step": 27905, "epoch": 234, "lr": 6.744659791022318e-05} +{"train_loss": 0.0032979107927531004, "global_step": 27906, "epoch": 234, "lr": 6.74445216325435e-05} +{"train_loss": 0.0037739290855824947, "global_step": 27907, "epoch": 234, "lr": 6.744244532061336e-05} +{"train_loss": 0.003194640390574932, "global_step": 27908, "epoch": 234, "lr": 6.744036897443688e-05} +{"train_loss": 0.0039917523972690105, "global_step": 27909, "epoch": 234, "lr": 6.743829259401807e-05} +{"train_loss": 0.0032141697593033314, "global_step": 27910, "epoch": 234, "lr": 6.743621617936103e-05} +{"train_loss": 0.003042292781174183, "global_step": 27911, "epoch": 234, "lr": 6.743413973046986e-05} +{"train_loss": 0.005106835626065731, "global_step": 27912, "epoch": 234, "lr": 6.74320632473486e-05} +{"train_loss": 0.004531530663371086, "global_step": 27913, "epoch": 234, "lr": 6.742998673000136e-05} +{"train_loss": 0.00442437594756484, "global_step": 27914, "epoch": 234, "lr": 6.742791017843219e-05} +{"train_loss": 0.004715259652584791, "global_step": 27915, "epoch": 234, "lr": 6.74258335926452e-05} +{"train_loss": 0.002062520245090127, "global_step": 27916, "epoch": 234, "lr": 6.742375697264443e-05} +{"train_loss": 0.0034422860480844975, "global_step": 27917, "epoch": 234, "lr": 6.742168031843398e-05} +{"train_loss": 0.004665056709200144, "global_step": 27918, "epoch": 234, "lr": 6.741960363001792e-05} +{"train_loss": 0.004140239208936691, "global_step": 27919, "epoch": 234, "lr": 6.741752690740033e-05} +{"train_loss": 0.005711010657250881, "global_step": 27920, "epoch": 234, "lr": 6.74154501505853e-05} +{"train_loss": 0.003840220393612981, "global_step": 27921, "epoch": 234, "lr": 6.741337335957687e-05} +{"train_loss": 0.0030603548511862755, "global_step": 27922, "epoch": 234, "lr": 6.741129653437916e-05} +{"train_loss": 0.002869662828743458, "global_step": 27923, "epoch": 234, "lr": 6.740921967499623e-05} +{"train_loss": 0.0024649978149682283, "global_step": 27924, "epoch": 234, "lr": 6.740714278143214e-05} +{"train_loss": 0.005785522051155567, "global_step": 27925, "epoch": 234, "lr": 6.7405065853691e-05} +{"train_loss": 0.002532078418880701, "global_step": 27926, "epoch": 234, "lr": 6.740298889177686e-05} +{"train_loss": 0.002757362090051174, "global_step": 27927, "epoch": 234, "lr": 6.740091189569383e-05} +{"train_loss": 0.0031822642777115107, "global_step": 27928, "epoch": 234, "lr": 6.739883486544596e-05} +{"train_loss": 0.0037667378783226013, "global_step": 27929, "epoch": 234, "lr": 6.739675780103734e-05} +{"train_loss": 0.0041845450177788734, "global_step": 27930, "epoch": 234, "lr": 6.739468070247204e-05} +{"train_loss": 0.003588221501559019, "global_step": 27931, "epoch": 234, "lr": 6.739260356975413e-05} +{"train_loss": 0.005056607071310282, "global_step": 27932, "epoch": 234, "lr": 6.739052640288771e-05} +{"train_loss": 0.003792382078245282, "global_step": 27933, "epoch": 234, "lr": 6.738844920187685e-05} +{"train_loss": 0.002507148776203394, "global_step": 27934, "epoch": 234, "lr": 6.738637196672563e-05} +{"train_loss": 0.004316999576985836, "global_step": 27935, "epoch": 234, "lr": 6.738429469743813e-05} +{"train_loss": 0.002121708821505308, "global_step": 27936, "epoch": 234, "lr": 6.738221739401842e-05} +{"train_loss": 0.00328638288192451, "global_step": 27937, "epoch": 234, "lr": 6.738014005647058e-05} +{"train_loss": 0.0030545901972800493, "global_step": 27938, "epoch": 234, "lr": 6.73780626847987e-05} +{"train_loss": 0.0039884913712739944, "global_step": 27939, "epoch": 234, "lr": 6.737598527900684e-05} +{"train_loss": 0.003645368618890643, "global_step": 27940, "epoch": 234, "lr": 6.73739078390991e-05} +{"train_loss": 0.002031526993960142, "global_step": 27941, "epoch": 234, "lr": 6.737183036507954e-05} +{"train_loss": 0.0036314064636826515, "global_step": 27942, "epoch": 234, "lr": 6.736975285695225e-05} +{"train_loss": 0.0016008701641112566, "global_step": 27943, "epoch": 234, "lr": 6.73676753147213e-05} +{"train_loss": 0.005310434382408857, "global_step": 27944, "epoch": 234, "lr": 6.736559773839078e-05} +{"train_loss": 0.00208897958509624, "global_step": 27945, "epoch": 234, "lr": 6.736352012796479e-05} +{"train_loss": 0.002586474409326911, "global_step": 27946, "epoch": 234, "lr": 6.736144248344735e-05} +{"train_loss": 0.004320582840591669, "global_step": 27947, "epoch": 234, "lr": 6.735936480484257e-05} +{"train_loss": 0.0058492752723395824, "global_step": 27948, "epoch": 234, "lr": 6.735728709215455e-05} +{"train_loss": 0.0030410222243517637, "global_step": 27949, "epoch": 234, "lr": 6.735520934538733e-05} +{"train_loss": 0.002486390992999077, "global_step": 27950, "epoch": 234, "lr": 6.735313156454504e-05} +{"train_loss": 0.004756485112011433, "global_step": 27951, "epoch": 234, "lr": 6.735105374963171e-05} +{"train_loss": 0.0032322064507752657, "global_step": 27952, "epoch": 234, "lr": 6.734897590065143e-05} +{"train_loss": 0.0024683321826159954, "global_step": 27953, "epoch": 234, "lr": 6.734689801760832e-05} +{"train_loss": 0.0027195492293685675, "global_step": 27954, "epoch": 234, "lr": 6.73448201005064e-05} +{"train_loss": 0.0016573731554672122, "global_step": 27955, "epoch": 234, "lr": 6.73427421493498e-05} +{"train_loss": 0.00477096252143383, "global_step": 27956, "epoch": 234, "lr": 6.734066416414256e-05} +{"train_loss": 0.004544274415820837, "global_step": 27957, "epoch": 234, "lr": 6.73385861448888e-05} +{"train_loss": 0.004694229923188686, "global_step": 27958, "epoch": 234, "lr": 6.733650809159257e-05} +{"train_loss": 0.0027466556057333946, "global_step": 27959, "epoch": 234, "lr": 6.733443000425794e-05} +{"train_loss": 0.0028020902536809444, "global_step": 27960, "epoch": 234, "lr": 6.733235188288904e-05} +{"train_loss": 0.003229002468287945, "global_step": 27961, "epoch": 234, "lr": 6.733027372748989e-05} +{"train_loss": 0.004023023881018162, "global_step": 27962, "epoch": 234, "lr": 6.732819553806461e-05} +{"train_loss": 0.0034298941027373075, "global_step": 27963, "epoch": 234, "lr": 6.732611731461726e-05} +{"train_loss": 0.0035178422939595804, "global_step": 27964, "epoch": 234, "lr": 6.732403905715197e-05, "val_loss": 0.013701686635613441} +{"train_loss": 0.0027168041560798883, "global_step": 27965, "epoch": 235, "lr": 6.732196076567274e-05} +{"train_loss": 0.0041050235740840435, "global_step": 27966, "epoch": 235, "lr": 6.73198824401837e-05} +{"train_loss": 0.0028175250627100468, "global_step": 27967, "epoch": 235, "lr": 6.731780408068892e-05} +{"train_loss": 0.0018197876634076238, "global_step": 27968, "epoch": 235, "lr": 6.731572568719248e-05} +{"train_loss": 0.0024315030314028263, "global_step": 27969, "epoch": 235, "lr": 6.731364725969846e-05} +{"train_loss": 0.0028835004195570946, "global_step": 27970, "epoch": 235, "lr": 6.731156879821096e-05} +{"train_loss": 0.003799512516707182, "global_step": 27971, "epoch": 235, "lr": 6.730949030273403e-05} +{"train_loss": 0.002526989672333002, "global_step": 27972, "epoch": 235, "lr": 6.730741177327177e-05} +{"train_loss": 0.003949161618947983, "global_step": 27973, "epoch": 235, "lr": 6.730533320982825e-05} +{"train_loss": 0.002432888140901923, "global_step": 27974, "epoch": 235, "lr": 6.730325461240756e-05} +{"train_loss": 0.001956058433279395, "global_step": 27975, "epoch": 235, "lr": 6.730117598101379e-05} +{"train_loss": 0.0030101416632533073, "global_step": 27976, "epoch": 235, "lr": 6.729909731565099e-05} +{"train_loss": 0.0037012998946011066, "global_step": 27977, "epoch": 235, "lr": 6.729701861632328e-05} +{"train_loss": 0.004906203132122755, "global_step": 27978, "epoch": 235, "lr": 6.729493988303472e-05} +{"train_loss": 0.002968772314488888, "global_step": 27979, "epoch": 235, "lr": 6.729286111578937e-05} +{"train_loss": 0.004519987385720015, "global_step": 27980, "epoch": 235, "lr": 6.729078231459136e-05} +{"train_loss": 0.0018899580463767052, "global_step": 27981, "epoch": 235, "lr": 6.728870347944474e-05} +{"train_loss": 0.0037026647478342056, "global_step": 27982, "epoch": 235, "lr": 6.728662461035357e-05} +{"train_loss": 0.008856849744915962, "global_step": 27983, "epoch": 235, "lr": 6.728454570732201e-05} +{"train_loss": 0.0028429930098354816, "global_step": 27984, "epoch": 235, "lr": 6.728246677035406e-05} +{"train_loss": 0.003249497851356864, "global_step": 27985, "epoch": 235, "lr": 6.728038779945384e-05} +{"train_loss": 0.0059589808806777, "global_step": 27986, "epoch": 235, "lr": 6.727830879462542e-05} +{"train_loss": 0.005563861690461636, "global_step": 27987, "epoch": 235, "lr": 6.727622975587287e-05} +{"train_loss": 0.003794345073401928, "global_step": 27988, "epoch": 235, "lr": 6.727415068320031e-05} +{"train_loss": 0.005260438192635775, "global_step": 27989, "epoch": 235, "lr": 6.72720715766118e-05} +{"train_loss": 0.0033505272585898638, "global_step": 27990, "epoch": 235, "lr": 6.726999243611142e-05} +{"train_loss": 0.0045111156068742275, "global_step": 27991, "epoch": 235, "lr": 6.726791326170326e-05} +{"train_loss": 0.004761053249239922, "global_step": 27992, "epoch": 235, "lr": 6.72658340533914e-05} +{"train_loss": 0.0023264631163328886, "global_step": 27993, "epoch": 235, "lr": 6.72637548111799e-05} +{"train_loss": 0.004756871145218611, "global_step": 27994, "epoch": 235, "lr": 6.726167553507287e-05} +{"train_loss": 0.0032098651863634586, "global_step": 27995, "epoch": 235, "lr": 6.725959622507441e-05} +{"train_loss": 0.004797759931534529, "global_step": 27996, "epoch": 235, "lr": 6.725751688118854e-05} +{"train_loss": 0.003634345019236207, "global_step": 27997, "epoch": 235, "lr": 6.725543750341939e-05} +{"train_loss": 0.005333147011697292, "global_step": 27998, "epoch": 235, "lr": 6.725335809177104e-05} +{"train_loss": 0.004081279970705509, "global_step": 27999, "epoch": 235, "lr": 6.725127864624757e-05} +{"train_loss": 0.0039376490749418736, "global_step": 28000, "epoch": 235, "lr": 6.724919916685303e-05} +{"train_loss": 0.004683042876422405, "global_step": 28001, "epoch": 235, "lr": 6.724711965359155e-05} +{"train_loss": 0.003360099159181118, "global_step": 28002, "epoch": 235, "lr": 6.724504010646719e-05} +{"train_loss": 0.0053288815543055534, "global_step": 28003, "epoch": 235, "lr": 6.724296052548404e-05} +{"train_loss": 0.0049702078104019165, "global_step": 28004, "epoch": 235, "lr": 6.724088091064617e-05} +{"train_loss": 0.00474056089296937, "global_step": 28005, "epoch": 235, "lr": 6.723880126195769e-05} +{"train_loss": 0.0018331962637603283, "global_step": 28006, "epoch": 235, "lr": 6.723672157942264e-05} +{"train_loss": 0.0036815046332776546, "global_step": 28007, "epoch": 235, "lr": 6.723464186304515e-05} +{"train_loss": 0.004325426183640957, "global_step": 28008, "epoch": 235, "lr": 6.723256211282927e-05} +{"train_loss": 0.0026135232765227556, "global_step": 28009, "epoch": 235, "lr": 6.723048232877911e-05} +{"train_loss": 0.004161306656897068, "global_step": 28010, "epoch": 235, "lr": 6.722840251089873e-05} +{"train_loss": 0.0029872108716517687, "global_step": 28011, "epoch": 235, "lr": 6.722632265919222e-05} +{"train_loss": 0.004133176989853382, "global_step": 28012, "epoch": 235, "lr": 6.722424277366366e-05} +{"train_loss": 0.005308409221470356, "global_step": 28013, "epoch": 235, "lr": 6.722216285431715e-05} +{"train_loss": 0.002477211644873023, "global_step": 28014, "epoch": 235, "lr": 6.722008290115676e-05} +{"train_loss": 0.006434200797230005, "global_step": 28015, "epoch": 235, "lr": 6.721800291418658e-05} +{"train_loss": 0.002649028552696109, "global_step": 28016, "epoch": 235, "lr": 6.721592289341069e-05} +{"train_loss": 0.004058685153722763, "global_step": 28017, "epoch": 235, "lr": 6.721384283883317e-05} +{"train_loss": 0.0031990152783691883, "global_step": 28018, "epoch": 235, "lr": 6.721176275045811e-05} +{"train_loss": 0.0033390922471880913, "global_step": 28019, "epoch": 235, "lr": 6.720968262828959e-05} +{"train_loss": 0.003897774498909712, "global_step": 28020, "epoch": 235, "lr": 6.72076024723317e-05} +{"train_loss": 0.003985472023487091, "global_step": 28021, "epoch": 235, "lr": 6.720552228258852e-05} +{"train_loss": 0.0028252985794097185, "global_step": 28022, "epoch": 235, "lr": 6.720344205906413e-05} +{"train_loss": 0.003883365774527192, "global_step": 28023, "epoch": 235, "lr": 6.720136180176263e-05} +{"train_loss": 0.0038309593219310045, "global_step": 28024, "epoch": 235, "lr": 6.719928151068808e-05} +{"train_loss": 0.004170301835983992, "global_step": 28025, "epoch": 235, "lr": 6.71972011858446e-05} +{"train_loss": 0.002884785644710064, "global_step": 28026, "epoch": 235, "lr": 6.719512082723623e-05} +{"train_loss": 0.003919434733688831, "global_step": 28027, "epoch": 235, "lr": 6.719304043486709e-05} +{"train_loss": 0.0018790332833305001, "global_step": 28028, "epoch": 235, "lr": 6.719096000874126e-05} +{"train_loss": 0.0043260809034109116, "global_step": 28029, "epoch": 235, "lr": 6.71888795488628e-05} +{"train_loss": 0.0023146378807723522, "global_step": 28030, "epoch": 235, "lr": 6.718679905523581e-05} +{"train_loss": 0.005040287971496582, "global_step": 28031, "epoch": 235, "lr": 6.718471852786439e-05} +{"train_loss": 0.004115895833820105, "global_step": 28032, "epoch": 235, "lr": 6.718263796675261e-05} +{"train_loss": 0.0037200890947133303, "global_step": 28033, "epoch": 235, "lr": 6.718055737190455e-05} +{"train_loss": 0.004357648082077503, "global_step": 28034, "epoch": 235, "lr": 6.71784767433243e-05} +{"train_loss": 0.0033455071970820427, "global_step": 28035, "epoch": 235, "lr": 6.717639608101595e-05} +{"train_loss": 0.003233223222196102, "global_step": 28036, "epoch": 235, "lr": 6.717431538498357e-05} +{"train_loss": 0.002780990209430456, "global_step": 28037, "epoch": 235, "lr": 6.717223465523125e-05} +{"train_loss": 0.003950666170567274, "global_step": 28038, "epoch": 235, "lr": 6.717015389176311e-05} +{"train_loss": 0.0023302112240344286, "global_step": 28039, "epoch": 235, "lr": 6.71680730945832e-05} +{"train_loss": 0.003264174796640873, "global_step": 28040, "epoch": 235, "lr": 6.71659922636956e-05} +{"train_loss": 0.003427003277465701, "global_step": 28041, "epoch": 235, "lr": 6.716391139910443e-05} +{"train_loss": 0.004800440277904272, "global_step": 28042, "epoch": 235, "lr": 6.716183050081373e-05} +{"train_loss": 0.006387854460626841, "global_step": 28043, "epoch": 235, "lr": 6.715974956882762e-05} +{"train_loss": 0.0024685258977115154, "global_step": 28044, "epoch": 235, "lr": 6.715766860315017e-05} +{"train_loss": 0.003896266920492053, "global_step": 28045, "epoch": 235, "lr": 6.715558760378547e-05} +{"train_loss": 0.002947706263512373, "global_step": 28046, "epoch": 235, "lr": 6.715350657073763e-05} +{"train_loss": 0.0030230970587581396, "global_step": 28047, "epoch": 235, "lr": 6.715142550401068e-05} +{"train_loss": 0.004585238639265299, "global_step": 28048, "epoch": 235, "lr": 6.714934440360876e-05} +{"train_loss": 0.003919013775885105, "global_step": 28049, "epoch": 235, "lr": 6.714726326953592e-05} +{"train_loss": 0.0028670558240264654, "global_step": 28050, "epoch": 235, "lr": 6.714518210179627e-05} +{"train_loss": 0.0026458119973540306, "global_step": 28051, "epoch": 235, "lr": 6.714310090039388e-05} +{"train_loss": 0.0035577055532485247, "global_step": 28052, "epoch": 235, "lr": 6.714101966533284e-05} +{"train_loss": 0.0020117906387895346, "global_step": 28053, "epoch": 235, "lr": 6.713893839661724e-05} +{"train_loss": 0.002801240189000964, "global_step": 28054, "epoch": 235, "lr": 6.713685709425117e-05} +{"train_loss": 0.0053965081460773945, "global_step": 28055, "epoch": 235, "lr": 6.713477575823872e-05} +{"train_loss": 0.005210812669247389, "global_step": 28056, "epoch": 235, "lr": 6.713269438858397e-05} +{"train_loss": 0.0034866000059992075, "global_step": 28057, "epoch": 235, "lr": 6.713061298529097e-05} +{"train_loss": 0.0019141040975227952, "global_step": 28058, "epoch": 235, "lr": 6.712853154836388e-05} +{"train_loss": 0.003111552679911256, "global_step": 28059, "epoch": 235, "lr": 6.712645007780674e-05} +{"train_loss": 0.0035157587844878435, "global_step": 28060, "epoch": 235, "lr": 6.712436857362364e-05} +{"train_loss": 0.003032925073057413, "global_step": 28061, "epoch": 235, "lr": 6.712228703581867e-05} +{"train_loss": 0.004143171943724155, "global_step": 28062, "epoch": 235, "lr": 6.712020546439593e-05} +{"train_loss": 0.0023904205299913883, "global_step": 28063, "epoch": 235, "lr": 6.711812385935947e-05} +{"train_loss": 0.003501271829009056, "global_step": 28064, "epoch": 235, "lr": 6.711604222071344e-05} +{"train_loss": 0.002443011850118637, "global_step": 28065, "epoch": 235, "lr": 6.711396054846186e-05} +{"train_loss": 0.0035366893280297518, "global_step": 28066, "epoch": 235, "lr": 6.711187884260885e-05} +{"train_loss": 0.00482433196157217, "global_step": 28067, "epoch": 235, "lr": 6.71097971031585e-05} +{"train_loss": 0.0035196105018258095, "global_step": 28068, "epoch": 235, "lr": 6.710771533011489e-05} +{"train_loss": 0.00417202478274703, "global_step": 28069, "epoch": 235, "lr": 6.710563352348212e-05} +{"train_loss": 0.0021163506899029016, "global_step": 28070, "epoch": 235, "lr": 6.710355168326424e-05} +{"train_loss": 0.0034577501937747, "global_step": 28071, "epoch": 235, "lr": 6.710146980946539e-05} +{"train_loss": 0.0051891859620809555, "global_step": 28072, "epoch": 235, "lr": 6.70993879020896e-05} +{"train_loss": 0.002866393653675914, "global_step": 28073, "epoch": 235, "lr": 6.709730596114102e-05} +{"train_loss": 0.0023686732165515423, "global_step": 28074, "epoch": 235, "lr": 6.709522398662369e-05} +{"train_loss": 0.003564764279872179, "global_step": 28075, "epoch": 235, "lr": 6.709314197854172e-05} +{"train_loss": 0.007535918615758419, "global_step": 28076, "epoch": 235, "lr": 6.709105993689919e-05} +{"train_loss": 0.0024542580358684063, "global_step": 28077, "epoch": 235, "lr": 6.70889778617002e-05} +{"train_loss": 0.0031945647206157446, "global_step": 28078, "epoch": 235, "lr": 6.708689575294881e-05} +{"train_loss": 0.004130234010517597, "global_step": 28079, "epoch": 235, "lr": 6.708481361064915e-05} +{"train_loss": 0.0032581889536231756, "global_step": 28080, "epoch": 235, "lr": 6.708273143480525e-05} +{"train_loss": 0.007246395573019981, "global_step": 28081, "epoch": 235, "lr": 6.708064922542125e-05} +{"train_loss": 0.0024045254103839397, "global_step": 28082, "epoch": 235, "lr": 6.707856698250123e-05} +{"train_loss": 0.0037083220697485472, "global_step": 28083, "epoch": 235, "lr": 6.707648470604926e-05, "val_loss": 0.020770834758877754, "train_action_mse_error": 6.862357258796692e-05} +{"train_loss": 0.0029421967919915915, "global_step": 28084, "epoch": 236, "lr": 6.707440239606943e-05} +{"train_loss": 0.006039084866642952, "global_step": 28085, "epoch": 236, "lr": 6.707232005256583e-05} +{"train_loss": 0.0027203841600567102, "global_step": 28086, "epoch": 236, "lr": 6.707023767554257e-05} +{"train_loss": 0.002774524502456188, "global_step": 28087, "epoch": 236, "lr": 6.706815526500371e-05} +{"train_loss": 0.004501851741224527, "global_step": 28088, "epoch": 236, "lr": 6.706607282095335e-05} +{"train_loss": 0.003672473132610321, "global_step": 28089, "epoch": 236, "lr": 6.706399034339559e-05} +{"train_loss": 0.0032993534114211798, "global_step": 28090, "epoch": 236, "lr": 6.706190783233451e-05} +{"train_loss": 0.005283899139612913, "global_step": 28091, "epoch": 236, "lr": 6.705982528777419e-05} +{"train_loss": 0.0034455370623618364, "global_step": 28092, "epoch": 236, "lr": 6.705774270971872e-05} +{"train_loss": 0.0029794438742101192, "global_step": 28093, "epoch": 236, "lr": 6.70556600981722e-05} +{"train_loss": 0.003147352021187544, "global_step": 28094, "epoch": 236, "lr": 6.705357745313871e-05} +{"train_loss": 0.0030590398237109184, "global_step": 28095, "epoch": 236, "lr": 6.705149477462235e-05} +{"train_loss": 0.002603176049888134, "global_step": 28096, "epoch": 236, "lr": 6.70494120626272e-05} +{"train_loss": 0.0033132568933069706, "global_step": 28097, "epoch": 236, "lr": 6.704732931715735e-05} +{"train_loss": 0.0036639305762946606, "global_step": 28098, "epoch": 236, "lr": 6.704524653821689e-05} +{"train_loss": 0.002877583960071206, "global_step": 28099, "epoch": 236, "lr": 6.70431637258099e-05} +{"train_loss": 0.004337402060627937, "global_step": 28100, "epoch": 236, "lr": 6.704108087994049e-05} +{"train_loss": 0.004012910183519125, "global_step": 28101, "epoch": 236, "lr": 6.703899800061272e-05} +{"train_loss": 0.0034240614622831345, "global_step": 28102, "epoch": 236, "lr": 6.703691508783072e-05} +{"train_loss": 0.004267305135726929, "global_step": 28103, "epoch": 236, "lr": 6.703483214159856e-05} +{"train_loss": 0.002762629883363843, "global_step": 28104, "epoch": 236, "lr": 6.70327491619203e-05} +{"train_loss": 0.002368634333834052, "global_step": 28105, "epoch": 236, "lr": 6.703066614880008e-05} +{"train_loss": 0.005033864639699459, "global_step": 28106, "epoch": 236, "lr": 6.702858310224196e-05} +{"train_loss": 0.003482602769508958, "global_step": 28107, "epoch": 236, "lr": 6.702650002225004e-05} +{"train_loss": 0.004896390251815319, "global_step": 28108, "epoch": 236, "lr": 6.702441690882841e-05} +{"train_loss": 0.003042482538148761, "global_step": 28109, "epoch": 236, "lr": 6.702233376198114e-05} +{"train_loss": 0.0033209521789103746, "global_step": 28110, "epoch": 236, "lr": 6.702025058171235e-05} +{"train_loss": 0.003659517038613558, "global_step": 28111, "epoch": 236, "lr": 6.701816736802611e-05} +{"train_loss": 0.003985017072409391, "global_step": 28112, "epoch": 236, "lr": 6.701608412092653e-05} +{"train_loss": 0.003785806242376566, "global_step": 28113, "epoch": 236, "lr": 6.701400084041767e-05} +{"train_loss": 0.003544804872944951, "global_step": 28114, "epoch": 236, "lr": 6.701191752650364e-05} +{"train_loss": 0.0033621108159422874, "global_step": 28115, "epoch": 236, "lr": 6.700983417918853e-05} +{"train_loss": 0.004525095224380493, "global_step": 28116, "epoch": 236, "lr": 6.700775079847643e-05} +{"train_loss": 0.004338366910815239, "global_step": 28117, "epoch": 236, "lr": 6.700566738437141e-05} +{"train_loss": 0.003175971331074834, "global_step": 28118, "epoch": 236, "lr": 6.70035839368776e-05} +{"train_loss": 0.0030101228039711714, "global_step": 28119, "epoch": 236, "lr": 6.700150045599906e-05} +{"train_loss": 0.0036622690968215466, "global_step": 28120, "epoch": 236, "lr": 6.69994169417399e-05} +{"train_loss": 0.003479061648249626, "global_step": 28121, "epoch": 236, "lr": 6.69973333941042e-05} +{"train_loss": 0.003103752387687564, "global_step": 28122, "epoch": 236, "lr": 6.699524981309604e-05} +{"train_loss": 0.0023279781453311443, "global_step": 28123, "epoch": 236, "lr": 6.699316619871954e-05} +{"train_loss": 0.005628705956041813, "global_step": 28124, "epoch": 236, "lr": 6.699108255097876e-05} +{"train_loss": 0.0021907095797359943, "global_step": 28125, "epoch": 236, "lr": 6.698899886987779e-05} +{"train_loss": 0.0038594617508351803, "global_step": 28126, "epoch": 236, "lr": 6.698691515542076e-05} +{"train_loss": 0.0036953771486878395, "global_step": 28127, "epoch": 236, "lr": 6.698483140761174e-05} +{"train_loss": 0.003418662818148732, "global_step": 28128, "epoch": 236, "lr": 6.698274762645481e-05} +{"train_loss": 0.0057059689424932, "global_step": 28129, "epoch": 236, "lr": 6.698066381195407e-05} +{"train_loss": 0.0040417686104774475, "global_step": 28130, "epoch": 236, "lr": 6.697857996411361e-05} +{"train_loss": 0.0031766174361109734, "global_step": 28131, "epoch": 236, "lr": 6.697649608293751e-05} +{"train_loss": 0.002877943916246295, "global_step": 28132, "epoch": 236, "lr": 6.697441216842988e-05} +{"train_loss": 0.0043597593903541565, "global_step": 28133, "epoch": 236, "lr": 6.697232822059481e-05} +{"train_loss": 0.0031757899560034275, "global_step": 28134, "epoch": 236, "lr": 6.697024423943639e-05} +{"train_loss": 0.0027542999014258385, "global_step": 28135, "epoch": 236, "lr": 6.696816022495871e-05} +{"train_loss": 0.0028420123271644115, "global_step": 28136, "epoch": 236, "lr": 6.696607617716585e-05} +{"train_loss": 0.0031283595599234104, "global_step": 28137, "epoch": 236, "lr": 6.696399209606191e-05} +{"train_loss": 0.004096294287592173, "global_step": 28138, "epoch": 236, "lr": 6.696190798165098e-05} +{"train_loss": 0.0027038929983973503, "global_step": 28139, "epoch": 236, "lr": 6.695982383393718e-05} +{"train_loss": 0.004395196679979563, "global_step": 28140, "epoch": 236, "lr": 6.695773965292456e-05} +{"train_loss": 0.00406864145770669, "global_step": 28141, "epoch": 236, "lr": 6.695565543861724e-05} +{"train_loss": 0.004194951616227627, "global_step": 28142, "epoch": 236, "lr": 6.695357119101931e-05} +{"train_loss": 0.0036496755201369524, "global_step": 28143, "epoch": 236, "lr": 6.695148691013483e-05} +{"train_loss": 0.002680400852113962, "global_step": 28144, "epoch": 236, "lr": 6.694940259596793e-05} +{"train_loss": 0.004102269187569618, "global_step": 28145, "epoch": 236, "lr": 6.694731824852268e-05} +{"train_loss": 0.00232521235011518, "global_step": 28146, "epoch": 236, "lr": 6.694523386780319e-05} +{"train_loss": 0.00353427417576313, "global_step": 28147, "epoch": 236, "lr": 6.694314945381354e-05} +{"train_loss": 0.0018691422883421183, "global_step": 28148, "epoch": 236, "lr": 6.694106500655783e-05} +{"train_loss": 0.002548012649640441, "global_step": 28149, "epoch": 236, "lr": 6.693898052604014e-05} +{"train_loss": 0.0035233136732131243, "global_step": 28150, "epoch": 236, "lr": 6.693689601226458e-05} +{"train_loss": 0.0035471650771796703, "global_step": 28151, "epoch": 236, "lr": 6.693481146523522e-05} +{"train_loss": 0.002679091179743409, "global_step": 28152, "epoch": 236, "lr": 6.693272688495617e-05} +{"train_loss": 0.0025955343153327703, "global_step": 28153, "epoch": 236, "lr": 6.693064227143154e-05} +{"train_loss": 0.0041032577864825726, "global_step": 28154, "epoch": 236, "lr": 6.692855762466539e-05} +{"train_loss": 0.0015988965751603246, "global_step": 28155, "epoch": 236, "lr": 6.692647294466182e-05} +{"train_loss": 0.0014704368077218533, "global_step": 28156, "epoch": 236, "lr": 6.692438823142494e-05} +{"train_loss": 0.0025880716275423765, "global_step": 28157, "epoch": 236, "lr": 6.692230348495882e-05} +{"train_loss": 0.002466106554493308, "global_step": 28158, "epoch": 236, "lr": 6.692021870526758e-05} +{"train_loss": 0.004277578555047512, "global_step": 28159, "epoch": 236, "lr": 6.691813389235528e-05} +{"train_loss": 0.002554057165980339, "global_step": 28160, "epoch": 236, "lr": 6.691604904622605e-05} +{"train_loss": 0.002866273047402501, "global_step": 28161, "epoch": 236, "lr": 6.691396416688396e-05} +{"train_loss": 0.002100997604429722, "global_step": 28162, "epoch": 236, "lr": 6.69118792543331e-05} +{"train_loss": 0.00249081221409142, "global_step": 28163, "epoch": 236, "lr": 6.690979430857758e-05} +{"train_loss": 0.0029977059457451105, "global_step": 28164, "epoch": 236, "lr": 6.690770932962148e-05} +{"train_loss": 0.0027506607584655285, "global_step": 28165, "epoch": 236, "lr": 6.69056243174689e-05} +{"train_loss": 0.002217786153778434, "global_step": 28166, "epoch": 236, "lr": 6.690353927212394e-05} +{"train_loss": 0.004544801078736782, "global_step": 28167, "epoch": 236, "lr": 6.690145419359067e-05} +{"train_loss": 0.004570398014038801, "global_step": 28168, "epoch": 236, "lr": 6.68993690818732e-05} +{"train_loss": 0.004254122264683247, "global_step": 28169, "epoch": 236, "lr": 6.689728393697564e-05} +{"train_loss": 0.0037852793466299772, "global_step": 28170, "epoch": 236, "lr": 6.689519875890205e-05} +{"train_loss": 0.0024232077412307262, "global_step": 28171, "epoch": 236, "lr": 6.689311354765657e-05} +{"train_loss": 0.0033281133510172367, "global_step": 28172, "epoch": 236, "lr": 6.689102830324325e-05} +{"train_loss": 0.0031322839204221964, "global_step": 28173, "epoch": 236, "lr": 6.68889430256662e-05} +{"train_loss": 0.004050952382385731, "global_step": 28174, "epoch": 236, "lr": 6.688685771492951e-05} +{"train_loss": 0.004045382142066956, "global_step": 28175, "epoch": 236, "lr": 6.688477237103729e-05} +{"train_loss": 0.004710806533694267, "global_step": 28176, "epoch": 236, "lr": 6.688268699399362e-05} +{"train_loss": 0.0028890399262309074, "global_step": 28177, "epoch": 236, "lr": 6.68806015838026e-05} +{"train_loss": 0.0031921041663736105, "global_step": 28178, "epoch": 236, "lr": 6.687851614046832e-05} +{"train_loss": 0.0038805375806987286, "global_step": 28179, "epoch": 236, "lr": 6.687643066399486e-05} +{"train_loss": 0.0018325323471799493, "global_step": 28180, "epoch": 236, "lr": 6.687434515438637e-05} +{"train_loss": 0.003236255142837763, "global_step": 28181, "epoch": 236, "lr": 6.687225961164687e-05} +{"train_loss": 0.0031852207612246275, "global_step": 28182, "epoch": 236, "lr": 6.687017403578051e-05} +{"train_loss": 0.002986314706504345, "global_step": 28183, "epoch": 236, "lr": 6.686808842679136e-05} +{"train_loss": 0.002853038953617215, "global_step": 28184, "epoch": 236, "lr": 6.686600278468351e-05} +{"train_loss": 0.003591811517253518, "global_step": 28185, "epoch": 236, "lr": 6.686391710946107e-05} +{"train_loss": 0.00364006869494915, "global_step": 28186, "epoch": 236, "lr": 6.686183140112814e-05} +{"train_loss": 0.003561625722795725, "global_step": 28187, "epoch": 236, "lr": 6.68597456596888e-05} +{"train_loss": 0.0035740721505135298, "global_step": 28188, "epoch": 236, "lr": 6.685765988514715e-05} +{"train_loss": 0.0037062664050608873, "global_step": 28189, "epoch": 236, "lr": 6.685557407750729e-05} +{"train_loss": 0.0023888431023806334, "global_step": 28190, "epoch": 236, "lr": 6.685348823677331e-05} +{"train_loss": 0.003948897123336792, "global_step": 28191, "epoch": 236, "lr": 6.685140236294932e-05} +{"train_loss": 0.0036700444761663675, "global_step": 28192, "epoch": 236, "lr": 6.684931645603936e-05} +{"train_loss": 0.0021371436305344105, "global_step": 28193, "epoch": 236, "lr": 6.68472305160476e-05} +{"train_loss": 0.004045116249471903, "global_step": 28194, "epoch": 236, "lr": 6.68451445429781e-05} +{"train_loss": 0.0035563712008297443, "global_step": 28195, "epoch": 236, "lr": 6.684305853683495e-05} +{"train_loss": 0.003097298089414835, "global_step": 28196, "epoch": 236, "lr": 6.684097249762227e-05} +{"train_loss": 0.004044265020638704, "global_step": 28197, "epoch": 236, "lr": 6.683888642534412e-05} +{"train_loss": 0.0027277679182589054, "global_step": 28198, "epoch": 236, "lr": 6.683680032000464e-05} +{"train_loss": 0.00280511612072587, "global_step": 28199, "epoch": 236, "lr": 6.683471418160787e-05} +{"train_loss": 0.005278195720165968, "global_step": 28200, "epoch": 236, "lr": 6.683262801015796e-05} +{"train_loss": 0.004226532764732838, "global_step": 28201, "epoch": 236, "lr": 6.683054180565898e-05} +{"train_loss": 0.0034315923988005193, "global_step": 28202, "epoch": 236, "lr": 6.682845556811502e-05, "val_loss": 0.021772967651486397} +{"train_loss": 0.0028079436160624027, "global_step": 28203, "epoch": 237, "lr": 6.682636929753019e-05} +{"train_loss": 0.002755152527242899, "global_step": 28204, "epoch": 237, "lr": 6.682428299390858e-05} +{"train_loss": 0.0021255414467304945, "global_step": 28205, "epoch": 237, "lr": 6.682219665725429e-05} +{"train_loss": 0.0035825329832732677, "global_step": 28206, "epoch": 237, "lr": 6.682011028757141e-05} +{"train_loss": 0.0039835828356444836, "global_step": 28207, "epoch": 237, "lr": 6.681802388486404e-05} +{"train_loss": 0.001810785848647356, "global_step": 28208, "epoch": 237, "lr": 6.681593744913628e-05} +{"train_loss": 0.004188518039882183, "global_step": 28209, "epoch": 237, "lr": 6.681385098039223e-05} +{"train_loss": 0.002291743876412511, "global_step": 28210, "epoch": 237, "lr": 6.681176447863597e-05} +{"train_loss": 0.001688505057245493, "global_step": 28211, "epoch": 237, "lr": 6.68096779438716e-05} +{"train_loss": 0.004619213752448559, "global_step": 28212, "epoch": 237, "lr": 6.680759137610324e-05} +{"train_loss": 0.003911406733095646, "global_step": 28213, "epoch": 237, "lr": 6.680550477533497e-05} +{"train_loss": 0.0028271162882447243, "global_step": 28214, "epoch": 237, "lr": 6.680341814157088e-05} +{"train_loss": 0.0021436167880892754, "global_step": 28215, "epoch": 237, "lr": 6.680133147481507e-05} +{"train_loss": 0.002270499709993601, "global_step": 28216, "epoch": 237, "lr": 6.679924477507165e-05} +{"train_loss": 0.001438287552446127, "global_step": 28217, "epoch": 237, "lr": 6.67971580423447e-05} +{"train_loss": 0.0030269816052168608, "global_step": 28218, "epoch": 237, "lr": 6.679507127663832e-05} +{"train_loss": 0.0031894848216325045, "global_step": 28219, "epoch": 237, "lr": 6.679298447795663e-05} +{"train_loss": 0.003658456727862358, "global_step": 28220, "epoch": 237, "lr": 6.679089764630369e-05} +{"train_loss": 0.003855181159451604, "global_step": 28221, "epoch": 237, "lr": 6.678881078168362e-05} +{"train_loss": 0.002652372233569622, "global_step": 28222, "epoch": 237, "lr": 6.678672388410052e-05} +{"train_loss": 0.002719334326684475, "global_step": 28223, "epoch": 237, "lr": 6.678463695355848e-05} +{"train_loss": 0.0034853483084589243, "global_step": 28224, "epoch": 237, "lr": 6.678254999006159e-05} +{"train_loss": 0.0025739383418112993, "global_step": 28225, "epoch": 237, "lr": 6.678046299361397e-05} +{"train_loss": 0.002812853781506419, "global_step": 28226, "epoch": 237, "lr": 6.67783759642197e-05} +{"train_loss": 0.0019462915370240808, "global_step": 28227, "epoch": 237, "lr": 6.677628890188288e-05} +{"train_loss": 0.004232141654938459, "global_step": 28228, "epoch": 237, "lr": 6.67742018066076e-05} +{"train_loss": 0.0018940909067168832, "global_step": 28229, "epoch": 237, "lr": 6.6772114678398e-05} +{"train_loss": 0.00419950345531106, "global_step": 28230, "epoch": 237, "lr": 6.677002751725811e-05} +{"train_loss": 0.002331300638616085, "global_step": 28231, "epoch": 237, "lr": 6.676794032319207e-05} +{"train_loss": 0.0040689739398658276, "global_step": 28232, "epoch": 237, "lr": 6.676585309620396e-05} +{"train_loss": 0.0026128122117370367, "global_step": 28233, "epoch": 237, "lr": 6.676376583629791e-05} +{"train_loss": 0.0037490352988243103, "global_step": 28234, "epoch": 237, "lr": 6.676167854347798e-05} +{"train_loss": 0.0033093944657593966, "global_step": 28235, "epoch": 237, "lr": 6.675959121774829e-05} +{"train_loss": 0.006370509508997202, "global_step": 28236, "epoch": 237, "lr": 6.675750385911293e-05} +{"train_loss": 0.0022454687859863043, "global_step": 28237, "epoch": 237, "lr": 6.675541646757601e-05} +{"train_loss": 0.0036197120789438486, "global_step": 28238, "epoch": 237, "lr": 6.675332904314163e-05} +{"train_loss": 0.001968900440260768, "global_step": 28239, "epoch": 237, "lr": 6.675124158581385e-05} +{"train_loss": 0.0032062181271612644, "global_step": 28240, "epoch": 237, "lr": 6.674915409559682e-05} +{"train_loss": 0.0028438956942409277, "global_step": 28241, "epoch": 237, "lr": 6.67470665724946e-05} +{"train_loss": 0.001865121186710894, "global_step": 28242, "epoch": 237, "lr": 6.674497901651132e-05} +{"train_loss": 0.005604718346148729, "global_step": 28243, "epoch": 237, "lr": 6.674289142765105e-05} +{"train_loss": 0.0027298214845359325, "global_step": 28244, "epoch": 237, "lr": 6.67408038059179e-05} +{"train_loss": 0.0027973679825663567, "global_step": 28245, "epoch": 237, "lr": 6.673871615131597e-05} +{"train_loss": 0.003333556465804577, "global_step": 28246, "epoch": 237, "lr": 6.673662846384938e-05} +{"train_loss": 0.0037492476403713226, "global_step": 28247, "epoch": 237, "lr": 6.673454074352219e-05} +{"train_loss": 0.004700249060988426, "global_step": 28248, "epoch": 237, "lr": 6.673245299033853e-05} +{"train_loss": 0.0042623355984687805, "global_step": 28249, "epoch": 237, "lr": 6.673036520430247e-05} +{"train_loss": 0.003865219186991453, "global_step": 28250, "epoch": 237, "lr": 6.672827738541813e-05} +{"train_loss": 0.0037693798076361418, "global_step": 28251, "epoch": 237, "lr": 6.67261895336896e-05} +{"train_loss": 0.004328145179897547, "global_step": 28252, "epoch": 237, "lr": 6.672410164912099e-05} +{"train_loss": 0.0036452217027544975, "global_step": 28253, "epoch": 237, "lr": 6.67220137317164e-05} +{"train_loss": 0.003941004630178213, "global_step": 28254, "epoch": 237, "lr": 6.67199257814799e-05} +{"train_loss": 0.0028505336958914995, "global_step": 28255, "epoch": 237, "lr": 6.671783779841562e-05} +{"train_loss": 0.0044990647584199905, "global_step": 28256, "epoch": 237, "lr": 6.671574978252766e-05} +{"train_loss": 0.00401343172416091, "global_step": 28257, "epoch": 237, "lr": 6.671366173382012e-05} +{"train_loss": 0.0027494130190461874, "global_step": 28258, "epoch": 237, "lr": 6.671157365229707e-05} +{"train_loss": 0.0038410197012126446, "global_step": 28259, "epoch": 237, "lr": 6.670948553796266e-05} +{"train_loss": 0.0020400595385581255, "global_step": 28260, "epoch": 237, "lr": 6.670739739082093e-05} +{"train_loss": 0.0052903019823133945, "global_step": 28261, "epoch": 237, "lr": 6.670530921087603e-05} +{"train_loss": 0.005341629963368177, "global_step": 28262, "epoch": 237, "lr": 6.670322099813203e-05} +{"train_loss": 0.003342791460454464, "global_step": 28263, "epoch": 237, "lr": 6.670113275259303e-05} +{"train_loss": 0.002284076064825058, "global_step": 28264, "epoch": 237, "lr": 6.669904447426316e-05} +{"train_loss": 0.00399243738502264, "global_step": 28265, "epoch": 237, "lr": 6.669695616314649e-05} +{"train_loss": 0.002427279017865658, "global_step": 28266, "epoch": 237, "lr": 6.669486781924712e-05} +{"train_loss": 0.002495133550837636, "global_step": 28267, "epoch": 237, "lr": 6.669277944256918e-05} +{"train_loss": 0.0049491869285702705, "global_step": 28268, "epoch": 237, "lr": 6.669069103311674e-05} +{"train_loss": 0.003487883135676384, "global_step": 28269, "epoch": 237, "lr": 6.668860259089391e-05} +{"train_loss": 0.004239792004227638, "global_step": 28270, "epoch": 237, "lr": 6.66865141159048e-05} +{"train_loss": 0.005183238070458174, "global_step": 28271, "epoch": 237, "lr": 6.668442560815351e-05} +{"train_loss": 0.0035591707564890385, "global_step": 28272, "epoch": 237, "lr": 6.668233706764412e-05} +{"train_loss": 0.004498708061873913, "global_step": 28273, "epoch": 237, "lr": 6.668024849438074e-05} +{"train_loss": 0.0028506843373179436, "global_step": 28274, "epoch": 237, "lr": 6.667815988836748e-05} +{"train_loss": 0.0050507294945418835, "global_step": 28275, "epoch": 237, "lr": 6.667607124960842e-05} +{"train_loss": 0.003038539318367839, "global_step": 28276, "epoch": 237, "lr": 6.667398257810771e-05} +{"train_loss": 0.002587861381471157, "global_step": 28277, "epoch": 237, "lr": 6.66718938738694e-05} +{"train_loss": 0.003881145268678665, "global_step": 28278, "epoch": 237, "lr": 6.66698051368976e-05} +{"train_loss": 0.00376978050917387, "global_step": 28279, "epoch": 237, "lr": 6.666771636719642e-05} +{"train_loss": 0.00378447026014328, "global_step": 28280, "epoch": 237, "lr": 6.666562756476997e-05} +{"train_loss": 0.004561746027320623, "global_step": 28281, "epoch": 237, "lr": 6.666353872962232e-05} +{"train_loss": 0.004427791107445955, "global_step": 28282, "epoch": 237, "lr": 6.66614498617576e-05} +{"train_loss": 0.0030444797594100237, "global_step": 28283, "epoch": 237, "lr": 6.66593609611799e-05} +{"train_loss": 0.002700702054426074, "global_step": 28284, "epoch": 237, "lr": 6.665727202789334e-05} +{"train_loss": 0.003990796394646168, "global_step": 28285, "epoch": 237, "lr": 6.6655183061902e-05} +{"train_loss": 0.004135763738304377, "global_step": 28286, "epoch": 237, "lr": 6.665309406320998e-05} +{"train_loss": 0.0040445453487336636, "global_step": 28287, "epoch": 237, "lr": 6.66510050318214e-05} +{"train_loss": 0.004083935637027025, "global_step": 28288, "epoch": 237, "lr": 6.664891596774034e-05} +{"train_loss": 0.003907582722604275, "global_step": 28289, "epoch": 237, "lr": 6.664682687097093e-05} +{"train_loss": 0.0036848506424576044, "global_step": 28290, "epoch": 237, "lr": 6.664473774151724e-05} +{"train_loss": 0.0027169163804501295, "global_step": 28291, "epoch": 237, "lr": 6.664264857938339e-05} +{"train_loss": 0.0037014405243098736, "global_step": 28292, "epoch": 237, "lr": 6.664055938457346e-05} +{"train_loss": 0.0027799042873084545, "global_step": 28293, "epoch": 237, "lr": 6.66384701570916e-05} +{"train_loss": 0.0026791593991219997, "global_step": 28294, "epoch": 237, "lr": 6.663638089694185e-05} +{"train_loss": 0.0032573568169027567, "global_step": 28295, "epoch": 237, "lr": 6.663429160412836e-05} +{"train_loss": 0.005265297368168831, "global_step": 28296, "epoch": 237, "lr": 6.663220227865523e-05} +{"train_loss": 0.002828243188560009, "global_step": 28297, "epoch": 237, "lr": 6.663011292052652e-05} +{"train_loss": 0.0031208305153995752, "global_step": 28298, "epoch": 237, "lr": 6.662802352974637e-05} +{"train_loss": 0.0020943619310855865, "global_step": 28299, "epoch": 237, "lr": 6.662593410631887e-05} +{"train_loss": 0.004177185241132975, "global_step": 28300, "epoch": 237, "lr": 6.662384465024813e-05} +{"train_loss": 0.0035589137114584446, "global_step": 28301, "epoch": 237, "lr": 6.662175516153824e-05} +{"train_loss": 0.003017937997356057, "global_step": 28302, "epoch": 237, "lr": 6.661966564019332e-05} +{"train_loss": 0.0031674792990088463, "global_step": 28303, "epoch": 237, "lr": 6.661757608621746e-05} +{"train_loss": 0.0059515805914998055, "global_step": 28304, "epoch": 237, "lr": 6.661548649961476e-05} +{"train_loss": 0.0032368595711886883, "global_step": 28305, "epoch": 237, "lr": 6.661339688038933e-05} +{"train_loss": 0.002845208626240492, "global_step": 28306, "epoch": 237, "lr": 6.661130722854527e-05} +{"train_loss": 0.0037339257542043924, "global_step": 28307, "epoch": 237, "lr": 6.660921754408668e-05} +{"train_loss": 0.004771990701556206, "global_step": 28308, "epoch": 237, "lr": 6.660712782701767e-05} +{"train_loss": 0.003912160638719797, "global_step": 28309, "epoch": 237, "lr": 6.660503807734234e-05} +{"train_loss": 0.0023451929446309805, "global_step": 28310, "epoch": 237, "lr": 6.66029482950648e-05} +{"train_loss": 0.00554195512086153, "global_step": 28311, "epoch": 237, "lr": 6.660085848018912e-05} +{"train_loss": 0.0023983903229236603, "global_step": 28312, "epoch": 237, "lr": 6.659876863271945e-05} +{"train_loss": 0.005098850466310978, "global_step": 28313, "epoch": 237, "lr": 6.659667875265986e-05} +{"train_loss": 0.003590247593820095, "global_step": 28314, "epoch": 237, "lr": 6.659458884001446e-05} +{"train_loss": 0.0029795696027576923, "global_step": 28315, "epoch": 237, "lr": 6.659249889478735e-05} +{"train_loss": 0.005269573535770178, "global_step": 28316, "epoch": 237, "lr": 6.659040891698267e-05} +{"train_loss": 0.003991936799138784, "global_step": 28317, "epoch": 237, "lr": 6.658831890660447e-05} +{"train_loss": 0.002930157817900181, "global_step": 28318, "epoch": 237, "lr": 6.65862288636569e-05} +{"train_loss": 0.004113487433642149, "global_step": 28319, "epoch": 237, "lr": 6.658413878814402e-05} +{"train_loss": 0.004649678710848093, "global_step": 28320, "epoch": 237, "lr": 6.658204868006996e-05} +{"train_loss": 0.0034905118983191976, "global_step": 28321, "epoch": 237, "lr": 6.657995853943884e-05, "val_loss": 0.02360045537352562} +{"train_loss": 0.005107654258608818, "global_step": 28322, "epoch": 238, "lr": 6.657786836625473e-05} +{"train_loss": 0.0039516533724963665, "global_step": 28323, "epoch": 238, "lr": 6.657577816052174e-05} +{"train_loss": 0.0025741765275597572, "global_step": 28324, "epoch": 238, "lr": 6.657368792224398e-05} +{"train_loss": 0.004202311858534813, "global_step": 28325, "epoch": 238, "lr": 6.657159765142555e-05} +{"train_loss": 0.003596353344619274, "global_step": 28326, "epoch": 238, "lr": 6.656950734807057e-05} +{"train_loss": 0.005314650479704142, "global_step": 28327, "epoch": 238, "lr": 6.656741701218313e-05} +{"train_loss": 0.004593343939632177, "global_step": 28328, "epoch": 238, "lr": 6.656532664376734e-05} +{"train_loss": 0.0024414388462901115, "global_step": 28329, "epoch": 238, "lr": 6.65632362428273e-05} +{"train_loss": 0.004703382961452007, "global_step": 28330, "epoch": 238, "lr": 6.65611458093671e-05} +{"train_loss": 0.0035663838498294353, "global_step": 28331, "epoch": 238, "lr": 6.655905534339088e-05} +{"train_loss": 0.003401108318939805, "global_step": 28332, "epoch": 238, "lr": 6.655696484490271e-05} +{"train_loss": 0.0031124907545745373, "global_step": 28333, "epoch": 238, "lr": 6.655487431390671e-05} +{"train_loss": 0.004456629045307636, "global_step": 28334, "epoch": 238, "lr": 6.655278375040699e-05} +{"train_loss": 0.002866231370717287, "global_step": 28335, "epoch": 238, "lr": 6.655069315440764e-05} +{"train_loss": 0.0030917138792574406, "global_step": 28336, "epoch": 238, "lr": 6.654860252591278e-05} +{"train_loss": 0.0048227193765342236, "global_step": 28337, "epoch": 238, "lr": 6.65465118649265e-05} +{"train_loss": 0.002827134681865573, "global_step": 28338, "epoch": 238, "lr": 6.65444211714529e-05} +{"train_loss": 0.006430065259337425, "global_step": 28339, "epoch": 238, "lr": 6.654233044549612e-05} +{"train_loss": 0.0033825584687292576, "global_step": 28340, "epoch": 238, "lr": 6.654023968706025e-05} +{"train_loss": 0.002300008200109005, "global_step": 28341, "epoch": 238, "lr": 6.653814889614935e-05} +{"train_loss": 0.008030418306589127, "global_step": 28342, "epoch": 238, "lr": 6.65360580727676e-05} +{"train_loss": 0.005352096166461706, "global_step": 28343, "epoch": 238, "lr": 6.653396721691903e-05} +{"train_loss": 0.0039386264979839325, "global_step": 28344, "epoch": 238, "lr": 6.65318763286078e-05} +{"train_loss": 0.0029509940650314093, "global_step": 28345, "epoch": 238, "lr": 6.6529785407838e-05} +{"train_loss": 0.004600880201905966, "global_step": 28346, "epoch": 238, "lr": 6.652769445461374e-05} +{"train_loss": 0.004064141307026148, "global_step": 28347, "epoch": 238, "lr": 6.65256034689391e-05} +{"train_loss": 0.00416044145822525, "global_step": 28348, "epoch": 238, "lr": 6.65235124508182e-05} +{"train_loss": 0.005081614945083857, "global_step": 28349, "epoch": 238, "lr": 6.652142140025517e-05} +{"train_loss": 0.005400851834565401, "global_step": 28350, "epoch": 238, "lr": 6.651933031725406e-05} +{"train_loss": 0.0021328118164092302, "global_step": 28351, "epoch": 238, "lr": 6.651723920181904e-05} +{"train_loss": 0.004682869650423527, "global_step": 28352, "epoch": 238, "lr": 6.651514805395417e-05} +{"train_loss": 0.003660554066300392, "global_step": 28353, "epoch": 238, "lr": 6.651305687366358e-05} +{"train_loss": 0.0031704495195299387, "global_step": 28354, "epoch": 238, "lr": 6.651096566095137e-05} +{"train_loss": 0.005141441710293293, "global_step": 28355, "epoch": 238, "lr": 6.650887441582163e-05} +{"train_loss": 0.0028119327034801245, "global_step": 28356, "epoch": 238, "lr": 6.65067831382785e-05} +{"train_loss": 0.0031647635623812675, "global_step": 28357, "epoch": 238, "lr": 6.650469182832604e-05} +{"train_loss": 0.002428904175758362, "global_step": 28358, "epoch": 238, "lr": 6.650260048596838e-05} +{"train_loss": 0.004371446557343006, "global_step": 28359, "epoch": 238, "lr": 6.650050911120967e-05} +{"train_loss": 0.004551609046757221, "global_step": 28360, "epoch": 238, "lr": 6.649841770405393e-05} +{"train_loss": 0.004309257958084345, "global_step": 28361, "epoch": 238, "lr": 6.649632626450533e-05} +{"train_loss": 0.005065294913947582, "global_step": 28362, "epoch": 238, "lr": 6.649423479256795e-05} +{"train_loss": 0.0024901162832975388, "global_step": 28363, "epoch": 238, "lr": 6.649214328824589e-05} +{"train_loss": 0.0025083061773329973, "global_step": 28364, "epoch": 238, "lr": 6.649005175154329e-05} +{"train_loss": 0.002960024168714881, "global_step": 28365, "epoch": 238, "lr": 6.648796018246422e-05} +{"train_loss": 0.004472246393561363, "global_step": 28366, "epoch": 238, "lr": 6.648586858101279e-05} +{"train_loss": 0.001979559427127242, "global_step": 28367, "epoch": 238, "lr": 6.648377694719314e-05} +{"train_loss": 0.003977297339588404, "global_step": 28368, "epoch": 238, "lr": 6.648168528100934e-05} +{"train_loss": 0.00501724099740386, "global_step": 28369, "epoch": 238, "lr": 6.647959358246551e-05} +{"train_loss": 0.0026137223467230797, "global_step": 28370, "epoch": 238, "lr": 6.647750185156578e-05} +{"train_loss": 0.003543310333043337, "global_step": 28371, "epoch": 238, "lr": 6.647541008831423e-05} +{"train_loss": 0.002091370290145278, "global_step": 28372, "epoch": 238, "lr": 6.647331829271496e-05} +{"train_loss": 0.006796953268349171, "global_step": 28373, "epoch": 238, "lr": 6.647122646477211e-05} +{"train_loss": 0.0030914125964045525, "global_step": 28374, "epoch": 238, "lr": 6.646913460448975e-05} +{"train_loss": 0.002598996041342616, "global_step": 28375, "epoch": 238, "lr": 6.6467042711872e-05} +{"train_loss": 0.0030608498491346836, "global_step": 28376, "epoch": 238, "lr": 6.646495078692298e-05} +{"train_loss": 0.004001782741397619, "global_step": 28377, "epoch": 238, "lr": 6.646285882964678e-05} +{"train_loss": 0.002209798200055957, "global_step": 28378, "epoch": 238, "lr": 6.646076684004753e-05} +{"train_loss": 0.0019872100092470646, "global_step": 28379, "epoch": 238, "lr": 6.64586748181293e-05} +{"train_loss": 0.0061150346882641315, "global_step": 28380, "epoch": 238, "lr": 6.645658276389625e-05} +{"train_loss": 0.003203892381861806, "global_step": 28381, "epoch": 238, "lr": 6.645449067735244e-05} +{"train_loss": 0.0025590802542865276, "global_step": 28382, "epoch": 238, "lr": 6.645239855850199e-05} +{"train_loss": 0.002218431793153286, "global_step": 28383, "epoch": 238, "lr": 6.645030640734901e-05} +{"train_loss": 0.0035722842440009117, "global_step": 28384, "epoch": 238, "lr": 6.644821422389763e-05} +{"train_loss": 0.0020136453676968813, "global_step": 28385, "epoch": 238, "lr": 6.644612200815192e-05} +{"train_loss": 0.003816549899056554, "global_step": 28386, "epoch": 238, "lr": 6.644402976011602e-05} +{"train_loss": 0.002952823881059885, "global_step": 28387, "epoch": 238, "lr": 6.644193747979403e-05} +{"train_loss": 0.0030866251327097416, "global_step": 28388, "epoch": 238, "lr": 6.643984516719004e-05} +{"train_loss": 0.004933780990540981, "global_step": 28389, "epoch": 238, "lr": 6.643775282230817e-05} +{"train_loss": 0.0017703525954857469, "global_step": 28390, "epoch": 238, "lr": 6.643566044515254e-05} +{"train_loss": 0.0030088601633906364, "global_step": 28391, "epoch": 238, "lr": 6.643356803572724e-05} +{"train_loss": 0.004379380494356155, "global_step": 28392, "epoch": 238, "lr": 6.643147559403638e-05} +{"train_loss": 0.0037232432514429092, "global_step": 28393, "epoch": 238, "lr": 6.642938312008408e-05} +{"train_loss": 0.002965525956824422, "global_step": 28394, "epoch": 238, "lr": 6.642729061387443e-05} +{"train_loss": 0.002870232332497835, "global_step": 28395, "epoch": 238, "lr": 6.642519807541156e-05} +{"train_loss": 0.0022277594543993473, "global_step": 28396, "epoch": 238, "lr": 6.642310550469957e-05} +{"train_loss": 0.004693853203207254, "global_step": 28397, "epoch": 238, "lr": 6.642101290174256e-05} +{"train_loss": 0.002316382247954607, "global_step": 28398, "epoch": 238, "lr": 6.641892026654464e-05} +{"train_loss": 0.0035167746245861053, "global_step": 28399, "epoch": 238, "lr": 6.641682759910994e-05} +{"train_loss": 0.005697394255548716, "global_step": 28400, "epoch": 238, "lr": 6.641473489944255e-05} +{"train_loss": 0.005563309881836176, "global_step": 28401, "epoch": 238, "lr": 6.641264216754657e-05} +{"train_loss": 0.0021901456639170647, "global_step": 28402, "epoch": 238, "lr": 6.641054940342612e-05} +{"train_loss": 0.004620252177119255, "global_step": 28403, "epoch": 238, "lr": 6.640845660708532e-05} +{"train_loss": 0.00483449874445796, "global_step": 28404, "epoch": 238, "lr": 6.640636377852827e-05} +{"train_loss": 0.004756382666528225, "global_step": 28405, "epoch": 238, "lr": 6.640427091775908e-05} +{"train_loss": 0.0031201590318232775, "global_step": 28406, "epoch": 238, "lr": 6.640217802478184e-05} +{"train_loss": 0.0043663447722792625, "global_step": 28407, "epoch": 238, "lr": 6.640008509960068e-05} +{"train_loss": 0.0032384758815169334, "global_step": 28408, "epoch": 238, "lr": 6.63979921422197e-05} +{"train_loss": 0.0046812086366117, "global_step": 28409, "epoch": 238, "lr": 6.639589915264305e-05} +{"train_loss": 0.002661596518009901, "global_step": 28410, "epoch": 238, "lr": 6.639380613087478e-05} +{"train_loss": 0.0039998916909098625, "global_step": 28411, "epoch": 238, "lr": 6.639171307691901e-05} +{"train_loss": 0.0038274400867521763, "global_step": 28412, "epoch": 238, "lr": 6.638961999077988e-05} +{"train_loss": 0.0020457394421100616, "global_step": 28413, "epoch": 238, "lr": 6.638752687246147e-05} +{"train_loss": 0.002140316879376769, "global_step": 28414, "epoch": 238, "lr": 6.638543372196791e-05} +{"train_loss": 0.0032174831721931696, "global_step": 28415, "epoch": 238, "lr": 6.638334053930329e-05} +{"train_loss": 0.0029827975668013096, "global_step": 28416, "epoch": 238, "lr": 6.638124732447175e-05} +{"train_loss": 0.003930726088583469, "global_step": 28417, "epoch": 238, "lr": 6.637915407747736e-05} +{"train_loss": 0.004129413049668074, "global_step": 28418, "epoch": 238, "lr": 6.637706079832427e-05} +{"train_loss": 0.0033784639090299606, "global_step": 28419, "epoch": 238, "lr": 6.637496748701657e-05} +{"train_loss": 0.0036644521169364452, "global_step": 28420, "epoch": 238, "lr": 6.637287414355835e-05} +{"train_loss": 0.0036743946839123964, "global_step": 28421, "epoch": 238, "lr": 6.637078076795375e-05} +{"train_loss": 0.0030522169545292854, "global_step": 28422, "epoch": 238, "lr": 6.636868736020689e-05} +{"train_loss": 0.0040449658408761024, "global_step": 28423, "epoch": 238, "lr": 6.636659392032185e-05} +{"train_loss": 0.0024365847930312157, "global_step": 28424, "epoch": 238, "lr": 6.636450044830274e-05} +{"train_loss": 0.00364474393427372, "global_step": 28425, "epoch": 238, "lr": 6.63624069441537e-05} +{"train_loss": 0.003548051230609417, "global_step": 28426, "epoch": 238, "lr": 6.63603134078788e-05} +{"train_loss": 0.0043577151373028755, "global_step": 28427, "epoch": 238, "lr": 6.635821983948218e-05} +{"train_loss": 0.004089977592229843, "global_step": 28428, "epoch": 238, "lr": 6.635612623896797e-05} +{"train_loss": 0.002770742867141962, "global_step": 28429, "epoch": 238, "lr": 6.635403260634022e-05} +{"train_loss": 0.005173888988792896, "global_step": 28430, "epoch": 238, "lr": 6.635193894160309e-05} +{"train_loss": 0.002466205507516861, "global_step": 28431, "epoch": 238, "lr": 6.634984524476067e-05} +{"train_loss": 0.003143193433061242, "global_step": 28432, "epoch": 238, "lr": 6.634775151581707e-05} +{"train_loss": 0.004159353207796812, "global_step": 28433, "epoch": 238, "lr": 6.634565775477639e-05} +{"train_loss": 0.002481456147506833, "global_step": 28434, "epoch": 238, "lr": 6.634356396164279e-05} +{"train_loss": 0.003262226702645421, "global_step": 28435, "epoch": 238, "lr": 6.634147013642033e-05} +{"train_loss": 0.003690604818984866, "global_step": 28436, "epoch": 238, "lr": 6.633937627911315e-05} +{"train_loss": 0.0018425555899739265, "global_step": 28437, "epoch": 238, "lr": 6.633728238972536e-05} +{"train_loss": 0.006350954528898001, "global_step": 28438, "epoch": 238, "lr": 6.633518846826104e-05} +{"train_loss": 0.0027216547168791294, "global_step": 28439, "epoch": 238, "lr": 6.633309451472432e-05} +{"train_loss": 0.003673326228980069, "global_step": 28440, "epoch": 238, "lr": 6.633100052911934e-05, "val_loss": 0.01989164762198925} +{"train_loss": 0.007724231109023094, "global_step": 28441, "epoch": 239, "lr": 6.632890651145017e-05} +{"train_loss": 0.003875776194036007, "global_step": 28442, "epoch": 239, "lr": 6.632681246172094e-05} +{"train_loss": 0.003650826634839177, "global_step": 28443, "epoch": 239, "lr": 6.632471837993575e-05} +{"train_loss": 0.00339097180403769, "global_step": 28444, "epoch": 239, "lr": 6.632262426609873e-05} +{"train_loss": 0.0060087768360972404, "global_step": 28445, "epoch": 239, "lr": 6.632053012021396e-05} +{"train_loss": 0.003914806991815567, "global_step": 28446, "epoch": 239, "lr": 6.631843594228559e-05} +{"train_loss": 0.004692959599196911, "global_step": 28447, "epoch": 239, "lr": 6.631634173231772e-05} +{"train_loss": 0.0069046346470713615, "global_step": 28448, "epoch": 239, "lr": 6.631424749031443e-05} +{"train_loss": 0.005565257277339697, "global_step": 28449, "epoch": 239, "lr": 6.631215321627988e-05} +{"train_loss": 0.002997299423441291, "global_step": 28450, "epoch": 239, "lr": 6.631005891021816e-05} +{"train_loss": 0.004711298272013664, "global_step": 28451, "epoch": 239, "lr": 6.630796457213338e-05} +{"train_loss": 0.003834844334051013, "global_step": 28452, "epoch": 239, "lr": 6.630587020202964e-05} +{"train_loss": 0.0035059305373579264, "global_step": 28453, "epoch": 239, "lr": 6.63037757999111e-05} +{"train_loss": 0.003695076797157526, "global_step": 28454, "epoch": 239, "lr": 6.63016813657818e-05} +{"train_loss": 0.0032356525771319866, "global_step": 28455, "epoch": 239, "lr": 6.62995868996459e-05} +{"train_loss": 0.005453627090901136, "global_step": 28456, "epoch": 239, "lr": 6.629749240150751e-05} +{"train_loss": 0.006865413393825293, "global_step": 28457, "epoch": 239, "lr": 6.629539787137074e-05} +{"train_loss": 0.003426109440624714, "global_step": 28458, "epoch": 239, "lr": 6.629330330923969e-05} +{"train_loss": 0.004369003232568502, "global_step": 28459, "epoch": 239, "lr": 6.629120871511848e-05} +{"train_loss": 0.003551872679963708, "global_step": 28460, "epoch": 239, "lr": 6.628911408901122e-05} +{"train_loss": 0.005298686679452658, "global_step": 28461, "epoch": 239, "lr": 6.628701943092202e-05} +{"train_loss": 0.004144384991377592, "global_step": 28462, "epoch": 239, "lr": 6.628492474085501e-05} +{"train_loss": 0.004617375321686268, "global_step": 28463, "epoch": 239, "lr": 6.628283001881427e-05} +{"train_loss": 0.005929538514465094, "global_step": 28464, "epoch": 239, "lr": 6.628073526480397e-05} +{"train_loss": 0.004611525218933821, "global_step": 28465, "epoch": 239, "lr": 6.627864047882814e-05} +{"train_loss": 0.003986467607319355, "global_step": 28466, "epoch": 239, "lr": 6.627654566089097e-05} +{"train_loss": 0.0053557478822767735, "global_step": 28467, "epoch": 239, "lr": 6.627445081099652e-05} +{"train_loss": 0.005053746048361063, "global_step": 28468, "epoch": 239, "lr": 6.627235592914894e-05} +{"train_loss": 0.005426390562206507, "global_step": 28469, "epoch": 239, "lr": 6.627026101535233e-05} +{"train_loss": 0.0037100205663591623, "global_step": 28470, "epoch": 239, "lr": 6.626816606961079e-05} +{"train_loss": 0.005195992067456245, "global_step": 28471, "epoch": 239, "lr": 6.626607109192845e-05} +{"train_loss": 0.0023712862748652697, "global_step": 28472, "epoch": 239, "lr": 6.626397608230943e-05} +{"train_loss": 0.0037781214341521263, "global_step": 28473, "epoch": 239, "lr": 6.626188104075781e-05} +{"train_loss": 0.006414325442165136, "global_step": 28474, "epoch": 239, "lr": 6.625978596727773e-05} +{"train_loss": 0.0034466965589672327, "global_step": 28475, "epoch": 239, "lr": 6.62576908618733e-05} +{"train_loss": 0.0032054861076176167, "global_step": 28476, "epoch": 239, "lr": 6.625559572454862e-05} +{"train_loss": 0.002980461809784174, "global_step": 28477, "epoch": 239, "lr": 6.625350055530783e-05} +{"train_loss": 0.0030160737223923206, "global_step": 28478, "epoch": 239, "lr": 6.625140535415503e-05} +{"train_loss": 0.0029508243314921856, "global_step": 28479, "epoch": 239, "lr": 6.624931012109433e-05} +{"train_loss": 0.005059008486568928, "global_step": 28480, "epoch": 239, "lr": 6.624721485612984e-05} +{"train_loss": 0.005038680043071508, "global_step": 28481, "epoch": 239, "lr": 6.624511955926567e-05} +{"train_loss": 0.005278724245727062, "global_step": 28482, "epoch": 239, "lr": 6.624302423050593e-05} +{"train_loss": 0.0049438769929111, "global_step": 28483, "epoch": 239, "lr": 6.624092886985477e-05} +{"train_loss": 0.0034669344313442707, "global_step": 28484, "epoch": 239, "lr": 6.62388334773163e-05} +{"train_loss": 0.0054451292380690575, "global_step": 28485, "epoch": 239, "lr": 6.623673805289459e-05} +{"train_loss": 0.005852506961673498, "global_step": 28486, "epoch": 239, "lr": 6.623464259659378e-05} +{"train_loss": 0.0038672008085995913, "global_step": 28487, "epoch": 239, "lr": 6.623254710841799e-05} +{"train_loss": 0.003278719959780574, "global_step": 28488, "epoch": 239, "lr": 6.623045158837132e-05} +{"train_loss": 0.003753402503207326, "global_step": 28489, "epoch": 239, "lr": 6.62283560364579e-05} +{"train_loss": 0.0035309740342199802, "global_step": 28490, "epoch": 239, "lr": 6.622626045268184e-05} +{"train_loss": 0.00560026103630662, "global_step": 28491, "epoch": 239, "lr": 6.622416483704726e-05} +{"train_loss": 0.002814080100506544, "global_step": 28492, "epoch": 239, "lr": 6.622206918955825e-05} +{"train_loss": 0.004285670816898346, "global_step": 28493, "epoch": 239, "lr": 6.621997351021894e-05} +{"train_loss": 0.005402558017522097, "global_step": 28494, "epoch": 239, "lr": 6.621787779903343e-05} +{"train_loss": 0.0037361907307058573, "global_step": 28495, "epoch": 239, "lr": 6.621578205600587e-05} +{"train_loss": 0.005310392472893, "global_step": 28496, "epoch": 239, "lr": 6.621368628114035e-05} +{"train_loss": 0.005778824910521507, "global_step": 28497, "epoch": 239, "lr": 6.621159047444098e-05} +{"train_loss": 0.0036089150235056877, "global_step": 28498, "epoch": 239, "lr": 6.62094946359119e-05} +{"train_loss": 0.0034939893521368504, "global_step": 28499, "epoch": 239, "lr": 6.620739876555721e-05} +{"train_loss": 0.003085471224039793, "global_step": 28500, "epoch": 239, "lr": 6.620530286338102e-05} +{"train_loss": 0.004174991976469755, "global_step": 28501, "epoch": 239, "lr": 6.620320692938745e-05} +{"train_loss": 0.004218571353703737, "global_step": 28502, "epoch": 239, "lr": 6.62011109635806e-05} +{"train_loss": 0.004231484141200781, "global_step": 28503, "epoch": 239, "lr": 6.619901496596462e-05} +{"train_loss": 0.003580812830477953, "global_step": 28504, "epoch": 239, "lr": 6.61969189365436e-05} +{"train_loss": 0.00407600961625576, "global_step": 28505, "epoch": 239, "lr": 6.619482287532164e-05} +{"train_loss": 0.005220821592956781, "global_step": 28506, "epoch": 239, "lr": 6.61927267823029e-05} +{"train_loss": 0.004800859373062849, "global_step": 28507, "epoch": 239, "lr": 6.619063065749145e-05} +{"train_loss": 0.004233347252011299, "global_step": 28508, "epoch": 239, "lr": 6.618853450089145e-05} +{"train_loss": 0.004677037242799997, "global_step": 28509, "epoch": 239, "lr": 6.618643831250698e-05} +{"train_loss": 0.003161936067044735, "global_step": 28510, "epoch": 239, "lr": 6.618434209234217e-05} +{"train_loss": 0.004234225954860449, "global_step": 28511, "epoch": 239, "lr": 6.618224584040112e-05} +{"train_loss": 0.002232474507763982, "global_step": 28512, "epoch": 239, "lr": 6.618014955668798e-05} +{"train_loss": 0.0021466363687068224, "global_step": 28513, "epoch": 239, "lr": 6.617805324120683e-05} +{"train_loss": 0.0024679601192474365, "global_step": 28514, "epoch": 239, "lr": 6.61759568939618e-05} +{"train_loss": 0.0029623559676110744, "global_step": 28515, "epoch": 239, "lr": 6.617386051495703e-05} +{"train_loss": 0.0054082064889371395, "global_step": 28516, "epoch": 239, "lr": 6.617176410419658e-05} +{"train_loss": 0.005209417548030615, "global_step": 28517, "epoch": 239, "lr": 6.61696676616846e-05} +{"train_loss": 0.0029394340235739946, "global_step": 28518, "epoch": 239, "lr": 6.616757118742523e-05} +{"train_loss": 0.0028960152994841337, "global_step": 28519, "epoch": 239, "lr": 6.616547468142255e-05} +{"train_loss": 0.0044726962223649025, "global_step": 28520, "epoch": 239, "lr": 6.616337814368068e-05} +{"train_loss": 0.004658951424062252, "global_step": 28521, "epoch": 239, "lr": 6.616128157420376e-05} +{"train_loss": 0.0037292498163878918, "global_step": 28522, "epoch": 239, "lr": 6.615918497299589e-05} +{"train_loss": 0.0036542550660669804, "global_step": 28523, "epoch": 239, "lr": 6.615708834006117e-05} +{"train_loss": 0.0023283986374735832, "global_step": 28524, "epoch": 239, "lr": 6.615499167540374e-05} +{"train_loss": 0.004242682829499245, "global_step": 28525, "epoch": 239, "lr": 6.615289497902771e-05} +{"train_loss": 0.00426713889464736, "global_step": 28526, "epoch": 239, "lr": 6.61507982509372e-05} +{"train_loss": 0.0036318181082606316, "global_step": 28527, "epoch": 239, "lr": 6.614870149113633e-05} +{"train_loss": 0.004324801731854677, "global_step": 28528, "epoch": 239, "lr": 6.61466046996292e-05} +{"train_loss": 0.0023063188418745995, "global_step": 28529, "epoch": 239, "lr": 6.614450787641994e-05} +{"train_loss": 0.004377724602818489, "global_step": 28530, "epoch": 239, "lr": 6.614241102151266e-05} +{"train_loss": 0.0029795009177178144, "global_step": 28531, "epoch": 239, "lr": 6.614031413491146e-05} +{"train_loss": 0.002628884743899107, "global_step": 28532, "epoch": 239, "lr": 6.61382172166205e-05} +{"train_loss": 0.002235857769846916, "global_step": 28533, "epoch": 239, "lr": 6.613612026664387e-05} +{"train_loss": 0.002990440698340535, "global_step": 28534, "epoch": 239, "lr": 6.613402328498572e-05} +{"train_loss": 0.002100384794175625, "global_step": 28535, "epoch": 239, "lr": 6.61319262716501e-05} +{"train_loss": 0.00231725350022316, "global_step": 28536, "epoch": 239, "lr": 6.612982922664119e-05} +{"train_loss": 0.002190591301769018, "global_step": 28537, "epoch": 239, "lr": 6.612773214996306e-05} +{"train_loss": 0.0023528554011136293, "global_step": 28538, "epoch": 239, "lr": 6.612563504161987e-05} +{"train_loss": 0.003031922969967127, "global_step": 28539, "epoch": 239, "lr": 6.612353790161572e-05} +{"train_loss": 0.002210170030593872, "global_step": 28540, "epoch": 239, "lr": 6.612144072995471e-05} +{"train_loss": 0.0025786440819501877, "global_step": 28541, "epoch": 239, "lr": 6.6119343526641e-05} +{"train_loss": 0.0029440864454954863, "global_step": 28542, "epoch": 239, "lr": 6.611724629167865e-05} +{"train_loss": 0.0033094899263232946, "global_step": 28543, "epoch": 239, "lr": 6.611514902507184e-05} +{"train_loss": 0.0015981642063707113, "global_step": 28544, "epoch": 239, "lr": 6.611305172682463e-05} +{"train_loss": 0.0026494136545807123, "global_step": 28545, "epoch": 239, "lr": 6.611095439694117e-05} +{"train_loss": 0.001740416744723916, "global_step": 28546, "epoch": 239, "lr": 6.610885703542558e-05} +{"train_loss": 0.003492176067084074, "global_step": 28547, "epoch": 239, "lr": 6.610675964228196e-05} +{"train_loss": 0.0029183696024119854, "global_step": 28548, "epoch": 239, "lr": 6.610466221751443e-05} +{"train_loss": 0.0030559676233679056, "global_step": 28549, "epoch": 239, "lr": 6.610256476112714e-05} +{"train_loss": 0.005093684419989586, "global_step": 28550, "epoch": 239, "lr": 6.610046727312417e-05} +{"train_loss": 0.0019982748199254274, "global_step": 28551, "epoch": 239, "lr": 6.609836975350966e-05} +{"train_loss": 0.0022425029892474413, "global_step": 28552, "epoch": 239, "lr": 6.609627220228771e-05} +{"train_loss": 0.0036755844485014677, "global_step": 28553, "epoch": 239, "lr": 6.609417461946247e-05} +{"train_loss": 0.0035990653559565544, "global_step": 28554, "epoch": 239, "lr": 6.609207700503802e-05} +{"train_loss": 0.0033965245820581913, "global_step": 28555, "epoch": 239, "lr": 6.608997935901851e-05} +{"train_loss": 0.0029803388752043247, "global_step": 28556, "epoch": 239, "lr": 6.608788168140802e-05} +{"train_loss": 0.0042690918780863285, "global_step": 28557, "epoch": 239, "lr": 6.608578397221072e-05} +{"train_loss": 0.004392318427562714, "global_step": 28558, "epoch": 239, "lr": 6.608368623143069e-05} +{"train_loss": 0.0039056813825673166, "global_step": 28559, "epoch": 239, "lr": 6.608158845907206e-05, "val_loss": 0.014240200631320477} +{"train_loss": 0.004305383190512657, "global_step": 28560, "epoch": 240, "lr": 6.607949065513896e-05} +{"train_loss": 0.0040976316668093204, "global_step": 28561, "epoch": 240, "lr": 6.607739281963547e-05} +{"train_loss": 0.0016725369496271014, "global_step": 28562, "epoch": 240, "lr": 6.607529495256576e-05} +{"train_loss": 0.0038379053585231304, "global_step": 28563, "epoch": 240, "lr": 6.607319705393392e-05} +{"train_loss": 0.002121842000633478, "global_step": 28564, "epoch": 240, "lr": 6.607109912374407e-05} +{"train_loss": 0.004208406899124384, "global_step": 28565, "epoch": 240, "lr": 6.606900116200034e-05} +{"train_loss": 0.004508852958679199, "global_step": 28566, "epoch": 240, "lr": 6.606690316870684e-05} +{"train_loss": 0.0025305193848907948, "global_step": 28567, "epoch": 240, "lr": 6.60648051438677e-05} +{"train_loss": 0.0014413524186238647, "global_step": 28568, "epoch": 240, "lr": 6.606270708748702e-05} +{"train_loss": 0.001599111477844417, "global_step": 28569, "epoch": 240, "lr": 6.606060899956893e-05} +{"train_loss": 0.0034785314928740263, "global_step": 28570, "epoch": 240, "lr": 6.605851088011756e-05} +{"train_loss": 0.004595934879034758, "global_step": 28571, "epoch": 240, "lr": 6.6056412729137e-05} +{"train_loss": 0.004296406172215939, "global_step": 28572, "epoch": 240, "lr": 6.605431454663142e-05} +{"train_loss": 0.001953969243913889, "global_step": 28573, "epoch": 240, "lr": 6.60522163326049e-05} +{"train_loss": 0.0028385939076542854, "global_step": 28574, "epoch": 240, "lr": 6.605011808706157e-05} +{"train_loss": 0.0028065661899745464, "global_step": 28575, "epoch": 240, "lr": 6.604801981000553e-05} +{"train_loss": 0.0038214754313230515, "global_step": 28576, "epoch": 240, "lr": 6.604592150144092e-05} +{"train_loss": 0.004761848598718643, "global_step": 28577, "epoch": 240, "lr": 6.604382316137186e-05} +{"train_loss": 0.002129064640030265, "global_step": 28578, "epoch": 240, "lr": 6.604172478980249e-05} +{"train_loss": 0.0035616469103842974, "global_step": 28579, "epoch": 240, "lr": 6.603962638673688e-05} +{"train_loss": 0.0034828614443540573, "global_step": 28580, "epoch": 240, "lr": 6.603752795217917e-05} +{"train_loss": 0.002002432942390442, "global_step": 28581, "epoch": 240, "lr": 6.603542948613351e-05} +{"train_loss": 0.003417614381760359, "global_step": 28582, "epoch": 240, "lr": 6.603333098860398e-05} +{"train_loss": 0.004318527411669493, "global_step": 28583, "epoch": 240, "lr": 6.603123245959472e-05} +{"train_loss": 0.002972880145534873, "global_step": 28584, "epoch": 240, "lr": 6.602913389910987e-05} +{"train_loss": 0.00478194048628211, "global_step": 28585, "epoch": 240, "lr": 6.602703530715352e-05} +{"train_loss": 0.002137297298759222, "global_step": 28586, "epoch": 240, "lr": 6.602493668372978e-05} +{"train_loss": 0.0026159051340073347, "global_step": 28587, "epoch": 240, "lr": 6.60228380288428e-05} +{"train_loss": 0.005382596515119076, "global_step": 28588, "epoch": 240, "lr": 6.60207393424967e-05} +{"train_loss": 0.0028343326412141323, "global_step": 28589, "epoch": 240, "lr": 6.601864062469558e-05} +{"train_loss": 0.001486957655288279, "global_step": 28590, "epoch": 240, "lr": 6.601654187544356e-05} +{"train_loss": 0.0030630792025476694, "global_step": 28591, "epoch": 240, "lr": 6.60144430947448e-05} +{"train_loss": 0.0035001817159354687, "global_step": 28592, "epoch": 240, "lr": 6.601234428260337e-05} +{"train_loss": 0.0019121771911159158, "global_step": 28593, "epoch": 240, "lr": 6.601024543902341e-05} +{"train_loss": 0.0038788404781371355, "global_step": 28594, "epoch": 240, "lr": 6.600814656400904e-05} +{"train_loss": 0.0037219154182821512, "global_step": 28595, "epoch": 240, "lr": 6.60060476575644e-05} +{"train_loss": 0.004196705296635628, "global_step": 28596, "epoch": 240, "lr": 6.600394871969358e-05} +{"train_loss": 0.0031731114722788334, "global_step": 28597, "epoch": 240, "lr": 6.600184975040073e-05} +{"train_loss": 0.0028929829131811857, "global_step": 28598, "epoch": 240, "lr": 6.599975074968996e-05} +{"train_loss": 0.0038631607312709093, "global_step": 28599, "epoch": 240, "lr": 6.599765171756538e-05} +{"train_loss": 0.0032109366729855537, "global_step": 28600, "epoch": 240, "lr": 6.599555265403112e-05} +{"train_loss": 0.0020796856842935085, "global_step": 28601, "epoch": 240, "lr": 6.59934535590913e-05} +{"train_loss": 0.001964392140507698, "global_step": 28602, "epoch": 240, "lr": 6.599135443275003e-05} +{"train_loss": 0.005852631758898497, "global_step": 28603, "epoch": 240, "lr": 6.598925527501149e-05} +{"train_loss": 0.0028983631636947393, "global_step": 28604, "epoch": 240, "lr": 6.598715608587973e-05} +{"train_loss": 0.0032751390244811773, "global_step": 28605, "epoch": 240, "lr": 6.598505686535887e-05} +{"train_loss": 0.0017307527596130967, "global_step": 28606, "epoch": 240, "lr": 6.598295761345309e-05} +{"train_loss": 0.00514549994841218, "global_step": 28607, "epoch": 240, "lr": 6.598085833016648e-05} +{"train_loss": 0.00250905635766685, "global_step": 28608, "epoch": 240, "lr": 6.597875901550314e-05} +{"train_loss": 0.00235364749096334, "global_step": 28609, "epoch": 240, "lr": 6.597665966946722e-05} +{"train_loss": 0.005313404370099306, "global_step": 28610, "epoch": 240, "lr": 6.597456029206286e-05} +{"train_loss": 0.002155747963115573, "global_step": 28611, "epoch": 240, "lr": 6.597246088329415e-05} +{"train_loss": 0.002907827729359269, "global_step": 28612, "epoch": 240, "lr": 6.59703614431652e-05} +{"train_loss": 0.002788265235722065, "global_step": 28613, "epoch": 240, "lr": 6.596826197168015e-05} +{"train_loss": 0.0026353965513408184, "global_step": 28614, "epoch": 240, "lr": 6.596616246884315e-05} +{"train_loss": 0.0032456873450428247, "global_step": 28615, "epoch": 240, "lr": 6.596406293465825e-05} +{"train_loss": 0.0038770241662859917, "global_step": 28616, "epoch": 240, "lr": 6.596196336912967e-05} +{"train_loss": 0.002490790095180273, "global_step": 28617, "epoch": 240, "lr": 6.595986377226145e-05} +{"train_loss": 0.0020595318637788296, "global_step": 28618, "epoch": 240, "lr": 6.595776414405774e-05} +{"train_loss": 0.0032633082009851933, "global_step": 28619, "epoch": 240, "lr": 6.595566448452268e-05} +{"train_loss": 0.004000726621598005, "global_step": 28620, "epoch": 240, "lr": 6.595356479366038e-05} +{"train_loss": 0.002687350381165743, "global_step": 28621, "epoch": 240, "lr": 6.595146507147495e-05} +{"train_loss": 0.002807429526001215, "global_step": 28622, "epoch": 240, "lr": 6.594936531797054e-05} +{"train_loss": 0.003176130587235093, "global_step": 28623, "epoch": 240, "lr": 6.594726553315122e-05} +{"train_loss": 0.002758475486189127, "global_step": 28624, "epoch": 240, "lr": 6.594516571702118e-05} +{"train_loss": 0.004677891731262207, "global_step": 28625, "epoch": 240, "lr": 6.59430658695845e-05} +{"train_loss": 0.0023885902483016253, "global_step": 28626, "epoch": 240, "lr": 6.59409659908453e-05} +{"train_loss": 0.0027412527706474066, "global_step": 28627, "epoch": 240, "lr": 6.593886608080774e-05} +{"train_loss": 0.0041701472364366055, "global_step": 28628, "epoch": 240, "lr": 6.59367661394759e-05} +{"train_loss": 0.004676898941397667, "global_step": 28629, "epoch": 240, "lr": 6.593466616685393e-05} +{"train_loss": 0.003789922222495079, "global_step": 28630, "epoch": 240, "lr": 6.593256616294594e-05} +{"train_loss": 0.0028207607101649046, "global_step": 28631, "epoch": 240, "lr": 6.593046612775606e-05} +{"train_loss": 0.003606516867876053, "global_step": 28632, "epoch": 240, "lr": 6.592836606128843e-05} +{"train_loss": 0.0035884275566786528, "global_step": 28633, "epoch": 240, "lr": 6.592626596354714e-05} +{"train_loss": 0.003284347476437688, "global_step": 28634, "epoch": 240, "lr": 6.592416583453632e-05} +{"train_loss": 0.00269297044724226, "global_step": 28635, "epoch": 240, "lr": 6.592206567426012e-05} +{"train_loss": 0.0032671685330569744, "global_step": 28636, "epoch": 240, "lr": 6.591996548272264e-05} +{"train_loss": 0.0015639688353985548, "global_step": 28637, "epoch": 240, "lr": 6.5917865259928e-05} +{"train_loss": 0.0027323041576892138, "global_step": 28638, "epoch": 240, "lr": 6.591576500588033e-05} +{"train_loss": 0.001851669861935079, "global_step": 28639, "epoch": 240, "lr": 6.591366472058377e-05} +{"train_loss": 0.002910362323746085, "global_step": 28640, "epoch": 240, "lr": 6.591156440404241e-05} +{"train_loss": 0.002217261353507638, "global_step": 28641, "epoch": 240, "lr": 6.590946405626041e-05} +{"train_loss": 0.0046977149322628975, "global_step": 28642, "epoch": 240, "lr": 6.590736367724189e-05} +{"train_loss": 0.002601685468107462, "global_step": 28643, "epoch": 240, "lr": 6.590526326699093e-05} +{"train_loss": 0.003100100439041853, "global_step": 28644, "epoch": 240, "lr": 6.59031628255117e-05} +{"train_loss": 0.005305557046085596, "global_step": 28645, "epoch": 240, "lr": 6.59010623528083e-05} +{"train_loss": 0.0018308227881789207, "global_step": 28646, "epoch": 240, "lr": 6.589896184888488e-05} +{"train_loss": 0.003347305115312338, "global_step": 28647, "epoch": 240, "lr": 6.589686131374553e-05} +{"train_loss": 0.004471508786082268, "global_step": 28648, "epoch": 240, "lr": 6.58947607473944e-05} +{"train_loss": 0.0029024682007730007, "global_step": 28649, "epoch": 240, "lr": 6.589266014983559e-05} +{"train_loss": 0.0025636800564825535, "global_step": 28650, "epoch": 240, "lr": 6.589055952107325e-05} +{"train_loss": 0.0033504788298159838, "global_step": 28651, "epoch": 240, "lr": 6.58884588611115e-05} +{"train_loss": 0.003878089366480708, "global_step": 28652, "epoch": 240, "lr": 6.588635816995446e-05} +{"train_loss": 0.0027957523707300425, "global_step": 28653, "epoch": 240, "lr": 6.588425744760625e-05} +{"train_loss": 0.003413637401536107, "global_step": 28654, "epoch": 240, "lr": 6.5882156694071e-05} +{"train_loss": 0.002644310938194394, "global_step": 28655, "epoch": 240, "lr": 6.588005590935282e-05} +{"train_loss": 0.0024884105660021305, "global_step": 28656, "epoch": 240, "lr": 6.587795509345585e-05} +{"train_loss": 0.00170044950209558, "global_step": 28657, "epoch": 240, "lr": 6.587585424638423e-05} +{"train_loss": 0.0025903447531163692, "global_step": 28658, "epoch": 240, "lr": 6.587375336814204e-05} +{"train_loss": 0.005387878976762295, "global_step": 28659, "epoch": 240, "lr": 6.587165245873345e-05} +{"train_loss": 0.0020442435052245855, "global_step": 28660, "epoch": 240, "lr": 6.586955151816256e-05} +{"train_loss": 0.003988896030932665, "global_step": 28661, "epoch": 240, "lr": 6.58674505464335e-05} +{"train_loss": 0.0032717164140194654, "global_step": 28662, "epoch": 240, "lr": 6.586534954355039e-05} +{"train_loss": 0.0031511965207755566, "global_step": 28663, "epoch": 240, "lr": 6.586324850951737e-05} +{"train_loss": 0.0023538856767117977, "global_step": 28664, "epoch": 240, "lr": 6.586114744433854e-05} +{"train_loss": 0.005041824653744698, "global_step": 28665, "epoch": 240, "lr": 6.585904634801806e-05} +{"train_loss": 0.005185501184314489, "global_step": 28666, "epoch": 240, "lr": 6.585694522056004e-05} +{"train_loss": 0.0030619462486356497, "global_step": 28667, "epoch": 240, "lr": 6.585484406196859e-05} +{"train_loss": 0.003110895399004221, "global_step": 28668, "epoch": 240, "lr": 6.585274287224785e-05} +{"train_loss": 0.001936475746333599, "global_step": 28669, "epoch": 240, "lr": 6.585064165140195e-05} +{"train_loss": 0.003926414996385574, "global_step": 28670, "epoch": 240, "lr": 6.5848540399435e-05} +{"train_loss": 0.002991157118231058, "global_step": 28671, "epoch": 240, "lr": 6.584643911635113e-05} +{"train_loss": 0.002735369373112917, "global_step": 28672, "epoch": 240, "lr": 6.584433780215448e-05} +{"train_loss": 0.002875196747481823, "global_step": 28673, "epoch": 240, "lr": 6.584223645684917e-05} +{"train_loss": 0.0026986836455762386, "global_step": 28674, "epoch": 240, "lr": 6.584013508043931e-05} +{"train_loss": 0.002564770635217428, "global_step": 28675, "epoch": 240, "lr": 6.583803367292904e-05} +{"train_loss": 0.0020172400400042534, "global_step": 28676, "epoch": 240, "lr": 6.583593223432249e-05} +{"train_loss": 0.0037921930197626352, "global_step": 28677, "epoch": 240, "lr": 6.583383076462377e-05} +{"train_loss": 0.003194729598951252, "global_step": 28678, "epoch": 240, "lr": 6.583172926383701e-05, "val_loss": 0.029254572466015816, "train_action_mse_error": 4.991678724763915e-05} +{"train_loss": 0.003525525564327836, "global_step": 28679, "epoch": 241, "lr": 6.582962773196635e-05} +{"train_loss": 0.006001248024404049, "global_step": 28680, "epoch": 241, "lr": 6.58275261690159e-05} +{"train_loss": 0.002785634947940707, "global_step": 28681, "epoch": 241, "lr": 6.58254245749898e-05} +{"train_loss": 0.002311134012416005, "global_step": 28682, "epoch": 241, "lr": 6.582332294989218e-05} +{"train_loss": 0.003732645884156227, "global_step": 28683, "epoch": 241, "lr": 6.582122129372714e-05} +{"train_loss": 0.0038088310975581408, "global_step": 28684, "epoch": 241, "lr": 6.581911960649882e-05} +{"train_loss": 0.004022936802357435, "global_step": 28685, "epoch": 241, "lr": 6.581701788821136e-05} +{"train_loss": 0.0036271284334361553, "global_step": 28686, "epoch": 241, "lr": 6.581491613886886e-05} +{"train_loss": 0.003335251472890377, "global_step": 28687, "epoch": 241, "lr": 6.581281435847548e-05} +{"train_loss": 0.004602769855409861, "global_step": 28688, "epoch": 241, "lr": 6.581071254703533e-05} +{"train_loss": 0.003105674870312214, "global_step": 28689, "epoch": 241, "lr": 6.580861070455251e-05} +{"train_loss": 0.004271128214895725, "global_step": 28690, "epoch": 241, "lr": 6.580650883103118e-05} +{"train_loss": 0.004300481174141169, "global_step": 28691, "epoch": 241, "lr": 6.580440692647548e-05} +{"train_loss": 0.004343920852988958, "global_step": 28692, "epoch": 241, "lr": 6.580230499088951e-05} +{"train_loss": 0.0027530111838132143, "global_step": 28693, "epoch": 241, "lr": 6.580020302427739e-05} +{"train_loss": 0.00236203009262681, "global_step": 28694, "epoch": 241, "lr": 6.579810102664325e-05} +{"train_loss": 0.0026349991094321012, "global_step": 28695, "epoch": 241, "lr": 6.579599899799125e-05} +{"train_loss": 0.0041016205213963985, "global_step": 28696, "epoch": 241, "lr": 6.579389693832548e-05} +{"train_loss": 0.003922445233911276, "global_step": 28697, "epoch": 241, "lr": 6.579179484765008e-05} +{"train_loss": 0.0031006617937237024, "global_step": 28698, "epoch": 241, "lr": 6.578969272596917e-05} +{"train_loss": 0.004422512836754322, "global_step": 28699, "epoch": 241, "lr": 6.57875905732869e-05} +{"train_loss": 0.00531684048473835, "global_step": 28700, "epoch": 241, "lr": 6.578548838960738e-05} +{"train_loss": 0.003348809666931629, "global_step": 28701, "epoch": 241, "lr": 6.578338617493474e-05} +{"train_loss": 0.004307994619011879, "global_step": 28702, "epoch": 241, "lr": 6.57812839292731e-05} +{"train_loss": 0.0032416831236332655, "global_step": 28703, "epoch": 241, "lr": 6.577918165262662e-05} +{"train_loss": 0.0031339155975729227, "global_step": 28704, "epoch": 241, "lr": 6.577707934499938e-05} +{"train_loss": 0.004588307347148657, "global_step": 28705, "epoch": 241, "lr": 6.577497700639553e-05} +{"train_loss": 0.0030843846034258604, "global_step": 28706, "epoch": 241, "lr": 6.577287463681921e-05} +{"train_loss": 0.0028119487687945366, "global_step": 28707, "epoch": 241, "lr": 6.577077223627452e-05} +{"train_loss": 0.0038910212460905313, "global_step": 28708, "epoch": 241, "lr": 6.576866980476562e-05} +{"train_loss": 0.0031229881569743156, "global_step": 28709, "epoch": 241, "lr": 6.57665673422966e-05} +{"train_loss": 0.0035110642202198505, "global_step": 28710, "epoch": 241, "lr": 6.576446484887164e-05} +{"train_loss": 0.00319222966209054, "global_step": 28711, "epoch": 241, "lr": 6.576236232449481e-05} +{"train_loss": 0.003407885553315282, "global_step": 28712, "epoch": 241, "lr": 6.576025976917027e-05} +{"train_loss": 0.002679495606571436, "global_step": 28713, "epoch": 241, "lr": 6.575815718290214e-05} +{"train_loss": 0.0025699655525386333, "global_step": 28714, "epoch": 241, "lr": 6.575605456569456e-05} +{"train_loss": 0.002177485264837742, "global_step": 28715, "epoch": 241, "lr": 6.575395191755165e-05} +{"train_loss": 0.0024379268288612366, "global_step": 28716, "epoch": 241, "lr": 6.575184923847754e-05} +{"train_loss": 0.004812215454876423, "global_step": 28717, "epoch": 241, "lr": 6.574974652847636e-05} +{"train_loss": 0.0017694704001769423, "global_step": 28718, "epoch": 241, "lr": 6.574764378755223e-05} +{"train_loss": 0.003224140964448452, "global_step": 28719, "epoch": 241, "lr": 6.574554101570928e-05} +{"train_loss": 0.0033899606205523014, "global_step": 28720, "epoch": 241, "lr": 6.574343821295165e-05} +{"train_loss": 0.005398766603320837, "global_step": 28721, "epoch": 241, "lr": 6.574133537928346e-05} +{"train_loss": 0.0030482353176921606, "global_step": 28722, "epoch": 241, "lr": 6.573923251470886e-05} +{"train_loss": 0.005360338371247053, "global_step": 28723, "epoch": 241, "lr": 6.573712961923193e-05} +{"train_loss": 0.0026766802184283733, "global_step": 28724, "epoch": 241, "lr": 6.573502669285683e-05} +{"train_loss": 0.0032232452649623156, "global_step": 28725, "epoch": 241, "lr": 6.57329237355877e-05} +{"train_loss": 0.002685899380594492, "global_step": 28726, "epoch": 241, "lr": 6.573082074742865e-05} +{"train_loss": 0.002871300559490919, "global_step": 28727, "epoch": 241, "lr": 6.572871772838381e-05} +{"train_loss": 0.002241674344986677, "global_step": 28728, "epoch": 241, "lr": 6.57266146784573e-05} +{"train_loss": 0.0026705439668148756, "global_step": 28729, "epoch": 241, "lr": 6.572451159765328e-05} +{"train_loss": 0.0049135261215269566, "global_step": 28730, "epoch": 241, "lr": 6.572240848597584e-05} +{"train_loss": 0.004518481437116861, "global_step": 28731, "epoch": 241, "lr": 6.572030534342916e-05} +{"train_loss": 0.00299616320990026, "global_step": 28732, "epoch": 241, "lr": 6.571820217001732e-05} +{"train_loss": 0.0033669662661850452, "global_step": 28733, "epoch": 241, "lr": 6.571609896574447e-05} +{"train_loss": 0.0028643542900681496, "global_step": 28734, "epoch": 241, "lr": 6.571399573061475e-05} +{"train_loss": 0.004277829546481371, "global_step": 28735, "epoch": 241, "lr": 6.571189246463227e-05} +{"train_loss": 0.003668372519314289, "global_step": 28736, "epoch": 241, "lr": 6.570978916780118e-05} +{"train_loss": 0.0020029142033308744, "global_step": 28737, "epoch": 241, "lr": 6.570768584012559e-05} +{"train_loss": 0.0036621810868382454, "global_step": 28738, "epoch": 241, "lr": 6.570558248160963e-05} +{"train_loss": 0.002528262557461858, "global_step": 28739, "epoch": 241, "lr": 6.570347909225745e-05} +{"train_loss": 0.0037229249719530344, "global_step": 28740, "epoch": 241, "lr": 6.570137567207315e-05} +{"train_loss": 0.003486200235784054, "global_step": 28741, "epoch": 241, "lr": 6.569927222106089e-05} +{"train_loss": 0.003439519787207246, "global_step": 28742, "epoch": 241, "lr": 6.569716873922477e-05} +{"train_loss": 0.002639407990500331, "global_step": 28743, "epoch": 241, "lr": 6.569506522656897e-05} +{"train_loss": 0.00294362660497427, "global_step": 28744, "epoch": 241, "lr": 6.569296168309756e-05} +{"train_loss": 0.003491561394184828, "global_step": 28745, "epoch": 241, "lr": 6.56908581088147e-05} +{"train_loss": 0.0036288502160459757, "global_step": 28746, "epoch": 241, "lr": 6.56887545037245e-05} +{"train_loss": 0.0029199239797890186, "global_step": 28747, "epoch": 241, "lr": 6.568665086783113e-05} +{"train_loss": 0.004948383662849665, "global_step": 28748, "epoch": 241, "lr": 6.568454720113868e-05} +{"train_loss": 0.005156783387064934, "global_step": 28749, "epoch": 241, "lr": 6.568244350365131e-05} +{"train_loss": 0.003097672713920474, "global_step": 28750, "epoch": 241, "lr": 6.568033977537313e-05} +{"train_loss": 0.0026160581037402153, "global_step": 28751, "epoch": 241, "lr": 6.567823601630828e-05} +{"train_loss": 0.004061517771333456, "global_step": 28752, "epoch": 241, "lr": 6.56761322264609e-05} +{"train_loss": 0.004026109352707863, "global_step": 28753, "epoch": 241, "lr": 6.567402840583509e-05} +{"train_loss": 0.002869986230507493, "global_step": 28754, "epoch": 241, "lr": 6.567192455443502e-05} +{"train_loss": 0.0029351997654885054, "global_step": 28755, "epoch": 241, "lr": 6.566982067226479e-05} +{"train_loss": 0.004910025279968977, "global_step": 28756, "epoch": 241, "lr": 6.566771675932853e-05} +{"train_loss": 0.0018653610022738576, "global_step": 28757, "epoch": 241, "lr": 6.56656128156304e-05} +{"train_loss": 0.004349920433014631, "global_step": 28758, "epoch": 241, "lr": 6.56635088411745e-05} +{"train_loss": 0.0038809222169220448, "global_step": 28759, "epoch": 241, "lr": 6.5661404835965e-05} +{"train_loss": 0.006225700955837965, "global_step": 28760, "epoch": 241, "lr": 6.565930080000597e-05} +{"train_loss": 0.0019810243975371122, "global_step": 28761, "epoch": 241, "lr": 6.565719673330159e-05} +{"train_loss": 0.004422762431204319, "global_step": 28762, "epoch": 241, "lr": 6.565509263585597e-05} +{"train_loss": 0.003984612412750721, "global_step": 28763, "epoch": 241, "lr": 6.565298850767325e-05} +{"train_loss": 0.004626359324902296, "global_step": 28764, "epoch": 241, "lr": 6.565088434875756e-05} +{"train_loss": 0.0027674518059939146, "global_step": 28765, "epoch": 241, "lr": 6.564878015911304e-05} +{"train_loss": 0.002993498696014285, "global_step": 28766, "epoch": 241, "lr": 6.564667593874383e-05} +{"train_loss": 0.0026336985174566507, "global_step": 28767, "epoch": 241, "lr": 6.564457168765401e-05} +{"train_loss": 0.0028671338222920895, "global_step": 28768, "epoch": 241, "lr": 6.564246740584776e-05} +{"train_loss": 0.0030869159381836653, "global_step": 28769, "epoch": 241, "lr": 6.56403630933292e-05} +{"train_loss": 0.003306681988760829, "global_step": 28770, "epoch": 241, "lr": 6.563825875010244e-05} +{"train_loss": 0.00399779761210084, "global_step": 28771, "epoch": 241, "lr": 6.563615437617163e-05} +{"train_loss": 0.004120491910725832, "global_step": 28772, "epoch": 241, "lr": 6.563404997154092e-05} +{"train_loss": 0.0024274876341223717, "global_step": 28773, "epoch": 241, "lr": 6.563194553621442e-05} +{"train_loss": 0.0046957870945334435, "global_step": 28774, "epoch": 241, "lr": 6.562984107019625e-05} +{"train_loss": 0.0024484482128173113, "global_step": 28775, "epoch": 241, "lr": 6.562773657349057e-05} +{"train_loss": 0.003781391540542245, "global_step": 28776, "epoch": 241, "lr": 6.562563204610149e-05} +{"train_loss": 0.0017841296503320336, "global_step": 28777, "epoch": 241, "lr": 6.562352748803317e-05} +{"train_loss": 0.005299034062772989, "global_step": 28778, "epoch": 241, "lr": 6.56214228992897e-05} +{"train_loss": 0.0038770034443587065, "global_step": 28779, "epoch": 241, "lr": 6.561931827987524e-05} +{"train_loss": 0.0020282079931348562, "global_step": 28780, "epoch": 241, "lr": 6.561721362979391e-05} +{"train_loss": 0.004754634574055672, "global_step": 28781, "epoch": 241, "lr": 6.561510894904987e-05} +{"train_loss": 0.0025416810531169176, "global_step": 28782, "epoch": 241, "lr": 6.561300423764723e-05} +{"train_loss": 0.002930379007011652, "global_step": 28783, "epoch": 241, "lr": 6.56108994955901e-05} +{"train_loss": 0.0017150138737633824, "global_step": 28784, "epoch": 241, "lr": 6.560879472288266e-05} +{"train_loss": 0.003925363998860121, "global_step": 28785, "epoch": 241, "lr": 6.560668991952901e-05} +{"train_loss": 0.004804497584700584, "global_step": 28786, "epoch": 241, "lr": 6.56045850855333e-05} +{"train_loss": 0.002723597688600421, "global_step": 28787, "epoch": 241, "lr": 6.560248022089965e-05} +{"train_loss": 0.0045735700987279415, "global_step": 28788, "epoch": 241, "lr": 6.56003753256322e-05} +{"train_loss": 0.007368098944425583, "global_step": 28789, "epoch": 241, "lr": 6.559827039973508e-05} +{"train_loss": 0.002765137003734708, "global_step": 28790, "epoch": 241, "lr": 6.559616544321241e-05} +{"train_loss": 0.004887932445853949, "global_step": 28791, "epoch": 241, "lr": 6.559406045606836e-05} +{"train_loss": 0.0035093901678919792, "global_step": 28792, "epoch": 241, "lr": 6.5591955438307e-05} +{"train_loss": 0.002735597314313054, "global_step": 28793, "epoch": 241, "lr": 6.558985038993253e-05} +{"train_loss": 0.0024323395919054747, "global_step": 28794, "epoch": 241, "lr": 6.558774531094905e-05} +{"train_loss": 0.005248825531452894, "global_step": 28795, "epoch": 241, "lr": 6.558564020136069e-05} +{"train_loss": 0.0034323320724070072, "global_step": 28796, "epoch": 241, "lr": 6.558353506117157e-05} +{"train_loss": 0.0035318822830821537, "global_step": 28797, "epoch": 241, "lr": 6.558142989038588e-05, "val_loss": 0.01874089427292347} +{"train_loss": 0.00456836074590683, "global_step": 28798, "epoch": 242, "lr": 6.557932468900771e-05} +{"train_loss": 0.0028958411421626806, "global_step": 28799, "epoch": 242, "lr": 6.557721945704119e-05} +{"train_loss": 0.0027848973404616117, "global_step": 28800, "epoch": 242, "lr": 6.557511419449047e-05} +{"train_loss": 0.005624269135296345, "global_step": 28801, "epoch": 242, "lr": 6.557300890135967e-05} +{"train_loss": 0.0029303627088665962, "global_step": 28802, "epoch": 242, "lr": 6.557090357765294e-05} +{"train_loss": 0.001968994038179517, "global_step": 28803, "epoch": 242, "lr": 6.556879822337441e-05} +{"train_loss": 0.004452347289770842, "global_step": 28804, "epoch": 242, "lr": 6.556669283852821e-05} +{"train_loss": 0.004172555170953274, "global_step": 28805, "epoch": 242, "lr": 6.556458742311845e-05} +{"train_loss": 0.005643086042255163, "global_step": 28806, "epoch": 242, "lr": 6.556248197714929e-05} +{"train_loss": 0.004147533793002367, "global_step": 28807, "epoch": 242, "lr": 6.556037650062488e-05} +{"train_loss": 0.003026999067515135, "global_step": 28808, "epoch": 242, "lr": 6.555827099354931e-05} +{"train_loss": 0.0033402955159544945, "global_step": 28809, "epoch": 242, "lr": 6.555616545592674e-05} +{"train_loss": 0.0027337123174220324, "global_step": 28810, "epoch": 242, "lr": 6.555405988776131e-05} +{"train_loss": 0.0029839815106242895, "global_step": 28811, "epoch": 242, "lr": 6.555195428905714e-05} +{"train_loss": 0.004923748318105936, "global_step": 28812, "epoch": 242, "lr": 6.554984865981837e-05} +{"train_loss": 0.0030205450020730495, "global_step": 28813, "epoch": 242, "lr": 6.554774300004913e-05} +{"train_loss": 0.00373080070130527, "global_step": 28814, "epoch": 242, "lr": 6.554563730975356e-05} +{"train_loss": 0.0025733651127666235, "global_step": 28815, "epoch": 242, "lr": 6.55435315889358e-05} +{"train_loss": 0.004485366865992546, "global_step": 28816, "epoch": 242, "lr": 6.554142583759999e-05} +{"train_loss": 0.0024640560150146484, "global_step": 28817, "epoch": 242, "lr": 6.553932005575024e-05} +{"train_loss": 0.0039488947950303555, "global_step": 28818, "epoch": 242, "lr": 6.553721424339068e-05} +{"train_loss": 0.002274143975228071, "global_step": 28819, "epoch": 242, "lr": 6.553510840052546e-05} +{"train_loss": 0.0031840249430388212, "global_step": 28820, "epoch": 242, "lr": 6.553300252715871e-05} +{"train_loss": 0.0038457673508673906, "global_step": 28821, "epoch": 242, "lr": 6.553089662329458e-05} +{"train_loss": 0.004638399463146925, "global_step": 28822, "epoch": 242, "lr": 6.55287906889372e-05} +{"train_loss": 0.0022185209672898054, "global_step": 28823, "epoch": 242, "lr": 6.55266847240907e-05} +{"train_loss": 0.002849767915904522, "global_step": 28824, "epoch": 242, "lr": 6.55245787287592e-05} +{"train_loss": 0.003996893763542175, "global_step": 28825, "epoch": 242, "lr": 6.552247270294685e-05} +{"train_loss": 0.003144723130390048, "global_step": 28826, "epoch": 242, "lr": 6.552036664665779e-05} +{"train_loss": 0.005333693698048592, "global_step": 28827, "epoch": 242, "lr": 6.551826055989613e-05} +{"train_loss": 0.0019412669353187084, "global_step": 28828, "epoch": 242, "lr": 6.551615444266605e-05} +{"train_loss": 0.006009533070027828, "global_step": 28829, "epoch": 242, "lr": 6.551404829497166e-05} +{"train_loss": 0.00218849815428257, "global_step": 28830, "epoch": 242, "lr": 6.551194211681706e-05} +{"train_loss": 0.0038551476318389177, "global_step": 28831, "epoch": 242, "lr": 6.550983590820644e-05} +{"train_loss": 0.003256309311836958, "global_step": 28832, "epoch": 242, "lr": 6.550772966914391e-05} +{"train_loss": 0.0037698894739151, "global_step": 28833, "epoch": 242, "lr": 6.550562339963362e-05} +{"train_loss": 0.0041250078938901424, "global_step": 28834, "epoch": 242, "lr": 6.550351709967968e-05} +{"train_loss": 0.004146988969296217, "global_step": 28835, "epoch": 242, "lr": 6.550141076928627e-05} +{"train_loss": 0.0024882603902369738, "global_step": 28836, "epoch": 242, "lr": 6.549930440845746e-05} +{"train_loss": 0.004463370889425278, "global_step": 28837, "epoch": 242, "lr": 6.549719801719745e-05} +{"train_loss": 0.004064637701958418, "global_step": 28838, "epoch": 242, "lr": 6.549509159551033e-05} +{"train_loss": 0.0042400844395160675, "global_step": 28839, "epoch": 242, "lr": 6.549298514340025e-05} +{"train_loss": 0.0030754434410482645, "global_step": 28840, "epoch": 242, "lr": 6.549087866087135e-05} +{"train_loss": 0.0028824913315474987, "global_step": 28841, "epoch": 242, "lr": 6.548877214792778e-05} +{"train_loss": 0.002968470798805356, "global_step": 28842, "epoch": 242, "lr": 6.548666560457364e-05} +{"train_loss": 0.004139383789151907, "global_step": 28843, "epoch": 242, "lr": 6.548455903081311e-05} +{"train_loss": 0.003611334366723895, "global_step": 28844, "epoch": 242, "lr": 6.548245242665028e-05} +{"train_loss": 0.0036245069932192564, "global_step": 28845, "epoch": 242, "lr": 6.548034579208932e-05} +{"train_loss": 0.004183143377304077, "global_step": 28846, "epoch": 242, "lr": 6.547823912713434e-05} +{"train_loss": 0.004490709863603115, "global_step": 28847, "epoch": 242, "lr": 6.54761324317895e-05} +{"train_loss": 0.0029745420906692743, "global_step": 28848, "epoch": 242, "lr": 6.547402570605895e-05} +{"train_loss": 0.004208666272461414, "global_step": 28849, "epoch": 242, "lr": 6.547191894994679e-05} +{"train_loss": 0.003426177892833948, "global_step": 28850, "epoch": 242, "lr": 6.546981216345715e-05} +{"train_loss": 0.0035614888183772564, "global_step": 28851, "epoch": 242, "lr": 6.546770534659422e-05} +{"train_loss": 0.005609411280602217, "global_step": 28852, "epoch": 242, "lr": 6.546559849936207e-05} +{"train_loss": 0.0026199137791991234, "global_step": 28853, "epoch": 242, "lr": 6.546349162176488e-05} +{"train_loss": 0.003756479825824499, "global_step": 28854, "epoch": 242, "lr": 6.54613847138068e-05} +{"train_loss": 0.00346805970184505, "global_step": 28855, "epoch": 242, "lr": 6.545927777549192e-05} +{"train_loss": 0.0036449034232646227, "global_step": 28856, "epoch": 242, "lr": 6.545717080682441e-05} +{"train_loss": 0.0035839497577399015, "global_step": 28857, "epoch": 242, "lr": 6.545506380780838e-05} +{"train_loss": 0.003668883815407753, "global_step": 28858, "epoch": 242, "lr": 6.5452956778448e-05} +{"train_loss": 0.0038060685619711876, "global_step": 28859, "epoch": 242, "lr": 6.545084971874738e-05} +{"train_loss": 0.002122282749041915, "global_step": 28860, "epoch": 242, "lr": 6.544874262871067e-05} +{"train_loss": 0.006702991668134928, "global_step": 28861, "epoch": 242, "lr": 6.5446635508342e-05} +{"train_loss": 0.005939883179962635, "global_step": 28862, "epoch": 242, "lr": 6.544452835764552e-05} +{"train_loss": 0.0019037823658436537, "global_step": 28863, "epoch": 242, "lr": 6.544242117662536e-05} +{"train_loss": 0.0045655034482479095, "global_step": 28864, "epoch": 242, "lr": 6.544031396528564e-05} +{"train_loss": 0.004243845585733652, "global_step": 28865, "epoch": 242, "lr": 6.543820672363053e-05} +{"train_loss": 0.003802779596298933, "global_step": 28866, "epoch": 242, "lr": 6.543609945166415e-05} +{"train_loss": 0.002163517754524946, "global_step": 28867, "epoch": 242, "lr": 6.543399214939063e-05} +{"train_loss": 0.003225405002012849, "global_step": 28868, "epoch": 242, "lr": 6.543188481681411e-05} +{"train_loss": 0.004781248979270458, "global_step": 28869, "epoch": 242, "lr": 6.542977745393875e-05} +{"train_loss": 0.0032271957024931908, "global_step": 28870, "epoch": 242, "lr": 6.542767006076865e-05} +{"train_loss": 0.004041585605591536, "global_step": 28871, "epoch": 242, "lr": 6.542556263730798e-05} +{"train_loss": 0.003367395605891943, "global_step": 28872, "epoch": 242, "lr": 6.542345518356086e-05} +{"train_loss": 0.0035574017092585564, "global_step": 28873, "epoch": 242, "lr": 6.542134769953145e-05} +{"train_loss": 0.0025574618484824896, "global_step": 28874, "epoch": 242, "lr": 6.541924018522386e-05} +{"train_loss": 0.004463423974812031, "global_step": 28875, "epoch": 242, "lr": 6.541713264064224e-05} +{"train_loss": 0.0025159926153719425, "global_step": 28876, "epoch": 242, "lr": 6.541502506579072e-05} +{"train_loss": 0.0022450739052146673, "global_step": 28877, "epoch": 242, "lr": 6.541291746067345e-05} +{"train_loss": 0.0038248535711318254, "global_step": 28878, "epoch": 242, "lr": 6.541080982529458e-05} +{"train_loss": 0.005087274592369795, "global_step": 28879, "epoch": 242, "lr": 6.54087021596582e-05} +{"train_loss": 0.0028264496941119432, "global_step": 28880, "epoch": 242, "lr": 6.540659446376848e-05} +{"train_loss": 0.00457102432847023, "global_step": 28881, "epoch": 242, "lr": 6.540448673762958e-05} +{"train_loss": 0.0038652531802654266, "global_step": 28882, "epoch": 242, "lr": 6.540237898124562e-05} +{"train_loss": 0.003636940848082304, "global_step": 28883, "epoch": 242, "lr": 6.54002711946207e-05} +{"train_loss": 0.0039504836313426495, "global_step": 28884, "epoch": 242, "lr": 6.539816337775903e-05} +{"train_loss": 0.0032189139164984226, "global_step": 28885, "epoch": 242, "lr": 6.53960555306647e-05} +{"train_loss": 0.0036794128827750683, "global_step": 28886, "epoch": 242, "lr": 6.539394765334185e-05} +{"train_loss": 0.0021303414832800627, "global_step": 28887, "epoch": 242, "lr": 6.539183974579465e-05} +{"train_loss": 0.0023696525022387505, "global_step": 28888, "epoch": 242, "lr": 6.53897318080272e-05} +{"train_loss": 0.0024522715248167515, "global_step": 28889, "epoch": 242, "lr": 6.538762384004366e-05} +{"train_loss": 0.0019862200133502483, "global_step": 28890, "epoch": 242, "lr": 6.538551584184816e-05} +{"train_loss": 0.00224791606888175, "global_step": 28891, "epoch": 242, "lr": 6.538340781344485e-05} +{"train_loss": 0.002641150029376149, "global_step": 28892, "epoch": 242, "lr": 6.538129975483786e-05} +{"train_loss": 0.004530585370957851, "global_step": 28893, "epoch": 242, "lr": 6.537919166603132e-05} +{"train_loss": 0.004042717162519693, "global_step": 28894, "epoch": 242, "lr": 6.537708354702938e-05} +{"train_loss": 0.0025308055337518454, "global_step": 28895, "epoch": 242, "lr": 6.537497539783619e-05} +{"train_loss": 0.004769842140376568, "global_step": 28896, "epoch": 242, "lr": 6.537286721845588e-05} +{"train_loss": 0.0036645710933953524, "global_step": 28897, "epoch": 242, "lr": 6.537075900889258e-05} +{"train_loss": 0.0021926916670054197, "global_step": 28898, "epoch": 242, "lr": 6.536865076915046e-05} +{"train_loss": 0.00371735286898911, "global_step": 28899, "epoch": 242, "lr": 6.53665424992336e-05} +{"train_loss": 0.0018467010231688619, "global_step": 28900, "epoch": 242, "lr": 6.53644341991462e-05} +{"train_loss": 0.0024460768327116966, "global_step": 28901, "epoch": 242, "lr": 6.536232586889236e-05} +{"train_loss": 0.004281207453459501, "global_step": 28902, "epoch": 242, "lr": 6.536021750847625e-05} +{"train_loss": 0.0029637895058840513, "global_step": 28903, "epoch": 242, "lr": 6.535810911790199e-05} +{"train_loss": 0.002456571441143751, "global_step": 28904, "epoch": 242, "lr": 6.535600069717373e-05} +{"train_loss": 0.0038588072638958693, "global_step": 28905, "epoch": 242, "lr": 6.535389224629557e-05} +{"train_loss": 0.0025023415219038725, "global_step": 28906, "epoch": 242, "lr": 6.535178376527172e-05} +{"train_loss": 0.004631929099559784, "global_step": 28907, "epoch": 242, "lr": 6.534967525410627e-05} +{"train_loss": 0.00230157608166337, "global_step": 28908, "epoch": 242, "lr": 6.534756671280336e-05} +{"train_loss": 0.0017555620288476348, "global_step": 28909, "epoch": 242, "lr": 6.534545814136716e-05} +{"train_loss": 0.004235313273966312, "global_step": 28910, "epoch": 242, "lr": 6.53433495398018e-05} +{"train_loss": 0.002886299742385745, "global_step": 28911, "epoch": 242, "lr": 6.534124090811138e-05} +{"train_loss": 0.003878324758261442, "global_step": 28912, "epoch": 242, "lr": 6.53391322463001e-05} +{"train_loss": 0.001643077819608152, "global_step": 28913, "epoch": 242, "lr": 6.533702355437205e-05} +{"train_loss": 0.005140576511621475, "global_step": 28914, "epoch": 242, "lr": 6.533491483233141e-05} +{"train_loss": 0.001722444430924952, "global_step": 28915, "epoch": 242, "lr": 6.53328060801823e-05} +{"train_loss": 0.0035049313143240054, "global_step": 28916, "epoch": 242, "lr": 6.533069729792886e-05, "val_loss": 0.02389502339065075} +{"train_loss": 0.0023150923661887646, "global_step": 28917, "epoch": 243, "lr": 6.532858848557523e-05} +{"train_loss": 0.0036291603464633226, "global_step": 28918, "epoch": 243, "lr": 6.532647964312557e-05} +{"train_loss": 0.00453395489603281, "global_step": 28919, "epoch": 243, "lr": 6.5324370770584e-05} +{"train_loss": 0.002374885370954871, "global_step": 28920, "epoch": 243, "lr": 6.532226186795464e-05} +{"train_loss": 0.0014126930618658662, "global_step": 28921, "epoch": 243, "lr": 6.532015293524169e-05} +{"train_loss": 0.0028342308942228556, "global_step": 28922, "epoch": 243, "lr": 6.531804397244924e-05} +{"train_loss": 0.0032086516730487347, "global_step": 28923, "epoch": 243, "lr": 6.531593497958146e-05} +{"train_loss": 0.002631501294672489, "global_step": 28924, "epoch": 243, "lr": 6.531382595664247e-05} +{"train_loss": 0.005441846791654825, "global_step": 28925, "epoch": 243, "lr": 6.531171690363642e-05} +{"train_loss": 0.0026197878178209066, "global_step": 28926, "epoch": 243, "lr": 6.530960782056743e-05} +{"train_loss": 0.0031855786219239235, "global_step": 28927, "epoch": 243, "lr": 6.530749870743969e-05} +{"train_loss": 0.005246096756309271, "global_step": 28928, "epoch": 243, "lr": 6.530538956425729e-05} +{"train_loss": 0.003182233078405261, "global_step": 28929, "epoch": 243, "lr": 6.53032803910244e-05} +{"train_loss": 0.0026924607809633017, "global_step": 28930, "epoch": 243, "lr": 6.530117118774515e-05} +{"train_loss": 0.00281707476824522, "global_step": 28931, "epoch": 243, "lr": 6.529906195442369e-05} +{"train_loss": 0.003478608326986432, "global_step": 28932, "epoch": 243, "lr": 6.529695269106415e-05} +{"train_loss": 0.0029937331564724445, "global_step": 28933, "epoch": 243, "lr": 6.529484339767069e-05} +{"train_loss": 0.0034696634393185377, "global_step": 28934, "epoch": 243, "lr": 6.529273407424743e-05} +{"train_loss": 0.0027923001907765865, "global_step": 28935, "epoch": 243, "lr": 6.529062472079854e-05} +{"train_loss": 0.003467777045443654, "global_step": 28936, "epoch": 243, "lr": 6.528851533732811e-05} +{"train_loss": 0.0036259214393794537, "global_step": 28937, "epoch": 243, "lr": 6.528640592384033e-05} +{"train_loss": 0.0032452356535941362, "global_step": 28938, "epoch": 243, "lr": 6.528429648033932e-05} +{"train_loss": 0.003383275354281068, "global_step": 28939, "epoch": 243, "lr": 6.528218700682923e-05} +{"train_loss": 0.0037245964631438255, "global_step": 28940, "epoch": 243, "lr": 6.52800775033142e-05} +{"train_loss": 0.004533539991825819, "global_step": 28941, "epoch": 243, "lr": 6.527796796979837e-05} +{"train_loss": 0.0029458526987582445, "global_step": 28942, "epoch": 243, "lr": 6.527585840628587e-05} +{"train_loss": 0.00434379605576396, "global_step": 28943, "epoch": 243, "lr": 6.527374881278086e-05} +{"train_loss": 0.0045255073346197605, "global_step": 28944, "epoch": 243, "lr": 6.52716391892875e-05} +{"train_loss": 0.00276713608764112, "global_step": 28945, "epoch": 243, "lr": 6.526952953580988e-05} +{"train_loss": 0.0025539507623761892, "global_step": 28946, "epoch": 243, "lr": 6.526741985235217e-05} +{"train_loss": 0.0028246110305190086, "global_step": 28947, "epoch": 243, "lr": 6.526531013891853e-05} +{"train_loss": 0.0063503398559987545, "global_step": 28948, "epoch": 243, "lr": 6.526320039551308e-05} +{"train_loss": 0.00507480651140213, "global_step": 28949, "epoch": 243, "lr": 6.526109062213997e-05} +{"train_loss": 0.00273579522036016, "global_step": 28950, "epoch": 243, "lr": 6.525898081880332e-05} +{"train_loss": 0.003905786667019129, "global_step": 28951, "epoch": 243, "lr": 6.52568709855073e-05} +{"train_loss": 0.004128719680011272, "global_step": 28952, "epoch": 243, "lr": 6.525476112225605e-05} +{"train_loss": 0.0032862548250705004, "global_step": 28953, "epoch": 243, "lr": 6.52526512290537e-05} +{"train_loss": 0.0033419232349842787, "global_step": 28954, "epoch": 243, "lr": 6.525054130590441e-05} +{"train_loss": 0.0019298141123726964, "global_step": 28955, "epoch": 243, "lr": 6.52484313528123e-05} +{"train_loss": 0.0026915634516626596, "global_step": 28956, "epoch": 243, "lr": 6.524632136978153e-05} +{"train_loss": 0.003801332088187337, "global_step": 28957, "epoch": 243, "lr": 6.524421135681623e-05} +{"train_loss": 0.002918417565524578, "global_step": 28958, "epoch": 243, "lr": 6.524210131392056e-05} +{"train_loss": 0.0034061064943671227, "global_step": 28959, "epoch": 243, "lr": 6.523999124109865e-05} +{"train_loss": 0.0038716632407158613, "global_step": 28960, "epoch": 243, "lr": 6.523788113835463e-05} +{"train_loss": 0.00288475607521832, "global_step": 28961, "epoch": 243, "lr": 6.523577100569268e-05} +{"train_loss": 0.0035208268091082573, "global_step": 28962, "epoch": 243, "lr": 6.52336608431169e-05} +{"train_loss": 0.004448172636330128, "global_step": 28963, "epoch": 243, "lr": 6.523155065063147e-05} +{"train_loss": 0.0030979022849351168, "global_step": 28964, "epoch": 243, "lr": 6.52294404282405e-05} +{"train_loss": 0.003941700793802738, "global_step": 28965, "epoch": 243, "lr": 6.522733017594816e-05} +{"train_loss": 0.0034495024010539055, "global_step": 28966, "epoch": 243, "lr": 6.52252198937586e-05} +{"train_loss": 0.005063438788056374, "global_step": 28967, "epoch": 243, "lr": 6.522310958167594e-05} +{"train_loss": 0.002928773406893015, "global_step": 28968, "epoch": 243, "lr": 6.522099923970433e-05} +{"train_loss": 0.003089319448918104, "global_step": 28969, "epoch": 243, "lr": 6.521888886784791e-05} +{"train_loss": 0.004903140012174845, "global_step": 28970, "epoch": 243, "lr": 6.521677846611082e-05} +{"train_loss": 0.004203637596219778, "global_step": 28971, "epoch": 243, "lr": 6.521466803449722e-05} +{"train_loss": 0.003811202012002468, "global_step": 28972, "epoch": 243, "lr": 6.521255757301124e-05} +{"train_loss": 0.004160098731517792, "global_step": 28973, "epoch": 243, "lr": 6.521044708165704e-05} +{"train_loss": 0.0038254987448453903, "global_step": 28974, "epoch": 243, "lr": 6.520833656043874e-05} +{"train_loss": 0.0026726529467850924, "global_step": 28975, "epoch": 243, "lr": 6.52062260093605e-05} +{"train_loss": 0.0031365184113383293, "global_step": 28976, "epoch": 243, "lr": 6.520411542842646e-05} +{"train_loss": 0.0037444650661200285, "global_step": 28977, "epoch": 243, "lr": 6.520200481764076e-05} +{"train_loss": 0.0033624584320932627, "global_step": 28978, "epoch": 243, "lr": 6.519989417700754e-05} +{"train_loss": 0.004460684955120087, "global_step": 28979, "epoch": 243, "lr": 6.519778350653097e-05} +{"train_loss": 0.0018858881667256355, "global_step": 28980, "epoch": 243, "lr": 6.519567280621517e-05} +{"train_loss": 0.00285468902438879, "global_step": 28981, "epoch": 243, "lr": 6.519356207606428e-05} +{"train_loss": 0.0047175767831504345, "global_step": 28982, "epoch": 243, "lr": 6.519145131608247e-05} +{"train_loss": 0.0021816687658429146, "global_step": 28983, "epoch": 243, "lr": 6.518934052627386e-05} +{"train_loss": 0.0035931640304625034, "global_step": 28984, "epoch": 243, "lr": 6.51872297066426e-05} +{"train_loss": 0.00505642406642437, "global_step": 28985, "epoch": 243, "lr": 6.518511885719285e-05} +{"train_loss": 0.003191846888512373, "global_step": 28986, "epoch": 243, "lr": 6.518300797792872e-05} +{"train_loss": 0.0032270716037601233, "global_step": 28987, "epoch": 243, "lr": 6.518089706885439e-05} +{"train_loss": 0.004160863813012838, "global_step": 28988, "epoch": 243, "lr": 6.517878612997399e-05} +{"train_loss": 0.0033926914911717176, "global_step": 28989, "epoch": 243, "lr": 6.517667516129166e-05} +{"train_loss": 0.0032974116038531065, "global_step": 28990, "epoch": 243, "lr": 6.517456416281156e-05} +{"train_loss": 0.003959344234317541, "global_step": 28991, "epoch": 243, "lr": 6.517245313453782e-05} +{"train_loss": 0.0026431595906615257, "global_step": 28992, "epoch": 243, "lr": 6.517034207647458e-05} +{"train_loss": 0.002530336380004883, "global_step": 28993, "epoch": 243, "lr": 6.516823098862598e-05} +{"train_loss": 0.0029535265639424324, "global_step": 28994, "epoch": 243, "lr": 6.51661198709962e-05} +{"train_loss": 0.002906707813963294, "global_step": 28995, "epoch": 243, "lr": 6.516400872358937e-05} +{"train_loss": 0.002884502988308668, "global_step": 28996, "epoch": 243, "lr": 6.516189754640963e-05} +{"train_loss": 0.002090456895530224, "global_step": 28997, "epoch": 243, "lr": 6.515978633946112e-05} +{"train_loss": 0.0030179903842508793, "global_step": 28998, "epoch": 243, "lr": 6.515767510274798e-05} +{"train_loss": 0.004011965356767178, "global_step": 28999, "epoch": 243, "lr": 6.515556383627436e-05} +{"train_loss": 0.0022225864231586456, "global_step": 29000, "epoch": 243, "lr": 6.515345254004444e-05} +{"train_loss": 0.0026812581345438957, "global_step": 29001, "epoch": 243, "lr": 6.51513412140623e-05} +{"train_loss": 0.003094958607107401, "global_step": 29002, "epoch": 243, "lr": 6.514922985833214e-05} +{"train_loss": 0.0029292996041476727, "global_step": 29003, "epoch": 243, "lr": 6.514711847285808e-05} +{"train_loss": 0.0038006040267646313, "global_step": 29004, "epoch": 243, "lr": 6.514500705764428e-05} +{"train_loss": 0.002890549832955003, "global_step": 29005, "epoch": 243, "lr": 6.514289561269487e-05} +{"train_loss": 0.0021246219985187054, "global_step": 29006, "epoch": 243, "lr": 6.514078413801399e-05} +{"train_loss": 0.004008417017757893, "global_step": 29007, "epoch": 243, "lr": 6.51386726336058e-05} +{"train_loss": 0.002244718372821808, "global_step": 29008, "epoch": 243, "lr": 6.513656109947445e-05} +{"train_loss": 0.0036526035983115435, "global_step": 29009, "epoch": 243, "lr": 6.513444953562409e-05} +{"train_loss": 0.002742969198152423, "global_step": 29010, "epoch": 243, "lr": 6.513233794205884e-05} +{"train_loss": 0.003239384386688471, "global_step": 29011, "epoch": 243, "lr": 6.513022631878286e-05} +{"train_loss": 0.002860863460227847, "global_step": 29012, "epoch": 243, "lr": 6.512811466580031e-05} +{"train_loss": 0.002786911092698574, "global_step": 29013, "epoch": 243, "lr": 6.512600298311531e-05} +{"train_loss": 0.0022608160506933928, "global_step": 29014, "epoch": 243, "lr": 6.512389127073203e-05} +{"train_loss": 0.0050169178284704685, "global_step": 29015, "epoch": 243, "lr": 6.512177952865459e-05} +{"train_loss": 0.002617441350594163, "global_step": 29016, "epoch": 243, "lr": 6.511966775688718e-05} +{"train_loss": 0.0036196429282426834, "global_step": 29017, "epoch": 243, "lr": 6.511755595543389e-05} +{"train_loss": 0.0030789142474532127, "global_step": 29018, "epoch": 243, "lr": 6.51154441242989e-05} +{"train_loss": 0.0029266872443258762, "global_step": 29019, "epoch": 243, "lr": 6.511333226348638e-05} +{"train_loss": 0.002389871748164296, "global_step": 29020, "epoch": 243, "lr": 6.51112203730004e-05} +{"train_loss": 0.0014429239090532064, "global_step": 29021, "epoch": 243, "lr": 6.510910845284518e-05} +{"train_loss": 0.0024829437024891376, "global_step": 29022, "epoch": 243, "lr": 6.510699650302483e-05} +{"train_loss": 0.0048287189565598965, "global_step": 29023, "epoch": 243, "lr": 6.510488452354353e-05} +{"train_loss": 0.0025266571901738644, "global_step": 29024, "epoch": 243, "lr": 6.510277251440538e-05} +{"train_loss": 0.0019694555085152388, "global_step": 29025, "epoch": 243, "lr": 6.510066047561455e-05} +{"train_loss": 0.0025998109485954046, "global_step": 29026, "epoch": 243, "lr": 6.509854840717517e-05} +{"train_loss": 0.004453168250620365, "global_step": 29027, "epoch": 243, "lr": 6.509643630909142e-05} +{"train_loss": 0.0035015761386603117, "global_step": 29028, "epoch": 243, "lr": 6.509432418136744e-05} +{"train_loss": 0.0025397674180567265, "global_step": 29029, "epoch": 243, "lr": 6.509221202400737e-05} +{"train_loss": 0.004076065961271524, "global_step": 29030, "epoch": 243, "lr": 6.509009983701534e-05} +{"train_loss": 0.0029871275182813406, "global_step": 29031, "epoch": 243, "lr": 6.508798762039552e-05} +{"train_loss": 0.0031069854740053415, "global_step": 29032, "epoch": 243, "lr": 6.508587537415204e-05} +{"train_loss": 0.002108832122758031, "global_step": 29033, "epoch": 243, "lr": 6.508376309828905e-05} +{"train_loss": 0.0025857407599687576, "global_step": 29034, "epoch": 243, "lr": 6.508165079281072e-05} +{"train_loss": 0.003302910889522368, "global_step": 29035, "epoch": 243, "lr": 6.507953845772116e-05, "val_loss": 0.008597790263593197} +{"train_loss": 0.0024038185365498066, "global_step": 29036, "epoch": 244, "lr": 6.507742609302457e-05} +{"train_loss": 0.0018462821608409286, "global_step": 29037, "epoch": 244, "lr": 6.507531369872503e-05} +{"train_loss": 0.0031166309490799904, "global_step": 29038, "epoch": 244, "lr": 6.507320127482674e-05} +{"train_loss": 0.0019047579262405634, "global_step": 29039, "epoch": 244, "lr": 6.507108882133382e-05} +{"train_loss": 0.0021215309388935566, "global_step": 29040, "epoch": 244, "lr": 6.506897633825045e-05} +{"train_loss": 0.0033224907238036394, "global_step": 29041, "epoch": 244, "lr": 6.506686382558073e-05} +{"train_loss": 0.0025407865177839994, "global_step": 29042, "epoch": 244, "lr": 6.506475128332883e-05} +{"train_loss": 0.0022189421579241753, "global_step": 29043, "epoch": 244, "lr": 6.506263871149891e-05} +{"train_loss": 0.00499688321724534, "global_step": 29044, "epoch": 244, "lr": 6.506052611009511e-05} +{"train_loss": 0.001308977953158319, "global_step": 29045, "epoch": 244, "lr": 6.505841347912157e-05} +{"train_loss": 0.003867749823257327, "global_step": 29046, "epoch": 244, "lr": 6.505630081858245e-05} +{"train_loss": 0.003358866088092327, "global_step": 29047, "epoch": 244, "lr": 6.505418812848189e-05} +{"train_loss": 0.002378650475293398, "global_step": 29048, "epoch": 244, "lr": 6.505207540882404e-05} +{"train_loss": 0.0035287323407828808, "global_step": 29049, "epoch": 244, "lr": 6.504996265961306e-05} +{"train_loss": 0.00570656917989254, "global_step": 29050, "epoch": 244, "lr": 6.504784988085306e-05} +{"train_loss": 0.0036624963395297527, "global_step": 29051, "epoch": 244, "lr": 6.504573707254823e-05} +{"train_loss": 0.0030033986549824476, "global_step": 29052, "epoch": 244, "lr": 6.50436242347027e-05} +{"train_loss": 0.0029051373712718487, "global_step": 29053, "epoch": 244, "lr": 6.504151136732062e-05} +{"train_loss": 0.004324987065047026, "global_step": 29054, "epoch": 244, "lr": 6.503939847040615e-05} +{"train_loss": 0.003236415097489953, "global_step": 29055, "epoch": 244, "lr": 6.503728554396343e-05} +{"train_loss": 0.0020150160416960716, "global_step": 29056, "epoch": 244, "lr": 6.503517258799659e-05} +{"train_loss": 0.0030723048839718103, "global_step": 29057, "epoch": 244, "lr": 6.503305960250979e-05} +{"train_loss": 0.002966419095173478, "global_step": 29058, "epoch": 244, "lr": 6.50309465875072e-05} +{"train_loss": 0.002725957427173853, "global_step": 29059, "epoch": 244, "lr": 6.502883354299294e-05} +{"train_loss": 0.0024789972230792046, "global_step": 29060, "epoch": 244, "lr": 6.502672046897118e-05} +{"train_loss": 0.0026103626005351543, "global_step": 29061, "epoch": 244, "lr": 6.502460736544606e-05} +{"train_loss": 0.0037741896230727434, "global_step": 29062, "epoch": 244, "lr": 6.502249423242171e-05} +{"train_loss": 0.0031066080555319786, "global_step": 29063, "epoch": 244, "lr": 6.502038106990232e-05} +{"train_loss": 0.002898067468777299, "global_step": 29064, "epoch": 244, "lr": 6.501826787789201e-05} +{"train_loss": 0.0018173542339354753, "global_step": 29065, "epoch": 244, "lr": 6.501615465639492e-05} +{"train_loss": 0.0023828649427741766, "global_step": 29066, "epoch": 244, "lr": 6.501404140541524e-05} +{"train_loss": 0.003739649895578623, "global_step": 29067, "epoch": 244, "lr": 6.501192812495709e-05} +{"train_loss": 0.0028743341099470854, "global_step": 29068, "epoch": 244, "lr": 6.500981481502462e-05} +{"train_loss": 0.006539538037031889, "global_step": 29069, "epoch": 244, "lr": 6.500770147562197e-05} +{"train_loss": 0.0025649049784988165, "global_step": 29070, "epoch": 244, "lr": 6.500558810675331e-05} +{"train_loss": 0.003987000789493322, "global_step": 29071, "epoch": 244, "lr": 6.500347470842279e-05} +{"train_loss": 0.002391254296526313, "global_step": 29072, "epoch": 244, "lr": 6.500136128063453e-05} +{"train_loss": 0.0018352523911744356, "global_step": 29073, "epoch": 244, "lr": 6.499924782339271e-05} +{"train_loss": 0.0027415999211370945, "global_step": 29074, "epoch": 244, "lr": 6.499713433670147e-05} +{"train_loss": 0.003293524496257305, "global_step": 29075, "epoch": 244, "lr": 6.499502082056495e-05} +{"train_loss": 0.003635371569544077, "global_step": 29076, "epoch": 244, "lr": 6.499290727498732e-05} +{"train_loss": 0.0029579566325992346, "global_step": 29077, "epoch": 244, "lr": 6.499079369997272e-05} +{"train_loss": 0.003178204642608762, "global_step": 29078, "epoch": 244, "lr": 6.498868009552529e-05} +{"train_loss": 0.0033526322804391384, "global_step": 29079, "epoch": 244, "lr": 6.49865664616492e-05} +{"train_loss": 0.004087769892066717, "global_step": 29080, "epoch": 244, "lr": 6.498445279834857e-05} +{"train_loss": 0.0039240336045622826, "global_step": 29081, "epoch": 244, "lr": 6.49823391056276e-05} +{"train_loss": 0.005231515970081091, "global_step": 29082, "epoch": 244, "lr": 6.498022538349037e-05} +{"train_loss": 0.0015052626840770245, "global_step": 29083, "epoch": 244, "lr": 6.497811163194108e-05} +{"train_loss": 0.002369882306084037, "global_step": 29084, "epoch": 244, "lr": 6.497599785098387e-05} +{"train_loss": 0.004553677048534155, "global_step": 29085, "epoch": 244, "lr": 6.49738840406229e-05} +{"train_loss": 0.004113152157515287, "global_step": 29086, "epoch": 244, "lr": 6.497177020086229e-05} +{"train_loss": 0.0029195554088801146, "global_step": 29087, "epoch": 244, "lr": 6.496965633170622e-05} +{"train_loss": 0.006114168092608452, "global_step": 29088, "epoch": 244, "lr": 6.496754243315882e-05} +{"train_loss": 0.0037684119306504726, "global_step": 29089, "epoch": 244, "lr": 6.496542850522426e-05} +{"train_loss": 0.0038009602576494217, "global_step": 29090, "epoch": 244, "lr": 6.496331454790668e-05} +{"train_loss": 0.0028634502086788416, "global_step": 29091, "epoch": 244, "lr": 6.496120056121021e-05} +{"train_loss": 0.003620242001488805, "global_step": 29092, "epoch": 244, "lr": 6.495908654513904e-05} +{"train_loss": 0.0030493359081447124, "global_step": 29093, "epoch": 244, "lr": 6.49569724996973e-05} +{"train_loss": 0.003903172444552183, "global_step": 29094, "epoch": 244, "lr": 6.495485842488913e-05} +{"train_loss": 0.0027603853959590197, "global_step": 29095, "epoch": 244, "lr": 6.49527443207187e-05} +{"train_loss": 0.004227837081998587, "global_step": 29096, "epoch": 244, "lr": 6.495063018719016e-05} +{"train_loss": 0.001885954407043755, "global_step": 29097, "epoch": 244, "lr": 6.494851602430766e-05} +{"train_loss": 0.003229833673685789, "global_step": 29098, "epoch": 244, "lr": 6.494640183207534e-05} +{"train_loss": 0.005739821121096611, "global_step": 29099, "epoch": 244, "lr": 6.494428761049736e-05} +{"train_loss": 0.00343875540420413, "global_step": 29100, "epoch": 244, "lr": 6.494217335957786e-05} +{"train_loss": 0.004302290268242359, "global_step": 29101, "epoch": 244, "lr": 6.4940059079321e-05} +{"train_loss": 0.0034546044189482927, "global_step": 29102, "epoch": 244, "lr": 6.493794476973093e-05} +{"train_loss": 0.004763101227581501, "global_step": 29103, "epoch": 244, "lr": 6.49358304308118e-05} +{"train_loss": 0.0031685347203165293, "global_step": 29104, "epoch": 244, "lr": 6.493371606256777e-05} +{"train_loss": 0.004987095482647419, "global_step": 29105, "epoch": 244, "lr": 6.493160166500298e-05} +{"train_loss": 0.005358646623790264, "global_step": 29106, "epoch": 244, "lr": 6.49294872381216e-05} +{"train_loss": 0.003324126126244664, "global_step": 29107, "epoch": 244, "lr": 6.492737278192775e-05} +{"train_loss": 0.004050237126648426, "global_step": 29108, "epoch": 244, "lr": 6.49252582964256e-05} +{"train_loss": 0.004975360818207264, "global_step": 29109, "epoch": 244, "lr": 6.492314378161929e-05} +{"train_loss": 0.0024594319984316826, "global_step": 29110, "epoch": 244, "lr": 6.492102923751297e-05} +{"train_loss": 0.0042607164941728115, "global_step": 29111, "epoch": 244, "lr": 6.491891466411084e-05} +{"train_loss": 0.00379571202211082, "global_step": 29112, "epoch": 244, "lr": 6.4916800061417e-05} +{"train_loss": 0.00385081279091537, "global_step": 29113, "epoch": 244, "lr": 6.491468542943562e-05} +{"train_loss": 0.003113728715106845, "global_step": 29114, "epoch": 244, "lr": 6.491257076817085e-05} +{"train_loss": 0.004370530601590872, "global_step": 29115, "epoch": 244, "lr": 6.491045607762682e-05} +{"train_loss": 0.0032114991918206215, "global_step": 29116, "epoch": 244, "lr": 6.490834135780773e-05} +{"train_loss": 0.0026374859735369682, "global_step": 29117, "epoch": 244, "lr": 6.490622660871769e-05} +{"train_loss": 0.004570971708744764, "global_step": 29118, "epoch": 244, "lr": 6.490411183036086e-05} +{"train_loss": 0.0021799819078296423, "global_step": 29119, "epoch": 244, "lr": 6.490199702274142e-05} +{"train_loss": 0.0028755480889230967, "global_step": 29120, "epoch": 244, "lr": 6.48998821858635e-05} +{"train_loss": 0.003456955077126622, "global_step": 29121, "epoch": 244, "lr": 6.489776731973123e-05} +{"train_loss": 0.0036359596997499466, "global_step": 29122, "epoch": 244, "lr": 6.489565242434878e-05} +{"train_loss": 0.00461439648643136, "global_step": 29123, "epoch": 244, "lr": 6.489353749972034e-05} +{"train_loss": 0.002744358265772462, "global_step": 29124, "epoch": 244, "lr": 6.489142254585001e-05} +{"train_loss": 0.006392912473529577, "global_step": 29125, "epoch": 244, "lr": 6.488930756274197e-05} +{"train_loss": 0.0034767636097967625, "global_step": 29126, "epoch": 244, "lr": 6.488719255040035e-05} +{"train_loss": 0.0018206223612651229, "global_step": 29127, "epoch": 244, "lr": 6.488507750882934e-05} +{"train_loss": 0.003305118763819337, "global_step": 29128, "epoch": 244, "lr": 6.488296243803306e-05} +{"train_loss": 0.003038182621821761, "global_step": 29129, "epoch": 244, "lr": 6.488084733801567e-05} +{"train_loss": 0.004345242399722338, "global_step": 29130, "epoch": 244, "lr": 6.487873220878134e-05} +{"train_loss": 0.004199388902634382, "global_step": 29131, "epoch": 244, "lr": 6.48766170503342e-05} +{"train_loss": 0.0048707351088523865, "global_step": 29132, "epoch": 244, "lr": 6.487450186267841e-05} +{"train_loss": 0.004994753748178482, "global_step": 29133, "epoch": 244, "lr": 6.487238664581813e-05} +{"train_loss": 0.0037384035531431437, "global_step": 29134, "epoch": 244, "lr": 6.487027139975749e-05} +{"train_loss": 0.003634446067735553, "global_step": 29135, "epoch": 244, "lr": 6.486815612450067e-05} +{"train_loss": 0.0030089328065514565, "global_step": 29136, "epoch": 244, "lr": 6.486604082005185e-05} +{"train_loss": 0.004524425603449345, "global_step": 29137, "epoch": 244, "lr": 6.486392548641512e-05} +{"train_loss": 0.0026158085092902184, "global_step": 29138, "epoch": 244, "lr": 6.486181012359465e-05} +{"train_loss": 0.005508300382643938, "global_step": 29139, "epoch": 244, "lr": 6.48596947315946e-05} +{"train_loss": 0.003171038581058383, "global_step": 29140, "epoch": 244, "lr": 6.485757931041914e-05} +{"train_loss": 0.00354290334507823, "global_step": 29141, "epoch": 244, "lr": 6.48554638600724e-05} +{"train_loss": 0.004602366127073765, "global_step": 29142, "epoch": 244, "lr": 6.485334838055854e-05} +{"train_loss": 0.004920613951981068, "global_step": 29143, "epoch": 244, "lr": 6.485123287188172e-05} +{"train_loss": 0.0021410402841866016, "global_step": 29144, "epoch": 244, "lr": 6.484911733404611e-05} +{"train_loss": 0.002661501057446003, "global_step": 29145, "epoch": 244, "lr": 6.484700176705583e-05} +{"train_loss": 0.002577731851488352, "global_step": 29146, "epoch": 244, "lr": 6.484488617091506e-05} +{"train_loss": 0.005538521334528923, "global_step": 29147, "epoch": 244, "lr": 6.484277054562793e-05} +{"train_loss": 0.005853452254086733, "global_step": 29148, "epoch": 244, "lr": 6.484065489119861e-05} +{"train_loss": 0.003587303915992379, "global_step": 29149, "epoch": 244, "lr": 6.483853920763125e-05} +{"train_loss": 0.005108329933136702, "global_step": 29150, "epoch": 244, "lr": 6.483642349493e-05} +{"train_loss": 0.005427499767392874, "global_step": 29151, "epoch": 244, "lr": 6.483430775309902e-05} +{"train_loss": 0.0038195387460291386, "global_step": 29152, "epoch": 244, "lr": 6.483219198214247e-05} +{"train_loss": 0.003921880852431059, "global_step": 29153, "epoch": 244, "lr": 6.483007618206448e-05} +{"train_loss": 0.003537030248832302, "global_step": 29154, "epoch": 244, "lr": 6.482796035286922e-05, "val_loss": 0.029361803084611893} +{"train_loss": 0.005422818474471569, "global_step": 29155, "epoch": 245, "lr": 6.482584449456086e-05} +{"train_loss": 0.0030111821833997965, "global_step": 29156, "epoch": 245, "lr": 6.482372860714353e-05} +{"train_loss": 0.004417966119945049, "global_step": 29157, "epoch": 245, "lr": 6.482161269062139e-05} +{"train_loss": 0.006619465537369251, "global_step": 29158, "epoch": 245, "lr": 6.48194967449986e-05} +{"train_loss": 0.00523463124409318, "global_step": 29159, "epoch": 245, "lr": 6.48173807702793e-05} +{"train_loss": 0.005229474510997534, "global_step": 29160, "epoch": 245, "lr": 6.481526476646767e-05} +{"train_loss": 0.004466993734240532, "global_step": 29161, "epoch": 245, "lr": 6.481314873356785e-05} +{"train_loss": 0.004920411854982376, "global_step": 29162, "epoch": 245, "lr": 6.4811032671584e-05} +{"train_loss": 0.003109340090304613, "global_step": 29163, "epoch": 245, "lr": 6.480891658052024e-05} +{"train_loss": 0.005245967768132687, "global_step": 29164, "epoch": 245, "lr": 6.480680046038077e-05} +{"train_loss": 0.001758610480464995, "global_step": 29165, "epoch": 245, "lr": 6.480468431116975e-05} +{"train_loss": 0.003251400776207447, "global_step": 29166, "epoch": 245, "lr": 6.48025681328913e-05} +{"train_loss": 0.00545897800475359, "global_step": 29167, "epoch": 245, "lr": 6.480045192554958e-05} +{"train_loss": 0.0041490658186376095, "global_step": 29168, "epoch": 245, "lr": 6.479833568914877e-05} +{"train_loss": 0.005173221230506897, "global_step": 29169, "epoch": 245, "lr": 6.4796219423693e-05} +{"train_loss": 0.004495846573263407, "global_step": 29170, "epoch": 245, "lr": 6.479410312918643e-05} +{"train_loss": 0.0026661057490855455, "global_step": 29171, "epoch": 245, "lr": 6.479198680563322e-05} +{"train_loss": 0.004399157594889402, "global_step": 29172, "epoch": 245, "lr": 6.478987045303752e-05} +{"train_loss": 0.0035635815002024174, "global_step": 29173, "epoch": 245, "lr": 6.47877540714035e-05} +{"train_loss": 0.004985692445188761, "global_step": 29174, "epoch": 245, "lr": 6.47856376607353e-05} +{"train_loss": 0.00464596739038825, "global_step": 29175, "epoch": 245, "lr": 6.478352122103708e-05} +{"train_loss": 0.005916461814194918, "global_step": 29176, "epoch": 245, "lr": 6.478140475231301e-05} +{"train_loss": 0.0038759158924221992, "global_step": 29177, "epoch": 245, "lr": 6.47792882545672e-05} +{"train_loss": 0.0032730617094784975, "global_step": 29178, "epoch": 245, "lr": 6.477717172780386e-05} +{"train_loss": 0.0036015277728438377, "global_step": 29179, "epoch": 245, "lr": 6.47750551720271e-05} +{"train_loss": 0.006082384847104549, "global_step": 29180, "epoch": 245, "lr": 6.477293858724114e-05} +{"train_loss": 0.005606493912637234, "global_step": 29181, "epoch": 245, "lr": 6.477082197345006e-05} +{"train_loss": 0.003259398275986314, "global_step": 29182, "epoch": 245, "lr": 6.476870533065806e-05} +{"train_loss": 0.0020305283833295107, "global_step": 29183, "epoch": 245, "lr": 6.476658865886927e-05} +{"train_loss": 0.00405364204198122, "global_step": 29184, "epoch": 245, "lr": 6.476447195808788e-05} +{"train_loss": 0.005085589364171028, "global_step": 29185, "epoch": 245, "lr": 6.476235522831802e-05} +{"train_loss": 0.004258091561496258, "global_step": 29186, "epoch": 245, "lr": 6.476023846956385e-05} +{"train_loss": 0.0037713695783168077, "global_step": 29187, "epoch": 245, "lr": 6.475812168182954e-05} +{"train_loss": 0.005722458939999342, "global_step": 29188, "epoch": 245, "lr": 6.475600486511921e-05} +{"train_loss": 0.0055631352588534355, "global_step": 29189, "epoch": 245, "lr": 6.475388801943706e-05} +{"train_loss": 0.003859620774164796, "global_step": 29190, "epoch": 245, "lr": 6.475177114478722e-05} +{"train_loss": 0.002885761670768261, "global_step": 29191, "epoch": 245, "lr": 6.474965424117385e-05} +{"train_loss": 0.002269929274916649, "global_step": 29192, "epoch": 245, "lr": 6.474753730860113e-05} +{"train_loss": 0.003058093599975109, "global_step": 29193, "epoch": 245, "lr": 6.474542034707317e-05} +{"train_loss": 0.003262450685724616, "global_step": 29194, "epoch": 245, "lr": 6.474330335659417e-05} +{"train_loss": 0.003195226425305009, "global_step": 29195, "epoch": 245, "lr": 6.474118633716825e-05} +{"train_loss": 0.0018371748737990856, "global_step": 29196, "epoch": 245, "lr": 6.47390692887996e-05} +{"train_loss": 0.004505263175815344, "global_step": 29197, "epoch": 245, "lr": 6.473695221149237e-05} +{"train_loss": 0.0028873374685645103, "global_step": 29198, "epoch": 245, "lr": 6.47348351052507e-05} +{"train_loss": 0.0037628740537911654, "global_step": 29199, "epoch": 245, "lr": 6.473271797007876e-05} +{"train_loss": 0.003759587649255991, "global_step": 29200, "epoch": 245, "lr": 6.473060080598069e-05} +{"train_loss": 0.0049566724337637424, "global_step": 29201, "epoch": 245, "lr": 6.472848361296067e-05} +{"train_loss": 0.0036727716214954853, "global_step": 29202, "epoch": 245, "lr": 6.472636639102283e-05} +{"train_loss": 0.0028976064641028643, "global_step": 29203, "epoch": 245, "lr": 6.472424914017137e-05} +{"train_loss": 0.0034677484072744846, "global_step": 29204, "epoch": 245, "lr": 6.472213186041039e-05} +{"train_loss": 0.003089388133957982, "global_step": 29205, "epoch": 245, "lr": 6.47200145517441e-05} +{"train_loss": 0.003181526670232415, "global_step": 29206, "epoch": 245, "lr": 6.471789721417662e-05} +{"train_loss": 0.005025539547204971, "global_step": 29207, "epoch": 245, "lr": 6.471577984771213e-05} +{"train_loss": 0.0063404967077076435, "global_step": 29208, "epoch": 245, "lr": 6.471366245235477e-05} +{"train_loss": 0.003217796329408884, "global_step": 29209, "epoch": 245, "lr": 6.471154502810872e-05} +{"train_loss": 0.0030046903993934393, "global_step": 29210, "epoch": 245, "lr": 6.47094275749781e-05} +{"train_loss": 0.0021018467377871275, "global_step": 29211, "epoch": 245, "lr": 6.470731009296711e-05} +{"train_loss": 0.001387028838507831, "global_step": 29212, "epoch": 245, "lr": 6.470519258207989e-05} +{"train_loss": 0.003587717656046152, "global_step": 29213, "epoch": 245, "lr": 6.470307504232058e-05} +{"train_loss": 0.004833215847611427, "global_step": 29214, "epoch": 245, "lr": 6.470095747369336e-05} +{"train_loss": 0.004258268978446722, "global_step": 29215, "epoch": 245, "lr": 6.469883987620238e-05} +{"train_loss": 0.004075299017131329, "global_step": 29216, "epoch": 245, "lr": 6.469672224985181e-05} +{"train_loss": 0.00234023854136467, "global_step": 29217, "epoch": 245, "lr": 6.469460459464578e-05} +{"train_loss": 0.0035594890359789133, "global_step": 29218, "epoch": 245, "lr": 6.469248691058846e-05} +{"train_loss": 0.00473548099398613, "global_step": 29219, "epoch": 245, "lr": 6.469036919768403e-05} +{"train_loss": 0.005484124645590782, "global_step": 29220, "epoch": 245, "lr": 6.468825145593663e-05} +{"train_loss": 0.002168132457882166, "global_step": 29221, "epoch": 245, "lr": 6.46861336853504e-05} +{"train_loss": 0.0032643715385347605, "global_step": 29222, "epoch": 245, "lr": 6.468401588592951e-05} +{"train_loss": 0.002379588782787323, "global_step": 29223, "epoch": 245, "lr": 6.468189805767815e-05} +{"train_loss": 0.0043573640286922455, "global_step": 29224, "epoch": 245, "lr": 6.467978020060044e-05} +{"train_loss": 0.0034884680062532425, "global_step": 29225, "epoch": 245, "lr": 6.467766231470054e-05} +{"train_loss": 0.00524421501904726, "global_step": 29226, "epoch": 245, "lr": 6.467554439998263e-05} +{"train_loss": 0.0062821232713758945, "global_step": 29227, "epoch": 245, "lr": 6.467342645645085e-05} +{"train_loss": 0.0022224853746593, "global_step": 29228, "epoch": 245, "lr": 6.467130848410936e-05} +{"train_loss": 0.002668960951268673, "global_step": 29229, "epoch": 245, "lr": 6.466919048296234e-05} +{"train_loss": 0.002991402754560113, "global_step": 29230, "epoch": 245, "lr": 6.466707245301393e-05} +{"train_loss": 0.003766470355913043, "global_step": 29231, "epoch": 245, "lr": 6.466495439426828e-05} +{"train_loss": 0.005333256907761097, "global_step": 29232, "epoch": 245, "lr": 6.466283630672956e-05} +{"train_loss": 0.004370871931314468, "global_step": 29233, "epoch": 245, "lr": 6.466071819040192e-05} +{"train_loss": 0.0033824024721980095, "global_step": 29234, "epoch": 245, "lr": 6.465860004528954e-05} +{"train_loss": 0.0038588750176131725, "global_step": 29235, "epoch": 245, "lr": 6.465648187139656e-05} +{"train_loss": 0.0028439213056117296, "global_step": 29236, "epoch": 245, "lr": 6.465436366872715e-05} +{"train_loss": 0.003904696786776185, "global_step": 29237, "epoch": 245, "lr": 6.465224543728545e-05} +{"train_loss": 0.005164142232388258, "global_step": 29238, "epoch": 245, "lr": 6.465012717707563e-05} +{"train_loss": 0.0033162685576826334, "global_step": 29239, "epoch": 245, "lr": 6.464800888810188e-05} +{"train_loss": 0.0077485498040914536, "global_step": 29240, "epoch": 245, "lr": 6.46458905703683e-05} +{"train_loss": 0.005941829644143581, "global_step": 29241, "epoch": 245, "lr": 6.464377222387908e-05} +{"train_loss": 0.004050725605338812, "global_step": 29242, "epoch": 245, "lr": 6.464165384863838e-05} +{"train_loss": 0.002541791647672653, "global_step": 29243, "epoch": 245, "lr": 6.463953544465036e-05} +{"train_loss": 0.0024363358970731497, "global_step": 29244, "epoch": 245, "lr": 6.463741701191918e-05} +{"train_loss": 0.003182850079610944, "global_step": 29245, "epoch": 245, "lr": 6.463529855044899e-05} +{"train_loss": 0.00398014672100544, "global_step": 29246, "epoch": 245, "lr": 6.463318006024395e-05} +{"train_loss": 0.0025208243168890476, "global_step": 29247, "epoch": 245, "lr": 6.463106154130823e-05} +{"train_loss": 0.004396372474730015, "global_step": 29248, "epoch": 245, "lr": 6.4628942993646e-05} +{"train_loss": 0.004183698445558548, "global_step": 29249, "epoch": 245, "lr": 6.462682441726139e-05} +{"train_loss": 0.0024647116661071777, "global_step": 29250, "epoch": 245, "lr": 6.462470581215857e-05} +{"train_loss": 0.002515329048037529, "global_step": 29251, "epoch": 245, "lr": 6.46225871783417e-05} +{"train_loss": 0.004011766519397497, "global_step": 29252, "epoch": 245, "lr": 6.462046851581494e-05} +{"train_loss": 0.002308234106749296, "global_step": 29253, "epoch": 245, "lr": 6.461834982458245e-05} +{"train_loss": 0.004112481139600277, "global_step": 29254, "epoch": 245, "lr": 6.46162311046484e-05} +{"train_loss": 0.007861359044909477, "global_step": 29255, "epoch": 245, "lr": 6.461411235601696e-05} +{"train_loss": 0.0026270397938787937, "global_step": 29256, "epoch": 245, "lr": 6.461199357869224e-05} +{"train_loss": 0.003609058680012822, "global_step": 29257, "epoch": 245, "lr": 6.460987477267845e-05} +{"train_loss": 0.00420067785307765, "global_step": 29258, "epoch": 245, "lr": 6.460775593797972e-05} +{"train_loss": 0.0044746859930455685, "global_step": 29259, "epoch": 245, "lr": 6.460563707460024e-05} +{"train_loss": 0.0029345944058150053, "global_step": 29260, "epoch": 245, "lr": 6.460351818254413e-05} +{"train_loss": 0.004757565911859274, "global_step": 29261, "epoch": 245, "lr": 6.460139926181559e-05} +{"train_loss": 0.002990278648212552, "global_step": 29262, "epoch": 245, "lr": 6.459928031241875e-05} +{"train_loss": 0.0038306869100779295, "global_step": 29263, "epoch": 245, "lr": 6.45971613343578e-05} +{"train_loss": 0.004430362954735756, "global_step": 29264, "epoch": 245, "lr": 6.459504232763687e-05} +{"train_loss": 0.004282274283468723, "global_step": 29265, "epoch": 245, "lr": 6.459292329226012e-05} +{"train_loss": 0.0031960720662027597, "global_step": 29266, "epoch": 245, "lr": 6.459080422823174e-05} +{"train_loss": 0.0024627011734992266, "global_step": 29267, "epoch": 245, "lr": 6.45886851355559e-05} +{"train_loss": 0.004711466375738382, "global_step": 29268, "epoch": 245, "lr": 6.45865660142367e-05} +{"train_loss": 0.002365832682698965, "global_step": 29269, "epoch": 245, "lr": 6.458444686427833e-05} +{"train_loss": 0.005503122694790363, "global_step": 29270, "epoch": 245, "lr": 6.458232768568498e-05} +{"train_loss": 0.003879792056977749, "global_step": 29271, "epoch": 245, "lr": 6.458020847846078e-05} +{"train_loss": 0.005272550042718649, "global_step": 29272, "epoch": 245, "lr": 6.45780892426099e-05} +{"train_loss": 0.003953492131960743, "global_step": 29273, "epoch": 245, "lr": 6.457596997813649e-05, "val_loss": 0.021471349522471428, "train_action_mse_error": 5.929287726758048e-05} +{"train_loss": 0.0036998819559812546, "global_step": 29274, "epoch": 246, "lr": 6.457385068504472e-05} +{"train_loss": 0.0048896148800849915, "global_step": 29275, "epoch": 246, "lr": 6.457173136333876e-05} +{"train_loss": 0.0026580721605569124, "global_step": 29276, "epoch": 246, "lr": 6.456961201302276e-05} +{"train_loss": 0.0038702175952494144, "global_step": 29277, "epoch": 246, "lr": 6.456749263410089e-05} +{"train_loss": 0.004680224694311619, "global_step": 29278, "epoch": 246, "lr": 6.456537322657729e-05} +{"train_loss": 0.0036006702575832605, "global_step": 29279, "epoch": 246, "lr": 6.456325379045615e-05} +{"train_loss": 0.003799408907070756, "global_step": 29280, "epoch": 246, "lr": 6.456113432574162e-05} +{"train_loss": 0.003289859276264906, "global_step": 29281, "epoch": 246, "lr": 6.455901483243785e-05} +{"train_loss": 0.004527920391410589, "global_step": 29282, "epoch": 246, "lr": 6.4556895310549e-05} +{"train_loss": 0.006065639201551676, "global_step": 29283, "epoch": 246, "lr": 6.455477576007924e-05} +{"train_loss": 0.003871493274345994, "global_step": 29284, "epoch": 246, "lr": 6.455265618103276e-05} +{"train_loss": 0.0041353399865329266, "global_step": 29285, "epoch": 246, "lr": 6.455053657341367e-05} +{"train_loss": 0.002516625914722681, "global_step": 29286, "epoch": 246, "lr": 6.454841693722618e-05} +{"train_loss": 0.0032293687108904123, "global_step": 29287, "epoch": 246, "lr": 6.454629727247439e-05} +{"train_loss": 0.002509587211534381, "global_step": 29288, "epoch": 246, "lr": 6.454417757916254e-05} +{"train_loss": 0.004181100986897945, "global_step": 29289, "epoch": 246, "lr": 6.454205785729473e-05} +{"train_loss": 0.0038138728123158216, "global_step": 29290, "epoch": 246, "lr": 6.453993810687513e-05} +{"train_loss": 0.003189025679603219, "global_step": 29291, "epoch": 246, "lr": 6.453781832790793e-05} +{"train_loss": 0.0022799670696258545, "global_step": 29292, "epoch": 246, "lr": 6.453569852039728e-05} +{"train_loss": 0.002139963209629059, "global_step": 29293, "epoch": 246, "lr": 6.453357868434734e-05} +{"train_loss": 0.003640127135440707, "global_step": 29294, "epoch": 246, "lr": 6.453145881976226e-05} +{"train_loss": 0.0030719067435711622, "global_step": 29295, "epoch": 246, "lr": 6.452933892664621e-05} +{"train_loss": 0.002253871178254485, "global_step": 29296, "epoch": 246, "lr": 6.452721900500337e-05} +{"train_loss": 0.00203888607211411, "global_step": 29297, "epoch": 246, "lr": 6.452509905483788e-05} +{"train_loss": 0.0025726333260536194, "global_step": 29298, "epoch": 246, "lr": 6.452297907615391e-05} +{"train_loss": 0.0034103954676538706, "global_step": 29299, "epoch": 246, "lr": 6.452085906895563e-05} +{"train_loss": 0.0025377545971423388, "global_step": 29300, "epoch": 246, "lr": 6.451873903324719e-05} +{"train_loss": 0.0025051934644579887, "global_step": 29301, "epoch": 246, "lr": 6.451661896903274e-05} +{"train_loss": 0.0024883514270186424, "global_step": 29302, "epoch": 246, "lr": 6.451449887631649e-05} +{"train_loss": 0.003012979868799448, "global_step": 29303, "epoch": 246, "lr": 6.451237875510255e-05} +{"train_loss": 0.004977331962436438, "global_step": 29304, "epoch": 246, "lr": 6.451025860539512e-05} +{"train_loss": 0.0027327374555170536, "global_step": 29305, "epoch": 246, "lr": 6.450813842719833e-05} +{"train_loss": 0.0035251853987574577, "global_step": 29306, "epoch": 246, "lr": 6.450601822051636e-05} +{"train_loss": 0.0023146620951592922, "global_step": 29307, "epoch": 246, "lr": 6.45038979853534e-05} +{"train_loss": 0.003430241020396352, "global_step": 29308, "epoch": 246, "lr": 6.450177772171355e-05} +{"train_loss": 0.0030243510846048594, "global_step": 29309, "epoch": 246, "lr": 6.449965742960104e-05} +{"train_loss": 0.0029692023526877165, "global_step": 29310, "epoch": 246, "lr": 6.449753710901998e-05} +{"train_loss": 0.00418614037334919, "global_step": 29311, "epoch": 246, "lr": 6.449541675997457e-05} +{"train_loss": 0.002287422539666295, "global_step": 29312, "epoch": 246, "lr": 6.449329638246895e-05} +{"train_loss": 0.002569046802818775, "global_step": 29313, "epoch": 246, "lr": 6.44911759765073e-05} +{"train_loss": 0.0031785776372998953, "global_step": 29314, "epoch": 246, "lr": 6.448905554209376e-05} +{"train_loss": 0.004111782647669315, "global_step": 29315, "epoch": 246, "lr": 6.448693507923252e-05} +{"train_loss": 0.0028795793186873198, "global_step": 29316, "epoch": 246, "lr": 6.448481458792771e-05} +{"train_loss": 0.0027881793212145567, "global_step": 29317, "epoch": 246, "lr": 6.448269406818353e-05} +{"train_loss": 0.0029051576275378466, "global_step": 29318, "epoch": 246, "lr": 6.448057352000414e-05} +{"train_loss": 0.0033171125687658787, "global_step": 29319, "epoch": 246, "lr": 6.447845294339368e-05} +{"train_loss": 0.002314807614311576, "global_step": 29320, "epoch": 246, "lr": 6.447633233835631e-05} +{"train_loss": 0.003870725631713867, "global_step": 29321, "epoch": 246, "lr": 6.447421170489621e-05} +{"train_loss": 0.002955687465146184, "global_step": 29322, "epoch": 246, "lr": 6.447209104301756e-05} +{"train_loss": 0.002563120098784566, "global_step": 29323, "epoch": 246, "lr": 6.446997035272449e-05} +{"train_loss": 0.002721638884395361, "global_step": 29324, "epoch": 246, "lr": 6.446784963402118e-05} +{"train_loss": 0.00394046027213335, "global_step": 29325, "epoch": 246, "lr": 6.44657288869118e-05} +{"train_loss": 0.0027688087429851294, "global_step": 29326, "epoch": 246, "lr": 6.44636081114005e-05} +{"train_loss": 0.004033960867673159, "global_step": 29327, "epoch": 246, "lr": 6.446148730749147e-05} +{"train_loss": 0.00381760043092072, "global_step": 29328, "epoch": 246, "lr": 6.445936647518883e-05} +{"train_loss": 0.0036707876715809107, "global_step": 29329, "epoch": 246, "lr": 6.445724561449677e-05} +{"train_loss": 0.0017906619468703866, "global_step": 29330, "epoch": 246, "lr": 6.445512472541948e-05} +{"train_loss": 0.004274140112102032, "global_step": 29331, "epoch": 246, "lr": 6.445300380796108e-05} +{"train_loss": 0.005494867451488972, "global_step": 29332, "epoch": 246, "lr": 6.445088286212574e-05} +{"train_loss": 0.0026841661892831326, "global_step": 29333, "epoch": 246, "lr": 6.444876188791764e-05} +{"train_loss": 0.0026833743322640657, "global_step": 29334, "epoch": 246, "lr": 6.444664088534094e-05} +{"train_loss": 0.003016240429133177, "global_step": 29335, "epoch": 246, "lr": 6.444451985439981e-05} +{"train_loss": 0.002896026475355029, "global_step": 29336, "epoch": 246, "lr": 6.444239879509843e-05} +{"train_loss": 0.002868280978873372, "global_step": 29337, "epoch": 246, "lr": 6.44402777074409e-05} +{"train_loss": 0.004453141242265701, "global_step": 29338, "epoch": 246, "lr": 6.443815659143145e-05} +{"train_loss": 0.0035570270847529173, "global_step": 29339, "epoch": 246, "lr": 6.443603544707422e-05} +{"train_loss": 0.0016061096685007215, "global_step": 29340, "epoch": 246, "lr": 6.443391427437337e-05} +{"train_loss": 0.0022397739812731743, "global_step": 29341, "epoch": 246, "lr": 6.443179307333307e-05} +{"train_loss": 0.002451278967782855, "global_step": 29342, "epoch": 246, "lr": 6.442967184395749e-05} +{"train_loss": 0.0022478613536804914, "global_step": 29343, "epoch": 246, "lr": 6.442755058625081e-05} +{"train_loss": 0.003916403744369745, "global_step": 29344, "epoch": 246, "lr": 6.442542930021715e-05} +{"train_loss": 0.0028691792394965887, "global_step": 29345, "epoch": 246, "lr": 6.442330798586071e-05} +{"train_loss": 0.0024079405702650547, "global_step": 29346, "epoch": 246, "lr": 6.442118664318566e-05} +{"train_loss": 0.0027609760873019695, "global_step": 29347, "epoch": 246, "lr": 6.441906527219613e-05} +{"train_loss": 0.00680058728903532, "global_step": 29348, "epoch": 246, "lr": 6.441694387289632e-05} +{"train_loss": 0.0020434397738426924, "global_step": 29349, "epoch": 246, "lr": 6.441482244529038e-05} +{"train_loss": 0.003974666353315115, "global_step": 29350, "epoch": 246, "lr": 6.441270098938247e-05} +{"train_loss": 0.001957972999662161, "global_step": 29351, "epoch": 246, "lr": 6.441057950517674e-05} +{"train_loss": 0.004652067553251982, "global_step": 29352, "epoch": 246, "lr": 6.44084579926774e-05} +{"train_loss": 0.0018084632465615869, "global_step": 29353, "epoch": 246, "lr": 6.44063364518886e-05} +{"train_loss": 0.0017034891061484814, "global_step": 29354, "epoch": 246, "lr": 6.440421488281448e-05} +{"train_loss": 0.0026681828312575817, "global_step": 29355, "epoch": 246, "lr": 6.440209328545923e-05} +{"train_loss": 0.003044447163119912, "global_step": 29356, "epoch": 246, "lr": 6.439997165982703e-05} +{"train_loss": 0.0028441837057471275, "global_step": 29357, "epoch": 246, "lr": 6.439785000592199e-05} +{"train_loss": 0.002692517125979066, "global_step": 29358, "epoch": 246, "lr": 6.439572832374831e-05} +{"train_loss": 0.0027628543321043253, "global_step": 29359, "epoch": 246, "lr": 6.439360661331018e-05} +{"train_loss": 0.0037685963325202465, "global_step": 29360, "epoch": 246, "lr": 6.439148487461173e-05} +{"train_loss": 0.003920003771781921, "global_step": 29361, "epoch": 246, "lr": 6.438936310765714e-05} +{"train_loss": 0.0035626126918941736, "global_step": 29362, "epoch": 246, "lr": 6.438724131245056e-05} +{"train_loss": 0.0019608354195952415, "global_step": 29363, "epoch": 246, "lr": 6.438511948899619e-05} +{"train_loss": 0.00260604708455503, "global_step": 29364, "epoch": 246, "lr": 6.438299763729817e-05} +{"train_loss": 0.003346856217831373, "global_step": 29365, "epoch": 246, "lr": 6.438087575736065e-05} +{"train_loss": 0.0016413966659456491, "global_step": 29366, "epoch": 246, "lr": 6.437875384918783e-05} +{"train_loss": 0.00219320273026824, "global_step": 29367, "epoch": 246, "lr": 6.437663191278385e-05} +{"train_loss": 0.003024093573912978, "global_step": 29368, "epoch": 246, "lr": 6.437450994815292e-05} +{"train_loss": 0.00247401325032115, "global_step": 29369, "epoch": 246, "lr": 6.437238795529917e-05} +{"train_loss": 0.00268892222084105, "global_step": 29370, "epoch": 246, "lr": 6.437026593422674e-05} +{"train_loss": 0.003692758735269308, "global_step": 29371, "epoch": 246, "lr": 6.436814388493986e-05} +{"train_loss": 0.00328335864469409, "global_step": 29372, "epoch": 246, "lr": 6.436602180744264e-05} +{"train_loss": 0.0027280084323138, "global_step": 29373, "epoch": 246, "lr": 6.436389970173928e-05} +{"train_loss": 0.003646938130259514, "global_step": 29374, "epoch": 246, "lr": 6.436177756783395e-05} +{"train_loss": 0.0027593194972723722, "global_step": 29375, "epoch": 246, "lr": 6.435965540573078e-05} +{"train_loss": 0.0017452056054025888, "global_step": 29376, "epoch": 246, "lr": 6.435753321543399e-05} +{"train_loss": 0.0027466032188385725, "global_step": 29377, "epoch": 246, "lr": 6.435541099694769e-05} +{"train_loss": 0.0028879486490041018, "global_step": 29378, "epoch": 246, "lr": 6.435328875027609e-05} +{"train_loss": 0.002890302799642086, "global_step": 29379, "epoch": 246, "lr": 6.435116647542333e-05} +{"train_loss": 0.0031533779110759497, "global_step": 29380, "epoch": 246, "lr": 6.43490441723936e-05} +{"train_loss": 0.002712115878239274, "global_step": 29381, "epoch": 246, "lr": 6.434692184119105e-05} +{"train_loss": 0.00311183906160295, "global_step": 29382, "epoch": 246, "lr": 6.434479948181986e-05} +{"train_loss": 0.0018873998196795583, "global_step": 29383, "epoch": 246, "lr": 6.434267709428418e-05} +{"train_loss": 0.002856836887076497, "global_step": 29384, "epoch": 246, "lr": 6.434055467858819e-05} +{"train_loss": 0.0017986757447943091, "global_step": 29385, "epoch": 246, "lr": 6.433843223473603e-05} +{"train_loss": 0.0034428867511451244, "global_step": 29386, "epoch": 246, "lr": 6.433630976273193e-05} +{"train_loss": 0.003742121858522296, "global_step": 29387, "epoch": 246, "lr": 6.433418726257999e-05} +{"train_loss": 0.0033217838499695063, "global_step": 29388, "epoch": 246, "lr": 6.433206473428441e-05} +{"train_loss": 0.005241405684500933, "global_step": 29389, "epoch": 246, "lr": 6.432994217784934e-05} +{"train_loss": 0.0018991123652085662, "global_step": 29390, "epoch": 246, "lr": 6.432781959327898e-05} +{"train_loss": 0.004306817427277565, "global_step": 29391, "epoch": 246, "lr": 6.432569698057746e-05} +{"train_loss": 0.0031405020164748452, "global_step": 29392, "epoch": 246, "lr": 6.432357433974898e-05, "val_loss": 0.01434405893087387} +{"train_loss": 0.0016818311996757984, "global_step": 29393, "epoch": 247, "lr": 6.432145167079771e-05} +{"train_loss": 0.0034822754096239805, "global_step": 29394, "epoch": 247, "lr": 6.431932897372777e-05} +{"train_loss": 0.00326768821105361, "global_step": 29395, "epoch": 247, "lr": 6.431720624854336e-05} +{"train_loss": 0.0027229441329836845, "global_step": 29396, "epoch": 247, "lr": 6.431508349524863e-05} +{"train_loss": 0.003651815000921488, "global_step": 29397, "epoch": 247, "lr": 6.43129607138478e-05} +{"train_loss": 0.003778146579861641, "global_step": 29398, "epoch": 247, "lr": 6.431083790434497e-05} +{"train_loss": 0.0039544194005429745, "global_step": 29399, "epoch": 247, "lr": 6.430871506674436e-05} +{"train_loss": 0.0027751813177019358, "global_step": 29400, "epoch": 247, "lr": 6.430659220105011e-05} +{"train_loss": 0.0027354091871529818, "global_step": 29401, "epoch": 247, "lr": 6.430446930726639e-05} +{"train_loss": 0.0031276752706617117, "global_step": 29402, "epoch": 247, "lr": 6.430234638539738e-05} +{"train_loss": 0.004568912088871002, "global_step": 29403, "epoch": 247, "lr": 6.430022343544723e-05} +{"train_loss": 0.002864615526050329, "global_step": 29404, "epoch": 247, "lr": 6.429810045742013e-05} +{"train_loss": 0.0015526036731898785, "global_step": 29405, "epoch": 247, "lr": 6.429597745132023e-05} +{"train_loss": 0.0038707093335688114, "global_step": 29406, "epoch": 247, "lr": 6.42938544171517e-05} +{"train_loss": 0.004605526570230722, "global_step": 29407, "epoch": 247, "lr": 6.429173135491872e-05} +{"train_loss": 0.002725346479564905, "global_step": 29408, "epoch": 247, "lr": 6.428960826462546e-05} +{"train_loss": 0.0030438348185271025, "global_step": 29409, "epoch": 247, "lr": 6.428748514627607e-05} +{"train_loss": 0.0018181357299908996, "global_step": 29410, "epoch": 247, "lr": 6.428536199987474e-05} +{"train_loss": 0.0020669500809162855, "global_step": 29411, "epoch": 247, "lr": 6.428323882542562e-05} +{"train_loss": 0.003122763242572546, "global_step": 29412, "epoch": 247, "lr": 6.428111562293289e-05} +{"train_loss": 0.0036986167542636395, "global_step": 29413, "epoch": 247, "lr": 6.427899239240072e-05} +{"train_loss": 0.0022022647317498922, "global_step": 29414, "epoch": 247, "lr": 6.427686913383326e-05} +{"train_loss": 0.0023106548469513655, "global_step": 29415, "epoch": 247, "lr": 6.42747458472347e-05} +{"train_loss": 0.0021910271607339382, "global_step": 29416, "epoch": 247, "lr": 6.42726225326092e-05} +{"train_loss": 0.0017736563459038734, "global_step": 29417, "epoch": 247, "lr": 6.427049918996093e-05} +{"train_loss": 0.0043621058575809, "global_step": 29418, "epoch": 247, "lr": 6.426837581929408e-05} +{"train_loss": 0.002111598150804639, "global_step": 29419, "epoch": 247, "lr": 6.426625242061277e-05} +{"train_loss": 0.004547405522316694, "global_step": 29420, "epoch": 247, "lr": 6.42641289939212e-05} +{"train_loss": 0.003167289774864912, "global_step": 29421, "epoch": 247, "lr": 6.426200553922354e-05} +{"train_loss": 0.005366568453609943, "global_step": 29422, "epoch": 247, "lr": 6.425988205652397e-05} +{"train_loss": 0.0022070924751460552, "global_step": 29423, "epoch": 247, "lr": 6.425775854582663e-05} +{"train_loss": 0.003058400936424732, "global_step": 29424, "epoch": 247, "lr": 6.425563500713571e-05} +{"train_loss": 0.0027979325968772173, "global_step": 29425, "epoch": 247, "lr": 6.425351144045537e-05} +{"train_loss": 0.002313286764547229, "global_step": 29426, "epoch": 247, "lr": 6.425138784578979e-05} +{"train_loss": 0.005471831187605858, "global_step": 29427, "epoch": 247, "lr": 6.424926422314312e-05} +{"train_loss": 0.002620919141918421, "global_step": 29428, "epoch": 247, "lr": 6.424714057251956e-05} +{"train_loss": 0.0018301247619092464, "global_step": 29429, "epoch": 247, "lr": 6.424501689392325e-05} +{"train_loss": 0.002799148904159665, "global_step": 29430, "epoch": 247, "lr": 6.424289318735837e-05} +{"train_loss": 0.0017238273285329342, "global_step": 29431, "epoch": 247, "lr": 6.424076945282911e-05} +{"train_loss": 0.0031960250344127417, "global_step": 29432, "epoch": 247, "lr": 6.423864569033959e-05} +{"train_loss": 0.004028174560517073, "global_step": 29433, "epoch": 247, "lr": 6.423652189989403e-05} +{"train_loss": 0.0020325251389294863, "global_step": 29434, "epoch": 247, "lr": 6.423439808149658e-05} +{"train_loss": 0.003305286867544055, "global_step": 29435, "epoch": 247, "lr": 6.42322742351514e-05} +{"train_loss": 0.003277821931988001, "global_step": 29436, "epoch": 247, "lr": 6.423015036086268e-05} +{"train_loss": 0.001965875970199704, "global_step": 29437, "epoch": 247, "lr": 6.422802645863458e-05} +{"train_loss": 0.0028079007752239704, "global_step": 29438, "epoch": 247, "lr": 6.422590252847125e-05} +{"train_loss": 0.002275963546708226, "global_step": 29439, "epoch": 247, "lr": 6.42237785703769e-05} +{"train_loss": 0.002511691302061081, "global_step": 29440, "epoch": 247, "lr": 6.422165458435567e-05} +{"train_loss": 0.002278727712109685, "global_step": 29441, "epoch": 247, "lr": 6.421953057041175e-05} +{"train_loss": 0.0031742877326905727, "global_step": 29442, "epoch": 247, "lr": 6.42174065285493e-05} +{"train_loss": 0.0021597049199044704, "global_step": 29443, "epoch": 247, "lr": 6.42152824587725e-05} +{"train_loss": 0.0019686389714479446, "global_step": 29444, "epoch": 247, "lr": 6.421315836108549e-05} +{"train_loss": 0.0036210822872817516, "global_step": 29445, "epoch": 247, "lr": 6.421103423549248e-05} +{"train_loss": 0.0018404761794954538, "global_step": 29446, "epoch": 247, "lr": 6.42089100819976e-05} +{"train_loss": 0.0027837653178721666, "global_step": 29447, "epoch": 247, "lr": 6.420678590060507e-05} +{"train_loss": 0.001859006006270647, "global_step": 29448, "epoch": 247, "lr": 6.420466169131902e-05} +{"train_loss": 0.004033567383885384, "global_step": 29449, "epoch": 247, "lr": 6.420253745414364e-05} +{"train_loss": 0.0038069882430136204, "global_step": 29450, "epoch": 247, "lr": 6.42004131890831e-05} +{"train_loss": 0.0030238975305110216, "global_step": 29451, "epoch": 247, "lr": 6.419828889614154e-05} +{"train_loss": 0.005254233255982399, "global_step": 29452, "epoch": 247, "lr": 6.419616457532318e-05} +{"train_loss": 0.003469252958893776, "global_step": 29453, "epoch": 247, "lr": 6.419404022663215e-05} +{"train_loss": 0.0025959606282413006, "global_step": 29454, "epoch": 247, "lr": 6.419191585007266e-05} +{"train_loss": 0.0017241481691598892, "global_step": 29455, "epoch": 247, "lr": 6.418979144564885e-05} +{"train_loss": 0.002346237888559699, "global_step": 29456, "epoch": 247, "lr": 6.41876670133649e-05} +{"train_loss": 0.002764142118394375, "global_step": 29457, "epoch": 247, "lr": 6.418554255322497e-05} +{"train_loss": 0.005016083363443613, "global_step": 29458, "epoch": 247, "lr": 6.418341806523325e-05} +{"train_loss": 0.0060128988698124886, "global_step": 29459, "epoch": 247, "lr": 6.41812935493939e-05} +{"train_loss": 0.002190626924857497, "global_step": 29460, "epoch": 247, "lr": 6.417916900571112e-05} +{"train_loss": 0.0036535323597490788, "global_step": 29461, "epoch": 247, "lr": 6.417704443418903e-05} +{"train_loss": 0.003763998858630657, "global_step": 29462, "epoch": 247, "lr": 6.417491983483185e-05} +{"train_loss": 0.00400302279740572, "global_step": 29463, "epoch": 247, "lr": 6.41727952076437e-05} +{"train_loss": 0.0031236682552844286, "global_step": 29464, "epoch": 247, "lr": 6.417067055262881e-05} +{"train_loss": 0.0019733626395463943, "global_step": 29465, "epoch": 247, "lr": 6.41685458697913e-05} +{"train_loss": 0.005281900987029076, "global_step": 29466, "epoch": 247, "lr": 6.416642115913538e-05} +{"train_loss": 0.0045622470788657665, "global_step": 29467, "epoch": 247, "lr": 6.41642964206652e-05} +{"train_loss": 0.003571472130715847, "global_step": 29468, "epoch": 247, "lr": 6.416217165438493e-05} +{"train_loss": 0.0040814527310431, "global_step": 29469, "epoch": 247, "lr": 6.416004686029876e-05} +{"train_loss": 0.0037778920959681273, "global_step": 29470, "epoch": 247, "lr": 6.415792203841085e-05} +{"train_loss": 0.002467133104801178, "global_step": 29471, "epoch": 247, "lr": 6.415579718872536e-05} +{"train_loss": 0.004754026420414448, "global_step": 29472, "epoch": 247, "lr": 6.415367231124648e-05} +{"train_loss": 0.004158549010753632, "global_step": 29473, "epoch": 247, "lr": 6.415154740597838e-05} +{"train_loss": 0.002329644514247775, "global_step": 29474, "epoch": 247, "lr": 6.414942247292523e-05} +{"train_loss": 0.00339217740111053, "global_step": 29475, "epoch": 247, "lr": 6.41472975120912e-05} +{"train_loss": 0.0038902568630874157, "global_step": 29476, "epoch": 247, "lr": 6.414517252348046e-05} +{"train_loss": 0.002167755737900734, "global_step": 29477, "epoch": 247, "lr": 6.414304750709719e-05} +{"train_loss": 0.0024134740233421326, "global_step": 29478, "epoch": 247, "lr": 6.414092246294554e-05} +{"train_loss": 0.0038693202659487724, "global_step": 29479, "epoch": 247, "lr": 6.413879739102971e-05} +{"train_loss": 0.0028775606770068407, "global_step": 29480, "epoch": 247, "lr": 6.413667229135388e-05} +{"train_loss": 0.002757331123575568, "global_step": 29481, "epoch": 247, "lr": 6.413454716392218e-05} +{"train_loss": 0.002764809411019087, "global_step": 29482, "epoch": 247, "lr": 6.413242200873881e-05} +{"train_loss": 0.0027275229804217815, "global_step": 29483, "epoch": 247, "lr": 6.413029682580796e-05} +{"train_loss": 0.0048785340040922165, "global_step": 29484, "epoch": 247, "lr": 6.412817161513376e-05} +{"train_loss": 0.003603550838306546, "global_step": 29485, "epoch": 247, "lr": 6.41260463767204e-05} +{"train_loss": 0.00413668155670166, "global_step": 29486, "epoch": 247, "lr": 6.412392111057208e-05} +{"train_loss": 0.002881658496335149, "global_step": 29487, "epoch": 247, "lr": 6.412179581669293e-05} +{"train_loss": 0.0034382950980216265, "global_step": 29488, "epoch": 247, "lr": 6.411967049508715e-05} +{"train_loss": 0.0043441192246973515, "global_step": 29489, "epoch": 247, "lr": 6.411754514575891e-05} +{"train_loss": 0.003458669874817133, "global_step": 29490, "epoch": 247, "lr": 6.411541976871238e-05} +{"train_loss": 0.0020096362568438053, "global_step": 29491, "epoch": 247, "lr": 6.411329436395171e-05} +{"train_loss": 0.005119768902659416, "global_step": 29492, "epoch": 247, "lr": 6.411116893148112e-05} +{"train_loss": 0.0030862572602927685, "global_step": 29493, "epoch": 247, "lr": 6.410904347130475e-05} +{"train_loss": 0.002290671458467841, "global_step": 29494, "epoch": 247, "lr": 6.410691798342677e-05} +{"train_loss": 0.0029756571166217327, "global_step": 29495, "epoch": 247, "lr": 6.410479246785137e-05} +{"train_loss": 0.0033007259480655193, "global_step": 29496, "epoch": 247, "lr": 6.410266692458272e-05} +{"train_loss": 0.0021646206732839346, "global_step": 29497, "epoch": 247, "lr": 6.410054135362499e-05} +{"train_loss": 0.0030838295351713896, "global_step": 29498, "epoch": 247, "lr": 6.409841575498234e-05} +{"train_loss": 0.003462122054770589, "global_step": 29499, "epoch": 247, "lr": 6.409629012865899e-05} +{"train_loss": 0.003276512725278735, "global_step": 29500, "epoch": 247, "lr": 6.409416447465906e-05} +{"train_loss": 0.003201906569302082, "global_step": 29501, "epoch": 247, "lr": 6.409203879298674e-05} +{"train_loss": 0.0016415814170613885, "global_step": 29502, "epoch": 247, "lr": 6.40899130836462e-05} +{"train_loss": 0.0029152415227144957, "global_step": 29503, "epoch": 247, "lr": 6.408778734664163e-05} +{"train_loss": 0.004587898030877113, "global_step": 29504, "epoch": 247, "lr": 6.40856615819772e-05} +{"train_loss": 0.0031748011242598295, "global_step": 29505, "epoch": 247, "lr": 6.408353578965707e-05} +{"train_loss": 0.0023157938849180937, "global_step": 29506, "epoch": 247, "lr": 6.408140996968542e-05} +{"train_loss": 0.0026461512316018343, "global_step": 29507, "epoch": 247, "lr": 6.407928412206643e-05} +{"train_loss": 0.002547618467360735, "global_step": 29508, "epoch": 247, "lr": 6.407715824680427e-05} +{"train_loss": 0.003135883016511798, "global_step": 29509, "epoch": 247, "lr": 6.407503234390312e-05} +{"train_loss": 0.0024152658879756927, "global_step": 29510, "epoch": 247, "lr": 6.407290641336714e-05} +{"train_loss": 0.003127241413257703, "global_step": 29511, "epoch": 247, "lr": 6.407078045520052e-05, "val_loss": 0.023314762860536575} +{"train_loss": 0.0022339753340929747, "global_step": 29512, "epoch": 248, "lr": 6.406865446940742e-05} +{"train_loss": 0.005038739647716284, "global_step": 29513, "epoch": 248, "lr": 6.406652845599203e-05} +{"train_loss": 0.003792119212448597, "global_step": 29514, "epoch": 248, "lr": 6.406440241495851e-05} +{"train_loss": 0.0018227032851427794, "global_step": 29515, "epoch": 248, "lr": 6.406227634631103e-05} +{"train_loss": 0.0033646286465227604, "global_step": 29516, "epoch": 248, "lr": 6.406015025005377e-05} +{"train_loss": 0.00324234482832253, "global_step": 29517, "epoch": 248, "lr": 6.40580241261909e-05} +{"train_loss": 0.0027923223096877337, "global_step": 29518, "epoch": 248, "lr": 6.405589797472664e-05} +{"train_loss": 0.002154187299311161, "global_step": 29519, "epoch": 248, "lr": 6.405377179566509e-05} +{"train_loss": 0.004232991486787796, "global_step": 29520, "epoch": 248, "lr": 6.405164558901047e-05} +{"train_loss": 0.0021824012510478497, "global_step": 29521, "epoch": 248, "lr": 6.404951935476694e-05} +{"train_loss": 0.005158738698810339, "global_step": 29522, "epoch": 248, "lr": 6.404739309293868e-05} +{"train_loss": 0.0015653145965188742, "global_step": 29523, "epoch": 248, "lr": 6.404526680352987e-05} +{"train_loss": 0.0028505928348749876, "global_step": 29524, "epoch": 248, "lr": 6.404314048654469e-05} +{"train_loss": 0.003343046410009265, "global_step": 29525, "epoch": 248, "lr": 6.404101414198728e-05} +{"train_loss": 0.0022839789744466543, "global_step": 29526, "epoch": 248, "lr": 6.403888776986185e-05} +{"train_loss": 0.0033969043288379908, "global_step": 29527, "epoch": 248, "lr": 6.403676137017256e-05} +{"train_loss": 0.002339185681194067, "global_step": 29528, "epoch": 248, "lr": 6.403463494292361e-05} +{"train_loss": 0.0032216119579970837, "global_step": 29529, "epoch": 248, "lr": 6.403250848811912e-05} +{"train_loss": 0.004365224856883287, "global_step": 29530, "epoch": 248, "lr": 6.403038200576332e-05} +{"train_loss": 0.004061887040734291, "global_step": 29531, "epoch": 248, "lr": 6.402825549586038e-05} +{"train_loss": 0.001649087411351502, "global_step": 29532, "epoch": 248, "lr": 6.402612895841444e-05} +{"train_loss": 0.0035850023850798607, "global_step": 29533, "epoch": 248, "lr": 6.402400239342969e-05} +{"train_loss": 0.002135704504325986, "global_step": 29534, "epoch": 248, "lr": 6.402187580091031e-05} +{"train_loss": 0.003925277851521969, "global_step": 29535, "epoch": 248, "lr": 6.401974918086048e-05} +{"train_loss": 0.0051882765255868435, "global_step": 29536, "epoch": 248, "lr": 6.401762253328436e-05} +{"train_loss": 0.003036605892702937, "global_step": 29537, "epoch": 248, "lr": 6.401549585818615e-05} +{"train_loss": 0.002872439566999674, "global_step": 29538, "epoch": 248, "lr": 6.401336915557e-05} +{"train_loss": 0.003449074225500226, "global_step": 29539, "epoch": 248, "lr": 6.40112424254401e-05} +{"train_loss": 0.004364167805761099, "global_step": 29540, "epoch": 248, "lr": 6.400911566780062e-05} +{"train_loss": 0.0030695083551108837, "global_step": 29541, "epoch": 248, "lr": 6.400698888265574e-05} +{"train_loss": 0.0030299373902380466, "global_step": 29542, "epoch": 248, "lr": 6.400486207000964e-05} +{"train_loss": 0.0016938878688961267, "global_step": 29543, "epoch": 248, "lr": 6.40027352298665e-05} +{"train_loss": 0.002703792881220579, "global_step": 29544, "epoch": 248, "lr": 6.400060836223048e-05} +{"train_loss": 0.0035739887971431017, "global_step": 29545, "epoch": 248, "lr": 6.399848146710575e-05} +{"train_loss": 0.0031624799594283104, "global_step": 29546, "epoch": 248, "lr": 6.399635454449648e-05} +{"train_loss": 0.002986072562634945, "global_step": 29547, "epoch": 248, "lr": 6.39942275944069e-05} +{"train_loss": 0.004907235503196716, "global_step": 29548, "epoch": 248, "lr": 6.399210061684112e-05} +{"train_loss": 0.003216293640434742, "global_step": 29549, "epoch": 248, "lr": 6.398997361180336e-05} +{"train_loss": 0.00198915833607316, "global_step": 29550, "epoch": 248, "lr": 6.398784657929779e-05} +{"train_loss": 0.0019194143824279308, "global_step": 29551, "epoch": 248, "lr": 6.398571951932856e-05} +{"train_loss": 0.002844663802534342, "global_step": 29552, "epoch": 248, "lr": 6.398359243189987e-05} +{"train_loss": 0.002740981988608837, "global_step": 29553, "epoch": 248, "lr": 6.398146531701589e-05} +{"train_loss": 0.0035281411837786436, "global_step": 29554, "epoch": 248, "lr": 6.39793381746808e-05} +{"train_loss": 0.003598262323066592, "global_step": 29555, "epoch": 248, "lr": 6.397721100489876e-05} +{"train_loss": 0.003752379212528467, "global_step": 29556, "epoch": 248, "lr": 6.397508380767397e-05} +{"train_loss": 0.00347930402494967, "global_step": 29557, "epoch": 248, "lr": 6.397295658301059e-05} +{"train_loss": 0.0038447792176157236, "global_step": 29558, "epoch": 248, "lr": 6.397082933091281e-05} +{"train_loss": 0.0034783410374075174, "global_step": 29559, "epoch": 248, "lr": 6.39687020513848e-05} +{"train_loss": 0.004601390101015568, "global_step": 29560, "epoch": 248, "lr": 6.396657474443074e-05} +{"train_loss": 0.0038366897497326136, "global_step": 29561, "epoch": 248, "lr": 6.396444741005478e-05} +{"train_loss": 0.003071755636483431, "global_step": 29562, "epoch": 248, "lr": 6.396232004826115e-05} +{"train_loss": 0.001957473112270236, "global_step": 29563, "epoch": 248, "lr": 6.396019265905397e-05} +{"train_loss": 0.002653873059898615, "global_step": 29564, "epoch": 248, "lr": 6.395806524243746e-05} +{"train_loss": 0.0020587134640663862, "global_step": 29565, "epoch": 248, "lr": 6.395593779841578e-05} +{"train_loss": 0.004062889143824577, "global_step": 29566, "epoch": 248, "lr": 6.39538103269931e-05} +{"train_loss": 0.0030621723271906376, "global_step": 29567, "epoch": 248, "lr": 6.39516828281736e-05} +{"train_loss": 0.004322705324739218, "global_step": 29568, "epoch": 248, "lr": 6.394955530196147e-05} +{"train_loss": 0.002140811877325177, "global_step": 29569, "epoch": 248, "lr": 6.394742774836088e-05} +{"train_loss": 0.0020283767953515053, "global_step": 29570, "epoch": 248, "lr": 6.394530016737599e-05} +{"train_loss": 0.003868134692311287, "global_step": 29571, "epoch": 248, "lr": 6.3943172559011e-05} +{"train_loss": 0.001964591210708022, "global_step": 29572, "epoch": 248, "lr": 6.394104492327009e-05} +{"train_loss": 0.0035065473057329655, "global_step": 29573, "epoch": 248, "lr": 6.393891726015742e-05} +{"train_loss": 0.0026833724696189165, "global_step": 29574, "epoch": 248, "lr": 6.393678956967718e-05} +{"train_loss": 0.002574312034994364, "global_step": 29575, "epoch": 248, "lr": 6.393466185183354e-05} +{"train_loss": 0.003656010376289487, "global_step": 29576, "epoch": 248, "lr": 6.393253410663068e-05} +{"train_loss": 0.0028701594565063715, "global_step": 29577, "epoch": 248, "lr": 6.393040633407277e-05} +{"train_loss": 0.003018326824530959, "global_step": 29578, "epoch": 248, "lr": 6.392827853416401e-05} +{"train_loss": 0.0015490561490878463, "global_step": 29579, "epoch": 248, "lr": 6.392615070690855e-05} +{"train_loss": 0.002851220779120922, "global_step": 29580, "epoch": 248, "lr": 6.392402285231059e-05} +{"train_loss": 0.004146158695220947, "global_step": 29581, "epoch": 248, "lr": 6.392189497037431e-05} +{"train_loss": 0.002823438262566924, "global_step": 29582, "epoch": 248, "lr": 6.391976706110385e-05} +{"train_loss": 0.0032860676292330027, "global_step": 29583, "epoch": 248, "lr": 6.391763912450343e-05} +{"train_loss": 0.0029598104301840067, "global_step": 29584, "epoch": 248, "lr": 6.391551116057722e-05} +{"train_loss": 0.00310071581043303, "global_step": 29585, "epoch": 248, "lr": 6.391338316932936e-05} +{"train_loss": 0.003491882933303714, "global_step": 29586, "epoch": 248, "lr": 6.391125515076409e-05} +{"train_loss": 0.0034379614517092705, "global_step": 29587, "epoch": 248, "lr": 6.390912710488554e-05} +{"train_loss": 0.0035709389485418797, "global_step": 29588, "epoch": 248, "lr": 6.39069990316979e-05} +{"train_loss": 0.002929970156401396, "global_step": 29589, "epoch": 248, "lr": 6.390487093120536e-05} +{"train_loss": 0.0027729689609259367, "global_step": 29590, "epoch": 248, "lr": 6.390274280341211e-05} +{"train_loss": 0.003364835400134325, "global_step": 29591, "epoch": 248, "lr": 6.390061464832229e-05} +{"train_loss": 0.002819199813529849, "global_step": 29592, "epoch": 248, "lr": 6.38984864659401e-05} +{"train_loss": 0.0023501862306147814, "global_step": 29593, "epoch": 248, "lr": 6.389635825626973e-05} +{"train_loss": 0.003688390599563718, "global_step": 29594, "epoch": 248, "lr": 6.389423001931533e-05} +{"train_loss": 0.004637322388589382, "global_step": 29595, "epoch": 248, "lr": 6.389210175508109e-05} +{"train_loss": 0.003004960250109434, "global_step": 29596, "epoch": 248, "lr": 6.388997346357121e-05} +{"train_loss": 0.0024461359716951847, "global_step": 29597, "epoch": 248, "lr": 6.388784514478984e-05} +{"train_loss": 0.001968205440789461, "global_step": 29598, "epoch": 248, "lr": 6.388571679874116e-05} +{"train_loss": 0.0034381630830466747, "global_step": 29599, "epoch": 248, "lr": 6.388358842542939e-05} +{"train_loss": 0.0018260418437421322, "global_step": 29600, "epoch": 248, "lr": 6.388146002485865e-05} +{"train_loss": 0.0044220793060958385, "global_step": 29601, "epoch": 248, "lr": 6.387933159703316e-05} +{"train_loss": 0.0038032904267311096, "global_step": 29602, "epoch": 248, "lr": 6.387720314195707e-05} +{"train_loss": 0.0032427881378680468, "global_step": 29603, "epoch": 248, "lr": 6.387507465963457e-05} +{"train_loss": 0.0039921351708471775, "global_step": 29604, "epoch": 248, "lr": 6.387294615006987e-05} +{"train_loss": 0.004235021770000458, "global_step": 29605, "epoch": 248, "lr": 6.38708176132671e-05} +{"train_loss": 0.005257905926555395, "global_step": 29606, "epoch": 248, "lr": 6.386868904923047e-05} +{"train_loss": 0.003709932090714574, "global_step": 29607, "epoch": 248, "lr": 6.386656045796415e-05} +{"train_loss": 0.003741292981430888, "global_step": 29608, "epoch": 248, "lr": 6.386443183947231e-05} +{"train_loss": 0.002436180366203189, "global_step": 29609, "epoch": 248, "lr": 6.386230319375915e-05} +{"train_loss": 0.0038583092391490936, "global_step": 29610, "epoch": 248, "lr": 6.386017452082885e-05} +{"train_loss": 0.004052299540489912, "global_step": 29611, "epoch": 248, "lr": 6.385804582068557e-05} +{"train_loss": 0.0028761415742337704, "global_step": 29612, "epoch": 248, "lr": 6.385591709333349e-05} +{"train_loss": 0.004026171751320362, "global_step": 29613, "epoch": 248, "lr": 6.38537883387768e-05} +{"train_loss": 0.0032583961728960276, "global_step": 29614, "epoch": 248, "lr": 6.385165955701969e-05} +{"train_loss": 0.002914703916758299, "global_step": 29615, "epoch": 248, "lr": 6.38495307480663e-05} +{"train_loss": 0.0034096743911504745, "global_step": 29616, "epoch": 248, "lr": 6.384740191192085e-05} +{"train_loss": 0.002935377648100257, "global_step": 29617, "epoch": 248, "lr": 6.384527304858751e-05} +{"train_loss": 0.0034674934577196836, "global_step": 29618, "epoch": 248, "lr": 6.384314415807046e-05} +{"train_loss": 0.002046317793428898, "global_step": 29619, "epoch": 248, "lr": 6.384101524037385e-05} +{"train_loss": 0.004479214549064636, "global_step": 29620, "epoch": 248, "lr": 6.38388862955019e-05} +{"train_loss": 0.004306655377149582, "global_step": 29621, "epoch": 248, "lr": 6.383675732345878e-05} +{"train_loss": 0.0038002110086381435, "global_step": 29622, "epoch": 248, "lr": 6.383462832424865e-05} +{"train_loss": 0.004895067773759365, "global_step": 29623, "epoch": 248, "lr": 6.383249929787573e-05} +{"train_loss": 0.003220899263396859, "global_step": 29624, "epoch": 248, "lr": 6.383037024434417e-05} +{"train_loss": 0.004419115372002125, "global_step": 29625, "epoch": 248, "lr": 6.382824116365815e-05} +{"train_loss": 0.0032684234902262688, "global_step": 29626, "epoch": 248, "lr": 6.382611205582185e-05} +{"train_loss": 0.003243088023737073, "global_step": 29627, "epoch": 248, "lr": 6.382398292083946e-05} +{"train_loss": 0.003811286762356758, "global_step": 29628, "epoch": 248, "lr": 6.382185375871516e-05} +{"train_loss": 0.004503844305872917, "global_step": 29629, "epoch": 248, "lr": 6.381972456945312e-05} +{"train_loss": 0.003262576390793469, "global_step": 29630, "epoch": 248, "lr": 6.381759535305752e-05, "val_loss": 0.023340964689850807} +{"train_loss": 0.003454804653301835, "global_step": 29631, "epoch": 249, "lr": 6.381546610953257e-05} +{"train_loss": 0.0020977933891117573, "global_step": 29632, "epoch": 249, "lr": 6.381333683888242e-05} +{"train_loss": 0.004407715983688831, "global_step": 29633, "epoch": 249, "lr": 6.381120754111125e-05} +{"train_loss": 0.004396624397486448, "global_step": 29634, "epoch": 249, "lr": 6.380907821622326e-05} +{"train_loss": 0.0033003061544150114, "global_step": 29635, "epoch": 249, "lr": 6.380694886422262e-05} +{"train_loss": 0.0027572924736887217, "global_step": 29636, "epoch": 249, "lr": 6.38048194851135e-05} +{"train_loss": 0.0026623508892953396, "global_step": 29637, "epoch": 249, "lr": 6.38026900789001e-05} +{"train_loss": 0.0026000121142715216, "global_step": 29638, "epoch": 249, "lr": 6.380056064558659e-05} +{"train_loss": 0.002847270807251334, "global_step": 29639, "epoch": 249, "lr": 6.379843118517714e-05} +{"train_loss": 0.002216682769358158, "global_step": 29640, "epoch": 249, "lr": 6.379630169767597e-05} +{"train_loss": 0.003942875657230616, "global_step": 29641, "epoch": 249, "lr": 6.379417218308723e-05} +{"train_loss": 0.002758986782282591, "global_step": 29642, "epoch": 249, "lr": 6.37920426414151e-05} +{"train_loss": 0.004552590195089579, "global_step": 29643, "epoch": 249, "lr": 6.378991307266376e-05} +{"train_loss": 0.0037820436991751194, "global_step": 29644, "epoch": 249, "lr": 6.378778347683742e-05} +{"train_loss": 0.002476286143064499, "global_step": 29645, "epoch": 249, "lr": 6.378565385394022e-05} +{"train_loss": 0.0025637682992964983, "global_step": 29646, "epoch": 249, "lr": 6.378352420397638e-05} +{"train_loss": 0.0019058417528867722, "global_step": 29647, "epoch": 249, "lr": 6.378139452695004e-05} +{"train_loss": 0.002548999385908246, "global_step": 29648, "epoch": 249, "lr": 6.377926482286542e-05} +{"train_loss": 0.003465681802481413, "global_step": 29649, "epoch": 249, "lr": 6.377713509172667e-05} +{"train_loss": 0.004984450526535511, "global_step": 29650, "epoch": 249, "lr": 6.377500533353802e-05} +{"train_loss": 0.004155738279223442, "global_step": 29651, "epoch": 249, "lr": 6.377287554830359e-05} +{"train_loss": 0.002594775054603815, "global_step": 29652, "epoch": 249, "lr": 6.37707457360276e-05} +{"train_loss": 0.0014478309312835336, "global_step": 29653, "epoch": 249, "lr": 6.376861589671421e-05} +{"train_loss": 0.005582405719906092, "global_step": 29654, "epoch": 249, "lr": 6.376648603036762e-05} +{"train_loss": 0.0031514849979430437, "global_step": 29655, "epoch": 249, "lr": 6.376435613699202e-05} +{"train_loss": 0.0038384017534554005, "global_step": 29656, "epoch": 249, "lr": 6.376222621659156e-05} +{"train_loss": 0.004291611257940531, "global_step": 29657, "epoch": 249, "lr": 6.376009626917045e-05} +{"train_loss": 0.003411194309592247, "global_step": 29658, "epoch": 249, "lr": 6.375796629473285e-05} +{"train_loss": 0.004378362093120813, "global_step": 29659, "epoch": 249, "lr": 6.375583629328296e-05} +{"train_loss": 0.005144006572663784, "global_step": 29660, "epoch": 249, "lr": 6.375370626482495e-05} +{"train_loss": 0.0023505957797169685, "global_step": 29661, "epoch": 249, "lr": 6.375157620936301e-05} +{"train_loss": 0.0033889133483171463, "global_step": 29662, "epoch": 249, "lr": 6.374944612690133e-05} +{"train_loss": 0.005261362995952368, "global_step": 29663, "epoch": 249, "lr": 6.374731601744406e-05} +{"train_loss": 0.0034493606071919203, "global_step": 29664, "epoch": 249, "lr": 6.374518588099543e-05} +{"train_loss": 0.004972741939127445, "global_step": 29665, "epoch": 249, "lr": 6.374305571755957e-05} +{"train_loss": 0.004378179088234901, "global_step": 29666, "epoch": 249, "lr": 6.374092552714071e-05} +{"train_loss": 0.0037385195028036833, "global_step": 29667, "epoch": 249, "lr": 6.3738795309743e-05} +{"train_loss": 0.0030192395206540823, "global_step": 29668, "epoch": 249, "lr": 6.373666506537063e-05} +{"train_loss": 0.002749438164755702, "global_step": 29669, "epoch": 249, "lr": 6.373453479402778e-05} +{"train_loss": 0.0020050914026796818, "global_step": 29670, "epoch": 249, "lr": 6.373240449571865e-05} +{"train_loss": 0.002681298414245248, "global_step": 29671, "epoch": 249, "lr": 6.373027417044741e-05} +{"train_loss": 0.0031994220335036516, "global_step": 29672, "epoch": 249, "lr": 6.372814381821825e-05} +{"train_loss": 0.0029481586534529924, "global_step": 29673, "epoch": 249, "lr": 6.372601343903533e-05} +{"train_loss": 0.0033284504897892475, "global_step": 29674, "epoch": 249, "lr": 6.372388303290285e-05} +{"train_loss": 0.003421430941671133, "global_step": 29675, "epoch": 249, "lr": 6.372175259982501e-05} +{"train_loss": 0.0046198065392673016, "global_step": 29676, "epoch": 249, "lr": 6.371962213980597e-05} +{"train_loss": 0.0037203184328973293, "global_step": 29677, "epoch": 249, "lr": 6.37174916528499e-05} +{"train_loss": 0.0017479229718446732, "global_step": 29678, "epoch": 249, "lr": 6.371536113896102e-05} +{"train_loss": 0.0021771087776869535, "global_step": 29679, "epoch": 249, "lr": 6.371323059814349e-05} +{"train_loss": 0.00595272658392787, "global_step": 29680, "epoch": 249, "lr": 6.371110003040148e-05} +{"train_loss": 0.004229706712067127, "global_step": 29681, "epoch": 249, "lr": 6.370896943573922e-05} +{"train_loss": 0.0033267000690102577, "global_step": 29682, "epoch": 249, "lr": 6.370683881416085e-05} +{"train_loss": 0.001775604672729969, "global_step": 29683, "epoch": 249, "lr": 6.370470816567055e-05} +{"train_loss": 0.004821548704057932, "global_step": 29684, "epoch": 249, "lr": 6.370257749027253e-05} +{"train_loss": 0.0034468781668692827, "global_step": 29685, "epoch": 249, "lr": 6.370044678797096e-05} +{"train_loss": 0.003130947472527623, "global_step": 29686, "epoch": 249, "lr": 6.369831605877003e-05} +{"train_loss": 0.0013780355220660567, "global_step": 29687, "epoch": 249, "lr": 6.369618530267393e-05} +{"train_loss": 0.003644554642960429, "global_step": 29688, "epoch": 249, "lr": 6.369405451968682e-05} +{"train_loss": 0.0026412303559482098, "global_step": 29689, "epoch": 249, "lr": 6.36919237098129e-05} +{"train_loss": 0.0028987617697566748, "global_step": 29690, "epoch": 249, "lr": 6.368979287305635e-05} +{"train_loss": 0.0022220753598958254, "global_step": 29691, "epoch": 249, "lr": 6.368766200942135e-05} +{"train_loss": 0.0030960354488343, "global_step": 29692, "epoch": 249, "lr": 6.36855311189121e-05} +{"train_loss": 0.0033205938525497913, "global_step": 29693, "epoch": 249, "lr": 6.368340020153278e-05} +{"train_loss": 0.002433603396639228, "global_step": 29694, "epoch": 249, "lr": 6.368126925728754e-05} +{"train_loss": 0.003198016667738557, "global_step": 29695, "epoch": 249, "lr": 6.36791382861806e-05} +{"train_loss": 0.0024918164126574993, "global_step": 29696, "epoch": 249, "lr": 6.367700728821614e-05} +{"train_loss": 0.0030490413773804903, "global_step": 29697, "epoch": 249, "lr": 6.367487626339834e-05} +{"train_loss": 0.0020956944208592176, "global_step": 29698, "epoch": 249, "lr": 6.367274521173136e-05} +{"train_loss": 0.0030065802857279778, "global_step": 29699, "epoch": 249, "lr": 6.367061413321942e-05} +{"train_loss": 0.0013997525675222278, "global_step": 29700, "epoch": 249, "lr": 6.36684830278667e-05} +{"train_loss": 0.002831951482221484, "global_step": 29701, "epoch": 249, "lr": 6.366635189567736e-05} +{"train_loss": 0.002739244606345892, "global_step": 29702, "epoch": 249, "lr": 6.36642207366556e-05} +{"train_loss": 0.002335124649107456, "global_step": 29703, "epoch": 249, "lr": 6.366208955080559e-05} +{"train_loss": 0.0021132545080035925, "global_step": 29704, "epoch": 249, "lr": 6.365995833813154e-05} +{"train_loss": 0.0021608294919133186, "global_step": 29705, "epoch": 249, "lr": 6.365782709863762e-05} +{"train_loss": 0.0032107250299304724, "global_step": 29706, "epoch": 249, "lr": 6.365569583232802e-05} +{"train_loss": 0.004114025738090277, "global_step": 29707, "epoch": 249, "lr": 6.365356453920692e-05} +{"train_loss": 0.0032858499325811863, "global_step": 29708, "epoch": 249, "lr": 6.36514332192785e-05} +{"train_loss": 0.0035857672337442636, "global_step": 29709, "epoch": 249, "lr": 6.364930187254695e-05} +{"train_loss": 0.002766116987913847, "global_step": 29710, "epoch": 249, "lr": 6.364717049901644e-05} +{"train_loss": 0.0029642449226230383, "global_step": 29711, "epoch": 249, "lr": 6.36450390986912e-05} +{"train_loss": 0.004422209225594997, "global_step": 29712, "epoch": 249, "lr": 6.364290767157536e-05} +{"train_loss": 0.0023201736621558666, "global_step": 29713, "epoch": 249, "lr": 6.364077621767315e-05} +{"train_loss": 0.0032647056505084038, "global_step": 29714, "epoch": 249, "lr": 6.363864473698871e-05} +{"train_loss": 0.002216215245425701, "global_step": 29715, "epoch": 249, "lr": 6.363651322952625e-05} +{"train_loss": 0.00173672114033252, "global_step": 29716, "epoch": 249, "lr": 6.363438169528995e-05} +{"train_loss": 0.0044088116846978664, "global_step": 29717, "epoch": 249, "lr": 6.363225013428402e-05} +{"train_loss": 0.0024586981162428856, "global_step": 29718, "epoch": 249, "lr": 6.363011854651261e-05} +{"train_loss": 0.003671988844871521, "global_step": 29719, "epoch": 249, "lr": 6.362798693197991e-05} +{"train_loss": 0.0026385204400867224, "global_step": 29720, "epoch": 249, "lr": 6.362585529069013e-05} +{"train_loss": 0.001988599542528391, "global_step": 29721, "epoch": 249, "lr": 6.362372362264742e-05} +{"train_loss": 0.0016312227817252278, "global_step": 29722, "epoch": 249, "lr": 6.3621591927856e-05} +{"train_loss": 0.0038466625846922398, "global_step": 29723, "epoch": 249, "lr": 6.361946020632003e-05} +{"train_loss": 0.0026863543316721916, "global_step": 29724, "epoch": 249, "lr": 6.36173284580437e-05} +{"train_loss": 0.0016210074536502361, "global_step": 29725, "epoch": 249, "lr": 6.361519668303124e-05} +{"train_loss": 0.0016862815245985985, "global_step": 29726, "epoch": 249, "lr": 6.361306488128676e-05} +{"train_loss": 0.005429829470813274, "global_step": 29727, "epoch": 249, "lr": 6.361093305281449e-05} +{"train_loss": 0.0038019835483282804, "global_step": 29728, "epoch": 249, "lr": 6.360880119761859e-05} +{"train_loss": 0.0036693322472274303, "global_step": 29729, "epoch": 249, "lr": 6.360666931570328e-05} +{"train_loss": 0.0032512920442968607, "global_step": 29730, "epoch": 249, "lr": 6.360453740707272e-05} +{"train_loss": 0.0023543271236121655, "global_step": 29731, "epoch": 249, "lr": 6.360240547173113e-05} +{"train_loss": 0.0021324933040887117, "global_step": 29732, "epoch": 249, "lr": 6.360027350968265e-05} +{"train_loss": 0.0033936991821974516, "global_step": 29733, "epoch": 249, "lr": 6.359814152093149e-05} +{"train_loss": 0.0032387482933700085, "global_step": 29734, "epoch": 249, "lr": 6.359600950548183e-05} +{"train_loss": 0.0016549935098737478, "global_step": 29735, "epoch": 249, "lr": 6.359387746333784e-05} +{"train_loss": 0.0033978577703237534, "global_step": 29736, "epoch": 249, "lr": 6.359174539450374e-05} +{"train_loss": 0.0027120434679090977, "global_step": 29737, "epoch": 249, "lr": 6.358961329898369e-05} +{"train_loss": 0.0014723733766004443, "global_step": 29738, "epoch": 249, "lr": 6.35874811767819e-05} +{"train_loss": 0.004005459602922201, "global_step": 29739, "epoch": 249, "lr": 6.358534902790254e-05} +{"train_loss": 0.0029627291951328516, "global_step": 29740, "epoch": 249, "lr": 6.35832168523498e-05} +{"train_loss": 0.00342151103541255, "global_step": 29741, "epoch": 249, "lr": 6.358108465012786e-05} +{"train_loss": 0.002078418852761388, "global_step": 29742, "epoch": 249, "lr": 6.357895242124091e-05} +{"train_loss": 0.002007410628721118, "global_step": 29743, "epoch": 249, "lr": 6.357682016569313e-05} +{"train_loss": 0.003169175935909152, "global_step": 29744, "epoch": 249, "lr": 6.357468788348875e-05} +{"train_loss": 0.003235691459849477, "global_step": 29745, "epoch": 249, "lr": 6.35725555746319e-05} +{"train_loss": 0.0027250084094703197, "global_step": 29746, "epoch": 249, "lr": 6.357042323912676e-05} +{"train_loss": 0.003749767318367958, "global_step": 29747, "epoch": 249, "lr": 6.356829087697757e-05} +{"train_loss": 0.0021892159711569548, "global_step": 29748, "epoch": 249, "lr": 6.356615848818848e-05} +{"train_loss": 0.0031080237362815554, "global_step": 29749, "epoch": 249, "lr": 6.35640260727637e-05, "val_loss": 0.01882261037826538} +{"train_loss": 0.002330714138224721, "global_step": 29750, "epoch": 250, "lr": 6.356189363070742e-05} +{"train_loss": 0.003151825163513422, "global_step": 29751, "epoch": 250, "lr": 6.355976116202378e-05} +{"train_loss": 0.0016153125325217843, "global_step": 29752, "epoch": 250, "lr": 6.355762866671699e-05} +{"train_loss": 0.0015614059520885348, "global_step": 29753, "epoch": 250, "lr": 6.355549614479126e-05} +{"train_loss": 0.004514375701546669, "global_step": 29754, "epoch": 250, "lr": 6.355336359625076e-05} +{"train_loss": 0.0037174748722463846, "global_step": 29755, "epoch": 250, "lr": 6.355123102109967e-05} +{"train_loss": 0.0036544334143400192, "global_step": 29756, "epoch": 250, "lr": 6.354909841934221e-05} +{"train_loss": 0.002775428583845496, "global_step": 29757, "epoch": 250, "lr": 6.354696579098254e-05} +{"train_loss": 0.002229045843705535, "global_step": 29758, "epoch": 250, "lr": 6.354483313602482e-05} +{"train_loss": 0.0029460908845067024, "global_step": 29759, "epoch": 250, "lr": 6.354270045447331e-05} +{"train_loss": 0.002336092758923769, "global_step": 29760, "epoch": 250, "lr": 6.354056774633212e-05} +{"train_loss": 0.003716148901730776, "global_step": 29761, "epoch": 250, "lr": 6.353843501160547e-05} +{"train_loss": 0.003069979138672352, "global_step": 29762, "epoch": 250, "lr": 6.353630225029758e-05} +{"train_loss": 0.0020443520043045282, "global_step": 29763, "epoch": 250, "lr": 6.353416946241259e-05} +{"train_loss": 0.0029329166281968355, "global_step": 29764, "epoch": 250, "lr": 6.353203664795469e-05} +{"train_loss": 0.004531230311840773, "global_step": 29765, "epoch": 250, "lr": 6.35299038069281e-05} +{"train_loss": 0.0037855873815715313, "global_step": 29766, "epoch": 250, "lr": 6.352777093933699e-05} +{"train_loss": 0.0021453802473843098, "global_step": 29767, "epoch": 250, "lr": 6.352563804518553e-05} +{"train_loss": 0.0019226375734433532, "global_step": 29768, "epoch": 250, "lr": 6.352350512447794e-05} +{"train_loss": 0.004431064706295729, "global_step": 29769, "epoch": 250, "lr": 6.352137217721838e-05} +{"train_loss": 0.0041183242574334145, "global_step": 29770, "epoch": 250, "lr": 6.351923920341105e-05} +{"train_loss": 0.002957734512165189, "global_step": 29771, "epoch": 250, "lr": 6.351710620306015e-05} +{"train_loss": 0.0018128054216504097, "global_step": 29772, "epoch": 250, "lr": 6.351497317616986e-05} +{"train_loss": 0.0022277995012700558, "global_step": 29773, "epoch": 250, "lr": 6.351284012274435e-05} +{"train_loss": 0.0029500245582312346, "global_step": 29774, "epoch": 250, "lr": 6.351070704278782e-05} +{"train_loss": 0.002635116223245859, "global_step": 29775, "epoch": 250, "lr": 6.350857393630448e-05} +{"train_loss": 0.00204267306253314, "global_step": 29776, "epoch": 250, "lr": 6.350644080329848e-05} +{"train_loss": 0.0032628988847136497, "global_step": 29777, "epoch": 250, "lr": 6.350430764377404e-05} +{"train_loss": 0.002337133511900902, "global_step": 29778, "epoch": 250, "lr": 6.350217445773532e-05} +{"train_loss": 0.0022333883680403233, "global_step": 29779, "epoch": 250, "lr": 6.350004124518653e-05} +{"train_loss": 0.0013049660483375192, "global_step": 29780, "epoch": 250, "lr": 6.349790800613185e-05} +{"train_loss": 0.0033362829126417637, "global_step": 29781, "epoch": 250, "lr": 6.349577474057549e-05} +{"train_loss": 0.00378849683329463, "global_step": 29782, "epoch": 250, "lr": 6.349364144852159e-05} +{"train_loss": 0.0017532657366245985, "global_step": 29783, "epoch": 250, "lr": 6.349150812997437e-05} +{"train_loss": 0.0032196452375501394, "global_step": 29784, "epoch": 250, "lr": 6.348937478493803e-05} +{"train_loss": 0.0019123062957078218, "global_step": 29785, "epoch": 250, "lr": 6.348724141341673e-05} +{"train_loss": 0.0021606669761240482, "global_step": 29786, "epoch": 250, "lr": 6.348510801541468e-05} +{"train_loss": 0.0035890149883925915, "global_step": 29787, "epoch": 250, "lr": 6.348297459093606e-05} +{"train_loss": 0.0028570680879056454, "global_step": 29788, "epoch": 250, "lr": 6.348084113998507e-05} +{"train_loss": 0.002727714367210865, "global_step": 29789, "epoch": 250, "lr": 6.347870766256587e-05} +{"train_loss": 0.0034994978923350573, "global_step": 29790, "epoch": 250, "lr": 6.347657415868266e-05} +{"train_loss": 0.0029043566901236773, "global_step": 29791, "epoch": 250, "lr": 6.347444062833965e-05} +{"train_loss": 0.002371886745095253, "global_step": 29792, "epoch": 250, "lr": 6.347230707154101e-05} +{"train_loss": 0.002763864817097783, "global_step": 29793, "epoch": 250, "lr": 6.347017348829095e-05} +{"train_loss": 0.003909269347786903, "global_step": 29794, "epoch": 250, "lr": 6.346803987859364e-05} +{"train_loss": 0.0038326538633555174, "global_step": 29795, "epoch": 250, "lr": 6.346590624245326e-05} +{"train_loss": 0.0036562932655215263, "global_step": 29796, "epoch": 250, "lr": 6.346377257987403e-05} +{"train_loss": 0.0021172072738409042, "global_step": 29797, "epoch": 250, "lr": 6.346163889086009e-05} +{"train_loss": 0.0034964431542903185, "global_step": 29798, "epoch": 250, "lr": 6.345950517541569e-05} +{"train_loss": 0.003455568803474307, "global_step": 29799, "epoch": 250, "lr": 6.345737143354497e-05} +{"train_loss": 0.0038337712176144123, "global_step": 29800, "epoch": 250, "lr": 6.345523766525215e-05} +{"train_loss": 0.002354302676394582, "global_step": 29801, "epoch": 250, "lr": 6.34531038705414e-05} +{"train_loss": 0.004135814495384693, "global_step": 29802, "epoch": 250, "lr": 6.345097004941693e-05} +{"train_loss": 0.0026348652318120003, "global_step": 29803, "epoch": 250, "lr": 6.344883620188292e-05} +{"train_loss": 0.001642253017053008, "global_step": 29804, "epoch": 250, "lr": 6.344670232794354e-05} +{"train_loss": 0.0038471717853099108, "global_step": 29805, "epoch": 250, "lr": 6.3444568427603e-05} +{"train_loss": 0.003748765680938959, "global_step": 29806, "epoch": 250, "lr": 6.344243450086551e-05} +{"train_loss": 0.002715085167437792, "global_step": 29807, "epoch": 250, "lr": 6.344030054773521e-05} +{"train_loss": 0.0028939940966665745, "global_step": 29808, "epoch": 250, "lr": 6.343816656821633e-05} +{"train_loss": 0.0042738779447972775, "global_step": 29809, "epoch": 250, "lr": 6.343603256231303e-05} +{"train_loss": 0.002208733931183815, "global_step": 29810, "epoch": 250, "lr": 6.343389853002953e-05} +{"train_loss": 0.0031766684260219336, "global_step": 29811, "epoch": 250, "lr": 6.343176447136999e-05} +{"train_loss": 0.004845562856644392, "global_step": 29812, "epoch": 250, "lr": 6.342963038633863e-05} +{"train_loss": 0.0030930484645068645, "global_step": 29813, "epoch": 250, "lr": 6.342749627493963e-05} +{"train_loss": 0.004048317205160856, "global_step": 29814, "epoch": 250, "lr": 6.342536213717716e-05} +{"train_loss": 0.0023055977653712034, "global_step": 29815, "epoch": 250, "lr": 6.342322797305544e-05} +{"train_loss": 0.0024444914888590574, "global_step": 29816, "epoch": 250, "lr": 6.342109378257863e-05} +{"train_loss": 0.003139758249744773, "global_step": 29817, "epoch": 250, "lr": 6.341895956575094e-05} +{"train_loss": 0.002440084470435977, "global_step": 29818, "epoch": 250, "lr": 6.341682532257656e-05} +{"train_loss": 0.004437543451786041, "global_step": 29819, "epoch": 250, "lr": 6.341469105305966e-05} +{"train_loss": 0.002883761655539274, "global_step": 29820, "epoch": 250, "lr": 6.341255675720448e-05} +{"train_loss": 0.00230017164722085, "global_step": 29821, "epoch": 250, "lr": 6.341042243501515e-05} +{"train_loss": 0.004338152706623077, "global_step": 29822, "epoch": 250, "lr": 6.34082880864959e-05} +{"train_loss": 0.0031854549888521433, "global_step": 29823, "epoch": 250, "lr": 6.34061537116509e-05} +{"train_loss": 0.0035642951261252165, "global_step": 29824, "epoch": 250, "lr": 6.340401931048437e-05} +{"train_loss": 0.0026956601068377495, "global_step": 29825, "epoch": 250, "lr": 6.340188488300048e-05} +{"train_loss": 0.003080015769228339, "global_step": 29826, "epoch": 250, "lr": 6.33997504292034e-05} +{"train_loss": 0.006750373635441065, "global_step": 29827, "epoch": 250, "lr": 6.339761594909735e-05} +{"train_loss": 0.0033527358900755644, "global_step": 29828, "epoch": 250, "lr": 6.339548144268652e-05} +{"train_loss": 0.0045222267508506775, "global_step": 29829, "epoch": 250, "lr": 6.339334690997508e-05} +{"train_loss": 0.0034757640678435564, "global_step": 29830, "epoch": 250, "lr": 6.339121235096724e-05} +{"train_loss": 0.004889179952442646, "global_step": 29831, "epoch": 250, "lr": 6.338907776566721e-05} +{"train_loss": 0.0026253669057041407, "global_step": 29832, "epoch": 250, "lr": 6.338694315407912e-05} +{"train_loss": 0.004551119636744261, "global_step": 29833, "epoch": 250, "lr": 6.33848085162072e-05} +{"train_loss": 0.006050275173038244, "global_step": 29834, "epoch": 250, "lr": 6.338267385205565e-05} +{"train_loss": 0.004852238576859236, "global_step": 29835, "epoch": 250, "lr": 6.338053916162864e-05} +{"train_loss": 0.0026979169342666864, "global_step": 29836, "epoch": 250, "lr": 6.337840444493038e-05} +{"train_loss": 0.004910377319902182, "global_step": 29837, "epoch": 250, "lr": 6.337626970196505e-05} +{"train_loss": 0.004839202389121056, "global_step": 29838, "epoch": 250, "lr": 6.337413493273685e-05} +{"train_loss": 0.002907827030867338, "global_step": 29839, "epoch": 250, "lr": 6.337200013724996e-05} +{"train_loss": 0.0023756937589496374, "global_step": 29840, "epoch": 250, "lr": 6.336986531550857e-05} +{"train_loss": 0.0037415330298244953, "global_step": 29841, "epoch": 250, "lr": 6.336773046751688e-05} +{"train_loss": 0.0033020481932908297, "global_step": 29842, "epoch": 250, "lr": 6.336559559327908e-05} +{"train_loss": 0.0032225006725639105, "global_step": 29843, "epoch": 250, "lr": 6.336346069279938e-05} +{"train_loss": 0.0025354602839797735, "global_step": 29844, "epoch": 250, "lr": 6.336132576608194e-05} +{"train_loss": 0.004837817512452602, "global_step": 29845, "epoch": 250, "lr": 6.335919081313095e-05} +{"train_loss": 0.003951222635805607, "global_step": 29846, "epoch": 250, "lr": 6.335705583395063e-05} +{"train_loss": 0.0016002397751435637, "global_step": 29847, "epoch": 250, "lr": 6.335492082854515e-05} +{"train_loss": 0.0041031865403056145, "global_step": 29848, "epoch": 250, "lr": 6.335278579691872e-05} +{"train_loss": 0.001983985770493746, "global_step": 29849, "epoch": 250, "lr": 6.335065073907551e-05} +{"train_loss": 0.004379271063953638, "global_step": 29850, "epoch": 250, "lr": 6.334851565501972e-05} +{"train_loss": 0.0033659953624010086, "global_step": 29851, "epoch": 250, "lr": 6.334638054475556e-05} +{"train_loss": 0.003839273704215884, "global_step": 29852, "epoch": 250, "lr": 6.33442454082872e-05} +{"train_loss": 0.0017852832097560167, "global_step": 29853, "epoch": 250, "lr": 6.334211024561885e-05} +{"train_loss": 0.004741823300719261, "global_step": 29854, "epoch": 250, "lr": 6.333997505675467e-05} +{"train_loss": 0.004908538423478603, "global_step": 29855, "epoch": 250, "lr": 6.33378398416989e-05} +{"train_loss": 0.0032638844568282366, "global_step": 29856, "epoch": 250, "lr": 6.33357046004557e-05} +{"train_loss": 0.0030428480822592974, "global_step": 29857, "epoch": 250, "lr": 6.333356933302926e-05} +{"train_loss": 0.00483472365885973, "global_step": 29858, "epoch": 250, "lr": 6.333143403942378e-05} +{"train_loss": 0.003589062485843897, "global_step": 29859, "epoch": 250, "lr": 6.332929871964347e-05} +{"train_loss": 0.002586120506748557, "global_step": 29860, "epoch": 250, "lr": 6.332716337369249e-05} +{"train_loss": 0.002755116205662489, "global_step": 29861, "epoch": 250, "lr": 6.332502800157505e-05} +{"train_loss": 0.003045495133846998, "global_step": 29862, "epoch": 250, "lr": 6.332289260329534e-05} +{"train_loss": 0.0019719572737812996, "global_step": 29863, "epoch": 250, "lr": 6.332075717885756e-05} +{"train_loss": 0.002146208193153143, "global_step": 29864, "epoch": 250, "lr": 6.33186217282659e-05} +{"train_loss": 0.00322585622780025, "global_step": 29865, "epoch": 250, "lr": 6.331648625152453e-05} +{"train_loss": 0.005098576657474041, "global_step": 29866, "epoch": 250, "lr": 6.331435074863769e-05} +{"train_loss": 0.0019238066161051393, "global_step": 29867, "epoch": 250, "lr": 6.331221521960952e-05} +{"train_loss": 0.003213378391424272, "global_step": 29868, "epoch": 250, "lr": 6.331007966444425e-05, "val_loss": 0.029063725844025612, "train_action_mse_error": 6.833834777353331e-05} +{"train_loss": 0.004885565023869276, "global_step": 29869, "epoch": 251, "lr": 6.330794408314606e-05} +{"train_loss": 0.002775537082925439, "global_step": 29870, "epoch": 251, "lr": 6.330580847571913e-05} +{"train_loss": 0.004870139062404633, "global_step": 29871, "epoch": 251, "lr": 6.330367284216767e-05} +{"train_loss": 0.0040022931061685085, "global_step": 29872, "epoch": 251, "lr": 6.330153718249588e-05} +{"train_loss": 0.004016700200736523, "global_step": 29873, "epoch": 251, "lr": 6.329940149670794e-05} +{"train_loss": 0.0023702532052993774, "global_step": 29874, "epoch": 251, "lr": 6.329726578480805e-05} +{"train_loss": 0.0035840992350131273, "global_step": 29875, "epoch": 251, "lr": 6.32951300468004e-05} +{"train_loss": 0.0029662137385457754, "global_step": 29876, "epoch": 251, "lr": 6.329299428268917e-05} +{"train_loss": 0.0024316178169101477, "global_step": 29877, "epoch": 251, "lr": 6.329085849247858e-05} +{"train_loss": 0.00478903204202652, "global_step": 29878, "epoch": 251, "lr": 6.32887226761728e-05} +{"train_loss": 0.00400899350643158, "global_step": 29879, "epoch": 251, "lr": 6.328658683377603e-05} +{"train_loss": 0.0024627624079585075, "global_step": 29880, "epoch": 251, "lr": 6.328445096529248e-05} +{"train_loss": 0.002620317740365863, "global_step": 29881, "epoch": 251, "lr": 6.328231507072633e-05} +{"train_loss": 0.003440696746110916, "global_step": 29882, "epoch": 251, "lr": 6.328017915008176e-05} +{"train_loss": 0.003276523668318987, "global_step": 29883, "epoch": 251, "lr": 6.327804320336299e-05} +{"train_loss": 0.005600342992693186, "global_step": 29884, "epoch": 251, "lr": 6.327590723057417e-05} +{"train_loss": 0.00351708778180182, "global_step": 29885, "epoch": 251, "lr": 6.327377123171956e-05} +{"train_loss": 0.004553863313049078, "global_step": 29886, "epoch": 251, "lr": 6.32716352068033e-05} +{"train_loss": 0.005932163912802935, "global_step": 29887, "epoch": 251, "lr": 6.32694991558296e-05} +{"train_loss": 0.004193684086203575, "global_step": 29888, "epoch": 251, "lr": 6.326736307880268e-05} +{"train_loss": 0.004753428045660257, "global_step": 29889, "epoch": 251, "lr": 6.326522697572669e-05} +{"train_loss": 0.004306888673454523, "global_step": 29890, "epoch": 251, "lr": 6.326309084660584e-05} +{"train_loss": 0.0036475176457315683, "global_step": 29891, "epoch": 251, "lr": 6.326095469144434e-05} +{"train_loss": 0.002176491776481271, "global_step": 29892, "epoch": 251, "lr": 6.325881851024638e-05} +{"train_loss": 0.004836163483560085, "global_step": 29893, "epoch": 251, "lr": 6.325668230301612e-05} +{"train_loss": 0.003295702626928687, "global_step": 29894, "epoch": 251, "lr": 6.32545460697578e-05} +{"train_loss": 0.0028600336518138647, "global_step": 29895, "epoch": 251, "lr": 6.32524098104756e-05} +{"train_loss": 0.0030855934601277113, "global_step": 29896, "epoch": 251, "lr": 6.32502735251737e-05} +{"train_loss": 0.003778791055083275, "global_step": 29897, "epoch": 251, "lr": 6.32481372138563e-05} +{"train_loss": 0.004048772156238556, "global_step": 29898, "epoch": 251, "lr": 6.32460008765276e-05} +{"train_loss": 0.0024568652734160423, "global_step": 29899, "epoch": 251, "lr": 6.324386451319179e-05} +{"train_loss": 0.0021575491409748793, "global_step": 29900, "epoch": 251, "lr": 6.324172812385307e-05} +{"train_loss": 0.0038336387369781733, "global_step": 29901, "epoch": 251, "lr": 6.323959170851562e-05} +{"train_loss": 0.002478347858414054, "global_step": 29902, "epoch": 251, "lr": 6.323745526718367e-05} +{"train_loss": 0.00427605677396059, "global_step": 29903, "epoch": 251, "lr": 6.323531879986136e-05} +{"train_loss": 0.0019217671360820532, "global_step": 29904, "epoch": 251, "lr": 6.323318230655295e-05} +{"train_loss": 0.002115816343575716, "global_step": 29905, "epoch": 251, "lr": 6.323104578726258e-05} +{"train_loss": 0.002885087626054883, "global_step": 29906, "epoch": 251, "lr": 6.322890924199447e-05} +{"train_loss": 0.0035360350739210844, "global_step": 29907, "epoch": 251, "lr": 6.322677267075281e-05} +{"train_loss": 0.0019368261564522982, "global_step": 29908, "epoch": 251, "lr": 6.322463607354178e-05} +{"train_loss": 0.0034583306405693293, "global_step": 29909, "epoch": 251, "lr": 6.322249945036561e-05} +{"train_loss": 0.0038498311769217253, "global_step": 29910, "epoch": 251, "lr": 6.322036280122847e-05} +{"train_loss": 0.0024470628704875708, "global_step": 29911, "epoch": 251, "lr": 6.321822612613456e-05} +{"train_loss": 0.0032334281131625175, "global_step": 29912, "epoch": 251, "lr": 6.321608942508807e-05} +{"train_loss": 0.005276680923998356, "global_step": 29913, "epoch": 251, "lr": 6.321395269809322e-05} +{"train_loss": 0.0034382622689008713, "global_step": 29914, "epoch": 251, "lr": 6.321181594515418e-05} +{"train_loss": 0.0032620602287352085, "global_step": 29915, "epoch": 251, "lr": 6.320967916627512e-05} +{"train_loss": 0.0038034378085285425, "global_step": 29916, "epoch": 251, "lr": 6.320754236146029e-05} +{"train_loss": 0.0032878322526812553, "global_step": 29917, "epoch": 251, "lr": 6.320540553071386e-05} +{"train_loss": 0.003082884941250086, "global_step": 29918, "epoch": 251, "lr": 6.320326867404003e-05} +{"train_loss": 0.0029024151153862476, "global_step": 29919, "epoch": 251, "lr": 6.320113179144299e-05} +{"train_loss": 0.00218416890129447, "global_step": 29920, "epoch": 251, "lr": 6.319899488292694e-05} +{"train_loss": 0.0030065549071878195, "global_step": 29921, "epoch": 251, "lr": 6.319685794849606e-05} +{"train_loss": 0.0030274423770606518, "global_step": 29922, "epoch": 251, "lr": 6.319472098815456e-05} +{"train_loss": 0.005123529117554426, "global_step": 29923, "epoch": 251, "lr": 6.319258400190665e-05} +{"train_loss": 0.002847465220838785, "global_step": 29924, "epoch": 251, "lr": 6.31904469897565e-05} +{"train_loss": 0.003621530020609498, "global_step": 29925, "epoch": 251, "lr": 6.318830995170833e-05} +{"train_loss": 0.0030881355050951242, "global_step": 29926, "epoch": 251, "lr": 6.318617288776632e-05} +{"train_loss": 0.0034797820262610912, "global_step": 29927, "epoch": 251, "lr": 6.318403579793465e-05} +{"train_loss": 0.003375145373865962, "global_step": 29928, "epoch": 251, "lr": 6.318189868221755e-05} +{"train_loss": 0.0025234296917915344, "global_step": 29929, "epoch": 251, "lr": 6.317976154061919e-05} +{"train_loss": 0.0029043981339782476, "global_step": 29930, "epoch": 251, "lr": 6.317762437314379e-05} +{"train_loss": 0.00484554935246706, "global_step": 29931, "epoch": 251, "lr": 6.317548717979552e-05} +{"train_loss": 0.0014882837422192097, "global_step": 29932, "epoch": 251, "lr": 6.317334996057861e-05} +{"train_loss": 0.0029455008916556835, "global_step": 29933, "epoch": 251, "lr": 6.31712127154972e-05} +{"train_loss": 0.0034929036628454924, "global_step": 29934, "epoch": 251, "lr": 6.316907544455554e-05} +{"train_loss": 0.0032403136137872934, "global_step": 29935, "epoch": 251, "lr": 6.31669381477578e-05} +{"train_loss": 0.0022029171232134104, "global_step": 29936, "epoch": 251, "lr": 6.316480082510819e-05} +{"train_loss": 0.004313115030527115, "global_step": 29937, "epoch": 251, "lr": 6.316266347661091e-05} +{"train_loss": 0.00300912419334054, "global_step": 29938, "epoch": 251, "lr": 6.316052610227015e-05} +{"train_loss": 0.0039683557115495205, "global_step": 29939, "epoch": 251, "lr": 6.315838870209008e-05} +{"train_loss": 0.0026851678267121315, "global_step": 29940, "epoch": 251, "lr": 6.315625127607493e-05} +{"train_loss": 0.002333601238206029, "global_step": 29941, "epoch": 251, "lr": 6.315411382422889e-05} +{"train_loss": 0.0022657732479274273, "global_step": 29942, "epoch": 251, "lr": 6.315197634655614e-05} +{"train_loss": 0.0034662894904613495, "global_step": 29943, "epoch": 251, "lr": 6.314983884306089e-05} +{"train_loss": 0.0030456995591521263, "global_step": 29944, "epoch": 251, "lr": 6.314770131374736e-05} +{"train_loss": 0.0020964089781045914, "global_step": 29945, "epoch": 251, "lr": 6.314556375861971e-05} +{"train_loss": 0.0032858557533472776, "global_step": 29946, "epoch": 251, "lr": 6.314342617768214e-05} +{"train_loss": 0.002676662290468812, "global_step": 29947, "epoch": 251, "lr": 6.314128857093886e-05} +{"train_loss": 0.003931459039449692, "global_step": 29948, "epoch": 251, "lr": 6.313915093839407e-05} +{"train_loss": 0.005264519713819027, "global_step": 29949, "epoch": 251, "lr": 6.313701328005196e-05} +{"train_loss": 0.002790577942505479, "global_step": 29950, "epoch": 251, "lr": 6.313487559591673e-05} +{"train_loss": 0.0029675110708922148, "global_step": 29951, "epoch": 251, "lr": 6.313273788599256e-05} +{"train_loss": 0.0038139179814606905, "global_step": 29952, "epoch": 251, "lr": 6.313060015028368e-05} +{"train_loss": 0.004026913549751043, "global_step": 29953, "epoch": 251, "lr": 6.312846238879427e-05} +{"train_loss": 0.003084592754021287, "global_step": 29954, "epoch": 251, "lr": 6.312632460152851e-05} +{"train_loss": 0.003335188841447234, "global_step": 29955, "epoch": 251, "lr": 6.312418678849063e-05} +{"train_loss": 0.0022334991954267025, "global_step": 29956, "epoch": 251, "lr": 6.31220489496848e-05} +{"train_loss": 0.0019635879434645176, "global_step": 29957, "epoch": 251, "lr": 6.311991108511523e-05} +{"train_loss": 0.004237556364387274, "global_step": 29958, "epoch": 251, "lr": 6.311777319478614e-05} +{"train_loss": 0.005091555416584015, "global_step": 29959, "epoch": 251, "lr": 6.311563527870167e-05} +{"train_loss": 0.005602797493338585, "global_step": 29960, "epoch": 251, "lr": 6.311349733686607e-05} +{"train_loss": 0.00419421074911952, "global_step": 29961, "epoch": 251, "lr": 6.31113593692835e-05} +{"train_loss": 0.005549598950892687, "global_step": 29962, "epoch": 251, "lr": 6.310922137595821e-05} +{"train_loss": 0.002846574177965522, "global_step": 29963, "epoch": 251, "lr": 6.310708335689435e-05} +{"train_loss": 0.0045417002402246, "global_step": 29964, "epoch": 251, "lr": 6.310494531209612e-05} +{"train_loss": 0.003549814224243164, "global_step": 29965, "epoch": 251, "lr": 6.310280724156775e-05} +{"train_loss": 0.002696318319067359, "global_step": 29966, "epoch": 251, "lr": 6.310066914531338e-05} +{"train_loss": 0.0054137264378368855, "global_step": 29967, "epoch": 251, "lr": 6.309853102333728e-05} +{"train_loss": 0.0016624776180833578, "global_step": 29968, "epoch": 251, "lr": 6.309639287564359e-05} +{"train_loss": 0.0046857791021466255, "global_step": 29969, "epoch": 251, "lr": 6.309425470223656e-05} +{"train_loss": 0.004000138025730848, "global_step": 29970, "epoch": 251, "lr": 6.309211650312034e-05} +{"train_loss": 0.003209411632269621, "global_step": 29971, "epoch": 251, "lr": 6.308997827829915e-05} +{"train_loss": 0.003455007914453745, "global_step": 29972, "epoch": 251, "lr": 6.308784002777718e-05} +{"train_loss": 0.005149237811565399, "global_step": 29973, "epoch": 251, "lr": 6.308570175155866e-05} +{"train_loss": 0.004358259495347738, "global_step": 29974, "epoch": 251, "lr": 6.308356344964774e-05} +{"train_loss": 0.0029804138466715813, "global_step": 29975, "epoch": 251, "lr": 6.308142512204866e-05} +{"train_loss": 0.0023889560252428055, "global_step": 29976, "epoch": 251, "lr": 6.307928676876559e-05} +{"train_loss": 0.003369079902768135, "global_step": 29977, "epoch": 251, "lr": 6.307714838980273e-05} +{"train_loss": 0.0038063942920416594, "global_step": 29978, "epoch": 251, "lr": 6.30750099851643e-05} +{"train_loss": 0.0031357058323919773, "global_step": 29979, "epoch": 251, "lr": 6.307287155485446e-05} +{"train_loss": 0.0025913543067872524, "global_step": 29980, "epoch": 251, "lr": 6.307073309887745e-05} +{"train_loss": 0.005722848232835531, "global_step": 29981, "epoch": 251, "lr": 6.306859461723745e-05} +{"train_loss": 0.004326114431023598, "global_step": 29982, "epoch": 251, "lr": 6.306645610993866e-05} +{"train_loss": 0.0035408264957368374, "global_step": 29983, "epoch": 251, "lr": 6.306431757698529e-05} +{"train_loss": 0.0024968720972537994, "global_step": 29984, "epoch": 251, "lr": 6.306217901838151e-05} +{"train_loss": 0.003959175199270248, "global_step": 29985, "epoch": 251, "lr": 6.306004043413156e-05} +{"train_loss": 0.004273587837815285, "global_step": 29986, "epoch": 251, "lr": 6.30579018242396e-05} +{"train_loss": 0.003478200632703154, "global_step": 29987, "epoch": 251, "lr": 6.305576318870983e-05, "val_loss": 0.010263173840939999} +{"train_loss": 0.003457855898886919, "global_step": 29988, "epoch": 252, "lr": 6.30536245275465e-05} +{"train_loss": 0.003826715284958482, "global_step": 29989, "epoch": 252, "lr": 6.305148584075375e-05} +{"train_loss": 0.003161555388942361, "global_step": 29990, "epoch": 252, "lr": 6.304934712833581e-05} +{"train_loss": 0.0028223497793078423, "global_step": 29991, "epoch": 252, "lr": 6.304720839029686e-05} +{"train_loss": 0.005311222281306982, "global_step": 29992, "epoch": 252, "lr": 6.304506962664111e-05} +{"train_loss": 0.002071899129077792, "global_step": 29993, "epoch": 252, "lr": 6.304293083737277e-05} +{"train_loss": 0.004318522289395332, "global_step": 29994, "epoch": 252, "lr": 6.304079202249604e-05} +{"train_loss": 0.0026299546007066965, "global_step": 29995, "epoch": 252, "lr": 6.30386531820151e-05} +{"train_loss": 0.00529308058321476, "global_step": 29996, "epoch": 252, "lr": 6.303651431593413e-05} +{"train_loss": 0.004019176121801138, "global_step": 29997, "epoch": 252, "lr": 6.303437542425739e-05} +{"train_loss": 0.004506317432969809, "global_step": 29998, "epoch": 252, "lr": 6.303223650698903e-05} +{"train_loss": 0.003246857086196542, "global_step": 29999, "epoch": 252, "lr": 6.303009756413327e-05} +{"train_loss": 0.004196855239570141, "global_step": 30000, "epoch": 252, "lr": 6.302795859569431e-05} +{"train_loss": 0.0031350546050816774, "global_step": 30001, "epoch": 252, "lr": 6.302581960167632e-05} +{"train_loss": 0.0043180640786886215, "global_step": 30002, "epoch": 252, "lr": 6.302368058208355e-05} +{"train_loss": 0.0028997145127505064, "global_step": 30003, "epoch": 252, "lr": 6.302154153692017e-05} +{"train_loss": 0.004516290966421366, "global_step": 30004, "epoch": 252, "lr": 6.30194024661904e-05} +{"train_loss": 0.004562269430607557, "global_step": 30005, "epoch": 252, "lr": 6.30172633698984e-05} +{"train_loss": 0.0023352941498160362, "global_step": 30006, "epoch": 252, "lr": 6.301512424804839e-05} +{"train_loss": 0.0033158438745886087, "global_step": 30007, "epoch": 252, "lr": 6.301298510064461e-05} +{"train_loss": 0.0031805681064724922, "global_step": 30008, "epoch": 252, "lr": 6.30108459276912e-05} +{"train_loss": 0.002325505716726184, "global_step": 30009, "epoch": 252, "lr": 6.300870672919237e-05} +{"train_loss": 0.002759181195870042, "global_step": 30010, "epoch": 252, "lr": 6.300656750515234e-05} +{"train_loss": 0.003956569824367762, "global_step": 30011, "epoch": 252, "lr": 6.300442825557533e-05} +{"train_loss": 0.004469431936740875, "global_step": 30012, "epoch": 252, "lr": 6.30022889804655e-05} +{"train_loss": 0.002792143728584051, "global_step": 30013, "epoch": 252, "lr": 6.300014967982706e-05} +{"train_loss": 0.0016630396712571383, "global_step": 30014, "epoch": 252, "lr": 6.299801035366421e-05} +{"train_loss": 0.0038071239832788706, "global_step": 30015, "epoch": 252, "lr": 6.299587100198117e-05} +{"train_loss": 0.005222130101174116, "global_step": 30016, "epoch": 252, "lr": 6.299373162478212e-05} +{"train_loss": 0.003428327152505517, "global_step": 30017, "epoch": 252, "lr": 6.299159222207125e-05} +{"train_loss": 0.004053074866533279, "global_step": 30018, "epoch": 252, "lr": 6.298945279385279e-05} +{"train_loss": 0.0034307672176510096, "global_step": 30019, "epoch": 252, "lr": 6.298731334013093e-05} +{"train_loss": 0.0011732818093150854, "global_step": 30020, "epoch": 252, "lr": 6.298517386090988e-05} +{"train_loss": 0.003619792405515909, "global_step": 30021, "epoch": 252, "lr": 6.298303435619381e-05} +{"train_loss": 0.0023706848733127117, "global_step": 30022, "epoch": 252, "lr": 6.298089482598693e-05} +{"train_loss": 0.0028461250476539135, "global_step": 30023, "epoch": 252, "lr": 6.297875527029347e-05} +{"train_loss": 0.0036509190686047077, "global_step": 30024, "epoch": 252, "lr": 6.29766156891176e-05} +{"train_loss": 0.0031585688702762127, "global_step": 30025, "epoch": 252, "lr": 6.297447608246353e-05} +{"train_loss": 0.0049270340241491795, "global_step": 30026, "epoch": 252, "lr": 6.297233645033548e-05} +{"train_loss": 0.0033761467784643173, "global_step": 30027, "epoch": 252, "lr": 6.297019679273761e-05} +{"train_loss": 0.002635619603097439, "global_step": 30028, "epoch": 252, "lr": 6.296805710967416e-05} +{"train_loss": 0.0031416385900229216, "global_step": 30029, "epoch": 252, "lr": 6.296591740114931e-05} +{"train_loss": 0.0023533892817795277, "global_step": 30030, "epoch": 252, "lr": 6.296377766716726e-05} +{"train_loss": 0.0038102511316537857, "global_step": 30031, "epoch": 252, "lr": 6.296163790773223e-05} +{"train_loss": 0.003038353519514203, "global_step": 30032, "epoch": 252, "lr": 6.295949812284841e-05} +{"train_loss": 0.002509731100872159, "global_step": 30033, "epoch": 252, "lr": 6.295735831251998e-05} +{"train_loss": 0.0028879607561975718, "global_step": 30034, "epoch": 252, "lr": 6.295521847675117e-05} +{"train_loss": 0.0051695676520466805, "global_step": 30035, "epoch": 252, "lr": 6.295307861554618e-05} +{"train_loss": 0.002472740365192294, "global_step": 30036, "epoch": 252, "lr": 6.295093872890919e-05} +{"train_loss": 0.004197682719677687, "global_step": 30037, "epoch": 252, "lr": 6.294879881684444e-05} +{"train_loss": 0.0026118482928723097, "global_step": 30038, "epoch": 252, "lr": 6.29466588793561e-05} +{"train_loss": 0.0037028747610747814, "global_step": 30039, "epoch": 252, "lr": 6.294451891644837e-05} +{"train_loss": 0.0034710527397692204, "global_step": 30040, "epoch": 252, "lr": 6.294237892812546e-05} +{"train_loss": 0.00433136522769928, "global_step": 30041, "epoch": 252, "lr": 6.294023891439156e-05} +{"train_loss": 0.004974990151822567, "global_step": 30042, "epoch": 252, "lr": 6.293809887525091e-05} +{"train_loss": 0.0030785787384957075, "global_step": 30043, "epoch": 252, "lr": 6.293595881070766e-05} +{"train_loss": 0.0015506925992667675, "global_step": 30044, "epoch": 252, "lr": 6.293381872076606e-05} +{"train_loss": 0.0018406087765470147, "global_step": 30045, "epoch": 252, "lr": 6.293167860543028e-05} +{"train_loss": 0.003066530916839838, "global_step": 30046, "epoch": 252, "lr": 6.292953846470451e-05} +{"train_loss": 0.0020114872604608536, "global_step": 30047, "epoch": 252, "lr": 6.2927398298593e-05} +{"train_loss": 0.002754305023699999, "global_step": 30048, "epoch": 252, "lr": 6.292525810709991e-05} +{"train_loss": 0.0020752563141286373, "global_step": 30049, "epoch": 252, "lr": 6.292311789022946e-05} +{"train_loss": 0.005415872670710087, "global_step": 30050, "epoch": 252, "lr": 6.292097764798586e-05} +{"train_loss": 0.0027467694599181414, "global_step": 30051, "epoch": 252, "lr": 6.291883738037328e-05} +{"train_loss": 0.004697741474956274, "global_step": 30052, "epoch": 252, "lr": 6.291669708739595e-05} +{"train_loss": 0.002822012873366475, "global_step": 30053, "epoch": 252, "lr": 6.291455676905806e-05} +{"train_loss": 0.0029278425499796867, "global_step": 30054, "epoch": 252, "lr": 6.291241642536383e-05} +{"train_loss": 0.0033272558357566595, "global_step": 30055, "epoch": 252, "lr": 6.291027605631745e-05} +{"train_loss": 0.0028901987243443727, "global_step": 30056, "epoch": 252, "lr": 6.290813566192312e-05} +{"train_loss": 0.0025038677267730236, "global_step": 30057, "epoch": 252, "lr": 6.290599524218505e-05} +{"train_loss": 0.0019031857373192906, "global_step": 30058, "epoch": 252, "lr": 6.290385479710744e-05} +{"train_loss": 0.004847770556807518, "global_step": 30059, "epoch": 252, "lr": 6.290171432669447e-05} +{"train_loss": 0.0033054309897124767, "global_step": 30060, "epoch": 252, "lr": 6.289957383095036e-05} +{"train_loss": 0.002971430541947484, "global_step": 30061, "epoch": 252, "lr": 6.289743330987934e-05} +{"train_loss": 0.004483341705054045, "global_step": 30062, "epoch": 252, "lr": 6.289529276348557e-05} +{"train_loss": 0.004455018788576126, "global_step": 30063, "epoch": 252, "lr": 6.289315219177327e-05} +{"train_loss": 0.003430962562561035, "global_step": 30064, "epoch": 252, "lr": 6.289101159474667e-05} +{"train_loss": 0.004745993763208389, "global_step": 30065, "epoch": 252, "lr": 6.28888709724099e-05} +{"train_loss": 0.0037701535038650036, "global_step": 30066, "epoch": 252, "lr": 6.288673032476724e-05} +{"train_loss": 0.0033606523647904396, "global_step": 30067, "epoch": 252, "lr": 6.288458965182284e-05} +{"train_loss": 0.003594745649024844, "global_step": 30068, "epoch": 252, "lr": 6.288244895358095e-05} +{"train_loss": 0.0052887252531945705, "global_step": 30069, "epoch": 252, "lr": 6.288030823004574e-05} +{"train_loss": 0.004048836883157492, "global_step": 30070, "epoch": 252, "lr": 6.287816748122141e-05} +{"train_loss": 0.004687783773988485, "global_step": 30071, "epoch": 252, "lr": 6.287602670711219e-05} +{"train_loss": 0.0038110530003905296, "global_step": 30072, "epoch": 252, "lr": 6.287388590772226e-05} +{"train_loss": 0.003786791115999222, "global_step": 30073, "epoch": 252, "lr": 6.287174508305582e-05} +{"train_loss": 0.00451198173686862, "global_step": 30074, "epoch": 252, "lr": 6.28696042331171e-05} +{"train_loss": 0.0059799193404614925, "global_step": 30075, "epoch": 252, "lr": 6.286746335791027e-05} +{"train_loss": 0.0024628774262964725, "global_step": 30076, "epoch": 252, "lr": 6.286532245743956e-05} +{"train_loss": 0.0036166300997138023, "global_step": 30077, "epoch": 252, "lr": 6.286318153170918e-05} +{"train_loss": 0.007361256051808596, "global_step": 30078, "epoch": 252, "lr": 6.286104058072329e-05} +{"train_loss": 0.002740260912105441, "global_step": 30079, "epoch": 252, "lr": 6.285889960448615e-05} +{"train_loss": 0.0048028468154370785, "global_step": 30080, "epoch": 252, "lr": 6.28567586030019e-05} +{"train_loss": 0.003482284490019083, "global_step": 30081, "epoch": 252, "lr": 6.285461757627479e-05} +{"train_loss": 0.0026750327087938786, "global_step": 30082, "epoch": 252, "lr": 6.285247652430903e-05} +{"train_loss": 0.002193692373111844, "global_step": 30083, "epoch": 252, "lr": 6.28503354471088e-05} +{"train_loss": 0.003497338853776455, "global_step": 30084, "epoch": 252, "lr": 6.284819434467828e-05} +{"train_loss": 0.005377305205911398, "global_step": 30085, "epoch": 252, "lr": 6.284605321702173e-05} +{"train_loss": 0.0025337908882647753, "global_step": 30086, "epoch": 252, "lr": 6.284391206414332e-05} +{"train_loss": 0.0022145421244204044, "global_step": 30087, "epoch": 252, "lr": 6.284177088604726e-05} +{"train_loss": 0.004988841246813536, "global_step": 30088, "epoch": 252, "lr": 6.283962968273777e-05} +{"train_loss": 0.004719576332718134, "global_step": 30089, "epoch": 252, "lr": 6.283748845421902e-05} +{"train_loss": 0.0029615710955113173, "global_step": 30090, "epoch": 252, "lr": 6.283534720049523e-05} +{"train_loss": 0.003966130781918764, "global_step": 30091, "epoch": 252, "lr": 6.283320592157062e-05} +{"train_loss": 0.0034781722351908684, "global_step": 30092, "epoch": 252, "lr": 6.283106461744938e-05} +{"train_loss": 0.005084480158984661, "global_step": 30093, "epoch": 252, "lr": 6.28289232881357e-05} +{"train_loss": 0.0032045687548816204, "global_step": 30094, "epoch": 252, "lr": 6.282678193363382e-05} +{"train_loss": 0.0035972644109278917, "global_step": 30095, "epoch": 252, "lr": 6.282464055394792e-05} +{"train_loss": 0.0032366435043513775, "global_step": 30096, "epoch": 252, "lr": 6.28224991490822e-05} +{"train_loss": 0.003920990973711014, "global_step": 30097, "epoch": 252, "lr": 6.282035771904088e-05} +{"train_loss": 0.00397876463830471, "global_step": 30098, "epoch": 252, "lr": 6.281821626382816e-05} +{"train_loss": 0.004761406686156988, "global_step": 30099, "epoch": 252, "lr": 6.281607478344824e-05} +{"train_loss": 0.0033033816143870354, "global_step": 30100, "epoch": 252, "lr": 6.28139332779053e-05} +{"train_loss": 0.005188949406147003, "global_step": 30101, "epoch": 252, "lr": 6.28117917472036e-05} +{"train_loss": 0.0038566640578210354, "global_step": 30102, "epoch": 252, "lr": 6.28096501913473e-05} +{"train_loss": 0.003420734079554677, "global_step": 30103, "epoch": 252, "lr": 6.280750861034064e-05} +{"train_loss": 0.0042467135936021805, "global_step": 30104, "epoch": 252, "lr": 6.280536700418779e-05} +{"train_loss": 0.0017211143858730793, "global_step": 30105, "epoch": 252, "lr": 6.280322537289297e-05} +{"train_loss": 0.0035713657818953783, "global_step": 30106, "epoch": 252, "lr": 6.280108371646038e-05, "val_loss": 0.021181153133511543} +{"train_loss": 0.0028894066344946623, "global_step": 30107, "epoch": 253, "lr": 6.279894203489426e-05} +{"train_loss": 0.004101048689335585, "global_step": 30108, "epoch": 253, "lr": 6.279680032819877e-05} +{"train_loss": 0.003541690530255437, "global_step": 30109, "epoch": 253, "lr": 6.279465859637813e-05} +{"train_loss": 0.0021916828118264675, "global_step": 30110, "epoch": 253, "lr": 6.279251683943653e-05} +{"train_loss": 0.003539792727679014, "global_step": 30111, "epoch": 253, "lr": 6.27903750573782e-05} +{"train_loss": 0.0028307694010436535, "global_step": 30112, "epoch": 253, "lr": 6.278823325020731e-05} +{"train_loss": 0.0030437884852290154, "global_step": 30113, "epoch": 253, "lr": 6.278609141792812e-05} +{"train_loss": 0.002513810759410262, "global_step": 30114, "epoch": 253, "lr": 6.27839495605448e-05} +{"train_loss": 0.002730532083660364, "global_step": 30115, "epoch": 253, "lr": 6.278180767806155e-05} +{"train_loss": 0.003907567821443081, "global_step": 30116, "epoch": 253, "lr": 6.27796657704826e-05} +{"train_loss": 0.004045842681080103, "global_step": 30117, "epoch": 253, "lr": 6.277752383781213e-05} +{"train_loss": 0.0032441953662782907, "global_step": 30118, "epoch": 253, "lr": 6.277538188005437e-05} +{"train_loss": 0.0021809935569763184, "global_step": 30119, "epoch": 253, "lr": 6.277323989721352e-05} +{"train_loss": 0.003168009454384446, "global_step": 30120, "epoch": 253, "lr": 6.277109788929376e-05} +{"train_loss": 0.003377906046807766, "global_step": 30121, "epoch": 253, "lr": 6.276895585629931e-05} +{"train_loss": 0.0026710941456258297, "global_step": 30122, "epoch": 253, "lr": 6.27668137982344e-05} +{"train_loss": 0.002025487832725048, "global_step": 30123, "epoch": 253, "lr": 6.27646717151032e-05} +{"train_loss": 0.0018397977109998465, "global_step": 30124, "epoch": 253, "lr": 6.276252960690993e-05} +{"train_loss": 0.004292652010917664, "global_step": 30125, "epoch": 253, "lr": 6.27603874736588e-05} +{"train_loss": 0.003357416018843651, "global_step": 30126, "epoch": 253, "lr": 6.275824531535402e-05} +{"train_loss": 0.0030708375852555037, "global_step": 30127, "epoch": 253, "lr": 6.275610313199977e-05} +{"train_loss": 0.0034284081775695086, "global_step": 30128, "epoch": 253, "lr": 6.27539609236003e-05} +{"train_loss": 0.004066437017172575, "global_step": 30129, "epoch": 253, "lr": 6.275181869015977e-05} +{"train_loss": 0.001858376432210207, "global_step": 30130, "epoch": 253, "lr": 6.274967643168241e-05} +{"train_loss": 0.004994004033505917, "global_step": 30131, "epoch": 253, "lr": 6.274753414817243e-05} +{"train_loss": 0.004239750560373068, "global_step": 30132, "epoch": 253, "lr": 6.274539183963402e-05} +{"train_loss": 0.0025915587320923805, "global_step": 30133, "epoch": 253, "lr": 6.27432495060714e-05} +{"train_loss": 0.003334855427965522, "global_step": 30134, "epoch": 253, "lr": 6.274110714748876e-05} +{"train_loss": 0.0024624979123473167, "global_step": 30135, "epoch": 253, "lr": 6.273896476389031e-05} +{"train_loss": 0.0022944060619920492, "global_step": 30136, "epoch": 253, "lr": 6.273682235528028e-05} +{"train_loss": 0.004851176403462887, "global_step": 30137, "epoch": 253, "lr": 6.273467992166286e-05} +{"train_loss": 0.003751381766051054, "global_step": 30138, "epoch": 253, "lr": 6.273253746304227e-05} +{"train_loss": 0.0016214611241593957, "global_step": 30139, "epoch": 253, "lr": 6.27303949794227e-05} +{"train_loss": 0.002446283819153905, "global_step": 30140, "epoch": 253, "lr": 6.272825247080834e-05} +{"train_loss": 0.004321063868701458, "global_step": 30141, "epoch": 253, "lr": 6.272610993720342e-05} +{"train_loss": 0.0032828429248183966, "global_step": 30142, "epoch": 253, "lr": 6.272396737861214e-05} +{"train_loss": 0.003559050615876913, "global_step": 30143, "epoch": 253, "lr": 6.272182479503873e-05} +{"train_loss": 0.002705856692045927, "global_step": 30144, "epoch": 253, "lr": 6.271968218648736e-05} +{"train_loss": 0.003614486427977681, "global_step": 30145, "epoch": 253, "lr": 6.271753955296226e-05} +{"train_loss": 0.0018462726147845387, "global_step": 30146, "epoch": 253, "lr": 6.271539689446762e-05} +{"train_loss": 0.0055264662951231, "global_step": 30147, "epoch": 253, "lr": 6.271325421100767e-05} +{"train_loss": 0.004143171943724155, "global_step": 30148, "epoch": 253, "lr": 6.27111115025866e-05} +{"train_loss": 0.003677551867440343, "global_step": 30149, "epoch": 253, "lr": 6.27089687692086e-05} +{"train_loss": 0.0031020434107631445, "global_step": 30150, "epoch": 253, "lr": 6.270682601087792e-05} +{"train_loss": 0.003285831306129694, "global_step": 30151, "epoch": 253, "lr": 6.270468322759874e-05} +{"train_loss": 0.0030520197469741106, "global_step": 30152, "epoch": 253, "lr": 6.270254041937526e-05} +{"train_loss": 0.0026525140274316072, "global_step": 30153, "epoch": 253, "lr": 6.270039758621171e-05} +{"train_loss": 0.0041929930448532104, "global_step": 30154, "epoch": 253, "lr": 6.269825472811229e-05} +{"train_loss": 0.0031994145829230547, "global_step": 30155, "epoch": 253, "lr": 6.26961118450812e-05} +{"train_loss": 0.0024377533700317144, "global_step": 30156, "epoch": 253, "lr": 6.269396893712265e-05} +{"train_loss": 0.003040632000193, "global_step": 30157, "epoch": 253, "lr": 6.269182600424086e-05} +{"train_loss": 0.003717872081324458, "global_step": 30158, "epoch": 253, "lr": 6.268968304644e-05} +{"train_loss": 0.003344816155731678, "global_step": 30159, "epoch": 253, "lr": 6.268754006372432e-05} +{"train_loss": 0.002103576436638832, "global_step": 30160, "epoch": 253, "lr": 6.268539705609802e-05} +{"train_loss": 0.003074327250942588, "global_step": 30161, "epoch": 253, "lr": 6.268325402356528e-05} +{"train_loss": 0.0029287126380950212, "global_step": 30162, "epoch": 253, "lr": 6.268111096613032e-05} +{"train_loss": 0.003419577144086361, "global_step": 30163, "epoch": 253, "lr": 6.267896788379737e-05} +{"train_loss": 0.0020921214018017054, "global_step": 30164, "epoch": 253, "lr": 6.26768247765706e-05} +{"train_loss": 0.003192071570083499, "global_step": 30165, "epoch": 253, "lr": 6.267468164445426e-05} +{"train_loss": 0.00180998130235821, "global_step": 30166, "epoch": 253, "lr": 6.267253848745253e-05} +{"train_loss": 0.002150079235434532, "global_step": 30167, "epoch": 253, "lr": 6.267039530556963e-05} +{"train_loss": 0.003042367985472083, "global_step": 30168, "epoch": 253, "lr": 6.266825209880975e-05} +{"train_loss": 0.005348057020455599, "global_step": 30169, "epoch": 253, "lr": 6.266610886717711e-05} +{"train_loss": 0.004553486593067646, "global_step": 30170, "epoch": 253, "lr": 6.266396561067595e-05} +{"train_loss": 0.002888036658987403, "global_step": 30171, "epoch": 253, "lr": 6.266182232931042e-05} +{"train_loss": 0.0022597305942326784, "global_step": 30172, "epoch": 253, "lr": 6.265967902308476e-05} +{"train_loss": 0.0031145247630774975, "global_step": 30173, "epoch": 253, "lr": 6.265753569200316e-05} +{"train_loss": 0.002281979424878955, "global_step": 30174, "epoch": 253, "lr": 6.265539233606986e-05} +{"train_loss": 0.002631234470754862, "global_step": 30175, "epoch": 253, "lr": 6.265324895528904e-05} +{"train_loss": 0.002123474609106779, "global_step": 30176, "epoch": 253, "lr": 6.265110554966492e-05} +{"train_loss": 0.002794798696413636, "global_step": 30177, "epoch": 253, "lr": 6.26489621192017e-05} +{"train_loss": 0.003400248009711504, "global_step": 30178, "epoch": 253, "lr": 6.26468186639036e-05} +{"train_loss": 0.0021560073364526033, "global_step": 30179, "epoch": 253, "lr": 6.264467518377482e-05} +{"train_loss": 0.0028380241710692644, "global_step": 30180, "epoch": 253, "lr": 6.264253167881957e-05} +{"train_loss": 0.0034955518785864115, "global_step": 30181, "epoch": 253, "lr": 6.264038814904207e-05} +{"train_loss": 0.0032563551794737577, "global_step": 30182, "epoch": 253, "lr": 6.263824459444651e-05} +{"train_loss": 0.0021285787224769592, "global_step": 30183, "epoch": 253, "lr": 6.26361010150371e-05} +{"train_loss": 0.0018875054083764553, "global_step": 30184, "epoch": 253, "lr": 6.263395741081806e-05} +{"train_loss": 0.0025164142716675997, "global_step": 30185, "epoch": 253, "lr": 6.26318137817936e-05} +{"train_loss": 0.0025907172821462154, "global_step": 30186, "epoch": 253, "lr": 6.262967012796793e-05} +{"train_loss": 0.004378640092909336, "global_step": 30187, "epoch": 253, "lr": 6.262752644934523e-05} +{"train_loss": 0.003080454422160983, "global_step": 30188, "epoch": 253, "lr": 6.262538274592975e-05} +{"train_loss": 0.0033889818005263805, "global_step": 30189, "epoch": 253, "lr": 6.262323901772567e-05} +{"train_loss": 0.005520946346223354, "global_step": 30190, "epoch": 253, "lr": 6.26210952647372e-05} +{"train_loss": 0.0035115305799990892, "global_step": 30191, "epoch": 253, "lr": 6.261895148696858e-05} +{"train_loss": 0.0037918826565146446, "global_step": 30192, "epoch": 253, "lr": 6.261680768442398e-05} +{"train_loss": 0.003855291986837983, "global_step": 30193, "epoch": 253, "lr": 6.261466385710764e-05} +{"train_loss": 0.0028124877717345953, "global_step": 30194, "epoch": 253, "lr": 6.261252000502374e-05} +{"train_loss": 0.004660755395889282, "global_step": 30195, "epoch": 253, "lr": 6.261037612817652e-05} +{"train_loss": 0.002716493560001254, "global_step": 30196, "epoch": 253, "lr": 6.260823222657018e-05} +{"train_loss": 0.004395771771669388, "global_step": 30197, "epoch": 253, "lr": 6.26060883002089e-05} +{"train_loss": 0.002695826580747962, "global_step": 30198, "epoch": 253, "lr": 6.260394434909691e-05} +{"train_loss": 0.002221805974841118, "global_step": 30199, "epoch": 253, "lr": 6.260180037323844e-05} +{"train_loss": 0.0025184534024447203, "global_step": 30200, "epoch": 253, "lr": 6.259965637263767e-05} +{"train_loss": 0.002773728920146823, "global_step": 30201, "epoch": 253, "lr": 6.259751234729882e-05} +{"train_loss": 0.0026207210030406713, "global_step": 30202, "epoch": 253, "lr": 6.259536829722611e-05} +{"train_loss": 0.0025732412468641996, "global_step": 30203, "epoch": 253, "lr": 6.259322422242372e-05} +{"train_loss": 0.0037074724677950144, "global_step": 30204, "epoch": 253, "lr": 6.25910801228959e-05} +{"train_loss": 0.002465242985635996, "global_step": 30205, "epoch": 253, "lr": 6.258893599864684e-05} +{"train_loss": 0.004210044629871845, "global_step": 30206, "epoch": 253, "lr": 6.258679184968074e-05} +{"train_loss": 0.0059402333572506905, "global_step": 30207, "epoch": 253, "lr": 6.258464767600183e-05} +{"train_loss": 0.003315495792776346, "global_step": 30208, "epoch": 253, "lr": 6.25825034776143e-05} +{"train_loss": 0.0034708704333752394, "global_step": 30209, "epoch": 253, "lr": 6.258035925452237e-05} +{"train_loss": 0.0036412647459656, "global_step": 30210, "epoch": 253, "lr": 6.257821500673024e-05} +{"train_loss": 0.002193497261032462, "global_step": 30211, "epoch": 253, "lr": 6.257607073424215e-05} +{"train_loss": 0.005182896740734577, "global_step": 30212, "epoch": 253, "lr": 6.257392643706226e-05} +{"train_loss": 0.0025543624069541693, "global_step": 30213, "epoch": 253, "lr": 6.257178211519483e-05} +{"train_loss": 0.002020081039518118, "global_step": 30214, "epoch": 253, "lr": 6.256963776864404e-05} +{"train_loss": 0.0019868810195475817, "global_step": 30215, "epoch": 253, "lr": 6.256749339741411e-05} +{"train_loss": 0.006026501301676035, "global_step": 30216, "epoch": 253, "lr": 6.256534900150926e-05} +{"train_loss": 0.004028834868222475, "global_step": 30217, "epoch": 253, "lr": 6.256320458093367e-05} +{"train_loss": 0.005418920423835516, "global_step": 30218, "epoch": 253, "lr": 6.256106013569158e-05} +{"train_loss": 0.003447767347097397, "global_step": 30219, "epoch": 253, "lr": 6.25589156657872e-05} +{"train_loss": 0.003325302852317691, "global_step": 30220, "epoch": 253, "lr": 6.255677117122473e-05} +{"train_loss": 0.005110155325382948, "global_step": 30221, "epoch": 253, "lr": 6.255462665200837e-05} +{"train_loss": 0.00478195259347558, "global_step": 30222, "epoch": 253, "lr": 6.255248210814234e-05} +{"train_loss": 0.003671132493764162, "global_step": 30223, "epoch": 253, "lr": 6.255033753963086e-05} +{"train_loss": 0.003355230437591672, "global_step": 30224, "epoch": 253, "lr": 6.254819294647813e-05} +{"train_loss": 0.003276178751242574, "global_step": 30225, "epoch": 253, "lr": 6.254604832868836e-05, "val_loss": 0.015080807730555534} +{"train_loss": 0.002469182014465332, "global_step": 30226, "epoch": 254, "lr": 6.254390368626578e-05} +{"train_loss": 0.0025044323410838842, "global_step": 30227, "epoch": 254, "lr": 6.254175901921457e-05} +{"train_loss": 0.0024064471945166588, "global_step": 30228, "epoch": 254, "lr": 6.253961432753896e-05} +{"train_loss": 0.005706654395908117, "global_step": 30229, "epoch": 254, "lr": 6.253746961124316e-05} +{"train_loss": 0.006350434385240078, "global_step": 30230, "epoch": 254, "lr": 6.253532487033138e-05} +{"train_loss": 0.0024747245479375124, "global_step": 30231, "epoch": 254, "lr": 6.253318010480782e-05} +{"train_loss": 0.0037035266868770123, "global_step": 30232, "epoch": 254, "lr": 6.25310353146767e-05} +{"train_loss": 0.002815424930304289, "global_step": 30233, "epoch": 254, "lr": 6.252889049994224e-05} +{"train_loss": 0.004944118205457926, "global_step": 30234, "epoch": 254, "lr": 6.252674566060863e-05} +{"train_loss": 0.002241062466055155, "global_step": 30235, "epoch": 254, "lr": 6.25246007966801e-05} +{"train_loss": 0.005688487086445093, "global_step": 30236, "epoch": 254, "lr": 6.252245590816084e-05} +{"train_loss": 0.007118368521332741, "global_step": 30237, "epoch": 254, "lr": 6.25203109950551e-05} +{"train_loss": 0.0055330852046608925, "global_step": 30238, "epoch": 254, "lr": 6.251816605736706e-05} +{"train_loss": 0.005758798215538263, "global_step": 30239, "epoch": 254, "lr": 6.251602109510094e-05} +{"train_loss": 0.0048479014076292515, "global_step": 30240, "epoch": 254, "lr": 6.251387610826093e-05} +{"train_loss": 0.004476181231439114, "global_step": 30241, "epoch": 254, "lr": 6.251173109685128e-05} +{"train_loss": 0.004381128121167421, "global_step": 30242, "epoch": 254, "lr": 6.250958606087619e-05} +{"train_loss": 0.002444695681333542, "global_step": 30243, "epoch": 254, "lr": 6.250744100033985e-05} +{"train_loss": 0.00574879813939333, "global_step": 30244, "epoch": 254, "lr": 6.250529591524649e-05} +{"train_loss": 0.0031773513182997704, "global_step": 30245, "epoch": 254, "lr": 6.250315080560032e-05} +{"train_loss": 0.002142086625099182, "global_step": 30246, "epoch": 254, "lr": 6.250100567140554e-05} +{"train_loss": 0.006307782605290413, "global_step": 30247, "epoch": 254, "lr": 6.249886051266637e-05} +{"train_loss": 0.0030535932164639235, "global_step": 30248, "epoch": 254, "lr": 6.249671532938704e-05} +{"train_loss": 0.00533967325463891, "global_step": 30249, "epoch": 254, "lr": 6.249457012157173e-05} +{"train_loss": 0.004018151666969061, "global_step": 30250, "epoch": 254, "lr": 6.249242488922467e-05} +{"train_loss": 0.004089525435119867, "global_step": 30251, "epoch": 254, "lr": 6.249027963235006e-05} +{"train_loss": 0.004876165650784969, "global_step": 30252, "epoch": 254, "lr": 6.248813435095213e-05} +{"train_loss": 0.0038896379992365837, "global_step": 30253, "epoch": 254, "lr": 6.248598904503509e-05} +{"train_loss": 0.005645317025482655, "global_step": 30254, "epoch": 254, "lr": 6.248384371460312e-05} +{"train_loss": 0.002481057308614254, "global_step": 30255, "epoch": 254, "lr": 6.248169835966048e-05} +{"train_loss": 0.003089951118454337, "global_step": 30256, "epoch": 254, "lr": 6.247955298021135e-05} +{"train_loss": 0.00294978148303926, "global_step": 30257, "epoch": 254, "lr": 6.247740757625996e-05} +{"train_loss": 0.005425931420177221, "global_step": 30258, "epoch": 254, "lr": 6.247526214781051e-05} +{"train_loss": 0.00214167358353734, "global_step": 30259, "epoch": 254, "lr": 6.247311669486721e-05} +{"train_loss": 0.0033047893084585667, "global_step": 30260, "epoch": 254, "lr": 6.247097121743426e-05} +{"train_loss": 0.0032049764413386583, "global_step": 30261, "epoch": 254, "lr": 6.246882571551593e-05} +{"train_loss": 0.0034555501770228148, "global_step": 30262, "epoch": 254, "lr": 6.246668018911637e-05} +{"train_loss": 0.003454816062003374, "global_step": 30263, "epoch": 254, "lr": 6.246453463823981e-05} +{"train_loss": 0.002851546509191394, "global_step": 30264, "epoch": 254, "lr": 6.246238906289047e-05} +{"train_loss": 0.002340956823900342, "global_step": 30265, "epoch": 254, "lr": 6.246024346307256e-05} +{"train_loss": 0.0017033576732501388, "global_step": 30266, "epoch": 254, "lr": 6.245809783879031e-05} +{"train_loss": 0.002812728751450777, "global_step": 30267, "epoch": 254, "lr": 6.245595219004789e-05} +{"train_loss": 0.001990959048271179, "global_step": 30268, "epoch": 254, "lr": 6.245380651684955e-05} +{"train_loss": 0.0026971029583364725, "global_step": 30269, "epoch": 254, "lr": 6.245166081919949e-05} +{"train_loss": 0.00310869375243783, "global_step": 30270, "epoch": 254, "lr": 6.244951509710195e-05} +{"train_loss": 0.0037115609738975763, "global_step": 30271, "epoch": 254, "lr": 6.244736935056109e-05} +{"train_loss": 0.0022688303142786026, "global_step": 30272, "epoch": 254, "lr": 6.244522357958116e-05} +{"train_loss": 0.0026463503018021584, "global_step": 30273, "epoch": 254, "lr": 6.244307778416635e-05} +{"train_loss": 0.0036042719148099422, "global_step": 30274, "epoch": 254, "lr": 6.244093196432091e-05} +{"train_loss": 0.0028777432162314653, "global_step": 30275, "epoch": 254, "lr": 6.243878612004901e-05} +{"train_loss": 0.00211704196408391, "global_step": 30276, "epoch": 254, "lr": 6.24366402513549e-05} +{"train_loss": 0.00604593101888895, "global_step": 30277, "epoch": 254, "lr": 6.243449435824276e-05} +{"train_loss": 0.004061257466673851, "global_step": 30278, "epoch": 254, "lr": 6.243234844071682e-05} +{"train_loss": 0.003269331995397806, "global_step": 30279, "epoch": 254, "lr": 6.243020249878129e-05} +{"train_loss": 0.005011699162423611, "global_step": 30280, "epoch": 254, "lr": 6.242805653244038e-05} +{"train_loss": 0.002636015648022294, "global_step": 30281, "epoch": 254, "lr": 6.242591054169831e-05} +{"train_loss": 0.0020218812860548496, "global_step": 30282, "epoch": 254, "lr": 6.24237645265593e-05} +{"train_loss": 0.004545006435364485, "global_step": 30283, "epoch": 254, "lr": 6.242161848702756e-05} +{"train_loss": 0.0019282903522253036, "global_step": 30284, "epoch": 254, "lr": 6.24194724231073e-05} +{"train_loss": 0.003580074990168214, "global_step": 30285, "epoch": 254, "lr": 6.241732633480272e-05} +{"train_loss": 0.0029816371388733387, "global_step": 30286, "epoch": 254, "lr": 6.241518022211805e-05} +{"train_loss": 0.002770548453554511, "global_step": 30287, "epoch": 254, "lr": 6.24130340850575e-05} +{"train_loss": 0.00377054326236248, "global_step": 30288, "epoch": 254, "lr": 6.241088792362529e-05} +{"train_loss": 0.0023562912829220295, "global_step": 30289, "epoch": 254, "lr": 6.240874173782562e-05} +{"train_loss": 0.0025294998195022345, "global_step": 30290, "epoch": 254, "lr": 6.240659552766273e-05} +{"train_loss": 0.002065329346805811, "global_step": 30291, "epoch": 254, "lr": 6.24044492931408e-05} +{"train_loss": 0.004288653843104839, "global_step": 30292, "epoch": 254, "lr": 6.240230303426405e-05} +{"train_loss": 0.0035887793637812138, "global_step": 30293, "epoch": 254, "lr": 6.240015675103671e-05} +{"train_loss": 0.003910181578248739, "global_step": 30294, "epoch": 254, "lr": 6.2398010443463e-05} +{"train_loss": 0.00541138369590044, "global_step": 30295, "epoch": 254, "lr": 6.239586411154712e-05} +{"train_loss": 0.0032324756029993296, "global_step": 30296, "epoch": 254, "lr": 6.239371775529325e-05} +{"train_loss": 0.0033539209980517626, "global_step": 30297, "epoch": 254, "lr": 6.239157137470567e-05} +{"train_loss": 0.003124558599665761, "global_step": 30298, "epoch": 254, "lr": 6.238942496978856e-05} +{"train_loss": 0.005029088351875544, "global_step": 30299, "epoch": 254, "lr": 6.238727854054613e-05} +{"train_loss": 0.003229857422411442, "global_step": 30300, "epoch": 254, "lr": 6.238513208698261e-05} +{"train_loss": 0.0016710130730643868, "global_step": 30301, "epoch": 254, "lr": 6.238298560910221e-05} +{"train_loss": 0.004142056684941053, "global_step": 30302, "epoch": 254, "lr": 6.238083910690914e-05} +{"train_loss": 0.0035363351926207542, "global_step": 30303, "epoch": 254, "lr": 6.237869258040761e-05} +{"train_loss": 0.0054039680399000645, "global_step": 30304, "epoch": 254, "lr": 6.237654602960184e-05} +{"train_loss": 0.0038387547247111797, "global_step": 30305, "epoch": 254, "lr": 6.237439945449603e-05} +{"train_loss": 0.0032839798368513584, "global_step": 30306, "epoch": 254, "lr": 6.237225285509443e-05} +{"train_loss": 0.0025522836949676275, "global_step": 30307, "epoch": 254, "lr": 6.237010623140124e-05} +{"train_loss": 0.002659191843122244, "global_step": 30308, "epoch": 254, "lr": 6.236795958342064e-05} +{"train_loss": 0.0030838351231068373, "global_step": 30309, "epoch": 254, "lr": 6.236581291115689e-05} +{"train_loss": 0.003249627538025379, "global_step": 30310, "epoch": 254, "lr": 6.236366621461418e-05} +{"train_loss": 0.005299392621964216, "global_step": 30311, "epoch": 254, "lr": 6.236151949379674e-05} +{"train_loss": 0.004328308627009392, "global_step": 30312, "epoch": 254, "lr": 6.235937274870877e-05} +{"train_loss": 0.007041572127491236, "global_step": 30313, "epoch": 254, "lr": 6.235722597935449e-05} +{"train_loss": 0.00433250842615962, "global_step": 30314, "epoch": 254, "lr": 6.235507918573813e-05} +{"train_loss": 0.00247683166526258, "global_step": 30315, "epoch": 254, "lr": 6.235293236786388e-05} +{"train_loss": 0.003304211888462305, "global_step": 30316, "epoch": 254, "lr": 6.235078552573597e-05} +{"train_loss": 0.002419792814180255, "global_step": 30317, "epoch": 254, "lr": 6.234863865935861e-05} +{"train_loss": 0.0029531701002269983, "global_step": 30318, "epoch": 254, "lr": 6.234649176873603e-05} +{"train_loss": 0.0025812347885221243, "global_step": 30319, "epoch": 254, "lr": 6.234434485387241e-05} +{"train_loss": 0.002722009550780058, "global_step": 30320, "epoch": 254, "lr": 6.234219791477202e-05} +{"train_loss": 0.0041579934768378735, "global_step": 30321, "epoch": 254, "lr": 6.234005095143902e-05} +{"train_loss": 0.005318335723131895, "global_step": 30322, "epoch": 254, "lr": 6.233790396387764e-05} +{"train_loss": 0.0031306168530136347, "global_step": 30323, "epoch": 254, "lr": 6.233575695209213e-05} +{"train_loss": 0.003550482913851738, "global_step": 30324, "epoch": 254, "lr": 6.233360991608666e-05} +{"train_loss": 0.004124418832361698, "global_step": 30325, "epoch": 254, "lr": 6.233146285586546e-05} +{"train_loss": 0.002473062602803111, "global_step": 30326, "epoch": 254, "lr": 6.232931577143277e-05} +{"train_loss": 0.003906541503965855, "global_step": 30327, "epoch": 254, "lr": 6.232716866279277e-05} +{"train_loss": 0.0017616476397961378, "global_step": 30328, "epoch": 254, "lr": 6.23250215299497e-05} +{"train_loss": 0.0032339629251509905, "global_step": 30329, "epoch": 254, "lr": 6.232287437290777e-05} +{"train_loss": 0.004108439199626446, "global_step": 30330, "epoch": 254, "lr": 6.232072719167118e-05} +{"train_loss": 0.004147327039390802, "global_step": 30331, "epoch": 254, "lr": 6.231857998624415e-05} +{"train_loss": 0.0036406416911631823, "global_step": 30332, "epoch": 254, "lr": 6.231643275663091e-05} +{"train_loss": 0.004236661363393068, "global_step": 30333, "epoch": 254, "lr": 6.23142855028357e-05} +{"train_loss": 0.0035400390625, "global_step": 30334, "epoch": 254, "lr": 6.231213822486268e-05} +{"train_loss": 0.0023631304502487183, "global_step": 30335, "epoch": 254, "lr": 6.23099909227161e-05} +{"train_loss": 0.005055516492575407, "global_step": 30336, "epoch": 254, "lr": 6.230784359640016e-05} +{"train_loss": 0.004530990030616522, "global_step": 30337, "epoch": 254, "lr": 6.23056962459191e-05} +{"train_loss": 0.00406675273552537, "global_step": 30338, "epoch": 254, "lr": 6.23035488712771e-05} +{"train_loss": 0.0028986455872654915, "global_step": 30339, "epoch": 254, "lr": 6.230140147247842e-05} +{"train_loss": 0.0024368332233279943, "global_step": 30340, "epoch": 254, "lr": 6.229925404952723e-05} +{"train_loss": 0.002954652300104499, "global_step": 30341, "epoch": 254, "lr": 6.229710660242776e-05} +{"train_loss": 0.0039785741828382015, "global_step": 30342, "epoch": 254, "lr": 6.229495913118426e-05} +{"train_loss": 0.002672711620107293, "global_step": 30343, "epoch": 254, "lr": 6.229281163580092e-05} +{"train_loss": 0.003599124070366516, "global_step": 30344, "epoch": 254, "lr": 6.229066411628195e-05, "val_loss": 0.020544428378343582} +{"train_loss": 0.0042501771822571754, "global_step": 30345, "epoch": 255, "lr": 6.228851657263158e-05} +{"train_loss": 0.006139554549008608, "global_step": 30346, "epoch": 255, "lr": 6.2286369004854e-05} +{"train_loss": 0.004862661939114332, "global_step": 30347, "epoch": 255, "lr": 6.228422141295346e-05} +{"train_loss": 0.00293351779691875, "global_step": 30348, "epoch": 255, "lr": 6.228207379693416e-05} +{"train_loss": 0.0024547509383410215, "global_step": 30349, "epoch": 255, "lr": 6.227992615680033e-05} +{"train_loss": 0.0026769498363137245, "global_step": 30350, "epoch": 255, "lr": 6.227777849255617e-05} +{"train_loss": 0.0029514015186578035, "global_step": 30351, "epoch": 255, "lr": 6.227563080420592e-05} +{"train_loss": 0.0044463519006967545, "global_step": 30352, "epoch": 255, "lr": 6.227348309175375e-05} +{"train_loss": 0.0035555108916014433, "global_step": 30353, "epoch": 255, "lr": 6.227133535520393e-05} +{"train_loss": 0.004443466663360596, "global_step": 30354, "epoch": 255, "lr": 6.226918759456065e-05} +{"train_loss": 0.0029617140535265207, "global_step": 30355, "epoch": 255, "lr": 6.226703980982813e-05} +{"train_loss": 0.0034872060641646385, "global_step": 30356, "epoch": 255, "lr": 6.226489200101058e-05} +{"train_loss": 0.0032760093454271555, "global_step": 30357, "epoch": 255, "lr": 6.226274416811223e-05} +{"train_loss": 0.003609693143516779, "global_step": 30358, "epoch": 255, "lr": 6.226059631113731e-05} +{"train_loss": 0.0033749633003026247, "global_step": 30359, "epoch": 255, "lr": 6.225844843009e-05} +{"train_loss": 0.002777271205559373, "global_step": 30360, "epoch": 255, "lr": 6.225630052497453e-05} +{"train_loss": 0.0022803563624620438, "global_step": 30361, "epoch": 255, "lr": 6.225415259579513e-05} +{"train_loss": 0.00405581621453166, "global_step": 30362, "epoch": 255, "lr": 6.225200464255602e-05} +{"train_loss": 0.00219711079262197, "global_step": 30363, "epoch": 255, "lr": 6.22498566652614e-05} +{"train_loss": 0.0027143037877976894, "global_step": 30364, "epoch": 255, "lr": 6.224770866391549e-05} +{"train_loss": 0.00400224793702364, "global_step": 30365, "epoch": 255, "lr": 6.224556063852252e-05} +{"train_loss": 0.0038494463078677654, "global_step": 30366, "epoch": 255, "lr": 6.22434125890867e-05} +{"train_loss": 0.004807630088180304, "global_step": 30367, "epoch": 255, "lr": 6.224126451561224e-05} +{"train_loss": 0.0021168766543269157, "global_step": 30368, "epoch": 255, "lr": 6.223911641810336e-05} +{"train_loss": 0.003878466784954071, "global_step": 30369, "epoch": 255, "lr": 6.223696829656429e-05} +{"train_loss": 0.0028291898779571056, "global_step": 30370, "epoch": 255, "lr": 6.223482015099927e-05} +{"train_loss": 0.004283906891942024, "global_step": 30371, "epoch": 255, "lr": 6.223267198141245e-05} +{"train_loss": 0.0024092167150229216, "global_step": 30372, "epoch": 255, "lr": 6.22305237878081e-05} +{"train_loss": 0.003529901150614023, "global_step": 30373, "epoch": 255, "lr": 6.222837557019041e-05} +{"train_loss": 0.003161090426146984, "global_step": 30374, "epoch": 255, "lr": 6.222622732856363e-05} +{"train_loss": 0.0016484324587509036, "global_step": 30375, "epoch": 255, "lr": 6.222407906293193e-05} +{"train_loss": 0.0026461214292794466, "global_step": 30376, "epoch": 255, "lr": 6.222193077329958e-05} +{"train_loss": 0.002916275057941675, "global_step": 30377, "epoch": 255, "lr": 6.221978245967078e-05} +{"train_loss": 0.004109798930585384, "global_step": 30378, "epoch": 255, "lr": 6.221763412204973e-05} +{"train_loss": 0.0066941725090146065, "global_step": 30379, "epoch": 255, "lr": 6.221548576044065e-05} +{"train_loss": 0.0013561610830947757, "global_step": 30380, "epoch": 255, "lr": 6.221333737484778e-05} +{"train_loss": 0.002928315196186304, "global_step": 30381, "epoch": 255, "lr": 6.221118896527533e-05} +{"train_loss": 0.005635788664221764, "global_step": 30382, "epoch": 255, "lr": 6.220904053172751e-05} +{"train_loss": 0.003081201110035181, "global_step": 30383, "epoch": 255, "lr": 6.220689207420855e-05} +{"train_loss": 0.002547501353546977, "global_step": 30384, "epoch": 255, "lr": 6.220474359272266e-05} +{"train_loss": 0.0018549715168774128, "global_step": 30385, "epoch": 255, "lr": 6.220259508727407e-05} +{"train_loss": 0.004171634092926979, "global_step": 30386, "epoch": 255, "lr": 6.220044655786697e-05} +{"train_loss": 0.0028305219020694494, "global_step": 30387, "epoch": 255, "lr": 6.219829800450561e-05} +{"train_loss": 0.005376520100980997, "global_step": 30388, "epoch": 255, "lr": 6.219614942719418e-05} +{"train_loss": 0.0054901372641325, "global_step": 30389, "epoch": 255, "lr": 6.219400082593694e-05} +{"train_loss": 0.0038906813133507967, "global_step": 30390, "epoch": 255, "lr": 6.219185220073805e-05} +{"train_loss": 0.001974770100787282, "global_step": 30391, "epoch": 255, "lr": 6.218970355160178e-05} +{"train_loss": 0.003276965580880642, "global_step": 30392, "epoch": 255, "lr": 6.218755487853232e-05} +{"train_loss": 0.0036765423137694597, "global_step": 30393, "epoch": 255, "lr": 6.21854061815339e-05} +{"train_loss": 0.0019949746783822775, "global_step": 30394, "epoch": 255, "lr": 6.218325746061074e-05} +{"train_loss": 0.003390819299966097, "global_step": 30395, "epoch": 255, "lr": 6.218110871576705e-05} +{"train_loss": 0.0045974538661539555, "global_step": 30396, "epoch": 255, "lr": 6.217895994700707e-05} +{"train_loss": 0.005047171376645565, "global_step": 30397, "epoch": 255, "lr": 6.217681115433498e-05} +{"train_loss": 0.0029348295647650957, "global_step": 30398, "epoch": 255, "lr": 6.217466233775504e-05} +{"train_loss": 0.0031040110625326633, "global_step": 30399, "epoch": 255, "lr": 6.217251349727145e-05} +{"train_loss": 0.004993526265025139, "global_step": 30400, "epoch": 255, "lr": 6.217036463288841e-05} +{"train_loss": 0.004083441570401192, "global_step": 30401, "epoch": 255, "lr": 6.21682157446102e-05} +{"train_loss": 0.003730419557541609, "global_step": 30402, "epoch": 255, "lr": 6.216606683244096e-05} +{"train_loss": 0.002351208822801709, "global_step": 30403, "epoch": 255, "lr": 6.216391789638497e-05} +{"train_loss": 0.0036925594322383404, "global_step": 30404, "epoch": 255, "lr": 6.21617689364464e-05} +{"train_loss": 0.003005290636792779, "global_step": 30405, "epoch": 255, "lr": 6.215961995262953e-05} +{"train_loss": 0.002989937085658312, "global_step": 30406, "epoch": 255, "lr": 6.215747094493852e-05} +{"train_loss": 0.004832826554775238, "global_step": 30407, "epoch": 255, "lr": 6.215532191337763e-05} +{"train_loss": 0.004775004927068949, "global_step": 30408, "epoch": 255, "lr": 6.215317285795106e-05} +{"train_loss": 0.0036239016335457563, "global_step": 30409, "epoch": 255, "lr": 6.215102377866303e-05} +{"train_loss": 0.004214516840875149, "global_step": 30410, "epoch": 255, "lr": 6.214887467551777e-05} +{"train_loss": 0.0023887897841632366, "global_step": 30411, "epoch": 255, "lr": 6.214672554851948e-05} +{"train_loss": 0.0034735165536403656, "global_step": 30412, "epoch": 255, "lr": 6.21445763976724e-05} +{"train_loss": 0.002466364298015833, "global_step": 30413, "epoch": 255, "lr": 6.214242722298074e-05} +{"train_loss": 0.0036384486593306065, "global_step": 30414, "epoch": 255, "lr": 6.214027802444872e-05} +{"train_loss": 0.004703447222709656, "global_step": 30415, "epoch": 255, "lr": 6.213812880208055e-05} +{"train_loss": 0.003713296726346016, "global_step": 30416, "epoch": 255, "lr": 6.213597955588049e-05} +{"train_loss": 0.004199938848614693, "global_step": 30417, "epoch": 255, "lr": 6.21338302858527e-05} +{"train_loss": 0.004573347046971321, "global_step": 30418, "epoch": 255, "lr": 6.213168099200146e-05} +{"train_loss": 0.0029561230912804604, "global_step": 30419, "epoch": 255, "lr": 6.212953167433093e-05} +{"train_loss": 0.0035200188867747784, "global_step": 30420, "epoch": 255, "lr": 6.212738233284538e-05} +{"train_loss": 0.002555470447987318, "global_step": 30421, "epoch": 255, "lr": 6.212523296754901e-05} +{"train_loss": 0.0033784881234169006, "global_step": 30422, "epoch": 255, "lr": 6.212308357844605e-05} +{"train_loss": 0.0045642065815627575, "global_step": 30423, "epoch": 255, "lr": 6.212093416554068e-05} +{"train_loss": 0.002717368071898818, "global_step": 30424, "epoch": 255, "lr": 6.211878472883716e-05} +{"train_loss": 0.0027851746417582035, "global_step": 30425, "epoch": 255, "lr": 6.211663526833972e-05} +{"train_loss": 0.0028742870781570673, "global_step": 30426, "epoch": 255, "lr": 6.211448578405256e-05} +{"train_loss": 0.005188634619116783, "global_step": 30427, "epoch": 255, "lr": 6.211233627597989e-05} +{"train_loss": 0.0021541505120694637, "global_step": 30428, "epoch": 255, "lr": 6.211018674412593e-05} +{"train_loss": 0.0037375763058662415, "global_step": 30429, "epoch": 255, "lr": 6.210803718849491e-05} +{"train_loss": 0.002726973732933402, "global_step": 30430, "epoch": 255, "lr": 6.210588760909107e-05} +{"train_loss": 0.0016596706118434668, "global_step": 30431, "epoch": 255, "lr": 6.210373800591862e-05} +{"train_loss": 0.002830651355907321, "global_step": 30432, "epoch": 255, "lr": 6.210158837898176e-05} +{"train_loss": 0.0038502211682498455, "global_step": 30433, "epoch": 255, "lr": 6.209943872828474e-05} +{"train_loss": 0.002439640462398529, "global_step": 30434, "epoch": 255, "lr": 6.209728905383176e-05} +{"train_loss": 0.0034755400847643614, "global_step": 30435, "epoch": 255, "lr": 6.209513935562703e-05} +{"train_loss": 0.001977507956326008, "global_step": 30436, "epoch": 255, "lr": 6.209298963367479e-05} +{"train_loss": 0.002483982127159834, "global_step": 30437, "epoch": 255, "lr": 6.209083988797926e-05} +{"train_loss": 0.004230998922139406, "global_step": 30438, "epoch": 255, "lr": 6.208869011854466e-05} +{"train_loss": 0.004487363155931234, "global_step": 30439, "epoch": 255, "lr": 6.208654032537522e-05} +{"train_loss": 0.002055640798062086, "global_step": 30440, "epoch": 255, "lr": 6.208439050847514e-05} +{"train_loss": 0.0028222529217600822, "global_step": 30441, "epoch": 255, "lr": 6.208224066784864e-05} +{"train_loss": 0.0018260360229760408, "global_step": 30442, "epoch": 255, "lr": 6.208009080349996e-05} +{"train_loss": 0.003014066955074668, "global_step": 30443, "epoch": 255, "lr": 6.20779409154333e-05} +{"train_loss": 0.004042420070618391, "global_step": 30444, "epoch": 255, "lr": 6.207579100365291e-05} +{"train_loss": 0.0033917019609361887, "global_step": 30445, "epoch": 255, "lr": 6.207364106816298e-05} +{"train_loss": 0.002046093111857772, "global_step": 30446, "epoch": 255, "lr": 6.207149110896775e-05} +{"train_loss": 0.002772327046841383, "global_step": 30447, "epoch": 255, "lr": 6.206934112607145e-05} +{"train_loss": 0.004914654418826103, "global_step": 30448, "epoch": 255, "lr": 6.206719111947828e-05} +{"train_loss": 0.0032449227292090654, "global_step": 30449, "epoch": 255, "lr": 6.206504108919246e-05} +{"train_loss": 0.002399328164756298, "global_step": 30450, "epoch": 255, "lr": 6.206289103521823e-05} +{"train_loss": 0.00208658492192626, "global_step": 30451, "epoch": 255, "lr": 6.206074095755979e-05} +{"train_loss": 0.0026508630253374577, "global_step": 30452, "epoch": 255, "lr": 6.205859085622139e-05} +{"train_loss": 0.0021345706190913916, "global_step": 30453, "epoch": 255, "lr": 6.205644073120724e-05} +{"train_loss": 0.00442934688180685, "global_step": 30454, "epoch": 255, "lr": 6.205429058252155e-05} +{"train_loss": 0.0031249425373971462, "global_step": 30455, "epoch": 255, "lr": 6.205214041016854e-05} +{"train_loss": 0.0017547068418934941, "global_step": 30456, "epoch": 255, "lr": 6.204999021415244e-05} +{"train_loss": 0.00316026178188622, "global_step": 30457, "epoch": 255, "lr": 6.204783999447747e-05} +{"train_loss": 0.0022668123710900545, "global_step": 30458, "epoch": 255, "lr": 6.204568975114787e-05} +{"train_loss": 0.003031764877960086, "global_step": 30459, "epoch": 255, "lr": 6.204353948416783e-05} +{"train_loss": 0.00396409397944808, "global_step": 30460, "epoch": 255, "lr": 6.20413891935416e-05} +{"train_loss": 0.0021454242523759604, "global_step": 30461, "epoch": 255, "lr": 6.203923887927337e-05} +{"train_loss": 0.003448770847171545, "global_step": 30462, "epoch": 255, "lr": 6.20370885413674e-05} +{"train_loss": 0.0033619993203906576, "global_step": 30463, "epoch": 255, "lr": 6.203493817982787e-05, "val_loss": 0.013436408713459969, "train_action_mse_error": 5.176446939003654e-05} +{"train_loss": 0.0026281145401299, "global_step": 30464, "epoch": 256, "lr": 6.203278779465905e-05} +{"train_loss": 0.003933100961148739, "global_step": 30465, "epoch": 256, "lr": 6.203063738586512e-05} +{"train_loss": 0.0017320041079074144, "global_step": 30466, "epoch": 256, "lr": 6.202848695345032e-05} +{"train_loss": 0.0023308792151510715, "global_step": 30467, "epoch": 256, "lr": 6.202633649741888e-05} +{"train_loss": 0.0020559479016810656, "global_step": 30468, "epoch": 256, "lr": 6.2024186017775e-05} +{"train_loss": 0.002118089236319065, "global_step": 30469, "epoch": 256, "lr": 6.202203551452292e-05} +{"train_loss": 0.0021685203537344933, "global_step": 30470, "epoch": 256, "lr": 6.201988498766688e-05} +{"train_loss": 0.004919777624309063, "global_step": 30471, "epoch": 256, "lr": 6.201773443721107e-05} +{"train_loss": 0.003577950643375516, "global_step": 30472, "epoch": 256, "lr": 6.201558386315969e-05} +{"train_loss": 0.0019702452700585127, "global_step": 30473, "epoch": 256, "lr": 6.201343326551703e-05} +{"train_loss": 0.00437572319060564, "global_step": 30474, "epoch": 256, "lr": 6.201128264428726e-05} +{"train_loss": 0.003586147679015994, "global_step": 30475, "epoch": 256, "lr": 6.200913199947462e-05} +{"train_loss": 0.0030671036802232265, "global_step": 30476, "epoch": 256, "lr": 6.200698133108333e-05} +{"train_loss": 0.002564365044236183, "global_step": 30477, "epoch": 256, "lr": 6.200483063911763e-05} +{"train_loss": 0.0035093696787953377, "global_step": 30478, "epoch": 256, "lr": 6.200267992358172e-05} +{"train_loss": 0.005907035432755947, "global_step": 30479, "epoch": 256, "lr": 6.200052918447982e-05} +{"train_loss": 0.004504595883190632, "global_step": 30480, "epoch": 256, "lr": 6.199837842181617e-05} +{"train_loss": 0.0031712190248072147, "global_step": 30481, "epoch": 256, "lr": 6.199622763559499e-05} +{"train_loss": 0.003635098459199071, "global_step": 30482, "epoch": 256, "lr": 6.19940768258205e-05} +{"train_loss": 0.004333641845732927, "global_step": 30483, "epoch": 256, "lr": 6.199192599249692e-05} +{"train_loss": 0.0030385185964405537, "global_step": 30484, "epoch": 256, "lr": 6.198977513562849e-05} +{"train_loss": 0.003960577771067619, "global_step": 30485, "epoch": 256, "lr": 6.198762425521939e-05} +{"train_loss": 0.0023081712424755096, "global_step": 30486, "epoch": 256, "lr": 6.198547335127388e-05} +{"train_loss": 0.002345615765079856, "global_step": 30487, "epoch": 256, "lr": 6.198332242379618e-05} +{"train_loss": 0.0021550296805799007, "global_step": 30488, "epoch": 256, "lr": 6.198117147279049e-05} +{"train_loss": 0.004296031780540943, "global_step": 30489, "epoch": 256, "lr": 6.197902049826107e-05} +{"train_loss": 0.002644701162353158, "global_step": 30490, "epoch": 256, "lr": 6.197686950021212e-05} +{"train_loss": 0.002619353821501136, "global_step": 30491, "epoch": 256, "lr": 6.197471847864785e-05} +{"train_loss": 0.0037171076983213425, "global_step": 30492, "epoch": 256, "lr": 6.197256743357251e-05} +{"train_loss": 0.0034566428512334824, "global_step": 30493, "epoch": 256, "lr": 6.197041636499031e-05} +{"train_loss": 0.003538332413882017, "global_step": 30494, "epoch": 256, "lr": 6.196826527290549e-05} +{"train_loss": 0.0042587826028466225, "global_step": 30495, "epoch": 256, "lr": 6.196611415732224e-05} +{"train_loss": 0.0034973795991390944, "global_step": 30496, "epoch": 256, "lr": 6.196396301824481e-05} +{"train_loss": 0.003164042020216584, "global_step": 30497, "epoch": 256, "lr": 6.196181185567742e-05} +{"train_loss": 0.0027553413528949022, "global_step": 30498, "epoch": 256, "lr": 6.195966066962428e-05} +{"train_loss": 0.002612379379570484, "global_step": 30499, "epoch": 256, "lr": 6.195750946008965e-05} +{"train_loss": 0.0015493301907554269, "global_step": 30500, "epoch": 256, "lr": 6.195535822707769e-05} +{"train_loss": 0.003072609892114997, "global_step": 30501, "epoch": 256, "lr": 6.195320697059269e-05} +{"train_loss": 0.004373069386929274, "global_step": 30502, "epoch": 256, "lr": 6.195105569063884e-05} +{"train_loss": 0.0019698746036738157, "global_step": 30503, "epoch": 256, "lr": 6.194890438722037e-05} +{"train_loss": 0.0022952568251639605, "global_step": 30504, "epoch": 256, "lr": 6.19467530603415e-05} +{"train_loss": 0.0023633120581507683, "global_step": 30505, "epoch": 256, "lr": 6.194460171000646e-05} +{"train_loss": 0.003397848457098007, "global_step": 30506, "epoch": 256, "lr": 6.194245033621946e-05} +{"train_loss": 0.002975125564262271, "global_step": 30507, "epoch": 256, "lr": 6.194029893898474e-05} +{"train_loss": 0.002598398132249713, "global_step": 30508, "epoch": 256, "lr": 6.193814751830653e-05} +{"train_loss": 0.0024094656109809875, "global_step": 30509, "epoch": 256, "lr": 6.193599607418903e-05} +{"train_loss": 0.0020015407353639603, "global_step": 30510, "epoch": 256, "lr": 6.193384460663648e-05} +{"train_loss": 0.0023530153557658195, "global_step": 30511, "epoch": 256, "lr": 6.19316931156531e-05} +{"train_loss": 0.003047656500712037, "global_step": 30512, "epoch": 256, "lr": 6.19295416012431e-05} +{"train_loss": 0.002091026632115245, "global_step": 30513, "epoch": 256, "lr": 6.192739006341074e-05} +{"train_loss": 0.0026377553585916758, "global_step": 30514, "epoch": 256, "lr": 6.192523850216023e-05} +{"train_loss": 0.005122072994709015, "global_step": 30515, "epoch": 256, "lr": 6.192308691749578e-05} +{"train_loss": 0.0030121246818453074, "global_step": 30516, "epoch": 256, "lr": 6.192093530942162e-05} +{"train_loss": 0.0020504675339907408, "global_step": 30517, "epoch": 256, "lr": 6.191878367794197e-05} +{"train_loss": 0.001590605708770454, "global_step": 30518, "epoch": 256, "lr": 6.191663202306107e-05} +{"train_loss": 0.0030767854768782854, "global_step": 30519, "epoch": 256, "lr": 6.191448034478313e-05} +{"train_loss": 0.0033808357547968626, "global_step": 30520, "epoch": 256, "lr": 6.19123286431124e-05} +{"train_loss": 0.0013156764907762408, "global_step": 30521, "epoch": 256, "lr": 6.191017691805307e-05} +{"train_loss": 0.002214019186794758, "global_step": 30522, "epoch": 256, "lr": 6.190802516960938e-05} +{"train_loss": 0.0026640973519533873, "global_step": 30523, "epoch": 256, "lr": 6.190587339778556e-05} +{"train_loss": 0.002576572122052312, "global_step": 30524, "epoch": 256, "lr": 6.190372160258582e-05} +{"train_loss": 0.0030558372382074594, "global_step": 30525, "epoch": 256, "lr": 6.190156978401439e-05} +{"train_loss": 0.003809957532212138, "global_step": 30526, "epoch": 256, "lr": 6.18994179420755e-05} +{"train_loss": 0.0034960927441716194, "global_step": 30527, "epoch": 256, "lr": 6.18972660767734e-05} +{"train_loss": 0.003454171819612384, "global_step": 30528, "epoch": 256, "lr": 6.189511418811227e-05} +{"train_loss": 0.002007435541599989, "global_step": 30529, "epoch": 256, "lr": 6.189296227609634e-05} +{"train_loss": 0.0021215921733528376, "global_step": 30530, "epoch": 256, "lr": 6.189081034072988e-05} +{"train_loss": 0.002461883006617427, "global_step": 30531, "epoch": 256, "lr": 6.188865838201706e-05} +{"train_loss": 0.002244817791506648, "global_step": 30532, "epoch": 256, "lr": 6.188650639996213e-05} +{"train_loss": 0.0039128391072154045, "global_step": 30533, "epoch": 256, "lr": 6.188435439456935e-05} +{"train_loss": 0.0029027466662228107, "global_step": 30534, "epoch": 256, "lr": 6.188220236584288e-05} +{"train_loss": 0.0020200025755912066, "global_step": 30535, "epoch": 256, "lr": 6.188005031378697e-05} +{"train_loss": 0.0028300085105001926, "global_step": 30536, "epoch": 256, "lr": 6.187789823840586e-05} +{"train_loss": 0.004880981985479593, "global_step": 30537, "epoch": 256, "lr": 6.187574613970376e-05} +{"train_loss": 0.004535907879471779, "global_step": 30538, "epoch": 256, "lr": 6.187359401768492e-05} +{"train_loss": 0.002326776972040534, "global_step": 30539, "epoch": 256, "lr": 6.187144187235353e-05} +{"train_loss": 0.0038970308378338814, "global_step": 30540, "epoch": 256, "lr": 6.186928970371383e-05} +{"train_loss": 0.003078587120398879, "global_step": 30541, "epoch": 256, "lr": 6.186713751177006e-05} +{"train_loss": 0.003945489414036274, "global_step": 30542, "epoch": 256, "lr": 6.186498529652642e-05} +{"train_loss": 0.002966306172311306, "global_step": 30543, "epoch": 256, "lr": 6.186283305798715e-05} +{"train_loss": 0.0031080832704901695, "global_step": 30544, "epoch": 256, "lr": 6.186068079615648e-05} +{"train_loss": 0.003067704848945141, "global_step": 30545, "epoch": 256, "lr": 6.185852851103863e-05} +{"train_loss": 0.0019325653556734324, "global_step": 30546, "epoch": 256, "lr": 6.185637620263782e-05} +{"train_loss": 0.002883950714021921, "global_step": 30547, "epoch": 256, "lr": 6.185422387095828e-05} +{"train_loss": 0.004415476229041815, "global_step": 30548, "epoch": 256, "lr": 6.185207151600425e-05} +{"train_loss": 0.0017276279395446181, "global_step": 30549, "epoch": 256, "lr": 6.184991913777995e-05} +{"train_loss": 0.0026294724084436893, "global_step": 30550, "epoch": 256, "lr": 6.184776673628958e-05} +{"train_loss": 0.002916384022682905, "global_step": 30551, "epoch": 256, "lr": 6.184561431153739e-05} +{"train_loss": 0.0034843948669731617, "global_step": 30552, "epoch": 256, "lr": 6.184346186352762e-05} +{"train_loss": 0.00273723853752017, "global_step": 30553, "epoch": 256, "lr": 6.184130939226447e-05} +{"train_loss": 0.0023002605885267258, "global_step": 30554, "epoch": 256, "lr": 6.183915689775216e-05} +{"train_loss": 0.0023239278234541416, "global_step": 30555, "epoch": 256, "lr": 6.183700437999494e-05} +{"train_loss": 0.004662282299250364, "global_step": 30556, "epoch": 256, "lr": 6.183485183899702e-05} +{"train_loss": 0.0023633865639567375, "global_step": 30557, "epoch": 256, "lr": 6.183269927476263e-05} +{"train_loss": 0.0018411637283861637, "global_step": 30558, "epoch": 256, "lr": 6.183054668729601e-05} +{"train_loss": 0.002980389865115285, "global_step": 30559, "epoch": 256, "lr": 6.18283940766014e-05} +{"train_loss": 0.004442181438207626, "global_step": 30560, "epoch": 256, "lr": 6.182624144268296e-05} +{"train_loss": 0.0022031660191714764, "global_step": 30561, "epoch": 256, "lr": 6.182408878554497e-05} +{"train_loss": 0.0022211510222405195, "global_step": 30562, "epoch": 256, "lr": 6.182193610519163e-05} +{"train_loss": 0.0025617508217692375, "global_step": 30563, "epoch": 256, "lr": 6.18197834016272e-05} +{"train_loss": 0.003314524656161666, "global_step": 30564, "epoch": 256, "lr": 6.181763067485591e-05} +{"train_loss": 0.0028672991320490837, "global_step": 30565, "epoch": 256, "lr": 6.181547792488194e-05} +{"train_loss": 0.002957258839160204, "global_step": 30566, "epoch": 256, "lr": 6.181332515170954e-05} +{"train_loss": 0.0028932567220181227, "global_step": 30567, "epoch": 256, "lr": 6.181117235534294e-05} +{"train_loss": 0.0013797598658129573, "global_step": 30568, "epoch": 256, "lr": 6.180901953578636e-05} +{"train_loss": 0.003740857355296612, "global_step": 30569, "epoch": 256, "lr": 6.180686669304404e-05} +{"train_loss": 0.004043999128043652, "global_step": 30570, "epoch": 256, "lr": 6.18047138271202e-05} +{"train_loss": 0.0020635046530514956, "global_step": 30571, "epoch": 256, "lr": 6.180256093801907e-05} +{"train_loss": 0.0035279016010463238, "global_step": 30572, "epoch": 256, "lr": 6.180040802574486e-05} +{"train_loss": 0.001825801795348525, "global_step": 30573, "epoch": 256, "lr": 6.179825509030182e-05} +{"train_loss": 0.002974929055199027, "global_step": 30574, "epoch": 256, "lr": 6.179610213169415e-05} +{"train_loss": 0.003767682472243905, "global_step": 30575, "epoch": 256, "lr": 6.179394914992612e-05} +{"train_loss": 0.003000276628881693, "global_step": 30576, "epoch": 256, "lr": 6.17917961450019e-05} +{"train_loss": 0.003231672802940011, "global_step": 30577, "epoch": 256, "lr": 6.178964311692576e-05} +{"train_loss": 0.0029256290290504694, "global_step": 30578, "epoch": 256, "lr": 6.178749006570192e-05} +{"train_loss": 0.0035654399544000626, "global_step": 30579, "epoch": 256, "lr": 6.178533699133461e-05} +{"train_loss": 0.0022269180044531822, "global_step": 30580, "epoch": 256, "lr": 6.178318389382804e-05} +{"train_loss": 0.0028294785879552364, "global_step": 30581, "epoch": 256, "lr": 6.178103077318645e-05} +{"train_loss": 0.0029920955754018258, "global_step": 30582, "epoch": 256, "lr": 6.177887762941405e-05, "val_loss": 0.01930108293890953} +{"train_loss": 0.0036863547284156084, "global_step": 30583, "epoch": 257, "lr": 6.177672446251511e-05} +{"train_loss": 0.0016471118433400989, "global_step": 30584, "epoch": 257, "lr": 6.177457127249382e-05} +{"train_loss": 0.0034029092639684677, "global_step": 30585, "epoch": 257, "lr": 6.17724180593544e-05} +{"train_loss": 0.002752765081822872, "global_step": 30586, "epoch": 257, "lr": 6.177026482310111e-05} +{"train_loss": 0.004703195299953222, "global_step": 30587, "epoch": 257, "lr": 6.176811156373816e-05} +{"train_loss": 0.003003276651725173, "global_step": 30588, "epoch": 257, "lr": 6.176595828126978e-05} +{"train_loss": 0.002173385117202997, "global_step": 30589, "epoch": 257, "lr": 6.176380497570022e-05} +{"train_loss": 0.0027894277591258287, "global_step": 30590, "epoch": 257, "lr": 6.176165164703365e-05} +{"train_loss": 0.0020416767802089453, "global_step": 30591, "epoch": 257, "lr": 6.175949829527435e-05} +{"train_loss": 0.0023055144120007753, "global_step": 30592, "epoch": 257, "lr": 6.175734492042653e-05} +{"train_loss": 0.0029124035499989986, "global_step": 30593, "epoch": 257, "lr": 6.175519152249442e-05} +{"train_loss": 0.0022445679642260075, "global_step": 30594, "epoch": 257, "lr": 6.175303810148223e-05} +{"train_loss": 0.0029287836514413357, "global_step": 30595, "epoch": 257, "lr": 6.175088465739423e-05} +{"train_loss": 0.003238084027543664, "global_step": 30596, "epoch": 257, "lr": 6.174873119023461e-05} +{"train_loss": 0.002034020610153675, "global_step": 30597, "epoch": 257, "lr": 6.174657770000761e-05} +{"train_loss": 0.0027090716175734997, "global_step": 30598, "epoch": 257, "lr": 6.174442418671746e-05} +{"train_loss": 0.0021622106432914734, "global_step": 30599, "epoch": 257, "lr": 6.174227065036839e-05} +{"train_loss": 0.0019770197104662657, "global_step": 30600, "epoch": 257, "lr": 6.174011709096464e-05} +{"train_loss": 0.002445350168272853, "global_step": 30601, "epoch": 257, "lr": 6.173796350851041e-05} +{"train_loss": 0.004349295049905777, "global_step": 30602, "epoch": 257, "lr": 6.173580990300995e-05} +{"train_loss": 0.003330560866743326, "global_step": 30603, "epoch": 257, "lr": 6.173365627446748e-05} +{"train_loss": 0.003485668683424592, "global_step": 30604, "epoch": 257, "lr": 6.173150262288722e-05} +{"train_loss": 0.0027448812033981085, "global_step": 30605, "epoch": 257, "lr": 6.172934894827341e-05} +{"train_loss": 0.0014532917411997914, "global_step": 30606, "epoch": 257, "lr": 6.17271952506303e-05} +{"train_loss": 0.0025467851664870977, "global_step": 30607, "epoch": 257, "lr": 6.172504152996206e-05} +{"train_loss": 0.002291422337293625, "global_step": 30608, "epoch": 257, "lr": 6.172288778627298e-05} +{"train_loss": 0.002480523195117712, "global_step": 30609, "epoch": 257, "lr": 6.172073401956725e-05} +{"train_loss": 0.0022033851128071547, "global_step": 30610, "epoch": 257, "lr": 6.171858022984909e-05} +{"train_loss": 0.004979661200195551, "global_step": 30611, "epoch": 257, "lr": 6.171642641712278e-05} +{"train_loss": 0.00339118973352015, "global_step": 30612, "epoch": 257, "lr": 6.17142725813925e-05} +{"train_loss": 0.004269863944500685, "global_step": 30613, "epoch": 257, "lr": 6.171211872266251e-05} +{"train_loss": 0.0023661726154386997, "global_step": 30614, "epoch": 257, "lr": 6.170996484093705e-05} +{"train_loss": 0.0032485059928148985, "global_step": 30615, "epoch": 257, "lr": 6.170781093622028e-05} +{"train_loss": 0.0020664867479354143, "global_step": 30616, "epoch": 257, "lr": 6.17056570085165e-05} +{"train_loss": 0.0024811227340251207, "global_step": 30617, "epoch": 257, "lr": 6.17035030578299e-05} +{"train_loss": 0.0018514211988076568, "global_step": 30618, "epoch": 257, "lr": 6.170134908416474e-05} +{"train_loss": 0.003764873603358865, "global_step": 30619, "epoch": 257, "lr": 6.169919508752522e-05} +{"train_loss": 0.0027419175021350384, "global_step": 30620, "epoch": 257, "lr": 6.169704106791558e-05} +{"train_loss": 0.003049820428714156, "global_step": 30621, "epoch": 257, "lr": 6.169488702534006e-05} +{"train_loss": 0.0031203660182654858, "global_step": 30622, "epoch": 257, "lr": 6.169273295980286e-05} +{"train_loss": 0.001976952888071537, "global_step": 30623, "epoch": 257, "lr": 6.169057887130823e-05} +{"train_loss": 0.0036168221849948168, "global_step": 30624, "epoch": 257, "lr": 6.16884247598604e-05} +{"train_loss": 0.00203220103867352, "global_step": 30625, "epoch": 257, "lr": 6.16862706254636e-05} +{"train_loss": 0.003093080362305045, "global_step": 30626, "epoch": 257, "lr": 6.168411646812205e-05} +{"train_loss": 0.0023580575361847878, "global_step": 30627, "epoch": 257, "lr": 6.168196228784e-05} +{"train_loss": 0.0037072908598929644, "global_step": 30628, "epoch": 257, "lr": 6.167980808462165e-05} +{"train_loss": 0.0024948061909526587, "global_step": 30629, "epoch": 257, "lr": 6.167765385847125e-05} +{"train_loss": 0.003101693233475089, "global_step": 30630, "epoch": 257, "lr": 6.167549960939302e-05} +{"train_loss": 0.0032064730767160654, "global_step": 30631, "epoch": 257, "lr": 6.167334533739121e-05} +{"train_loss": 0.0018143245251849294, "global_step": 30632, "epoch": 257, "lr": 6.167119104247002e-05} +{"train_loss": 0.002908561611548066, "global_step": 30633, "epoch": 257, "lr": 6.16690367246337e-05} +{"train_loss": 0.002368883229792118, "global_step": 30634, "epoch": 257, "lr": 6.166688238388647e-05} +{"train_loss": 0.0026895704213529825, "global_step": 30635, "epoch": 257, "lr": 6.166472802023257e-05} +{"train_loss": 0.0024319696240127087, "global_step": 30636, "epoch": 257, "lr": 6.166257363367621e-05} +{"train_loss": 0.0022445705253630877, "global_step": 30637, "epoch": 257, "lr": 6.166041922422164e-05} +{"train_loss": 0.0049684420228004456, "global_step": 30638, "epoch": 257, "lr": 6.165826479187308e-05} +{"train_loss": 0.001971341436728835, "global_step": 30639, "epoch": 257, "lr": 6.165611033663475e-05} +{"train_loss": 0.00414489908143878, "global_step": 30640, "epoch": 257, "lr": 6.165395585851093e-05} +{"train_loss": 0.002787941601127386, "global_step": 30641, "epoch": 257, "lr": 6.165180135750578e-05} +{"train_loss": 0.0026687856297940016, "global_step": 30642, "epoch": 257, "lr": 6.164964683362356e-05} +{"train_loss": 0.0019170232117176056, "global_step": 30643, "epoch": 257, "lr": 6.164749228686852e-05} +{"train_loss": 0.002387211425229907, "global_step": 30644, "epoch": 257, "lr": 6.164533771724487e-05} +{"train_loss": 0.003437696723267436, "global_step": 30645, "epoch": 257, "lr": 6.164318312475683e-05} +{"train_loss": 0.004809941630810499, "global_step": 30646, "epoch": 257, "lr": 6.164102850940866e-05} +{"train_loss": 0.0041487314738333225, "global_step": 30647, "epoch": 257, "lr": 6.163887387120457e-05} +{"train_loss": 0.0028423883486539125, "global_step": 30648, "epoch": 257, "lr": 6.16367192101488e-05} +{"train_loss": 0.0015809776959940791, "global_step": 30649, "epoch": 257, "lr": 6.163456452624556e-05} +{"train_loss": 0.0036050942726433277, "global_step": 30650, "epoch": 257, "lr": 6.16324098194991e-05} +{"train_loss": 0.003925343509763479, "global_step": 30651, "epoch": 257, "lr": 6.163025508991365e-05} +{"train_loss": 0.002999466611072421, "global_step": 30652, "epoch": 257, "lr": 6.162810033749344e-05} +{"train_loss": 0.004090540576726198, "global_step": 30653, "epoch": 257, "lr": 6.16259455622427e-05} +{"train_loss": 0.0031381247099488974, "global_step": 30654, "epoch": 257, "lr": 6.162379076416564e-05} +{"train_loss": 0.003513021394610405, "global_step": 30655, "epoch": 257, "lr": 6.162163594326654e-05} +{"train_loss": 0.0036980044096708298, "global_step": 30656, "epoch": 257, "lr": 6.161948109954957e-05} +{"train_loss": 0.002360520651564002, "global_step": 30657, "epoch": 257, "lr": 6.1617326233019e-05} +{"train_loss": 0.002165280980989337, "global_step": 30658, "epoch": 257, "lr": 6.161517134367904e-05} +{"train_loss": 0.005200678948312998, "global_step": 30659, "epoch": 257, "lr": 6.161301643153394e-05} +{"train_loss": 0.0025112188886851072, "global_step": 30660, "epoch": 257, "lr": 6.161086149658794e-05} +{"train_loss": 0.0042214300483465195, "global_step": 30661, "epoch": 257, "lr": 6.160870653884524e-05} +{"train_loss": 0.003019010415300727, "global_step": 30662, "epoch": 257, "lr": 6.160655155831007e-05} +{"train_loss": 0.004266194999217987, "global_step": 30663, "epoch": 257, "lr": 6.16043965549867e-05} +{"train_loss": 0.0029927061405032873, "global_step": 30664, "epoch": 257, "lr": 6.160224152887932e-05} +{"train_loss": 0.0025715201627463102, "global_step": 30665, "epoch": 257, "lr": 6.16000864799922e-05} +{"train_loss": 0.002803731942549348, "global_step": 30666, "epoch": 257, "lr": 6.159793140832953e-05} +{"train_loss": 0.002849229145795107, "global_step": 30667, "epoch": 257, "lr": 6.159577631389557e-05} +{"train_loss": 0.0031736267264932394, "global_step": 30668, "epoch": 257, "lr": 6.159362119669454e-05} +{"train_loss": 0.00513279577717185, "global_step": 30669, "epoch": 257, "lr": 6.159146605673066e-05} +{"train_loss": 0.0033741414081305265, "global_step": 30670, "epoch": 257, "lr": 6.158931089400819e-05} +{"train_loss": 0.0032531709875911474, "global_step": 30671, "epoch": 257, "lr": 6.158715570853135e-05} +{"train_loss": 0.003909788094460964, "global_step": 30672, "epoch": 257, "lr": 6.158500050030436e-05} +{"train_loss": 0.001846559694968164, "global_step": 30673, "epoch": 257, "lr": 6.158284526933145e-05} +{"train_loss": 0.0036091923248022795, "global_step": 30674, "epoch": 257, "lr": 6.158069001561689e-05} +{"train_loss": 0.0026023858226835728, "global_step": 30675, "epoch": 257, "lr": 6.157853473916485e-05} +{"train_loss": 0.0021929664071649313, "global_step": 30676, "epoch": 257, "lr": 6.157637943997961e-05} +{"train_loss": 0.0023217492271214724, "global_step": 30677, "epoch": 257, "lr": 6.157422411806538e-05} +{"train_loss": 0.002717953873798251, "global_step": 30678, "epoch": 257, "lr": 6.157206877342639e-05} +{"train_loss": 0.0029251514934003353, "global_step": 30679, "epoch": 257, "lr": 6.15699134060669e-05} +{"train_loss": 0.0022942759096622467, "global_step": 30680, "epoch": 257, "lr": 6.156775801599111e-05} +{"train_loss": 0.0035720770247280598, "global_step": 30681, "epoch": 257, "lr": 6.156560260320326e-05} +{"train_loss": 0.003051099134609103, "global_step": 30682, "epoch": 257, "lr": 6.156344716770759e-05} +{"train_loss": 0.0025844380725175142, "global_step": 30683, "epoch": 257, "lr": 6.156129170950833e-05} +{"train_loss": 0.004396680276840925, "global_step": 30684, "epoch": 257, "lr": 6.15591362286097e-05} +{"train_loss": 0.004773293621838093, "global_step": 30685, "epoch": 257, "lr": 6.155698072501595e-05} +{"train_loss": 0.0023074913769960403, "global_step": 30686, "epoch": 257, "lr": 6.155482519873129e-05} +{"train_loss": 0.002738997805863619, "global_step": 30687, "epoch": 257, "lr": 6.155266964975997e-05} +{"train_loss": 0.004505786579102278, "global_step": 30688, "epoch": 257, "lr": 6.155051407810622e-05} +{"train_loss": 0.0023708180524408817, "global_step": 30689, "epoch": 257, "lr": 6.154835848377427e-05} +{"train_loss": 0.004974233452230692, "global_step": 30690, "epoch": 257, "lr": 6.154620286676837e-05} +{"train_loss": 0.0031439231242984533, "global_step": 30691, "epoch": 257, "lr": 6.15440472270927e-05} +{"train_loss": 0.002133140107616782, "global_step": 30692, "epoch": 257, "lr": 6.154189156475155e-05} +{"train_loss": 0.0017984069418162107, "global_step": 30693, "epoch": 257, "lr": 6.153973587974911e-05} +{"train_loss": 0.003163898130878806, "global_step": 30694, "epoch": 257, "lr": 6.153758017208965e-05} +{"train_loss": 0.0022197491489350796, "global_step": 30695, "epoch": 257, "lr": 6.153542444177736e-05} +{"train_loss": 0.0025656064972281456, "global_step": 30696, "epoch": 257, "lr": 6.153326868881654e-05} +{"train_loss": 0.0035389666445553303, "global_step": 30697, "epoch": 257, "lr": 6.153111291321134e-05} +{"train_loss": 0.003625779878348112, "global_step": 30698, "epoch": 257, "lr": 6.152895711496604e-05} +{"train_loss": 0.004247833974659443, "global_step": 30699, "epoch": 257, "lr": 6.152680129408488e-05} +{"train_loss": 0.002130684209987521, "global_step": 30700, "epoch": 257, "lr": 6.152464545057206e-05} +{"train_loss": 0.003012790417048235, "global_step": 30701, "epoch": 257, "lr": 6.152248958443183e-05, "val_loss": 0.030144808813929558} +{"train_loss": 0.002698656404390931, "global_step": 30702, "epoch": 258, "lr": 6.152033369566844e-05} +{"train_loss": 0.003381446236744523, "global_step": 30703, "epoch": 258, "lr": 6.151817778428609e-05} +{"train_loss": 0.0020358487963676453, "global_step": 30704, "epoch": 258, "lr": 6.151602185028905e-05} +{"train_loss": 0.001890648389235139, "global_step": 30705, "epoch": 258, "lr": 6.15138658936815e-05} +{"train_loss": 0.002277025952935219, "global_step": 30706, "epoch": 258, "lr": 6.151170991446772e-05} +{"train_loss": 0.0031191217713057995, "global_step": 30707, "epoch": 258, "lr": 6.150955391265192e-05} +{"train_loss": 0.00265796878375113, "global_step": 30708, "epoch": 258, "lr": 6.150739788823835e-05} +{"train_loss": 0.0030163798946887255, "global_step": 30709, "epoch": 258, "lr": 6.150524184123122e-05} +{"train_loss": 0.003422696841880679, "global_step": 30710, "epoch": 258, "lr": 6.15030857716348e-05} +{"train_loss": 0.0037572646979242563, "global_step": 30711, "epoch": 258, "lr": 6.150092967945328e-05} +{"train_loss": 0.003951515536755323, "global_step": 30712, "epoch": 258, "lr": 6.149877356469091e-05} +{"train_loss": 0.00302139506675303, "global_step": 30713, "epoch": 258, "lr": 6.149661742735194e-05} +{"train_loss": 0.001425600261427462, "global_step": 30714, "epoch": 258, "lr": 6.149446126744059e-05} +{"train_loss": 0.0026993851643055677, "global_step": 30715, "epoch": 258, "lr": 6.149230508496109e-05} +{"train_loss": 0.004671598318964243, "global_step": 30716, "epoch": 258, "lr": 6.149014887991768e-05} +{"train_loss": 0.002481909468770027, "global_step": 30717, "epoch": 258, "lr": 6.148799265231458e-05} +{"train_loss": 0.0021659673657268286, "global_step": 30718, "epoch": 258, "lr": 6.148583640215604e-05} +{"train_loss": 0.0026940577663481236, "global_step": 30719, "epoch": 258, "lr": 6.148368012944629e-05} +{"train_loss": 0.0026202064473181963, "global_step": 30720, "epoch": 258, "lr": 6.148152383418956e-05} +{"train_loss": 0.0022917462047189474, "global_step": 30721, "epoch": 258, "lr": 6.14793675163901e-05} +{"train_loss": 0.002364152343943715, "global_step": 30722, "epoch": 258, "lr": 6.147721117605209e-05} +{"train_loss": 0.002946536522358656, "global_step": 30723, "epoch": 258, "lr": 6.147505481317984e-05} +{"train_loss": 0.0020605840254575014, "global_step": 30724, "epoch": 258, "lr": 6.147289842777752e-05} +{"train_loss": 0.0024100837763398886, "global_step": 30725, "epoch": 258, "lr": 6.14707420198494e-05} +{"train_loss": 0.003597917500883341, "global_step": 30726, "epoch": 258, "lr": 6.14685855893997e-05} +{"train_loss": 0.003902469063177705, "global_step": 30727, "epoch": 258, "lr": 6.146642913643266e-05} +{"train_loss": 0.00457648653537035, "global_step": 30728, "epoch": 258, "lr": 6.146427266095251e-05} +{"train_loss": 0.003919512964785099, "global_step": 30729, "epoch": 258, "lr": 6.146211616296349e-05} +{"train_loss": 0.0038271548692137003, "global_step": 30730, "epoch": 258, "lr": 6.145995964246983e-05} +{"train_loss": 0.003065922064706683, "global_step": 30731, "epoch": 258, "lr": 6.145780309947575e-05} +{"train_loss": 0.002700903918594122, "global_step": 30732, "epoch": 258, "lr": 6.14556465339855e-05} +{"train_loss": 0.0029481013771146536, "global_step": 30733, "epoch": 258, "lr": 6.145348994600333e-05} +{"train_loss": 0.002327335299924016, "global_step": 30734, "epoch": 258, "lr": 6.145133333553344e-05} +{"train_loss": 0.0039634364657104015, "global_step": 30735, "epoch": 258, "lr": 6.144917670258009e-05} +{"train_loss": 0.0024549735244363546, "global_step": 30736, "epoch": 258, "lr": 6.14470200471475e-05} +{"train_loss": 0.002227595541626215, "global_step": 30737, "epoch": 258, "lr": 6.144486336923991e-05} +{"train_loss": 0.0033262798096984625, "global_step": 30738, "epoch": 258, "lr": 6.144270666886156e-05} +{"train_loss": 0.002014949917793274, "global_step": 30739, "epoch": 258, "lr": 6.144054994601667e-05} +{"train_loss": 0.002909192582592368, "global_step": 30740, "epoch": 258, "lr": 6.143839320070949e-05} +{"train_loss": 0.004951817914843559, "global_step": 30741, "epoch": 258, "lr": 6.143623643294424e-05} +{"train_loss": 0.0018040947616100311, "global_step": 30742, "epoch": 258, "lr": 6.143407964272514e-05} +{"train_loss": 0.0032731720712035894, "global_step": 30743, "epoch": 258, "lr": 6.143192283005647e-05} +{"train_loss": 0.0031109629198908806, "global_step": 30744, "epoch": 258, "lr": 6.142976599494244e-05} +{"train_loss": 0.003705371404066682, "global_step": 30745, "epoch": 258, "lr": 6.142760913738728e-05} +{"train_loss": 0.0034917332231998444, "global_step": 30746, "epoch": 258, "lr": 6.142545225739525e-05} +{"train_loss": 0.0032622283324599266, "global_step": 30747, "epoch": 258, "lr": 6.142329535497054e-05} +{"train_loss": 0.0029351534321904182, "global_step": 30748, "epoch": 258, "lr": 6.142113843011742e-05} +{"train_loss": 0.003786614164710045, "global_step": 30749, "epoch": 258, "lr": 6.141898148284012e-05} +{"train_loss": 0.0029088372830301523, "global_step": 30750, "epoch": 258, "lr": 6.141682451314286e-05} +{"train_loss": 0.005006896331906319, "global_step": 30751, "epoch": 258, "lr": 6.141466752102988e-05} +{"train_loss": 0.006857079453766346, "global_step": 30752, "epoch": 258, "lr": 6.141251050650545e-05} +{"train_loss": 0.0067965020425617695, "global_step": 30753, "epoch": 258, "lr": 6.141035346957376e-05} +{"train_loss": 0.0032989990431815386, "global_step": 30754, "epoch": 258, "lr": 6.140819641023904e-05} +{"train_loss": 0.003410741686820984, "global_step": 30755, "epoch": 258, "lr": 6.140603932850555e-05} +{"train_loss": 0.004769596736878157, "global_step": 30756, "epoch": 258, "lr": 6.140388222437754e-05} +{"train_loss": 0.002905574394389987, "global_step": 30757, "epoch": 258, "lr": 6.140172509785921e-05} +{"train_loss": 0.005462327506393194, "global_step": 30758, "epoch": 258, "lr": 6.139956794895482e-05} +{"train_loss": 0.0028731951024383307, "global_step": 30759, "epoch": 258, "lr": 6.139741077766859e-05} +{"train_loss": 0.003855085698887706, "global_step": 30760, "epoch": 258, "lr": 6.139525358400476e-05} +{"train_loss": 0.0036023042630404234, "global_step": 30761, "epoch": 258, "lr": 6.139309636796757e-05} +{"train_loss": 0.0028416530694812536, "global_step": 30762, "epoch": 258, "lr": 6.139093912956125e-05} +{"train_loss": 0.0028374367393553257, "global_step": 30763, "epoch": 258, "lr": 6.138878186879005e-05} +{"train_loss": 0.004157385788857937, "global_step": 30764, "epoch": 258, "lr": 6.138662458565818e-05} +{"train_loss": 0.002225017873570323, "global_step": 30765, "epoch": 258, "lr": 6.13844672801699e-05} +{"train_loss": 0.0026189505588263273, "global_step": 30766, "epoch": 258, "lr": 6.138230995232943e-05} +{"train_loss": 0.0023128464818000793, "global_step": 30767, "epoch": 258, "lr": 6.1380152602141e-05} +{"train_loss": 0.00261339801363647, "global_step": 30768, "epoch": 258, "lr": 6.137799522960887e-05} +{"train_loss": 0.003623261582106352, "global_step": 30769, "epoch": 258, "lr": 6.137583783473726e-05} +{"train_loss": 0.0033350151497870684, "global_step": 30770, "epoch": 258, "lr": 6.13736804175304e-05} +{"train_loss": 0.004150912165641785, "global_step": 30771, "epoch": 258, "lr": 6.137152297799254e-05} +{"train_loss": 0.002795856213197112, "global_step": 30772, "epoch": 258, "lr": 6.13693655161279e-05} +{"train_loss": 0.004371514543890953, "global_step": 30773, "epoch": 258, "lr": 6.136720803194075e-05} +{"train_loss": 0.002895880723372102, "global_step": 30774, "epoch": 258, "lr": 6.136505052543527e-05} +{"train_loss": 0.0036644197534769773, "global_step": 30775, "epoch": 258, "lr": 6.136289299661575e-05} +{"train_loss": 0.005719819571822882, "global_step": 30776, "epoch": 258, "lr": 6.13607354454864e-05} +{"train_loss": 0.002463418524712324, "global_step": 30777, "epoch": 258, "lr": 6.135857787205144e-05} +{"train_loss": 0.003657478839159012, "global_step": 30778, "epoch": 258, "lr": 6.135642027631515e-05} +{"train_loss": 0.0024856242816895247, "global_step": 30779, "epoch": 258, "lr": 6.135426265828173e-05} +{"train_loss": 0.002502345945686102, "global_step": 30780, "epoch": 258, "lr": 6.135210501795544e-05} +{"train_loss": 0.0039175222627818584, "global_step": 30781, "epoch": 258, "lr": 6.134994735534048e-05} +{"train_loss": 0.0038833385333418846, "global_step": 30782, "epoch": 258, "lr": 6.134778967044112e-05} +{"train_loss": 0.003351809922605753, "global_step": 30783, "epoch": 258, "lr": 6.13456319632616e-05} +{"train_loss": 0.003370635909959674, "global_step": 30784, "epoch": 258, "lr": 6.134347423380615e-05} +{"train_loss": 0.003415257204324007, "global_step": 30785, "epoch": 258, "lr": 6.1341316482079e-05} +{"train_loss": 0.002341008745133877, "global_step": 30786, "epoch": 258, "lr": 6.133915870808437e-05} +{"train_loss": 0.003671760205179453, "global_step": 30787, "epoch": 258, "lr": 6.133700091182651e-05} +{"train_loss": 0.0033341837115585804, "global_step": 30788, "epoch": 258, "lr": 6.133484309330966e-05} +{"train_loss": 0.0025957461912184954, "global_step": 30789, "epoch": 258, "lr": 6.133268525253806e-05} +{"train_loss": 0.003943170420825481, "global_step": 30790, "epoch": 258, "lr": 6.133052738951597e-05} +{"train_loss": 0.002792380517348647, "global_step": 30791, "epoch": 258, "lr": 6.132836950424756e-05} +{"train_loss": 0.002477947622537613, "global_step": 30792, "epoch": 258, "lr": 6.132621159673712e-05} +{"train_loss": 0.003977274987846613, "global_step": 30793, "epoch": 258, "lr": 6.132405366698887e-05} +{"train_loss": 0.0049751861952245235, "global_step": 30794, "epoch": 258, "lr": 6.132189571500707e-05} +{"train_loss": 0.002410812769085169, "global_step": 30795, "epoch": 258, "lr": 6.131973774079593e-05} +{"train_loss": 0.003953042905777693, "global_step": 30796, "epoch": 258, "lr": 6.131757974435969e-05} +{"train_loss": 0.004912063479423523, "global_step": 30797, "epoch": 258, "lr": 6.13154217257026e-05} +{"train_loss": 0.003444385016337037, "global_step": 30798, "epoch": 258, "lr": 6.131326368482888e-05} +{"train_loss": 0.0035116709768772125, "global_step": 30799, "epoch": 258, "lr": 6.131110562174277e-05} +{"train_loss": 0.0018755291821435094, "global_step": 30800, "epoch": 258, "lr": 6.130894753644852e-05} +{"train_loss": 0.00189772283192724, "global_step": 30801, "epoch": 258, "lr": 6.130678942895035e-05} +{"train_loss": 0.004108835011720657, "global_step": 30802, "epoch": 258, "lr": 6.130463129925252e-05} +{"train_loss": 0.004065876826643944, "global_step": 30803, "epoch": 258, "lr": 6.130247314735925e-05} +{"train_loss": 0.002353786025196314, "global_step": 30804, "epoch": 258, "lr": 6.130031497327478e-05} +{"train_loss": 0.003084916854277253, "global_step": 30805, "epoch": 258, "lr": 6.129815677700335e-05} +{"train_loss": 0.002591620432212949, "global_step": 30806, "epoch": 258, "lr": 6.129599855854919e-05} +{"train_loss": 0.0035559500101953745, "global_step": 30807, "epoch": 258, "lr": 6.129384031791655e-05} +{"train_loss": 0.0025226592551916838, "global_step": 30808, "epoch": 258, "lr": 6.129168205510965e-05} +{"train_loss": 0.0031528580002486706, "global_step": 30809, "epoch": 258, "lr": 6.128952377013276e-05} +{"train_loss": 0.0035860843490809202, "global_step": 30810, "epoch": 258, "lr": 6.128736546299008e-05} +{"train_loss": 0.0018640088383108377, "global_step": 30811, "epoch": 258, "lr": 6.128520713368586e-05} +{"train_loss": 0.0035143475979566574, "global_step": 30812, "epoch": 258, "lr": 6.128304878222436e-05} +{"train_loss": 0.0022984452079981565, "global_step": 30813, "epoch": 258, "lr": 6.128089040860978e-05} +{"train_loss": 0.0017167687183246017, "global_step": 30814, "epoch": 258, "lr": 6.127873201284638e-05} +{"train_loss": 0.0032190559431910515, "global_step": 30815, "epoch": 258, "lr": 6.127657359493841e-05} +{"train_loss": 0.0018261868972331285, "global_step": 30816, "epoch": 258, "lr": 6.127441515489009e-05} +{"train_loss": 0.0017472918843850493, "global_step": 30817, "epoch": 258, "lr": 6.127225669270566e-05} +{"train_loss": 0.002600547391921282, "global_step": 30818, "epoch": 258, "lr": 6.127009820838934e-05} +{"train_loss": 0.0026312966365367174, "global_step": 30819, "epoch": 258, "lr": 6.12679397019454e-05} +{"train_loss": 0.0031973606556607017, "global_step": 30820, "epoch": 258, "lr": 6.126578117337806e-05, "val_loss": 0.036342885345220566} +{"train_loss": 0.003242220962420106, "global_step": 30821, "epoch": 259, "lr": 6.126362262269158e-05} +{"train_loss": 0.002493863692507148, "global_step": 30822, "epoch": 259, "lr": 6.126146404989016e-05} +{"train_loss": 0.0024270103313028812, "global_step": 30823, "epoch": 259, "lr": 6.125930545497806e-05} +{"train_loss": 0.003757576923817396, "global_step": 30824, "epoch": 259, "lr": 6.125714683795952e-05} +{"train_loss": 0.0029948584269732237, "global_step": 30825, "epoch": 259, "lr": 6.125498819883876e-05} +{"train_loss": 0.0024678180925548077, "global_step": 30826, "epoch": 259, "lr": 6.125282953762005e-05} +{"train_loss": 0.001901600044220686, "global_step": 30827, "epoch": 259, "lr": 6.125067085430761e-05} +{"train_loss": 0.0017572998767718673, "global_step": 30828, "epoch": 259, "lr": 6.124851214890568e-05} +{"train_loss": 0.003088416764512658, "global_step": 30829, "epoch": 259, "lr": 6.12463534214185e-05} +{"train_loss": 0.0034618470817804337, "global_step": 30830, "epoch": 259, "lr": 6.12441946718503e-05} +{"train_loss": 0.0026451649609953165, "global_step": 30831, "epoch": 259, "lr": 6.124203590020533e-05} +{"train_loss": 0.0036292436998337507, "global_step": 30832, "epoch": 259, "lr": 6.123987710648782e-05} +{"train_loss": 0.004816419444978237, "global_step": 30833, "epoch": 259, "lr": 6.1237718290702e-05} +{"train_loss": 0.0021995988208800554, "global_step": 30834, "epoch": 259, "lr": 6.123555945285216e-05} +{"train_loss": 0.003730031196027994, "global_step": 30835, "epoch": 259, "lr": 6.123340059294247e-05} +{"train_loss": 0.002533942461013794, "global_step": 30836, "epoch": 259, "lr": 6.12312417109772e-05} +{"train_loss": 0.001619615824893117, "global_step": 30837, "epoch": 259, "lr": 6.122908280696058e-05} +{"train_loss": 0.0035479560028761625, "global_step": 30838, "epoch": 259, "lr": 6.122692388089688e-05} +{"train_loss": 0.002204242628067732, "global_step": 30839, "epoch": 259, "lr": 6.12247649327903e-05} +{"train_loss": 0.0019427345832809806, "global_step": 30840, "epoch": 259, "lr": 6.122260596264507e-05} +{"train_loss": 0.0033797260839492083, "global_step": 30841, "epoch": 259, "lr": 6.122044697046548e-05} +{"train_loss": 0.0038937553763389587, "global_step": 30842, "epoch": 259, "lr": 6.121828795625573e-05} +{"train_loss": 0.0035160689149051905, "global_step": 30843, "epoch": 259, "lr": 6.121612892002008e-05} +{"train_loss": 0.00269325147382915, "global_step": 30844, "epoch": 259, "lr": 6.121396986176276e-05} +{"train_loss": 0.0032652546651661396, "global_step": 30845, "epoch": 259, "lr": 6.121181078148799e-05} +{"train_loss": 0.002033369615674019, "global_step": 30846, "epoch": 259, "lr": 6.120965167920005e-05} +{"train_loss": 0.0032165434677153826, "global_step": 30847, "epoch": 259, "lr": 6.120749255490314e-05} +{"train_loss": 0.002005941467359662, "global_step": 30848, "epoch": 259, "lr": 6.120533340860153e-05} +{"train_loss": 0.0021713124588131905, "global_step": 30849, "epoch": 259, "lr": 6.120317424029944e-05} +{"train_loss": 0.0025004500057548285, "global_step": 30850, "epoch": 259, "lr": 6.120101505000111e-05} +{"train_loss": 0.002757730893790722, "global_step": 30851, "epoch": 259, "lr": 6.119885583771078e-05} +{"train_loss": 0.0022607326973229647, "global_step": 30852, "epoch": 259, "lr": 6.119669660343271e-05} +{"train_loss": 0.003027205355465412, "global_step": 30853, "epoch": 259, "lr": 6.119453734717111e-05} +{"train_loss": 0.0019732441287487745, "global_step": 30854, "epoch": 259, "lr": 6.119237806893023e-05} +{"train_loss": 0.002991914050653577, "global_step": 30855, "epoch": 259, "lr": 6.119021876871431e-05} +{"train_loss": 0.0036376146599650383, "global_step": 30856, "epoch": 259, "lr": 6.118805944652759e-05} +{"train_loss": 0.0014997964026406407, "global_step": 30857, "epoch": 259, "lr": 6.118590010237431e-05} +{"train_loss": 0.0025181409437209368, "global_step": 30858, "epoch": 259, "lr": 6.118374073625872e-05} +{"train_loss": 0.0018698010826483369, "global_step": 30859, "epoch": 259, "lr": 6.118158134818504e-05} +{"train_loss": 0.002261040499433875, "global_step": 30860, "epoch": 259, "lr": 6.117942193815753e-05} +{"train_loss": 0.0039243618957698345, "global_step": 30861, "epoch": 259, "lr": 6.117726250618041e-05} +{"train_loss": 0.0023283190093934536, "global_step": 30862, "epoch": 259, "lr": 6.117510305225793e-05} +{"train_loss": 0.002914579352363944, "global_step": 30863, "epoch": 259, "lr": 6.117294357639434e-05} +{"train_loss": 0.0028691692277789116, "global_step": 30864, "epoch": 259, "lr": 6.117078407859385e-05} +{"train_loss": 0.00354430521838367, "global_step": 30865, "epoch": 259, "lr": 6.116862455886075e-05} +{"train_loss": 0.0022402077447623014, "global_step": 30866, "epoch": 259, "lr": 6.116646501719923e-05} +{"train_loss": 0.003396176965907216, "global_step": 30867, "epoch": 259, "lr": 6.116430545361355e-05} +{"train_loss": 0.002574796788394451, "global_step": 30868, "epoch": 259, "lr": 6.116214586810794e-05} +{"train_loss": 0.0020048029255121946, "global_step": 30869, "epoch": 259, "lr": 6.115998626068665e-05} +{"train_loss": 0.0027176968287676573, "global_step": 30870, "epoch": 259, "lr": 6.115782663135391e-05} +{"train_loss": 0.005003561265766621, "global_step": 30871, "epoch": 259, "lr": 6.115566698011401e-05} +{"train_loss": 0.0027331311721354723, "global_step": 30872, "epoch": 259, "lr": 6.115350730697112e-05} +{"train_loss": 0.0025764950551092625, "global_step": 30873, "epoch": 259, "lr": 6.115134761192953e-05} +{"train_loss": 0.00227724714204669, "global_step": 30874, "epoch": 259, "lr": 6.114918789499344e-05} +{"train_loss": 0.0033072882797569036, "global_step": 30875, "epoch": 259, "lr": 6.11470281561671e-05} +{"train_loss": 0.004049642942845821, "global_step": 30876, "epoch": 259, "lr": 6.114486839545477e-05} +{"train_loss": 0.002721521072089672, "global_step": 30877, "epoch": 259, "lr": 6.114270861286068e-05} +{"train_loss": 0.0031367584597319365, "global_step": 30878, "epoch": 259, "lr": 6.11405488083891e-05} +{"train_loss": 0.0031647097785025835, "global_step": 30879, "epoch": 259, "lr": 6.113838898204422e-05} +{"train_loss": 0.002307994058355689, "global_step": 30880, "epoch": 259, "lr": 6.11362291338303e-05} +{"train_loss": 0.0020751170814037323, "global_step": 30881, "epoch": 259, "lr": 6.11340692637516e-05} +{"train_loss": 0.0024710462894290686, "global_step": 30882, "epoch": 259, "lr": 6.113190937181233e-05} +{"train_loss": 0.0035883153323084116, "global_step": 30883, "epoch": 259, "lr": 6.112974945801675e-05} +{"train_loss": 0.005281066056340933, "global_step": 30884, "epoch": 259, "lr": 6.11275895223691e-05} +{"train_loss": 0.00332981301471591, "global_step": 30885, "epoch": 259, "lr": 6.112542956487362e-05} +{"train_loss": 0.0034944340586662292, "global_step": 30886, "epoch": 259, "lr": 6.112326958553452e-05} +{"train_loss": 0.003377928864210844, "global_step": 30887, "epoch": 259, "lr": 6.11211095843561e-05} +{"train_loss": 0.0043049282394349575, "global_step": 30888, "epoch": 259, "lr": 6.111894956134255e-05} +{"train_loss": 0.0017389843706041574, "global_step": 30889, "epoch": 259, "lr": 6.111678951649815e-05} +{"train_loss": 0.002770313760265708, "global_step": 30890, "epoch": 259, "lr": 6.11146294498271e-05} +{"train_loss": 0.0030732841696590185, "global_step": 30891, "epoch": 259, "lr": 6.111246936133367e-05} +{"train_loss": 0.0019435618305578828, "global_step": 30892, "epoch": 259, "lr": 6.111030925102209e-05} +{"train_loss": 0.002343236468732357, "global_step": 30893, "epoch": 259, "lr": 6.110814911889662e-05} +{"train_loss": 0.0031481629703193903, "global_step": 30894, "epoch": 259, "lr": 6.110598896496147e-05} +{"train_loss": 0.004295316059142351, "global_step": 30895, "epoch": 259, "lr": 6.11038287892209e-05} +{"train_loss": 0.001786797889508307, "global_step": 30896, "epoch": 259, "lr": 6.110166859167917e-05} +{"train_loss": 0.0037073707208037376, "global_step": 30897, "epoch": 259, "lr": 6.109950837234047e-05} +{"train_loss": 0.0024470847565680742, "global_step": 30898, "epoch": 259, "lr": 6.109734813120908e-05} +{"train_loss": 0.0020443061366677284, "global_step": 30899, "epoch": 259, "lr": 6.109518786828924e-05} +{"train_loss": 0.0038551283068954945, "global_step": 30900, "epoch": 259, "lr": 6.109302758358519e-05} +{"train_loss": 0.0019946664106100798, "global_step": 30901, "epoch": 259, "lr": 6.109086727710114e-05} +{"train_loss": 0.004766787867993116, "global_step": 30902, "epoch": 259, "lr": 6.108870694884137e-05} +{"train_loss": 0.00249604438431561, "global_step": 30903, "epoch": 259, "lr": 6.108654659881012e-05} +{"train_loss": 0.0014894769992679358, "global_step": 30904, "epoch": 259, "lr": 6.108438622701161e-05} +{"train_loss": 0.002746549202129245, "global_step": 30905, "epoch": 259, "lr": 6.10822258334501e-05} +{"train_loss": 0.0023634559474885464, "global_step": 30906, "epoch": 259, "lr": 6.108006541812981e-05} +{"train_loss": 0.0031310629565268755, "global_step": 30907, "epoch": 259, "lr": 6.1077904981055e-05} +{"train_loss": 0.0027587858494371176, "global_step": 30908, "epoch": 259, "lr": 6.10757445222299e-05} +{"train_loss": 0.0029071939643472433, "global_step": 30909, "epoch": 259, "lr": 6.107358404165877e-05} +{"train_loss": 0.0027138213627040386, "global_step": 30910, "epoch": 259, "lr": 6.107142353934585e-05} +{"train_loss": 0.0024462128058075905, "global_step": 30911, "epoch": 259, "lr": 6.106926301529536e-05} +{"train_loss": 0.0023656184785068035, "global_step": 30912, "epoch": 259, "lr": 6.106710246951154e-05} +{"train_loss": 0.001532708527520299, "global_step": 30913, "epoch": 259, "lr": 6.106494190199867e-05} +{"train_loss": 0.003318598261103034, "global_step": 30914, "epoch": 259, "lr": 6.106278131276095e-05} +{"train_loss": 0.0026744408532977104, "global_step": 30915, "epoch": 259, "lr": 6.106062070180266e-05} +{"train_loss": 0.0033778082579374313, "global_step": 30916, "epoch": 259, "lr": 6.105846006912801e-05} +{"train_loss": 0.002042255597189069, "global_step": 30917, "epoch": 259, "lr": 6.105629941474127e-05} +{"train_loss": 0.0019555860199034214, "global_step": 30918, "epoch": 259, "lr": 6.105413873864664e-05} +{"train_loss": 0.002391544869169593, "global_step": 30919, "epoch": 259, "lr": 6.105197804084842e-05} +{"train_loss": 0.0018959860317409039, "global_step": 30920, "epoch": 259, "lr": 6.10498173213508e-05} +{"train_loss": 0.003261315869167447, "global_step": 30921, "epoch": 259, "lr": 6.104765658015807e-05} +{"train_loss": 0.001486182794906199, "global_step": 30922, "epoch": 259, "lr": 6.104549581727443e-05} +{"train_loss": 0.0032533323392271996, "global_step": 30923, "epoch": 259, "lr": 6.104333503270411e-05} +{"train_loss": 0.0021629552356898785, "global_step": 30924, "epoch": 259, "lr": 6.104117422645141e-05} +{"train_loss": 0.0044860574416816235, "global_step": 30925, "epoch": 259, "lr": 6.103901339852056e-05} +{"train_loss": 0.0032370048575103283, "global_step": 30926, "epoch": 259, "lr": 6.103685254891576e-05} +{"train_loss": 0.004799096845090389, "global_step": 30927, "epoch": 259, "lr": 6.103469167764129e-05} +{"train_loss": 0.0038973973132669926, "global_step": 30928, "epoch": 259, "lr": 6.103253078470139e-05} +{"train_loss": 0.002872302196919918, "global_step": 30929, "epoch": 259, "lr": 6.1030369870100276e-05} +{"train_loss": 0.004293383099138737, "global_step": 30930, "epoch": 259, "lr": 6.1028208933842225e-05} +{"train_loss": 0.0034280226100236177, "global_step": 30931, "epoch": 259, "lr": 6.102604797593146e-05} +{"train_loss": 0.0018024849705398083, "global_step": 30932, "epoch": 259, "lr": 6.1023886996372214e-05} +{"train_loss": 0.0025302800349891186, "global_step": 30933, "epoch": 259, "lr": 6.102172599516876e-05} +{"train_loss": 0.0027867513708770275, "global_step": 30934, "epoch": 259, "lr": 6.1019564972325325e-05} +{"train_loss": 0.0031371605582535267, "global_step": 30935, "epoch": 259, "lr": 6.101740392784615e-05} +{"train_loss": 0.003294262569397688, "global_step": 30936, "epoch": 259, "lr": 6.101524286173548e-05} +{"train_loss": 0.003316704649478197, "global_step": 30937, "epoch": 259, "lr": 6.101308177399754e-05} +{"train_loss": 0.0027869881596416235, "global_step": 30938, "epoch": 259, "lr": 6.10109206646366e-05} +{"train_loss": 0.002875950200162327, "global_step": 30939, "epoch": 259, "lr": 6.10087595336569e-05, "val_loss": 0.024927649646997452} +{"train_loss": 0.00349705689586699, "global_step": 30940, "epoch": 260, "lr": 6.1006598381062675e-05} +{"train_loss": 0.0024257884360849857, "global_step": 30941, "epoch": 260, "lr": 6.100443720685817e-05} +{"train_loss": 0.001781241036951542, "global_step": 30942, "epoch": 260, "lr": 6.100227601104762e-05} +{"train_loss": 0.003015767317265272, "global_step": 30943, "epoch": 260, "lr": 6.1000114793635276e-05} +{"train_loss": 0.003742142114788294, "global_step": 30944, "epoch": 260, "lr": 6.0997953554625396e-05} +{"train_loss": 0.003777994541451335, "global_step": 30945, "epoch": 260, "lr": 6.09957922940222e-05} +{"train_loss": 0.0035883693490177393, "global_step": 30946, "epoch": 260, "lr": 6.099363101182994e-05} +{"train_loss": 0.004185538738965988, "global_step": 30947, "epoch": 260, "lr": 6.0991469708052875e-05} +{"train_loss": 0.003666447475552559, "global_step": 30948, "epoch": 260, "lr": 6.098930838269522e-05} +{"train_loss": 0.0024442621506750584, "global_step": 30949, "epoch": 260, "lr": 6.098714703576123e-05} +{"train_loss": 0.0036195283755660057, "global_step": 30950, "epoch": 260, "lr": 6.0984985667255156e-05} +{"train_loss": 0.0016366973286494613, "global_step": 30951, "epoch": 260, "lr": 6.0982824277181226e-05} +{"train_loss": 0.003244849154725671, "global_step": 30952, "epoch": 260, "lr": 6.09806628655437e-05} +{"train_loss": 0.0033046461176127195, "global_step": 30953, "epoch": 260, "lr": 6.0978501432346835e-05} +{"train_loss": 0.0036861153785139322, "global_step": 30954, "epoch": 260, "lr": 6.097633997759483e-05} +{"train_loss": 0.0026723456103354692, "global_step": 30955, "epoch": 260, "lr": 6.097417850129197e-05} +{"train_loss": 0.00250441487878561, "global_step": 30956, "epoch": 260, "lr": 6.097201700344247e-05} +{"train_loss": 0.004251434002071619, "global_step": 30957, "epoch": 260, "lr": 6.096985548405059e-05} +{"train_loss": 0.0020230920054018497, "global_step": 30958, "epoch": 260, "lr": 6.096769394312057e-05} +{"train_loss": 0.0023441207595169544, "global_step": 30959, "epoch": 260, "lr": 6.096553238065665e-05} +{"train_loss": 0.002859489293769002, "global_step": 30960, "epoch": 260, "lr": 6.096337079666309e-05} +{"train_loss": 0.0038626124151051044, "global_step": 30961, "epoch": 260, "lr": 6.096120919114412e-05} +{"train_loss": 0.0021163243800401688, "global_step": 30962, "epoch": 260, "lr": 6.095904756410398e-05} +{"train_loss": 0.003193197539076209, "global_step": 30963, "epoch": 260, "lr": 6.0956885915546926e-05} +{"train_loss": 0.006043204106390476, "global_step": 30964, "epoch": 260, "lr": 6.095472424547719e-05} +{"train_loss": 0.0024694129824638367, "global_step": 30965, "epoch": 260, "lr": 6.095256255389905e-05} +{"train_loss": 0.0032302492763847113, "global_step": 30966, "epoch": 260, "lr": 6.09504008408167e-05} +{"train_loss": 0.0014364183880388737, "global_step": 30967, "epoch": 260, "lr": 6.0948239106234405e-05} +{"train_loss": 0.003597719594836235, "global_step": 30968, "epoch": 260, "lr": 6.094607735015643e-05} +{"train_loss": 0.003046969883143902, "global_step": 30969, "epoch": 260, "lr": 6.0943915572586987e-05} +{"train_loss": 0.004073171876370907, "global_step": 30970, "epoch": 260, "lr": 6.094175377353033e-05} +{"train_loss": 0.0020534766372293234, "global_step": 30971, "epoch": 260, "lr": 6.0939591952990715e-05} +{"train_loss": 0.0028580049984157085, "global_step": 30972, "epoch": 260, "lr": 6.093743011097238e-05} +{"train_loss": 0.002433446003124118, "global_step": 30973, "epoch": 260, "lr": 6.093526824747957e-05} +{"train_loss": 0.0043952930718660355, "global_step": 30974, "epoch": 260, "lr": 6.093310636251653e-05} +{"train_loss": 0.005278522614389658, "global_step": 30975, "epoch": 260, "lr": 6.09309444560875e-05} +{"train_loss": 0.0021323408000171185, "global_step": 30976, "epoch": 260, "lr": 6.092878252819674e-05} +{"train_loss": 0.003773825243115425, "global_step": 30977, "epoch": 260, "lr": 6.092662057884847e-05} +{"train_loss": 0.0016476480523124337, "global_step": 30978, "epoch": 260, "lr": 6.0924458608046966e-05} +{"train_loss": 0.003425528295338154, "global_step": 30979, "epoch": 260, "lr": 6.0922296615796436e-05} +{"train_loss": 0.0030818223021924496, "global_step": 30980, "epoch": 260, "lr": 6.092013460210115e-05} +{"train_loss": 0.002197887049987912, "global_step": 30981, "epoch": 260, "lr": 6.0917972566965344e-05} +{"train_loss": 0.004201390780508518, "global_step": 30982, "epoch": 260, "lr": 6.0915810510393266e-05} +{"train_loss": 0.0018661807989701629, "global_step": 30983, "epoch": 260, "lr": 6.091364843238916e-05} +{"train_loss": 0.0043358951807022095, "global_step": 30984, "epoch": 260, "lr": 6.091148633295728e-05} +{"train_loss": 0.00301021127961576, "global_step": 30985, "epoch": 260, "lr": 6.0909324212101856e-05} +{"train_loss": 0.003024380188435316, "global_step": 30986, "epoch": 260, "lr": 6.090716206982714e-05} +{"train_loss": 0.00317339482717216, "global_step": 30987, "epoch": 260, "lr": 6.090499990613737e-05} +{"train_loss": 0.001846207887865603, "global_step": 30988, "epoch": 260, "lr": 6.09028377210368e-05} +{"train_loss": 0.0035815443843603134, "global_step": 30989, "epoch": 260, "lr": 6.090067551452967e-05} +{"train_loss": 0.0014692165423184633, "global_step": 30990, "epoch": 260, "lr": 6.089851328662024e-05} +{"train_loss": 0.004754848312586546, "global_step": 30991, "epoch": 260, "lr": 6.089635103731274e-05} +{"train_loss": 0.0021478207781910896, "global_step": 30992, "epoch": 260, "lr": 6.0894188766611415e-05} +{"train_loss": 0.004079220816493034, "global_step": 30993, "epoch": 260, "lr": 6.0892026474520505e-05} +{"train_loss": 0.0034110285341739655, "global_step": 30994, "epoch": 260, "lr": 6.0889864161044276e-05} +{"train_loss": 0.005024588666856289, "global_step": 30995, "epoch": 260, "lr": 6.088770182618696e-05} +{"train_loss": 0.0028082793578505516, "global_step": 30996, "epoch": 260, "lr": 6.0885539469952804e-05} +{"train_loss": 0.001967949792742729, "global_step": 30997, "epoch": 260, "lr": 6.0883377092346064e-05} +{"train_loss": 0.0028657002840191126, "global_step": 30998, "epoch": 260, "lr": 6.0881214693370966e-05} +{"train_loss": 0.0028594345785677433, "global_step": 30999, "epoch": 260, "lr": 6.087905227303177e-05} +{"train_loss": 0.0026736122090369463, "global_step": 31000, "epoch": 260, "lr": 6.087688983133271e-05} +{"train_loss": 0.00336524099111557, "global_step": 31001, "epoch": 260, "lr": 6.087472736827804e-05} +{"train_loss": 0.001394706661812961, "global_step": 31002, "epoch": 260, "lr": 6.087256488387201e-05} +{"train_loss": 0.00185186427552253, "global_step": 31003, "epoch": 260, "lr": 6.0870402378118873e-05} +{"train_loss": 0.005378150846809149, "global_step": 31004, "epoch": 260, "lr": 6.086823985102283e-05} +{"train_loss": 0.0018019165145233274, "global_step": 31005, "epoch": 260, "lr": 6.086607730258819e-05} +{"train_loss": 0.00250534457154572, "global_step": 31006, "epoch": 260, "lr": 6.086391473281915e-05} +{"train_loss": 0.0026340256445109844, "global_step": 31007, "epoch": 260, "lr": 6.0861752141719965e-05} +{"train_loss": 0.002671995433047414, "global_step": 31008, "epoch": 260, "lr": 6.08595895292949e-05} +{"train_loss": 0.00575980031862855, "global_step": 31009, "epoch": 260, "lr": 6.085742689554821e-05} +{"train_loss": 0.0029794559814035892, "global_step": 31010, "epoch": 260, "lr": 6.08552642404841e-05} +{"train_loss": 0.003197707934305072, "global_step": 31011, "epoch": 260, "lr": 6.085310156410685e-05} +{"train_loss": 0.003599785501137376, "global_step": 31012, "epoch": 260, "lr": 6.085093886642068e-05} +{"train_loss": 0.0030158439185470343, "global_step": 31013, "epoch": 260, "lr": 6.0848776147429866e-05} +{"train_loss": 0.003184596309438348, "global_step": 31014, "epoch": 260, "lr": 6.084661340713863e-05} +{"train_loss": 0.003856580937281251, "global_step": 31015, "epoch": 260, "lr": 6.0844450645551246e-05} +{"train_loss": 0.002968071261420846, "global_step": 31016, "epoch": 260, "lr": 6.084228786267192e-05} +{"train_loss": 0.0031880789902061224, "global_step": 31017, "epoch": 260, "lr": 6.084012505850493e-05} +{"train_loss": 0.006373753771185875, "global_step": 31018, "epoch": 260, "lr": 6.0837962233054514e-05} +{"train_loss": 0.004597352351993322, "global_step": 31019, "epoch": 260, "lr": 6.083579938632491e-05} +{"train_loss": 0.0026626389008015394, "global_step": 31020, "epoch": 260, "lr": 6.083363651832037e-05} +{"train_loss": 0.002147722290828824, "global_step": 31021, "epoch": 260, "lr": 6.0831473629045144e-05} +{"train_loss": 0.0035335104912519455, "global_step": 31022, "epoch": 260, "lr": 6.0829310718503474e-05} +{"train_loss": 0.004693357273936272, "global_step": 31023, "epoch": 260, "lr": 6.082714778669961e-05} +{"train_loss": 0.0029164107982069254, "global_step": 31024, "epoch": 260, "lr": 6.082498483363781e-05} +{"train_loss": 0.0030775018967688084, "global_step": 31025, "epoch": 260, "lr": 6.08228218593223e-05} +{"train_loss": 0.0030225166119635105, "global_step": 31026, "epoch": 260, "lr": 6.082065886375733e-05} +{"train_loss": 0.003852174384519458, "global_step": 31027, "epoch": 260, "lr": 6.081849584694715e-05} +{"train_loss": 0.005258706398308277, "global_step": 31028, "epoch": 260, "lr": 6.081633280889604e-05} +{"train_loss": 0.002347153378650546, "global_step": 31029, "epoch": 260, "lr": 6.0814169749608186e-05} +{"train_loss": 0.0027381216641515493, "global_step": 31030, "epoch": 260, "lr": 6.0812006669087876e-05} +{"train_loss": 0.0016791478265076876, "global_step": 31031, "epoch": 260, "lr": 6.080984356733934e-05} +{"train_loss": 0.0028502708300948143, "global_step": 31032, "epoch": 260, "lr": 6.080768044436683e-05} +{"train_loss": 0.002196589019149542, "global_step": 31033, "epoch": 260, "lr": 6.08055173001746e-05} +{"train_loss": 0.0023123794235289097, "global_step": 31034, "epoch": 260, "lr": 6.08033541347669e-05} +{"train_loss": 0.0031601437367498875, "global_step": 31035, "epoch": 260, "lr": 6.0801190948147955e-05} +{"train_loss": 0.006849971599876881, "global_step": 31036, "epoch": 260, "lr": 6.0799027740322035e-05} +{"train_loss": 0.0029477612115442753, "global_step": 31037, "epoch": 260, "lr": 6.079686451129336e-05} +{"train_loss": 0.0024111606180667877, "global_step": 31038, "epoch": 260, "lr": 6.079470126106621e-05} +{"train_loss": 0.0039305975660681725, "global_step": 31039, "epoch": 260, "lr": 6.0792537989644814e-05} +{"train_loss": 0.0028296818491071463, "global_step": 31040, "epoch": 260, "lr": 6.0790374697033416e-05} +{"train_loss": 0.0022196476347744465, "global_step": 31041, "epoch": 260, "lr": 6.078821138323628e-05} +{"train_loss": 0.002466809004545212, "global_step": 31042, "epoch": 260, "lr": 6.078604804825764e-05} +{"train_loss": 0.0030235738959163427, "global_step": 31043, "epoch": 260, "lr": 6.0783884692101746e-05} +{"train_loss": 0.005612189881503582, "global_step": 31044, "epoch": 260, "lr": 6.0781721314772844e-05} +{"train_loss": 0.0037546041421592236, "global_step": 31045, "epoch": 260, "lr": 6.0779557916275186e-05} +{"train_loss": 0.002771554747596383, "global_step": 31046, "epoch": 260, "lr": 6.0777394496613014e-05} +{"train_loss": 0.002987623680382967, "global_step": 31047, "epoch": 260, "lr": 6.0775231055790596e-05} +{"train_loss": 0.0017639698926359415, "global_step": 31048, "epoch": 260, "lr": 6.077306759381215e-05} +{"train_loss": 0.0020275849383324385, "global_step": 31049, "epoch": 260, "lr": 6.077090411068194e-05} +{"train_loss": 0.0028107357211411, "global_step": 31050, "epoch": 260, "lr": 6.0768740606404205e-05} +{"train_loss": 0.0030568414367735386, "global_step": 31051, "epoch": 260, "lr": 6.07665770809832e-05} +{"train_loss": 0.0032738097943365574, "global_step": 31052, "epoch": 260, "lr": 6.076441353442317e-05} +{"train_loss": 0.005186753813177347, "global_step": 31053, "epoch": 260, "lr": 6.076224996672838e-05} +{"train_loss": 0.0013565330300480127, "global_step": 31054, "epoch": 260, "lr": 6.076008637790305e-05} +{"train_loss": 0.004143187310546637, "global_step": 31055, "epoch": 260, "lr": 6.075792276795143e-05} +{"train_loss": 0.0030643590725958347, "global_step": 31056, "epoch": 260, "lr": 6.075575913687778e-05} +{"train_loss": 0.001547326217405498, "global_step": 31057, "epoch": 260, "lr": 6.075359548468634e-05} +{"train_loss": 0.0031702091933048073, "global_step": 31058, "epoch": 260, "lr": 6.0751431811381385e-05, "val_loss": 0.018971910700201988, "train_action_mse_error": 4.5070901251165196e-05} +{"train_loss": 0.002375447889789939, "global_step": 31059, "epoch": 261, "lr": 6.074926811696714e-05} +{"train_loss": 0.0020773534197360277, "global_step": 31060, "epoch": 261, "lr": 6.0747104401447854e-05} +{"train_loss": 0.0030942412558943033, "global_step": 31061, "epoch": 261, "lr": 6.074494066482776e-05} +{"train_loss": 0.004261304624378681, "global_step": 31062, "epoch": 261, "lr": 6.074277690711114e-05} +{"train_loss": 0.002069334965199232, "global_step": 31063, "epoch": 261, "lr": 6.0740613128302216e-05} +{"train_loss": 0.004598669707775116, "global_step": 31064, "epoch": 261, "lr": 6.0738449328405246e-05} +{"train_loss": 0.0034618601202964783, "global_step": 31065, "epoch": 261, "lr": 6.073628550742448e-05} +{"train_loss": 0.003144617658108473, "global_step": 31066, "epoch": 261, "lr": 6.073412166536418e-05} +{"train_loss": 0.0031261565163731575, "global_step": 31067, "epoch": 261, "lr": 6.0731957802228567e-05} +{"train_loss": 0.0025205793790519238, "global_step": 31068, "epoch": 261, "lr": 6.0729793918021894e-05} +{"train_loss": 0.0015476796543225646, "global_step": 31069, "epoch": 261, "lr": 6.072763001274843e-05} +{"train_loss": 0.0027871073689311743, "global_step": 31070, "epoch": 261, "lr": 6.07254660864124e-05} +{"train_loss": 0.004100860096514225, "global_step": 31071, "epoch": 261, "lr": 6.0723302139018057e-05} +{"train_loss": 0.0029526115395128727, "global_step": 31072, "epoch": 261, "lr": 6.072113817056967e-05} +{"train_loss": 0.003077311906963587, "global_step": 31073, "epoch": 261, "lr": 6.071897418107146e-05} +{"train_loss": 0.003203270025551319, "global_step": 31074, "epoch": 261, "lr": 6.0716810170527704e-05} +{"train_loss": 0.002761523937806487, "global_step": 31075, "epoch": 261, "lr": 6.071464613894262e-05} +{"train_loss": 0.003323197830468416, "global_step": 31076, "epoch": 261, "lr": 6.0712482086320487e-05} +{"train_loss": 0.0023600421845912933, "global_step": 31077, "epoch": 261, "lr": 6.071031801266554e-05} +{"train_loss": 0.002854851773008704, "global_step": 31078, "epoch": 261, "lr": 6.0708153917982034e-05} +{"train_loss": 0.0034754150547087193, "global_step": 31079, "epoch": 261, "lr": 6.0705989802274196e-05} +{"train_loss": 0.0018625283846631646, "global_step": 31080, "epoch": 261, "lr": 6.07038256655463e-05} +{"train_loss": 0.0024961575400084257, "global_step": 31081, "epoch": 261, "lr": 6.0701661507802576e-05} +{"train_loss": 0.004040183965116739, "global_step": 31082, "epoch": 261, "lr": 6.06994973290473e-05} +{"train_loss": 0.0035723198670893908, "global_step": 31083, "epoch": 261, "lr": 6.069733312928468e-05} +{"train_loss": 0.002552509307861328, "global_step": 31084, "epoch": 261, "lr": 6.069516890851901e-05} +{"train_loss": 0.0016801299061626196, "global_step": 31085, "epoch": 261, "lr": 6.0693004666754514e-05} +{"train_loss": 0.005977618508040905, "global_step": 31086, "epoch": 261, "lr": 6.069084040399544e-05} +{"train_loss": 0.0021880739368498325, "global_step": 31087, "epoch": 261, "lr": 6.0688676120246046e-05} +{"train_loss": 0.0024434642400592566, "global_step": 31088, "epoch": 261, "lr": 6.0686511815510575e-05} +{"train_loss": 0.0016333394451066852, "global_step": 31089, "epoch": 261, "lr": 6.068434748979328e-05} +{"train_loss": 0.0029552713967859745, "global_step": 31090, "epoch": 261, "lr": 6.068218314309842e-05} +{"train_loss": 0.003314981935545802, "global_step": 31091, "epoch": 261, "lr": 6.0680018775430214e-05} +{"train_loss": 0.0030843904241919518, "global_step": 31092, "epoch": 261, "lr": 6.067785438679295e-05} +{"train_loss": 0.0018437107792124152, "global_step": 31093, "epoch": 261, "lr": 6.067568997719085e-05} +{"train_loss": 0.0016799434088170528, "global_step": 31094, "epoch": 261, "lr": 6.067352554662818e-05} +{"train_loss": 0.003933578729629517, "global_step": 31095, "epoch": 261, "lr": 6.067136109510918e-05} +{"train_loss": 0.002600402571260929, "global_step": 31096, "epoch": 261, "lr": 6.0669196622638105e-05} +{"train_loss": 0.001792681054212153, "global_step": 31097, "epoch": 261, "lr": 6.0667032129219214e-05} +{"train_loss": 0.0027699368074536324, "global_step": 31098, "epoch": 261, "lr": 6.066486761485672e-05} +{"train_loss": 0.0024570231325924397, "global_step": 31099, "epoch": 261, "lr": 6.066270307955492e-05} +{"train_loss": 0.0030239159241318703, "global_step": 31100, "epoch": 261, "lr": 6.066053852331803e-05} +{"train_loss": 0.0029634067323058844, "global_step": 31101, "epoch": 261, "lr": 6.0658373946150305e-05} +{"train_loss": 0.003593839006498456, "global_step": 31102, "epoch": 261, "lr": 6.065620934805602e-05} +{"train_loss": 0.0026740834582597017, "global_step": 31103, "epoch": 261, "lr": 6.0654044729039394e-05} +{"train_loss": 0.002621785271912813, "global_step": 31104, "epoch": 261, "lr": 6.0651880089104695e-05} +{"train_loss": 0.0024116886779665947, "global_step": 31105, "epoch": 261, "lr": 6.064971542825615e-05} +{"train_loss": 0.0029349965043365955, "global_step": 31106, "epoch": 261, "lr": 6.064755074649804e-05} +{"train_loss": 0.0020477965008467436, "global_step": 31107, "epoch": 261, "lr": 6.064538604383461e-05} +{"train_loss": 0.0030252605210989714, "global_step": 31108, "epoch": 261, "lr": 6.064322132027008e-05} +{"train_loss": 0.00179990753531456, "global_step": 31109, "epoch": 261, "lr": 6.064105657580875e-05} +{"train_loss": 0.0014740531332790852, "global_step": 31110, "epoch": 261, "lr": 6.0638891810454834e-05} +{"train_loss": 0.002133207628503442, "global_step": 31111, "epoch": 261, "lr": 6.063672702421258e-05} +{"train_loss": 0.0021448787301778793, "global_step": 31112, "epoch": 261, "lr": 6.063456221708626e-05} +{"train_loss": 0.0017463439144194126, "global_step": 31113, "epoch": 261, "lr": 6.0632397389080096e-05} +{"train_loss": 0.002281065797433257, "global_step": 31114, "epoch": 261, "lr": 6.063023254019836e-05} +{"train_loss": 0.0020161992870271206, "global_step": 31115, "epoch": 261, "lr": 6.062806767044531e-05} +{"train_loss": 0.00215083546936512, "global_step": 31116, "epoch": 261, "lr": 6.062590277982518e-05} +{"train_loss": 0.0029234951362013817, "global_step": 31117, "epoch": 261, "lr": 6.062373786834223e-05} +{"train_loss": 0.002172069624066353, "global_step": 31118, "epoch": 261, "lr": 6.0621572936000706e-05} +{"train_loss": 0.002734983107075095, "global_step": 31119, "epoch": 261, "lr": 6.0619407982804844e-05} +{"train_loss": 0.0030942121520638466, "global_step": 31120, "epoch": 261, "lr": 6.0617243008758914e-05} +{"train_loss": 0.002459364477545023, "global_step": 31121, "epoch": 261, "lr": 6.0615078013867164e-05} +{"train_loss": 0.0034815575927495956, "global_step": 31122, "epoch": 261, "lr": 6.061291299813384e-05} +{"train_loss": 0.0023167438339442015, "global_step": 31123, "epoch": 261, "lr": 6.0610747961563193e-05} +{"train_loss": 0.0025413872208446264, "global_step": 31124, "epoch": 261, "lr": 6.0608582904159484e-05} +{"train_loss": 0.00288643897511065, "global_step": 31125, "epoch": 261, "lr": 6.0606417825926956e-05} +{"train_loss": 0.001604477409273386, "global_step": 31126, "epoch": 261, "lr": 6.060425272686986e-05} +{"train_loss": 0.0014290140243247151, "global_step": 31127, "epoch": 261, "lr": 6.060208760699244e-05} +{"train_loss": 0.0025361496955156326, "global_step": 31128, "epoch": 261, "lr": 6.0599922466298965e-05} +{"train_loss": 0.002131158486008644, "global_step": 31129, "epoch": 261, "lr": 6.0597757304793666e-05} +{"train_loss": 0.002530669327825308, "global_step": 31130, "epoch": 261, "lr": 6.0595592122480806e-05} +{"train_loss": 0.0034307893365621567, "global_step": 31131, "epoch": 261, "lr": 6.059342691936463e-05} +{"train_loss": 0.0033580437302589417, "global_step": 31132, "epoch": 261, "lr": 6.0591261695449385e-05} +{"train_loss": 0.002452119253575802, "global_step": 31133, "epoch": 261, "lr": 6.0589096450739335e-05} +{"train_loss": 0.003543251659721136, "global_step": 31134, "epoch": 261, "lr": 6.058693118523874e-05} +{"train_loss": 0.002718471921980381, "global_step": 31135, "epoch": 261, "lr": 6.0584765898951826e-05} +{"train_loss": 0.0031685722060501575, "global_step": 31136, "epoch": 261, "lr": 6.0582600591882844e-05} +{"train_loss": 0.002193986438214779, "global_step": 31137, "epoch": 261, "lr": 6.058043526403606e-05} +{"train_loss": 0.0023068643640726805, "global_step": 31138, "epoch": 261, "lr": 6.057826991541573e-05} +{"train_loss": 0.0023404820822179317, "global_step": 31139, "epoch": 261, "lr": 6.057610454602609e-05} +{"train_loss": 0.002779086120426655, "global_step": 31140, "epoch": 261, "lr": 6.0573939155871396e-05} +{"train_loss": 0.004251063801348209, "global_step": 31141, "epoch": 261, "lr": 6.057177374495592e-05} +{"train_loss": 0.005142833571881056, "global_step": 31142, "epoch": 261, "lr": 6.0569608313283876e-05} +{"train_loss": 0.002862778725102544, "global_step": 31143, "epoch": 261, "lr": 6.056744286085955e-05} +{"train_loss": 0.002549315569922328, "global_step": 31144, "epoch": 261, "lr": 6.056527738768716e-05} +{"train_loss": 0.0033047760371118784, "global_step": 31145, "epoch": 261, "lr": 6.0563111893771e-05} +{"train_loss": 0.00226111663505435, "global_step": 31146, "epoch": 261, "lr": 6.056094637911528e-05} +{"train_loss": 0.003490267787128687, "global_step": 31147, "epoch": 261, "lr": 6.0558780843724286e-05} +{"train_loss": 0.002506584394723177, "global_step": 31148, "epoch": 261, "lr": 6.0556615287602234e-05} +{"train_loss": 0.0034209771547466516, "global_step": 31149, "epoch": 261, "lr": 6.0554449710753415e-05} +{"train_loss": 0.0027818793896585703, "global_step": 31150, "epoch": 261, "lr": 6.0552284113182056e-05} +{"train_loss": 0.0015215591993182898, "global_step": 31151, "epoch": 261, "lr": 6.055011849489241e-05} +{"train_loss": 0.0031167769338935614, "global_step": 31152, "epoch": 261, "lr": 6.054795285588874e-05} +{"train_loss": 0.0032128780148923397, "global_step": 31153, "epoch": 261, "lr": 6.054578719617529e-05} +{"train_loss": 0.0020504603162407875, "global_step": 31154, "epoch": 261, "lr": 6.05436215157563e-05} +{"train_loss": 0.0024555467534810305, "global_step": 31155, "epoch": 261, "lr": 6.054145581463604e-05} +{"train_loss": 0.0044062635861337185, "global_step": 31156, "epoch": 261, "lr": 6.0539290092818756e-05} +{"train_loss": 0.0026590756606310606, "global_step": 31157, "epoch": 261, "lr": 6.0537124350308716e-05} +{"train_loss": 0.0021419813856482506, "global_step": 31158, "epoch": 261, "lr": 6.053495858711015e-05} +{"train_loss": 0.0023913062177598476, "global_step": 31159, "epoch": 261, "lr": 6.053279280322731e-05} +{"train_loss": 0.004442396108061075, "global_step": 31160, "epoch": 261, "lr": 6.0530626998664487e-05} +{"train_loss": 0.003039549570530653, "global_step": 31161, "epoch": 261, "lr": 6.052846117342588e-05} +{"train_loss": 0.00310464296489954, "global_step": 31162, "epoch": 261, "lr": 6.052629532751576e-05} +{"train_loss": 0.0029323913622647524, "global_step": 31163, "epoch": 261, "lr": 6.0524129460938394e-05} +{"train_loss": 0.0019876889418810606, "global_step": 31164, "epoch": 261, "lr": 6.052196357369802e-05} +{"train_loss": 0.0027925753965973854, "global_step": 31165, "epoch": 261, "lr": 6.051979766579889e-05} +{"train_loss": 0.002650210168212652, "global_step": 31166, "epoch": 261, "lr": 6.0517631737245276e-05} +{"train_loss": 0.006405647378414869, "global_step": 31167, "epoch": 261, "lr": 6.05154657880414e-05} +{"train_loss": 0.0023477738723158836, "global_step": 31168, "epoch": 261, "lr": 6.0513299818191536e-05} +{"train_loss": 0.001709163305349648, "global_step": 31169, "epoch": 261, "lr": 6.051113382769993e-05} +{"train_loss": 0.0020695487037301064, "global_step": 31170, "epoch": 261, "lr": 6.050896781657084e-05} +{"train_loss": 0.0023302261251956224, "global_step": 31171, "epoch": 261, "lr": 6.050680178480851e-05} +{"train_loss": 0.0020389272831380367, "global_step": 31172, "epoch": 261, "lr": 6.050463573241719e-05} +{"train_loss": 0.0028453620616346598, "global_step": 31173, "epoch": 261, "lr": 6.050246965940115e-05} +{"train_loss": 0.0008621591841802001, "global_step": 31174, "epoch": 261, "lr": 6.0500303565764634e-05} +{"train_loss": 0.004003586713224649, "global_step": 31175, "epoch": 261, "lr": 6.049813745151189e-05} +{"train_loss": 0.0035769506357610226, "global_step": 31176, "epoch": 261, "lr": 6.049597131664717e-05} +{"train_loss": 0.0027965288804922286, "global_step": 31177, "epoch": 261, "lr": 6.0493805161174744e-05, "val_loss": 0.01827593706548214} +{"train_loss": 0.002545488765463233, "global_step": 31178, "epoch": 262, "lr": 6.0491638985098856e-05} +{"train_loss": 0.002102702623233199, "global_step": 31179, "epoch": 262, "lr": 6.048947278842374e-05} +{"train_loss": 0.0017503165872767568, "global_step": 31180, "epoch": 262, "lr": 6.048730657115367e-05} +{"train_loss": 0.004013773053884506, "global_step": 31181, "epoch": 262, "lr": 6.0485140333292886e-05} +{"train_loss": 0.003240200225263834, "global_step": 31182, "epoch": 262, "lr": 6.0482974074845667e-05} +{"train_loss": 0.002752481959760189, "global_step": 31183, "epoch": 262, "lr": 6.048080779581623e-05} +{"train_loss": 0.004472053609788418, "global_step": 31184, "epoch": 262, "lr": 6.0478641496208854e-05} +{"train_loss": 0.0027327772695571184, "global_step": 31185, "epoch": 262, "lr": 6.04764751760278e-05} +{"train_loss": 0.0024448183830827475, "global_step": 31186, "epoch": 262, "lr": 6.0474308835277295e-05} +{"train_loss": 0.0028879682067781687, "global_step": 31187, "epoch": 262, "lr": 6.0472142473961604e-05} +{"train_loss": 0.0026133465580642223, "global_step": 31188, "epoch": 262, "lr": 6.0469976092084966e-05} +{"train_loss": 0.002425912767648697, "global_step": 31189, "epoch": 262, "lr": 6.046780968965165e-05} +{"train_loss": 0.002414490794762969, "global_step": 31190, "epoch": 262, "lr": 6.046564326666592e-05} +{"train_loss": 0.0031955402810126543, "global_step": 31191, "epoch": 262, "lr": 6.0463476823132025e-05} +{"train_loss": 0.003850864479318261, "global_step": 31192, "epoch": 262, "lr": 6.04613103590542e-05} +{"train_loss": 0.00308688054792583, "global_step": 31193, "epoch": 262, "lr": 6.045914387443671e-05} +{"train_loss": 0.002869504038244486, "global_step": 31194, "epoch": 262, "lr": 6.0456977369283805e-05} +{"train_loss": 0.001884231111034751, "global_step": 31195, "epoch": 262, "lr": 6.045481084359975e-05} +{"train_loss": 0.0017501087859272957, "global_step": 31196, "epoch": 262, "lr": 6.045264429738878e-05} +{"train_loss": 0.001923796022310853, "global_step": 31197, "epoch": 262, "lr": 6.045047773065518e-05} +{"train_loss": 0.0022616777569055557, "global_step": 31198, "epoch": 262, "lr": 6.044831114340317e-05} +{"train_loss": 0.0036889174953103065, "global_step": 31199, "epoch": 262, "lr": 6.0446144535637016e-05} +{"train_loss": 0.003446822287514806, "global_step": 31200, "epoch": 262, "lr": 6.0443977907360975e-05} +{"train_loss": 0.0049274759367108345, "global_step": 31201, "epoch": 262, "lr": 6.0441811258579296e-05} +{"train_loss": 0.002592947334051132, "global_step": 31202, "epoch": 262, "lr": 6.043964458929624e-05} +{"train_loss": 0.004945711698383093, "global_step": 31203, "epoch": 262, "lr": 6.043747789951606e-05} +{"train_loss": 0.003978511784225702, "global_step": 31204, "epoch": 262, "lr": 6.0435311189242994e-05} +{"train_loss": 0.002397221280261874, "global_step": 31205, "epoch": 262, "lr": 6.043314445848132e-05} +{"train_loss": 0.0024749611038714647, "global_step": 31206, "epoch": 262, "lr": 6.0430977707235284e-05} +{"train_loss": 0.0030025688465684652, "global_step": 31207, "epoch": 262, "lr": 6.042881093550913e-05} +{"train_loss": 0.0034370243083685637, "global_step": 31208, "epoch": 262, "lr": 6.042664414330712e-05} +{"train_loss": 0.003938831388950348, "global_step": 31209, "epoch": 262, "lr": 6.042447733063351e-05} +{"train_loss": 0.0033180592581629753, "global_step": 31210, "epoch": 262, "lr": 6.042231049749257e-05} +{"train_loss": 0.0027265537064522505, "global_step": 31211, "epoch": 262, "lr": 6.042014364388852e-05} +{"train_loss": 0.0028751720674335957, "global_step": 31212, "epoch": 262, "lr": 6.0417976769825634e-05} +{"train_loss": 0.0029965625144541264, "global_step": 31213, "epoch": 262, "lr": 6.041580987530816e-05} +{"train_loss": 0.002205127151682973, "global_step": 31214, "epoch": 262, "lr": 6.041364296034036e-05} +{"train_loss": 0.004439349286258221, "global_step": 31215, "epoch": 262, "lr": 6.041147602492647e-05} +{"train_loss": 0.003661627182736993, "global_step": 31216, "epoch": 262, "lr": 6.040930906907078e-05} +{"train_loss": 0.003340591909363866, "global_step": 31217, "epoch": 262, "lr": 6.0407142092777526e-05} +{"train_loss": 0.003114184131845832, "global_step": 31218, "epoch": 262, "lr": 6.040497509605094e-05} +{"train_loss": 0.0023924752604216337, "global_step": 31219, "epoch": 262, "lr": 6.040280807889531e-05} +{"train_loss": 0.002218943554908037, "global_step": 31220, "epoch": 262, "lr": 6.040064104131488e-05} +{"train_loss": 0.0024712278973311186, "global_step": 31221, "epoch": 262, "lr": 6.0398473983313895e-05} +{"train_loss": 0.004142013378441334, "global_step": 31222, "epoch": 262, "lr": 6.0396306904896613e-05} +{"train_loss": 0.002493219915777445, "global_step": 31223, "epoch": 262, "lr": 6.0394139806067295e-05} +{"train_loss": 0.0029771686531603336, "global_step": 31224, "epoch": 262, "lr": 6.03919726868302e-05} +{"train_loss": 0.0018874944653362036, "global_step": 31225, "epoch": 262, "lr": 6.038980554718958e-05} +{"train_loss": 0.0024258659686893225, "global_step": 31226, "epoch": 262, "lr": 6.038763838714968e-05} +{"train_loss": 0.0036920264828950167, "global_step": 31227, "epoch": 262, "lr": 6.038547120671476e-05} +{"train_loss": 0.007193358615040779, "global_step": 31228, "epoch": 262, "lr": 6.0383304005889094e-05} +{"train_loss": 0.002314504235982895, "global_step": 31229, "epoch": 262, "lr": 6.0381136784676905e-05} +{"train_loss": 0.002988781314343214, "global_step": 31230, "epoch": 262, "lr": 6.0378969543082466e-05} +{"train_loss": 0.004632039926946163, "global_step": 31231, "epoch": 262, "lr": 6.037680228111002e-05} +{"train_loss": 0.0018956938292831182, "global_step": 31232, "epoch": 262, "lr": 6.0374634998763846e-05} +{"train_loss": 0.0021761804819107056, "global_step": 31233, "epoch": 262, "lr": 6.0372467696048174e-05} +{"train_loss": 0.004268775228410959, "global_step": 31234, "epoch": 262, "lr": 6.037030037296727e-05} +{"train_loss": 0.0025365569163113832, "global_step": 31235, "epoch": 262, "lr": 6.03681330295254e-05} +{"train_loss": 0.003077859291806817, "global_step": 31236, "epoch": 262, "lr": 6.036596566572681e-05} +{"train_loss": 0.003466013353317976, "global_step": 31237, "epoch": 262, "lr": 6.036379828157572e-05} +{"train_loss": 0.0035840151831507683, "global_step": 31238, "epoch": 262, "lr": 6.0361630877076444e-05} +{"train_loss": 0.0020289940293878317, "global_step": 31239, "epoch": 262, "lr": 6.0359463452233224e-05} +{"train_loss": 0.0033832555636763573, "global_step": 31240, "epoch": 262, "lr": 6.035729600705029e-05} +{"train_loss": 0.0038312498945742846, "global_step": 31241, "epoch": 262, "lr": 6.0355128541531925e-05} +{"train_loss": 0.0020777189638465643, "global_step": 31242, "epoch": 262, "lr": 6.0352961055682357e-05} +{"train_loss": 0.003434639424085617, "global_step": 31243, "epoch": 262, "lr": 6.0350793549505854e-05} +{"train_loss": 0.001962910406291485, "global_step": 31244, "epoch": 262, "lr": 6.034862602300668e-05} +{"train_loss": 0.0032769222743809223, "global_step": 31245, "epoch": 262, "lr": 6.034645847618908e-05} +{"train_loss": 0.00333805033005774, "global_step": 31246, "epoch": 262, "lr": 6.0344290909057325e-05} +{"train_loss": 0.0030255664605647326, "global_step": 31247, "epoch": 262, "lr": 6.034212332161566e-05} +{"train_loss": 0.0033784848637878895, "global_step": 31248, "epoch": 262, "lr": 6.0339955713868335e-05} +{"train_loss": 0.0019014769932255149, "global_step": 31249, "epoch": 262, "lr": 6.0337788085819614e-05} +{"train_loss": 0.0013999984366819263, "global_step": 31250, "epoch": 262, "lr": 6.033562043747374e-05} +{"train_loss": 0.0021353766787797213, "global_step": 31251, "epoch": 262, "lr": 6.0333452768834984e-05} +{"train_loss": 0.0047236280515789986, "global_step": 31252, "epoch": 262, "lr": 6.0331285079907606e-05} +{"train_loss": 0.0031645570416003466, "global_step": 31253, "epoch": 262, "lr": 6.032911737069584e-05} +{"train_loss": 0.0012941989116370678, "global_step": 31254, "epoch": 262, "lr": 6.032694964120397e-05} +{"train_loss": 0.0023637276608496904, "global_step": 31255, "epoch": 262, "lr": 6.032478189143622e-05} +{"train_loss": 0.0023257152643054724, "global_step": 31256, "epoch": 262, "lr": 6.032261412139688e-05} +{"train_loss": 0.0015980267198756337, "global_step": 31257, "epoch": 262, "lr": 6.032044633109019e-05} +{"train_loss": 0.0031695703510195017, "global_step": 31258, "epoch": 262, "lr": 6.031827852052039e-05} +{"train_loss": 0.0042454819194972515, "global_step": 31259, "epoch": 262, "lr": 6.0316110689691764e-05} +{"train_loss": 0.0028100227937102318, "global_step": 31260, "epoch": 262, "lr": 6.0313942838608575e-05} +{"train_loss": 0.002791461767628789, "global_step": 31261, "epoch": 262, "lr": 6.031177496727504e-05} +{"train_loss": 0.0020042930264025927, "global_step": 31262, "epoch": 262, "lr": 6.0309607075695426e-05} +{"train_loss": 0.004993523005396128, "global_step": 31263, "epoch": 262, "lr": 6.0307439163874026e-05} +{"train_loss": 0.0032661573495715857, "global_step": 31264, "epoch": 262, "lr": 6.030527123181505e-05} +{"train_loss": 0.003349236212670803, "global_step": 31265, "epoch": 262, "lr": 6.0303103279522774e-05} +{"train_loss": 0.0019021533662453294, "global_step": 31266, "epoch": 262, "lr": 6.030093530700148e-05} +{"train_loss": 0.002008836716413498, "global_step": 31267, "epoch": 262, "lr": 6.029876731425538e-05} +{"train_loss": 0.0049861157312989235, "global_step": 31268, "epoch": 262, "lr": 6.029659930128876e-05} +{"train_loss": 0.00215702666901052, "global_step": 31269, "epoch": 262, "lr": 6.029443126810586e-05} +{"train_loss": 0.0018156442092731595, "global_step": 31270, "epoch": 262, "lr": 6.0292263214710944e-05} +{"train_loss": 0.0019382697064429522, "global_step": 31271, "epoch": 262, "lr": 6.029009514110826e-05} +{"train_loss": 0.00270497752353549, "global_step": 31272, "epoch": 262, "lr": 6.0287927047302084e-05} +{"train_loss": 0.002975077833980322, "global_step": 31273, "epoch": 262, "lr": 6.028575893329666e-05} +{"train_loss": 0.002015308476984501, "global_step": 31274, "epoch": 262, "lr": 6.0283590799096255e-05} +{"train_loss": 0.0034118283074349165, "global_step": 31275, "epoch": 262, "lr": 6.028142264470511e-05} +{"train_loss": 0.004287774208933115, "global_step": 31276, "epoch": 262, "lr": 6.027925447012749e-05} +{"train_loss": 0.002836858620867133, "global_step": 31277, "epoch": 262, "lr": 6.0277086275367654e-05} +{"train_loss": 0.0052270712330937386, "global_step": 31278, "epoch": 262, "lr": 6.0274918060429855e-05} +{"train_loss": 0.0027561199385672808, "global_step": 31279, "epoch": 262, "lr": 6.027274982531837e-05} +{"train_loss": 0.0025800494477152824, "global_step": 31280, "epoch": 262, "lr": 6.027058157003742e-05} +{"train_loss": 0.002458629896864295, "global_step": 31281, "epoch": 262, "lr": 6.026841329459127e-05} +{"train_loss": 0.002267837291583419, "global_step": 31282, "epoch": 262, "lr": 6.026624499898421e-05} +{"train_loss": 0.004462274722754955, "global_step": 31283, "epoch": 262, "lr": 6.026407668322046e-05} +{"train_loss": 0.004928946029394865, "global_step": 31284, "epoch": 262, "lr": 6.02619083473043e-05} +{"train_loss": 0.0032628015615046024, "global_step": 31285, "epoch": 262, "lr": 6.025973999123998e-05} +{"train_loss": 0.004094551783055067, "global_step": 31286, "epoch": 262, "lr": 6.025757161503175e-05} +{"train_loss": 0.0033640097826719284, "global_step": 31287, "epoch": 262, "lr": 6.025540321868387e-05} +{"train_loss": 0.0037050850223749876, "global_step": 31288, "epoch": 262, "lr": 6.025323480220061e-05} +{"train_loss": 0.0029115797951817513, "global_step": 31289, "epoch": 262, "lr": 6.025106636558622e-05} +{"train_loss": 0.002758789574727416, "global_step": 31290, "epoch": 262, "lr": 6.024889790884495e-05} +{"train_loss": 0.002330777468159795, "global_step": 31291, "epoch": 262, "lr": 6.024672943198108e-05} +{"train_loss": 0.002492425264790654, "global_step": 31292, "epoch": 262, "lr": 6.0244560934998836e-05} +{"train_loss": 0.004937421064823866, "global_step": 31293, "epoch": 262, "lr": 6.024239241790249e-05} +{"train_loss": 0.0026174394879490137, "global_step": 31294, "epoch": 262, "lr": 6.024022388069631e-05} +{"train_loss": 0.003917702939361334, "global_step": 31295, "epoch": 262, "lr": 6.0238055323384533e-05} +{"train_loss": 0.003032618436078001, "global_step": 31296, "epoch": 262, "lr": 6.023588674597144e-05, "val_loss": 0.01825743541121483} +{"train_loss": 0.0035805213265120983, "global_step": 31297, "epoch": 263, "lr": 6.023371814846128e-05} +{"train_loss": 0.002948295557871461, "global_step": 31298, "epoch": 263, "lr": 6.02315495308583e-05} +{"train_loss": 0.002904875436797738, "global_step": 31299, "epoch": 263, "lr": 6.022938089316677e-05} +{"train_loss": 0.0026767419185489416, "global_step": 31300, "epoch": 263, "lr": 6.022721223539093e-05} +{"train_loss": 0.003665971802547574, "global_step": 31301, "epoch": 263, "lr": 6.0225043557535054e-05} +{"train_loss": 0.0020683312322944403, "global_step": 31302, "epoch": 263, "lr": 6.022287485960341e-05} +{"train_loss": 0.004715359769761562, "global_step": 31303, "epoch": 263, "lr": 6.0220706141600226e-05} +{"train_loss": 0.002472992753610015, "global_step": 31304, "epoch": 263, "lr": 6.021853740352978e-05} +{"train_loss": 0.003999441396445036, "global_step": 31305, "epoch": 263, "lr": 6.021636864539635e-05} +{"train_loss": 0.002128058345988393, "global_step": 31306, "epoch": 263, "lr": 6.021419986720414e-05} +{"train_loss": 0.003191168187186122, "global_step": 31307, "epoch": 263, "lr": 6.0212031068957464e-05} +{"train_loss": 0.0028592227026820183, "global_step": 31308, "epoch": 263, "lr": 6.020986225066055e-05} +{"train_loss": 0.0027221168857067823, "global_step": 31309, "epoch": 263, "lr": 6.020769341231766e-05} +{"train_loss": 0.0038976159412413836, "global_step": 31310, "epoch": 263, "lr": 6.020552455393307e-05} +{"train_loss": 0.0022754683159291744, "global_step": 31311, "epoch": 263, "lr": 6.020335567551101e-05} +{"train_loss": 0.0028019340243190527, "global_step": 31312, "epoch": 263, "lr": 6.020118677705574e-05} +{"train_loss": 0.0026680759619921446, "global_step": 31313, "epoch": 263, "lr": 6.019901785857154e-05} +{"train_loss": 0.0026331807021051645, "global_step": 31314, "epoch": 263, "lr": 6.0196848920062655e-05} +{"train_loss": 0.0020476505160331726, "global_step": 31315, "epoch": 263, "lr": 6.0194679961533354e-05} +{"train_loss": 0.0029053757898509502, "global_step": 31316, "epoch": 263, "lr": 6.019251098298788e-05} +{"train_loss": 0.003591373795643449, "global_step": 31317, "epoch": 263, "lr": 6.019034198443051e-05} +{"train_loss": 0.002408693078905344, "global_step": 31318, "epoch": 263, "lr": 6.0188172965865474e-05} +{"train_loss": 0.00232818815857172, "global_step": 31319, "epoch": 263, "lr": 6.018600392729706e-05} +{"train_loss": 0.0026661355514079332, "global_step": 31320, "epoch": 263, "lr": 6.018383486872952e-05} +{"train_loss": 0.003939017187803984, "global_step": 31321, "epoch": 263, "lr": 6.018166579016708e-05} +{"train_loss": 0.003376930020749569, "global_step": 31322, "epoch": 263, "lr": 6.017949669161407e-05} +{"train_loss": 0.003491027280688286, "global_step": 31323, "epoch": 263, "lr": 6.017732757307468e-05} +{"train_loss": 0.0026041255332529545, "global_step": 31324, "epoch": 263, "lr": 6.01751584345532e-05} +{"train_loss": 0.002903995104134083, "global_step": 31325, "epoch": 263, "lr": 6.017298927605388e-05} +{"train_loss": 0.0026957362424582243, "global_step": 31326, "epoch": 263, "lr": 6.017082009758099e-05} +{"train_loss": 0.0029365026857703924, "global_step": 31327, "epoch": 263, "lr": 6.016865089913878e-05} +{"train_loss": 0.0020038001239299774, "global_step": 31328, "epoch": 263, "lr": 6.01664816807315e-05} +{"train_loss": 0.0032035326585173607, "global_step": 31329, "epoch": 263, "lr": 6.016431244236345e-05} +{"train_loss": 0.0037346642930060625, "global_step": 31330, "epoch": 263, "lr": 6.0162143184038835e-05} +{"train_loss": 0.0023613846860826015, "global_step": 31331, "epoch": 263, "lr": 6.0159973905761935e-05} +{"train_loss": 0.0017883969703689218, "global_step": 31332, "epoch": 263, "lr": 6.0157804607537e-05} +{"train_loss": 0.0016243213322013617, "global_step": 31333, "epoch": 263, "lr": 6.0155635289368315e-05} +{"train_loss": 0.0031518784817308187, "global_step": 31334, "epoch": 263, "lr": 6.015346595126014e-05} +{"train_loss": 0.0035071494057774544, "global_step": 31335, "epoch": 263, "lr": 6.01512965932167e-05} +{"train_loss": 0.002880136016756296, "global_step": 31336, "epoch": 263, "lr": 6.014912721524228e-05} +{"train_loss": 0.004647049121558666, "global_step": 31337, "epoch": 263, "lr": 6.014695781734112e-05} +{"train_loss": 0.004222049843519926, "global_step": 31338, "epoch": 263, "lr": 6.0144788399517504e-05} +{"train_loss": 0.0037109232507646084, "global_step": 31339, "epoch": 263, "lr": 6.014261896177569e-05} +{"train_loss": 0.0019788003992289305, "global_step": 31340, "epoch": 263, "lr": 6.014044950411991e-05} +{"train_loss": 0.0022805118933320045, "global_step": 31341, "epoch": 263, "lr": 6.013828002655446e-05} +{"train_loss": 0.0017006071284413338, "global_step": 31342, "epoch": 263, "lr": 6.013611052908357e-05} +{"train_loss": 0.004490272607654333, "global_step": 31343, "epoch": 263, "lr": 6.01339410117115e-05} +{"train_loss": 0.0022390619851648808, "global_step": 31344, "epoch": 263, "lr": 6.0131771474442534e-05} +{"train_loss": 0.0027902640867978334, "global_step": 31345, "epoch": 263, "lr": 6.01296019172809e-05} +{"train_loss": 0.002351021161302924, "global_step": 31346, "epoch": 263, "lr": 6.0127432340230886e-05} +{"train_loss": 0.002301278058439493, "global_step": 31347, "epoch": 263, "lr": 6.012526274329674e-05} +{"train_loss": 0.004070265684276819, "global_step": 31348, "epoch": 263, "lr": 6.0123093126482735e-05} +{"train_loss": 0.002707874868065119, "global_step": 31349, "epoch": 263, "lr": 6.01209234897931e-05} +{"train_loss": 0.003174549899995327, "global_step": 31350, "epoch": 263, "lr": 6.011875383323212e-05} +{"train_loss": 0.0023629043716937304, "global_step": 31351, "epoch": 263, "lr": 6.011658415680404e-05} +{"train_loss": 0.0019667446613311768, "global_step": 31352, "epoch": 263, "lr": 6.011441446051314e-05} +{"train_loss": 0.0030836479272693396, "global_step": 31353, "epoch": 263, "lr": 6.0112244744363654e-05} +{"train_loss": 0.003913733176887035, "global_step": 31354, "epoch": 263, "lr": 6.011007500835987e-05} +{"train_loss": 0.0025001452304422855, "global_step": 31355, "epoch": 263, "lr": 6.0107905252506025e-05} +{"train_loss": 0.004997064359486103, "global_step": 31356, "epoch": 263, "lr": 6.010573547680639e-05} +{"train_loss": 0.001926935976371169, "global_step": 31357, "epoch": 263, "lr": 6.0103565681265214e-05} +{"train_loss": 0.002590416930615902, "global_step": 31358, "epoch": 263, "lr": 6.0101395865886776e-05} +{"train_loss": 0.002775682369247079, "global_step": 31359, "epoch": 263, "lr": 6.0099226030675325e-05} +{"train_loss": 0.002326840301975608, "global_step": 31360, "epoch": 263, "lr": 6.009705617563514e-05} +{"train_loss": 0.002882425906136632, "global_step": 31361, "epoch": 263, "lr": 6.009488630077045e-05} +{"train_loss": 0.0017616472905501723, "global_step": 31362, "epoch": 263, "lr": 6.0092716406085523e-05} +{"train_loss": 0.0017431376036256552, "global_step": 31363, "epoch": 263, "lr": 6.0090546491584633e-05} +{"train_loss": 0.0030913951341062784, "global_step": 31364, "epoch": 263, "lr": 6.008837655727202e-05} +{"train_loss": 0.0024038117844611406, "global_step": 31365, "epoch": 263, "lr": 6.008620660315196e-05} +{"train_loss": 0.0027522712480276823, "global_step": 31366, "epoch": 263, "lr": 6.008403662922873e-05} +{"train_loss": 0.001864010002464056, "global_step": 31367, "epoch": 263, "lr": 6.0081866635506566e-05} +{"train_loss": 0.0032092530746012926, "global_step": 31368, "epoch": 263, "lr": 6.007969662198972e-05} +{"train_loss": 0.0053087263368070126, "global_step": 31369, "epoch": 263, "lr": 6.007752658868248e-05} +{"train_loss": 0.0026699702721089125, "global_step": 31370, "epoch": 263, "lr": 6.007535653558907e-05} +{"train_loss": 0.0034067064989358187, "global_step": 31371, "epoch": 263, "lr": 6.007318646271379e-05} +{"train_loss": 0.0026187668554484844, "global_step": 31372, "epoch": 263, "lr": 6.007101637006089e-05} +{"train_loss": 0.0018245598766952753, "global_step": 31373, "epoch": 263, "lr": 6.006884625763463e-05} +{"train_loss": 0.0029629236087203026, "global_step": 31374, "epoch": 263, "lr": 6.006667612543925e-05} +{"train_loss": 0.003075291635468602, "global_step": 31375, "epoch": 263, "lr": 6.0064505973479036e-05} +{"train_loss": 0.002885320456698537, "global_step": 31376, "epoch": 263, "lr": 6.006233580175823e-05} +{"train_loss": 0.003457066835835576, "global_step": 31377, "epoch": 263, "lr": 6.0060165610281115e-05} +{"train_loss": 0.001977457432076335, "global_step": 31378, "epoch": 263, "lr": 6.0057995399051926e-05} +{"train_loss": 0.0033280712086707354, "global_step": 31379, "epoch": 263, "lr": 6.0055825168074956e-05} +{"train_loss": 0.002196433488279581, "global_step": 31380, "epoch": 263, "lr": 6.005365491735444e-05} +{"train_loss": 0.0026112026534974575, "global_step": 31381, "epoch": 263, "lr": 6.005148464689464e-05} +{"train_loss": 0.003600160591304302, "global_step": 31382, "epoch": 263, "lr": 6.0049314356699824e-05} +{"train_loss": 0.0027982040774077177, "global_step": 31383, "epoch": 263, "lr": 6.004714404677426e-05} +{"train_loss": 0.0020553944632411003, "global_step": 31384, "epoch": 263, "lr": 6.00449737171222e-05} +{"train_loss": 0.002870632102712989, "global_step": 31385, "epoch": 263, "lr": 6.00428033677479e-05} +{"train_loss": 0.0022376812994480133, "global_step": 31386, "epoch": 263, "lr": 6.004063299865563e-05} +{"train_loss": 0.003616817994043231, "global_step": 31387, "epoch": 263, "lr": 6.003846260984967e-05} +{"train_loss": 0.0017494307830929756, "global_step": 31388, "epoch": 263, "lr": 6.0036292201334234e-05} +{"train_loss": 0.002523987088352442, "global_step": 31389, "epoch": 263, "lr": 6.003412177311363e-05} +{"train_loss": 0.002322807442396879, "global_step": 31390, "epoch": 263, "lr": 6.003195132519208e-05} +{"train_loss": 0.0028554031159728765, "global_step": 31391, "epoch": 263, "lr": 6.002978085757389e-05} +{"train_loss": 0.004501143004745245, "global_step": 31392, "epoch": 263, "lr": 6.002761037026329e-05} +{"train_loss": 0.0028885439969599247, "global_step": 31393, "epoch": 263, "lr": 6.0025439863264534e-05} +{"train_loss": 0.002414785325527191, "global_step": 31394, "epoch": 263, "lr": 6.002326933658191e-05} +{"train_loss": 0.00191440898925066, "global_step": 31395, "epoch": 263, "lr": 6.002109879021966e-05} +{"train_loss": 0.00457130279392004, "global_step": 31396, "epoch": 263, "lr": 6.001892822418206e-05} +{"train_loss": 0.003017138224095106, "global_step": 31397, "epoch": 263, "lr": 6.001675763847335e-05} +{"train_loss": 0.0032425178214907646, "global_step": 31398, "epoch": 263, "lr": 6.001458703309784e-05} +{"train_loss": 0.002519849454984069, "global_step": 31399, "epoch": 263, "lr": 6.001241640805973e-05} +{"train_loss": 0.002793730003759265, "global_step": 31400, "epoch": 263, "lr": 6.001024576336332e-05} +{"train_loss": 0.0028423082549124956, "global_step": 31401, "epoch": 263, "lr": 6.000807509901285e-05} +{"train_loss": 0.002317070262506604, "global_step": 31402, "epoch": 263, "lr": 6.000590441501261e-05} +{"train_loss": 0.0028642842080444098, "global_step": 31403, "epoch": 263, "lr": 6.000373371136683e-05} +{"train_loss": 0.001718956045806408, "global_step": 31404, "epoch": 263, "lr": 6.00015629880798e-05} +{"train_loss": 0.001921671093441546, "global_step": 31405, "epoch": 263, "lr": 5.999939224515576e-05} +{"train_loss": 0.0036348330322653055, "global_step": 31406, "epoch": 263, "lr": 5.9997221482598986e-05} +{"train_loss": 0.0029652223456650972, "global_step": 31407, "epoch": 263, "lr": 5.9995050700413734e-05} +{"train_loss": 0.0032944446429610252, "global_step": 31408, "epoch": 263, "lr": 5.999287989860427e-05} +{"train_loss": 0.0035326529759913683, "global_step": 31409, "epoch": 263, "lr": 5.9990709077174845e-05} +{"train_loss": 0.004275893326848745, "global_step": 31410, "epoch": 263, "lr": 5.9988538236129754e-05} +{"train_loss": 0.001659258152358234, "global_step": 31411, "epoch": 263, "lr": 5.998636737547322e-05} +{"train_loss": 0.0013820211170241237, "global_step": 31412, "epoch": 263, "lr": 5.998419649520952e-05} +{"train_loss": 0.0030974755063652992, "global_step": 31413, "epoch": 263, "lr": 5.998202559534292e-05} +{"train_loss": 0.002727789105847478, "global_step": 31414, "epoch": 263, "lr": 5.997985467587767e-05} +{"train_loss": 0.0028698916944182094, "global_step": 31415, "epoch": 263, "lr": 5.9977683736818044e-05, "val_loss": 0.010996072553098202} +{"train_loss": 0.0031186151318252087, "global_step": 31416, "epoch": 264, "lr": 5.9975512778168316e-05} +{"train_loss": 0.002747592981904745, "global_step": 31417, "epoch": 264, "lr": 5.997334179993273e-05} +{"train_loss": 0.0017466330900788307, "global_step": 31418, "epoch": 264, "lr": 5.997117080211554e-05} +{"train_loss": 0.003388874465599656, "global_step": 31419, "epoch": 264, "lr": 5.996899978472103e-05} +{"train_loss": 0.0043794638477265835, "global_step": 31420, "epoch": 264, "lr": 5.996682874775344e-05} +{"train_loss": 0.00256224162876606, "global_step": 31421, "epoch": 264, "lr": 5.9964657691217063e-05} +{"train_loss": 0.003833724418655038, "global_step": 31422, "epoch": 264, "lr": 5.996248661511614e-05} +{"train_loss": 0.003188173519447446, "global_step": 31423, "epoch": 264, "lr": 5.9960315519454946e-05} +{"train_loss": 0.0027976767159998417, "global_step": 31424, "epoch": 264, "lr": 5.995814440423774e-05} +{"train_loss": 0.004304356407374144, "global_step": 31425, "epoch": 264, "lr": 5.9955973269468766e-05} +{"train_loss": 0.0017743937205523252, "global_step": 31426, "epoch": 264, "lr": 5.99538021151523e-05} +{"train_loss": 0.003231968032196164, "global_step": 31427, "epoch": 264, "lr": 5.995163094129262e-05} +{"train_loss": 0.0016562228556722403, "global_step": 31428, "epoch": 264, "lr": 5.994945974789397e-05} +{"train_loss": 0.004627409856766462, "global_step": 31429, "epoch": 264, "lr": 5.9947288534960634e-05} +{"train_loss": 0.003193480661138892, "global_step": 31430, "epoch": 264, "lr": 5.994511730249685e-05} +{"train_loss": 0.003074208041653037, "global_step": 31431, "epoch": 264, "lr": 5.994294605050688e-05} +{"train_loss": 0.0021769655868411064, "global_step": 31432, "epoch": 264, "lr": 5.9940774778995e-05} +{"train_loss": 0.0025978111661970615, "global_step": 31433, "epoch": 264, "lr": 5.993860348796547e-05} +{"train_loss": 0.002221106318756938, "global_step": 31434, "epoch": 264, "lr": 5.993643217742256e-05} +{"train_loss": 0.004413502290844917, "global_step": 31435, "epoch": 264, "lr": 5.9934260847370524e-05} +{"train_loss": 0.003348996862769127, "global_step": 31436, "epoch": 264, "lr": 5.993208949781363e-05} +{"train_loss": 0.0017646016785874963, "global_step": 31437, "epoch": 264, "lr": 5.9929918128756136e-05} +{"train_loss": 0.002869828138500452, "global_step": 31438, "epoch": 264, "lr": 5.992774674020232e-05} +{"train_loss": 0.002549421042203903, "global_step": 31439, "epoch": 264, "lr": 5.9925575332156414e-05} +{"train_loss": 0.0029657480772584677, "global_step": 31440, "epoch": 264, "lr": 5.992340390462271e-05} +{"train_loss": 0.002365384716540575, "global_step": 31441, "epoch": 264, "lr": 5.992123245760548e-05} +{"train_loss": 0.003450117539614439, "global_step": 31442, "epoch": 264, "lr": 5.991906099110895e-05} +{"train_loss": 0.0025697879027575254, "global_step": 31443, "epoch": 264, "lr": 5.991688950513741e-05} +{"train_loss": 0.002316151512786746, "global_step": 31444, "epoch": 264, "lr": 5.9914717999695116e-05} +{"train_loss": 0.002879691543057561, "global_step": 31445, "epoch": 264, "lr": 5.991254647478633e-05} +{"train_loss": 0.0019363599130883813, "global_step": 31446, "epoch": 264, "lr": 5.991037493041532e-05} +{"train_loss": 0.0024239341728389263, "global_step": 31447, "epoch": 264, "lr": 5.9908203366586344e-05} +{"train_loss": 0.0021388076711446047, "global_step": 31448, "epoch": 264, "lr": 5.990603178330368e-05} +{"train_loss": 0.0015527469804510474, "global_step": 31449, "epoch": 264, "lr": 5.990386018057158e-05} +{"train_loss": 0.0031092825811356306, "global_step": 31450, "epoch": 264, "lr": 5.99016885583943e-05} +{"train_loss": 0.0022179826628416777, "global_step": 31451, "epoch": 264, "lr": 5.989951691677611e-05} +{"train_loss": 0.003339493414387107, "global_step": 31452, "epoch": 264, "lr": 5.989734525572128e-05} +{"train_loss": 0.0017618087586015463, "global_step": 31453, "epoch": 264, "lr": 5.9895173575234076e-05} +{"train_loss": 0.002370112109929323, "global_step": 31454, "epoch": 264, "lr": 5.9893001875318745e-05} +{"train_loss": 0.0031440684106200933, "global_step": 31455, "epoch": 264, "lr": 5.9890830155979574e-05} +{"train_loss": 0.0031126344110816717, "global_step": 31456, "epoch": 264, "lr": 5.98886584172208e-05} +{"train_loss": 0.001518503064289689, "global_step": 31457, "epoch": 264, "lr": 5.9886486659046716e-05} +{"train_loss": 0.0033198643941432238, "global_step": 31458, "epoch": 264, "lr": 5.9884314881461554e-05} +{"train_loss": 0.003722249763086438, "global_step": 31459, "epoch": 264, "lr": 5.988214308446961e-05} +{"train_loss": 0.005252556409686804, "global_step": 31460, "epoch": 264, "lr": 5.987997126807514e-05} +{"train_loss": 0.004626422189176083, "global_step": 31461, "epoch": 264, "lr": 5.98777994322824e-05} +{"train_loss": 0.002536074025556445, "global_step": 31462, "epoch": 264, "lr": 5.9875627577095636e-05} +{"train_loss": 0.0026416967157274485, "global_step": 31463, "epoch": 264, "lr": 5.987345570251916e-05} +{"train_loss": 0.0016205187421292067, "global_step": 31464, "epoch": 264, "lr": 5.987128380855719e-05} +{"train_loss": 0.0030114827677607536, "global_step": 31465, "epoch": 264, "lr": 5.9869111895214e-05} +{"train_loss": 0.002142007928341627, "global_step": 31466, "epoch": 264, "lr": 5.9866939962493886e-05} +{"train_loss": 0.004422847181558609, "global_step": 31467, "epoch": 264, "lr": 5.986476801040107e-05} +{"train_loss": 0.0025361734442412853, "global_step": 31468, "epoch": 264, "lr": 5.986259603893985e-05} +{"train_loss": 0.0022340172436088324, "global_step": 31469, "epoch": 264, "lr": 5.986042404811447e-05} +{"train_loss": 0.0036704200319945812, "global_step": 31470, "epoch": 264, "lr": 5.98582520379292e-05} +{"train_loss": 0.0019365114858374, "global_step": 31471, "epoch": 264, "lr": 5.9856080008388306e-05} +{"train_loss": 0.003156389109790325, "global_step": 31472, "epoch": 264, "lr": 5.985390795949606e-05} +{"train_loss": 0.0022191221360117197, "global_step": 31473, "epoch": 264, "lr": 5.985173589125671e-05} +{"train_loss": 0.003302233060821891, "global_step": 31474, "epoch": 264, "lr": 5.984956380367453e-05} +{"train_loss": 0.00301063759252429, "global_step": 31475, "epoch": 264, "lr": 5.9847391696753786e-05} +{"train_loss": 0.0025021573528647423, "global_step": 31476, "epoch": 264, "lr": 5.9845219570498746e-05} +{"train_loss": 0.0036192433908581734, "global_step": 31477, "epoch": 264, "lr": 5.9843047424913656e-05} +{"train_loss": 0.0031102041248232126, "global_step": 31478, "epoch": 264, "lr": 5.9840875260002804e-05} +{"train_loss": 0.006515332031995058, "global_step": 31479, "epoch": 264, "lr": 5.983870307577044e-05} +{"train_loss": 0.0036136603448539972, "global_step": 31480, "epoch": 264, "lr": 5.9836530872220845e-05} +{"train_loss": 0.0035249062348157167, "global_step": 31481, "epoch": 264, "lr": 5.9834358649358255e-05} +{"train_loss": 0.0026677337009459734, "global_step": 31482, "epoch": 264, "lr": 5.983218640718696e-05} +{"train_loss": 0.002194676548242569, "global_step": 31483, "epoch": 264, "lr": 5.983001414571122e-05} +{"train_loss": 0.002362241270020604, "global_step": 31484, "epoch": 264, "lr": 5.982784186493529e-05} +{"train_loss": 0.0025974304880946875, "global_step": 31485, "epoch": 264, "lr": 5.982566956486345e-05} +{"train_loss": 0.003776386845856905, "global_step": 31486, "epoch": 264, "lr": 5.982349724549995e-05} +{"train_loss": 0.003115468192845583, "global_step": 31487, "epoch": 264, "lr": 5.982132490684906e-05} +{"train_loss": 0.0035769466776400805, "global_step": 31488, "epoch": 264, "lr": 5.981915254891506e-05} +{"train_loss": 0.004711551126092672, "global_step": 31489, "epoch": 264, "lr": 5.9816980171702196e-05} +{"train_loss": 0.0026223163586109877, "global_step": 31490, "epoch": 264, "lr": 5.9814807775214746e-05} +{"train_loss": 0.0032923973631113768, "global_step": 31491, "epoch": 264, "lr": 5.981263535945696e-05} +{"train_loss": 0.003861186560243368, "global_step": 31492, "epoch": 264, "lr": 5.981046292443313e-05} +{"train_loss": 0.0041726939380168915, "global_step": 31493, "epoch": 264, "lr": 5.980829047014749e-05} +{"train_loss": 0.002660157857462764, "global_step": 31494, "epoch": 264, "lr": 5.9806117996604325e-05} +{"train_loss": 0.0033957259729504585, "global_step": 31495, "epoch": 264, "lr": 5.980394550380789e-05} +{"train_loss": 0.003245006315410137, "global_step": 31496, "epoch": 264, "lr": 5.980177299176246e-05} +{"train_loss": 0.0028446705546230078, "global_step": 31497, "epoch": 264, "lr": 5.979960046047228e-05} +{"train_loss": 0.004085858818143606, "global_step": 31498, "epoch": 264, "lr": 5.979742790994166e-05} +{"train_loss": 0.002676479984074831, "global_step": 31499, "epoch": 264, "lr": 5.9795255340174825e-05} +{"train_loss": 0.003950509708374739, "global_step": 31500, "epoch": 264, "lr": 5.9793082751176044e-05} +{"train_loss": 0.002525153337046504, "global_step": 31501, "epoch": 264, "lr": 5.9790910142949594e-05} +{"train_loss": 0.0021804324351251125, "global_step": 31502, "epoch": 264, "lr": 5.9788737515499746e-05} +{"train_loss": 0.0033062042202800512, "global_step": 31503, "epoch": 264, "lr": 5.978656486883074e-05} +{"train_loss": 0.005343143828213215, "global_step": 31504, "epoch": 264, "lr": 5.978439220294688e-05} +{"train_loss": 0.002282824832946062, "global_step": 31505, "epoch": 264, "lr": 5.97822195178524e-05} +{"train_loss": 0.004964480176568031, "global_step": 31506, "epoch": 264, "lr": 5.9780046813551584e-05} +{"train_loss": 0.0032403937075287104, "global_step": 31507, "epoch": 264, "lr": 5.977787409004868e-05} +{"train_loss": 0.0021666591055691242, "global_step": 31508, "epoch": 264, "lr": 5.977570134734798e-05} +{"train_loss": 0.003001229604706168, "global_step": 31509, "epoch": 264, "lr": 5.977352858545372e-05} +{"train_loss": 0.003689511911943555, "global_step": 31510, "epoch": 264, "lr": 5.97713558043702e-05} +{"train_loss": 0.0035665947943925858, "global_step": 31511, "epoch": 264, "lr": 5.976918300410165e-05} +{"train_loss": 0.003332652384415269, "global_step": 31512, "epoch": 264, "lr": 5.976701018465236e-05} +{"train_loss": 0.0032063208054751158, "global_step": 31513, "epoch": 264, "lr": 5.976483734602658e-05} +{"train_loss": 0.0032189516350626945, "global_step": 31514, "epoch": 264, "lr": 5.976266448822859e-05} +{"train_loss": 0.0033977613784372807, "global_step": 31515, "epoch": 264, "lr": 5.976049161126265e-05} +{"train_loss": 0.0032590911723673344, "global_step": 31516, "epoch": 264, "lr": 5.9758318715133034e-05} +{"train_loss": 0.0044322023168206215, "global_step": 31517, "epoch": 264, "lr": 5.9756145799844e-05} +{"train_loss": 0.0020521997939795256, "global_step": 31518, "epoch": 264, "lr": 5.975397286539981e-05} +{"train_loss": 0.0028480507899075747, "global_step": 31519, "epoch": 264, "lr": 5.975179991180474e-05} +{"train_loss": 0.003266390645876527, "global_step": 31520, "epoch": 264, "lr": 5.9749626939063056e-05} +{"train_loss": 0.002555078361183405, "global_step": 31521, "epoch": 264, "lr": 5.974745394717901e-05} +{"train_loss": 0.004538997542113066, "global_step": 31522, "epoch": 264, "lr": 5.974528093615689e-05} +{"train_loss": 0.0023696243297308683, "global_step": 31523, "epoch": 264, "lr": 5.974310790600095e-05} +{"train_loss": 0.0034966119565069675, "global_step": 31524, "epoch": 264, "lr": 5.974093485671546e-05} +{"train_loss": 0.003414782462641597, "global_step": 31525, "epoch": 264, "lr": 5.973876178830469e-05} +{"train_loss": 0.0028047491796314716, "global_step": 31526, "epoch": 264, "lr": 5.973658870077289e-05} +{"train_loss": 0.0016368047799915075, "global_step": 31527, "epoch": 264, "lr": 5.9734415594124335e-05} +{"train_loss": 0.002894460689276457, "global_step": 31528, "epoch": 264, "lr": 5.973224246836331e-05} +{"train_loss": 0.0024727904237806797, "global_step": 31529, "epoch": 264, "lr": 5.973006932349407e-05} +{"train_loss": 0.0036522247828543186, "global_step": 31530, "epoch": 264, "lr": 5.972789615952086e-05} +{"train_loss": 0.00384672824293375, "global_step": 31531, "epoch": 264, "lr": 5.972572297644797e-05} +{"train_loss": 0.002807954791933298, "global_step": 31532, "epoch": 264, "lr": 5.972354977427966e-05} +{"train_loss": 0.0018131800461560488, "global_step": 31533, "epoch": 264, "lr": 5.9721376553020217e-05} +{"train_loss": 0.003061000515996408, "global_step": 31534, "epoch": 264, "lr": 5.971920331267387e-05, "val_loss": 0.02626223862171173} +{"train_loss": 0.005279085598886013, "global_step": 31535, "epoch": 265, "lr": 5.9717030053244904e-05} +{"train_loss": 0.0023848298005759716, "global_step": 31536, "epoch": 265, "lr": 5.971485677473761e-05} +{"train_loss": 0.002666416810825467, "global_step": 31537, "epoch": 265, "lr": 5.9712683477156206e-05} +{"train_loss": 0.003357989015057683, "global_step": 31538, "epoch": 265, "lr": 5.9710510160504996e-05} +{"train_loss": 0.00271270121447742, "global_step": 31539, "epoch": 265, "lr": 5.970833682478823e-05} +{"train_loss": 0.0020645938348025084, "global_step": 31540, "epoch": 265, "lr": 5.97061634700102e-05} +{"train_loss": 0.002798699773848057, "global_step": 31541, "epoch": 265, "lr": 5.9703990096175145e-05} +{"train_loss": 0.00217974791303277, "global_step": 31542, "epoch": 265, "lr": 5.970181670328735e-05} +{"train_loss": 0.002294756006449461, "global_step": 31543, "epoch": 265, "lr": 5.969964329135107e-05} +{"train_loss": 0.002209136728197336, "global_step": 31544, "epoch": 265, "lr": 5.969746986037057e-05} +{"train_loss": 0.0033456648234277964, "global_step": 31545, "epoch": 265, "lr": 5.969529641035012e-05} +{"train_loss": 0.002882413100451231, "global_step": 31546, "epoch": 265, "lr": 5.9693122941294e-05} +{"train_loss": 0.0026423048693686724, "global_step": 31547, "epoch": 265, "lr": 5.969094945320647e-05} +{"train_loss": 0.0015312983887270093, "global_step": 31548, "epoch": 265, "lr": 5.96887759460918e-05} +{"train_loss": 0.005712401587516069, "global_step": 31549, "epoch": 265, "lr": 5.968660241995425e-05} +{"train_loss": 0.002204394433647394, "global_step": 31550, "epoch": 265, "lr": 5.968442887479808e-05} +{"train_loss": 0.0028556750621646643, "global_step": 31551, "epoch": 265, "lr": 5.968225531062757e-05} +{"train_loss": 0.0015437538968399167, "global_step": 31552, "epoch": 265, "lr": 5.968008172744699e-05} +{"train_loss": 0.0022513619624078274, "global_step": 31553, "epoch": 265, "lr": 5.967790812526061e-05} +{"train_loss": 0.002512164879590273, "global_step": 31554, "epoch": 265, "lr": 5.9675734504072703e-05} +{"train_loss": 0.0030550542287528515, "global_step": 31555, "epoch": 265, "lr": 5.96735608638875e-05} +{"train_loss": 0.003265642561018467, "global_step": 31556, "epoch": 265, "lr": 5.967138720470931e-05} +{"train_loss": 0.0028921940829604864, "global_step": 31557, "epoch": 265, "lr": 5.966921352654237e-05} +{"train_loss": 0.005477321799844503, "global_step": 31558, "epoch": 265, "lr": 5.966703982939097e-05} +{"train_loss": 0.0034692292101681232, "global_step": 31559, "epoch": 265, "lr": 5.966486611325936e-05} +{"train_loss": 0.0029754077550023794, "global_step": 31560, "epoch": 265, "lr": 5.966269237815184e-05} +{"train_loss": 0.0014373515732586384, "global_step": 31561, "epoch": 265, "lr": 5.966051862407265e-05} +{"train_loss": 0.004107038024812937, "global_step": 31562, "epoch": 265, "lr": 5.965834485102606e-05} +{"train_loss": 0.0021614073775708675, "global_step": 31563, "epoch": 265, "lr": 5.965617105901633e-05} +{"train_loss": 0.0013939630007371306, "global_step": 31564, "epoch": 265, "lr": 5.965399724804776e-05} +{"train_loss": 0.002368417102843523, "global_step": 31565, "epoch": 265, "lr": 5.965182341812459e-05} +{"train_loss": 0.003663053037598729, "global_step": 31566, "epoch": 265, "lr": 5.964964956925109e-05} +{"train_loss": 0.002180777955800295, "global_step": 31567, "epoch": 265, "lr": 5.9647475701431534e-05} +{"train_loss": 0.0036234213039278984, "global_step": 31568, "epoch": 265, "lr": 5.964530181467018e-05} +{"train_loss": 0.001824833918362856, "global_step": 31569, "epoch": 265, "lr": 5.964312790897133e-05} +{"train_loss": 0.004031901713460684, "global_step": 31570, "epoch": 265, "lr": 5.964095398433921e-05} +{"train_loss": 0.0020194065291434526, "global_step": 31571, "epoch": 265, "lr": 5.963878004077812e-05} +{"train_loss": 0.00307075516320765, "global_step": 31572, "epoch": 265, "lr": 5.96366060782923e-05} +{"train_loss": 0.0034324314910918474, "global_step": 31573, "epoch": 265, "lr": 5.963443209688606e-05} +{"train_loss": 0.0021429606713354588, "global_step": 31574, "epoch": 265, "lr": 5.963225809656362e-05} +{"train_loss": 0.002418489195406437, "global_step": 31575, "epoch": 265, "lr": 5.9630084077329276e-05} +{"train_loss": 0.0031137350015342236, "global_step": 31576, "epoch": 265, "lr": 5.962791003918729e-05} +{"train_loss": 0.003862055717036128, "global_step": 31577, "epoch": 265, "lr": 5.962573598214193e-05} +{"train_loss": 0.0024705599062144756, "global_step": 31578, "epoch": 265, "lr": 5.962356190619747e-05} +{"train_loss": 0.0038071544840931892, "global_step": 31579, "epoch": 265, "lr": 5.962138781135818e-05} +{"train_loss": 0.00149970140773803, "global_step": 31580, "epoch": 265, "lr": 5.9619213697628305e-05} +{"train_loss": 0.0029661571606993675, "global_step": 31581, "epoch": 265, "lr": 5.9617039565012144e-05} +{"train_loss": 0.002669330220669508, "global_step": 31582, "epoch": 265, "lr": 5.961486541351395e-05} +{"train_loss": 0.0014804044039919972, "global_step": 31583, "epoch": 265, "lr": 5.9612691243138e-05} +{"train_loss": 0.003102037822827697, "global_step": 31584, "epoch": 265, "lr": 5.961051705388855e-05} +{"train_loss": 0.0037810266949236393, "global_step": 31585, "epoch": 265, "lr": 5.9608342845769884e-05} +{"train_loss": 0.0025546858087182045, "global_step": 31586, "epoch": 265, "lr": 5.960616861878625e-05} +{"train_loss": 0.003149159951135516, "global_step": 31587, "epoch": 265, "lr": 5.960399437294194e-05} +{"train_loss": 0.002270003082230687, "global_step": 31588, "epoch": 265, "lr": 5.960182010824121e-05} +{"train_loss": 0.003043012460693717, "global_step": 31589, "epoch": 265, "lr": 5.9599645824688334e-05} +{"train_loss": 0.0033101451117545366, "global_step": 31590, "epoch": 265, "lr": 5.959747152228758e-05} +{"train_loss": 0.004039991181343794, "global_step": 31591, "epoch": 265, "lr": 5.959529720104321e-05} +{"train_loss": 0.001967214047908783, "global_step": 31592, "epoch": 265, "lr": 5.9593122860959515e-05} +{"train_loss": 0.0021942732855677605, "global_step": 31593, "epoch": 265, "lr": 5.9590948502040734e-05} +{"train_loss": 0.0041613331995904446, "global_step": 31594, "epoch": 265, "lr": 5.958877412429116e-05} +{"train_loss": 0.003097744192928076, "global_step": 31595, "epoch": 265, "lr": 5.958659972771504e-05} +{"train_loss": 0.002024955814704299, "global_step": 31596, "epoch": 265, "lr": 5.958442531231666e-05} +{"train_loss": 0.0022865459322929382, "global_step": 31597, "epoch": 265, "lr": 5.958225087810029e-05} +{"train_loss": 0.0033444056753069162, "global_step": 31598, "epoch": 265, "lr": 5.95800764250702e-05} +{"train_loss": 0.0018366866279393435, "global_step": 31599, "epoch": 265, "lr": 5.957790195323064e-05} +{"train_loss": 0.002648881869390607, "global_step": 31600, "epoch": 265, "lr": 5.957572746258588e-05} +{"train_loss": 0.0015276734484359622, "global_step": 31601, "epoch": 265, "lr": 5.957355295314022e-05} +{"train_loss": 0.0026413067243993282, "global_step": 31602, "epoch": 265, "lr": 5.9571378424897906e-05} +{"train_loss": 0.0027143945917487144, "global_step": 31603, "epoch": 265, "lr": 5.956920387786322e-05} +{"train_loss": 0.002367400098592043, "global_step": 31604, "epoch": 265, "lr": 5.956702931204043e-05} +{"train_loss": 0.0026752944104373455, "global_step": 31605, "epoch": 265, "lr": 5.9564854727433796e-05} +{"train_loss": 0.002714271657168865, "global_step": 31606, "epoch": 265, "lr": 5.9562680124047586e-05} +{"train_loss": 0.0021223907824605703, "global_step": 31607, "epoch": 265, "lr": 5.9560505501886077e-05} +{"train_loss": 0.003117918036878109, "global_step": 31608, "epoch": 265, "lr": 5.955833086095354e-05} +{"train_loss": 0.0014574361266568303, "global_step": 31609, "epoch": 265, "lr": 5.955615620125423e-05} +{"train_loss": 0.001196759520098567, "global_step": 31610, "epoch": 265, "lr": 5.9553981522792436e-05} +{"train_loss": 0.002981043653562665, "global_step": 31611, "epoch": 265, "lr": 5.955180682557243e-05} +{"train_loss": 0.0024854035582393408, "global_step": 31612, "epoch": 265, "lr": 5.9549632109598465e-05} +{"train_loss": 0.0027852251660078764, "global_step": 31613, "epoch": 265, "lr": 5.95474573748748e-05} +{"train_loss": 0.0017469157464802265, "global_step": 31614, "epoch": 265, "lr": 5.954528262140574e-05} +{"train_loss": 0.005123121663928032, "global_step": 31615, "epoch": 265, "lr": 5.954310784919553e-05} +{"train_loss": 0.0032892937306314707, "global_step": 31616, "epoch": 265, "lr": 5.954093305824846e-05} +{"train_loss": 0.00440671481192112, "global_step": 31617, "epoch": 265, "lr": 5.953875824856878e-05} +{"train_loss": 0.001548010273836553, "global_step": 31618, "epoch": 265, "lr": 5.953658342016076e-05} +{"train_loss": 0.0024523339234292507, "global_step": 31619, "epoch": 265, "lr": 5.953440857302869e-05} +{"train_loss": 0.0027736262418329716, "global_step": 31620, "epoch": 265, "lr": 5.953223370717681e-05} +{"train_loss": 0.0029532783664762974, "global_step": 31621, "epoch": 265, "lr": 5.953005882260942e-05} +{"train_loss": 0.0012498053256422281, "global_step": 31622, "epoch": 265, "lr": 5.952788391933078e-05} +{"train_loss": 0.003492632182314992, "global_step": 31623, "epoch": 265, "lr": 5.9525708997345165e-05} +{"train_loss": 0.0024270527064800262, "global_step": 31624, "epoch": 265, "lr": 5.952353405665683e-05} +{"train_loss": 0.003154084552079439, "global_step": 31625, "epoch": 265, "lr": 5.9521359097270035e-05} +{"train_loss": 0.0033852059859782457, "global_step": 31626, "epoch": 265, "lr": 5.951918411918909e-05} +{"train_loss": 0.0028741424903273582, "global_step": 31627, "epoch": 265, "lr": 5.9517009122418234e-05} +{"train_loss": 0.0011489897733554244, "global_step": 31628, "epoch": 265, "lr": 5.951483410696175e-05} +{"train_loss": 0.004577871412038803, "global_step": 31629, "epoch": 265, "lr": 5.951265907282392e-05} +{"train_loss": 0.00328898336738348, "global_step": 31630, "epoch": 265, "lr": 5.951048402000898e-05} +{"train_loss": 0.0022279242984950542, "global_step": 31631, "epoch": 265, "lr": 5.950830894852123e-05} +{"train_loss": 0.0026913031470030546, "global_step": 31632, "epoch": 265, "lr": 5.950613385836493e-05} +{"train_loss": 0.0024212109856307507, "global_step": 31633, "epoch": 265, "lr": 5.950395874954435e-05} +{"train_loss": 0.004406788852065802, "global_step": 31634, "epoch": 265, "lr": 5.9501783622063755e-05} +{"train_loss": 0.0030006999149918556, "global_step": 31635, "epoch": 265, "lr": 5.949960847592743e-05} +{"train_loss": 0.0027241481002420187, "global_step": 31636, "epoch": 265, "lr": 5.949743331113964e-05} +{"train_loss": 0.0029606884345412254, "global_step": 31637, "epoch": 265, "lr": 5.9495258127704655e-05} +{"train_loss": 0.003632407868281007, "global_step": 31638, "epoch": 265, "lr": 5.949308292562674e-05} +{"train_loss": 0.0038411871064454317, "global_step": 31639, "epoch": 265, "lr": 5.949090770491018e-05} +{"train_loss": 0.003759316634386778, "global_step": 31640, "epoch": 265, "lr": 5.9488732465559224e-05} +{"train_loss": 0.003273341339081526, "global_step": 31641, "epoch": 265, "lr": 5.9486557207578166e-05} +{"train_loss": 0.0031664238777011633, "global_step": 31642, "epoch": 265, "lr": 5.948438193097128e-05} +{"train_loss": 0.0037973029538989067, "global_step": 31643, "epoch": 265, "lr": 5.94822066357428e-05} +{"train_loss": 0.0038339707534760237, "global_step": 31644, "epoch": 265, "lr": 5.948003132189702e-05} +{"train_loss": 0.003561274381354451, "global_step": 31645, "epoch": 265, "lr": 5.9477855989438226e-05} +{"train_loss": 0.0025981981307268143, "global_step": 31646, "epoch": 265, "lr": 5.947568063837066e-05} +{"train_loss": 0.002351605100557208, "global_step": 31647, "epoch": 265, "lr": 5.9473505268698617e-05} +{"train_loss": 0.0020304564386606216, "global_step": 31648, "epoch": 265, "lr": 5.947132988042636e-05} +{"train_loss": 0.004529300611466169, "global_step": 31649, "epoch": 265, "lr": 5.946915447355814e-05} +{"train_loss": 0.0020656276028603315, "global_step": 31650, "epoch": 265, "lr": 5.946697904809827e-05} +{"train_loss": 0.004326989408582449, "global_step": 31651, "epoch": 265, "lr": 5.946480360405099e-05} +{"train_loss": 0.004731880966573954, "global_step": 31652, "epoch": 265, "lr": 5.946262814142057e-05} +{"train_loss": 0.002872858285520445, "global_step": 31653, "epoch": 265, "lr": 5.94604526602113e-05, "val_loss": 0.013728861697018147, "train_action_mse_error": 5.393843093770556e-05} +{"train_loss": 0.002912146272137761, "global_step": 31654, "epoch": 266, "lr": 5.945827716042745e-05} +{"train_loss": 0.0026836812030524015, "global_step": 31655, "epoch": 266, "lr": 5.945610164207327e-05} +{"train_loss": 0.0036843593697994947, "global_step": 31656, "epoch": 266, "lr": 5.9453926105153057e-05} +{"train_loss": 0.0028259200043976307, "global_step": 31657, "epoch": 266, "lr": 5.945175054967106e-05} +{"train_loss": 0.0014830015134066343, "global_step": 31658, "epoch": 266, "lr": 5.944957497563156e-05} +{"train_loss": 0.002399466000497341, "global_step": 31659, "epoch": 266, "lr": 5.944739938303883e-05} +{"train_loss": 0.003359057242050767, "global_step": 31660, "epoch": 266, "lr": 5.944522377189714e-05} +{"train_loss": 0.002932860516011715, "global_step": 31661, "epoch": 266, "lr": 5.944304814221078e-05} +{"train_loss": 0.002765725366771221, "global_step": 31662, "epoch": 266, "lr": 5.9440872493983976e-05} +{"train_loss": 0.0033554499968886375, "global_step": 31663, "epoch": 266, "lr": 5.943869682722104e-05} +{"train_loss": 0.0022747970651835203, "global_step": 31664, "epoch": 266, "lr": 5.9436521141926235e-05} +{"train_loss": 0.00266872625797987, "global_step": 31665, "epoch": 266, "lr": 5.943434543810382e-05} +{"train_loss": 0.003137378254905343, "global_step": 31666, "epoch": 266, "lr": 5.943216971575808e-05} +{"train_loss": 0.002759997034445405, "global_step": 31667, "epoch": 266, "lr": 5.942999397489328e-05} +{"train_loss": 0.0022497326135635376, "global_step": 31668, "epoch": 266, "lr": 5.94278182155137e-05} +{"train_loss": 0.002434826921671629, "global_step": 31669, "epoch": 266, "lr": 5.9425642437623595e-05} +{"train_loss": 0.002977905562147498, "global_step": 31670, "epoch": 266, "lr": 5.942346664122726e-05} +{"train_loss": 0.0023824875243008137, "global_step": 31671, "epoch": 266, "lr": 5.942129082632895e-05} +{"train_loss": 0.0037924207281321287, "global_step": 31672, "epoch": 266, "lr": 5.941911499293294e-05} +{"train_loss": 0.002427330007776618, "global_step": 31673, "epoch": 266, "lr": 5.941693914104351e-05} +{"train_loss": 0.004863842390477657, "global_step": 31674, "epoch": 266, "lr": 5.941476327066493e-05} +{"train_loss": 0.0036093397065997124, "global_step": 31675, "epoch": 266, "lr": 5.941258738180147e-05} +{"train_loss": 0.0029220380820333958, "global_step": 31676, "epoch": 266, "lr": 5.941041147445738e-05} +{"train_loss": 0.003594868117943406, "global_step": 31677, "epoch": 266, "lr": 5.940823554863697e-05} +{"train_loss": 0.0015525356866419315, "global_step": 31678, "epoch": 266, "lr": 5.940605960434449e-05} +{"train_loss": 0.002641533501446247, "global_step": 31679, "epoch": 266, "lr": 5.9403883641584214e-05} +{"train_loss": 0.0026135232765227556, "global_step": 31680, "epoch": 266, "lr": 5.9401707660360414e-05} +{"train_loss": 0.0029945385176688433, "global_step": 31681, "epoch": 266, "lr": 5.9399531660677375e-05} +{"train_loss": 0.0038260750006884336, "global_step": 31682, "epoch": 266, "lr": 5.939735564253935e-05} +{"train_loss": 0.0036792480386793613, "global_step": 31683, "epoch": 266, "lr": 5.939517960595063e-05} +{"train_loss": 0.002488547470420599, "global_step": 31684, "epoch": 266, "lr": 5.939300355091546e-05} +{"train_loss": 0.004014093428850174, "global_step": 31685, "epoch": 266, "lr": 5.939082747743815e-05} +{"train_loss": 0.004650450311601162, "global_step": 31686, "epoch": 266, "lr": 5.938865138552296e-05} +{"train_loss": 0.003810608759522438, "global_step": 31687, "epoch": 266, "lr": 5.9386475275174146e-05} +{"train_loss": 0.0040699802339077, "global_step": 31688, "epoch": 266, "lr": 5.938429914639598e-05} +{"train_loss": 0.002445109188556671, "global_step": 31689, "epoch": 266, "lr": 5.9382122999192755e-05} +{"train_loss": 0.0026121747214347124, "global_step": 31690, "epoch": 266, "lr": 5.937994683356873e-05} +{"train_loss": 0.0031705733854323626, "global_step": 31691, "epoch": 266, "lr": 5.9377770649528185e-05} +{"train_loss": 0.0037492255214601755, "global_step": 31692, "epoch": 266, "lr": 5.937559444707541e-05} +{"train_loss": 0.0033198015298694372, "global_step": 31693, "epoch": 266, "lr": 5.937341822621463e-05} +{"train_loss": 0.0018250384600833058, "global_step": 31694, "epoch": 266, "lr": 5.9371241986950156e-05} +{"train_loss": 0.00222626980394125, "global_step": 31695, "epoch": 266, "lr": 5.9369065729286245e-05} +{"train_loss": 0.003482427913695574, "global_step": 31696, "epoch": 266, "lr": 5.936688945322717e-05} +{"train_loss": 0.0022272090427577496, "global_step": 31697, "epoch": 266, "lr": 5.936471315877721e-05} +{"train_loss": 0.0038870912976562977, "global_step": 31698, "epoch": 266, "lr": 5.936253684594064e-05} +{"train_loss": 0.0020370855927467346, "global_step": 31699, "epoch": 266, "lr": 5.936036051472173e-05} +{"train_loss": 0.002227849792689085, "global_step": 31700, "epoch": 266, "lr": 5.935818416512474e-05} +{"train_loss": 0.0013684005243703723, "global_step": 31701, "epoch": 266, "lr": 5.935600779715397e-05} +{"train_loss": 0.0017544003203511238, "global_step": 31702, "epoch": 266, "lr": 5.935383141081366e-05} +{"train_loss": 0.0019242452690377831, "global_step": 31703, "epoch": 266, "lr": 5.935165500610812e-05} +{"train_loss": 0.004171761218458414, "global_step": 31704, "epoch": 266, "lr": 5.9349478583041595e-05} +{"train_loss": 0.0034733135253190994, "global_step": 31705, "epoch": 266, "lr": 5.9347302141618385e-05} +{"train_loss": 0.002733994973823428, "global_step": 31706, "epoch": 266, "lr": 5.934512568184273e-05} +{"train_loss": 0.0024520792067050934, "global_step": 31707, "epoch": 266, "lr": 5.934294920371892e-05} +{"train_loss": 0.0021520720329135656, "global_step": 31708, "epoch": 266, "lr": 5.934077270725122e-05} +{"train_loss": 0.0035017533227801323, "global_step": 31709, "epoch": 266, "lr": 5.933859619244393e-05} +{"train_loss": 0.0030872193165123463, "global_step": 31710, "epoch": 266, "lr": 5.933641965930129e-05} +{"train_loss": 0.0018771161558106542, "global_step": 31711, "epoch": 266, "lr": 5.93342431078276e-05} +{"train_loss": 0.0025901661720126867, "global_step": 31712, "epoch": 266, "lr": 5.933206653802712e-05} +{"train_loss": 0.0021519153378903866, "global_step": 31713, "epoch": 266, "lr": 5.93298899499041e-05} +{"train_loss": 0.0036633717827498913, "global_step": 31714, "epoch": 266, "lr": 5.932771334346287e-05} +{"train_loss": 0.0018335735658183694, "global_step": 31715, "epoch": 266, "lr": 5.9325536718707644e-05} +{"train_loss": 0.002777271205559373, "global_step": 31716, "epoch": 266, "lr": 5.9323360075642745e-05} +{"train_loss": 0.0021830867044627666, "global_step": 31717, "epoch": 266, "lr": 5.932118341427241e-05} +{"train_loss": 0.0017358207842335105, "global_step": 31718, "epoch": 266, "lr": 5.931900673460093e-05} +{"train_loss": 0.0019783650059252977, "global_step": 31719, "epoch": 266, "lr": 5.931683003663258e-05} +{"train_loss": 0.0017123414436355233, "global_step": 31720, "epoch": 266, "lr": 5.931465332037161e-05} +{"train_loss": 0.0023350242991000414, "global_step": 31721, "epoch": 266, "lr": 5.931247658582233e-05} +{"train_loss": 0.0043465252965688705, "global_step": 31722, "epoch": 266, "lr": 5.9310299832989e-05} +{"train_loss": 0.0035466249100863934, "global_step": 31723, "epoch": 266, "lr": 5.93081230618759e-05} +{"train_loss": 0.0024347701109945774, "global_step": 31724, "epoch": 266, "lr": 5.930594627248728e-05} +{"train_loss": 0.003136524697765708, "global_step": 31725, "epoch": 266, "lr": 5.930376946482743e-05} +{"train_loss": 0.0028605463448911905, "global_step": 31726, "epoch": 266, "lr": 5.930159263890063e-05} +{"train_loss": 0.0014237057184800506, "global_step": 31727, "epoch": 266, "lr": 5.929941579471113e-05} +{"train_loss": 0.001712846220470965, "global_step": 31728, "epoch": 266, "lr": 5.9297238932263235e-05} +{"train_loss": 0.0016998584615066648, "global_step": 31729, "epoch": 266, "lr": 5.92950620515612e-05} +{"train_loss": 0.0038624382577836514, "global_step": 31730, "epoch": 266, "lr": 5.929288515260931e-05} +{"train_loss": 0.0028415503911674023, "global_step": 31731, "epoch": 266, "lr": 5.929070823541183e-05} +{"train_loss": 0.0014261489268392324, "global_step": 31732, "epoch": 266, "lr": 5.928853129997304e-05} +{"train_loss": 0.0019845229107886553, "global_step": 31733, "epoch": 266, "lr": 5.928635434629719e-05} +{"train_loss": 0.0016635024221614003, "global_step": 31734, "epoch": 266, "lr": 5.9284177374388584e-05} +{"train_loss": 0.002506172051653266, "global_step": 31735, "epoch": 266, "lr": 5.92820003842515e-05} +{"train_loss": 0.001916369772516191, "global_step": 31736, "epoch": 266, "lr": 5.92798233758902e-05} +{"train_loss": 0.0028249931056052446, "global_step": 31737, "epoch": 266, "lr": 5.9277646349308956e-05} +{"train_loss": 0.0020373063161969185, "global_step": 31738, "epoch": 266, "lr": 5.9275469304512045e-05} +{"train_loss": 0.003269432345405221, "global_step": 31739, "epoch": 266, "lr": 5.927329224150373e-05} +{"train_loss": 0.002200937597081065, "global_step": 31740, "epoch": 266, "lr": 5.9271115160288304e-05} +{"train_loss": 0.0011666456703096628, "global_step": 31741, "epoch": 266, "lr": 5.9268938060870025e-05} +{"train_loss": 0.0033182695042341948, "global_step": 31742, "epoch": 266, "lr": 5.92667609432532e-05} +{"train_loss": 0.002594863763079047, "global_step": 31743, "epoch": 266, "lr": 5.926458380744207e-05} +{"train_loss": 0.0030233494471758604, "global_step": 31744, "epoch": 266, "lr": 5.9262406653440904e-05} +{"train_loss": 0.0030435724183917046, "global_step": 31745, "epoch": 266, "lr": 5.9260229481254005e-05} +{"train_loss": 0.0024258517660200596, "global_step": 31746, "epoch": 266, "lr": 5.925805229088563e-05} +{"train_loss": 0.0035315235145390034, "global_step": 31747, "epoch": 266, "lr": 5.925587508234006e-05} +{"train_loss": 0.002933592302724719, "global_step": 31748, "epoch": 266, "lr": 5.925369785562157e-05} +{"train_loss": 0.0023768700193613768, "global_step": 31749, "epoch": 266, "lr": 5.9251520610734426e-05} +{"train_loss": 0.0029219554271548986, "global_step": 31750, "epoch": 266, "lr": 5.9249343347682915e-05} +{"train_loss": 0.0016218518139794469, "global_step": 31751, "epoch": 266, "lr": 5.92471660664713e-05} +{"train_loss": 0.0021016253158450127, "global_step": 31752, "epoch": 266, "lr": 5.924498876710387e-05} +{"train_loss": 0.0031380681321024895, "global_step": 31753, "epoch": 266, "lr": 5.9242811449584886e-05} +{"train_loss": 0.0023859539069235325, "global_step": 31754, "epoch": 266, "lr": 5.9240634113918636e-05} +{"train_loss": 0.0038846146780997515, "global_step": 31755, "epoch": 266, "lr": 5.9238456760109395e-05} +{"train_loss": 0.0029059117659926414, "global_step": 31756, "epoch": 266, "lr": 5.923627938816143e-05} +{"train_loss": 0.002261195331811905, "global_step": 31757, "epoch": 266, "lr": 5.9234101998079005e-05} +{"train_loss": 0.002518529538065195, "global_step": 31758, "epoch": 266, "lr": 5.92319245898664e-05} +{"train_loss": 0.002953835530206561, "global_step": 31759, "epoch": 266, "lr": 5.922974716352792e-05} +{"train_loss": 0.0045555406250059605, "global_step": 31760, "epoch": 266, "lr": 5.92275697190678e-05} +{"train_loss": 0.0025871461257338524, "global_step": 31761, "epoch": 266, "lr": 5.9225392256490354e-05} +{"train_loss": 0.0016584205441176891, "global_step": 31762, "epoch": 266, "lr": 5.922321477579982e-05} +{"train_loss": 0.002880348823964596, "global_step": 31763, "epoch": 266, "lr": 5.922103727700049e-05} +{"train_loss": 0.002733484609052539, "global_step": 31764, "epoch": 266, "lr": 5.9218859760096634e-05} +{"train_loss": 0.0038296901620924473, "global_step": 31765, "epoch": 266, "lr": 5.921668222509254e-05} +{"train_loss": 0.0031869064550846815, "global_step": 31766, "epoch": 266, "lr": 5.921450467199247e-05} +{"train_loss": 0.001967725809663534, "global_step": 31767, "epoch": 266, "lr": 5.9212327100800705e-05} +{"train_loss": 0.0036192687693983316, "global_step": 31768, "epoch": 266, "lr": 5.9210149511521514e-05} +{"train_loss": 0.0026319788303226233, "global_step": 31769, "epoch": 266, "lr": 5.920797190415919e-05} +{"train_loss": 0.003813748015090823, "global_step": 31770, "epoch": 266, "lr": 5.9205794278718e-05} +{"train_loss": 0.0040381369180977345, "global_step": 31771, "epoch": 266, "lr": 5.92036166352022e-05} +{"train_loss": 0.002778359063697525, "global_step": 31772, "epoch": 266, "lr": 5.920143897361609e-05, "val_loss": 0.0235997773706913} +{"train_loss": 0.002757875481620431, "global_step": 31773, "epoch": 267, "lr": 5.919926129396394e-05} +{"train_loss": 0.0033373653423041105, "global_step": 31774, "epoch": 267, "lr": 5.919708359625002e-05} +{"train_loss": 0.0017207944765686989, "global_step": 31775, "epoch": 267, "lr": 5.919490588047861e-05} +{"train_loss": 0.004768218379467726, "global_step": 31776, "epoch": 267, "lr": 5.9192728146654e-05} +{"train_loss": 0.0022251801565289497, "global_step": 31777, "epoch": 267, "lr": 5.919055039478043e-05} +{"train_loss": 0.001729561248794198, "global_step": 31778, "epoch": 267, "lr": 5.9188372624862196e-05} +{"train_loss": 0.002818875480443239, "global_step": 31779, "epoch": 267, "lr": 5.9186194836903575e-05} +{"train_loss": 0.0034566842950880527, "global_step": 31780, "epoch": 267, "lr": 5.918401703090886e-05} +{"train_loss": 0.0030234798323363066, "global_step": 31781, "epoch": 267, "lr": 5.9181839206882285e-05} +{"train_loss": 0.0032779902685433626, "global_step": 31782, "epoch": 267, "lr": 5.9179661364828155e-05} +{"train_loss": 0.0026202937588095665, "global_step": 31783, "epoch": 267, "lr": 5.9177483504750756e-05} +{"train_loss": 0.004033670760691166, "global_step": 31784, "epoch": 267, "lr": 5.917530562665433e-05} +{"train_loss": 0.0037226988933980465, "global_step": 31785, "epoch": 267, "lr": 5.9173127730543174e-05} +{"train_loss": 0.0026574707590043545, "global_step": 31786, "epoch": 267, "lr": 5.9170949816421583e-05} +{"train_loss": 0.0018628464313223958, "global_step": 31787, "epoch": 267, "lr": 5.9168771884293794e-05} +{"train_loss": 0.00345088099129498, "global_step": 31788, "epoch": 267, "lr": 5.916659393416411e-05} +{"train_loss": 0.0027546712663024664, "global_step": 31789, "epoch": 267, "lr": 5.916441596603678e-05} +{"train_loss": 0.0032717694994062185, "global_step": 31790, "epoch": 267, "lr": 5.9162237979916115e-05} +{"train_loss": 0.0015912106027826667, "global_step": 31791, "epoch": 267, "lr": 5.916005997580636e-05} +{"train_loss": 0.0022246073931455612, "global_step": 31792, "epoch": 267, "lr": 5.9157881953711834e-05} +{"train_loss": 0.0032090875320136547, "global_step": 31793, "epoch": 267, "lr": 5.915570391363676e-05} +{"train_loss": 0.002690366469323635, "global_step": 31794, "epoch": 267, "lr": 5.915352585558544e-05} +{"train_loss": 0.002845236100256443, "global_step": 31795, "epoch": 267, "lr": 5.915134777956216e-05} +{"train_loss": 0.0033012309577316046, "global_step": 31796, "epoch": 267, "lr": 5.914916968557118e-05} +{"train_loss": 0.002666379790753126, "global_step": 31797, "epoch": 267, "lr": 5.914699157361678e-05} +{"train_loss": 0.0033956016413867474, "global_step": 31798, "epoch": 267, "lr": 5.914481344370325e-05} +{"train_loss": 0.0033107022754848003, "global_step": 31799, "epoch": 267, "lr": 5.914263529583485e-05} +{"train_loss": 0.0032565833535045385, "global_step": 31800, "epoch": 267, "lr": 5.914045713001586e-05} +{"train_loss": 0.002594649326056242, "global_step": 31801, "epoch": 267, "lr": 5.913827894625056e-05} +{"train_loss": 0.002844123635441065, "global_step": 31802, "epoch": 267, "lr": 5.913610074454322e-05} +{"train_loss": 0.0028275074437260628, "global_step": 31803, "epoch": 267, "lr": 5.913392252489813e-05} +{"train_loss": 0.002043315675109625, "global_step": 31804, "epoch": 267, "lr": 5.9131744287319554e-05} +{"train_loss": 0.0028858191799372435, "global_step": 31805, "epoch": 267, "lr": 5.912956603181179e-05} +{"train_loss": 0.0027504186145961285, "global_step": 31806, "epoch": 267, "lr": 5.9127387758379094e-05} +{"train_loss": 0.0016650411998853087, "global_step": 31807, "epoch": 267, "lr": 5.9125209467025736e-05} +{"train_loss": 0.0037420785520225763, "global_step": 31808, "epoch": 267, "lr": 5.9123031157756005e-05} +{"train_loss": 0.0028580811340361834, "global_step": 31809, "epoch": 267, "lr": 5.912085283057418e-05} +{"train_loss": 0.0023074629716575146, "global_step": 31810, "epoch": 267, "lr": 5.9118674485484526e-05} +{"train_loss": 0.0027819820679724216, "global_step": 31811, "epoch": 267, "lr": 5.911649612249135e-05} +{"train_loss": 0.002447993727400899, "global_step": 31812, "epoch": 267, "lr": 5.911431774159889e-05} +{"train_loss": 0.002851043827831745, "global_step": 31813, "epoch": 267, "lr": 5.9112139342811445e-05} +{"train_loss": 0.0036532997619360685, "global_step": 31814, "epoch": 267, "lr": 5.910996092613329e-05} +{"train_loss": 0.0019068998517468572, "global_step": 31815, "epoch": 267, "lr": 5.9107782491568694e-05} +{"train_loss": 0.003143229288980365, "global_step": 31816, "epoch": 267, "lr": 5.9105604039121954e-05} +{"train_loss": 0.0018416706006973982, "global_step": 31817, "epoch": 267, "lr": 5.9103425568797324e-05} +{"train_loss": 0.003374743275344372, "global_step": 31818, "epoch": 267, "lr": 5.9101247080599086e-05} +{"train_loss": 0.0031365700997412205, "global_step": 31819, "epoch": 267, "lr": 5.909906857453152e-05} +{"train_loss": 0.0023885273840278387, "global_step": 31820, "epoch": 267, "lr": 5.909689005059891e-05} +{"train_loss": 0.0019522691145539284, "global_step": 31821, "epoch": 267, "lr": 5.9094711508805534e-05} +{"train_loss": 0.004021996166557074, "global_step": 31822, "epoch": 267, "lr": 5.9092532949155655e-05} +{"train_loss": 0.00291953282430768, "global_step": 31823, "epoch": 267, "lr": 5.9090354371653554e-05} +{"train_loss": 0.0023266626521945, "global_step": 31824, "epoch": 267, "lr": 5.9088175776303534e-05} +{"train_loss": 0.0025271752383559942, "global_step": 31825, "epoch": 267, "lr": 5.908599716310984e-05} +{"train_loss": 0.0026827428955584764, "global_step": 31826, "epoch": 267, "lr": 5.9083818532076764e-05} +{"train_loss": 0.004802023991942406, "global_step": 31827, "epoch": 267, "lr": 5.908163988320857e-05} +{"train_loss": 0.0019224811112508178, "global_step": 31828, "epoch": 267, "lr": 5.907946121650956e-05} +{"train_loss": 0.0027442362625151873, "global_step": 31829, "epoch": 267, "lr": 5.907728253198399e-05} +{"train_loss": 0.002417254028841853, "global_step": 31830, "epoch": 267, "lr": 5.9075103829636145e-05} +{"train_loss": 0.0016197303775697947, "global_step": 31831, "epoch": 267, "lr": 5.907292510947031e-05} +{"train_loss": 0.0017492553452029824, "global_step": 31832, "epoch": 267, "lr": 5.907074637149075e-05} +{"train_loss": 0.002947465516626835, "global_step": 31833, "epoch": 267, "lr": 5.906856761570174e-05} +{"train_loss": 0.003014487447217107, "global_step": 31834, "epoch": 267, "lr": 5.906638884210758e-05} +{"train_loss": 0.003737748134881258, "global_step": 31835, "epoch": 267, "lr": 5.906421005071253e-05} +{"train_loss": 0.002823461778461933, "global_step": 31836, "epoch": 267, "lr": 5.906203124152089e-05} +{"train_loss": 0.0029238038696348667, "global_step": 31837, "epoch": 267, "lr": 5.9059852414536897e-05} +{"train_loss": 0.0033125930931419134, "global_step": 31838, "epoch": 267, "lr": 5.905767356976486e-05} +{"train_loss": 0.0018406242597848177, "global_step": 31839, "epoch": 267, "lr": 5.905549470720904e-05} +{"train_loss": 0.0015518361469730735, "global_step": 31840, "epoch": 267, "lr": 5.9053315826873726e-05} +{"train_loss": 0.003145543159916997, "global_step": 31841, "epoch": 267, "lr": 5.90511369287632e-05} +{"train_loss": 0.003240845864638686, "global_step": 31842, "epoch": 267, "lr": 5.904895801288174e-05} +{"train_loss": 0.002901428611949086, "global_step": 31843, "epoch": 267, "lr": 5.9046779079233604e-05} +{"train_loss": 0.0028974462766200304, "global_step": 31844, "epoch": 267, "lr": 5.904460012782309e-05} +{"train_loss": 0.0013007844099774957, "global_step": 31845, "epoch": 267, "lr": 5.904242115865446e-05} +{"train_loss": 0.002547549782320857, "global_step": 31846, "epoch": 267, "lr": 5.904024217173202e-05} +{"train_loss": 0.0021388321183621883, "global_step": 31847, "epoch": 267, "lr": 5.903806316706001e-05} +{"train_loss": 0.0025189195293933153, "global_step": 31848, "epoch": 267, "lr": 5.903588414464274e-05} +{"train_loss": 0.002800466027110815, "global_step": 31849, "epoch": 267, "lr": 5.903370510448447e-05} +{"train_loss": 0.002200379967689514, "global_step": 31850, "epoch": 267, "lr": 5.903152604658949e-05} +{"train_loss": 0.0029000909999012947, "global_step": 31851, "epoch": 267, "lr": 5.9029346970962073e-05} +{"train_loss": 0.005362058989703655, "global_step": 31852, "epoch": 267, "lr": 5.9027167877606506e-05} +{"train_loss": 0.0023888815194368362, "global_step": 31853, "epoch": 267, "lr": 5.9024988766527045e-05} +{"train_loss": 0.0015308576403185725, "global_step": 31854, "epoch": 267, "lr": 5.9022809637727994e-05} +{"train_loss": 0.002793410327285528, "global_step": 31855, "epoch": 267, "lr": 5.902063049121362e-05} +{"train_loss": 0.0032975838985294104, "global_step": 31856, "epoch": 267, "lr": 5.90184513269882e-05} +{"train_loss": 0.002639409387484193, "global_step": 31857, "epoch": 267, "lr": 5.9016272145056015e-05} +{"train_loss": 0.0016880497569218278, "global_step": 31858, "epoch": 267, "lr": 5.901409294542134e-05} +{"train_loss": 0.0023515261709690094, "global_step": 31859, "epoch": 267, "lr": 5.901191372808845e-05} +{"train_loss": 0.003104167291894555, "global_step": 31860, "epoch": 267, "lr": 5.9009734493061644e-05} +{"train_loss": 0.0026098613161593676, "global_step": 31861, "epoch": 267, "lr": 5.900755524034519e-05} +{"train_loss": 0.0029372673016041517, "global_step": 31862, "epoch": 267, "lr": 5.900537596994336e-05} +{"train_loss": 0.003370187245309353, "global_step": 31863, "epoch": 267, "lr": 5.900319668186042e-05} +{"train_loss": 0.0010747286723926663, "global_step": 31864, "epoch": 267, "lr": 5.900101737610067e-05} +{"train_loss": 0.0028366122860461473, "global_step": 31865, "epoch": 267, "lr": 5.899883805266838e-05} +{"train_loss": 0.0021049496717751026, "global_step": 31866, "epoch": 267, "lr": 5.8996658711567844e-05} +{"train_loss": 0.0021415946539491415, "global_step": 31867, "epoch": 267, "lr": 5.8994479352803326e-05} +{"train_loss": 0.003175800433382392, "global_step": 31868, "epoch": 267, "lr": 5.899229997637912e-05} +{"train_loss": 0.0038085717242211103, "global_step": 31869, "epoch": 267, "lr": 5.899012058229948e-05} +{"train_loss": 0.0020833557937294245, "global_step": 31870, "epoch": 267, "lr": 5.898794117056871e-05} +{"train_loss": 0.0016410569660365582, "global_step": 31871, "epoch": 267, "lr": 5.898576174119106e-05} +{"train_loss": 0.002499951981008053, "global_step": 31872, "epoch": 267, "lr": 5.8983582294170836e-05} +{"train_loss": 0.0024361182004213333, "global_step": 31873, "epoch": 267, "lr": 5.898140282951231e-05} +{"train_loss": 0.0024703913368284702, "global_step": 31874, "epoch": 267, "lr": 5.8979223347219766e-05} +{"train_loss": 0.0021259731147438288, "global_step": 31875, "epoch": 267, "lr": 5.897704384729748e-05} +{"train_loss": 0.0014662750763818622, "global_step": 31876, "epoch": 267, "lr": 5.89748643297497e-05} +{"train_loss": 0.0019443286582827568, "global_step": 31877, "epoch": 267, "lr": 5.897268479458076e-05} +{"train_loss": 0.001933719264343381, "global_step": 31878, "epoch": 267, "lr": 5.8970505241794893e-05} +{"train_loss": 0.0018513821996748447, "global_step": 31879, "epoch": 267, "lr": 5.896832567139641e-05} +{"train_loss": 0.002153910230845213, "global_step": 31880, "epoch": 267, "lr": 5.8966146083389564e-05} +{"train_loss": 0.003123906208202243, "global_step": 31881, "epoch": 267, "lr": 5.896396647777865e-05} +{"train_loss": 0.00315591087564826, "global_step": 31882, "epoch": 267, "lr": 5.896178685456796e-05} +{"train_loss": 0.0038337651640176773, "global_step": 31883, "epoch": 267, "lr": 5.895960721376175e-05} +{"train_loss": 0.002484898781403899, "global_step": 31884, "epoch": 267, "lr": 5.895742755536431e-05} +{"train_loss": 0.002783402567729354, "global_step": 31885, "epoch": 267, "lr": 5.895524787937992e-05} +{"train_loss": 0.0027491801884025335, "global_step": 31886, "epoch": 267, "lr": 5.8953068185812854e-05} +{"train_loss": 0.00281629734672606, "global_step": 31887, "epoch": 267, "lr": 5.8950888474667396e-05} +{"train_loss": 0.00422712555155158, "global_step": 31888, "epoch": 267, "lr": 5.894870874594782e-05} +{"train_loss": 0.002321353182196617, "global_step": 31889, "epoch": 267, "lr": 5.8946528999658424e-05} +{"train_loss": 0.002394522540271282, "global_step": 31890, "epoch": 267, "lr": 5.894434923580347e-05} +{"train_loss": 0.0027150406596102134, "global_step": 31891, "epoch": 267, "lr": 5.894216945438723e-05, "val_loss": 0.016248777508735657} +{"train_loss": 0.0020974292419850826, "global_step": 31892, "epoch": 268, "lr": 5.8939989655413994e-05} +{"train_loss": 0.0029871193692088127, "global_step": 31893, "epoch": 268, "lr": 5.893780983888807e-05} +{"train_loss": 0.0023717202711850405, "global_step": 31894, "epoch": 268, "lr": 5.893563000481369e-05} +{"train_loss": 0.0027839967515319586, "global_step": 31895, "epoch": 268, "lr": 5.8933450153195155e-05} +{"train_loss": 0.0021557470317929983, "global_step": 31896, "epoch": 268, "lr": 5.893127028403675e-05} +{"train_loss": 0.004508320242166519, "global_step": 31897, "epoch": 268, "lr": 5.8929090397342746e-05} +{"train_loss": 0.003074354026466608, "global_step": 31898, "epoch": 268, "lr": 5.892691049311743e-05} +{"train_loss": 0.002020483370870352, "global_step": 31899, "epoch": 268, "lr": 5.892473057136507e-05} +{"train_loss": 0.002543302718549967, "global_step": 31900, "epoch": 268, "lr": 5.892255063208997e-05} +{"train_loss": 0.001804759493097663, "global_step": 31901, "epoch": 268, "lr": 5.892037067529639e-05} +{"train_loss": 0.0034579152707010508, "global_step": 31902, "epoch": 268, "lr": 5.8918190700988604e-05} +{"train_loss": 0.002482899697497487, "global_step": 31903, "epoch": 268, "lr": 5.891601070917092e-05} +{"train_loss": 0.0023777028545737267, "global_step": 31904, "epoch": 268, "lr": 5.89138306998476e-05} +{"train_loss": 0.0015779029345139861, "global_step": 31905, "epoch": 268, "lr": 5.891165067302292e-05} +{"train_loss": 0.004445419646799564, "global_step": 31906, "epoch": 268, "lr": 5.8909470628701166e-05} +{"train_loss": 0.0022355292458087206, "global_step": 31907, "epoch": 268, "lr": 5.890729056688662e-05} +{"train_loss": 0.0028874040581285954, "global_step": 31908, "epoch": 268, "lr": 5.890511048758356e-05} +{"train_loss": 0.0026861161459237337, "global_step": 31909, "epoch": 268, "lr": 5.8902930390796265e-05} +{"train_loss": 0.0023179883137345314, "global_step": 31910, "epoch": 268, "lr": 5.890075027652902e-05} +{"train_loss": 0.003108596196398139, "global_step": 31911, "epoch": 268, "lr": 5.88985701447861e-05} +{"train_loss": 0.0022089662961661816, "global_step": 31912, "epoch": 268, "lr": 5.8896389995571786e-05} +{"train_loss": 0.001317136106081307, "global_step": 31913, "epoch": 268, "lr": 5.889420982889037e-05} +{"train_loss": 0.001574271940626204, "global_step": 31914, "epoch": 268, "lr": 5.889202964474611e-05} +{"train_loss": 0.0026442420203238726, "global_step": 31915, "epoch": 268, "lr": 5.88898494431433e-05} +{"train_loss": 0.003111522179096937, "global_step": 31916, "epoch": 268, "lr": 5.888766922408623e-05} +{"train_loss": 0.0033203831408172846, "global_step": 31917, "epoch": 268, "lr": 5.8885488987579164e-05} +{"train_loss": 0.002224169671535492, "global_step": 31918, "epoch": 268, "lr": 5.888330873362641e-05} +{"train_loss": 0.004011792596429586, "global_step": 31919, "epoch": 268, "lr": 5.8881128462232206e-05} +{"train_loss": 0.0025195449125021696, "global_step": 31920, "epoch": 268, "lr": 5.887894817340086e-05} +{"train_loss": 0.0043054018169641495, "global_step": 31921, "epoch": 268, "lr": 5.887676786713665e-05} +{"train_loss": 0.001781001454219222, "global_step": 31922, "epoch": 268, "lr": 5.887458754344385e-05} +{"train_loss": 0.0018201111815869808, "global_step": 31923, "epoch": 268, "lr": 5.887240720232675e-05} +{"train_loss": 0.0020414323080331087, "global_step": 31924, "epoch": 268, "lr": 5.887022684378963e-05} +{"train_loss": 0.003492441726848483, "global_step": 31925, "epoch": 268, "lr": 5.8868046467836766e-05} +{"train_loss": 0.0016590935410931706, "global_step": 31926, "epoch": 268, "lr": 5.886586607447243e-05} +{"train_loss": 0.0030117023270577192, "global_step": 31927, "epoch": 268, "lr": 5.886368566370093e-05} +{"train_loss": 0.0022386249620467424, "global_step": 31928, "epoch": 268, "lr": 5.8861505235526516e-05} +{"train_loss": 0.001737038022838533, "global_step": 31929, "epoch": 268, "lr": 5.8859324789953484e-05} +{"train_loss": 0.002763953758403659, "global_step": 31930, "epoch": 268, "lr": 5.8857144326986115e-05} +{"train_loss": 0.0035724560730159283, "global_step": 31931, "epoch": 268, "lr": 5.88549638466287e-05} +{"train_loss": 0.0014063550624996424, "global_step": 31932, "epoch": 268, "lr": 5.8852783348885485e-05} +{"train_loss": 0.0024535362608730793, "global_step": 31933, "epoch": 268, "lr": 5.88506028337608e-05} +{"train_loss": 0.0034384543541818857, "global_step": 31934, "epoch": 268, "lr": 5.8848422301258886e-05} +{"train_loss": 0.00428161583840847, "global_step": 31935, "epoch": 268, "lr": 5.884624175138406e-05} +{"train_loss": 0.0036422202829271555, "global_step": 31936, "epoch": 268, "lr": 5.884406118414057e-05} +{"train_loss": 0.0021777001675218344, "global_step": 31937, "epoch": 268, "lr": 5.884188059953272e-05} +{"train_loss": 0.0029613529331982136, "global_step": 31938, "epoch": 268, "lr": 5.8839699997564765e-05} +{"train_loss": 0.0014370287535712123, "global_step": 31939, "epoch": 268, "lr": 5.883751937824101e-05} +{"train_loss": 0.004472799599170685, "global_step": 31940, "epoch": 268, "lr": 5.883533874156574e-05} +{"train_loss": 0.002482996555045247, "global_step": 31941, "epoch": 268, "lr": 5.8833158087543216e-05} +{"train_loss": 0.002022966742515564, "global_step": 31942, "epoch": 268, "lr": 5.8830977416177736e-05} +{"train_loss": 0.0023463470861315727, "global_step": 31943, "epoch": 268, "lr": 5.882879672747358e-05} +{"train_loss": 0.002952398033812642, "global_step": 31944, "epoch": 268, "lr": 5.882661602143501e-05} +{"train_loss": 0.0025296928361058235, "global_step": 31945, "epoch": 268, "lr": 5.8824435298066335e-05} +{"train_loss": 0.004679626785218716, "global_step": 31946, "epoch": 268, "lr": 5.882225455737181e-05} +{"train_loss": 0.0019417935982346535, "global_step": 31947, "epoch": 268, "lr": 5.882007379935575e-05} +{"train_loss": 0.002655621850863099, "global_step": 31948, "epoch": 268, "lr": 5.8817893024022395e-05} +{"train_loss": 0.002435065805912018, "global_step": 31949, "epoch": 268, "lr": 5.881571223137606e-05} +{"train_loss": 0.002316885394975543, "global_step": 31950, "epoch": 268, "lr": 5.881353142142102e-05} +{"train_loss": 0.0021659699268639088, "global_step": 31951, "epoch": 268, "lr": 5.8811350594161555e-05} +{"train_loss": 0.0019780145958065987, "global_step": 31952, "epoch": 268, "lr": 5.880916974960193e-05} +{"train_loss": 0.003791634226217866, "global_step": 31953, "epoch": 268, "lr": 5.880698888774645e-05} +{"train_loss": 0.001455312711186707, "global_step": 31954, "epoch": 268, "lr": 5.880480800859939e-05} +{"train_loss": 0.00224948744289577, "global_step": 31955, "epoch": 268, "lr": 5.880262711216503e-05} +{"train_loss": 0.002700260141864419, "global_step": 31956, "epoch": 268, "lr": 5.8800446198447656e-05} +{"train_loss": 0.001869034138508141, "global_step": 31957, "epoch": 268, "lr": 5.8798265267451534e-05} +{"train_loss": 0.0013117126654833555, "global_step": 31958, "epoch": 268, "lr": 5.879608431918097e-05} +{"train_loss": 0.0024997564032673836, "global_step": 31959, "epoch": 268, "lr": 5.879390335364022e-05} +{"train_loss": 0.0014934965874999762, "global_step": 31960, "epoch": 268, "lr": 5.879172237083359e-05} +{"train_loss": 0.0029840257484465837, "global_step": 31961, "epoch": 268, "lr": 5.878954137076536e-05} +{"train_loss": 0.0028577109333127737, "global_step": 31962, "epoch": 268, "lr": 5.87873603534398e-05} +{"train_loss": 0.003127629403024912, "global_step": 31963, "epoch": 268, "lr": 5.8785179318861186e-05} +{"train_loss": 0.002225319854915142, "global_step": 31964, "epoch": 268, "lr": 5.878299826703381e-05} +{"train_loss": 0.0031675409991294146, "global_step": 31965, "epoch": 268, "lr": 5.878081719796196e-05} +{"train_loss": 0.0020758917089551687, "global_step": 31966, "epoch": 268, "lr": 5.877863611164991e-05} +{"train_loss": 0.002846892224624753, "global_step": 31967, "epoch": 268, "lr": 5.877645500810196e-05} +{"train_loss": 0.001045048120431602, "global_step": 31968, "epoch": 268, "lr": 5.877427388732237e-05} +{"train_loss": 0.002186803612858057, "global_step": 31969, "epoch": 268, "lr": 5.8772092749315436e-05} +{"train_loss": 0.004650192800909281, "global_step": 31970, "epoch": 268, "lr": 5.876991159408543e-05} +{"train_loss": 0.001470042741857469, "global_step": 31971, "epoch": 268, "lr": 5.8767730421636635e-05} +{"train_loss": 0.003300637938082218, "global_step": 31972, "epoch": 268, "lr": 5.876554923197335e-05} +{"train_loss": 0.0021972879767417908, "global_step": 31973, "epoch": 268, "lr": 5.876336802509983e-05} +{"train_loss": 0.00195000518579036, "global_step": 31974, "epoch": 268, "lr": 5.8761186801020394e-05} +{"train_loss": 0.0034572819713503122, "global_step": 31975, "epoch": 268, "lr": 5.875900555973929e-05} +{"train_loss": 0.0022971786092966795, "global_step": 31976, "epoch": 268, "lr": 5.875682430126082e-05} +{"train_loss": 0.0032711189705878496, "global_step": 31977, "epoch": 268, "lr": 5.875464302558925e-05} +{"train_loss": 0.0015180191257968545, "global_step": 31978, "epoch": 268, "lr": 5.8752461732728884e-05} +{"train_loss": 0.0022992135491222143, "global_step": 31979, "epoch": 268, "lr": 5.875028042268398e-05} +{"train_loss": 0.002915159100666642, "global_step": 31980, "epoch": 268, "lr": 5.874809909545884e-05} +{"train_loss": 0.002775746863335371, "global_step": 31981, "epoch": 268, "lr": 5.8745917751057754e-05} +{"train_loss": 0.0017284986097365618, "global_step": 31982, "epoch": 268, "lr": 5.8743736389484983e-05} +{"train_loss": 0.002553265541791916, "global_step": 31983, "epoch": 268, "lr": 5.874155501074482e-05} +{"train_loss": 0.0027871213387697935, "global_step": 31984, "epoch": 268, "lr": 5.873937361484155e-05} +{"train_loss": 0.0022959064226597548, "global_step": 31985, "epoch": 268, "lr": 5.873719220177946e-05} +{"train_loss": 0.003703685477375984, "global_step": 31986, "epoch": 268, "lr": 5.873501077156281e-05} +{"train_loss": 0.003632731270045042, "global_step": 31987, "epoch": 268, "lr": 5.8732829324195925e-05} +{"train_loss": 0.003578362287953496, "global_step": 31988, "epoch": 268, "lr": 5.873064785968305e-05} +{"train_loss": 0.0026486427523195744, "global_step": 31989, "epoch": 268, "lr": 5.872846637802848e-05} +{"train_loss": 0.0020197280682623386, "global_step": 31990, "epoch": 268, "lr": 5.872628487923649e-05} +{"train_loss": 0.002044627210125327, "global_step": 31991, "epoch": 268, "lr": 5.8724103363311375e-05} +{"train_loss": 0.0032341531477868557, "global_step": 31992, "epoch": 268, "lr": 5.8721921830257434e-05} +{"train_loss": 0.0027962024323642254, "global_step": 31993, "epoch": 268, "lr": 5.8719740280078914e-05} +{"train_loss": 0.00486407894641161, "global_step": 31994, "epoch": 268, "lr": 5.8717558712780116e-05} +{"train_loss": 0.00316005595959723, "global_step": 31995, "epoch": 268, "lr": 5.871537712836534e-05} +{"train_loss": 0.001989735057577491, "global_step": 31996, "epoch": 268, "lr": 5.8713195526838825e-05} +{"train_loss": 0.0022231321781873703, "global_step": 31997, "epoch": 268, "lr": 5.871101390820489e-05} +{"train_loss": 0.0035631402861326933, "global_step": 31998, "epoch": 268, "lr": 5.870883227246781e-05} +{"train_loss": 0.003440726548433304, "global_step": 31999, "epoch": 268, "lr": 5.870665061963188e-05} +{"train_loss": 0.0015669079730287194, "global_step": 32000, "epoch": 268, "lr": 5.870446894970136e-05} +{"train_loss": 0.0030187773518264294, "global_step": 32001, "epoch": 268, "lr": 5.870228726268054e-05} +{"train_loss": 0.0033190466929227114, "global_step": 32002, "epoch": 268, "lr": 5.8700105558573727e-05} +{"train_loss": 0.0028968967963010073, "global_step": 32003, "epoch": 268, "lr": 5.869792383738517e-05} +{"train_loss": 0.002106666099280119, "global_step": 32004, "epoch": 268, "lr": 5.8695742099119175e-05} +{"train_loss": 0.002054415410384536, "global_step": 32005, "epoch": 268, "lr": 5.869356034378003e-05} +{"train_loss": 0.003049602499231696, "global_step": 32006, "epoch": 268, "lr": 5.8691378571372e-05} +{"train_loss": 0.0030489785131067038, "global_step": 32007, "epoch": 268, "lr": 5.868919678189937e-05} +{"train_loss": 0.0022349096834659576, "global_step": 32008, "epoch": 268, "lr": 5.868701497536644e-05} +{"train_loss": 0.0018674987368285656, "global_step": 32009, "epoch": 268, "lr": 5.868483315177748e-05} +{"train_loss": 0.0026373268298789105, "global_step": 32010, "epoch": 268, "lr": 5.868265131113677e-05, "val_loss": 0.016542095690965652} +{"train_loss": 0.0021472300868481398, "global_step": 32011, "epoch": 269, "lr": 5.86804694534486e-05} +{"train_loss": 0.003762517822906375, "global_step": 32012, "epoch": 269, "lr": 5.867828757871727e-05} +{"train_loss": 0.003664568765088916, "global_step": 32013, "epoch": 269, "lr": 5.8676105686947047e-05} +{"train_loss": 0.0022404175251722336, "global_step": 32014, "epoch": 269, "lr": 5.86739237781422e-05} +{"train_loss": 0.0017119229305535555, "global_step": 32015, "epoch": 269, "lr": 5.867174185230705e-05} +{"train_loss": 0.0014141093706712127, "global_step": 32016, "epoch": 269, "lr": 5.866955990944586e-05} +{"train_loss": 0.00213022087700665, "global_step": 32017, "epoch": 269, "lr": 5.866737794956291e-05} +{"train_loss": 0.003745946567505598, "global_step": 32018, "epoch": 269, "lr": 5.8665195972662504e-05} +{"train_loss": 0.0018008671468123794, "global_step": 32019, "epoch": 269, "lr": 5.8663013978748894e-05} +{"train_loss": 0.0034980764612555504, "global_step": 32020, "epoch": 269, "lr": 5.866083196782638e-05} +{"train_loss": 0.002951602451503277, "global_step": 32021, "epoch": 269, "lr": 5.8658649939899256e-05} +{"train_loss": 0.002593324286863208, "global_step": 32022, "epoch": 269, "lr": 5.8656467894971786e-05} +{"train_loss": 0.001589214545674622, "global_step": 32023, "epoch": 269, "lr": 5.865428583304828e-05} +{"train_loss": 0.0031190672889351845, "global_step": 32024, "epoch": 269, "lr": 5.865210375413301e-05} +{"train_loss": 0.0025406840723007917, "global_step": 32025, "epoch": 269, "lr": 5.864992165823026e-05} +{"train_loss": 0.002810410223901272, "global_step": 32026, "epoch": 269, "lr": 5.8647739545344305e-05} +{"train_loss": 0.0018927392084151506, "global_step": 32027, "epoch": 269, "lr": 5.8645557415479434e-05} +{"train_loss": 0.002242882503196597, "global_step": 32028, "epoch": 269, "lr": 5.8643375268639935e-05} +{"train_loss": 0.0012169694527983665, "global_step": 32029, "epoch": 269, "lr": 5.8641193104830096e-05} +{"train_loss": 0.0022835235577076674, "global_step": 32030, "epoch": 269, "lr": 5.8639010924054195e-05} +{"train_loss": 0.005169016309082508, "global_step": 32031, "epoch": 269, "lr": 5.863682872631652e-05} +{"train_loss": 0.0015953114489093423, "global_step": 32032, "epoch": 269, "lr": 5.8634646511621346e-05} +{"train_loss": 0.00640035979449749, "global_step": 32033, "epoch": 269, "lr": 5.863246427997298e-05} +{"train_loss": 0.0038660275749862194, "global_step": 32034, "epoch": 269, "lr": 5.8630282031375683e-05} +{"train_loss": 0.0032486494164913893, "global_step": 32035, "epoch": 269, "lr": 5.862809976583375e-05} +{"train_loss": 0.001972897443920374, "global_step": 32036, "epoch": 269, "lr": 5.862591748335147e-05} +{"train_loss": 0.002018890343606472, "global_step": 32037, "epoch": 269, "lr": 5.862373518393314e-05} +{"train_loss": 0.0022597811184823513, "global_step": 32038, "epoch": 269, "lr": 5.862155286758299e-05} +{"train_loss": 0.003503261599689722, "global_step": 32039, "epoch": 269, "lr": 5.8619370534305376e-05} +{"train_loss": 0.0026229002978652716, "global_step": 32040, "epoch": 269, "lr": 5.8617188184104534e-05} +{"train_loss": 0.003225353779271245, "global_step": 32041, "epoch": 269, "lr": 5.861500581698476e-05} +{"train_loss": 0.0027626072987914085, "global_step": 32042, "epoch": 269, "lr": 5.861282343295034e-05} +{"train_loss": 0.0030846367590129375, "global_step": 32043, "epoch": 269, "lr": 5.861064103200558e-05} +{"train_loss": 0.0029858204070478678, "global_step": 32044, "epoch": 269, "lr": 5.860845861415473e-05} +{"train_loss": 0.0021928222849965096, "global_step": 32045, "epoch": 269, "lr": 5.8606276179402096e-05} +{"train_loss": 0.0023939390666782856, "global_step": 32046, "epoch": 269, "lr": 5.860409372775195e-05} +{"train_loss": 0.0036613037809729576, "global_step": 32047, "epoch": 269, "lr": 5.8601911259208584e-05} +{"train_loss": 0.003923099022358656, "global_step": 32048, "epoch": 269, "lr": 5.8599728773776284e-05} +{"train_loss": 0.0055932640098035336, "global_step": 32049, "epoch": 269, "lr": 5.859754627145936e-05} +{"train_loss": 0.004539540968835354, "global_step": 32050, "epoch": 269, "lr": 5.859536375226205e-05} +{"train_loss": 0.0018696897896006703, "global_step": 32051, "epoch": 269, "lr": 5.859318121618866e-05} +{"train_loss": 0.003718477673828602, "global_step": 32052, "epoch": 269, "lr": 5.859099866324349e-05} +{"train_loss": 0.0027356063947081566, "global_step": 32053, "epoch": 269, "lr": 5.858881609343081e-05} +{"train_loss": 0.002534419996663928, "global_step": 32054, "epoch": 269, "lr": 5.85866335067549e-05} +{"train_loss": 0.0023097344674170017, "global_step": 32055, "epoch": 269, "lr": 5.8584450903220056e-05} +{"train_loss": 0.003888934850692749, "global_step": 32056, "epoch": 269, "lr": 5.8582268282830565e-05} +{"train_loss": 0.003957570996135473, "global_step": 32057, "epoch": 269, "lr": 5.85800856455907e-05} +{"train_loss": 0.002977272029966116, "global_step": 32058, "epoch": 269, "lr": 5.857790299150476e-05} +{"train_loss": 0.0037913296837359667, "global_step": 32059, "epoch": 269, "lr": 5.857572032057701e-05} +{"train_loss": 0.0027450909838080406, "global_step": 32060, "epoch": 269, "lr": 5.857353763281176e-05} +{"train_loss": 0.004347789566963911, "global_step": 32061, "epoch": 269, "lr": 5.857135492821328e-05} +{"train_loss": 0.003535002935677767, "global_step": 32062, "epoch": 269, "lr": 5.856917220678586e-05} +{"train_loss": 0.004361618310213089, "global_step": 32063, "epoch": 269, "lr": 5.8566989468533795e-05} +{"train_loss": 0.002420348348096013, "global_step": 32064, "epoch": 269, "lr": 5.856480671346135e-05} +{"train_loss": 0.003559735370799899, "global_step": 32065, "epoch": 269, "lr": 5.8562623941572826e-05} +{"train_loss": 0.0025154363829642534, "global_step": 32066, "epoch": 269, "lr": 5.8560441152872515e-05} +{"train_loss": 0.0023087982553988695, "global_step": 32067, "epoch": 269, "lr": 5.855825834736468e-05} +{"train_loss": 0.00248538376763463, "global_step": 32068, "epoch": 269, "lr": 5.855607552505363e-05} +{"train_loss": 0.003108787816017866, "global_step": 32069, "epoch": 269, "lr": 5.855389268594363e-05} +{"train_loss": 0.002810634905472398, "global_step": 32070, "epoch": 269, "lr": 5.855170983003898e-05} +{"train_loss": 0.0026968331076204777, "global_step": 32071, "epoch": 269, "lr": 5.8549526957343956e-05} +{"train_loss": 0.0043098777532577515, "global_step": 32072, "epoch": 269, "lr": 5.854734406786285e-05} +{"train_loss": 0.0018023565644398332, "global_step": 32073, "epoch": 269, "lr": 5.854516116159995e-05} +{"train_loss": 0.0032755574211478233, "global_step": 32074, "epoch": 269, "lr": 5.854297823855954e-05} +{"train_loss": 0.0032318460289388895, "global_step": 32075, "epoch": 269, "lr": 5.854079529874591e-05} +{"train_loss": 0.0022004558704793453, "global_step": 32076, "epoch": 269, "lr": 5.853861234216333e-05} +{"train_loss": 0.0035074877087026834, "global_step": 32077, "epoch": 269, "lr": 5.8536429368816106e-05} +{"train_loss": 0.0027375812642276287, "global_step": 32078, "epoch": 269, "lr": 5.8534246378708504e-05} +{"train_loss": 0.004211608320474625, "global_step": 32079, "epoch": 269, "lr": 5.853206337184483e-05} +{"train_loss": 0.0015093890251591802, "global_step": 32080, "epoch": 269, "lr": 5.852988034822936e-05} +{"train_loss": 0.003469986142590642, "global_step": 32081, "epoch": 269, "lr": 5.852769730786638e-05} +{"train_loss": 0.00444419588893652, "global_step": 32082, "epoch": 269, "lr": 5.852551425076017e-05} +{"train_loss": 0.002287626964971423, "global_step": 32083, "epoch": 269, "lr": 5.852333117691503e-05} +{"train_loss": 0.0025144917890429497, "global_step": 32084, "epoch": 269, "lr": 5.8521148086335245e-05} +{"train_loss": 0.0038599777035415173, "global_step": 32085, "epoch": 269, "lr": 5.851896497902508e-05} +{"train_loss": 0.0028012527618557215, "global_step": 32086, "epoch": 269, "lr": 5.851678185498885e-05} +{"train_loss": 0.002994627458974719, "global_step": 32087, "epoch": 269, "lr": 5.851459871423084e-05} +{"train_loss": 0.0020160386338829994, "global_step": 32088, "epoch": 269, "lr": 5.8512415556755305e-05} +{"train_loss": 0.002367943525314331, "global_step": 32089, "epoch": 269, "lr": 5.8510232382566566e-05} +{"train_loss": 0.0014668102376163006, "global_step": 32090, "epoch": 269, "lr": 5.850804919166888e-05} +{"train_loss": 0.0026972831692546606, "global_step": 32091, "epoch": 269, "lr": 5.850586598406656e-05} +{"train_loss": 0.002964344574138522, "global_step": 32092, "epoch": 269, "lr": 5.850368275976388e-05} +{"train_loss": 0.0032983364071696997, "global_step": 32093, "epoch": 269, "lr": 5.850149951876514e-05} +{"train_loss": 0.004066127818077803, "global_step": 32094, "epoch": 269, "lr": 5.849931626107459e-05} +{"train_loss": 0.002330436371266842, "global_step": 32095, "epoch": 269, "lr": 5.849713298669654e-05} +{"train_loss": 0.002474964829161763, "global_step": 32096, "epoch": 269, "lr": 5.849494969563528e-05} +{"train_loss": 0.0035646057222038507, "global_step": 32097, "epoch": 269, "lr": 5.849276638789509e-05} +{"train_loss": 0.0024613335262984037, "global_step": 32098, "epoch": 269, "lr": 5.849058306348027e-05} +{"train_loss": 0.003239427227526903, "global_step": 32099, "epoch": 269, "lr": 5.8488399722395117e-05} +{"train_loss": 0.004246697295457125, "global_step": 32100, "epoch": 269, "lr": 5.8486216364643875e-05} +{"train_loss": 0.002395784482359886, "global_step": 32101, "epoch": 269, "lr": 5.8484032990230865e-05} +{"train_loss": 0.003717432264238596, "global_step": 32102, "epoch": 269, "lr": 5.848184959916034e-05} +{"train_loss": 0.003948835656046867, "global_step": 32103, "epoch": 269, "lr": 5.847966619143663e-05} +{"train_loss": 0.003358319867402315, "global_step": 32104, "epoch": 269, "lr": 5.8477482767064e-05} +{"train_loss": 0.00310877850279212, "global_step": 32105, "epoch": 269, "lr": 5.847529932604673e-05} +{"train_loss": 0.0020830181892961264, "global_step": 32106, "epoch": 269, "lr": 5.847311586838913e-05} +{"train_loss": 0.0036968293134123087, "global_step": 32107, "epoch": 269, "lr": 5.847093239409546e-05} +{"train_loss": 0.0027771207969635725, "global_step": 32108, "epoch": 269, "lr": 5.8468748903170025e-05} +{"train_loss": 0.0025409855879843235, "global_step": 32109, "epoch": 269, "lr": 5.846656539561709e-05} +{"train_loss": 0.0029225193429738283, "global_step": 32110, "epoch": 269, "lr": 5.846438187144098e-05} +{"train_loss": 0.0042913490906357765, "global_step": 32111, "epoch": 269, "lr": 5.8462198330645944e-05} +{"train_loss": 0.004807904362678528, "global_step": 32112, "epoch": 269, "lr": 5.846001477323629e-05} +{"train_loss": 0.0011995802633464336, "global_step": 32113, "epoch": 269, "lr": 5.845783119921631e-05} +{"train_loss": 0.0023712969850748777, "global_step": 32114, "epoch": 269, "lr": 5.845564760859027e-05} +{"train_loss": 0.0031733789946883917, "global_step": 32115, "epoch": 269, "lr": 5.845346400136247e-05} +{"train_loss": 0.004799226764589548, "global_step": 32116, "epoch": 269, "lr": 5.84512803775372e-05} +{"train_loss": 0.0022304486483335495, "global_step": 32117, "epoch": 269, "lr": 5.8449096737118745e-05} +{"train_loss": 0.004263829905539751, "global_step": 32118, "epoch": 269, "lr": 5.84469130801114e-05} +{"train_loss": 0.0026167475152760744, "global_step": 32119, "epoch": 269, "lr": 5.8444729406519435e-05} +{"train_loss": 0.0030755603220313787, "global_step": 32120, "epoch": 269, "lr": 5.844254571634715e-05} +{"train_loss": 0.0032251595985144377, "global_step": 32121, "epoch": 269, "lr": 5.8440362009598814e-05} +{"train_loss": 0.0036897349637001753, "global_step": 32122, "epoch": 269, "lr": 5.8438178286278744e-05} +{"train_loss": 0.002489854581654072, "global_step": 32123, "epoch": 269, "lr": 5.8435994546391204e-05} +{"train_loss": 0.0027526102494448423, "global_step": 32124, "epoch": 269, "lr": 5.8433810789940504e-05} +{"train_loss": 0.0027923660818487406, "global_step": 32125, "epoch": 269, "lr": 5.843162701693091e-05} +{"train_loss": 0.0029590162448585033, "global_step": 32126, "epoch": 269, "lr": 5.842944322736671e-05} +{"train_loss": 0.00379559095017612, "global_step": 32127, "epoch": 269, "lr": 5.84272594212522e-05} +{"train_loss": 0.0019119331846013665, "global_step": 32128, "epoch": 269, "lr": 5.8425075598591674e-05} +{"train_loss": 0.0030105166732012725, "global_step": 32129, "epoch": 269, "lr": 5.8422891759389406e-05, "val_loss": 0.014816132374107838} +{"train_loss": 0.0023573264479637146, "global_step": 32130, "epoch": 270, "lr": 5.842070790364969e-05} +{"train_loss": 0.003959109541028738, "global_step": 32131, "epoch": 270, "lr": 5.841852403137682e-05} +{"train_loss": 0.002900683553889394, "global_step": 32132, "epoch": 270, "lr": 5.841634014257507e-05} +{"train_loss": 0.001343826181255281, "global_step": 32133, "epoch": 270, "lr": 5.841415623724873e-05} +{"train_loss": 0.0029347273521125317, "global_step": 32134, "epoch": 270, "lr": 5.8411972315402095e-05} +{"train_loss": 0.004342231899499893, "global_step": 32135, "epoch": 270, "lr": 5.840978837703946e-05} +{"train_loss": 0.003812825307250023, "global_step": 32136, "epoch": 270, "lr": 5.840760442216511e-05} +{"train_loss": 0.003848019987344742, "global_step": 32137, "epoch": 270, "lr": 5.840542045078332e-05} +{"train_loss": 0.0022793940734118223, "global_step": 32138, "epoch": 270, "lr": 5.840323646289838e-05} +{"train_loss": 0.0023363977670669556, "global_step": 32139, "epoch": 270, "lr": 5.8401052458514595e-05} +{"train_loss": 0.0019309447379782796, "global_step": 32140, "epoch": 270, "lr": 5.839886843763622e-05} +{"train_loss": 0.00226348708383739, "global_step": 32141, "epoch": 270, "lr": 5.839668440026757e-05} +{"train_loss": 0.006182265933603048, "global_step": 32142, "epoch": 270, "lr": 5.839450034641294e-05} +{"train_loss": 0.0026708869263529778, "global_step": 32143, "epoch": 270, "lr": 5.839231627607661e-05} +{"train_loss": 0.002862568711861968, "global_step": 32144, "epoch": 270, "lr": 5.8390132189262833e-05} +{"train_loss": 0.0028679079841822386, "global_step": 32145, "epoch": 270, "lr": 5.838794808597595e-05} +{"train_loss": 0.004020391497761011, "global_step": 32146, "epoch": 270, "lr": 5.838576396622023e-05} +{"train_loss": 0.001581862336024642, "global_step": 32147, "epoch": 270, "lr": 5.8383579829999945e-05} +{"train_loss": 0.0022552642039954662, "global_step": 32148, "epoch": 270, "lr": 5.83813956773194e-05} +{"train_loss": 0.0023607523180544376, "global_step": 32149, "epoch": 270, "lr": 5.837921150818291e-05} +{"train_loss": 0.0035730849485844374, "global_step": 32150, "epoch": 270, "lr": 5.83770273225947e-05} +{"train_loss": 0.0026165100280195475, "global_step": 32151, "epoch": 270, "lr": 5.83748431205591e-05} +{"train_loss": 0.0022981204092502594, "global_step": 32152, "epoch": 270, "lr": 5.837265890208039e-05} +{"train_loss": 0.004499863833189011, "global_step": 32153, "epoch": 270, "lr": 5.837047466716285e-05} +{"train_loss": 0.001744998968206346, "global_step": 32154, "epoch": 270, "lr": 5.836829041581079e-05} +{"train_loss": 0.0037273066118359566, "global_step": 32155, "epoch": 270, "lr": 5.8366106148028474e-05} +{"train_loss": 0.0025884401984512806, "global_step": 32156, "epoch": 270, "lr": 5.836392186382023e-05} +{"train_loss": 0.002051148097962141, "global_step": 32157, "epoch": 270, "lr": 5.836173756319029e-05} +{"train_loss": 0.0031805881299078465, "global_step": 32158, "epoch": 270, "lr": 5.8359553246142985e-05} +{"train_loss": 0.001491574221290648, "global_step": 32159, "epoch": 270, "lr": 5.835736891268257e-05} +{"train_loss": 0.0021607778035104275, "global_step": 32160, "epoch": 270, "lr": 5.835518456281338e-05} +{"train_loss": 0.002487652702257037, "global_step": 32161, "epoch": 270, "lr": 5.8353000196539665e-05} +{"train_loss": 0.0032355659641325474, "global_step": 32162, "epoch": 270, "lr": 5.8350815813865724e-05} +{"train_loss": 0.0033986575435847044, "global_step": 32163, "epoch": 270, "lr": 5.834863141479585e-05} +{"train_loss": 0.00287149241194129, "global_step": 32164, "epoch": 270, "lr": 5.834644699933434e-05} +{"train_loss": 0.0030643062200397253, "global_step": 32165, "epoch": 270, "lr": 5.834426256748546e-05} +{"train_loss": 0.002249403391033411, "global_step": 32166, "epoch": 270, "lr": 5.8342078119253516e-05} +{"train_loss": 0.004322490654885769, "global_step": 32167, "epoch": 270, "lr": 5.83398936546428e-05} +{"train_loss": 0.001630606479011476, "global_step": 32168, "epoch": 270, "lr": 5.83377091736576e-05} +{"train_loss": 0.0022843144834041595, "global_step": 32169, "epoch": 270, "lr": 5.833552467630219e-05} +{"train_loss": 0.003932849504053593, "global_step": 32170, "epoch": 270, "lr": 5.8333340162580855e-05} +{"train_loss": 0.002354792784899473, "global_step": 32171, "epoch": 270, "lr": 5.833115563249791e-05} +{"train_loss": 0.0033913219813257456, "global_step": 32172, "epoch": 270, "lr": 5.832897108605762e-05} +{"train_loss": 0.0023486819118261337, "global_step": 32173, "epoch": 270, "lr": 5.83267865232643e-05} +{"train_loss": 0.0047765448689460754, "global_step": 32174, "epoch": 270, "lr": 5.832460194412221e-05} +{"train_loss": 0.0025376249104738235, "global_step": 32175, "epoch": 270, "lr": 5.8322417348635673e-05} +{"train_loss": 0.0017417467897757888, "global_step": 32176, "epoch": 270, "lr": 5.832023273680894e-05} +{"train_loss": 0.005312555003911257, "global_step": 32177, "epoch": 270, "lr": 5.8318048108646325e-05} +{"train_loss": 0.0025387865025550127, "global_step": 32178, "epoch": 270, "lr": 5.831586346415212e-05} +{"train_loss": 0.001757728517986834, "global_step": 32179, "epoch": 270, "lr": 5.8313678803330584e-05} +{"train_loss": 0.003247458254918456, "global_step": 32180, "epoch": 270, "lr": 5.831149412618604e-05} +{"train_loss": 0.0024360015522688627, "global_step": 32181, "epoch": 270, "lr": 5.830930943272278e-05} +{"train_loss": 0.00247076153755188, "global_step": 32182, "epoch": 270, "lr": 5.830712472294506e-05} +{"train_loss": 0.0015491406666114926, "global_step": 32183, "epoch": 270, "lr": 5.830493999685719e-05} +{"train_loss": 0.001808068249374628, "global_step": 32184, "epoch": 270, "lr": 5.830275525446346e-05} +{"train_loss": 0.004020886495709419, "global_step": 32185, "epoch": 270, "lr": 5.830057049576816e-05} +{"train_loss": 0.003358971793204546, "global_step": 32186, "epoch": 270, "lr": 5.8298385720775574e-05} +{"train_loss": 0.0037788201589137316, "global_step": 32187, "epoch": 270, "lr": 5.829620092949e-05} +{"train_loss": 0.0016795025439932942, "global_step": 32188, "epoch": 270, "lr": 5.829401612191572e-05} +{"train_loss": 0.0015591154806315899, "global_step": 32189, "epoch": 270, "lr": 5.829183129805702e-05} +{"train_loss": 0.0038272771053016186, "global_step": 32190, "epoch": 270, "lr": 5.828964645791819e-05} +{"train_loss": 0.0029673571698367596, "global_step": 32191, "epoch": 270, "lr": 5.8287461601503534e-05} +{"train_loss": 0.002439536852762103, "global_step": 32192, "epoch": 270, "lr": 5.8285276728817326e-05} +{"train_loss": 0.0020221429876983166, "global_step": 32193, "epoch": 270, "lr": 5.828309183986387e-05} +{"train_loss": 0.0019377449061721563, "global_step": 32194, "epoch": 270, "lr": 5.828090693464745e-05} +{"train_loss": 0.003379663685336709, "global_step": 32195, "epoch": 270, "lr": 5.827872201317234e-05} +{"train_loss": 0.0026596609968692064, "global_step": 32196, "epoch": 270, "lr": 5.827653707544285e-05} +{"train_loss": 0.00310253887437284, "global_step": 32197, "epoch": 270, "lr": 5.827435212146327e-05} +{"train_loss": 0.0028870271053165197, "global_step": 32198, "epoch": 270, "lr": 5.827216715123788e-05} +{"train_loss": 0.0026967802550643682, "global_step": 32199, "epoch": 270, "lr": 5.826998216477096e-05} +{"train_loss": 0.0025002441834658384, "global_step": 32200, "epoch": 270, "lr": 5.826779716206685e-05} +{"train_loss": 0.0021335177589207888, "global_step": 32201, "epoch": 270, "lr": 5.826561214312978e-05} +{"train_loss": 0.0022960719652473927, "global_step": 32202, "epoch": 270, "lr": 5.8263427107964055e-05} +{"train_loss": 0.002830193378031254, "global_step": 32203, "epoch": 270, "lr": 5.8261242056573987e-05} +{"train_loss": 0.0030611290130764246, "global_step": 32204, "epoch": 270, "lr": 5.825905698896385e-05} +{"train_loss": 0.003580986289307475, "global_step": 32205, "epoch": 270, "lr": 5.825687190513793e-05} +{"train_loss": 0.003864181460812688, "global_step": 32206, "epoch": 270, "lr": 5.825468680510053e-05} +{"train_loss": 0.0028101662173867226, "global_step": 32207, "epoch": 270, "lr": 5.825250168885594e-05} +{"train_loss": 0.003365118755027652, "global_step": 32208, "epoch": 270, "lr": 5.825031655640843e-05} +{"train_loss": 0.0034508639946579933, "global_step": 32209, "epoch": 270, "lr": 5.824813140776232e-05} +{"train_loss": 0.0014416136546060443, "global_step": 32210, "epoch": 270, "lr": 5.8245946242921877e-05} +{"train_loss": 0.002767393831163645, "global_step": 32211, "epoch": 270, "lr": 5.82437610618914e-05} +{"train_loss": 0.0021363503765314817, "global_step": 32212, "epoch": 270, "lr": 5.824157586467518e-05} +{"train_loss": 0.0032211996149271727, "global_step": 32213, "epoch": 270, "lr": 5.8239390651277503e-05} +{"train_loss": 0.0025213889311999083, "global_step": 32214, "epoch": 270, "lr": 5.823720542170267e-05} +{"train_loss": 0.0029746489599347115, "global_step": 32215, "epoch": 270, "lr": 5.8235020175954956e-05} +{"train_loss": 0.001702642417512834, "global_step": 32216, "epoch": 270, "lr": 5.8232834914038656e-05} +{"train_loss": 0.002664250088855624, "global_step": 32217, "epoch": 270, "lr": 5.823064963595808e-05} +{"train_loss": 0.0028142393566668034, "global_step": 32218, "epoch": 270, "lr": 5.82284643417175e-05} +{"train_loss": 0.0032958996016532183, "global_step": 32219, "epoch": 270, "lr": 5.822627903132121e-05} +{"train_loss": 0.0031865076161921024, "global_step": 32220, "epoch": 270, "lr": 5.8224093704773484e-05} +{"train_loss": 0.003213708521798253, "global_step": 32221, "epoch": 270, "lr": 5.8221908362078634e-05} +{"train_loss": 0.0020990129560232162, "global_step": 32222, "epoch": 270, "lr": 5.8219723003240955e-05} +{"train_loss": 0.004428103566169739, "global_step": 32223, "epoch": 270, "lr": 5.821753762826472e-05} +{"train_loss": 0.0032289926894009113, "global_step": 32224, "epoch": 270, "lr": 5.821535223715423e-05} +{"train_loss": 0.0035534624475985765, "global_step": 32225, "epoch": 270, "lr": 5.821316682991378e-05} +{"train_loss": 0.0036551458761096, "global_step": 32226, "epoch": 270, "lr": 5.821098140654765e-05} +{"train_loss": 0.001742801396176219, "global_step": 32227, "epoch": 270, "lr": 5.8208795967060135e-05} +{"train_loss": 0.002911337884142995, "global_step": 32228, "epoch": 270, "lr": 5.820661051145551e-05} +{"train_loss": 0.0027212391141802073, "global_step": 32229, "epoch": 270, "lr": 5.82044250397381e-05} +{"train_loss": 0.0027675838209688663, "global_step": 32230, "epoch": 270, "lr": 5.820223955191218e-05} +{"train_loss": 0.0045142387971282005, "global_step": 32231, "epoch": 270, "lr": 5.820005404798203e-05} +{"train_loss": 0.002503907075151801, "global_step": 32232, "epoch": 270, "lr": 5.819786852795196e-05} +{"train_loss": 0.0015003320295363665, "global_step": 32233, "epoch": 270, "lr": 5.8195682991826236e-05} +{"train_loss": 0.004208336118608713, "global_step": 32234, "epoch": 270, "lr": 5.819349743960918e-05} +{"train_loss": 0.0029907545540481806, "global_step": 32235, "epoch": 270, "lr": 5.819131187130505e-05} +{"train_loss": 0.002543805632740259, "global_step": 32236, "epoch": 270, "lr": 5.818912628691817e-05} +{"train_loss": 0.002274479018524289, "global_step": 32237, "epoch": 270, "lr": 5.818694068645282e-05} +{"train_loss": 0.002658568089827895, "global_step": 32238, "epoch": 270, "lr": 5.8184755069913275e-05} +{"train_loss": 0.0031078613828867674, "global_step": 32239, "epoch": 270, "lr": 5.8182569437303835e-05} +{"train_loss": 0.0028942388016730547, "global_step": 32240, "epoch": 270, "lr": 5.81803837886288e-05} +{"train_loss": 0.004305693786591291, "global_step": 32241, "epoch": 270, "lr": 5.8178198123892446e-05} +{"train_loss": 0.001972650643438101, "global_step": 32242, "epoch": 270, "lr": 5.817601244309908e-05} +{"train_loss": 0.0021102800965309143, "global_step": 32243, "epoch": 270, "lr": 5.8173826746252994e-05} +{"train_loss": 0.003727857256308198, "global_step": 32244, "epoch": 270, "lr": 5.817164103335846e-05} +{"train_loss": 0.0024725624825805426, "global_step": 32245, "epoch": 270, "lr": 5.8169455304419795e-05} +{"train_loss": 0.003266148502007127, "global_step": 32246, "epoch": 270, "lr": 5.816726955944126e-05} +{"train_loss": 0.003095905762165785, "global_step": 32247, "epoch": 270, "lr": 5.816508379842718e-05} +{"train_loss": 0.0028573237917143383, "global_step": 32248, "epoch": 270, "lr": 5.8162898021381815e-05, "val_loss": 0.027308516204357147, "train_action_mse_error": 4.493832602747716e-05} +{"train_loss": 0.0027396532241255045, "global_step": 32249, "epoch": 271, "lr": 5.816071222830949e-05} +{"train_loss": 0.0022208108566701412, "global_step": 32250, "epoch": 271, "lr": 5.8158526419214475e-05} +{"train_loss": 0.006814098916947842, "global_step": 32251, "epoch": 271, "lr": 5.815634059410107e-05} +{"train_loss": 0.0015331455506384373, "global_step": 32252, "epoch": 271, "lr": 5.8154154752973544e-05} +{"train_loss": 0.0022792736999690533, "global_step": 32253, "epoch": 271, "lr": 5.815196889583621e-05} +{"train_loss": 0.0018686945550143719, "global_step": 32254, "epoch": 271, "lr": 5.814978302269336e-05} +{"train_loss": 0.003388634417206049, "global_step": 32255, "epoch": 271, "lr": 5.814759713354928e-05} +{"train_loss": 0.0019612452015280724, "global_step": 32256, "epoch": 271, "lr": 5.814541122840827e-05} +{"train_loss": 0.0026591296773403883, "global_step": 32257, "epoch": 271, "lr": 5.814322530727461e-05} +{"train_loss": 0.0026096634101122618, "global_step": 32258, "epoch": 271, "lr": 5.8141039370152596e-05} +{"train_loss": 0.002388971857726574, "global_step": 32259, "epoch": 271, "lr": 5.813885341704652e-05} +{"train_loss": 0.001701180823147297, "global_step": 32260, "epoch": 271, "lr": 5.813666744796068e-05} +{"train_loss": 0.0021190717816352844, "global_step": 32261, "epoch": 271, "lr": 5.813448146289936e-05} +{"train_loss": 0.005685941781848669, "global_step": 32262, "epoch": 271, "lr": 5.813229546186685e-05} +{"train_loss": 0.0026166648603975773, "global_step": 32263, "epoch": 271, "lr": 5.8130109444867456e-05} +{"train_loss": 0.0032034278847277164, "global_step": 32264, "epoch": 271, "lr": 5.812792341190545e-05} +{"train_loss": 0.0020809913985431194, "global_step": 32265, "epoch": 271, "lr": 5.812573736298515e-05} +{"train_loss": 0.0027307637501507998, "global_step": 32266, "epoch": 271, "lr": 5.812355129811081e-05} +{"train_loss": 0.0021264865063130856, "global_step": 32267, "epoch": 271, "lr": 5.812136521728676e-05} +{"train_loss": 0.0033185884822160006, "global_step": 32268, "epoch": 271, "lr": 5.811917912051728e-05} +{"train_loss": 0.0015123413177207112, "global_step": 32269, "epoch": 271, "lr": 5.811699300780666e-05} +{"train_loss": 0.0021322318352758884, "global_step": 32270, "epoch": 271, "lr": 5.811480687915918e-05} +{"train_loss": 0.002360190497711301, "global_step": 32271, "epoch": 271, "lr": 5.811262073457915e-05} +{"train_loss": 0.0030805410351604223, "global_step": 32272, "epoch": 271, "lr": 5.811043457407086e-05} +{"train_loss": 0.002519757254049182, "global_step": 32273, "epoch": 271, "lr": 5.8108248397638585e-05} +{"train_loss": 0.003599179442971945, "global_step": 32274, "epoch": 271, "lr": 5.810606220528664e-05} +{"train_loss": 0.0027113386895507574, "global_step": 32275, "epoch": 271, "lr": 5.810387599701932e-05} +{"train_loss": 0.002173872897401452, "global_step": 32276, "epoch": 271, "lr": 5.8101689772840894e-05} +{"train_loss": 0.004478254821151495, "global_step": 32277, "epoch": 271, "lr": 5.809950353275565e-05} +{"train_loss": 0.0027650909032672644, "global_step": 32278, "epoch": 271, "lr": 5.8097317276767904e-05} +{"train_loss": 0.0034545145463198423, "global_step": 32279, "epoch": 271, "lr": 5.8095131004881956e-05} +{"train_loss": 0.00270612770691514, "global_step": 32280, "epoch": 271, "lr": 5.809294471710206e-05} +{"train_loss": 0.001813220209442079, "global_step": 32281, "epoch": 271, "lr": 5.8090758413432555e-05} +{"train_loss": 0.002807388547807932, "global_step": 32282, "epoch": 271, "lr": 5.80885720938777e-05} +{"train_loss": 0.0036689687985926867, "global_step": 32283, "epoch": 271, "lr": 5.80863857584418e-05} +{"train_loss": 0.002138882875442505, "global_step": 32284, "epoch": 271, "lr": 5.808419940712915e-05} +{"train_loss": 0.0015142993070185184, "global_step": 32285, "epoch": 271, "lr": 5.808201303994403e-05} +{"train_loss": 0.0027649388648569584, "global_step": 32286, "epoch": 271, "lr": 5.807982665689074e-05} +{"train_loss": 0.002949247369542718, "global_step": 32287, "epoch": 271, "lr": 5.8077640257973585e-05} +{"train_loss": 0.0032726468052715063, "global_step": 32288, "epoch": 271, "lr": 5.807545384319684e-05} +{"train_loss": 0.001784060732461512, "global_step": 32289, "epoch": 271, "lr": 5.807326741256479e-05} +{"train_loss": 0.003408093238249421, "global_step": 32290, "epoch": 271, "lr": 5.807108096608176e-05} +{"train_loss": 0.003672471269965172, "global_step": 32291, "epoch": 271, "lr": 5.8068894503752014e-05} +{"train_loss": 0.0033736417535692453, "global_step": 32292, "epoch": 271, "lr": 5.8066708025579866e-05} +{"train_loss": 0.0023046680726110935, "global_step": 32293, "epoch": 271, "lr": 5.8064521531569584e-05} +{"train_loss": 0.0021181318443268538, "global_step": 32294, "epoch": 271, "lr": 5.806233502172549e-05} +{"train_loss": 0.002864001551643014, "global_step": 32295, "epoch": 271, "lr": 5.806014849605186e-05} +{"train_loss": 0.007266422733664513, "global_step": 32296, "epoch": 271, "lr": 5.805796195455298e-05} +{"train_loss": 0.0021969638764858246, "global_step": 32297, "epoch": 271, "lr": 5.8055775397233155e-05} +{"train_loss": 0.0024837753735482693, "global_step": 32298, "epoch": 271, "lr": 5.805358882409668e-05} +{"train_loss": 0.003027114551514387, "global_step": 32299, "epoch": 271, "lr": 5.805140223514784e-05} +{"train_loss": 0.002877571852877736, "global_step": 32300, "epoch": 271, "lr": 5.804921563039094e-05} +{"train_loss": 0.003367938566952944, "global_step": 32301, "epoch": 271, "lr": 5.8047029009830266e-05} +{"train_loss": 0.0022160073276609182, "global_step": 32302, "epoch": 271, "lr": 5.80448423734701e-05} +{"train_loss": 0.00325440033338964, "global_step": 32303, "epoch": 271, "lr": 5.8042655721314755e-05} +{"train_loss": 0.0022575175389647484, "global_step": 32304, "epoch": 271, "lr": 5.8040469053368506e-05} +{"train_loss": 0.0029121122788637877, "global_step": 32305, "epoch": 271, "lr": 5.803828236963566e-05} +{"train_loss": 0.003188451984897256, "global_step": 32306, "epoch": 271, "lr": 5.803609567012052e-05} +{"train_loss": 0.0033231701236218214, "global_step": 32307, "epoch": 271, "lr": 5.8033908954827345e-05} +{"train_loss": 0.0028418495785444975, "global_step": 32308, "epoch": 271, "lr": 5.8031722223760445e-05} +{"train_loss": 0.002160401549190283, "global_step": 32309, "epoch": 271, "lr": 5.802953547692412e-05} +{"train_loss": 0.002844779985025525, "global_step": 32310, "epoch": 271, "lr": 5.802734871432266e-05} +{"train_loss": 0.001863890327513218, "global_step": 32311, "epoch": 271, "lr": 5.802516193596037e-05} +{"train_loss": 0.003617057576775551, "global_step": 32312, "epoch": 271, "lr": 5.8022975141841517e-05} +{"train_loss": 0.002067331923171878, "global_step": 32313, "epoch": 271, "lr": 5.802078833197042e-05} +{"train_loss": 0.003366636112332344, "global_step": 32314, "epoch": 271, "lr": 5.801860150635135e-05} +{"train_loss": 0.0026991060003638268, "global_step": 32315, "epoch": 271, "lr": 5.801641466498861e-05} +{"train_loss": 0.0029176785610616207, "global_step": 32316, "epoch": 271, "lr": 5.8014227807886525e-05} +{"train_loss": 0.0027490383945405483, "global_step": 32317, "epoch": 271, "lr": 5.801204093504933e-05} +{"train_loss": 0.002282968256622553, "global_step": 32318, "epoch": 271, "lr": 5.800985404648136e-05} +{"train_loss": 0.0028725804295390844, "global_step": 32319, "epoch": 271, "lr": 5.800766714218691e-05} +{"train_loss": 0.0025818380527198315, "global_step": 32320, "epoch": 271, "lr": 5.800548022217025e-05} +{"train_loss": 0.002594641176983714, "global_step": 32321, "epoch": 271, "lr": 5.800329328643568e-05} +{"train_loss": 0.0033062787260860205, "global_step": 32322, "epoch": 271, "lr": 5.8001106334987496e-05} +{"train_loss": 0.002884267596527934, "global_step": 32323, "epoch": 271, "lr": 5.799891936783001e-05} +{"train_loss": 0.003769970266148448, "global_step": 32324, "epoch": 271, "lr": 5.7996732384967476e-05} +{"train_loss": 0.002660913858562708, "global_step": 32325, "epoch": 271, "lr": 5.799454538640423e-05} +{"train_loss": 0.0017818787600845098, "global_step": 32326, "epoch": 271, "lr": 5.799235837214455e-05} +{"train_loss": 0.002660284982994199, "global_step": 32327, "epoch": 271, "lr": 5.7990171342192725e-05} +{"train_loss": 0.0016082715010270476, "global_step": 32328, "epoch": 271, "lr": 5.798798429655304e-05} +{"train_loss": 0.0016971344593912363, "global_step": 32329, "epoch": 271, "lr": 5.798579723522982e-05} +{"train_loss": 0.0024083456955850124, "global_step": 32330, "epoch": 271, "lr": 5.798361015822733e-05} +{"train_loss": 0.003695849562063813, "global_step": 32331, "epoch": 271, "lr": 5.798142306554989e-05} +{"train_loss": 0.002157867420464754, "global_step": 32332, "epoch": 271, "lr": 5.7979235957201764e-05} +{"train_loss": 0.0035749352537095547, "global_step": 32333, "epoch": 271, "lr": 5.7977048833187254e-05} +{"train_loss": 0.002875243779271841, "global_step": 32334, "epoch": 271, "lr": 5.797486169351067e-05} +{"train_loss": 0.002005825750529766, "global_step": 32335, "epoch": 271, "lr": 5.79726745381763e-05} +{"train_loss": 0.003145036520436406, "global_step": 32336, "epoch": 271, "lr": 5.797048736718842e-05} +{"train_loss": 0.0031052851118147373, "global_step": 32337, "epoch": 271, "lr": 5.796830018055137e-05} +{"train_loss": 0.0036780082155019045, "global_step": 32338, "epoch": 271, "lr": 5.796611297826939e-05} +{"train_loss": 0.002261853776872158, "global_step": 32339, "epoch": 271, "lr": 5.796392576034681e-05} +{"train_loss": 0.0026596791576594114, "global_step": 32340, "epoch": 271, "lr": 5.79617385267879e-05} +{"train_loss": 0.0027241792995482683, "global_step": 32341, "epoch": 271, "lr": 5.795955127759697e-05} +{"train_loss": 0.002493887208402157, "global_step": 32342, "epoch": 271, "lr": 5.7957364012778315e-05} +{"train_loss": 0.0028509115800261497, "global_step": 32343, "epoch": 271, "lr": 5.7955176732336214e-05} +{"train_loss": 0.002181797754019499, "global_step": 32344, "epoch": 271, "lr": 5.795298943627499e-05} +{"train_loss": 0.0038943137042224407, "global_step": 32345, "epoch": 271, "lr": 5.795080212459891e-05} +{"train_loss": 0.0023552286438643932, "global_step": 32346, "epoch": 271, "lr": 5.7948614797312284e-05} +{"train_loss": 0.004198989365249872, "global_step": 32347, "epoch": 271, "lr": 5.7946427454419405e-05} +{"train_loss": 0.002434331923723221, "global_step": 32348, "epoch": 271, "lr": 5.794424009592456e-05} +{"train_loss": 0.0018590674735605717, "global_step": 32349, "epoch": 271, "lr": 5.794205272183205e-05} +{"train_loss": 0.0022424417547881603, "global_step": 32350, "epoch": 271, "lr": 5.793986533214617e-05} +{"train_loss": 0.00271620717830956, "global_step": 32351, "epoch": 271, "lr": 5.793767792687121e-05} +{"train_loss": 0.002883404726162553, "global_step": 32352, "epoch": 271, "lr": 5.793549050601147e-05} +{"train_loss": 0.0019816914573311806, "global_step": 32353, "epoch": 271, "lr": 5.7933303069571246e-05} +{"train_loss": 0.002856307430192828, "global_step": 32354, "epoch": 271, "lr": 5.793111561755482e-05} +{"train_loss": 0.0026834451127797365, "global_step": 32355, "epoch": 271, "lr": 5.79289281499665e-05} +{"train_loss": 0.0020984939765185118, "global_step": 32356, "epoch": 271, "lr": 5.7926740666810586e-05} +{"train_loss": 0.004944264888763428, "global_step": 32357, "epoch": 271, "lr": 5.792455316809135e-05} +{"train_loss": 0.003262567799538374, "global_step": 32358, "epoch": 271, "lr": 5.79223656538131e-05} +{"train_loss": 0.0018289475701749325, "global_step": 32359, "epoch": 271, "lr": 5.792017812398014e-05} +{"train_loss": 0.001996792620047927, "global_step": 32360, "epoch": 271, "lr": 5.791799057859675e-05} +{"train_loss": 0.0021121115423738956, "global_step": 32361, "epoch": 271, "lr": 5.791580301766722e-05} +{"train_loss": 0.0013501403154805303, "global_step": 32362, "epoch": 271, "lr": 5.791361544119587e-05} +{"train_loss": 0.0016366963973268867, "global_step": 32363, "epoch": 271, "lr": 5.7911427849186996e-05} +{"train_loss": 0.003158323001116514, "global_step": 32364, "epoch": 271, "lr": 5.790924024164486e-05} +{"train_loss": 0.0034195620100945234, "global_step": 32365, "epoch": 271, "lr": 5.790705261857378e-05} +{"train_loss": 0.0038187773898243904, "global_step": 32366, "epoch": 271, "lr": 5.790486497997804e-05} +{"train_loss": 0.0027714868549633177, "global_step": 32367, "epoch": 271, "lr": 5.7902677325861944e-05, "val_loss": 0.015021235682070255} +{"train_loss": 0.0017884494736790657, "global_step": 32368, "epoch": 272, "lr": 5.790048965622979e-05} +{"train_loss": 0.002333579119294882, "global_step": 32369, "epoch": 272, "lr": 5.789830197108588e-05} +{"train_loss": 0.0036227679811418056, "global_step": 32370, "epoch": 272, "lr": 5.789611427043449e-05} +{"train_loss": 0.003397443098947406, "global_step": 32371, "epoch": 272, "lr": 5.789392655427992e-05} +{"train_loss": 0.0017982501303777099, "global_step": 32372, "epoch": 272, "lr": 5.789173882262646e-05} +{"train_loss": 0.002628863090649247, "global_step": 32373, "epoch": 272, "lr": 5.788955107547842e-05} +{"train_loss": 0.0019706683233380318, "global_step": 32374, "epoch": 272, "lr": 5.7887363312840096e-05} +{"train_loss": 0.00230061961337924, "global_step": 32375, "epoch": 272, "lr": 5.7885175534715776e-05} +{"train_loss": 0.0039010534528642893, "global_step": 32376, "epoch": 272, "lr": 5.788298774110974e-05} +{"train_loss": 0.003145898226648569, "global_step": 32377, "epoch": 272, "lr": 5.788079993202632e-05} +{"train_loss": 0.0014215483097359538, "global_step": 32378, "epoch": 272, "lr": 5.7878612107469776e-05} +{"train_loss": 0.0035212403163313866, "global_step": 32379, "epoch": 272, "lr": 5.787642426744443e-05} +{"train_loss": 0.0023392264265567064, "global_step": 32380, "epoch": 272, "lr": 5.787423641195456e-05} +{"train_loss": 0.0034709456376731396, "global_step": 32381, "epoch": 272, "lr": 5.787204854100447e-05} +{"train_loss": 0.003779743565246463, "global_step": 32382, "epoch": 272, "lr": 5.786986065459846e-05} +{"train_loss": 0.0011545917950570583, "global_step": 32383, "epoch": 272, "lr": 5.786767275274082e-05} +{"train_loss": 0.0028229202143847942, "global_step": 32384, "epoch": 272, "lr": 5.786548483543583e-05} +{"train_loss": 0.002253360813483596, "global_step": 32385, "epoch": 272, "lr": 5.786329690268781e-05} +{"train_loss": 0.0035557455848902464, "global_step": 32386, "epoch": 272, "lr": 5.7861108954501055e-05} +{"train_loss": 0.002430924214422703, "global_step": 32387, "epoch": 272, "lr": 5.785892099087984e-05} +{"train_loss": 0.0027670362032949924, "global_step": 32388, "epoch": 272, "lr": 5.785673301182848e-05} +{"train_loss": 0.003290537977591157, "global_step": 32389, "epoch": 272, "lr": 5.7854545017351256e-05} +{"train_loss": 0.0031974108424037695, "global_step": 32390, "epoch": 272, "lr": 5.7852357007452485e-05} +{"train_loss": 0.0034752883948385715, "global_step": 32391, "epoch": 272, "lr": 5.785016898213644e-05} +{"train_loss": 0.003976588137447834, "global_step": 32392, "epoch": 272, "lr": 5.784798094140743e-05} +{"train_loss": 0.004665975458920002, "global_step": 32393, "epoch": 272, "lr": 5.784579288526975e-05} +{"train_loss": 0.002841746900230646, "global_step": 32394, "epoch": 272, "lr": 5.784360481372768e-05} +{"train_loss": 0.002961579244583845, "global_step": 32395, "epoch": 272, "lr": 5.784141672678555e-05} +{"train_loss": 0.003647579811513424, "global_step": 32396, "epoch": 272, "lr": 5.7839228624447613e-05} +{"train_loss": 0.0026903494726866484, "global_step": 32397, "epoch": 272, "lr": 5.783704050671821e-05} +{"train_loss": 0.002441616728901863, "global_step": 32398, "epoch": 272, "lr": 5.78348523736016e-05} +{"train_loss": 0.003164732363075018, "global_step": 32399, "epoch": 272, "lr": 5.7832664225102103e-05} +{"train_loss": 0.002774330787360668, "global_step": 32400, "epoch": 272, "lr": 5.783047606122402e-05} +{"train_loss": 0.0018511395901441574, "global_step": 32401, "epoch": 272, "lr": 5.782828788197161e-05} +{"train_loss": 0.003278427990153432, "global_step": 32402, "epoch": 272, "lr": 5.78260996873492e-05} +{"train_loss": 0.003547315951436758, "global_step": 32403, "epoch": 272, "lr": 5.782391147736108e-05} +{"train_loss": 0.003737051971256733, "global_step": 32404, "epoch": 272, "lr": 5.782172325201155e-05} +{"train_loss": 0.0020713736303150654, "global_step": 32405, "epoch": 272, "lr": 5.7819535011304895e-05} +{"train_loss": 0.0025850471574813128, "global_step": 32406, "epoch": 272, "lr": 5.781734675524544e-05} +{"train_loss": 0.002911062678322196, "global_step": 32407, "epoch": 272, "lr": 5.781515848383744e-05} +{"train_loss": 0.0015680537326261401, "global_step": 32408, "epoch": 272, "lr": 5.78129701970852e-05} +{"train_loss": 0.0021135900169610977, "global_step": 32409, "epoch": 272, "lr": 5.781078189499304e-05} +{"train_loss": 0.0028985196258872747, "global_step": 32410, "epoch": 272, "lr": 5.780859357756524e-05} +{"train_loss": 0.0027849734760820866, "global_step": 32411, "epoch": 272, "lr": 5.7806405244806104e-05} +{"train_loss": 0.004072369541972876, "global_step": 32412, "epoch": 272, "lr": 5.780421689671993e-05} +{"train_loss": 0.0033772459719330072, "global_step": 32413, "epoch": 272, "lr": 5.7802028533311015e-05} +{"train_loss": 0.004212528932839632, "global_step": 32414, "epoch": 272, "lr": 5.779984015458364e-05} +{"train_loss": 0.0037112152203917503, "global_step": 32415, "epoch": 272, "lr": 5.779765176054212e-05} +{"train_loss": 0.002677698852494359, "global_step": 32416, "epoch": 272, "lr": 5.779546335119074e-05} +{"train_loss": 0.002509649842977524, "global_step": 32417, "epoch": 272, "lr": 5.779327492653379e-05} +{"train_loss": 0.002647233894094825, "global_step": 32418, "epoch": 272, "lr": 5.779108648657559e-05} +{"train_loss": 0.002996311755850911, "global_step": 32419, "epoch": 272, "lr": 5.7788898031320425e-05} +{"train_loss": 0.0029909817967563868, "global_step": 32420, "epoch": 272, "lr": 5.778670956077259e-05} +{"train_loss": 0.0016513741575181484, "global_step": 32421, "epoch": 272, "lr": 5.778452107493637e-05} +{"train_loss": 0.0024633207358419895, "global_step": 32422, "epoch": 272, "lr": 5.778233257381609e-05} +{"train_loss": 0.00223520933650434, "global_step": 32423, "epoch": 272, "lr": 5.778014405741602e-05} +{"train_loss": 0.002949772635474801, "global_step": 32424, "epoch": 272, "lr": 5.777795552574048e-05} +{"train_loss": 0.004477372858673334, "global_step": 32425, "epoch": 272, "lr": 5.7775766978793744e-05} +{"train_loss": 0.0018010801868513227, "global_step": 32426, "epoch": 272, "lr": 5.777357841658012e-05} +{"train_loss": 0.0029117176309227943, "global_step": 32427, "epoch": 272, "lr": 5.777138983910391e-05} +{"train_loss": 0.003880246076732874, "global_step": 32428, "epoch": 272, "lr": 5.776920124636941e-05} +{"train_loss": 0.002192314248532057, "global_step": 32429, "epoch": 272, "lr": 5.77670126383809e-05} +{"train_loss": 0.0044188350439071655, "global_step": 32430, "epoch": 272, "lr": 5.7764824015142705e-05} +{"train_loss": 0.00501897931098938, "global_step": 32431, "epoch": 272, "lr": 5.7762635376659116e-05} +{"train_loss": 0.0044595468789339066, "global_step": 32432, "epoch": 272, "lr": 5.7760446722934404e-05} +{"train_loss": 0.003878770861774683, "global_step": 32433, "epoch": 272, "lr": 5.775825805397288e-05} +{"train_loss": 0.0025929841212928295, "global_step": 32434, "epoch": 272, "lr": 5.7756069369778856e-05} +{"train_loss": 0.0031518423929810524, "global_step": 32435, "epoch": 272, "lr": 5.775388067035662e-05} +{"train_loss": 0.0026774718426167965, "global_step": 32436, "epoch": 272, "lr": 5.7751691955710466e-05} +{"train_loss": 0.002090866444632411, "global_step": 32437, "epoch": 272, "lr": 5.774950322584468e-05} +{"train_loss": 0.005220397375524044, "global_step": 32438, "epoch": 272, "lr": 5.7747314480763595e-05} +{"train_loss": 0.00206824135966599, "global_step": 32439, "epoch": 272, "lr": 5.774512572047147e-05} +{"train_loss": 0.0036581899039447308, "global_step": 32440, "epoch": 272, "lr": 5.774293694497263e-05} +{"train_loss": 0.0031643223483115435, "global_step": 32441, "epoch": 272, "lr": 5.774074815427135e-05} +{"train_loss": 0.0017637975979596376, "global_step": 32442, "epoch": 272, "lr": 5.7738559348371937e-05} +{"train_loss": 0.0023487985599786043, "global_step": 32443, "epoch": 272, "lr": 5.773637052727869e-05} +{"train_loss": 0.0019145511323586106, "global_step": 32444, "epoch": 272, "lr": 5.77341816909959e-05} +{"train_loss": 0.004560644738376141, "global_step": 32445, "epoch": 272, "lr": 5.773199283952788e-05} +{"train_loss": 0.0030638885218650103, "global_step": 32446, "epoch": 272, "lr": 5.772980397287893e-05} +{"train_loss": 0.002650325419381261, "global_step": 32447, "epoch": 272, "lr": 5.772761509105331e-05} +{"train_loss": 0.0015223915688693523, "global_step": 32448, "epoch": 272, "lr": 5.7725426194055356e-05} +{"train_loss": 0.0037534490693360567, "global_step": 32449, "epoch": 272, "lr": 5.772323728188935e-05} +{"train_loss": 0.0017183602321892977, "global_step": 32450, "epoch": 272, "lr": 5.772104835455961e-05} +{"train_loss": 0.003736570943146944, "global_step": 32451, "epoch": 272, "lr": 5.7718859412070404e-05} +{"train_loss": 0.00356034142896533, "global_step": 32452, "epoch": 272, "lr": 5.7716670454426034e-05} +{"train_loss": 0.0029238329734653234, "global_step": 32453, "epoch": 272, "lr": 5.7714481481630814e-05} +{"train_loss": 0.0023383330553770065, "global_step": 32454, "epoch": 272, "lr": 5.771229249368904e-05} +{"train_loss": 0.003947261720895767, "global_step": 32455, "epoch": 272, "lr": 5.7710103490604996e-05} +{"train_loss": 0.0028526163659989834, "global_step": 32456, "epoch": 272, "lr": 5.770791447238297e-05} +{"train_loss": 0.0025204047560691833, "global_step": 32457, "epoch": 272, "lr": 5.7705725439027314e-05} +{"train_loss": 0.0035469899885356426, "global_step": 32458, "epoch": 272, "lr": 5.770353639054226e-05} +{"train_loss": 0.0023015737533569336, "global_step": 32459, "epoch": 272, "lr": 5.7701347326932144e-05} +{"train_loss": 0.003909461200237274, "global_step": 32460, "epoch": 272, "lr": 5.769915824820126e-05} +{"train_loss": 0.004131739493459463, "global_step": 32461, "epoch": 272, "lr": 5.7696969154353894e-05} +{"train_loss": 0.002846012357622385, "global_step": 32462, "epoch": 272, "lr": 5.7694780045394346e-05} +{"train_loss": 0.0020036352798342705, "global_step": 32463, "epoch": 272, "lr": 5.769259092132695e-05} +{"train_loss": 0.0019719242118299007, "global_step": 32464, "epoch": 272, "lr": 5.7690401782155945e-05} +{"train_loss": 0.003193254116922617, "global_step": 32465, "epoch": 272, "lr": 5.768821262788566e-05} +{"train_loss": 0.0025267896708101034, "global_step": 32466, "epoch": 272, "lr": 5.76860234585204e-05} +{"train_loss": 0.004113192204385996, "global_step": 32467, "epoch": 272, "lr": 5.7683834274064454e-05} +{"train_loss": 0.0025674221105873585, "global_step": 32468, "epoch": 272, "lr": 5.768164507452212e-05} +{"train_loss": 0.0034153335727751255, "global_step": 32469, "epoch": 272, "lr": 5.767945585989769e-05} +{"train_loss": 0.0023976394440978765, "global_step": 32470, "epoch": 272, "lr": 5.767726663019548e-05} +{"train_loss": 0.0021642008796334267, "global_step": 32471, "epoch": 272, "lr": 5.767507738541976e-05} +{"train_loss": 0.002473855158314109, "global_step": 32472, "epoch": 272, "lr": 5.767288812557485e-05} +{"train_loss": 0.003628613892942667, "global_step": 32473, "epoch": 272, "lr": 5.767069885066505e-05} +{"train_loss": 0.002640597755089402, "global_step": 32474, "epoch": 272, "lr": 5.766850956069465e-05} +{"train_loss": 0.002330370945855975, "global_step": 32475, "epoch": 272, "lr": 5.766632025566796e-05} +{"train_loss": 0.0023652443196624517, "global_step": 32476, "epoch": 272, "lr": 5.766413093558926e-05} +{"train_loss": 0.003047731937840581, "global_step": 32477, "epoch": 272, "lr": 5.766194160046285e-05} +{"train_loss": 0.0025672686751931906, "global_step": 32478, "epoch": 272, "lr": 5.765975225029304e-05} +{"train_loss": 0.0022274665534496307, "global_step": 32479, "epoch": 272, "lr": 5.765756288508414e-05} +{"train_loss": 0.0023808754049241543, "global_step": 32480, "epoch": 272, "lr": 5.7655373504840415e-05} +{"train_loss": 0.004350175615400076, "global_step": 32481, "epoch": 272, "lr": 5.7653184109566194e-05} +{"train_loss": 0.0019574237521737814, "global_step": 32482, "epoch": 272, "lr": 5.765099469926577e-05} +{"train_loss": 0.003042986150830984, "global_step": 32483, "epoch": 272, "lr": 5.764880527394342e-05} +{"train_loss": 0.0017689286032691598, "global_step": 32484, "epoch": 272, "lr": 5.764661583360347e-05} +{"train_loss": 0.0024922527372837067, "global_step": 32485, "epoch": 272, "lr": 5.764442637825019e-05} +{"train_loss": 0.0029233001415156015, "global_step": 32486, "epoch": 272, "lr": 5.76422369078879e-05, "val_loss": 0.023622335866093636} +{"train_loss": 0.003466735128313303, "global_step": 32487, "epoch": 273, "lr": 5.7640047422520904e-05} +{"train_loss": 0.0037007424980401993, "global_step": 32488, "epoch": 273, "lr": 5.7637857922153496e-05} +{"train_loss": 0.0023385281674563885, "global_step": 32489, "epoch": 273, "lr": 5.763566840678996e-05} +{"train_loss": 0.0019094463204964995, "global_step": 32490, "epoch": 273, "lr": 5.76334788764346e-05} +{"train_loss": 0.002091960282996297, "global_step": 32491, "epoch": 273, "lr": 5.763128933109172e-05} +{"train_loss": 0.0017200943548232317, "global_step": 32492, "epoch": 273, "lr": 5.7629099770765624e-05} +{"train_loss": 0.0027620894834399223, "global_step": 32493, "epoch": 273, "lr": 5.76269101954606e-05} +{"train_loss": 0.002776812994852662, "global_step": 32494, "epoch": 273, "lr": 5.762472060518096e-05} +{"train_loss": 0.0036237577442079782, "global_step": 32495, "epoch": 273, "lr": 5.7622530999931e-05} +{"train_loss": 0.0020140036940574646, "global_step": 32496, "epoch": 273, "lr": 5.7620341379715004e-05} +{"train_loss": 0.002933751093223691, "global_step": 32497, "epoch": 273, "lr": 5.761815174453729e-05} +{"train_loss": 0.002892937045544386, "global_step": 32498, "epoch": 273, "lr": 5.761596209440214e-05} +{"train_loss": 0.003349950537085533, "global_step": 32499, "epoch": 273, "lr": 5.761377242931386e-05} +{"train_loss": 0.0029027280397713184, "global_step": 32500, "epoch": 273, "lr": 5.761158274927677e-05} +{"train_loss": 0.0023806975223124027, "global_step": 32501, "epoch": 273, "lr": 5.760939305429515e-05} +{"train_loss": 0.0012946377974003553, "global_step": 32502, "epoch": 273, "lr": 5.760720334437328e-05} +{"train_loss": 0.0017860393272712827, "global_step": 32503, "epoch": 273, "lr": 5.760501361951549e-05} +{"train_loss": 0.0018665756797417998, "global_step": 32504, "epoch": 273, "lr": 5.760282387972607e-05} +{"train_loss": 0.0029506096616387367, "global_step": 32505, "epoch": 273, "lr": 5.76006341250093e-05} +{"train_loss": 0.0028732577338814735, "global_step": 32506, "epoch": 273, "lr": 5.759844435536951e-05} +{"train_loss": 0.0022296339739114046, "global_step": 32507, "epoch": 273, "lr": 5.7596254570810994e-05} +{"train_loss": 0.0036770824808627367, "global_step": 32508, "epoch": 273, "lr": 5.759406477133803e-05} +{"train_loss": 0.004183927085250616, "global_step": 32509, "epoch": 273, "lr": 5.7591874956954936e-05} +{"train_loss": 0.0021144025959074497, "global_step": 32510, "epoch": 273, "lr": 5.7589685127666006e-05} +{"train_loss": 0.002538404893130064, "global_step": 32511, "epoch": 273, "lr": 5.758749528347554e-05} +{"train_loss": 0.002064858563244343, "global_step": 32512, "epoch": 273, "lr": 5.758530542438784e-05} +{"train_loss": 0.0020301220938563347, "global_step": 32513, "epoch": 273, "lr": 5.758311555040721e-05} +{"train_loss": 0.0015988252125680447, "global_step": 32514, "epoch": 273, "lr": 5.7580925661537934e-05} +{"train_loss": 0.0015745038399472833, "global_step": 32515, "epoch": 273, "lr": 5.757873575778432e-05} +{"train_loss": 0.0014402162050828338, "global_step": 32516, "epoch": 273, "lr": 5.757654583915067e-05} +{"train_loss": 0.001471757423132658, "global_step": 32517, "epoch": 273, "lr": 5.7574355905641284e-05} +{"train_loss": 0.0010165672283619642, "global_step": 32518, "epoch": 273, "lr": 5.757216595726045e-05} +{"train_loss": 0.005247772671282291, "global_step": 32519, "epoch": 273, "lr": 5.7569975994012494e-05} +{"train_loss": 0.0019788951613008976, "global_step": 32520, "epoch": 273, "lr": 5.756778601590169e-05} +{"train_loss": 0.0025647373404353857, "global_step": 32521, "epoch": 273, "lr": 5.7565596022932345e-05} +{"train_loss": 0.0022744787856936455, "global_step": 32522, "epoch": 273, "lr": 5.756340601510876e-05} +{"train_loss": 0.002171003958210349, "global_step": 32523, "epoch": 273, "lr": 5.7561215992435234e-05} +{"train_loss": 0.0015983401099219918, "global_step": 32524, "epoch": 273, "lr": 5.755902595491607e-05} +{"train_loss": 0.0009739050292409956, "global_step": 32525, "epoch": 273, "lr": 5.7556835902555564e-05} +{"train_loss": 0.0012712556635960937, "global_step": 32526, "epoch": 273, "lr": 5.7554645835358024e-05} +{"train_loss": 0.0025260262191295624, "global_step": 32527, "epoch": 273, "lr": 5.755245575332774e-05} +{"train_loss": 0.0020292080007493496, "global_step": 32528, "epoch": 273, "lr": 5.7550265656469014e-05} +{"train_loss": 0.001661954796873033, "global_step": 32529, "epoch": 273, "lr": 5.754807554478615e-05} +{"train_loss": 0.0017787166871130466, "global_step": 32530, "epoch": 273, "lr": 5.754588541828344e-05} +{"train_loss": 0.001729096518829465, "global_step": 32531, "epoch": 273, "lr": 5.754369527696521e-05} +{"train_loss": 0.0021723872050642967, "global_step": 32532, "epoch": 273, "lr": 5.7541505120835726e-05} +{"train_loss": 0.0024372627958655357, "global_step": 32533, "epoch": 273, "lr": 5.75393149498993e-05} +{"train_loss": 0.0018658057088032365, "global_step": 32534, "epoch": 273, "lr": 5.753712476416025e-05} +{"train_loss": 0.0020288359373807907, "global_step": 32535, "epoch": 273, "lr": 5.753493456362284e-05} +{"train_loss": 0.0015547400107607245, "global_step": 32536, "epoch": 273, "lr": 5.75327443482914e-05} +{"train_loss": 0.001413005986250937, "global_step": 32537, "epoch": 273, "lr": 5.753055411817022e-05} +{"train_loss": 0.003251858754083514, "global_step": 32538, "epoch": 273, "lr": 5.7528363873263615e-05} +{"train_loss": 0.003313081106171012, "global_step": 32539, "epoch": 273, "lr": 5.752617361357585e-05} +{"train_loss": 0.003058761591091752, "global_step": 32540, "epoch": 273, "lr": 5.7523983339111254e-05} +{"train_loss": 0.0018547975923866034, "global_step": 32541, "epoch": 273, "lr": 5.752179304987413e-05} +{"train_loss": 0.0019827496726065874, "global_step": 32542, "epoch": 273, "lr": 5.751960274586875e-05} +{"train_loss": 0.0026792711578309536, "global_step": 32543, "epoch": 273, "lr": 5.7517412427099435e-05} +{"train_loss": 0.0018721085507422686, "global_step": 32544, "epoch": 273, "lr": 5.751522209357051e-05} +{"train_loss": 0.005003800615668297, "global_step": 32545, "epoch": 273, "lr": 5.7513031745286226e-05} +{"train_loss": 0.0014810373540967703, "global_step": 32546, "epoch": 273, "lr": 5.7510841382250916e-05} +{"train_loss": 0.0019567450508475304, "global_step": 32547, "epoch": 273, "lr": 5.750865100446887e-05} +{"train_loss": 0.0020352068822830915, "global_step": 32548, "epoch": 273, "lr": 5.7506460611944394e-05} +{"train_loss": 0.001731961965560913, "global_step": 32549, "epoch": 273, "lr": 5.7504270204681773e-05} +{"train_loss": 0.002745814388617873, "global_step": 32550, "epoch": 273, "lr": 5.7502079782685334e-05} +{"train_loss": 0.0013339564902707934, "global_step": 32551, "epoch": 273, "lr": 5.749988934595936e-05} +{"train_loss": 0.0013877033488824964, "global_step": 32552, "epoch": 273, "lr": 5.7497698894508146e-05} +{"train_loss": 0.0028993391897529364, "global_step": 32553, "epoch": 273, "lr": 5.749550842833601e-05} +{"train_loss": 0.0037733453791588545, "global_step": 32554, "epoch": 273, "lr": 5.749331794744723e-05} +{"train_loss": 0.0017978714313358068, "global_step": 32555, "epoch": 273, "lr": 5.749112745184613e-05} +{"train_loss": 0.002162075135856867, "global_step": 32556, "epoch": 273, "lr": 5.7488936941537e-05} +{"train_loss": 0.001832669135183096, "global_step": 32557, "epoch": 273, "lr": 5.748674641652414e-05} +{"train_loss": 0.002803117735311389, "global_step": 32558, "epoch": 273, "lr": 5.748455587681186e-05} +{"train_loss": 0.0021494582761079073, "global_step": 32559, "epoch": 273, "lr": 5.748236532240445e-05} +{"train_loss": 0.0025075520388782024, "global_step": 32560, "epoch": 273, "lr": 5.748017475330621e-05} +{"train_loss": 0.0021624495275318623, "global_step": 32561, "epoch": 273, "lr": 5.747798416952146e-05} +{"train_loss": 0.002935828175395727, "global_step": 32562, "epoch": 273, "lr": 5.747579357105447e-05} +{"train_loss": 0.0014615753898397088, "global_step": 32563, "epoch": 273, "lr": 5.747360295790958e-05} +{"train_loss": 0.0023364517837762833, "global_step": 32564, "epoch": 273, "lr": 5.7471412330091057e-05} +{"train_loss": 0.002517504384741187, "global_step": 32565, "epoch": 273, "lr": 5.7469221687603206e-05} +{"train_loss": 0.0042330739088356495, "global_step": 32566, "epoch": 273, "lr": 5.746703103045035e-05} +{"train_loss": 0.0021269170101732016, "global_step": 32567, "epoch": 273, "lr": 5.746484035863676e-05} +{"train_loss": 0.001562815741635859, "global_step": 32568, "epoch": 273, "lr": 5.746264967216677e-05} +{"train_loss": 0.0030265399254858494, "global_step": 32569, "epoch": 273, "lr": 5.7460458971044664e-05} +{"train_loss": 0.0019444471690803766, "global_step": 32570, "epoch": 273, "lr": 5.745826825527474e-05} +{"train_loss": 0.0014452912146225572, "global_step": 32571, "epoch": 273, "lr": 5.745607752486129e-05} +{"train_loss": 0.0012843776494264603, "global_step": 32572, "epoch": 273, "lr": 5.745388677980864e-05} +{"train_loss": 0.003804415464401245, "global_step": 32573, "epoch": 273, "lr": 5.7451696020121085e-05} +{"train_loss": 0.002924446715041995, "global_step": 32574, "epoch": 273, "lr": 5.74495052458029e-05} +{"train_loss": 0.0016985866241157055, "global_step": 32575, "epoch": 273, "lr": 5.744731445685843e-05} +{"train_loss": 0.0024618208408355713, "global_step": 32576, "epoch": 273, "lr": 5.744512365329194e-05} +{"train_loss": 0.0014009723672643304, "global_step": 32577, "epoch": 273, "lr": 5.744293283510775e-05} +{"train_loss": 0.00186197052244097, "global_step": 32578, "epoch": 273, "lr": 5.744074200231015e-05} +{"train_loss": 0.0032018774654716253, "global_step": 32579, "epoch": 273, "lr": 5.743855115490346e-05} +{"train_loss": 0.004471893422305584, "global_step": 32580, "epoch": 273, "lr": 5.743636029289197e-05} +{"train_loss": 0.002906030509620905, "global_step": 32581, "epoch": 273, "lr": 5.743416941627997e-05} +{"train_loss": 0.002262768568471074, "global_step": 32582, "epoch": 273, "lr": 5.7431978525071795e-05} +{"train_loss": 0.0011926330626010895, "global_step": 32583, "epoch": 273, "lr": 5.7429787619271705e-05} +{"train_loss": 0.0026128266472369432, "global_step": 32584, "epoch": 273, "lr": 5.742759669888402e-05} +{"train_loss": 0.00206152256578207, "global_step": 32585, "epoch": 273, "lr": 5.742540576391304e-05} +{"train_loss": 0.002134883776307106, "global_step": 32586, "epoch": 273, "lr": 5.742321481436308e-05} +{"train_loss": 0.0017106557497754693, "global_step": 32587, "epoch": 273, "lr": 5.742102385023842e-05} +{"train_loss": 0.0012941898312419653, "global_step": 32588, "epoch": 273, "lr": 5.741883287154339e-05} +{"train_loss": 0.00211063283495605, "global_step": 32589, "epoch": 273, "lr": 5.741664187828226e-05} +{"train_loss": 0.002710235072299838, "global_step": 32590, "epoch": 273, "lr": 5.7414450870459345e-05} +{"train_loss": 0.0035928627476096153, "global_step": 32591, "epoch": 273, "lr": 5.7412259848078945e-05} +{"train_loss": 0.00252191792242229, "global_step": 32592, "epoch": 273, "lr": 5.741006881114537e-05} +{"train_loss": 0.002015592297539115, "global_step": 32593, "epoch": 273, "lr": 5.740787775966291e-05} +{"train_loss": 0.0028041123878210783, "global_step": 32594, "epoch": 273, "lr": 5.74056866936359e-05} +{"train_loss": 0.0018425688613206148, "global_step": 32595, "epoch": 273, "lr": 5.740349561306859e-05} +{"train_loss": 0.002508873585611582, "global_step": 32596, "epoch": 273, "lr": 5.74013045179653e-05} +{"train_loss": 0.0014576723333448172, "global_step": 32597, "epoch": 273, "lr": 5.7399113408330365e-05} +{"train_loss": 0.003530730726197362, "global_step": 32598, "epoch": 273, "lr": 5.739692228416804e-05} +{"train_loss": 0.0034544956870377064, "global_step": 32599, "epoch": 273, "lr": 5.739473114548266e-05} +{"train_loss": 0.0019922901410609484, "global_step": 32600, "epoch": 273, "lr": 5.7392539992278515e-05} +{"train_loss": 0.0020810242276638746, "global_step": 32601, "epoch": 273, "lr": 5.739034882455991e-05} +{"train_loss": 0.003275279887020588, "global_step": 32602, "epoch": 273, "lr": 5.738815764233114e-05} +{"train_loss": 0.002851788653060794, "global_step": 32603, "epoch": 273, "lr": 5.7385966445596504e-05} +{"train_loss": 0.0015633858274668455, "global_step": 32604, "epoch": 273, "lr": 5.7383775234360324e-05} +{"train_loss": 0.002350186594045807, "global_step": 32605, "epoch": 273, "lr": 5.7381584008626884e-05, "val_loss": 0.020676789805293083} +{"train_loss": 0.003777771722525358, "global_step": 32606, "epoch": 274, "lr": 5.73793927684005e-05} +{"train_loss": 0.0014436269411817193, "global_step": 32607, "epoch": 274, "lr": 5.7377201513685455e-05} +{"train_loss": 0.0032525970600545406, "global_step": 32608, "epoch": 274, "lr": 5.737501024448607e-05} +{"train_loss": 0.002376939170062542, "global_step": 32609, "epoch": 274, "lr": 5.737281896080664e-05} +{"train_loss": 0.002527747070416808, "global_step": 32610, "epoch": 274, "lr": 5.737062766265147e-05} +{"train_loss": 0.002558834385126829, "global_step": 32611, "epoch": 274, "lr": 5.736843635002485e-05} +{"train_loss": 0.004329899325966835, "global_step": 32612, "epoch": 274, "lr": 5.7366245022931096e-05} +{"train_loss": 0.001746974652633071, "global_step": 32613, "epoch": 274, "lr": 5.736405368137452e-05} +{"train_loss": 0.0018963625188916922, "global_step": 32614, "epoch": 274, "lr": 5.7361862325359395e-05} +{"train_loss": 0.0034206921700388193, "global_step": 32615, "epoch": 274, "lr": 5.7359670954890054e-05} +{"train_loss": 0.0018453425727784634, "global_step": 32616, "epoch": 274, "lr": 5.735747956997077e-05} +{"train_loss": 0.00258197751827538, "global_step": 32617, "epoch": 274, "lr": 5.735528817060587e-05} +{"train_loss": 0.003698415122926235, "global_step": 32618, "epoch": 274, "lr": 5.735309675679964e-05} +{"train_loss": 0.00247924099676311, "global_step": 32619, "epoch": 274, "lr": 5.73509053285564e-05} +{"train_loss": 0.001807552413083613, "global_step": 32620, "epoch": 274, "lr": 5.7348713885880444e-05} +{"train_loss": 0.0017418788047507405, "global_step": 32621, "epoch": 274, "lr": 5.734652242877607e-05} +{"train_loss": 0.003146212315186858, "global_step": 32622, "epoch": 274, "lr": 5.734433095724758e-05} +{"train_loss": 0.0028021230828016996, "global_step": 32623, "epoch": 274, "lr": 5.7342139471299284e-05} +{"train_loss": 0.0018105675699189305, "global_step": 32624, "epoch": 274, "lr": 5.733994797093548e-05} +{"train_loss": 0.00220462866127491, "global_step": 32625, "epoch": 274, "lr": 5.733775645616047e-05} +{"train_loss": 0.004661215003579855, "global_step": 32626, "epoch": 274, "lr": 5.7335564926978555e-05} +{"train_loss": 0.003321328666061163, "global_step": 32627, "epoch": 274, "lr": 5.733337338339405e-05} +{"train_loss": 0.002870754571631551, "global_step": 32628, "epoch": 274, "lr": 5.733118182541125e-05} +{"train_loss": 0.0027636855375021696, "global_step": 32629, "epoch": 274, "lr": 5.7328990253034456e-05} +{"train_loss": 0.0042960867285728455, "global_step": 32630, "epoch": 274, "lr": 5.732679866626797e-05} +{"train_loss": 0.002445491496473551, "global_step": 32631, "epoch": 274, "lr": 5.73246070651161e-05} +{"train_loss": 0.0034842046443372965, "global_step": 32632, "epoch": 274, "lr": 5.732241544958315e-05} +{"train_loss": 0.0023643565364181995, "global_step": 32633, "epoch": 274, "lr": 5.732022381967343e-05} +{"train_loss": 0.00317412824369967, "global_step": 32634, "epoch": 274, "lr": 5.731803217539121e-05} +{"train_loss": 0.003876762930303812, "global_step": 32635, "epoch": 274, "lr": 5.7315840516740825e-05} +{"train_loss": 0.0025866851210594177, "global_step": 32636, "epoch": 274, "lr": 5.731364884372656e-05} +{"train_loss": 0.003442269517108798, "global_step": 32637, "epoch": 274, "lr": 5.7311457156352745e-05} +{"train_loss": 0.0023777938913553953, "global_step": 32638, "epoch": 274, "lr": 5.7309265454623665e-05} +{"train_loss": 0.0025053482968360186, "global_step": 32639, "epoch": 274, "lr": 5.7307073738543604e-05} +{"train_loss": 0.003316435730084777, "global_step": 32640, "epoch": 274, "lr": 5.730488200811689e-05} +{"train_loss": 0.002598315943032503, "global_step": 32641, "epoch": 274, "lr": 5.7302690263347824e-05} +{"train_loss": 0.0025299189146608114, "global_step": 32642, "epoch": 274, "lr": 5.7300498504240705e-05} +{"train_loss": 0.0036454873625189066, "global_step": 32643, "epoch": 274, "lr": 5.729830673079984e-05} +{"train_loss": 0.0029832918662577868, "global_step": 32644, "epoch": 274, "lr": 5.7296114943029536e-05} +{"train_loss": 0.0018907469930127263, "global_step": 32645, "epoch": 274, "lr": 5.729392314093408e-05} +{"train_loss": 0.00342115038074553, "global_step": 32646, "epoch": 274, "lr": 5.729173132451778e-05} +{"train_loss": 0.0033908775076270103, "global_step": 32647, "epoch": 274, "lr": 5.728953949378495e-05} +{"train_loss": 0.003495883895084262, "global_step": 32648, "epoch": 274, "lr": 5.728734764873989e-05} +{"train_loss": 0.002063841326162219, "global_step": 32649, "epoch": 274, "lr": 5.72851557893869e-05} +{"train_loss": 0.0021468554623425007, "global_step": 32650, "epoch": 274, "lr": 5.728296391573029e-05} +{"train_loss": 0.0027961439918726683, "global_step": 32651, "epoch": 274, "lr": 5.7280772027774365e-05} +{"train_loss": 0.003916705958545208, "global_step": 32652, "epoch": 274, "lr": 5.727858012552341e-05} +{"train_loss": 0.0030294316820800304, "global_step": 32653, "epoch": 274, "lr": 5.727638820898174e-05} +{"train_loss": 0.001561780576594174, "global_step": 32654, "epoch": 274, "lr": 5.727419627815366e-05} +{"train_loss": 0.0035259113647043705, "global_step": 32655, "epoch": 274, "lr": 5.727200433304347e-05} +{"train_loss": 0.004279914312064648, "global_step": 32656, "epoch": 274, "lr": 5.726981237365547e-05} +{"train_loss": 0.0014705777866765857, "global_step": 32657, "epoch": 274, "lr": 5.7267620399993984e-05} +{"train_loss": 0.0035744719207286835, "global_step": 32658, "epoch": 274, "lr": 5.7265428412063306e-05} +{"train_loss": 0.0024956748820841312, "global_step": 32659, "epoch": 274, "lr": 5.726323640986771e-05} +{"train_loss": 0.0031538226176053286, "global_step": 32660, "epoch": 274, "lr": 5.7261044393411554e-05} +{"train_loss": 0.0028946080710738897, "global_step": 32661, "epoch": 274, "lr": 5.72588523626991e-05} +{"train_loss": 0.0038369721733033657, "global_step": 32662, "epoch": 274, "lr": 5.725666031773467e-05} +{"train_loss": 0.002968871034681797, "global_step": 32663, "epoch": 274, "lr": 5.7254468258522565e-05} +{"train_loss": 0.002323040273040533, "global_step": 32664, "epoch": 274, "lr": 5.725227618506708e-05} +{"train_loss": 0.004694080445915461, "global_step": 32665, "epoch": 274, "lr": 5.725008409737253e-05} +{"train_loss": 0.003811762435361743, "global_step": 32666, "epoch": 274, "lr": 5.72478919954432e-05} +{"train_loss": 0.0030301869846880436, "global_step": 32667, "epoch": 274, "lr": 5.724569987928342e-05} +{"train_loss": 0.0032598653342574835, "global_step": 32668, "epoch": 274, "lr": 5.7243507748897486e-05} +{"train_loss": 0.0034997016191482544, "global_step": 32669, "epoch": 274, "lr": 5.7241315604289694e-05} +{"train_loss": 0.0028185697738081217, "global_step": 32670, "epoch": 274, "lr": 5.723912344546436e-05} +{"train_loss": 0.002784071722999215, "global_step": 32671, "epoch": 274, "lr": 5.7236931272425764e-05} +{"train_loss": 0.001988559029996395, "global_step": 32672, "epoch": 274, "lr": 5.723473908517823e-05} +{"train_loss": 0.002039775950834155, "global_step": 32673, "epoch": 274, "lr": 5.7232546883726066e-05} +{"train_loss": 0.003611907595768571, "global_step": 32674, "epoch": 274, "lr": 5.723035466807357e-05} +{"train_loss": 0.005654375068843365, "global_step": 32675, "epoch": 274, "lr": 5.722816243822503e-05} +{"train_loss": 0.0018318926449865103, "global_step": 32676, "epoch": 274, "lr": 5.7225970194184785e-05} +{"train_loss": 0.0033066931646317244, "global_step": 32677, "epoch": 274, "lr": 5.722377793595711e-05} +{"train_loss": 0.0030383202247321606, "global_step": 32678, "epoch": 274, "lr": 5.722158566354632e-05} +{"train_loss": 0.0017991731874644756, "global_step": 32679, "epoch": 274, "lr": 5.721939337695672e-05} +{"train_loss": 0.002441460033878684, "global_step": 32680, "epoch": 274, "lr": 5.721720107619261e-05} +{"train_loss": 0.001970460405573249, "global_step": 32681, "epoch": 274, "lr": 5.7215008761258294e-05} +{"train_loss": 0.0021720652002841234, "global_step": 32682, "epoch": 274, "lr": 5.72128164321581e-05} +{"train_loss": 0.002120907185599208, "global_step": 32683, "epoch": 274, "lr": 5.7210624088896294e-05} +{"train_loss": 0.0016427823575213552, "global_step": 32684, "epoch": 274, "lr": 5.72084317314772e-05} +{"train_loss": 0.0023601665161550045, "global_step": 32685, "epoch": 274, "lr": 5.7206239359905114e-05} +{"train_loss": 0.003481789492070675, "global_step": 32686, "epoch": 274, "lr": 5.7204046974184345e-05} +{"train_loss": 0.0020894641056656837, "global_step": 32687, "epoch": 274, "lr": 5.7201854574319204e-05} +{"train_loss": 0.0016583588439971209, "global_step": 32688, "epoch": 274, "lr": 5.719966216031399e-05} +{"train_loss": 0.002324436791241169, "global_step": 32689, "epoch": 274, "lr": 5.7197469732173014e-05} +{"train_loss": 0.004744209349155426, "global_step": 32690, "epoch": 274, "lr": 5.719527728990057e-05} +{"train_loss": 0.0022428270895034075, "global_step": 32691, "epoch": 274, "lr": 5.7193084833500975e-05} +{"train_loss": 0.0035542165860533714, "global_step": 32692, "epoch": 274, "lr": 5.719089236297852e-05} +{"train_loss": 0.003603799734264612, "global_step": 32693, "epoch": 274, "lr": 5.718869987833752e-05} +{"train_loss": 0.0013476336607709527, "global_step": 32694, "epoch": 274, "lr": 5.718650737958227e-05} +{"train_loss": 0.0029228096827864647, "global_step": 32695, "epoch": 274, "lr": 5.718431486671709e-05} +{"train_loss": 0.002379362704232335, "global_step": 32696, "epoch": 274, "lr": 5.7182122339746266e-05} +{"train_loss": 0.002941076410934329, "global_step": 32697, "epoch": 274, "lr": 5.717992979867411e-05} +{"train_loss": 0.0028627265710383654, "global_step": 32698, "epoch": 274, "lr": 5.7177737243504945e-05} +{"train_loss": 0.0037109265103936195, "global_step": 32699, "epoch": 274, "lr": 5.717554467424304e-05} +{"train_loss": 0.0021945456974208355, "global_step": 32700, "epoch": 274, "lr": 5.7173352090892726e-05} +{"train_loss": 0.0016662038397043943, "global_step": 32701, "epoch": 274, "lr": 5.717115949345833e-05} +{"train_loss": 0.0039932942017912865, "global_step": 32702, "epoch": 274, "lr": 5.7168966881944096e-05} +{"train_loss": 0.002482609124854207, "global_step": 32703, "epoch": 274, "lr": 5.7166774256354364e-05} +{"train_loss": 0.0019221438560634851, "global_step": 32704, "epoch": 274, "lr": 5.7164581616693436e-05} +{"train_loss": 0.002952505135908723, "global_step": 32705, "epoch": 274, "lr": 5.7162388962965616e-05} +{"train_loss": 0.0036541868466883898, "global_step": 32706, "epoch": 274, "lr": 5.7160196295175225e-05} +{"train_loss": 0.00294422241859138, "global_step": 32707, "epoch": 274, "lr": 5.715800361332654e-05} +{"train_loss": 0.002612408949062228, "global_step": 32708, "epoch": 274, "lr": 5.715581091742389e-05} +{"train_loss": 0.002803883980959654, "global_step": 32709, "epoch": 274, "lr": 5.715361820747156e-05} +{"train_loss": 0.0038272985257208347, "global_step": 32710, "epoch": 274, "lr": 5.715142548347386e-05} +{"train_loss": 0.0024628073442727327, "global_step": 32711, "epoch": 274, "lr": 5.714923274543511e-05} +{"train_loss": 0.002140423748642206, "global_step": 32712, "epoch": 274, "lr": 5.714703999335961e-05} +{"train_loss": 0.002661805134266615, "global_step": 32713, "epoch": 274, "lr": 5.7144847227251666e-05} +{"train_loss": 0.003118206514045596, "global_step": 32714, "epoch": 274, "lr": 5.714265444711556e-05} +{"train_loss": 0.0026380952913314104, "global_step": 32715, "epoch": 274, "lr": 5.714046165295562e-05} +{"train_loss": 0.0026476597413420677, "global_step": 32716, "epoch": 274, "lr": 5.7138268844776154e-05} +{"train_loss": 0.003447671653702855, "global_step": 32717, "epoch": 274, "lr": 5.7136076022581456e-05} +{"train_loss": 0.002942792372778058, "global_step": 32718, "epoch": 274, "lr": 5.713388318637582e-05} +{"train_loss": 0.0034587581176310778, "global_step": 32719, "epoch": 274, "lr": 5.713169033616359e-05} +{"train_loss": 0.0025280523113906384, "global_step": 32720, "epoch": 274, "lr": 5.7129497471949046e-05} +{"train_loss": 0.001984158530831337, "global_step": 32721, "epoch": 274, "lr": 5.712730459373649e-05} +{"train_loss": 0.004587549716234207, "global_step": 32722, "epoch": 274, "lr": 5.712511170153022e-05} +{"train_loss": 0.00398657051846385, "global_step": 32723, "epoch": 274, "lr": 5.712291879533456e-05} +{"train_loss": 0.002862816186379172, "global_step": 32724, "epoch": 274, "lr": 5.7120725875153816e-05, "val_loss": 0.010438119992613792} +{"train_loss": 0.0031207676511257887, "global_step": 32725, "epoch": 275, "lr": 5.711853294099227e-05} +{"train_loss": 0.003185250097885728, "global_step": 32726, "epoch": 275, "lr": 5.7116339992854284e-05} +{"train_loss": 0.0034956559538841248, "global_step": 32727, "epoch": 275, "lr": 5.711414703074409e-05} +{"train_loss": 0.0025221621617674828, "global_step": 32728, "epoch": 275, "lr": 5.711195405466605e-05} +{"train_loss": 0.002371804090216756, "global_step": 32729, "epoch": 275, "lr": 5.710976106462443e-05} +{"train_loss": 0.004195427522063255, "global_step": 32730, "epoch": 275, "lr": 5.710756806062356e-05} +{"train_loss": 0.002807286335155368, "global_step": 32731, "epoch": 275, "lr": 5.710537504266774e-05} +{"train_loss": 0.0022419195156544447, "global_step": 32732, "epoch": 275, "lr": 5.710318201076129e-05} +{"train_loss": 0.004036166239529848, "global_step": 32733, "epoch": 275, "lr": 5.7100988964908486e-05} +{"train_loss": 0.0024236117023974657, "global_step": 32734, "epoch": 275, "lr": 5.709879590511365e-05} +{"train_loss": 0.003210092429071665, "global_step": 32735, "epoch": 275, "lr": 5.709660283138108e-05} +{"train_loss": 0.002720864722505212, "global_step": 32736, "epoch": 275, "lr": 5.709440974371509e-05} +{"train_loss": 0.0021941885352134705, "global_step": 32737, "epoch": 275, "lr": 5.709221664212e-05} +{"train_loss": 0.0017660121666267514, "global_step": 32738, "epoch": 275, "lr": 5.709002352660009e-05} +{"train_loss": 0.002917646896094084, "global_step": 32739, "epoch": 275, "lr": 5.708783039715967e-05} +{"train_loss": 0.003619556315243244, "global_step": 32740, "epoch": 275, "lr": 5.708563725380306e-05} +{"train_loss": 0.0020711307879537344, "global_step": 32741, "epoch": 275, "lr": 5.708344409653455e-05} +{"train_loss": 0.002715331967920065, "global_step": 32742, "epoch": 275, "lr": 5.7081250925358465e-05} +{"train_loss": 0.0030882691498845816, "global_step": 32743, "epoch": 275, "lr": 5.70790577402791e-05} +{"train_loss": 0.0021386598236858845, "global_step": 32744, "epoch": 275, "lr": 5.7076864541300746e-05} +{"train_loss": 0.0036831528414040804, "global_step": 32745, "epoch": 275, "lr": 5.7074671328427754e-05} +{"train_loss": 0.0029126922599971294, "global_step": 32746, "epoch": 275, "lr": 5.707247810166437e-05} +{"train_loss": 0.003379560075700283, "global_step": 32747, "epoch": 275, "lr": 5.707028486101496e-05} +{"train_loss": 0.0033280965872108936, "global_step": 32748, "epoch": 275, "lr": 5.7068091606483775e-05} +{"train_loss": 0.003625929355621338, "global_step": 32749, "epoch": 275, "lr": 5.7065898338075155e-05} +{"train_loss": 0.0029513160698115826, "global_step": 32750, "epoch": 275, "lr": 5.706370505579339e-05} +{"train_loss": 0.002878767205402255, "global_step": 32751, "epoch": 275, "lr": 5.706151175964283e-05} +{"train_loss": 0.002375207608565688, "global_step": 32752, "epoch": 275, "lr": 5.705931844962771e-05} +{"train_loss": 0.0018433525692671537, "global_step": 32753, "epoch": 275, "lr": 5.705712512575239e-05} +{"train_loss": 0.0031387072522193193, "global_step": 32754, "epoch": 275, "lr": 5.705493178802115e-05} +{"train_loss": 0.001976424129679799, "global_step": 32755, "epoch": 275, "lr": 5.70527384364383e-05} +{"train_loss": 0.003738060826435685, "global_step": 32756, "epoch": 275, "lr": 5.705054507100816e-05} +{"train_loss": 0.00339301023632288, "global_step": 32757, "epoch": 275, "lr": 5.7048351691735027e-05} +{"train_loss": 0.0028248471207916737, "global_step": 32758, "epoch": 275, "lr": 5.704615829862321e-05} +{"train_loss": 0.002024717628955841, "global_step": 32759, "epoch": 275, "lr": 5.7043964891677004e-05} +{"train_loss": 0.0033589843660593033, "global_step": 32760, "epoch": 275, "lr": 5.704177147090074e-05} +{"train_loss": 0.002357796998694539, "global_step": 32761, "epoch": 275, "lr": 5.7039578036298704e-05} +{"train_loss": 0.0026596568059176207, "global_step": 32762, "epoch": 275, "lr": 5.703738458787521e-05} +{"train_loss": 0.002402789192274213, "global_step": 32763, "epoch": 275, "lr": 5.703519112563456e-05} +{"train_loss": 0.003153969068080187, "global_step": 32764, "epoch": 275, "lr": 5.7032997649581076e-05} +{"train_loss": 0.0017353887669742107, "global_step": 32765, "epoch": 275, "lr": 5.703080415971904e-05} +{"train_loss": 0.0017106614541262388, "global_step": 32766, "epoch": 275, "lr": 5.702861065605277e-05} +{"train_loss": 0.0037364503368735313, "global_step": 32767, "epoch": 275, "lr": 5.702641713858658e-05} +{"train_loss": 0.0018442372092977166, "global_step": 32768, "epoch": 275, "lr": 5.7024223607324756e-05} +{"train_loss": 0.0026408834382891655, "global_step": 32769, "epoch": 275, "lr": 5.702203006227164e-05} +{"train_loss": 0.0030781098175793886, "global_step": 32770, "epoch": 275, "lr": 5.701983650343151e-05} +{"train_loss": 0.0017589613562449813, "global_step": 32771, "epoch": 275, "lr": 5.701764293080869e-05} +{"train_loss": 0.002509783022105694, "global_step": 32772, "epoch": 275, "lr": 5.701544934440744e-05} +{"train_loss": 0.0018398030661046505, "global_step": 32773, "epoch": 275, "lr": 5.701325574423214e-05} +{"train_loss": 0.003743744920939207, "global_step": 32774, "epoch": 275, "lr": 5.7011062130287054e-05} +{"train_loss": 0.002356654964387417, "global_step": 32775, "epoch": 275, "lr": 5.70088685025765e-05} +{"train_loss": 0.0019591667223721743, "global_step": 32776, "epoch": 275, "lr": 5.700667486110478e-05} +{"train_loss": 0.003113254439085722, "global_step": 32777, "epoch": 275, "lr": 5.7004481205876204e-05} +{"train_loss": 0.0017161881551146507, "global_step": 32778, "epoch": 275, "lr": 5.700228753689507e-05} +{"train_loss": 0.0039850021712481976, "global_step": 32779, "epoch": 275, "lr": 5.70000938541657e-05} +{"train_loss": 0.0024167662486433983, "global_step": 32780, "epoch": 275, "lr": 5.6997900157692387e-05} +{"train_loss": 0.0024599507451057434, "global_step": 32781, "epoch": 275, "lr": 5.6995706447479446e-05} +{"train_loss": 0.0037375236861407757, "global_step": 32782, "epoch": 275, "lr": 5.6993512723531195e-05} +{"train_loss": 0.0025763637386262417, "global_step": 32783, "epoch": 275, "lr": 5.6991318985851924e-05} +{"train_loss": 0.002728137420490384, "global_step": 32784, "epoch": 275, "lr": 5.698912523444594e-05} +{"train_loss": 0.0037318177055567503, "global_step": 32785, "epoch": 275, "lr": 5.698693146931755e-05} +{"train_loss": 0.0024336494971066713, "global_step": 32786, "epoch": 275, "lr": 5.698473769047107e-05} +{"train_loss": 0.0023867820855230093, "global_step": 32787, "epoch": 275, "lr": 5.69825438979108e-05} +{"train_loss": 0.0022508883848786354, "global_step": 32788, "epoch": 275, "lr": 5.698035009164107e-05} +{"train_loss": 0.001468351692892611, "global_step": 32789, "epoch": 275, "lr": 5.697815627166614e-05} +{"train_loss": 0.00302332965657115, "global_step": 32790, "epoch": 275, "lr": 5.697596243799036e-05} +{"train_loss": 0.003718954510986805, "global_step": 32791, "epoch": 275, "lr": 5.697376859061803e-05} +{"train_loss": 0.0028437958098948, "global_step": 32792, "epoch": 275, "lr": 5.697157472955343e-05} +{"train_loss": 0.0026005159597843885, "global_step": 32793, "epoch": 275, "lr": 5.696938085480091e-05} +{"train_loss": 0.0038459617644548416, "global_step": 32794, "epoch": 275, "lr": 5.696718696636475e-05} +{"train_loss": 0.0026827072724699974, "global_step": 32795, "epoch": 275, "lr": 5.696499306424926e-05} +{"train_loss": 0.0044342814944684505, "global_step": 32796, "epoch": 275, "lr": 5.696279914845875e-05} +{"train_loss": 0.002827440155670047, "global_step": 32797, "epoch": 275, "lr": 5.6960605218997534e-05} +{"train_loss": 0.0030032722279429436, "global_step": 32798, "epoch": 275, "lr": 5.6958411275869907e-05} +{"train_loss": 0.0015366945881396532, "global_step": 32799, "epoch": 275, "lr": 5.695621731908017e-05} +{"train_loss": 0.0018453147495165467, "global_step": 32800, "epoch": 275, "lr": 5.695402334863267e-05} +{"train_loss": 0.003296991577371955, "global_step": 32801, "epoch": 275, "lr": 5.695182936453167e-05} +{"train_loss": 0.0037231245078146458, "global_step": 32802, "epoch": 275, "lr": 5.6949635366781506e-05} +{"train_loss": 0.0020674262195825577, "global_step": 32803, "epoch": 275, "lr": 5.6947441355386465e-05} +{"train_loss": 0.0024577330332249403, "global_step": 32804, "epoch": 275, "lr": 5.694524733035087e-05} +{"train_loss": 0.0016033750725910068, "global_step": 32805, "epoch": 275, "lr": 5.6943053291679026e-05} +{"train_loss": 0.0024746463168412447, "global_step": 32806, "epoch": 275, "lr": 5.6940859239375235e-05} +{"train_loss": 0.002740593859925866, "global_step": 32807, "epoch": 275, "lr": 5.693866517344381e-05} +{"train_loss": 0.002651984803378582, "global_step": 32808, "epoch": 275, "lr": 5.6936471093889055e-05} +{"train_loss": 0.0021348195150494576, "global_step": 32809, "epoch": 275, "lr": 5.6934277000715274e-05} +{"train_loss": 0.0023474430199712515, "global_step": 32810, "epoch": 275, "lr": 5.69320828939268e-05} +{"train_loss": 0.00373432831838727, "global_step": 32811, "epoch": 275, "lr": 5.6929888773527895e-05} +{"train_loss": 0.0033776636701077223, "global_step": 32812, "epoch": 275, "lr": 5.692769463952291e-05} +{"train_loss": 0.0028046169318258762, "global_step": 32813, "epoch": 275, "lr": 5.692550049191614e-05} +{"train_loss": 0.0024462619330734015, "global_step": 32814, "epoch": 275, "lr": 5.692330633071189e-05} +{"train_loss": 0.004780666437000036, "global_step": 32815, "epoch": 275, "lr": 5.692111215591447e-05} +{"train_loss": 0.0035819094628095627, "global_step": 32816, "epoch": 275, "lr": 5.6918917967528176e-05} +{"train_loss": 0.002948537701740861, "global_step": 32817, "epoch": 275, "lr": 5.691672376555732e-05} +{"train_loss": 0.002597753657028079, "global_step": 32818, "epoch": 275, "lr": 5.6914529550006226e-05} +{"train_loss": 0.0017417562194168568, "global_step": 32819, "epoch": 275, "lr": 5.69123353208792e-05} +{"train_loss": 0.0024443946313112974, "global_step": 32820, "epoch": 275, "lr": 5.691014107818053e-05} +{"train_loss": 0.0028416092973202467, "global_step": 32821, "epoch": 275, "lr": 5.6907946821914534e-05} +{"train_loss": 0.0037418100982904434, "global_step": 32822, "epoch": 275, "lr": 5.690575255208552e-05} +{"train_loss": 0.0011172896483913064, "global_step": 32823, "epoch": 275, "lr": 5.690355826869781e-05} +{"train_loss": 0.0014030992751941085, "global_step": 32824, "epoch": 275, "lr": 5.690136397175569e-05} +{"train_loss": 0.005495437886565924, "global_step": 32825, "epoch": 275, "lr": 5.6899169661263485e-05} +{"train_loss": 0.002371936570852995, "global_step": 32826, "epoch": 275, "lr": 5.689697533722551e-05} +{"train_loss": 0.005244164727628231, "global_step": 32827, "epoch": 275, "lr": 5.6894780999646046e-05} +{"train_loss": 0.002078352030366659, "global_step": 32828, "epoch": 275, "lr": 5.689258664852942e-05} +{"train_loss": 0.002885658759623766, "global_step": 32829, "epoch": 275, "lr": 5.689039228387993e-05} +{"train_loss": 0.0026463759131729603, "global_step": 32830, "epoch": 275, "lr": 5.68881979057019e-05} +{"train_loss": 0.0021389268804341555, "global_step": 32831, "epoch": 275, "lr": 5.688600351399963e-05} +{"train_loss": 0.0018298061331734061, "global_step": 32832, "epoch": 275, "lr": 5.688380910877743e-05} +{"train_loss": 0.0033584285993129015, "global_step": 32833, "epoch": 275, "lr": 5.68816146900396e-05} +{"train_loss": 0.00223357742652297, "global_step": 32834, "epoch": 275, "lr": 5.687942025779045e-05} +{"train_loss": 0.0023134120274335146, "global_step": 32835, "epoch": 275, "lr": 5.68772258120343e-05} +{"train_loss": 0.004601803608238697, "global_step": 32836, "epoch": 275, "lr": 5.687503135277545e-05} +{"train_loss": 0.0020500400569289923, "global_step": 32837, "epoch": 275, "lr": 5.687283688001821e-05} +{"train_loss": 0.003354019718244672, "global_step": 32838, "epoch": 275, "lr": 5.687064239376688e-05} +{"train_loss": 0.0017775380983948708, "global_step": 32839, "epoch": 275, "lr": 5.686844789402579e-05} +{"train_loss": 0.0031604240648448467, "global_step": 32840, "epoch": 275, "lr": 5.6866253380799226e-05} +{"train_loss": 0.0031772961374372244, "global_step": 32841, "epoch": 275, "lr": 5.686405885409152e-05} +{"train_loss": 0.0034667435102164745, "global_step": 32842, "epoch": 275, "lr": 5.686186431390697e-05} +{"train_loss": 0.002796516598186636, "global_step": 32843, "epoch": 275, "lr": 5.685966976024987e-05, "val_loss": 0.019243232905864716, "train_action_mse_error": 4.955957047059201e-05} +{"train_loss": 0.0031970699783414602, "global_step": 32844, "epoch": 276, "lr": 5.685747519312454e-05} +{"train_loss": 0.002305247588083148, "global_step": 32845, "epoch": 276, "lr": 5.6855280612535314e-05} +{"train_loss": 0.002651225309818983, "global_step": 32846, "epoch": 276, "lr": 5.685308601848645e-05} +{"train_loss": 0.0043586562387645245, "global_step": 32847, "epoch": 276, "lr": 5.685089141098229e-05} +{"train_loss": 0.00195758743211627, "global_step": 32848, "epoch": 276, "lr": 5.6848696790027134e-05} +{"train_loss": 0.0019905592780560255, "global_step": 32849, "epoch": 276, "lr": 5.68465021556253e-05} +{"train_loss": 0.004550255835056305, "global_step": 32850, "epoch": 276, "lr": 5.684430750778109e-05} +{"train_loss": 0.003381097689270973, "global_step": 32851, "epoch": 276, "lr": 5.684211284649882e-05} +{"train_loss": 0.0019902403000742197, "global_step": 32852, "epoch": 276, "lr": 5.683991817178278e-05} +{"train_loss": 0.0015302525134757161, "global_step": 32853, "epoch": 276, "lr": 5.6837723483637296e-05} +{"train_loss": 0.0028127857949584723, "global_step": 32854, "epoch": 276, "lr": 5.6835528782066684e-05} +{"train_loss": 0.0021252185106277466, "global_step": 32855, "epoch": 276, "lr": 5.683333406707523e-05} +{"train_loss": 0.0018605986842885613, "global_step": 32856, "epoch": 276, "lr": 5.683113933866724e-05} +{"train_loss": 0.002788034500554204, "global_step": 32857, "epoch": 276, "lr": 5.6828944596847056e-05} +{"train_loss": 0.0018339954549446702, "global_step": 32858, "epoch": 276, "lr": 5.682674984161897e-05} +{"train_loss": 0.0036288953851908445, "global_step": 32859, "epoch": 276, "lr": 5.6824555072987286e-05} +{"train_loss": 0.0021432461217045784, "global_step": 32860, "epoch": 276, "lr": 5.682236029095631e-05} +{"train_loss": 0.0025069541297852993, "global_step": 32861, "epoch": 276, "lr": 5.682016549553037e-05} +{"train_loss": 0.0024875595699995756, "global_step": 32862, "epoch": 276, "lr": 5.681797068671375e-05} +{"train_loss": 0.002616365673020482, "global_step": 32863, "epoch": 276, "lr": 5.681577586451078e-05} +{"train_loss": 0.001422314322553575, "global_step": 32864, "epoch": 276, "lr": 5.681358102892578e-05} +{"train_loss": 0.003131232690066099, "global_step": 32865, "epoch": 276, "lr": 5.6811386179963023e-05} +{"train_loss": 0.002353811403736472, "global_step": 32866, "epoch": 276, "lr": 5.680919131762683e-05} +{"train_loss": 0.0022935138549655676, "global_step": 32867, "epoch": 276, "lr": 5.680699644192153e-05} +{"train_loss": 0.0022565037943422794, "global_step": 32868, "epoch": 276, "lr": 5.6804801552851416e-05} +{"train_loss": 0.0019991544540971518, "global_step": 32869, "epoch": 276, "lr": 5.68026066504208e-05} +{"train_loss": 0.004657383542507887, "global_step": 32870, "epoch": 276, "lr": 5.6800411734633995e-05} +{"train_loss": 0.0019840714521706104, "global_step": 32871, "epoch": 276, "lr": 5.679821680549531e-05} +{"train_loss": 0.004270618781447411, "global_step": 32872, "epoch": 276, "lr": 5.679602186300904e-05} +{"train_loss": 0.00315428851172328, "global_step": 32873, "epoch": 276, "lr": 5.679382690717951e-05} +{"train_loss": 0.0018487602937966585, "global_step": 32874, "epoch": 276, "lr": 5.679163193801105e-05} +{"train_loss": 0.0028850273229181767, "global_step": 32875, "epoch": 276, "lr": 5.6789436955507924e-05} +{"train_loss": 0.001539541524834931, "global_step": 32876, "epoch": 276, "lr": 5.6787241959674475e-05} +{"train_loss": 0.004156226757913828, "global_step": 32877, "epoch": 276, "lr": 5.6785046950514995e-05} +{"train_loss": 0.0029150056652724743, "global_step": 32878, "epoch": 276, "lr": 5.67828519280338e-05} +{"train_loss": 0.0017833998426795006, "global_step": 32879, "epoch": 276, "lr": 5.678065689223521e-05} +{"train_loss": 0.003801044775173068, "global_step": 32880, "epoch": 276, "lr": 5.677846184312351e-05} +{"train_loss": 0.0021267361007630825, "global_step": 32881, "epoch": 276, "lr": 5.6776266780703025e-05} +{"train_loss": 0.004143132362514734, "global_step": 32882, "epoch": 276, "lr": 5.677407170497807e-05} +{"train_loss": 0.002626216970384121, "global_step": 32883, "epoch": 276, "lr": 5.677187661595296e-05} +{"train_loss": 0.002817474538460374, "global_step": 32884, "epoch": 276, "lr": 5.676968151363198e-05} +{"train_loss": 0.0038290254306048155, "global_step": 32885, "epoch": 276, "lr": 5.676748639801946e-05} +{"train_loss": 0.0015529139200225472, "global_step": 32886, "epoch": 276, "lr": 5.676529126911969e-05} +{"train_loss": 0.00208765990100801, "global_step": 32887, "epoch": 276, "lr": 5.6763096126936996e-05} +{"train_loss": 0.002803204348310828, "global_step": 32888, "epoch": 276, "lr": 5.6760900971475695e-05} +{"train_loss": 0.003853499423712492, "global_step": 32889, "epoch": 276, "lr": 5.6758705802740086e-05} +{"train_loss": 0.0016944909002631903, "global_step": 32890, "epoch": 276, "lr": 5.675651062073448e-05} +{"train_loss": 0.0018419264815747738, "global_step": 32891, "epoch": 276, "lr": 5.675431542546318e-05} +{"train_loss": 0.0033848537132143974, "global_step": 32892, "epoch": 276, "lr": 5.675212021693051e-05} +{"train_loss": 0.0035621647257357836, "global_step": 32893, "epoch": 276, "lr": 5.674992499514077e-05} +{"train_loss": 0.001792378956452012, "global_step": 32894, "epoch": 276, "lr": 5.674772976009828e-05} +{"train_loss": 0.0017146490281447768, "global_step": 32895, "epoch": 276, "lr": 5.674553451180734e-05} +{"train_loss": 0.002554983599111438, "global_step": 32896, "epoch": 276, "lr": 5.6743339250272265e-05} +{"train_loss": 0.0026371360290795565, "global_step": 32897, "epoch": 276, "lr": 5.6741143975497354e-05} +{"train_loss": 0.003978810738772154, "global_step": 32898, "epoch": 276, "lr": 5.673894868748694e-05} +{"train_loss": 0.0027008792385458946, "global_step": 32899, "epoch": 276, "lr": 5.673675338624531e-05} +{"train_loss": 0.002529195509850979, "global_step": 32900, "epoch": 276, "lr": 5.673455807177679e-05} +{"train_loss": 0.0036903677973896265, "global_step": 32901, "epoch": 276, "lr": 5.6732362744085696e-05} +{"train_loss": 0.003049092832952738, "global_step": 32902, "epoch": 276, "lr": 5.6730167403176317e-05} +{"train_loss": 0.0030983383767306805, "global_step": 32903, "epoch": 276, "lr": 5.672797204905297e-05} +{"train_loss": 0.0033482308499515057, "global_step": 32904, "epoch": 276, "lr": 5.6725776681719966e-05} +{"train_loss": 0.0021958646830171347, "global_step": 32905, "epoch": 276, "lr": 5.672358130118161e-05} +{"train_loss": 0.003921402618288994, "global_step": 32906, "epoch": 276, "lr": 5.672138590744223e-05} +{"train_loss": 0.0026702743489295244, "global_step": 32907, "epoch": 276, "lr": 5.671919050050613e-05} +{"train_loss": 0.002877812599763274, "global_step": 32908, "epoch": 276, "lr": 5.6716995080377625e-05} +{"train_loss": 0.0033557135611772537, "global_step": 32909, "epoch": 276, "lr": 5.6714799647061e-05} +{"train_loss": 0.002352986019104719, "global_step": 32910, "epoch": 276, "lr": 5.671260420056059e-05} +{"train_loss": 0.004075657110661268, "global_step": 32911, "epoch": 276, "lr": 5.6710408740880705e-05} +{"train_loss": 0.0035308420192450285, "global_step": 32912, "epoch": 276, "lr": 5.670821326802564e-05} +{"train_loss": 0.003981608431786299, "global_step": 32913, "epoch": 276, "lr": 5.670601778199972e-05} +{"train_loss": 0.001995102735236287, "global_step": 32914, "epoch": 276, "lr": 5.670382228280726e-05} +{"train_loss": 0.0025785034522414207, "global_step": 32915, "epoch": 276, "lr": 5.670162677045255e-05} +{"train_loss": 0.002244114177301526, "global_step": 32916, "epoch": 276, "lr": 5.669943124493992e-05} +{"train_loss": 0.0027966448105871677, "global_step": 32917, "epoch": 276, "lr": 5.669723570627367e-05} +{"train_loss": 0.0026367404498159885, "global_step": 32918, "epoch": 276, "lr": 5.66950401544581e-05} +{"train_loss": 0.0028889677487313747, "global_step": 32919, "epoch": 276, "lr": 5.6692844589497554e-05} +{"train_loss": 0.003201068611815572, "global_step": 32920, "epoch": 276, "lr": 5.66906490113963e-05} +{"train_loss": 0.0036336658522486687, "global_step": 32921, "epoch": 276, "lr": 5.668845342015868e-05} +{"train_loss": 0.003493565134704113, "global_step": 32922, "epoch": 276, "lr": 5.6686257815789e-05} +{"train_loss": 0.002139101969078183, "global_step": 32923, "epoch": 276, "lr": 5.668406219829156e-05} +{"train_loss": 0.00514681963250041, "global_step": 32924, "epoch": 276, "lr": 5.668186656767069e-05} +{"train_loss": 0.0020472053438425064, "global_step": 32925, "epoch": 276, "lr": 5.667967092393068e-05} +{"train_loss": 0.0028860378079116344, "global_step": 32926, "epoch": 276, "lr": 5.667747526707588e-05} +{"train_loss": 0.004304226487874985, "global_step": 32927, "epoch": 276, "lr": 5.667527959711053e-05} +{"train_loss": 0.0028071796987205744, "global_step": 32928, "epoch": 276, "lr": 5.667308391403899e-05} +{"train_loss": 0.0025383811444044113, "global_step": 32929, "epoch": 276, "lr": 5.667088821786557e-05} +{"train_loss": 0.005650477018207312, "global_step": 32930, "epoch": 276, "lr": 5.666869250859458e-05} +{"train_loss": 0.00238140020519495, "global_step": 32931, "epoch": 276, "lr": 5.6666496786230306e-05} +{"train_loss": 0.004376545082777739, "global_step": 32932, "epoch": 276, "lr": 5.666430105077709e-05} +{"train_loss": 0.0038109689485281706, "global_step": 32933, "epoch": 276, "lr": 5.6662105302239246e-05} +{"train_loss": 0.001963087823241949, "global_step": 32934, "epoch": 276, "lr": 5.665990954062105e-05} +{"train_loss": 0.004089033231139183, "global_step": 32935, "epoch": 276, "lr": 5.665771376592683e-05} +{"train_loss": 0.004142652731388807, "global_step": 32936, "epoch": 276, "lr": 5.665551797816091e-05} +{"train_loss": 0.001920692971907556, "global_step": 32937, "epoch": 276, "lr": 5.665332217732758e-05} +{"train_loss": 0.002319920575246215, "global_step": 32938, "epoch": 276, "lr": 5.665112636343117e-05} +{"train_loss": 0.003974625840783119, "global_step": 32939, "epoch": 276, "lr": 5.664893053647599e-05} +{"train_loss": 0.0034348780754953623, "global_step": 32940, "epoch": 276, "lr": 5.664673469646634e-05} +{"train_loss": 0.002354165306314826, "global_step": 32941, "epoch": 276, "lr": 5.6644538843406535e-05} +{"train_loss": 0.00246477616019547, "global_step": 32942, "epoch": 276, "lr": 5.664234297730089e-05} +{"train_loss": 0.0029992463532835245, "global_step": 32943, "epoch": 276, "lr": 5.6640147098153706e-05} +{"train_loss": 0.002958850469440222, "global_step": 32944, "epoch": 276, "lr": 5.663795120596931e-05} +{"train_loss": 0.004559866618365049, "global_step": 32945, "epoch": 276, "lr": 5.6635755300752025e-05} +{"train_loss": 0.003654666943475604, "global_step": 32946, "epoch": 276, "lr": 5.663355938250612e-05} +{"train_loss": 0.0035524312406778336, "global_step": 32947, "epoch": 276, "lr": 5.663136345123593e-05} +{"train_loss": 0.003266238374635577, "global_step": 32948, "epoch": 276, "lr": 5.662916750694577e-05} +{"train_loss": 0.003794766031205654, "global_step": 32949, "epoch": 276, "lr": 5.662697154963995e-05} +{"train_loss": 0.003851719433441758, "global_step": 32950, "epoch": 276, "lr": 5.6624775579322775e-05} +{"train_loss": 0.002315158722922206, "global_step": 32951, "epoch": 276, "lr": 5.662257959599857e-05} +{"train_loss": 0.0016435441793873906, "global_step": 32952, "epoch": 276, "lr": 5.6620383599671636e-05} +{"train_loss": 0.003490254981443286, "global_step": 32953, "epoch": 276, "lr": 5.661818759034627e-05} +{"train_loss": 0.0017141413409262896, "global_step": 32954, "epoch": 276, "lr": 5.661599156802682e-05} +{"train_loss": 0.0026551864575594664, "global_step": 32955, "epoch": 276, "lr": 5.661379553271756e-05} +{"train_loss": 0.002054797951132059, "global_step": 32956, "epoch": 276, "lr": 5.661159948442283e-05} +{"train_loss": 0.003065043594688177, "global_step": 32957, "epoch": 276, "lr": 5.6609403423146925e-05} +{"train_loss": 0.00443702656775713, "global_step": 32958, "epoch": 276, "lr": 5.6607207348894174e-05} +{"train_loss": 0.004847162403166294, "global_step": 32959, "epoch": 276, "lr": 5.660501126166886e-05} +{"train_loss": 0.002205784199759364, "global_step": 32960, "epoch": 276, "lr": 5.660281516147533e-05} +{"train_loss": 0.0019350543152540922, "global_step": 32961, "epoch": 276, "lr": 5.660061904831786e-05} +{"train_loss": 0.0029236761620268226, "global_step": 32962, "epoch": 276, "lr": 5.659842292220079e-05, "val_loss": 0.018756426870822906} +{"train_loss": 0.0029162175487726927, "global_step": 32963, "epoch": 277, "lr": 5.659622678312843e-05} +{"train_loss": 0.004315617959946394, "global_step": 32964, "epoch": 277, "lr": 5.6594030631105075e-05} +{"train_loss": 0.001611670246347785, "global_step": 32965, "epoch": 277, "lr": 5.659183446613504e-05} +{"train_loss": 0.0027958506252616644, "global_step": 32966, "epoch": 277, "lr": 5.658963828822265e-05} +{"train_loss": 0.00443269032984972, "global_step": 32967, "epoch": 277, "lr": 5.65874420973722e-05} +{"train_loss": 0.0026271925307810307, "global_step": 32968, "epoch": 277, "lr": 5.658524589358801e-05} +{"train_loss": 0.00414669094607234, "global_step": 32969, "epoch": 277, "lr": 5.65830496768744e-05} +{"train_loss": 0.003616367932409048, "global_step": 32970, "epoch": 277, "lr": 5.6580853447235684e-05} +{"train_loss": 0.0038926182314753532, "global_step": 32971, "epoch": 277, "lr": 5.657865720467616e-05} +{"train_loss": 0.004089154303073883, "global_step": 32972, "epoch": 277, "lr": 5.657646094920013e-05} +{"train_loss": 0.0024931852240115404, "global_step": 32973, "epoch": 277, "lr": 5.657426468081194e-05} +{"train_loss": 0.00293233641423285, "global_step": 32974, "epoch": 277, "lr": 5.6572068399515875e-05} +{"train_loss": 0.0018843888537958264, "global_step": 32975, "epoch": 277, "lr": 5.656987210531626e-05} +{"train_loss": 0.0030106392223387957, "global_step": 32976, "epoch": 277, "lr": 5.656767579821739e-05} +{"train_loss": 0.004844640381634235, "global_step": 32977, "epoch": 277, "lr": 5.6565479478223616e-05} +{"train_loss": 0.0018948878860101104, "global_step": 32978, "epoch": 277, "lr": 5.6563283145339207e-05} +{"train_loss": 0.003231026465073228, "global_step": 32979, "epoch": 277, "lr": 5.65610867995685e-05} +{"train_loss": 0.003234160365536809, "global_step": 32980, "epoch": 277, "lr": 5.655889044091579e-05} +{"train_loss": 0.002467015292495489, "global_step": 32981, "epoch": 277, "lr": 5.65566940693854e-05} +{"train_loss": 0.0023315860889852047, "global_step": 32982, "epoch": 277, "lr": 5.655449768498165e-05} +{"train_loss": 0.002278041560202837, "global_step": 32983, "epoch": 277, "lr": 5.655230128770884e-05} +{"train_loss": 0.004203903488814831, "global_step": 32984, "epoch": 277, "lr": 5.655010487757129e-05} +{"train_loss": 0.0033483963925391436, "global_step": 32985, "epoch": 277, "lr": 5.6547908454573306e-05} +{"train_loss": 0.002022824017331004, "global_step": 32986, "epoch": 277, "lr": 5.65457120187192e-05} +{"train_loss": 0.004415611736476421, "global_step": 32987, "epoch": 277, "lr": 5.6543515570013295e-05} +{"train_loss": 0.00223708082921803, "global_step": 32988, "epoch": 277, "lr": 5.654131910845989e-05} +{"train_loss": 0.005391019396483898, "global_step": 32989, "epoch": 277, "lr": 5.65391226340633e-05} +{"train_loss": 0.0025317780673503876, "global_step": 32990, "epoch": 277, "lr": 5.653692614682785e-05} +{"train_loss": 0.0030201999470591545, "global_step": 32991, "epoch": 277, "lr": 5.653472964675783e-05} +{"train_loss": 0.003296779002994299, "global_step": 32992, "epoch": 277, "lr": 5.653253313385758e-05} +{"train_loss": 0.0034917043522000313, "global_step": 32993, "epoch": 277, "lr": 5.65303366081314e-05} +{"train_loss": 0.0029414675664156675, "global_step": 32994, "epoch": 277, "lr": 5.65281400695836e-05} +{"train_loss": 0.0019716082606464624, "global_step": 32995, "epoch": 277, "lr": 5.6525943518218496e-05} +{"train_loss": 0.002696421230211854, "global_step": 32996, "epoch": 277, "lr": 5.652374695404039e-05} +{"train_loss": 0.0018989742966368794, "global_step": 32997, "epoch": 277, "lr": 5.6521550377053614e-05} +{"train_loss": 0.0014790653949603438, "global_step": 32998, "epoch": 277, "lr": 5.6519353787262465e-05} +{"train_loss": 0.0026568893808871508, "global_step": 32999, "epoch": 277, "lr": 5.6517157184671266e-05} +{"train_loss": 0.0023600566200912, "global_step": 33000, "epoch": 277, "lr": 5.651496056928431e-05} +{"train_loss": 0.005545494146645069, "global_step": 33001, "epoch": 277, "lr": 5.651276394110594e-05} +{"train_loss": 0.0026623858138918877, "global_step": 33002, "epoch": 277, "lr": 5.651056730014045e-05} +{"train_loss": 0.00506398594006896, "global_step": 33003, "epoch": 277, "lr": 5.650837064639216e-05} +{"train_loss": 0.0026726718060672283, "global_step": 33004, "epoch": 277, "lr": 5.6506173979865376e-05} +{"train_loss": 0.002292961347848177, "global_step": 33005, "epoch": 277, "lr": 5.6503977300564414e-05} +{"train_loss": 0.0030971388332545757, "global_step": 33006, "epoch": 277, "lr": 5.650178060849358e-05} +{"train_loss": 0.0020228340290486813, "global_step": 33007, "epoch": 277, "lr": 5.6499583903657205e-05} +{"train_loss": 0.003922104369848967, "global_step": 33008, "epoch": 277, "lr": 5.64973871860596e-05} +{"train_loss": 0.0041640144772827625, "global_step": 33009, "epoch": 277, "lr": 5.649519045570506e-05} +{"train_loss": 0.003930024802684784, "global_step": 33010, "epoch": 277, "lr": 5.64929937125979e-05} +{"train_loss": 0.0035492100287228823, "global_step": 33011, "epoch": 277, "lr": 5.6490796956742444e-05} +{"train_loss": 0.003723026718944311, "global_step": 33012, "epoch": 277, "lr": 5.6488600188143006e-05} +{"train_loss": 0.001826483174227178, "global_step": 33013, "epoch": 277, "lr": 5.648640340680389e-05} +{"train_loss": 0.003388376208022237, "global_step": 33014, "epoch": 277, "lr": 5.648420661272943e-05} +{"train_loss": 0.003627465572208166, "global_step": 33015, "epoch": 277, "lr": 5.648200980592391e-05} +{"train_loss": 0.002779716392979026, "global_step": 33016, "epoch": 277, "lr": 5.647981298639165e-05} +{"train_loss": 0.002375129610300064, "global_step": 33017, "epoch": 277, "lr": 5.6477616154136984e-05} +{"train_loss": 0.002864823443815112, "global_step": 33018, "epoch": 277, "lr": 5.647541930916419e-05} +{"train_loss": 0.004177519120275974, "global_step": 33019, "epoch": 277, "lr": 5.6473222451477614e-05} +{"train_loss": 0.0031675028149038553, "global_step": 33020, "epoch": 277, "lr": 5.647102558108156e-05} +{"train_loss": 0.0024355680216103792, "global_step": 33021, "epoch": 277, "lr": 5.6468828697980336e-05} +{"train_loss": 0.002699279459193349, "global_step": 33022, "epoch": 277, "lr": 5.646663180217825e-05} +{"train_loss": 0.0034825133625417948, "global_step": 33023, "epoch": 277, "lr": 5.646443489367963e-05} +{"train_loss": 0.0031618322245776653, "global_step": 33024, "epoch": 277, "lr": 5.6462237972488783e-05} +{"train_loss": 0.0023571744095534086, "global_step": 33025, "epoch": 277, "lr": 5.646004103861002e-05} +{"train_loss": 0.002785598626360297, "global_step": 33026, "epoch": 277, "lr": 5.645784409204766e-05} +{"train_loss": 0.0016969398129731417, "global_step": 33027, "epoch": 277, "lr": 5.645564713280602e-05} +{"train_loss": 0.003269878914579749, "global_step": 33028, "epoch": 277, "lr": 5.645345016088941e-05} +{"train_loss": 0.0025444738566875458, "global_step": 33029, "epoch": 277, "lr": 5.645125317630212e-05} +{"train_loss": 0.0034043907653540373, "global_step": 33030, "epoch": 277, "lr": 5.6449056179048495e-05} +{"train_loss": 0.00203520804643631, "global_step": 33031, "epoch": 277, "lr": 5.644685916913284e-05} +{"train_loss": 0.002205448690801859, "global_step": 33032, "epoch": 277, "lr": 5.6444662146559456e-05} +{"train_loss": 0.0018634365405887365, "global_step": 33033, "epoch": 277, "lr": 5.6442465111332674e-05} +{"train_loss": 0.002811257727444172, "global_step": 33034, "epoch": 277, "lr": 5.64402680634568e-05} +{"train_loss": 0.002967964392155409, "global_step": 33035, "epoch": 277, "lr": 5.6438071002936146e-05} +{"train_loss": 0.002845444018021226, "global_step": 33036, "epoch": 277, "lr": 5.643587392977503e-05} +{"train_loss": 0.002116413554176688, "global_step": 33037, "epoch": 277, "lr": 5.643367684397774e-05} +{"train_loss": 0.002012212062254548, "global_step": 33038, "epoch": 277, "lr": 5.6431479745548635e-05} +{"train_loss": 0.0015207723481580615, "global_step": 33039, "epoch": 277, "lr": 5.642928263449201e-05} +{"train_loss": 0.0035351947881281376, "global_step": 33040, "epoch": 277, "lr": 5.642708551081217e-05} +{"train_loss": 0.00306869950145483, "global_step": 33041, "epoch": 277, "lr": 5.642488837451343e-05} +{"train_loss": 0.0027950708754360676, "global_step": 33042, "epoch": 277, "lr": 5.642269122560011e-05} +{"train_loss": 0.003910609055310488, "global_step": 33043, "epoch": 277, "lr": 5.642049406407652e-05} +{"train_loss": 0.0023680999875068665, "global_step": 33044, "epoch": 277, "lr": 5.641829688994699e-05} +{"train_loss": 0.00433475011959672, "global_step": 33045, "epoch": 277, "lr": 5.641609970321582e-05} +{"train_loss": 0.001612913329154253, "global_step": 33046, "epoch": 277, "lr": 5.641390250388731e-05} +{"train_loss": 0.0030570896342396736, "global_step": 33047, "epoch": 277, "lr": 5.6411705291965787e-05} +{"train_loss": 0.0024398276582360268, "global_step": 33048, "epoch": 277, "lr": 5.640950806745556e-05} +{"train_loss": 0.004098591394722462, "global_step": 33049, "epoch": 277, "lr": 5.640731083036096e-05} +{"train_loss": 0.002230837708339095, "global_step": 33050, "epoch": 277, "lr": 5.6405113580686285e-05} +{"train_loss": 0.0022166920825839043, "global_step": 33051, "epoch": 277, "lr": 5.640291631843586e-05} +{"train_loss": 0.0016393171390518546, "global_step": 33052, "epoch": 277, "lr": 5.640071904361399e-05} +{"train_loss": 0.0038103703409433365, "global_step": 33053, "epoch": 277, "lr": 5.639852175622499e-05} +{"train_loss": 0.0020957228261977434, "global_step": 33054, "epoch": 277, "lr": 5.6396324456273175e-05} +{"train_loss": 0.001922604744322598, "global_step": 33055, "epoch": 277, "lr": 5.639412714376287e-05} +{"train_loss": 0.003965605050325394, "global_step": 33056, "epoch": 277, "lr": 5.6391929818698364e-05} +{"train_loss": 0.0018412636127322912, "global_step": 33057, "epoch": 277, "lr": 5.638973248108399e-05} +{"train_loss": 0.002077283337712288, "global_step": 33058, "epoch": 277, "lr": 5.638753513092407e-05} +{"train_loss": 0.001958737848326564, "global_step": 33059, "epoch": 277, "lr": 5.63853377682229e-05} +{"train_loss": 0.002806358737871051, "global_step": 33060, "epoch": 277, "lr": 5.63831403929848e-05} +{"train_loss": 0.002154428046196699, "global_step": 33061, "epoch": 277, "lr": 5.6380943005214096e-05} +{"train_loss": 0.0014746306696906686, "global_step": 33062, "epoch": 277, "lr": 5.6378745604915084e-05} +{"train_loss": 0.002484165132045746, "global_step": 33063, "epoch": 277, "lr": 5.637654819209208e-05} +{"train_loss": 0.003473060205578804, "global_step": 33064, "epoch": 277, "lr": 5.637435076674942e-05} +{"train_loss": 0.0023864395916461945, "global_step": 33065, "epoch": 277, "lr": 5.6372153328891394e-05} +{"train_loss": 0.0021889423951506615, "global_step": 33066, "epoch": 277, "lr": 5.6369955878522326e-05} +{"train_loss": 0.0021829032339155674, "global_step": 33067, "epoch": 277, "lr": 5.636775841564653e-05} +{"train_loss": 0.0034608470741659403, "global_step": 33068, "epoch": 277, "lr": 5.636556094026832e-05} +{"train_loss": 0.0015897980192676187, "global_step": 33069, "epoch": 277, "lr": 5.636336345239202e-05} +{"train_loss": 0.0021950204391032457, "global_step": 33070, "epoch": 277, "lr": 5.6361165952021925e-05} +{"train_loss": 0.0025399483274668455, "global_step": 33071, "epoch": 277, "lr": 5.635896843916235e-05} +{"train_loss": 0.0020860068034380674, "global_step": 33072, "epoch": 277, "lr": 5.635677091381763e-05} +{"train_loss": 0.002642896259203553, "global_step": 33073, "epoch": 277, "lr": 5.635457337599208e-05} +{"train_loss": 0.0019546980038285255, "global_step": 33074, "epoch": 277, "lr": 5.635237582569e-05} +{"train_loss": 0.0032150812912732363, "global_step": 33075, "epoch": 277, "lr": 5.63501782629157e-05} +{"train_loss": 0.002135658171027899, "global_step": 33076, "epoch": 277, "lr": 5.6347980687673505e-05} +{"train_loss": 0.0023881986271589994, "global_step": 33077, "epoch": 277, "lr": 5.634578309996774e-05} +{"train_loss": 0.003394505474716425, "global_step": 33078, "epoch": 277, "lr": 5.63435854998027e-05} +{"train_loss": 0.003240722231566906, "global_step": 33079, "epoch": 277, "lr": 5.634138788718271e-05} +{"train_loss": 0.0017654768889769912, "global_step": 33080, "epoch": 277, "lr": 5.633919026211207e-05} +{"train_loss": 0.0028467436571519415, "global_step": 33081, "epoch": 277, "lr": 5.633699262459512e-05, "val_loss": 0.017356514930725098} +{"train_loss": 0.0015222270740196109, "global_step": 33082, "epoch": 278, "lr": 5.633479497463616e-05} +{"train_loss": 0.0015339447418227792, "global_step": 33083, "epoch": 278, "lr": 5.633259731223952e-05} +{"train_loss": 0.0022412685211747885, "global_step": 33084, "epoch": 278, "lr": 5.633039963740948e-05} +{"train_loss": 0.002386318286880851, "global_step": 33085, "epoch": 278, "lr": 5.632820195015038e-05} +{"train_loss": 0.002286020200699568, "global_step": 33086, "epoch": 278, "lr": 5.6326004250466524e-05} +{"train_loss": 0.0014313909923657775, "global_step": 33087, "epoch": 278, "lr": 5.6323806538362256e-05} +{"train_loss": 0.002556778024882078, "global_step": 33088, "epoch": 278, "lr": 5.6321608813841854e-05} +{"train_loss": 0.003009266220033169, "global_step": 33089, "epoch": 278, "lr": 5.631941107690967e-05} +{"train_loss": 0.0018193653086200356, "global_step": 33090, "epoch": 278, "lr": 5.6317213327569974e-05} +{"train_loss": 0.0017645939951762557, "global_step": 33091, "epoch": 278, "lr": 5.631501556582711e-05} +{"train_loss": 0.001463918830268085, "global_step": 33092, "epoch": 278, "lr": 5.631281779168539e-05} +{"train_loss": 0.00261725764721632, "global_step": 33093, "epoch": 278, "lr": 5.631062000514913e-05} +{"train_loss": 0.002230148296803236, "global_step": 33094, "epoch": 278, "lr": 5.630842220622263e-05} +{"train_loss": 0.0015161033952608705, "global_step": 33095, "epoch": 278, "lr": 5.6306224394910225e-05} +{"train_loss": 0.0012815076624974608, "global_step": 33096, "epoch": 278, "lr": 5.630402657121623e-05} +{"train_loss": 0.0032474289182573557, "global_step": 33097, "epoch": 278, "lr": 5.6301828735144943e-05} +{"train_loss": 0.0015478850109502673, "global_step": 33098, "epoch": 278, "lr": 5.6299630886700694e-05} +{"train_loss": 0.0021595675498247147, "global_step": 33099, "epoch": 278, "lr": 5.629743302588779e-05} +{"train_loss": 0.003995074424892664, "global_step": 33100, "epoch": 278, "lr": 5.6295235152710545e-05} +{"train_loss": 0.002728265943005681, "global_step": 33101, "epoch": 278, "lr": 5.629303726717328e-05} +{"train_loss": 0.002950015477836132, "global_step": 33102, "epoch": 278, "lr": 5.62908393692803e-05} +{"train_loss": 0.0021542184986174107, "global_step": 33103, "epoch": 278, "lr": 5.628864145903594e-05} +{"train_loss": 0.002048769500106573, "global_step": 33104, "epoch": 278, "lr": 5.62864435364445e-05} +{"train_loss": 0.0026556220836937428, "global_step": 33105, "epoch": 278, "lr": 5.628424560151031e-05} +{"train_loss": 0.0016862854827195406, "global_step": 33106, "epoch": 278, "lr": 5.628204765423766e-05} +{"train_loss": 0.0016276348615065217, "global_step": 33107, "epoch": 278, "lr": 5.627984969463089e-05} +{"train_loss": 0.0021103546023368835, "global_step": 33108, "epoch": 278, "lr": 5.6277651722694315e-05} +{"train_loss": 0.0023096047807484865, "global_step": 33109, "epoch": 278, "lr": 5.627545373843223e-05} +{"train_loss": 0.004155272152274847, "global_step": 33110, "epoch": 278, "lr": 5.6273255741848964e-05} +{"train_loss": 0.0024990502279251814, "global_step": 33111, "epoch": 278, "lr": 5.627105773294883e-05} +{"train_loss": 0.0015008681220933795, "global_step": 33112, "epoch": 278, "lr": 5.6268859711736145e-05} +{"train_loss": 0.004965490661561489, "global_step": 33113, "epoch": 278, "lr": 5.6266661678215216e-05} +{"train_loss": 0.0028444738127291203, "global_step": 33114, "epoch": 278, "lr": 5.626446363239038e-05} +{"train_loss": 0.002943111816421151, "global_step": 33115, "epoch": 278, "lr": 5.6262265574265925e-05} +{"train_loss": 0.002856370760127902, "global_step": 33116, "epoch": 278, "lr": 5.6260067503846195e-05} +{"train_loss": 0.0015974806156009436, "global_step": 33117, "epoch": 278, "lr": 5.625786942113548e-05} +{"train_loss": 0.002614703495055437, "global_step": 33118, "epoch": 278, "lr": 5.6255671326138115e-05} +{"train_loss": 0.002565813483670354, "global_step": 33119, "epoch": 278, "lr": 5.62534732188584e-05} +{"train_loss": 0.0033810066524893045, "global_step": 33120, "epoch": 278, "lr": 5.625127509930066e-05} +{"train_loss": 0.0021698004566133022, "global_step": 33121, "epoch": 278, "lr": 5.6249076967469205e-05} +{"train_loss": 0.0030202537309378386, "global_step": 33122, "epoch": 278, "lr": 5.624687882336836e-05} +{"train_loss": 0.0032008567359298468, "global_step": 33123, "epoch": 278, "lr": 5.6244680667002436e-05} +{"train_loss": 0.0025817505083978176, "global_step": 33124, "epoch": 278, "lr": 5.624248249837575e-05} +{"train_loss": 0.0020205327309668064, "global_step": 33125, "epoch": 278, "lr": 5.624028431749261e-05} +{"train_loss": 0.001899066031910479, "global_step": 33126, "epoch": 278, "lr": 5.623808612435735e-05} +{"train_loss": 0.001465211040340364, "global_step": 33127, "epoch": 278, "lr": 5.6235887918974274e-05} +{"train_loss": 0.001667106058448553, "global_step": 33128, "epoch": 278, "lr": 5.623368970134769e-05} +{"train_loss": 0.002933849347755313, "global_step": 33129, "epoch": 278, "lr": 5.6231491471481924e-05} +{"train_loss": 0.003786469344049692, "global_step": 33130, "epoch": 278, "lr": 5.6229293229381294e-05} +{"train_loss": 0.0026738003361970186, "global_step": 33131, "epoch": 278, "lr": 5.622709497505011e-05} +{"train_loss": 0.0014787300024181604, "global_step": 33132, "epoch": 278, "lr": 5.622489670849268e-05} +{"train_loss": 0.004192722961306572, "global_step": 33133, "epoch": 278, "lr": 5.622269842971335e-05} +{"train_loss": 0.002742607379332185, "global_step": 33134, "epoch": 278, "lr": 5.622050013871641e-05} +{"train_loss": 0.00458853505551815, "global_step": 33135, "epoch": 278, "lr": 5.621830183550617e-05} +{"train_loss": 0.00228608725592494, "global_step": 33136, "epoch": 278, "lr": 5.621610352008696e-05} +{"train_loss": 0.004485166631639004, "global_step": 33137, "epoch": 278, "lr": 5.62139051924631e-05} +{"train_loss": 0.002025688998401165, "global_step": 33138, "epoch": 278, "lr": 5.6211706852638915e-05} +{"train_loss": 0.002049001632258296, "global_step": 33139, "epoch": 278, "lr": 5.6209508500618704e-05} +{"train_loss": 0.003370799822732806, "global_step": 33140, "epoch": 278, "lr": 5.620731013640676e-05} +{"train_loss": 0.0031459571328014135, "global_step": 33141, "epoch": 278, "lr": 5.620511176000746e-05} +{"train_loss": 0.0016166630666702986, "global_step": 33142, "epoch": 278, "lr": 5.620291337142506e-05} +{"train_loss": 0.002586736809462309, "global_step": 33143, "epoch": 278, "lr": 5.6200714970663915e-05} +{"train_loss": 0.0036634858697652817, "global_step": 33144, "epoch": 278, "lr": 5.619851655772832e-05} +{"train_loss": 0.0017779988702386618, "global_step": 33145, "epoch": 278, "lr": 5.61963181326226e-05} +{"train_loss": 0.003174177138134837, "global_step": 33146, "epoch": 278, "lr": 5.61941196953511e-05} +{"train_loss": 0.002167781349271536, "global_step": 33147, "epoch": 278, "lr": 5.619192124591808e-05} +{"train_loss": 0.002018590457737446, "global_step": 33148, "epoch": 278, "lr": 5.618972278432788e-05} +{"train_loss": 0.0024296818301081657, "global_step": 33149, "epoch": 278, "lr": 5.618752431058484e-05} +{"train_loss": 0.002422284334897995, "global_step": 33150, "epoch": 278, "lr": 5.618532582469323e-05} +{"train_loss": 0.0018587945960462093, "global_step": 33151, "epoch": 278, "lr": 5.618312732665742e-05} +{"train_loss": 0.0037821591831743717, "global_step": 33152, "epoch": 278, "lr": 5.6180928816481695e-05} +{"train_loss": 0.0022207326255738735, "global_step": 33153, "epoch": 278, "lr": 5.617873029417037e-05} +{"train_loss": 0.0017191871302202344, "global_step": 33154, "epoch": 278, "lr": 5.6176531759727755e-05} +{"train_loss": 0.0021871288772672415, "global_step": 33155, "epoch": 278, "lr": 5.6174333213158205e-05} +{"train_loss": 0.00448609609156847, "global_step": 33156, "epoch": 278, "lr": 5.6172134654465994e-05} +{"train_loss": 0.004273696336895227, "global_step": 33157, "epoch": 278, "lr": 5.616993608365546e-05} +{"train_loss": 0.0022353520616889, "global_step": 33158, "epoch": 278, "lr": 5.6167737500730935e-05} +{"train_loss": 0.0024561702739447355, "global_step": 33159, "epoch": 278, "lr": 5.616553890569669e-05} +{"train_loss": 0.0015815825900062919, "global_step": 33160, "epoch": 278, "lr": 5.6163340298557085e-05} +{"train_loss": 0.002476748079061508, "global_step": 33161, "epoch": 278, "lr": 5.616114167931641e-05} +{"train_loss": 0.0033386037684977055, "global_step": 33162, "epoch": 278, "lr": 5.6158943047978995e-05} +{"train_loss": 0.002204801421612501, "global_step": 33163, "epoch": 278, "lr": 5.615674440454915e-05} +{"train_loss": 0.002652313094586134, "global_step": 33164, "epoch": 278, "lr": 5.61545457490312e-05} +{"train_loss": 0.005250321701169014, "global_step": 33165, "epoch": 278, "lr": 5.6152347081429454e-05} +{"train_loss": 0.001903847442008555, "global_step": 33166, "epoch": 278, "lr": 5.6150148401748236e-05} +{"train_loss": 0.0029805318918079138, "global_step": 33167, "epoch": 278, "lr": 5.614794970999185e-05} +{"train_loss": 0.0028278373647481203, "global_step": 33168, "epoch": 278, "lr": 5.614575100616464e-05} +{"train_loss": 0.003166806185618043, "global_step": 33169, "epoch": 278, "lr": 5.6143552290270884e-05} +{"train_loss": 0.003263398539274931, "global_step": 33170, "epoch": 278, "lr": 5.614135356231491e-05} +{"train_loss": 0.0032883959356695414, "global_step": 33171, "epoch": 278, "lr": 5.6139154822301076e-05} +{"train_loss": 0.0018820237601175904, "global_step": 33172, "epoch": 278, "lr": 5.613695607023365e-05} +{"train_loss": 0.003141117515042424, "global_step": 33173, "epoch": 278, "lr": 5.613475730611697e-05} +{"train_loss": 0.0029164522420614958, "global_step": 33174, "epoch": 278, "lr": 5.613255852995535e-05} +{"train_loss": 0.00272696977481246, "global_step": 33175, "epoch": 278, "lr": 5.613035974175309e-05} +{"train_loss": 0.0029412207659333944, "global_step": 33176, "epoch": 278, "lr": 5.612816094151454e-05} +{"train_loss": 0.0022625853307545185, "global_step": 33177, "epoch": 278, "lr": 5.6125962129244014e-05} +{"train_loss": 0.0034409326035529375, "global_step": 33178, "epoch": 278, "lr": 5.61237633049458e-05} +{"train_loss": 0.002795581007376313, "global_step": 33179, "epoch": 278, "lr": 5.6121564468624234e-05} +{"train_loss": 0.002596452832221985, "global_step": 33180, "epoch": 278, "lr": 5.6119365620283624e-05} +{"train_loss": 0.005240662023425102, "global_step": 33181, "epoch": 278, "lr": 5.61171667599283e-05} +{"train_loss": 0.001867984770797193, "global_step": 33182, "epoch": 278, "lr": 5.611496788756256e-05} +{"train_loss": 0.004984068218618631, "global_step": 33183, "epoch": 278, "lr": 5.6112769003190744e-05} +{"train_loss": 0.002282527042552829, "global_step": 33184, "epoch": 278, "lr": 5.611057010681716e-05} +{"train_loss": 0.001615105546079576, "global_step": 33185, "epoch": 278, "lr": 5.610837119844612e-05} +{"train_loss": 0.003414959879592061, "global_step": 33186, "epoch": 278, "lr": 5.6106172278081945e-05} +{"train_loss": 0.0033086470793932676, "global_step": 33187, "epoch": 278, "lr": 5.610397334572897e-05} +{"train_loss": 0.0037699800450354815, "global_step": 33188, "epoch": 278, "lr": 5.610177440139147e-05} +{"train_loss": 0.0017970851622521877, "global_step": 33189, "epoch": 278, "lr": 5.609957544507381e-05} +{"train_loss": 0.0042569516226649284, "global_step": 33190, "epoch": 278, "lr": 5.6097376476780274e-05} +{"train_loss": 0.0035428907722234726, "global_step": 33191, "epoch": 278, "lr": 5.60951774965152e-05} +{"train_loss": 0.0019350219517946243, "global_step": 33192, "epoch": 278, "lr": 5.609297850428288e-05} +{"train_loss": 0.0031408178620040417, "global_step": 33193, "epoch": 278, "lr": 5.609077950008765e-05} +{"train_loss": 0.0036250855773687363, "global_step": 33194, "epoch": 278, "lr": 5.608858048393384e-05} +{"train_loss": 0.0016923026414588094, "global_step": 33195, "epoch": 278, "lr": 5.6086381455825746e-05} +{"train_loss": 0.003484765300527215, "global_step": 33196, "epoch": 278, "lr": 5.608418241576769e-05} +{"train_loss": 0.0036846394650638103, "global_step": 33197, "epoch": 278, "lr": 5.608198336376399e-05} +{"train_loss": 0.0019831277895718813, "global_step": 33198, "epoch": 278, "lr": 5.6079784299818975e-05} +{"train_loss": 0.004102291073650122, "global_step": 33199, "epoch": 278, "lr": 5.6077585223936936e-05} +{"train_loss": 0.0026812640472683087, "global_step": 33200, "epoch": 278, "lr": 5.607538613612222e-05, "val_loss": 0.03137081861495972} +{"train_loss": 0.004998990800231695, "global_step": 33201, "epoch": 279, "lr": 5.6073187036379125e-05} +{"train_loss": 0.003083461197093129, "global_step": 33202, "epoch": 279, "lr": 5.6070987924711984e-05} +{"train_loss": 0.003406540025025606, "global_step": 33203, "epoch": 279, "lr": 5.6068788801125105e-05} +{"train_loss": 0.0025283072609454393, "global_step": 33204, "epoch": 279, "lr": 5.60665896656228e-05} +{"train_loss": 0.0016752762021496892, "global_step": 33205, "epoch": 279, "lr": 5.6064390518209394e-05} +{"train_loss": 0.004105296917259693, "global_step": 33206, "epoch": 279, "lr": 5.606219135888922e-05} +{"train_loss": 0.0029108142480254173, "global_step": 33207, "epoch": 279, "lr": 5.605999218766657e-05} +{"train_loss": 0.0028687326703220606, "global_step": 33208, "epoch": 279, "lr": 5.605779300454579e-05} +{"train_loss": 0.00356034142896533, "global_step": 33209, "epoch": 279, "lr": 5.605559380953116e-05} +{"train_loss": 0.0017541298875585198, "global_step": 33210, "epoch": 279, "lr": 5.6053394602627016e-05} +{"train_loss": 0.002280574291944504, "global_step": 33211, "epoch": 279, "lr": 5.60511953838377e-05} +{"train_loss": 0.002772758947685361, "global_step": 33212, "epoch": 279, "lr": 5.604899615316749e-05} +{"train_loss": 0.0030304347164928913, "global_step": 33213, "epoch": 279, "lr": 5.604679691062072e-05} +{"train_loss": 0.0019714038353413343, "global_step": 33214, "epoch": 279, "lr": 5.604459765620172e-05} +{"train_loss": 0.0029097965452820063, "global_step": 33215, "epoch": 279, "lr": 5.604239838991481e-05} +{"train_loss": 0.002172306180000305, "global_step": 33216, "epoch": 279, "lr": 5.604019911176428e-05} +{"train_loss": 0.002341205021366477, "global_step": 33217, "epoch": 279, "lr": 5.603799982175446e-05} +{"train_loss": 0.0022753316443413496, "global_step": 33218, "epoch": 279, "lr": 5.603580051988968e-05} +{"train_loss": 0.0029776240698993206, "global_step": 33219, "epoch": 279, "lr": 5.603360120617424e-05} +{"train_loss": 0.0018792679766193032, "global_step": 33220, "epoch": 279, "lr": 5.603140188061247e-05} +{"train_loss": 0.0030943320598453283, "global_step": 33221, "epoch": 279, "lr": 5.60292025432087e-05} +{"train_loss": 0.001760434010066092, "global_step": 33222, "epoch": 279, "lr": 5.602700319396723e-05} +{"train_loss": 0.0018711944576352835, "global_step": 33223, "epoch": 279, "lr": 5.602480383289239e-05} +{"train_loss": 0.0028221444226801395, "global_step": 33224, "epoch": 279, "lr": 5.6022604459988485e-05} +{"train_loss": 0.003697939682751894, "global_step": 33225, "epoch": 279, "lr": 5.602040507525983e-05} +{"train_loss": 0.0028063091449439526, "global_step": 33226, "epoch": 279, "lr": 5.601820567871077e-05} +{"train_loss": 0.0015349102905020118, "global_step": 33227, "epoch": 279, "lr": 5.60160062703456e-05} +{"train_loss": 0.004440117161720991, "global_step": 33228, "epoch": 279, "lr": 5.6013806850168635e-05} +{"train_loss": 0.004387731663882732, "global_step": 33229, "epoch": 279, "lr": 5.601160741818422e-05} +{"train_loss": 0.003401795867830515, "global_step": 33230, "epoch": 279, "lr": 5.600940797439664e-05} +{"train_loss": 0.0025523179210722446, "global_step": 33231, "epoch": 279, "lr": 5.600720851881024e-05} +{"train_loss": 0.002117492724210024, "global_step": 33232, "epoch": 279, "lr": 5.6005009051429314e-05} +{"train_loss": 0.001904693664982915, "global_step": 33233, "epoch": 279, "lr": 5.600280957225821e-05} +{"train_loss": 0.002902962965890765, "global_step": 33234, "epoch": 279, "lr": 5.600061008130122e-05} +{"train_loss": 0.004301318433135748, "global_step": 33235, "epoch": 279, "lr": 5.599841057856268e-05} +{"train_loss": 0.0013365320628508925, "global_step": 33236, "epoch": 279, "lr": 5.5996211064046886e-05} +{"train_loss": 0.0014921554829925299, "global_step": 33237, "epoch": 279, "lr": 5.5994011537758196e-05} +{"train_loss": 0.0019498005276545882, "global_step": 33238, "epoch": 279, "lr": 5.599181199970088e-05} +{"train_loss": 0.0016657127998769283, "global_step": 33239, "epoch": 279, "lr": 5.59896124498793e-05} +{"train_loss": 0.0012998376041650772, "global_step": 33240, "epoch": 279, "lr": 5.598741288829776e-05} +{"train_loss": 0.0023762909695506096, "global_step": 33241, "epoch": 279, "lr": 5.598521331496056e-05} +{"train_loss": 0.0015570477116852999, "global_step": 33242, "epoch": 279, "lr": 5.5983013729872046e-05} +{"train_loss": 0.0032494948245584965, "global_step": 33243, "epoch": 279, "lr": 5.598081413303651e-05} +{"train_loss": 0.0034083668142557144, "global_step": 33244, "epoch": 279, "lr": 5.5978614524458296e-05} +{"train_loss": 0.002186375670135021, "global_step": 33245, "epoch": 279, "lr": 5.5976414904141704e-05} +{"train_loss": 0.0033944628667086363, "global_step": 33246, "epoch": 279, "lr": 5.597421527209107e-05} +{"train_loss": 0.0027449587360024452, "global_step": 33247, "epoch": 279, "lr": 5.597201562831069e-05} +{"train_loss": 0.0026438089553266764, "global_step": 33248, "epoch": 279, "lr": 5.5969815972804894e-05} +{"train_loss": 0.0017850296571850777, "global_step": 33249, "epoch": 279, "lr": 5.5967616305578005e-05} +{"train_loss": 0.0030987258069217205, "global_step": 33250, "epoch": 279, "lr": 5.5965416626634346e-05} +{"train_loss": 0.001560876495204866, "global_step": 33251, "epoch": 279, "lr": 5.596321693597823e-05} +{"train_loss": 0.0021589219104498625, "global_step": 33252, "epoch": 279, "lr": 5.5961017233613965e-05} +{"train_loss": 0.0014577544061467052, "global_step": 33253, "epoch": 279, "lr": 5.595881751954588e-05} +{"train_loss": 0.0019305748865008354, "global_step": 33254, "epoch": 279, "lr": 5.59566177937783e-05} +{"train_loss": 0.0024729010183364153, "global_step": 33255, "epoch": 279, "lr": 5.5954418056315524e-05} +{"train_loss": 0.005236566532403231, "global_step": 33256, "epoch": 279, "lr": 5.5952218307161894e-05} +{"train_loss": 0.0028927018865942955, "global_step": 33257, "epoch": 279, "lr": 5.595001854632172e-05} +{"train_loss": 0.0016353706596419215, "global_step": 33258, "epoch": 279, "lr": 5.5947818773799335e-05} +{"train_loss": 0.002916979370638728, "global_step": 33259, "epoch": 279, "lr": 5.5945618989599025e-05} +{"train_loss": 0.0033384019043296576, "global_step": 33260, "epoch": 279, "lr": 5.594341919372513e-05} +{"train_loss": 0.0027484570164233446, "global_step": 33261, "epoch": 279, "lr": 5.594121938618196e-05} +{"train_loss": 0.0011689616367220879, "global_step": 33262, "epoch": 279, "lr": 5.593901956697385e-05} +{"train_loss": 0.002230668207630515, "global_step": 33263, "epoch": 279, "lr": 5.593681973610511e-05} +{"train_loss": 0.0023213715758174658, "global_step": 33264, "epoch": 279, "lr": 5.5934619893580054e-05} +{"train_loss": 0.002050870331004262, "global_step": 33265, "epoch": 279, "lr": 5.593242003940301e-05} +{"train_loss": 0.0034429035149514675, "global_step": 33266, "epoch": 279, "lr": 5.59302201735783e-05} +{"train_loss": 0.0015721748350188136, "global_step": 33267, "epoch": 279, "lr": 5.592802029611021e-05} +{"train_loss": 0.0022473479621112347, "global_step": 33268, "epoch": 279, "lr": 5.5925820407003106e-05} +{"train_loss": 0.0012941703898832202, "global_step": 33269, "epoch": 279, "lr": 5.5923620506261275e-05} +{"train_loss": 0.0013383707264438272, "global_step": 33270, "epoch": 279, "lr": 5.592142059388905e-05} +{"train_loss": 0.002665832871571183, "global_step": 33271, "epoch": 279, "lr": 5.591922066989077e-05} +{"train_loss": 0.004003132227808237, "global_step": 33272, "epoch": 279, "lr": 5.591702073427072e-05} +{"train_loss": 0.0014982417924329638, "global_step": 33273, "epoch": 279, "lr": 5.591482078703323e-05} +{"train_loss": 0.0024687680415809155, "global_step": 33274, "epoch": 279, "lr": 5.5912620828182614e-05} +{"train_loss": 0.0028348625637590885, "global_step": 33275, "epoch": 279, "lr": 5.59104208577232e-05} +{"train_loss": 0.001351712504401803, "global_step": 33276, "epoch": 279, "lr": 5.590822087565931e-05} +{"train_loss": 0.004347390029579401, "global_step": 33277, "epoch": 279, "lr": 5.590602088199527e-05} +{"train_loss": 0.0030105640180408955, "global_step": 33278, "epoch": 279, "lr": 5.590382087673538e-05} +{"train_loss": 0.0017857711063697934, "global_step": 33279, "epoch": 279, "lr": 5.590162085988396e-05} +{"train_loss": 0.002476736903190613, "global_step": 33280, "epoch": 279, "lr": 5.589942083144535e-05} +{"train_loss": 0.0018778343219310045, "global_step": 33281, "epoch": 279, "lr": 5.589722079142386e-05} +{"train_loss": 0.0017316520679742098, "global_step": 33282, "epoch": 279, "lr": 5.589502073982379e-05} +{"train_loss": 0.0021780782844871283, "global_step": 33283, "epoch": 279, "lr": 5.5892820676649494e-05} +{"train_loss": 0.0032991927582770586, "global_step": 33284, "epoch": 279, "lr": 5.589062060190526e-05} +{"train_loss": 0.0027438488323241472, "global_step": 33285, "epoch": 279, "lr": 5.588842051559543e-05} +{"train_loss": 0.003807945642620325, "global_step": 33286, "epoch": 279, "lr": 5.588622041772431e-05} +{"train_loss": 0.0019157483475282788, "global_step": 33287, "epoch": 279, "lr": 5.5884020308296225e-05} +{"train_loss": 0.002315911464393139, "global_step": 33288, "epoch": 279, "lr": 5.58818201873155e-05} +{"train_loss": 0.0023201312869787216, "global_step": 33289, "epoch": 279, "lr": 5.587962005478645e-05} +{"train_loss": 0.0019036910962313414, "global_step": 33290, "epoch": 279, "lr": 5.58774199107134e-05} +{"train_loss": 0.0020370534621179104, "global_step": 33291, "epoch": 279, "lr": 5.587521975510066e-05} +{"train_loss": 0.002714949194341898, "global_step": 33292, "epoch": 279, "lr": 5.587301958795255e-05} +{"train_loss": 0.0023087242152541876, "global_step": 33293, "epoch": 279, "lr": 5.587081940927339e-05} +{"train_loss": 0.0034404669422656298, "global_step": 33294, "epoch": 279, "lr": 5.5868619219067495e-05} +{"train_loss": 0.003209631657227874, "global_step": 33295, "epoch": 279, "lr": 5.586641901733921e-05} +{"train_loss": 0.00243775499984622, "global_step": 33296, "epoch": 279, "lr": 5.586421880409285e-05} +{"train_loss": 0.002848779084160924, "global_step": 33297, "epoch": 279, "lr": 5.5862018579332695e-05} +{"train_loss": 0.001497914781793952, "global_step": 33298, "epoch": 279, "lr": 5.585981834306311e-05} +{"train_loss": 0.0015368136810138822, "global_step": 33299, "epoch": 279, "lr": 5.585761809528839e-05} +{"train_loss": 0.0018597037997096777, "global_step": 33300, "epoch": 279, "lr": 5.585541783601286e-05} +{"train_loss": 0.005095520988106728, "global_step": 33301, "epoch": 279, "lr": 5.585321756524084e-05} +{"train_loss": 0.003283129772171378, "global_step": 33302, "epoch": 279, "lr": 5.5851017282976656e-05} +{"train_loss": 0.002285993192344904, "global_step": 33303, "epoch": 279, "lr": 5.584881698922463e-05} +{"train_loss": 0.0025502927601337433, "global_step": 33304, "epoch": 279, "lr": 5.584661668398907e-05} +{"train_loss": 0.0015537581639364362, "global_step": 33305, "epoch": 279, "lr": 5.584441636727431e-05} +{"train_loss": 0.002893780590966344, "global_step": 33306, "epoch": 279, "lr": 5.584221603908466e-05} +{"train_loss": 0.003087658667936921, "global_step": 33307, "epoch": 279, "lr": 5.584001569942444e-05} +{"train_loss": 0.0023018489591777325, "global_step": 33308, "epoch": 279, "lr": 5.5837815348297986e-05} +{"train_loss": 0.003160596825182438, "global_step": 33309, "epoch": 279, "lr": 5.58356149857096e-05} +{"train_loss": 0.004667351488023996, "global_step": 33310, "epoch": 279, "lr": 5.5833414611663604e-05} +{"train_loss": 0.003906761761754751, "global_step": 33311, "epoch": 279, "lr": 5.5831214226164316e-05} +{"train_loss": 0.0023525531869381666, "global_step": 33312, "epoch": 279, "lr": 5.582901382921606e-05} +{"train_loss": 0.003315910929813981, "global_step": 33313, "epoch": 279, "lr": 5.582681342082317e-05} +{"train_loss": 0.002888473216444254, "global_step": 33314, "epoch": 279, "lr": 5.582461300098995e-05} +{"train_loss": 0.0023524754215031862, "global_step": 33315, "epoch": 279, "lr": 5.5822412569720725e-05} +{"train_loss": 0.0030246309470385313, "global_step": 33316, "epoch": 279, "lr": 5.58202121270198e-05} +{"train_loss": 0.003389563877135515, "global_step": 33317, "epoch": 279, "lr": 5.581801167289152e-05} +{"train_loss": 0.002184363780543208, "global_step": 33318, "epoch": 279, "lr": 5.5815811207340206e-05} +{"train_loss": 0.0026171779584828296, "global_step": 33319, "epoch": 279, "lr": 5.5813610730370155e-05, "val_loss": 0.01775594986975193} +{"train_loss": 0.001830034889280796, "global_step": 33320, "epoch": 280, "lr": 5.5811410241985705e-05} +{"train_loss": 0.001954836305230856, "global_step": 33321, "epoch": 280, "lr": 5.580920974219119e-05} +{"train_loss": 0.003681190311908722, "global_step": 33322, "epoch": 280, "lr": 5.580700923099089e-05} +{"train_loss": 0.003144435817375779, "global_step": 33323, "epoch": 280, "lr": 5.580480870838916e-05} +{"train_loss": 0.0026834735181182623, "global_step": 33324, "epoch": 280, "lr": 5.580260817439029e-05} +{"train_loss": 0.004320092964917421, "global_step": 33325, "epoch": 280, "lr": 5.580040762899864e-05} +{"train_loss": 0.0019526189425960183, "global_step": 33326, "epoch": 280, "lr": 5.57982070722185e-05} +{"train_loss": 0.0026362487114965916, "global_step": 33327, "epoch": 280, "lr": 5.579600650405421e-05} +{"train_loss": 0.00408749096095562, "global_step": 33328, "epoch": 280, "lr": 5.579380592451007e-05} +{"train_loss": 0.0022408687509596348, "global_step": 33329, "epoch": 280, "lr": 5.5791605333590404e-05} +{"train_loss": 0.0034289564937353134, "global_step": 33330, "epoch": 280, "lr": 5.5789404731299545e-05} +{"train_loss": 0.0023058238439261913, "global_step": 33331, "epoch": 280, "lr": 5.578720411764181e-05} +{"train_loss": 0.0012199915945529938, "global_step": 33332, "epoch": 280, "lr": 5.578500349262151e-05} +{"train_loss": 0.0030751468148082495, "global_step": 33333, "epoch": 280, "lr": 5.578280285624299e-05} +{"train_loss": 0.003019033232703805, "global_step": 33334, "epoch": 280, "lr": 5.578060220851055e-05} +{"train_loss": 0.0024437406100332737, "global_step": 33335, "epoch": 280, "lr": 5.577840154942851e-05} +{"train_loss": 0.0029717765282839537, "global_step": 33336, "epoch": 280, "lr": 5.5776200879001194e-05} +{"train_loss": 0.002314850455150008, "global_step": 33337, "epoch": 280, "lr": 5.577400019723292e-05} +{"train_loss": 0.0032405327074229717, "global_step": 33338, "epoch": 280, "lr": 5.577179950412802e-05} +{"train_loss": 0.003573518944904208, "global_step": 33339, "epoch": 280, "lr": 5.5769598799690816e-05} +{"train_loss": 0.0027590396348387003, "global_step": 33340, "epoch": 280, "lr": 5.576739808392563e-05} +{"train_loss": 0.0020862105302512646, "global_step": 33341, "epoch": 280, "lr": 5.576519735683675e-05} +{"train_loss": 0.0022390156518667936, "global_step": 33342, "epoch": 280, "lr": 5.576299661842853e-05} +{"train_loss": 0.002213540254160762, "global_step": 33343, "epoch": 280, "lr": 5.576079586870527e-05} +{"train_loss": 0.0019081520149484277, "global_step": 33344, "epoch": 280, "lr": 5.5758595107671316e-05} +{"train_loss": 0.0027653106953948736, "global_step": 33345, "epoch": 280, "lr": 5.5756394335330976e-05} +{"train_loss": 0.002904680557549, "global_step": 33346, "epoch": 280, "lr": 5.575419355168858e-05} +{"train_loss": 0.0020179366692900658, "global_step": 33347, "epoch": 280, "lr": 5.5751992756748426e-05} +{"train_loss": 0.003977107349783182, "global_step": 33348, "epoch": 280, "lr": 5.574979195051485e-05} +{"train_loss": 0.0018451677169650793, "global_step": 33349, "epoch": 280, "lr": 5.574759113299217e-05} +{"train_loss": 0.0036103606689721346, "global_step": 33350, "epoch": 280, "lr": 5.574539030418472e-05} +{"train_loss": 0.0040123057551681995, "global_step": 33351, "epoch": 280, "lr": 5.574318946409679e-05} +{"train_loss": 0.0033062950242310762, "global_step": 33352, "epoch": 280, "lr": 5.574098861273274e-05} +{"train_loss": 0.0033158923033624887, "global_step": 33353, "epoch": 280, "lr": 5.5738787750096864e-05} +{"train_loss": 0.0035906690172851086, "global_step": 33354, "epoch": 280, "lr": 5.5736586876193486e-05} +{"train_loss": 0.0034741542767733335, "global_step": 33355, "epoch": 280, "lr": 5.573438599102694e-05} +{"train_loss": 0.0021558678708970547, "global_step": 33356, "epoch": 280, "lr": 5.573218509460154e-05} +{"train_loss": 0.0021488466300070286, "global_step": 33357, "epoch": 280, "lr": 5.5729984186921604e-05} +{"train_loss": 0.002136103343218565, "global_step": 33358, "epoch": 280, "lr": 5.5727783267991465e-05} +{"train_loss": 0.002561204833909869, "global_step": 33359, "epoch": 280, "lr": 5.5725582337815426e-05} +{"train_loss": 0.004074930679053068, "global_step": 33360, "epoch": 280, "lr": 5.572338139639782e-05} +{"train_loss": 0.0028203106485307217, "global_step": 33361, "epoch": 280, "lr": 5.572118044374297e-05} +{"train_loss": 0.002403860678896308, "global_step": 33362, "epoch": 280, "lr": 5.5718979479855185e-05} +{"train_loss": 0.002519928850233555, "global_step": 33363, "epoch": 280, "lr": 5.5716778504738796e-05} +{"train_loss": 0.004089280031621456, "global_step": 33364, "epoch": 280, "lr": 5.5714577518398123e-05} +{"train_loss": 0.0024494812823832035, "global_step": 33365, "epoch": 280, "lr": 5.5712376520837496e-05} +{"train_loss": 0.003082884941250086, "global_step": 33366, "epoch": 280, "lr": 5.5710175512061224e-05} +{"train_loss": 0.0038603409193456173, "global_step": 33367, "epoch": 280, "lr": 5.570797449207363e-05} +{"train_loss": 0.005513160489499569, "global_step": 33368, "epoch": 280, "lr": 5.570577346087904e-05} +{"train_loss": 0.0017645874759182334, "global_step": 33369, "epoch": 280, "lr": 5.5703572418481774e-05} +{"train_loss": 0.0016243549762293696, "global_step": 33370, "epoch": 280, "lr": 5.570137136488614e-05} +{"train_loss": 0.003866114653646946, "global_step": 33371, "epoch": 280, "lr": 5.5699170300096504e-05} +{"train_loss": 0.004566267132759094, "global_step": 33372, "epoch": 280, "lr": 5.569696922411713e-05} +{"train_loss": 0.002592414617538452, "global_step": 33373, "epoch": 280, "lr": 5.5694768136952366e-05} +{"train_loss": 0.002720118034631014, "global_step": 33374, "epoch": 280, "lr": 5.569256703860655e-05} +{"train_loss": 0.0029163190629333258, "global_step": 33375, "epoch": 280, "lr": 5.569036592908397e-05} +{"train_loss": 0.0024587560910731554, "global_step": 33376, "epoch": 280, "lr": 5.568816480838897e-05} +{"train_loss": 0.0036484880838543177, "global_step": 33377, "epoch": 280, "lr": 5.5685963676525866e-05} +{"train_loss": 0.005355509463697672, "global_step": 33378, "epoch": 280, "lr": 5.5683762533498985e-05} +{"train_loss": 0.0024437913671135902, "global_step": 33379, "epoch": 280, "lr": 5.568156137931264e-05} +{"train_loss": 0.002473208587616682, "global_step": 33380, "epoch": 280, "lr": 5.567936021397115e-05} +{"train_loss": 0.003793298499658704, "global_step": 33381, "epoch": 280, "lr": 5.5677159037478854e-05} +{"train_loss": 0.002301289699971676, "global_step": 33382, "epoch": 280, "lr": 5.567495784984005e-05} +{"train_loss": 0.002606661058962345, "global_step": 33383, "epoch": 280, "lr": 5.5672756651059074e-05} +{"train_loss": 0.0023775824811309576, "global_step": 33384, "epoch": 280, "lr": 5.567055544114026e-05} +{"train_loss": 0.0022881466429680586, "global_step": 33385, "epoch": 280, "lr": 5.56683542200879e-05} +{"train_loss": 0.004086424596607685, "global_step": 33386, "epoch": 280, "lr": 5.566615298790634e-05} +{"train_loss": 0.0020502391271293163, "global_step": 33387, "epoch": 280, "lr": 5.56639517445999e-05} +{"train_loss": 0.0030457591637969017, "global_step": 33388, "epoch": 280, "lr": 5.5661750490172884e-05} +{"train_loss": 0.0017954615177586675, "global_step": 33389, "epoch": 280, "lr": 5.5659549224629626e-05} +{"train_loss": 0.0036675105802714825, "global_step": 33390, "epoch": 280, "lr": 5.565734794797446e-05} +{"train_loss": 0.0028962776996195316, "global_step": 33391, "epoch": 280, "lr": 5.565514666021169e-05} +{"train_loss": 0.001924007898196578, "global_step": 33392, "epoch": 280, "lr": 5.5652945361345645e-05} +{"train_loss": 0.003319671843200922, "global_step": 33393, "epoch": 280, "lr": 5.5650744051380645e-05} +{"train_loss": 0.003988821990787983, "global_step": 33394, "epoch": 280, "lr": 5.5648542730321005e-05} +{"train_loss": 0.002957031363621354, "global_step": 33395, "epoch": 280, "lr": 5.5646341398171054e-05} +{"train_loss": 0.001425342750735581, "global_step": 33396, "epoch": 280, "lr": 5.5644140054935136e-05} +{"train_loss": 0.0031337132677435875, "global_step": 33397, "epoch": 280, "lr": 5.564193870061753e-05} +{"train_loss": 0.002593525918200612, "global_step": 33398, "epoch": 280, "lr": 5.563973733522259e-05} +{"train_loss": 0.0015178477624431252, "global_step": 33399, "epoch": 280, "lr": 5.563753595875463e-05} +{"train_loss": 0.004210934974253178, "global_step": 33400, "epoch": 280, "lr": 5.5635334571217944e-05} +{"train_loss": 0.0019721556454896927, "global_step": 33401, "epoch": 280, "lr": 5.56331331726169e-05} +{"train_loss": 0.0031238566152751446, "global_step": 33402, "epoch": 280, "lr": 5.563093176295581e-05} +{"train_loss": 0.0025071711279451847, "global_step": 33403, "epoch": 280, "lr": 5.562873034223899e-05} +{"train_loss": 0.0034587327390909195, "global_step": 33404, "epoch": 280, "lr": 5.562652891047075e-05} +{"train_loss": 0.0032325952779501677, "global_step": 33405, "epoch": 280, "lr": 5.5624327467655424e-05} +{"train_loss": 0.0017194980755448341, "global_step": 33406, "epoch": 280, "lr": 5.562212601379733e-05} +{"train_loss": 0.002730504609644413, "global_step": 33407, "epoch": 280, "lr": 5.561992454890078e-05} +{"train_loss": 0.0029430368449538946, "global_step": 33408, "epoch": 280, "lr": 5.561772307297013e-05} +{"train_loss": 0.0034073686692863703, "global_step": 33409, "epoch": 280, "lr": 5.5615521586009676e-05} +{"train_loss": 0.003079590853303671, "global_step": 33410, "epoch": 280, "lr": 5.561332008802374e-05} +{"train_loss": 0.001840031472966075, "global_step": 33411, "epoch": 280, "lr": 5.5611118579016655e-05} +{"train_loss": 0.002065197564661503, "global_step": 33412, "epoch": 280, "lr": 5.560891705899273e-05} +{"train_loss": 0.002332965610548854, "global_step": 33413, "epoch": 280, "lr": 5.5606715527956285e-05} +{"train_loss": 0.0018447712063789368, "global_step": 33414, "epoch": 280, "lr": 5.560451398591168e-05} +{"train_loss": 0.00282687833532691, "global_step": 33415, "epoch": 280, "lr": 5.560231243286319e-05} +{"train_loss": 0.00258815661072731, "global_step": 33416, "epoch": 280, "lr": 5.5600110868815156e-05} +{"train_loss": 0.0016240221448242664, "global_step": 33417, "epoch": 280, "lr": 5.559790929377192e-05} +{"train_loss": 0.004508757498115301, "global_step": 33418, "epoch": 280, "lr": 5.5595707707737775e-05} +{"train_loss": 0.0022409558296203613, "global_step": 33419, "epoch": 280, "lr": 5.5593506110717064e-05} +{"train_loss": 0.002376375487074256, "global_step": 33420, "epoch": 280, "lr": 5.559130450271409e-05} +{"train_loss": 0.0012597307795658708, "global_step": 33421, "epoch": 280, "lr": 5.55891028837332e-05} +{"train_loss": 0.0034612882882356644, "global_step": 33422, "epoch": 280, "lr": 5.55869012537787e-05} +{"train_loss": 0.002017085673287511, "global_step": 33423, "epoch": 280, "lr": 5.558469961285492e-05} +{"train_loss": 0.0019303933950141072, "global_step": 33424, "epoch": 280, "lr": 5.5582497960966174e-05} +{"train_loss": 0.002827664138749242, "global_step": 33425, "epoch": 280, "lr": 5.5580296298116786e-05} +{"train_loss": 0.0032662416342645884, "global_step": 33426, "epoch": 280, "lr": 5.557809462431108e-05} +{"train_loss": 0.002436156151816249, "global_step": 33427, "epoch": 280, "lr": 5.557589293955339e-05} +{"train_loss": 0.003047873731702566, "global_step": 33428, "epoch": 280, "lr": 5.5573691243848034e-05} +{"train_loss": 0.001867580460384488, "global_step": 33429, "epoch": 280, "lr": 5.557148953719932e-05} +{"train_loss": 0.0019415200222283602, "global_step": 33430, "epoch": 280, "lr": 5.5569287819611585e-05} +{"train_loss": 0.003031236119568348, "global_step": 33431, "epoch": 280, "lr": 5.556708609108915e-05} +{"train_loss": 0.0028216878417879343, "global_step": 33432, "epoch": 280, "lr": 5.5564884351636326e-05} +{"train_loss": 0.002647147746756673, "global_step": 33433, "epoch": 280, "lr": 5.5562682601257454e-05} +{"train_loss": 0.0033710645511746407, "global_step": 33434, "epoch": 280, "lr": 5.556048083995685e-05} +{"train_loss": 0.003071387065574527, "global_step": 33435, "epoch": 280, "lr": 5.5558279067738826e-05} +{"train_loss": 0.0016794089460745454, "global_step": 33436, "epoch": 280, "lr": 5.555607728460773e-05} +{"train_loss": 0.0016629936872050166, "global_step": 33437, "epoch": 280, "lr": 5.555387549056786e-05} +{"train_loss": 0.0027943683989706033, "global_step": 33438, "epoch": 280, "lr": 5.555167368562355e-05, "val_loss": 0.01493176631629467, "train_action_mse_error": 4.55523440905381e-05} +{"train_loss": 0.0016845747595652938, "global_step": 33439, "epoch": 281, "lr": 5.5549471869779124e-05} +{"train_loss": 0.0017235097475349903, "global_step": 33440, "epoch": 281, "lr": 5.554727004303891e-05} +{"train_loss": 0.002793749561533332, "global_step": 33441, "epoch": 281, "lr": 5.554506820540722e-05} +{"train_loss": 0.0029858299531042576, "global_step": 33442, "epoch": 281, "lr": 5.554286635688838e-05} +{"train_loss": 0.0026339837349951267, "global_step": 33443, "epoch": 281, "lr": 5.5540664497486705e-05} +{"train_loss": 0.0018657359760254622, "global_step": 33444, "epoch": 281, "lr": 5.553846262720653e-05} +{"train_loss": 0.0018209083937108517, "global_step": 33445, "epoch": 281, "lr": 5.553626074605218e-05} +{"train_loss": 0.002201467752456665, "global_step": 33446, "epoch": 281, "lr": 5.5534058854027995e-05} +{"train_loss": 0.002426036400720477, "global_step": 33447, "epoch": 281, "lr": 5.553185695113825e-05} +{"train_loss": 0.004141136538237333, "global_step": 33448, "epoch": 281, "lr": 5.55296550373873e-05} +{"train_loss": 0.002923238091170788, "global_step": 33449, "epoch": 281, "lr": 5.5527453112779447e-05} +{"train_loss": 0.004122279118746519, "global_step": 33450, "epoch": 281, "lr": 5.552525117731905e-05} +{"train_loss": 0.003535025753080845, "global_step": 33451, "epoch": 281, "lr": 5.5523049231010406e-05} +{"train_loss": 0.002417945768684149, "global_step": 33452, "epoch": 281, "lr": 5.552084727385785e-05} +{"train_loss": 0.0016599742230027914, "global_step": 33453, "epoch": 281, "lr": 5.55186453058657e-05} +{"train_loss": 0.0016688283067196608, "global_step": 33454, "epoch": 281, "lr": 5.551644332703828e-05} +{"train_loss": 0.0031298440881073475, "global_step": 33455, "epoch": 281, "lr": 5.55142413373799e-05} +{"train_loss": 0.00245273276232183, "global_step": 33456, "epoch": 281, "lr": 5.5512039336894907e-05} +{"train_loss": 0.0023909499868750572, "global_step": 33457, "epoch": 281, "lr": 5.550983732558761e-05} +{"train_loss": 0.0023834803141653538, "global_step": 33458, "epoch": 281, "lr": 5.5507635303462346e-05} +{"train_loss": 0.0029071257449686527, "global_step": 33459, "epoch": 281, "lr": 5.5505433270523434e-05} +{"train_loss": 0.0016397773288190365, "global_step": 33460, "epoch": 281, "lr": 5.5503231226775174e-05} +{"train_loss": 0.0016022719210013747, "global_step": 33461, "epoch": 281, "lr": 5.5501029172221905e-05} +{"train_loss": 0.003796735778450966, "global_step": 33462, "epoch": 281, "lr": 5.549882710686797e-05} +{"train_loss": 0.0029340314213186502, "global_step": 33463, "epoch": 281, "lr": 5.5496625030717665e-05} +{"train_loss": 0.0028393312823027372, "global_step": 33464, "epoch": 281, "lr": 5.549442294377531e-05} +{"train_loss": 0.0024845143780112267, "global_step": 33465, "epoch": 281, "lr": 5.5492220846045265e-05} +{"train_loss": 0.002178453141823411, "global_step": 33466, "epoch": 281, "lr": 5.549001873753182e-05} +{"train_loss": 0.0022502231877297163, "global_step": 33467, "epoch": 281, "lr": 5.548781661823932e-05} +{"train_loss": 0.0033976109698414803, "global_step": 33468, "epoch": 281, "lr": 5.5485614488172065e-05} +{"train_loss": 0.004242348484694958, "global_step": 33469, "epoch": 281, "lr": 5.548341234733441e-05} +{"train_loss": 0.0021019054111093283, "global_step": 33470, "epoch": 281, "lr": 5.548121019573064e-05} +{"train_loss": 0.0025963932275772095, "global_step": 33471, "epoch": 281, "lr": 5.547900803336511e-05} +{"train_loss": 0.002522605936974287, "global_step": 33472, "epoch": 281, "lr": 5.5476805860242146e-05} +{"train_loss": 0.0030843738932162523, "global_step": 33473, "epoch": 281, "lr": 5.5474603676366034e-05} +{"train_loss": 0.0031038145534694195, "global_step": 33474, "epoch": 281, "lr": 5.547240148174113e-05} +{"train_loss": 0.0011494767386466265, "global_step": 33475, "epoch": 281, "lr": 5.547019927637176e-05} +{"train_loss": 0.0018905915785580873, "global_step": 33476, "epoch": 281, "lr": 5.546799706026223e-05} +{"train_loss": 0.0021566562354564667, "global_step": 33477, "epoch": 281, "lr": 5.5465794833416876e-05} +{"train_loss": 0.002902934793382883, "global_step": 33478, "epoch": 281, "lr": 5.546359259584002e-05} +{"train_loss": 0.0035816533491015434, "global_step": 33479, "epoch": 281, "lr": 5.546139034753598e-05} +{"train_loss": 0.001998514635488391, "global_step": 33480, "epoch": 281, "lr": 5.545918808850908e-05} +{"train_loss": 0.002820337424054742, "global_step": 33481, "epoch": 281, "lr": 5.545698581876365e-05} +{"train_loss": 0.002243728144094348, "global_step": 33482, "epoch": 281, "lr": 5.545478353830401e-05} +{"train_loss": 0.0016016040463000536, "global_step": 33483, "epoch": 281, "lr": 5.5452581247134486e-05} +{"train_loss": 0.0031988690607249737, "global_step": 33484, "epoch": 281, "lr": 5.545037894525941e-05} +{"train_loss": 0.002430583816021681, "global_step": 33485, "epoch": 281, "lr": 5.544817663268308e-05} +{"train_loss": 0.003024467034265399, "global_step": 33486, "epoch": 281, "lr": 5.5445974309409846e-05} +{"train_loss": 0.0020162914879620075, "global_step": 33487, "epoch": 281, "lr": 5.544377197544402e-05} +{"train_loss": 0.004124911967664957, "global_step": 33488, "epoch": 281, "lr": 5.544156963078994e-05} +{"train_loss": 0.002187177538871765, "global_step": 33489, "epoch": 281, "lr": 5.54393672754519e-05} +{"train_loss": 0.003514154814183712, "global_step": 33490, "epoch": 281, "lr": 5.543716490943427e-05} +{"train_loss": 0.001733809127472341, "global_step": 33491, "epoch": 281, "lr": 5.543496253274133e-05} +{"train_loss": 0.0023682580795139074, "global_step": 33492, "epoch": 281, "lr": 5.543276014537743e-05} +{"train_loss": 0.0030133912805467844, "global_step": 33493, "epoch": 281, "lr": 5.543055774734688e-05} +{"train_loss": 0.0025024372152984142, "global_step": 33494, "epoch": 281, "lr": 5.5428355338654014e-05} +{"train_loss": 0.0026023187674582005, "global_step": 33495, "epoch": 281, "lr": 5.5426152919303143e-05} +{"train_loss": 0.0024957614950835705, "global_step": 33496, "epoch": 281, "lr": 5.5423950489298604e-05} +{"train_loss": 0.0030288798734545708, "global_step": 33497, "epoch": 281, "lr": 5.542174804864472e-05} +{"train_loss": 0.002421293407678604, "global_step": 33498, "epoch": 281, "lr": 5.541954559734581e-05} +{"train_loss": 0.001977864420041442, "global_step": 33499, "epoch": 281, "lr": 5.5417343135406206e-05} +{"train_loss": 0.0032894194591790438, "global_step": 33500, "epoch": 281, "lr": 5.5415140662830224e-05} +{"train_loss": 0.0017565481830388308, "global_step": 33501, "epoch": 281, "lr": 5.5412938179622196e-05} +{"train_loss": 0.0018293086905032396, "global_step": 33502, "epoch": 281, "lr": 5.541073568578644e-05} +{"train_loss": 0.0021864986047148705, "global_step": 33503, "epoch": 281, "lr": 5.540853318132729e-05} +{"train_loss": 0.0038391905836760998, "global_step": 33504, "epoch": 281, "lr": 5.540633066624905e-05} +{"train_loss": 0.0038057484198361635, "global_step": 33505, "epoch": 281, "lr": 5.540412814055607e-05} +{"train_loss": 0.001963058253750205, "global_step": 33506, "epoch": 281, "lr": 5.540192560425265e-05} +{"train_loss": 0.0018393949139863253, "global_step": 33507, "epoch": 281, "lr": 5.5399723057343135e-05} +{"train_loss": 0.0028603174723684788, "global_step": 33508, "epoch": 281, "lr": 5.539752049983183e-05} +{"train_loss": 0.0034177261404693127, "global_step": 33509, "epoch": 281, "lr": 5.539531793172309e-05} +{"train_loss": 0.002275678562000394, "global_step": 33510, "epoch": 281, "lr": 5.5393115353021206e-05} +{"train_loss": 0.0016709695337340236, "global_step": 33511, "epoch": 281, "lr": 5.539091276373052e-05} +{"train_loss": 0.0026623676531016827, "global_step": 33512, "epoch": 281, "lr": 5.538871016385534e-05} +{"train_loss": 0.0020241185557097197, "global_step": 33513, "epoch": 281, "lr": 5.538650755340001e-05} +{"train_loss": 0.003495109500363469, "global_step": 33514, "epoch": 281, "lr": 5.538430493236885e-05} +{"train_loss": 0.002546238247305155, "global_step": 33515, "epoch": 281, "lr": 5.538210230076618e-05} +{"train_loss": 0.0018176456214860082, "global_step": 33516, "epoch": 281, "lr": 5.537989965859633e-05} +{"train_loss": 0.0033351248130202293, "global_step": 33517, "epoch": 281, "lr": 5.5377697005863625e-05} +{"train_loss": 0.001763856504112482, "global_step": 33518, "epoch": 281, "lr": 5.5375494342572374e-05} +{"train_loss": 0.0031373719684779644, "global_step": 33519, "epoch": 281, "lr": 5.5373291668726924e-05} +{"train_loss": 0.0018478590063750744, "global_step": 33520, "epoch": 281, "lr": 5.537108898433159e-05} +{"train_loss": 0.0021939724683761597, "global_step": 33521, "epoch": 281, "lr": 5.5368886289390696e-05} +{"train_loss": 0.003771174233406782, "global_step": 33522, "epoch": 281, "lr": 5.536668358390857e-05} +{"train_loss": 0.0030163496267050505, "global_step": 33523, "epoch": 281, "lr": 5.5364480867889535e-05} +{"train_loss": 0.0020254121627658606, "global_step": 33524, "epoch": 281, "lr": 5.5362278141337906e-05} +{"train_loss": 0.00404773186892271, "global_step": 33525, "epoch": 281, "lr": 5.5360075404258025e-05} +{"train_loss": 0.0021790608298033476, "global_step": 33526, "epoch": 281, "lr": 5.5357872656654206e-05} +{"train_loss": 0.0029548322781920433, "global_step": 33527, "epoch": 281, "lr": 5.535566989853078e-05} +{"train_loss": 0.0016530809225514531, "global_step": 33528, "epoch": 281, "lr": 5.535346712989207e-05} +{"train_loss": 0.002390313893556595, "global_step": 33529, "epoch": 281, "lr": 5.535126435074239e-05} +{"train_loss": 0.003096126252785325, "global_step": 33530, "epoch": 281, "lr": 5.534906156108608e-05} +{"train_loss": 0.0022360635921359062, "global_step": 33531, "epoch": 281, "lr": 5.5346858760927456e-05} +{"train_loss": 0.002476842375472188, "global_step": 33532, "epoch": 281, "lr": 5.534465595027084e-05} +{"train_loss": 0.0019947639666497707, "global_step": 33533, "epoch": 281, "lr": 5.534245312912056e-05} +{"train_loss": 0.0024395666550844908, "global_step": 33534, "epoch": 281, "lr": 5.5340250297480965e-05} +{"train_loss": 0.0020676767453551292, "global_step": 33535, "epoch": 281, "lr": 5.533804745535635e-05} +{"train_loss": 0.003411703510209918, "global_step": 33536, "epoch": 281, "lr": 5.5335844602751044e-05} +{"train_loss": 0.001736602047458291, "global_step": 33537, "epoch": 281, "lr": 5.533364173966939e-05} +{"train_loss": 0.0033107316121459007, "global_step": 33538, "epoch": 281, "lr": 5.533143886611568e-05} +{"train_loss": 0.0015008324990049005, "global_step": 33539, "epoch": 281, "lr": 5.532923598209426e-05} +{"train_loss": 0.0018103384645655751, "global_step": 33540, "epoch": 281, "lr": 5.532703308760948e-05} +{"train_loss": 0.004006660543382168, "global_step": 33541, "epoch": 281, "lr": 5.532483018266562e-05} +{"train_loss": 0.003577029798179865, "global_step": 33542, "epoch": 281, "lr": 5.5322627267267035e-05} +{"train_loss": 0.0019674927461892366, "global_step": 33543, "epoch": 281, "lr": 5.5320424341418034e-05} +{"train_loss": 0.0034251094330102205, "global_step": 33544, "epoch": 281, "lr": 5.5318221405122935e-05} +{"train_loss": 0.0015920684672892094, "global_step": 33545, "epoch": 281, "lr": 5.5316018458386096e-05} +{"train_loss": 0.0036835256032645702, "global_step": 33546, "epoch": 281, "lr": 5.531381550121182e-05} +{"train_loss": 0.0021519106812775135, "global_step": 33547, "epoch": 281, "lr": 5.531161253360443e-05} +{"train_loss": 0.002473850967362523, "global_step": 33548, "epoch": 281, "lr": 5.530940955556825e-05} +{"train_loss": 0.0024967461358755827, "global_step": 33549, "epoch": 281, "lr": 5.5307206567107614e-05} +{"train_loss": 0.004318313207477331, "global_step": 33550, "epoch": 281, "lr": 5.530500356822686e-05} +{"train_loss": 0.0029159593395888805, "global_step": 33551, "epoch": 281, "lr": 5.530280055893028e-05} +{"train_loss": 0.004329686984419823, "global_step": 33552, "epoch": 281, "lr": 5.5300597539222234e-05} +{"train_loss": 0.0017247638897970319, "global_step": 33553, "epoch": 281, "lr": 5.529839450910702e-05} +{"train_loss": 0.001639308873564005, "global_step": 33554, "epoch": 281, "lr": 5.529619146858898e-05} +{"train_loss": 0.0026719090528786182, "global_step": 33555, "epoch": 281, "lr": 5.5293988417672424e-05} +{"train_loss": 0.00278751109726727, "global_step": 33556, "epoch": 281, "lr": 5.52917853563617e-05} +{"train_loss": 0.0026095543641737906, "global_step": 33557, "epoch": 281, "lr": 5.528958228466111e-05, "val_loss": 0.013508755713701248} +{"train_loss": 0.0017866655252873898, "global_step": 33558, "epoch": 282, "lr": 5.5287379202574995e-05} +{"train_loss": 0.002344238106161356, "global_step": 33559, "epoch": 282, "lr": 5.5285176110107695e-05} +{"train_loss": 0.001611438812687993, "global_step": 33560, "epoch": 282, "lr": 5.5282973007263496e-05} +{"train_loss": 0.002326762769371271, "global_step": 33561, "epoch": 282, "lr": 5.5280769894046735e-05} +{"train_loss": 0.002911257091909647, "global_step": 33562, "epoch": 282, "lr": 5.527856677046176e-05} +{"train_loss": 0.001856373273767531, "global_step": 33563, "epoch": 282, "lr": 5.5276363636512887e-05} +{"train_loss": 0.0017560271080583334, "global_step": 33564, "epoch": 282, "lr": 5.527416049220442e-05} +{"train_loss": 0.002870419295504689, "global_step": 33565, "epoch": 282, "lr": 5.5271957337540716e-05} +{"train_loss": 0.0029457085765898228, "global_step": 33566, "epoch": 282, "lr": 5.526975417252608e-05} +{"train_loss": 0.0026247138157486916, "global_step": 33567, "epoch": 282, "lr": 5.526755099716485e-05} +{"train_loss": 0.0018580224132165313, "global_step": 33568, "epoch": 282, "lr": 5.526534781146134e-05} +{"train_loss": 0.0021744470577687025, "global_step": 33569, "epoch": 282, "lr": 5.5263144615419895e-05} +{"train_loss": 0.0028905710205435753, "global_step": 33570, "epoch": 282, "lr": 5.526094140904481e-05} +{"train_loss": 0.001861356315203011, "global_step": 33571, "epoch": 282, "lr": 5.5258738192340444e-05} +{"train_loss": 0.00199183844961226, "global_step": 33572, "epoch": 282, "lr": 5.525653496531111e-05} +{"train_loss": 0.003637973451986909, "global_step": 33573, "epoch": 282, "lr": 5.5254331727961117e-05} +{"train_loss": 0.0035471655428409576, "global_step": 33574, "epoch": 282, "lr": 5.5252128480294816e-05} +{"train_loss": 0.0029819710180163383, "global_step": 33575, "epoch": 282, "lr": 5.524992522231651e-05} +{"train_loss": 0.0017134803347289562, "global_step": 33576, "epoch": 282, "lr": 5.524772195403054e-05} +{"train_loss": 0.0022487391252070665, "global_step": 33577, "epoch": 282, "lr": 5.524551867544123e-05} +{"train_loss": 0.0018688791897147894, "global_step": 33578, "epoch": 282, "lr": 5.524331538655292e-05} +{"train_loss": 0.003507643938064575, "global_step": 33579, "epoch": 282, "lr": 5.5241112087369905e-05} +{"train_loss": 0.0024019998963922262, "global_step": 33580, "epoch": 282, "lr": 5.523890877789654e-05} +{"train_loss": 0.0014650882221758366, "global_step": 33581, "epoch": 282, "lr": 5.523670545813711e-05} +{"train_loss": 0.0020896829664707184, "global_step": 33582, "epoch": 282, "lr": 5.523450212809598e-05} +{"train_loss": 0.0028091149870306253, "global_step": 33583, "epoch": 282, "lr": 5.523229878777747e-05} +{"train_loss": 0.004062602296471596, "global_step": 33584, "epoch": 282, "lr": 5.52300954371859e-05} +{"train_loss": 0.0015150171238929033, "global_step": 33585, "epoch": 282, "lr": 5.5227892076325595e-05} +{"train_loss": 0.0021477025002241135, "global_step": 33586, "epoch": 282, "lr": 5.522568870520088e-05} +{"train_loss": 0.0023777224123477936, "global_step": 33587, "epoch": 282, "lr": 5.522348532381609e-05} +{"train_loss": 0.0025100396014750004, "global_step": 33588, "epoch": 282, "lr": 5.522128193217554e-05} +{"train_loss": 0.00209400849416852, "global_step": 33589, "epoch": 282, "lr": 5.521907853028356e-05} +{"train_loss": 0.0027081698644906282, "global_step": 33590, "epoch": 282, "lr": 5.5216875118144475e-05} +{"train_loss": 0.0016485410742461681, "global_step": 33591, "epoch": 282, "lr": 5.521467169576263e-05} +{"train_loss": 0.0016226260922849178, "global_step": 33592, "epoch": 282, "lr": 5.521246826314231e-05} +{"train_loss": 0.002420213771983981, "global_step": 33593, "epoch": 282, "lr": 5.5210264820287886e-05} +{"train_loss": 0.0032070826273411512, "global_step": 33594, "epoch": 282, "lr": 5.520806136720365e-05} +{"train_loss": 0.0019252098863944411, "global_step": 33595, "epoch": 282, "lr": 5.5205857903893946e-05} +{"train_loss": 0.002602747641503811, "global_step": 33596, "epoch": 282, "lr": 5.52036544303631e-05} +{"train_loss": 0.0020012722816318274, "global_step": 33597, "epoch": 282, "lr": 5.520145094661542e-05} +{"train_loss": 0.0023778907489031553, "global_step": 33598, "epoch": 282, "lr": 5.5199247452655254e-05} +{"train_loss": 0.003092257073149085, "global_step": 33599, "epoch": 282, "lr": 5.5197043948486926e-05} +{"train_loss": 0.003965405281633139, "global_step": 33600, "epoch": 282, "lr": 5.519484043411476e-05} +{"train_loss": 0.0026050799060612917, "global_step": 33601, "epoch": 282, "lr": 5.519263690954307e-05} +{"train_loss": 0.0030836614314466715, "global_step": 33602, "epoch": 282, "lr": 5.5190433374776195e-05} +{"train_loss": 0.0027660024352371693, "global_step": 33603, "epoch": 282, "lr": 5.5188229829818474e-05} +{"train_loss": 0.0020631817169487476, "global_step": 33604, "epoch": 282, "lr": 5.51860262746742e-05} +{"train_loss": 0.004099723882973194, "global_step": 33605, "epoch": 282, "lr": 5.518382270934772e-05} +{"train_loss": 0.0032193276565521955, "global_step": 33606, "epoch": 282, "lr": 5.518161913384337e-05} +{"train_loss": 0.002896082354709506, "global_step": 33607, "epoch": 282, "lr": 5.5179415548165446e-05} +{"train_loss": 0.0033351995516568422, "global_step": 33608, "epoch": 282, "lr": 5.5177211952318297e-05} +{"train_loss": 0.003099306020885706, "global_step": 33609, "epoch": 282, "lr": 5.5175008346306264e-05} +{"train_loss": 0.0028365489561110735, "global_step": 33610, "epoch": 282, "lr": 5.5172804730133645e-05} +{"train_loss": 0.0025647326838225126, "global_step": 33611, "epoch": 282, "lr": 5.517060110380476e-05} +{"train_loss": 0.001186043955385685, "global_step": 33612, "epoch": 282, "lr": 5.516839746732397e-05} +{"train_loss": 0.003267203690484166, "global_step": 33613, "epoch": 282, "lr": 5.516619382069558e-05} +{"train_loss": 0.0026136250235140324, "global_step": 33614, "epoch": 282, "lr": 5.5163990163923916e-05} +{"train_loss": 0.0031110504642128944, "global_step": 33615, "epoch": 282, "lr": 5.516178649701331e-05} +{"train_loss": 0.0020229287911206484, "global_step": 33616, "epoch": 282, "lr": 5.5159582819968093e-05} +{"train_loss": 0.0016294799279421568, "global_step": 33617, "epoch": 282, "lr": 5.515737913279258e-05} +{"train_loss": 0.0025775246322155, "global_step": 33618, "epoch": 282, "lr": 5.51551754354911e-05} +{"train_loss": 0.0027057663537561893, "global_step": 33619, "epoch": 282, "lr": 5.5152971728067996e-05} +{"train_loss": 0.0034985574893653393, "global_step": 33620, "epoch": 282, "lr": 5.5150768010527576e-05} +{"train_loss": 0.0031834999099373817, "global_step": 33621, "epoch": 282, "lr": 5.514856428287417e-05} +{"train_loss": 0.001353456056676805, "global_step": 33622, "epoch": 282, "lr": 5.514636054511212e-05} +{"train_loss": 0.0026410629507154226, "global_step": 33623, "epoch": 282, "lr": 5.514415679724574e-05} +{"train_loss": 0.0013319748686626554, "global_step": 33624, "epoch": 282, "lr": 5.514195303927935e-05} +{"train_loss": 0.004835876170545816, "global_step": 33625, "epoch": 282, "lr": 5.513974927121728e-05} +{"train_loss": 0.0037206229753792286, "global_step": 33626, "epoch": 282, "lr": 5.513754549306387e-05} +{"train_loss": 0.0037763183936476707, "global_step": 33627, "epoch": 282, "lr": 5.5135341704823426e-05} +{"train_loss": 0.0033782231621444225, "global_step": 33628, "epoch": 282, "lr": 5.513313790650031e-05} +{"train_loss": 0.0026916477363556623, "global_step": 33629, "epoch": 282, "lr": 5.5130934098098806e-05} +{"train_loss": 0.0029135390650480986, "global_step": 33630, "epoch": 282, "lr": 5.5128730279623264e-05} +{"train_loss": 0.0042149657383561134, "global_step": 33631, "epoch": 282, "lr": 5.512652645107801e-05} +{"train_loss": 0.0024549700319767, "global_step": 33632, "epoch": 282, "lr": 5.512432261246737e-05} +{"train_loss": 0.0026697299908846617, "global_step": 33633, "epoch": 282, "lr": 5.512211876379567e-05} +{"train_loss": 0.0027845853473991156, "global_step": 33634, "epoch": 282, "lr": 5.5119914905067246e-05} +{"train_loss": 0.0033476860262453556, "global_step": 33635, "epoch": 282, "lr": 5.51177110362864e-05} +{"train_loss": 0.0022115421015769243, "global_step": 33636, "epoch": 282, "lr": 5.511550715745749e-05} +{"train_loss": 0.0024327957071363926, "global_step": 33637, "epoch": 282, "lr": 5.511330326858482e-05} +{"train_loss": 0.0025256730150431395, "global_step": 33638, "epoch": 282, "lr": 5.511109936967272e-05} +{"train_loss": 0.0028189325239509344, "global_step": 33639, "epoch": 282, "lr": 5.510889546072553e-05} +{"train_loss": 0.0037123910151422024, "global_step": 33640, "epoch": 282, "lr": 5.510669154174757e-05} +{"train_loss": 0.0020674702245742083, "global_step": 33641, "epoch": 282, "lr": 5.510448761274317e-05} +{"train_loss": 0.003074058098718524, "global_step": 33642, "epoch": 282, "lr": 5.5102283673716646e-05} +{"train_loss": 0.002512977458536625, "global_step": 33643, "epoch": 282, "lr": 5.510007972467234e-05} +{"train_loss": 0.002146769082173705, "global_step": 33644, "epoch": 282, "lr": 5.509787576561457e-05} +{"train_loss": 0.0013548460556194186, "global_step": 33645, "epoch": 282, "lr": 5.5095671796547665e-05} +{"train_loss": 0.0029028442222625017, "global_step": 33646, "epoch": 282, "lr": 5.509346781747595e-05} +{"train_loss": 0.003097109729424119, "global_step": 33647, "epoch": 282, "lr": 5.509126382840375e-05} +{"train_loss": 0.0025029645767062902, "global_step": 33648, "epoch": 282, "lr": 5.508905982933541e-05} +{"train_loss": 0.003987468779087067, "global_step": 33649, "epoch": 282, "lr": 5.5086855820275244e-05} +{"train_loss": 0.0018918408313766122, "global_step": 33650, "epoch": 282, "lr": 5.508465180122757e-05} +{"train_loss": 0.0014121831627562642, "global_step": 33651, "epoch": 282, "lr": 5.508244777219672e-05} +{"train_loss": 0.0016841155011206865, "global_step": 33652, "epoch": 282, "lr": 5.508024373318704e-05} +{"train_loss": 0.0040278020314872265, "global_step": 33653, "epoch": 282, "lr": 5.5078039684202854e-05} +{"train_loss": 0.0032811693381518126, "global_step": 33654, "epoch": 282, "lr": 5.5075835625248464e-05} +{"train_loss": 0.001513147377409041, "global_step": 33655, "epoch": 282, "lr": 5.507363155632822e-05} +{"train_loss": 0.003061906434595585, "global_step": 33656, "epoch": 282, "lr": 5.5071427477446434e-05} +{"train_loss": 0.003105528187006712, "global_step": 33657, "epoch": 282, "lr": 5.506922338860745e-05} +{"train_loss": 0.0038626946043223143, "global_step": 33658, "epoch": 282, "lr": 5.506701928981558e-05} +{"train_loss": 0.0029607629403471947, "global_step": 33659, "epoch": 282, "lr": 5.506481518107517e-05} +{"train_loss": 0.002230814890936017, "global_step": 33660, "epoch": 282, "lr": 5.5062611062390536e-05} +{"train_loss": 0.0023420467041432858, "global_step": 33661, "epoch": 282, "lr": 5.506040693376599e-05} +{"train_loss": 0.0016465125372633338, "global_step": 33662, "epoch": 282, "lr": 5.505820279520588e-05} +{"train_loss": 0.003748000832274556, "global_step": 33663, "epoch": 282, "lr": 5.505599864671454e-05} +{"train_loss": 0.002676916541531682, "global_step": 33664, "epoch": 282, "lr": 5.505379448829628e-05} +{"train_loss": 0.0025814168620854616, "global_step": 33665, "epoch": 282, "lr": 5.5051590319955426e-05} +{"train_loss": 0.0032302248291671276, "global_step": 33666, "epoch": 282, "lr": 5.504938614169634e-05} +{"train_loss": 0.001862606150098145, "global_step": 33667, "epoch": 282, "lr": 5.5047181953523297e-05} +{"train_loss": 0.0031383002642542124, "global_step": 33668, "epoch": 282, "lr": 5.504497775544066e-05} +{"train_loss": 0.0030073870439082384, "global_step": 33669, "epoch": 282, "lr": 5.5042773547452756e-05} +{"train_loss": 0.002103515202179551, "global_step": 33670, "epoch": 282, "lr": 5.5040569329563896e-05} +{"train_loss": 0.003067821031436324, "global_step": 33671, "epoch": 282, "lr": 5.503836510177841e-05} +{"train_loss": 0.0018525449559092522, "global_step": 33672, "epoch": 282, "lr": 5.503616086410066e-05} +{"train_loss": 0.002595109399408102, "global_step": 33673, "epoch": 282, "lr": 5.503395661653492e-05} +{"train_loss": 0.0030788974836468697, "global_step": 33674, "epoch": 282, "lr": 5.5031752359085556e-05} +{"train_loss": 0.0027071726508438587, "global_step": 33675, "epoch": 282, "lr": 5.502954809175688e-05} +{"train_loss": 0.0026256294300811005, "global_step": 33676, "epoch": 282, "lr": 5.502734381455322e-05, "val_loss": 0.02109786868095398} +{"train_loss": 0.0031297311652451754, "global_step": 33677, "epoch": 283, "lr": 5.502513952747891e-05} +{"train_loss": 0.0026003990788012743, "global_step": 33678, "epoch": 283, "lr": 5.5022935230538286e-05} +{"train_loss": 0.002953612944111228, "global_step": 33679, "epoch": 283, "lr": 5.502073092373564e-05} +{"train_loss": 0.0037674582563340664, "global_step": 33680, "epoch": 283, "lr": 5.501852660707535e-05} +{"train_loss": 0.0028360537253320217, "global_step": 33681, "epoch": 283, "lr": 5.5016322280561704e-05} +{"train_loss": 0.0013250221963971853, "global_step": 33682, "epoch": 283, "lr": 5.501411794419905e-05} +{"train_loss": 0.002046368783339858, "global_step": 33683, "epoch": 283, "lr": 5.501191359799172e-05} +{"train_loss": 0.0017458648653700948, "global_step": 33684, "epoch": 283, "lr": 5.500970924194402e-05} +{"train_loss": 0.002728627761825919, "global_step": 33685, "epoch": 283, "lr": 5.50075048760603e-05} +{"train_loss": 0.004138682037591934, "global_step": 33686, "epoch": 283, "lr": 5.500530050034488e-05} +{"train_loss": 0.002030398230999708, "global_step": 33687, "epoch": 283, "lr": 5.500309611480208e-05} +{"train_loss": 0.0036252797581255436, "global_step": 33688, "epoch": 283, "lr": 5.500089171943623e-05} +{"train_loss": 0.002619860228151083, "global_step": 33689, "epoch": 283, "lr": 5.499868731425167e-05} +{"train_loss": 0.0018050934886559844, "global_step": 33690, "epoch": 283, "lr": 5.499648289925273e-05} +{"train_loss": 0.003026452613994479, "global_step": 33691, "epoch": 283, "lr": 5.499427847444373e-05} +{"train_loss": 0.0018455551471561193, "global_step": 33692, "epoch": 283, "lr": 5.499207403982899e-05} +{"train_loss": 0.0026288246735930443, "global_step": 33693, "epoch": 283, "lr": 5.498986959541285e-05} +{"train_loss": 0.0017672224203124642, "global_step": 33694, "epoch": 283, "lr": 5.4987665141199626e-05} +{"train_loss": 0.0020974997896701097, "global_step": 33695, "epoch": 283, "lr": 5.4985460677193654e-05} +{"train_loss": 0.0015679181087762117, "global_step": 33696, "epoch": 283, "lr": 5.498325620339927e-05} +{"train_loss": 0.001981279579922557, "global_step": 33697, "epoch": 283, "lr": 5.4981051719820796e-05} +{"train_loss": 0.0029262262396514416, "global_step": 33698, "epoch": 283, "lr": 5.497884722646255e-05} +{"train_loss": 0.0020366376265883446, "global_step": 33699, "epoch": 283, "lr": 5.4976642723328874e-05} +{"train_loss": 0.0027930003125220537, "global_step": 33700, "epoch": 283, "lr": 5.4974438210424096e-05} +{"train_loss": 0.0018694489262998104, "global_step": 33701, "epoch": 283, "lr": 5.497223368775253e-05} +{"train_loss": 0.002010883064940572, "global_step": 33702, "epoch": 283, "lr": 5.4970029155318524e-05} +{"train_loss": 0.0026324826758354902, "global_step": 33703, "epoch": 283, "lr": 5.4967824613126396e-05} +{"train_loss": 0.0034258479718118906, "global_step": 33704, "epoch": 283, "lr": 5.496562006118048e-05} +{"train_loss": 0.002435936126857996, "global_step": 33705, "epoch": 283, "lr": 5.496341549948508e-05} +{"train_loss": 0.003125392133370042, "global_step": 33706, "epoch": 283, "lr": 5.496121092804456e-05} +{"train_loss": 0.0015239474596455693, "global_step": 33707, "epoch": 283, "lr": 5.495900634686323e-05} +{"train_loss": 0.0028295842930674553, "global_step": 33708, "epoch": 283, "lr": 5.495680175594542e-05} +{"train_loss": 0.002291942946612835, "global_step": 33709, "epoch": 283, "lr": 5.495459715529545e-05} +{"train_loss": 0.00282057817094028, "global_step": 33710, "epoch": 283, "lr": 5.4952392544917685e-05} +{"train_loss": 0.004324968904256821, "global_step": 33711, "epoch": 283, "lr": 5.49501879248164e-05} +{"train_loss": 0.0023205969482660294, "global_step": 33712, "epoch": 283, "lr": 5.4947983294995965e-05} +{"train_loss": 0.002141716657206416, "global_step": 33713, "epoch": 283, "lr": 5.4945778655460676e-05} +{"train_loss": 0.001857362687587738, "global_step": 33714, "epoch": 283, "lr": 5.494357400621488e-05} +{"train_loss": 0.0012258259812369943, "global_step": 33715, "epoch": 283, "lr": 5.494136934726292e-05} +{"train_loss": 0.0026272195391356945, "global_step": 33716, "epoch": 283, "lr": 5.493916467860911e-05} +{"train_loss": 0.0026547431480139494, "global_step": 33717, "epoch": 283, "lr": 5.4936960000257766e-05} +{"train_loss": 0.0015709885628893971, "global_step": 33718, "epoch": 283, "lr": 5.493475531221324e-05} +{"train_loss": 0.0021696367766708136, "global_step": 33719, "epoch": 283, "lr": 5.493255061447984e-05} +{"train_loss": 0.0027060715947300196, "global_step": 33720, "epoch": 283, "lr": 5.4930345907061896e-05} +{"train_loss": 0.0016842411132529378, "global_step": 33721, "epoch": 283, "lr": 5.492814118996375e-05} +{"train_loss": 0.0023819839116185904, "global_step": 33722, "epoch": 283, "lr": 5.492593646318974e-05} +{"train_loss": 0.0018719369545578957, "global_step": 33723, "epoch": 283, "lr": 5.4923731726744174e-05} +{"train_loss": 0.002149357460439205, "global_step": 33724, "epoch": 283, "lr": 5.492152698063138e-05} +{"train_loss": 0.0021455304231494665, "global_step": 33725, "epoch": 283, "lr": 5.49193222248557e-05} +{"train_loss": 0.002930608345195651, "global_step": 33726, "epoch": 283, "lr": 5.491711745942145e-05} +{"train_loss": 0.002205602591857314, "global_step": 33727, "epoch": 283, "lr": 5.4914912684332966e-05} +{"train_loss": 0.0016344693722203374, "global_step": 33728, "epoch": 283, "lr": 5.491270789959457e-05} +{"train_loss": 0.0016384792979806662, "global_step": 33729, "epoch": 283, "lr": 5.491050310521061e-05} +{"train_loss": 0.0017467254074290395, "global_step": 33730, "epoch": 283, "lr": 5.490829830118539e-05} +{"train_loss": 0.002460090909153223, "global_step": 33731, "epoch": 283, "lr": 5.490609348752326e-05} +{"train_loss": 0.0023974503856152296, "global_step": 33732, "epoch": 283, "lr": 5.490388866422853e-05} +{"train_loss": 0.0013699420960620046, "global_step": 33733, "epoch": 283, "lr": 5.490168383130555e-05} +{"train_loss": 0.002223177347332239, "global_step": 33734, "epoch": 283, "lr": 5.4899478988758634e-05} +{"train_loss": 0.0033761512022465467, "global_step": 33735, "epoch": 283, "lr": 5.489727413659212e-05} +{"train_loss": 0.0022877496667206287, "global_step": 33736, "epoch": 283, "lr": 5.489506927481033e-05} +{"train_loss": 0.004142254590988159, "global_step": 33737, "epoch": 283, "lr": 5.489286440341759e-05} +{"train_loss": 0.002675973577424884, "global_step": 33738, "epoch": 283, "lr": 5.4890659522418216e-05} +{"train_loss": 0.0026952524203807116, "global_step": 33739, "epoch": 283, "lr": 5.4888454631816575e-05} +{"train_loss": 0.002045263070613146, "global_step": 33740, "epoch": 283, "lr": 5.488624973161698e-05} +{"train_loss": 0.002941496903076768, "global_step": 33741, "epoch": 283, "lr": 5.4884044821823755e-05} +{"train_loss": 0.001968447584658861, "global_step": 33742, "epoch": 283, "lr": 5.4881839902441215e-05} +{"train_loss": 0.0025093471631407738, "global_step": 33743, "epoch": 283, "lr": 5.487963497347372e-05} +{"train_loss": 0.0016191466711461544, "global_step": 33744, "epoch": 283, "lr": 5.487743003492557e-05} +{"train_loss": 0.0019946207758039236, "global_step": 33745, "epoch": 283, "lr": 5.4875225086801105e-05} +{"train_loss": 0.002215032232925296, "global_step": 33746, "epoch": 283, "lr": 5.4873020129104656e-05} +{"train_loss": 0.005629387684166431, "global_step": 33747, "epoch": 283, "lr": 5.4870815161840563e-05} +{"train_loss": 0.0016163919353857636, "global_step": 33748, "epoch": 283, "lr": 5.486861018501314e-05} +{"train_loss": 0.0015357908559963107, "global_step": 33749, "epoch": 283, "lr": 5.4866405198626726e-05} +{"train_loss": 0.0018343678675591946, "global_step": 33750, "epoch": 283, "lr": 5.4864200202685635e-05} +{"train_loss": 0.0021346313878893852, "global_step": 33751, "epoch": 283, "lr": 5.4861995197194214e-05} +{"train_loss": 0.0016388752264901996, "global_step": 33752, "epoch": 283, "lr": 5.485979018215678e-05} +{"train_loss": 0.003257458098232746, "global_step": 33753, "epoch": 283, "lr": 5.485758515757769e-05} +{"train_loss": 0.002430739812552929, "global_step": 33754, "epoch": 283, "lr": 5.485538012346122e-05} +{"train_loss": 0.0034818428102880716, "global_step": 33755, "epoch": 283, "lr": 5.485317507981174e-05} +{"train_loss": 0.0030943758320063353, "global_step": 33756, "epoch": 283, "lr": 5.4850970026633574e-05} +{"train_loss": 0.0032688449136912823, "global_step": 33757, "epoch": 283, "lr": 5.484876496393104e-05} +{"train_loss": 0.0022884232457727194, "global_step": 33758, "epoch": 283, "lr": 5.484655989170847e-05} +{"train_loss": 0.0025360595900565386, "global_step": 33759, "epoch": 283, "lr": 5.484435480997021e-05} +{"train_loss": 0.0029079143423587084, "global_step": 33760, "epoch": 283, "lr": 5.4842149718720583e-05} +{"train_loss": 0.0024950425140559673, "global_step": 33761, "epoch": 283, "lr": 5.48399446179639e-05} +{"train_loss": 0.002253421349450946, "global_step": 33762, "epoch": 283, "lr": 5.48377395077045e-05} +{"train_loss": 0.0020418670028448105, "global_step": 33763, "epoch": 283, "lr": 5.483553438794671e-05} +{"train_loss": 0.002187003381550312, "global_step": 33764, "epoch": 283, "lr": 5.483332925869487e-05} +{"train_loss": 0.0019444721983745694, "global_step": 33765, "epoch": 283, "lr": 5.4831124119953306e-05} +{"train_loss": 0.002260408364236355, "global_step": 33766, "epoch": 283, "lr": 5.4828918971726364e-05} +{"train_loss": 0.003120698733255267, "global_step": 33767, "epoch": 283, "lr": 5.4826713814018324e-05} +{"train_loss": 0.002093786606565118, "global_step": 33768, "epoch": 283, "lr": 5.482450864683357e-05} +{"train_loss": 0.0028063124045729637, "global_step": 33769, "epoch": 283, "lr": 5.4822303470176395e-05} +{"train_loss": 0.003251961898058653, "global_step": 33770, "epoch": 283, "lr": 5.4820098284051145e-05} +{"train_loss": 0.00326933478936553, "global_step": 33771, "epoch": 283, "lr": 5.481789308846216e-05} +{"train_loss": 0.003152364632114768, "global_step": 33772, "epoch": 283, "lr": 5.481568788341376e-05} +{"train_loss": 0.002343027852475643, "global_step": 33773, "epoch": 283, "lr": 5.481348266891026e-05} +{"train_loss": 0.0018777906661853194, "global_step": 33774, "epoch": 283, "lr": 5.481127744495599e-05} +{"train_loss": 0.002820109250023961, "global_step": 33775, "epoch": 283, "lr": 5.48090722115553e-05} +{"train_loss": 0.0017970104236155748, "global_step": 33776, "epoch": 283, "lr": 5.480686696871251e-05} +{"train_loss": 0.0019211076432839036, "global_step": 33777, "epoch": 283, "lr": 5.4804661716431946e-05} +{"train_loss": 0.002591643948107958, "global_step": 33778, "epoch": 283, "lr": 5.4802456454717944e-05} +{"train_loss": 0.002000777516514063, "global_step": 33779, "epoch": 283, "lr": 5.480025118357484e-05} +{"train_loss": 0.003609361359849572, "global_step": 33780, "epoch": 283, "lr": 5.479804590300695e-05} +{"train_loss": 0.0009928611107170582, "global_step": 33781, "epoch": 283, "lr": 5.47958406130186e-05} +{"train_loss": 0.0024185599759221077, "global_step": 33782, "epoch": 283, "lr": 5.4793635313614144e-05} +{"train_loss": 0.0016024538781493902, "global_step": 33783, "epoch": 283, "lr": 5.4791430004797893e-05} +{"train_loss": 0.0031170682050287724, "global_step": 33784, "epoch": 283, "lr": 5.478922468657418e-05} +{"train_loss": 0.0033578623551875353, "global_step": 33785, "epoch": 283, "lr": 5.478701935894734e-05} +{"train_loss": 0.003096343018114567, "global_step": 33786, "epoch": 283, "lr": 5.4784814021921696e-05} +{"train_loss": 0.0023128145840018988, "global_step": 33787, "epoch": 283, "lr": 5.478260867550158e-05} +{"train_loss": 0.0013764906907454133, "global_step": 33788, "epoch": 283, "lr": 5.478040331969132e-05} +{"train_loss": 0.0024078059941530228, "global_step": 33789, "epoch": 283, "lr": 5.477819795449526e-05} +{"train_loss": 0.001834164373576641, "global_step": 33790, "epoch": 283, "lr": 5.47759925799177e-05} +{"train_loss": 0.002675930969417095, "global_step": 33791, "epoch": 283, "lr": 5.477378719596301e-05} +{"train_loss": 0.001834611757658422, "global_step": 33792, "epoch": 283, "lr": 5.477158180263548e-05} +{"train_loss": 0.0021019387058913708, "global_step": 33793, "epoch": 283, "lr": 5.476937639993947e-05} +{"train_loss": 0.0026965339202433825, "global_step": 33794, "epoch": 283, "lr": 5.4767170987879305e-05} +{"train_loss": 0.002429690581801183, "global_step": 33795, "epoch": 283, "lr": 5.476496556645929e-05, "val_loss": 0.01760084740817547} +{"train_loss": 0.0036477255634963512, "global_step": 33796, "epoch": 284, "lr": 5.476276013568379e-05} +{"train_loss": 0.003104685340076685, "global_step": 33797, "epoch": 284, "lr": 5.476055469555711e-05} +{"train_loss": 0.0023093402851372957, "global_step": 33798, "epoch": 284, "lr": 5.47583492460836e-05} +{"train_loss": 0.0041872793808579445, "global_step": 33799, "epoch": 284, "lr": 5.475614378726757e-05} +{"train_loss": 0.0027401235420256853, "global_step": 33800, "epoch": 284, "lr": 5.475393831911335e-05} +{"train_loss": 0.0021911102812737226, "global_step": 33801, "epoch": 284, "lr": 5.475173284162529e-05} +{"train_loss": 0.00395452743396163, "global_step": 33802, "epoch": 284, "lr": 5.474952735480772e-05} +{"train_loss": 0.002360735787078738, "global_step": 33803, "epoch": 284, "lr": 5.474732185866495e-05} +{"train_loss": 0.0027720166835933924, "global_step": 33804, "epoch": 284, "lr": 5.474511635320133e-05} +{"train_loss": 0.002405313076451421, "global_step": 33805, "epoch": 284, "lr": 5.474291083842118e-05} +{"train_loss": 0.002587195485830307, "global_step": 33806, "epoch": 284, "lr": 5.474070531432882e-05} +{"train_loss": 0.003781882580369711, "global_step": 33807, "epoch": 284, "lr": 5.47384997809286e-05} +{"train_loss": 0.0034481165930628777, "global_step": 33808, "epoch": 284, "lr": 5.473629423822484e-05} +{"train_loss": 0.0029453334864228964, "global_step": 33809, "epoch": 284, "lr": 5.4734088686221874e-05} +{"train_loss": 0.0032125136349350214, "global_step": 33810, "epoch": 284, "lr": 5.4731883124924035e-05} +{"train_loss": 0.003144789021462202, "global_step": 33811, "epoch": 284, "lr": 5.4729677554335626e-05} +{"train_loss": 0.0035112968180328608, "global_step": 33812, "epoch": 284, "lr": 5.472747197446102e-05} +{"train_loss": 0.002482503652572632, "global_step": 33813, "epoch": 284, "lr": 5.4725266385304516e-05} +{"train_loss": 0.002161974087357521, "global_step": 33814, "epoch": 284, "lr": 5.4723060786870476e-05} +{"train_loss": 0.004013388883322477, "global_step": 33815, "epoch": 284, "lr": 5.4720855179163186e-05} +{"train_loss": 0.0029099162202328444, "global_step": 33816, "epoch": 284, "lr": 5.471864956218703e-05} +{"train_loss": 0.0022549720015376806, "global_step": 33817, "epoch": 284, "lr": 5.4716443935946295e-05} +{"train_loss": 0.003738788887858391, "global_step": 33818, "epoch": 284, "lr": 5.4714238300445333e-05} +{"train_loss": 0.0028338360134512186, "global_step": 33819, "epoch": 284, "lr": 5.471203265568845e-05} +{"train_loss": 0.0017449462320655584, "global_step": 33820, "epoch": 284, "lr": 5.470982700168e-05} +{"train_loss": 0.001362475217320025, "global_step": 33821, "epoch": 284, "lr": 5.470762133842432e-05} +{"train_loss": 0.0023515159264206886, "global_step": 33822, "epoch": 284, "lr": 5.470541566592573e-05} +{"train_loss": 0.0034979977644979954, "global_step": 33823, "epoch": 284, "lr": 5.470320998418854e-05} +{"train_loss": 0.0024030215572565794, "global_step": 33824, "epoch": 284, "lr": 5.470100429321712e-05} +{"train_loss": 0.003505612025037408, "global_step": 33825, "epoch": 284, "lr": 5.469879859301576e-05} +{"train_loss": 0.0033391586039215326, "global_step": 33826, "epoch": 284, "lr": 5.469659288358883e-05} +{"train_loss": 0.0023314908612519503, "global_step": 33827, "epoch": 284, "lr": 5.469438716494063e-05} +{"train_loss": 0.002497049979865551, "global_step": 33828, "epoch": 284, "lr": 5.46921814370755e-05} +{"train_loss": 0.002989533357322216, "global_step": 33829, "epoch": 284, "lr": 5.468997569999778e-05} +{"train_loss": 0.0028140402864664793, "global_step": 33830, "epoch": 284, "lr": 5.468776995371179e-05} +{"train_loss": 0.0018014477100223303, "global_step": 33831, "epoch": 284, "lr": 5.468556419822186e-05} +{"train_loss": 0.003880203003063798, "global_step": 33832, "epoch": 284, "lr": 5.468335843353234e-05} +{"train_loss": 0.004727819003164768, "global_step": 33833, "epoch": 284, "lr": 5.468115265964753e-05} +{"train_loss": 0.002709011547267437, "global_step": 33834, "epoch": 284, "lr": 5.467894687657178e-05} +{"train_loss": 0.003503860905766487, "global_step": 33835, "epoch": 284, "lr": 5.4676741084309435e-05} +{"train_loss": 0.0014835473848506808, "global_step": 33836, "epoch": 284, "lr": 5.467453528286479e-05} +{"train_loss": 0.004231539089232683, "global_step": 33837, "epoch": 284, "lr": 5.46723294722422e-05} +{"train_loss": 0.0037799321580678225, "global_step": 33838, "epoch": 284, "lr": 5.467012365244599e-05} +{"train_loss": 0.0030262183863669634, "global_step": 33839, "epoch": 284, "lr": 5.46679178234805e-05} +{"train_loss": 0.0020941540133208036, "global_step": 33840, "epoch": 284, "lr": 5.4665711985350044e-05} +{"train_loss": 0.0020446113776415586, "global_step": 33841, "epoch": 284, "lr": 5.466350613805896e-05} +{"train_loss": 0.0027338112704455853, "global_step": 33842, "epoch": 284, "lr": 5.4661300281611585e-05} +{"train_loss": 0.003290443914011121, "global_step": 33843, "epoch": 284, "lr": 5.465909441601223e-05} +{"train_loss": 0.0020527848973870277, "global_step": 33844, "epoch": 284, "lr": 5.4656888541265264e-05} +{"train_loss": 0.0021808750461786985, "global_step": 33845, "epoch": 284, "lr": 5.465468265737498e-05} +{"train_loss": 0.0021465355530381203, "global_step": 33846, "epoch": 284, "lr": 5.465247676434572e-05} +{"train_loss": 0.002993911039084196, "global_step": 33847, "epoch": 284, "lr": 5.465027086218183e-05} +{"train_loss": 0.002351825824007392, "global_step": 33848, "epoch": 284, "lr": 5.464806495088762e-05} +{"train_loss": 0.0028330902568995953, "global_step": 33849, "epoch": 284, "lr": 5.464585903046744e-05} +{"train_loss": 0.0019739135168492794, "global_step": 33850, "epoch": 284, "lr": 5.464365310092559e-05} +{"train_loss": 0.0047837188467383385, "global_step": 33851, "epoch": 284, "lr": 5.4641447162266444e-05} +{"train_loss": 0.0016265895683318377, "global_step": 33852, "epoch": 284, "lr": 5.463924121449432e-05} +{"train_loss": 0.0020463468972593546, "global_step": 33853, "epoch": 284, "lr": 5.4637035257613525e-05} +{"train_loss": 0.00195984891615808, "global_step": 33854, "epoch": 284, "lr": 5.463482929162842e-05} +{"train_loss": 0.002507217228412628, "global_step": 33855, "epoch": 284, "lr": 5.463262331654332e-05} +{"train_loss": 0.00306347175501287, "global_step": 33856, "epoch": 284, "lr": 5.4630417332362546e-05} +{"train_loss": 0.002683362690731883, "global_step": 33857, "epoch": 284, "lr": 5.4628211339090453e-05} +{"train_loss": 0.002864904934540391, "global_step": 33858, "epoch": 284, "lr": 5.462600533673136e-05} +{"train_loss": 0.003400045447051525, "global_step": 33859, "epoch": 284, "lr": 5.46237993252896e-05} +{"train_loss": 0.0014052552869543433, "global_step": 33860, "epoch": 284, "lr": 5.46215933047695e-05} +{"train_loss": 0.0036171053070575, "global_step": 33861, "epoch": 284, "lr": 5.4619387275175396e-05} +{"train_loss": 0.0019641767721623182, "global_step": 33862, "epoch": 284, "lr": 5.461718123651163e-05} +{"train_loss": 0.0024290895089507103, "global_step": 33863, "epoch": 284, "lr": 5.4614975188782505e-05} +{"train_loss": 0.002551694866269827, "global_step": 33864, "epoch": 284, "lr": 5.461276913199238e-05} +{"train_loss": 0.0027606242801994085, "global_step": 33865, "epoch": 284, "lr": 5.461056306614557e-05} +{"train_loss": 0.0026492951437830925, "global_step": 33866, "epoch": 284, "lr": 5.460835699124642e-05} +{"train_loss": 0.0037341683637350798, "global_step": 33867, "epoch": 284, "lr": 5.460615090729925e-05} +{"train_loss": 0.0014050013851374388, "global_step": 33868, "epoch": 284, "lr": 5.460394481430839e-05} +{"train_loss": 0.0027771545574069023, "global_step": 33869, "epoch": 284, "lr": 5.4601738712278184e-05} +{"train_loss": 0.002668999368324876, "global_step": 33870, "epoch": 284, "lr": 5.4599532601212946e-05} +{"train_loss": 0.0014763395301997662, "global_step": 33871, "epoch": 284, "lr": 5.4597326481117016e-05} +{"train_loss": 0.0024006504099816084, "global_step": 33872, "epoch": 284, "lr": 5.459512035199474e-05} +{"train_loss": 0.003137031104415655, "global_step": 33873, "epoch": 284, "lr": 5.459291421385043e-05} +{"train_loss": 0.0021327678114175797, "global_step": 33874, "epoch": 284, "lr": 5.459070806668842e-05} +{"train_loss": 0.0020127780735492706, "global_step": 33875, "epoch": 284, "lr": 5.4588501910513056e-05} +{"train_loss": 0.0029672093223780394, "global_step": 33876, "epoch": 284, "lr": 5.458629574532864e-05} +{"train_loss": 0.002872155047953129, "global_step": 33877, "epoch": 284, "lr": 5.458408957113954e-05} +{"train_loss": 0.0016426495276391506, "global_step": 33878, "epoch": 284, "lr": 5.458188338795006e-05} +{"train_loss": 0.0020949747413396835, "global_step": 33879, "epoch": 284, "lr": 5.4579677195764546e-05} +{"train_loss": 0.0024189569521695375, "global_step": 33880, "epoch": 284, "lr": 5.457747099458732e-05} +{"train_loss": 0.0019440569449216127, "global_step": 33881, "epoch": 284, "lr": 5.457526478442272e-05} +{"train_loss": 0.00253406073898077, "global_step": 33882, "epoch": 284, "lr": 5.4573058565275074e-05} +{"train_loss": 0.002499084919691086, "global_step": 33883, "epoch": 284, "lr": 5.457085233714872e-05} +{"train_loss": 0.002008038340136409, "global_step": 33884, "epoch": 284, "lr": 5.4568646100047985e-05} +{"train_loss": 0.0029102242551743984, "global_step": 33885, "epoch": 284, "lr": 5.4566439853977215e-05} +{"train_loss": 0.0020740991458296776, "global_step": 33886, "epoch": 284, "lr": 5.456423359894071e-05} +{"train_loss": 0.0029758119489997625, "global_step": 33887, "epoch": 284, "lr": 5.4562027334942825e-05} +{"train_loss": 0.0017082641134038568, "global_step": 33888, "epoch": 284, "lr": 5.455982106198788e-05} +{"train_loss": 0.0018214775482192636, "global_step": 33889, "epoch": 284, "lr": 5.455761478008022e-05} +{"train_loss": 0.002409436507150531, "global_step": 33890, "epoch": 284, "lr": 5.455540848922418e-05} +{"train_loss": 0.003137880237773061, "global_step": 33891, "epoch": 284, "lr": 5.455320218942408e-05} +{"train_loss": 0.0031155806500464678, "global_step": 33892, "epoch": 284, "lr": 5.4550995880684245e-05} +{"train_loss": 0.0020384788513183594, "global_step": 33893, "epoch": 284, "lr": 5.4548789563009016e-05} +{"train_loss": 0.0022115944884717464, "global_step": 33894, "epoch": 284, "lr": 5.4546583236402725e-05} +{"train_loss": 0.0019669574685394764, "global_step": 33895, "epoch": 284, "lr": 5.4544376900869684e-05} +{"train_loss": 0.0010739030549302697, "global_step": 33896, "epoch": 284, "lr": 5.4542170556414275e-05} +{"train_loss": 0.0029920146334916353, "global_step": 33897, "epoch": 284, "lr": 5.453996420304078e-05} +{"train_loss": 0.0012837633257731795, "global_step": 33898, "epoch": 284, "lr": 5.453775784075358e-05} +{"train_loss": 0.002671809634193778, "global_step": 33899, "epoch": 284, "lr": 5.4535551469556956e-05} +{"train_loss": 0.00264246785081923, "global_step": 33900, "epoch": 284, "lr": 5.4533345089455256e-05} +{"train_loss": 0.0015583642525598407, "global_step": 33901, "epoch": 284, "lr": 5.453113870045282e-05} +{"train_loss": 0.0025973659940063953, "global_step": 33902, "epoch": 284, "lr": 5.452893230255398e-05} +{"train_loss": 0.00385949295014143, "global_step": 33903, "epoch": 284, "lr": 5.4526725895763074e-05} +{"train_loss": 0.0029795069713145494, "global_step": 33904, "epoch": 284, "lr": 5.4524519480084425e-05} +{"train_loss": 0.002044966211542487, "global_step": 33905, "epoch": 284, "lr": 5.452231305552235e-05} +{"train_loss": 0.0023316959850490093, "global_step": 33906, "epoch": 284, "lr": 5.452010662208121e-05} +{"train_loss": 0.001681885914877057, "global_step": 33907, "epoch": 284, "lr": 5.4517900179765316e-05} +{"train_loss": 0.003613418899476528, "global_step": 33908, "epoch": 284, "lr": 5.4515693728579006e-05} +{"train_loss": 0.0037950065452605486, "global_step": 33909, "epoch": 284, "lr": 5.451348726852662e-05} +{"train_loss": 0.0027444108854979277, "global_step": 33910, "epoch": 284, "lr": 5.4511280799612485e-05} +{"train_loss": 0.0021442975848913193, "global_step": 33911, "epoch": 284, "lr": 5.450907432184093e-05} +{"train_loss": 0.001657098880968988, "global_step": 33912, "epoch": 284, "lr": 5.4506867835216276e-05} +{"train_loss": 0.0018853727960959077, "global_step": 33913, "epoch": 284, "lr": 5.450466133974288e-05} +{"train_loss": 0.0026375417658245238, "global_step": 33914, "epoch": 284, "lr": 5.450245483542507e-05, "val_loss": 0.01914118602871895} +{"train_loss": 0.0013878218596801162, "global_step": 33915, "epoch": 285, "lr": 5.450024832226716e-05} +{"train_loss": 0.002723407233133912, "global_step": 33916, "epoch": 285, "lr": 5.44980418002735e-05} +{"train_loss": 0.0029071478638798, "global_step": 33917, "epoch": 285, "lr": 5.4495835269448414e-05} +{"train_loss": 0.0016803686739876866, "global_step": 33918, "epoch": 285, "lr": 5.449362872979624e-05} +{"train_loss": 0.0019861971959471703, "global_step": 33919, "epoch": 285, "lr": 5.449142218132129e-05} +{"train_loss": 0.0030387258157134056, "global_step": 33920, "epoch": 285, "lr": 5.448921562402792e-05} +{"train_loss": 0.0021377934608608484, "global_step": 33921, "epoch": 285, "lr": 5.4487009057920465e-05} +{"train_loss": 0.0027365528512746096, "global_step": 33922, "epoch": 285, "lr": 5.448480248300324e-05} +{"train_loss": 0.002199911279603839, "global_step": 33923, "epoch": 285, "lr": 5.4482595899280594e-05} +{"train_loss": 0.0019853049889206886, "global_step": 33924, "epoch": 285, "lr": 5.448038930675684e-05} +{"train_loss": 0.0023865276016294956, "global_step": 33925, "epoch": 285, "lr": 5.447818270543632e-05} +{"train_loss": 0.0027292692102491856, "global_step": 33926, "epoch": 285, "lr": 5.4475976095323366e-05} +{"train_loss": 0.0017252839170396328, "global_step": 33927, "epoch": 285, "lr": 5.447376947642231e-05} +{"train_loss": 0.0019222735427320004, "global_step": 33928, "epoch": 285, "lr": 5.447156284873749e-05} +{"train_loss": 0.004511728882789612, "global_step": 33929, "epoch": 285, "lr": 5.446935621227322e-05} +{"train_loss": 0.00196624593809247, "global_step": 33930, "epoch": 285, "lr": 5.446714956703386e-05} +{"train_loss": 0.0015707853017374873, "global_step": 33931, "epoch": 285, "lr": 5.446494291302373e-05} +{"train_loss": 0.0029443150851875544, "global_step": 33932, "epoch": 285, "lr": 5.446273625024716e-05} +{"train_loss": 0.001948505756445229, "global_step": 33933, "epoch": 285, "lr": 5.446052957870847e-05} +{"train_loss": 0.003191936295479536, "global_step": 33934, "epoch": 285, "lr": 5.445832289841203e-05} +{"train_loss": 0.0025703459978103638, "global_step": 33935, "epoch": 285, "lr": 5.445611620936215e-05} +{"train_loss": 0.0027778090443462133, "global_step": 33936, "epoch": 285, "lr": 5.445390951156315e-05} +{"train_loss": 0.0029053939506411552, "global_step": 33937, "epoch": 285, "lr": 5.4451702805019366e-05} +{"train_loss": 0.0017950993496924639, "global_step": 33938, "epoch": 285, "lr": 5.4449496089735155e-05} +{"train_loss": 0.0022608237341046333, "global_step": 33939, "epoch": 285, "lr": 5.444728936571483e-05} +{"train_loss": 0.0021993641275912523, "global_step": 33940, "epoch": 285, "lr": 5.444508263296272e-05} +{"train_loss": 0.0016967523843050003, "global_step": 33941, "epoch": 285, "lr": 5.444287589148318e-05} +{"train_loss": 0.002568970201537013, "global_step": 33942, "epoch": 285, "lr": 5.444066914128051e-05} +{"train_loss": 0.002870414638891816, "global_step": 33943, "epoch": 285, "lr": 5.443846238235907e-05} +{"train_loss": 0.0018957426073029637, "global_step": 33944, "epoch": 285, "lr": 5.443625561472317e-05} +{"train_loss": 0.003276680363342166, "global_step": 33945, "epoch": 285, "lr": 5.443404883837717e-05} +{"train_loss": 0.001451691729016602, "global_step": 33946, "epoch": 285, "lr": 5.443184205332539e-05} +{"train_loss": 0.0027164858765900135, "global_step": 33947, "epoch": 285, "lr": 5.4429635259572156e-05} +{"train_loss": 0.002635984681546688, "global_step": 33948, "epoch": 285, "lr": 5.442742845712181e-05} +{"train_loss": 0.0029985266737639904, "global_step": 33949, "epoch": 285, "lr": 5.4425221645978685e-05} +{"train_loss": 0.0025475616566836834, "global_step": 33950, "epoch": 285, "lr": 5.44230148261471e-05} +{"train_loss": 0.0017592768417671323, "global_step": 33951, "epoch": 285, "lr": 5.4420807997631406e-05} +{"train_loss": 0.0022728287149220705, "global_step": 33952, "epoch": 285, "lr": 5.4418601160435925e-05} +{"train_loss": 0.0015141317853704095, "global_step": 33953, "epoch": 285, "lr": 5.441639431456499e-05} +{"train_loss": 0.0018838753458112478, "global_step": 33954, "epoch": 285, "lr": 5.4414187460022946e-05} +{"train_loss": 0.002681507496163249, "global_step": 33955, "epoch": 285, "lr": 5.441198059681411e-05} +{"train_loss": 0.0016498627373948693, "global_step": 33956, "epoch": 285, "lr": 5.440977372494281e-05} +{"train_loss": 0.0015558163868263364, "global_step": 33957, "epoch": 285, "lr": 5.4407566844413404e-05} +{"train_loss": 0.0016508289845660329, "global_step": 33958, "epoch": 285, "lr": 5.4405359955230206e-05} +{"train_loss": 0.0017710214015096426, "global_step": 33959, "epoch": 285, "lr": 5.440315305739756e-05} +{"train_loss": 0.0016088486881926656, "global_step": 33960, "epoch": 285, "lr": 5.4400946150919786e-05} +{"train_loss": 0.001350182224996388, "global_step": 33961, "epoch": 285, "lr": 5.439873923580123e-05} +{"train_loss": 0.003154281061142683, "global_step": 33962, "epoch": 285, "lr": 5.439653231204622e-05} +{"train_loss": 0.00403683353215456, "global_step": 33963, "epoch": 285, "lr": 5.439432537965908e-05} +{"train_loss": 0.001957134809345007, "global_step": 33964, "epoch": 285, "lr": 5.4392118438644157e-05} +{"train_loss": 0.0017201807349920273, "global_step": 33965, "epoch": 285, "lr": 5.4389911489005784e-05} +{"train_loss": 0.0014632350066676736, "global_step": 33966, "epoch": 285, "lr": 5.4387704530748296e-05} +{"train_loss": 0.0037154655437916517, "global_step": 33967, "epoch": 285, "lr": 5.4385497563876e-05} +{"train_loss": 0.0018348165322095156, "global_step": 33968, "epoch": 285, "lr": 5.438329058839326e-05} +{"train_loss": 0.0017059362726286054, "global_step": 33969, "epoch": 285, "lr": 5.438108360430438e-05} +{"train_loss": 0.0019085112726315856, "global_step": 33970, "epoch": 285, "lr": 5.437887661161373e-05} +{"train_loss": 0.0016050325939431787, "global_step": 33971, "epoch": 285, "lr": 5.437666961032561e-05} +{"train_loss": 0.0021953564137220383, "global_step": 33972, "epoch": 285, "lr": 5.437446260044438e-05} +{"train_loss": 0.0016107024857774377, "global_step": 33973, "epoch": 285, "lr": 5.437225558197436e-05} +{"train_loss": 0.0020673663821071386, "global_step": 33974, "epoch": 285, "lr": 5.437004855491988e-05} +{"train_loss": 0.0016585254343226552, "global_step": 33975, "epoch": 285, "lr": 5.436784151928527e-05} +{"train_loss": 0.003360635368153453, "global_step": 33976, "epoch": 285, "lr": 5.436563447507488e-05} +{"train_loss": 0.0016403644112870097, "global_step": 33977, "epoch": 285, "lr": 5.436342742229302e-05} +{"train_loss": 0.0025924898218363523, "global_step": 33978, "epoch": 285, "lr": 5.436122036094404e-05} +{"train_loss": 0.001715859747491777, "global_step": 33979, "epoch": 285, "lr": 5.435901329103227e-05} +{"train_loss": 0.0019535415340214968, "global_step": 33980, "epoch": 285, "lr": 5.435680621256205e-05} +{"train_loss": 0.003270604880526662, "global_step": 33981, "epoch": 285, "lr": 5.4354599125537696e-05} +{"train_loss": 0.0019506844691932201, "global_step": 33982, "epoch": 285, "lr": 5.435239202996356e-05} +{"train_loss": 0.0022402696777135134, "global_step": 33983, "epoch": 285, "lr": 5.435018492584396e-05} +{"train_loss": 0.00344522250816226, "global_step": 33984, "epoch": 285, "lr": 5.4347977813183247e-05} +{"train_loss": 0.00283863116055727, "global_step": 33985, "epoch": 285, "lr": 5.4345770691985743e-05} +{"train_loss": 0.002317554783076048, "global_step": 33986, "epoch": 285, "lr": 5.4343563562255786e-05} +{"train_loss": 0.0025883594062179327, "global_step": 33987, "epoch": 285, "lr": 5.434135642399769e-05} +{"train_loss": 0.001997903920710087, "global_step": 33988, "epoch": 285, "lr": 5.4339149277215815e-05} +{"train_loss": 0.0021798519883304834, "global_step": 33989, "epoch": 285, "lr": 5.433694212191448e-05} +{"train_loss": 0.0026593783404678106, "global_step": 33990, "epoch": 285, "lr": 5.433473495809802e-05} +{"train_loss": 0.0014089517062529922, "global_step": 33991, "epoch": 285, "lr": 5.4332527785770784e-05} +{"train_loss": 0.004721195437014103, "global_step": 33992, "epoch": 285, "lr": 5.433032060493709e-05} +{"train_loss": 0.002236375119537115, "global_step": 33993, "epoch": 285, "lr": 5.432811341560126e-05} +{"train_loss": 0.0022250742185860872, "global_step": 33994, "epoch": 285, "lr": 5.432590621776764e-05} +{"train_loss": 0.0029838464688509703, "global_step": 33995, "epoch": 285, "lr": 5.4323699011440576e-05} +{"train_loss": 0.002474702661857009, "global_step": 33996, "epoch": 285, "lr": 5.432149179662439e-05} +{"train_loss": 0.0024936413392424583, "global_step": 33997, "epoch": 285, "lr": 5.4319284573323415e-05} +{"train_loss": 0.0025016546715050936, "global_step": 33998, "epoch": 285, "lr": 5.4317077341542e-05} +{"train_loss": 0.0021397601813077927, "global_step": 33999, "epoch": 285, "lr": 5.431487010128444e-05} +{"train_loss": 0.0026095393113791943, "global_step": 34000, "epoch": 285, "lr": 5.4312662852555116e-05} +{"train_loss": 0.003734034951776266, "global_step": 34001, "epoch": 285, "lr": 5.431045559535832e-05} +{"train_loss": 0.0027582210022956133, "global_step": 34002, "epoch": 285, "lr": 5.430824832969842e-05} +{"train_loss": 0.0034777738619595766, "global_step": 34003, "epoch": 285, "lr": 5.4306041055579724e-05} +{"train_loss": 0.0014434574404731393, "global_step": 34004, "epoch": 285, "lr": 5.4303833773006595e-05} +{"train_loss": 0.002384468913078308, "global_step": 34005, "epoch": 285, "lr": 5.4301626481983336e-05} +{"train_loss": 0.00300102261826396, "global_step": 34006, "epoch": 285, "lr": 5.429941918251429e-05} +{"train_loss": 0.0028460121247917414, "global_step": 34007, "epoch": 285, "lr": 5.429721187460379e-05} +{"train_loss": 0.002549250377342105, "global_step": 34008, "epoch": 285, "lr": 5.429500455825618e-05} +{"train_loss": 0.0013866409426555037, "global_step": 34009, "epoch": 285, "lr": 5.429279723347578e-05} +{"train_loss": 0.0034001613967120647, "global_step": 34010, "epoch": 285, "lr": 5.4290589900266943e-05} +{"train_loss": 0.0028401310555636883, "global_step": 34011, "epoch": 285, "lr": 5.4288382558633974e-05} +{"train_loss": 0.004651197232306004, "global_step": 34012, "epoch": 285, "lr": 5.4286175208581233e-05} +{"train_loss": 0.0019194567576050758, "global_step": 34013, "epoch": 285, "lr": 5.428396785011306e-05} +{"train_loss": 0.0018114919075742364, "global_step": 34014, "epoch": 285, "lr": 5.4281760483233757e-05} +{"train_loss": 0.0027240351773798466, "global_step": 34015, "epoch": 285, "lr": 5.427955310794768e-05} +{"train_loss": 0.003014153568074107, "global_step": 34016, "epoch": 285, "lr": 5.427734572425915e-05} +{"train_loss": 0.002181325340643525, "global_step": 34017, "epoch": 285, "lr": 5.4275138332172524e-05} +{"train_loss": 0.0025440386962145567, "global_step": 34018, "epoch": 285, "lr": 5.427293093169211e-05} +{"train_loss": 0.002132547553628683, "global_step": 34019, "epoch": 285, "lr": 5.4270723522822255e-05} +{"train_loss": 0.0037288847379386425, "global_step": 34020, "epoch": 285, "lr": 5.426851610556729e-05} +{"train_loss": 0.0025054295547306538, "global_step": 34021, "epoch": 285, "lr": 5.4266308679931556e-05} +{"train_loss": 0.0017972076311707497, "global_step": 34022, "epoch": 285, "lr": 5.4264101245919364e-05} +{"train_loss": 0.0021855838131159544, "global_step": 34023, "epoch": 285, "lr": 5.426189380353509e-05} +{"train_loss": 0.0016588877188041806, "global_step": 34024, "epoch": 285, "lr": 5.425968635278302e-05} +{"train_loss": 0.0012901279842481017, "global_step": 34025, "epoch": 285, "lr": 5.4257478893667525e-05} +{"train_loss": 0.0035887155681848526, "global_step": 34026, "epoch": 285, "lr": 5.425527142619291e-05} +{"train_loss": 0.0027381102554500103, "global_step": 34027, "epoch": 285, "lr": 5.4253063950363536e-05} +{"train_loss": 0.0038503038231283426, "global_step": 34028, "epoch": 285, "lr": 5.425085646618371e-05} +{"train_loss": 0.0024766423739492893, "global_step": 34029, "epoch": 285, "lr": 5.424864897365781e-05} +{"train_loss": 0.0026795940939337015, "global_step": 34030, "epoch": 285, "lr": 5.4246441472790123e-05} +{"train_loss": 0.0030126390047371387, "global_step": 34031, "epoch": 285, "lr": 5.4244233963585e-05} +{"train_loss": 0.0024996274150907993, "global_step": 34032, "epoch": 285, "lr": 5.4242026446046775e-05} +{"train_loss": 0.002410994597100222, "global_step": 34033, "epoch": 285, "lr": 5.42398189201798e-05, "val_loss": 0.025060400366783142, "train_action_mse_error": 3.8107486034277827e-05} +{"train_loss": 0.004025597590953112, "global_step": 34034, "epoch": 286, "lr": 5.423761138598839e-05} +{"train_loss": 0.0023960822727531195, "global_step": 34035, "epoch": 286, "lr": 5.423540384347687e-05} +{"train_loss": 0.0019611050374805927, "global_step": 34036, "epoch": 286, "lr": 5.42331962926496e-05} +{"train_loss": 0.0041481140069663525, "global_step": 34037, "epoch": 286, "lr": 5.423098873351089e-05} +{"train_loss": 0.0021415655501186848, "global_step": 34038, "epoch": 286, "lr": 5.422878116606509e-05} +{"train_loss": 0.002528885845094919, "global_step": 34039, "epoch": 286, "lr": 5.422657359031653e-05} +{"train_loss": 0.0026688186917454004, "global_step": 34040, "epoch": 286, "lr": 5.4224366006269544e-05} +{"train_loss": 0.002660160418599844, "global_step": 34041, "epoch": 286, "lr": 5.422215841392847e-05} +{"train_loss": 0.004700005054473877, "global_step": 34042, "epoch": 286, "lr": 5.421995081329764e-05} +{"train_loss": 0.0019737286493182182, "global_step": 34043, "epoch": 286, "lr": 5.421774320438138e-05} +{"train_loss": 0.002369652036577463, "global_step": 34044, "epoch": 286, "lr": 5.421553558718404e-05} +{"train_loss": 0.0032448945567011833, "global_step": 34045, "epoch": 286, "lr": 5.421332796170994e-05} +{"train_loss": 0.0030037604738026857, "global_step": 34046, "epoch": 286, "lr": 5.421112032796341e-05} +{"train_loss": 0.003053424647077918, "global_step": 34047, "epoch": 286, "lr": 5.4208912685948824e-05} +{"train_loss": 0.0021944274194538593, "global_step": 34048, "epoch": 286, "lr": 5.4206705035670466e-05} +{"train_loss": 0.003406087402254343, "global_step": 34049, "epoch": 286, "lr": 5.42044973771327e-05} +{"train_loss": 0.0017619647551327944, "global_step": 34050, "epoch": 286, "lr": 5.420228971033986e-05} +{"train_loss": 0.0017365270759910345, "global_step": 34051, "epoch": 286, "lr": 5.420008203529625e-05} +{"train_loss": 0.0035899383947253227, "global_step": 34052, "epoch": 286, "lr": 5.419787435200625e-05} +{"train_loss": 0.002231583697721362, "global_step": 34053, "epoch": 286, "lr": 5.4195666660474165e-05} +{"train_loss": 0.0016321665607392788, "global_step": 34054, "epoch": 286, "lr": 5.4193458960704336e-05} +{"train_loss": 0.003082935931161046, "global_step": 34055, "epoch": 286, "lr": 5.41912512527011e-05} +{"train_loss": 0.003469873685389757, "global_step": 34056, "epoch": 286, "lr": 5.418904353646879e-05} +{"train_loss": 0.002471013693138957, "global_step": 34057, "epoch": 286, "lr": 5.4186835812011737e-05} +{"train_loss": 0.0021094141993671656, "global_step": 34058, "epoch": 286, "lr": 5.418462807933428e-05} +{"train_loss": 0.002564126392826438, "global_step": 34059, "epoch": 286, "lr": 5.418242033844074e-05} +{"train_loss": 0.0015301728853955865, "global_step": 34060, "epoch": 286, "lr": 5.4180212589335485e-05} +{"train_loss": 0.003584236139431596, "global_step": 34061, "epoch": 286, "lr": 5.4178004832022825e-05} +{"train_loss": 0.0028338960837572813, "global_step": 34062, "epoch": 286, "lr": 5.4175797066507085e-05} +{"train_loss": 0.0020169680938124657, "global_step": 34063, "epoch": 286, "lr": 5.417358929279263e-05} +{"train_loss": 0.003865416394546628, "global_step": 34064, "epoch": 286, "lr": 5.417138151088377e-05} +{"train_loss": 0.003006932558491826, "global_step": 34065, "epoch": 286, "lr": 5.416917372078485e-05} +{"train_loss": 0.0031776295509189367, "global_step": 34066, "epoch": 286, "lr": 5.4166965922500204e-05} +{"train_loss": 0.0028771471697837114, "global_step": 34067, "epoch": 286, "lr": 5.4164758116034175e-05} +{"train_loss": 0.0021347790025174618, "global_step": 34068, "epoch": 286, "lr": 5.4162550301391065e-05} +{"train_loss": 0.0015184861840680242, "global_step": 34069, "epoch": 286, "lr": 5.4160342478575254e-05} +{"train_loss": 0.0023571259807795286, "global_step": 34070, "epoch": 286, "lr": 5.415813464759104e-05} +{"train_loss": 0.0029043941758573055, "global_step": 34071, "epoch": 286, "lr": 5.415592680844278e-05} +{"train_loss": 0.0028521690983325243, "global_step": 34072, "epoch": 286, "lr": 5.41537189611348e-05} +{"train_loss": 0.0032210436183959246, "global_step": 34073, "epoch": 286, "lr": 5.415151110567145e-05} +{"train_loss": 0.003747229464352131, "global_step": 34074, "epoch": 286, "lr": 5.4149303242057034e-05} +{"train_loss": 0.002481450093910098, "global_step": 34075, "epoch": 286, "lr": 5.414709537029591e-05} +{"train_loss": 0.0033328423742204905, "global_step": 34076, "epoch": 286, "lr": 5.41448874903924e-05} +{"train_loss": 0.0020603572484105825, "global_step": 34077, "epoch": 286, "lr": 5.4142679602350846e-05} +{"train_loss": 0.002317161997780204, "global_step": 34078, "epoch": 286, "lr": 5.414047170617559e-05} +{"train_loss": 0.0019145526457577944, "global_step": 34079, "epoch": 286, "lr": 5.413826380187097e-05} +{"train_loss": 0.0024533160030841827, "global_step": 34080, "epoch": 286, "lr": 5.413605588944131e-05} +{"train_loss": 0.0026193198282271624, "global_step": 34081, "epoch": 286, "lr": 5.4133847968890924e-05} +{"train_loss": 0.0018518409924581647, "global_step": 34082, "epoch": 286, "lr": 5.413164004022418e-05} +{"train_loss": 0.003915002103894949, "global_step": 34083, "epoch": 286, "lr": 5.412943210344541e-05} +{"train_loss": 0.002339158672839403, "global_step": 34084, "epoch": 286, "lr": 5.412722415855893e-05} +{"train_loss": 0.0021807742305099964, "global_step": 34085, "epoch": 286, "lr": 5.41250162055691e-05} +{"train_loss": 0.0012677193153649569, "global_step": 34086, "epoch": 286, "lr": 5.4122808244480236e-05} +{"train_loss": 0.004445546306669712, "global_step": 34087, "epoch": 286, "lr": 5.4120600275296684e-05} +{"train_loss": 0.0031665535643696785, "global_step": 34088, "epoch": 286, "lr": 5.411839229802276e-05} +{"train_loss": 0.001545788487419486, "global_step": 34089, "epoch": 286, "lr": 5.4116184312662824e-05} +{"train_loss": 0.0026888721622526646, "global_step": 34090, "epoch": 286, "lr": 5.411397631922118e-05} +{"train_loss": 0.002949389396235347, "global_step": 34091, "epoch": 286, "lr": 5.41117683177022e-05} +{"train_loss": 0.0025899182073771954, "global_step": 34092, "epoch": 286, "lr": 5.41095603081102e-05} +{"train_loss": 0.00436383904889226, "global_step": 34093, "epoch": 286, "lr": 5.410735229044952e-05} +{"train_loss": 0.0034754250664263964, "global_step": 34094, "epoch": 286, "lr": 5.4105144264724486e-05} +{"train_loss": 0.0017544181318953633, "global_step": 34095, "epoch": 286, "lr": 5.410293623093944e-05} +{"train_loss": 0.0029827833641320467, "global_step": 34096, "epoch": 286, "lr": 5.410072818909873e-05} +{"train_loss": 0.0021461453288793564, "global_step": 34097, "epoch": 286, "lr": 5.409852013920665e-05} +{"train_loss": 0.0026276730932295322, "global_step": 34098, "epoch": 286, "lr": 5.40963120812676e-05} +{"train_loss": 0.0027866086456924677, "global_step": 34099, "epoch": 286, "lr": 5.409410401528586e-05} +{"train_loss": 0.001648051431402564, "global_step": 34100, "epoch": 286, "lr": 5.409189594126578e-05} +{"train_loss": 0.002861989429220557, "global_step": 34101, "epoch": 286, "lr": 5.408968785921171e-05} +{"train_loss": 0.002144950209185481, "global_step": 34102, "epoch": 286, "lr": 5.408747976912797e-05} +{"train_loss": 0.0015309343580156565, "global_step": 34103, "epoch": 286, "lr": 5.40852716710189e-05} +{"train_loss": 0.0009542275220155716, "global_step": 34104, "epoch": 286, "lr": 5.408306356488884e-05} +{"train_loss": 0.0027364143170416355, "global_step": 34105, "epoch": 286, "lr": 5.408085545074212e-05} +{"train_loss": 0.003043781267479062, "global_step": 34106, "epoch": 286, "lr": 5.4078647328583063e-05} +{"train_loss": 0.001360989874228835, "global_step": 34107, "epoch": 286, "lr": 5.407643919841603e-05} +{"train_loss": 0.0031619796063750982, "global_step": 34108, "epoch": 286, "lr": 5.4074231060245336e-05} +{"train_loss": 0.003165310947224498, "global_step": 34109, "epoch": 286, "lr": 5.407202291407534e-05} +{"train_loss": 0.004305921029299498, "global_step": 34110, "epoch": 286, "lr": 5.4069814759910344e-05} +{"train_loss": 0.0025969622656702995, "global_step": 34111, "epoch": 286, "lr": 5.40676065977547e-05} +{"train_loss": 0.0012478881981223822, "global_step": 34112, "epoch": 286, "lr": 5.406539842761276e-05} +{"train_loss": 0.0019509188132360578, "global_step": 34113, "epoch": 286, "lr": 5.406319024948884e-05} +{"train_loss": 0.0027516481932252645, "global_step": 34114, "epoch": 286, "lr": 5.406098206338728e-05} +{"train_loss": 0.001456776401028037, "global_step": 34115, "epoch": 286, "lr": 5.4058773869312405e-05} +{"train_loss": 0.0031161655206233263, "global_step": 34116, "epoch": 286, "lr": 5.405656566726858e-05} +{"train_loss": 0.0022254229988902807, "global_step": 34117, "epoch": 286, "lr": 5.4054357457260116e-05} +{"train_loss": 0.002738937269896269, "global_step": 34118, "epoch": 286, "lr": 5.405214923929135e-05} +{"train_loss": 0.0018208767287433147, "global_step": 34119, "epoch": 286, "lr": 5.4049941013366625e-05} +{"train_loss": 0.0033774515613913536, "global_step": 34120, "epoch": 286, "lr": 5.404773277949027e-05} +{"train_loss": 0.0030004442669451237, "global_step": 34121, "epoch": 286, "lr": 5.404552453766663e-05} +{"train_loss": 0.00227328110486269, "global_step": 34122, "epoch": 286, "lr": 5.404331628790002e-05} +{"train_loss": 0.003114960389211774, "global_step": 34123, "epoch": 286, "lr": 5.404110803019481e-05} +{"train_loss": 0.003050853032618761, "global_step": 34124, "epoch": 286, "lr": 5.403889976455531e-05} +{"train_loss": 0.002311964286491275, "global_step": 34125, "epoch": 286, "lr": 5.4036691490985845e-05} +{"train_loss": 0.003036780981346965, "global_step": 34126, "epoch": 286, "lr": 5.403448320949078e-05} +{"train_loss": 0.003164985915645957, "global_step": 34127, "epoch": 286, "lr": 5.403227492007443e-05} +{"train_loss": 0.0018493036041036248, "global_step": 34128, "epoch": 286, "lr": 5.403006662274115e-05} +{"train_loss": 0.003949841018766165, "global_step": 34129, "epoch": 286, "lr": 5.4027858317495274e-05} +{"train_loss": 0.0036449814215302467, "global_step": 34130, "epoch": 286, "lr": 5.402565000434112e-05} +{"train_loss": 0.0033985553309321404, "global_step": 34131, "epoch": 286, "lr": 5.402344168328303e-05} +{"train_loss": 0.00202800240367651, "global_step": 34132, "epoch": 286, "lr": 5.402123335432534e-05} +{"train_loss": 0.0028837176505476236, "global_step": 34133, "epoch": 286, "lr": 5.401902501747238e-05} +{"train_loss": 0.0025085946545004845, "global_step": 34134, "epoch": 286, "lr": 5.4016816672728506e-05} +{"train_loss": 0.002861839486286044, "global_step": 34135, "epoch": 286, "lr": 5.401460832009804e-05} +{"train_loss": 0.0033452012576162815, "global_step": 34136, "epoch": 286, "lr": 5.4012399959585325e-05} +{"train_loss": 0.0017142633441835642, "global_step": 34137, "epoch": 286, "lr": 5.4010191591194684e-05} +{"train_loss": 0.0030948552303016186, "global_step": 34138, "epoch": 286, "lr": 5.400798321493046e-05} +{"train_loss": 0.0034008785150945187, "global_step": 34139, "epoch": 286, "lr": 5.4005774830797e-05} +{"train_loss": 0.002103580627590418, "global_step": 34140, "epoch": 286, "lr": 5.40035664387986e-05} +{"train_loss": 0.0035022255033254623, "global_step": 34141, "epoch": 286, "lr": 5.4001358038939656e-05} +{"train_loss": 0.004481187090277672, "global_step": 34142, "epoch": 286, "lr": 5.399914963122445e-05} +{"train_loss": 0.0038688238710165024, "global_step": 34143, "epoch": 286, "lr": 5.399694121565736e-05} +{"train_loss": 0.0024441007990390062, "global_step": 34144, "epoch": 286, "lr": 5.399473279224268e-05} +{"train_loss": 0.0015738090733066201, "global_step": 34145, "epoch": 286, "lr": 5.3992524360984796e-05} +{"train_loss": 0.002499577822163701, "global_step": 34146, "epoch": 286, "lr": 5.3990315921888005e-05} +{"train_loss": 0.0015951144741848111, "global_step": 34147, "epoch": 286, "lr": 5.3988107474956654e-05} +{"train_loss": 0.002607561182230711, "global_step": 34148, "epoch": 286, "lr": 5.3985899020195086e-05} +{"train_loss": 0.0033524674363434315, "global_step": 34149, "epoch": 286, "lr": 5.3983690557607626e-05} +{"train_loss": 0.0021885428577661514, "global_step": 34150, "epoch": 286, "lr": 5.398148208719861e-05} +{"train_loss": 0.0014925420982763171, "global_step": 34151, "epoch": 286, "lr": 5.397927360897239e-05} +{"train_loss": 0.00268659766415181, "global_step": 34152, "epoch": 286, "lr": 5.397706512293328e-05, "val_loss": 0.022094562649726868} +{"train_loss": 0.002301675733178854, "global_step": 34153, "epoch": 287, "lr": 5.3974856629085634e-05} +{"train_loss": 0.0038838174659758806, "global_step": 34154, "epoch": 287, "lr": 5.3972648127433786e-05} +{"train_loss": 0.0027450521010905504, "global_step": 34155, "epoch": 287, "lr": 5.397043961798207e-05} +{"train_loss": 0.0026341502089053392, "global_step": 34156, "epoch": 287, "lr": 5.396823110073481e-05} +{"train_loss": 0.0023235694970935583, "global_step": 34157, "epoch": 287, "lr": 5.396602257569635e-05} +{"train_loss": 0.0018860033014789224, "global_step": 34158, "epoch": 287, "lr": 5.396381404287103e-05} +{"train_loss": 0.002135010901838541, "global_step": 34159, "epoch": 287, "lr": 5.396160550226319e-05} +{"train_loss": 0.0031604852993041277, "global_step": 34160, "epoch": 287, "lr": 5.395939695387715e-05} +{"train_loss": 0.001947716809809208, "global_step": 34161, "epoch": 287, "lr": 5.395718839771727e-05} +{"train_loss": 0.002842248184606433, "global_step": 34162, "epoch": 287, "lr": 5.3954979833787876e-05} +{"train_loss": 0.0037232458125799894, "global_step": 34163, "epoch": 287, "lr": 5.3952771262093295e-05} +{"train_loss": 0.0024140786845237017, "global_step": 34164, "epoch": 287, "lr": 5.395056268263786e-05} +{"train_loss": 0.002135257702320814, "global_step": 34165, "epoch": 287, "lr": 5.394835409542593e-05} +{"train_loss": 0.002955386182293296, "global_step": 34166, "epoch": 287, "lr": 5.394614550046182e-05} +{"train_loss": 0.0013871273258700967, "global_step": 34167, "epoch": 287, "lr": 5.3943936897749894e-05} +{"train_loss": 0.0014196232659742236, "global_step": 34168, "epoch": 287, "lr": 5.3941728287294455e-05} +{"train_loss": 0.0028722803108394146, "global_step": 34169, "epoch": 287, "lr": 5.393951966909986e-05} +{"train_loss": 0.001981679117307067, "global_step": 34170, "epoch": 287, "lr": 5.393731104317042e-05} +{"train_loss": 0.0030593029223382473, "global_step": 34171, "epoch": 287, "lr": 5.393510240951051e-05} +{"train_loss": 0.0027362604159861803, "global_step": 34172, "epoch": 287, "lr": 5.3932893768124436e-05} +{"train_loss": 0.00226675090380013, "global_step": 34173, "epoch": 287, "lr": 5.3930685119016566e-05} +{"train_loss": 0.0022493144497275352, "global_step": 34174, "epoch": 287, "lr": 5.392847646219118e-05} +{"train_loss": 0.002552320947870612, "global_step": 34175, "epoch": 287, "lr": 5.392626779765268e-05} +{"train_loss": 0.0019834216218441725, "global_step": 34176, "epoch": 287, "lr": 5.392405912540536e-05} +{"train_loss": 0.0018105837516486645, "global_step": 34177, "epoch": 287, "lr": 5.392185044545357e-05} +{"train_loss": 0.0017993712099269032, "global_step": 34178, "epoch": 287, "lr": 5.391964175780164e-05} +{"train_loss": 0.0020782637875527143, "global_step": 34179, "epoch": 287, "lr": 5.391743306245392e-05} +{"train_loss": 0.0028493034187704325, "global_step": 34180, "epoch": 287, "lr": 5.391522435941475e-05} +{"train_loss": 0.002672687405720353, "global_step": 34181, "epoch": 287, "lr": 5.391301564868844e-05} +{"train_loss": 0.002456079702824354, "global_step": 34182, "epoch": 287, "lr": 5.391080693027935e-05} +{"train_loss": 0.0022454671561717987, "global_step": 34183, "epoch": 287, "lr": 5.3908598204191795e-05} +{"train_loss": 0.0024502102751284838, "global_step": 34184, "epoch": 287, "lr": 5.390638947043013e-05} +{"train_loss": 0.0018869099440053105, "global_step": 34185, "epoch": 287, "lr": 5.3904180728998686e-05} +{"train_loss": 0.004681482445448637, "global_step": 34186, "epoch": 287, "lr": 5.390197197990182e-05} +{"train_loss": 0.001921853399835527, "global_step": 34187, "epoch": 287, "lr": 5.389976322314383e-05} +{"train_loss": 0.002161562442779541, "global_step": 34188, "epoch": 287, "lr": 5.3897554458729074e-05} +{"train_loss": 0.002246574265882373, "global_step": 34189, "epoch": 287, "lr": 5.389534568666189e-05} +{"train_loss": 0.0051286350935697556, "global_step": 34190, "epoch": 287, "lr": 5.389313690694661e-05} +{"train_loss": 0.002195334527641535, "global_step": 34191, "epoch": 287, "lr": 5.389092811958756e-05} +{"train_loss": 0.002855897881090641, "global_step": 34192, "epoch": 287, "lr": 5.38887193245891e-05} +{"train_loss": 0.0017416994087398052, "global_step": 34193, "epoch": 287, "lr": 5.3886510521955547e-05} +{"train_loss": 0.002427946077659726, "global_step": 34194, "epoch": 287, "lr": 5.3884301711691256e-05} +{"train_loss": 0.003041754476726055, "global_step": 34195, "epoch": 287, "lr": 5.388209289380055e-05} +{"train_loss": 0.002463981043547392, "global_step": 34196, "epoch": 287, "lr": 5.3879884068287764e-05} +{"train_loss": 0.003604016499593854, "global_step": 34197, "epoch": 287, "lr": 5.387767523515724e-05} +{"train_loss": 0.0023946156725287437, "global_step": 34198, "epoch": 287, "lr": 5.387546639441333e-05} +{"train_loss": 0.003567993873730302, "global_step": 34199, "epoch": 287, "lr": 5.387325754606035e-05} +{"train_loss": 0.003867698134854436, "global_step": 34200, "epoch": 287, "lr": 5.387104869010263e-05} +{"train_loss": 0.0022221780382096767, "global_step": 34201, "epoch": 287, "lr": 5.386883982654452e-05} +{"train_loss": 0.002778264693915844, "global_step": 34202, "epoch": 287, "lr": 5.3866630955390375e-05} +{"train_loss": 0.002809516154229641, "global_step": 34203, "epoch": 287, "lr": 5.3864422076644494e-05} +{"train_loss": 0.0020056762732565403, "global_step": 34204, "epoch": 287, "lr": 5.386221319031125e-05} +{"train_loss": 0.002144990488886833, "global_step": 34205, "epoch": 287, "lr": 5.386000429639496e-05} +{"train_loss": 0.002969103865325451, "global_step": 34206, "epoch": 287, "lr": 5.385779539489996e-05} +{"train_loss": 0.0038276580162346363, "global_step": 34207, "epoch": 287, "lr": 5.385558648583059e-05} +{"train_loss": 0.003060380695387721, "global_step": 34208, "epoch": 287, "lr": 5.385337756919118e-05} +{"train_loss": 0.0013675641966983676, "global_step": 34209, "epoch": 287, "lr": 5.3851168644986075e-05} +{"train_loss": 0.0034662282560020685, "global_step": 34210, "epoch": 287, "lr": 5.384895971321962e-05} +{"train_loss": 0.002964295679703355, "global_step": 34211, "epoch": 287, "lr": 5.384675077389615e-05} +{"train_loss": 0.0016353634418919683, "global_step": 34212, "epoch": 287, "lr": 5.384454182701998e-05} +{"train_loss": 0.002839372493326664, "global_step": 34213, "epoch": 287, "lr": 5.384233287259547e-05} +{"train_loss": 0.0017527827294543386, "global_step": 34214, "epoch": 287, "lr": 5.384012391062695e-05} +{"train_loss": 0.0019167830469086766, "global_step": 34215, "epoch": 287, "lr": 5.383791494111876e-05} +{"train_loss": 0.002502691000699997, "global_step": 34216, "epoch": 287, "lr": 5.3835705964075225e-05} +{"train_loss": 0.003571567125618458, "global_step": 34217, "epoch": 287, "lr": 5.383349697950071e-05} +{"train_loss": 0.0031286231242120266, "global_step": 34218, "epoch": 287, "lr": 5.383128798739951e-05} +{"train_loss": 0.002091451548039913, "global_step": 34219, "epoch": 287, "lr": 5.3829078987776005e-05} +{"train_loss": 0.003280150704085827, "global_step": 34220, "epoch": 287, "lr": 5.382686998063451e-05} +{"train_loss": 0.003086027456447482, "global_step": 34221, "epoch": 287, "lr": 5.3824660965979355e-05} +{"train_loss": 0.002293533179908991, "global_step": 34222, "epoch": 287, "lr": 5.382245194381489e-05} +{"train_loss": 0.002930615795776248, "global_step": 34223, "epoch": 287, "lr": 5.3820242914145446e-05} +{"train_loss": 0.0014837725320830941, "global_step": 34224, "epoch": 287, "lr": 5.381803387697536e-05} +{"train_loss": 0.0014629106735810637, "global_step": 34225, "epoch": 287, "lr": 5.381582483230898e-05} +{"train_loss": 0.0028501441702246666, "global_step": 34226, "epoch": 287, "lr": 5.381361578015064e-05} +{"train_loss": 0.0028382311575114727, "global_step": 34227, "epoch": 287, "lr": 5.3811406720504664e-05} +{"train_loss": 0.001825000741519034, "global_step": 34228, "epoch": 287, "lr": 5.3809197653375396e-05} +{"train_loss": 0.00151549419388175, "global_step": 34229, "epoch": 287, "lr": 5.380698857876718e-05} +{"train_loss": 0.0028274348005652428, "global_step": 34230, "epoch": 287, "lr": 5.3804779496684365e-05} +{"train_loss": 0.0025847216602414846, "global_step": 34231, "epoch": 287, "lr": 5.380257040713125e-05} +{"train_loss": 0.0021530024241656065, "global_step": 34232, "epoch": 287, "lr": 5.38003613101122e-05} +{"train_loss": 0.0026826029643416405, "global_step": 34233, "epoch": 287, "lr": 5.3798152205631544e-05} +{"train_loss": 0.0018087198259308934, "global_step": 34234, "epoch": 287, "lr": 5.379594309369362e-05} +{"train_loss": 0.001760023646056652, "global_step": 34235, "epoch": 287, "lr": 5.3793733974302775e-05} +{"train_loss": 0.0023270421661436558, "global_step": 34236, "epoch": 287, "lr": 5.379152484746335e-05} +{"train_loss": 0.002135190647095442, "global_step": 34237, "epoch": 287, "lr": 5.3789315713179656e-05} +{"train_loss": 0.002587466035038233, "global_step": 34238, "epoch": 287, "lr": 5.3787106571456045e-05} +{"train_loss": 0.0037384768947958946, "global_step": 34239, "epoch": 287, "lr": 5.3784897422296854e-05} +{"train_loss": 0.004879290238022804, "global_step": 34240, "epoch": 287, "lr": 5.3782688265706426e-05} +{"train_loss": 0.003772723488509655, "global_step": 34241, "epoch": 287, "lr": 5.3780479101689084e-05} +{"train_loss": 0.0020474379416555166, "global_step": 34242, "epoch": 287, "lr": 5.377826993024918e-05} +{"train_loss": 0.001553653390146792, "global_step": 34243, "epoch": 287, "lr": 5.3776060751391054e-05} +{"train_loss": 0.0030434008222073317, "global_step": 34244, "epoch": 287, "lr": 5.3773851565119027e-05} +{"train_loss": 0.003105641109868884, "global_step": 34245, "epoch": 287, "lr": 5.3771642371437446e-05} +{"train_loss": 0.0027880393899977207, "global_step": 34246, "epoch": 287, "lr": 5.3769433170350656e-05} +{"train_loss": 0.002300735330209136, "global_step": 34247, "epoch": 287, "lr": 5.376722396186298e-05} +{"train_loss": 0.0020994406659156084, "global_step": 34248, "epoch": 287, "lr": 5.376501474597877e-05} +{"train_loss": 0.0031898529268801212, "global_step": 34249, "epoch": 287, "lr": 5.376280552270235e-05} +{"train_loss": 0.003234636737033725, "global_step": 34250, "epoch": 287, "lr": 5.3760596292038065e-05} +{"train_loss": 0.0014801828656345606, "global_step": 34251, "epoch": 287, "lr": 5.3758387053990254e-05} +{"train_loss": 0.0026480057276785374, "global_step": 34252, "epoch": 287, "lr": 5.375617780856325e-05} +{"train_loss": 0.002466802950948477, "global_step": 34253, "epoch": 287, "lr": 5.375396855576138e-05} +{"train_loss": 0.0025432570837438107, "global_step": 34254, "epoch": 287, "lr": 5.3751759295588997e-05} +{"train_loss": 0.0026085868012160063, "global_step": 34255, "epoch": 287, "lr": 5.374955002805045e-05} +{"train_loss": 0.0030958738643676043, "global_step": 34256, "epoch": 287, "lr": 5.374734075315007e-05} +{"train_loss": 0.0016928281402215362, "global_step": 34257, "epoch": 287, "lr": 5.3745131470892164e-05} +{"train_loss": 0.002460864605382085, "global_step": 34258, "epoch": 287, "lr": 5.374292218128109e-05} +{"train_loss": 0.0019494519801810384, "global_step": 34259, "epoch": 287, "lr": 5.3740712884321186e-05} +{"train_loss": 0.0037623245734721422, "global_step": 34260, "epoch": 287, "lr": 5.373850358001681e-05} +{"train_loss": 0.0033919927664101124, "global_step": 34261, "epoch": 287, "lr": 5.373629426837228e-05} +{"train_loss": 0.0019922470673918724, "global_step": 34262, "epoch": 287, "lr": 5.3734084949391926e-05} +{"train_loss": 0.0032886923290789127, "global_step": 34263, "epoch": 287, "lr": 5.373187562308011e-05} +{"train_loss": 0.0024995622225105762, "global_step": 34264, "epoch": 287, "lr": 5.372966628944114e-05} +{"train_loss": 0.004210652783513069, "global_step": 34265, "epoch": 287, "lr": 5.372745694847937e-05} +{"train_loss": 0.0021465665195137262, "global_step": 34266, "epoch": 287, "lr": 5.372524760019914e-05} +{"train_loss": 0.004077205900102854, "global_step": 34267, "epoch": 287, "lr": 5.37230382446048e-05} +{"train_loss": 0.0022412012331187725, "global_step": 34268, "epoch": 287, "lr": 5.372082888170065e-05} +{"train_loss": 0.00249952613376081, "global_step": 34269, "epoch": 287, "lr": 5.371861951149105e-05} +{"train_loss": 0.003725355491042137, "global_step": 34270, "epoch": 287, "lr": 5.3716410133980345e-05} +{"train_loss": 0.002627312214536389, "global_step": 34271, "epoch": 287, "lr": 5.371420074917286e-05, "val_loss": 0.023606911301612854} +{"train_loss": 0.0021296825725585222, "global_step": 34272, "epoch": 288, "lr": 5.3711991357072945e-05} +{"train_loss": 0.0016819997690618038, "global_step": 34273, "epoch": 288, "lr": 5.370978195768493e-05} +{"train_loss": 0.003128918819129467, "global_step": 34274, "epoch": 288, "lr": 5.370757255101315e-05} +{"train_loss": 0.005010225810110569, "global_step": 34275, "epoch": 288, "lr": 5.3705363137061946e-05} +{"train_loss": 0.002218793146312237, "global_step": 34276, "epoch": 288, "lr": 5.370315371583568e-05} +{"train_loss": 0.001876343972980976, "global_step": 34277, "epoch": 288, "lr": 5.370094428733864e-05} +{"train_loss": 0.0022413190454244614, "global_step": 34278, "epoch": 288, "lr": 5.369873485157519e-05} +{"train_loss": 0.002848427277058363, "global_step": 34279, "epoch": 288, "lr": 5.369652540854969e-05} +{"train_loss": 0.0027414083015173674, "global_step": 34280, "epoch": 288, "lr": 5.369431595826646e-05} +{"train_loss": 0.0015713806496933103, "global_step": 34281, "epoch": 288, "lr": 5.369210650072982e-05} +{"train_loss": 0.002251026453450322, "global_step": 34282, "epoch": 288, "lr": 5.368989703594413e-05} +{"train_loss": 0.0028995394241064787, "global_step": 34283, "epoch": 288, "lr": 5.368768756391371e-05} +{"train_loss": 0.002902450505644083, "global_step": 34284, "epoch": 288, "lr": 5.368547808464292e-05} +{"train_loss": 0.003885182086378336, "global_step": 34285, "epoch": 288, "lr": 5.3683268598136084e-05} +{"train_loss": 0.0030664510559290648, "global_step": 34286, "epoch": 288, "lr": 5.368105910439756e-05} +{"train_loss": 0.004591600503772497, "global_step": 34287, "epoch": 288, "lr": 5.3678849603431644e-05} +{"train_loss": 0.0030427095480263233, "global_step": 34288, "epoch": 288, "lr": 5.367664009524271e-05} +{"train_loss": 0.0017907859291881323, "global_step": 34289, "epoch": 288, "lr": 5.367443057983509e-05} +{"train_loss": 0.004236972890794277, "global_step": 34290, "epoch": 288, "lr": 5.367222105721311e-05} +{"train_loss": 0.002100307261571288, "global_step": 34291, "epoch": 288, "lr": 5.3670011527381113e-05} +{"train_loss": 0.003163457615301013, "global_step": 34292, "epoch": 288, "lr": 5.3667801990343445e-05} +{"train_loss": 0.0036447609309107065, "global_step": 34293, "epoch": 288, "lr": 5.366559244610445e-05} +{"train_loss": 0.001946734613738954, "global_step": 34294, "epoch": 288, "lr": 5.366338289466844e-05} +{"train_loss": 0.001846793107688427, "global_step": 34295, "epoch": 288, "lr": 5.366117333603978e-05} +{"train_loss": 0.0034326105378568172, "global_step": 34296, "epoch": 288, "lr": 5.3658963770222795e-05} +{"train_loss": 0.002721447264775634, "global_step": 34297, "epoch": 288, "lr": 5.365675419722183e-05} +{"train_loss": 0.0025941531639546156, "global_step": 34298, "epoch": 288, "lr": 5.3654544617041215e-05} +{"train_loss": 0.004251372069120407, "global_step": 34299, "epoch": 288, "lr": 5.3652335029685297e-05} +{"train_loss": 0.0023028787691146135, "global_step": 34300, "epoch": 288, "lr": 5.3650125435158404e-05} +{"train_loss": 0.0022159325890243053, "global_step": 34301, "epoch": 288, "lr": 5.364791583346488e-05} +{"train_loss": 0.0025918781757354736, "global_step": 34302, "epoch": 288, "lr": 5.364570622460906e-05} +{"train_loss": 0.0030140362214297056, "global_step": 34303, "epoch": 288, "lr": 5.364349660859528e-05} +{"train_loss": 0.003215621691197157, "global_step": 34304, "epoch": 288, "lr": 5.36412869854279e-05} +{"train_loss": 0.0034338291734457016, "global_step": 34305, "epoch": 288, "lr": 5.3639077355111234e-05} +{"train_loss": 0.0013148686848580837, "global_step": 34306, "epoch": 288, "lr": 5.363686771764963e-05} +{"train_loss": 0.0033978470601141453, "global_step": 34307, "epoch": 288, "lr": 5.3634658073047405e-05} +{"train_loss": 0.0036956823896616697, "global_step": 34308, "epoch": 288, "lr": 5.363244842130893e-05} +{"train_loss": 0.00208724825643003, "global_step": 34309, "epoch": 288, "lr": 5.3630238762438545e-05} +{"train_loss": 0.0024428805336356163, "global_step": 34310, "epoch": 288, "lr": 5.362802909644056e-05} +{"train_loss": 0.002730029169470072, "global_step": 34311, "epoch": 288, "lr": 5.362581942331935e-05} +{"train_loss": 0.0032700211741030216, "global_step": 34312, "epoch": 288, "lr": 5.3623609743079207e-05} +{"train_loss": 0.0038124893326312304, "global_step": 34313, "epoch": 288, "lr": 5.362140005572449e-05} +{"train_loss": 0.0038736783899366856, "global_step": 34314, "epoch": 288, "lr": 5.3619190361259555e-05} +{"train_loss": 0.0026748485397547483, "global_step": 34315, "epoch": 288, "lr": 5.361698065968872e-05} +{"train_loss": 0.0020850813016295433, "global_step": 34316, "epoch": 288, "lr": 5.361477095101632e-05} +{"train_loss": 0.0016804791521281004, "global_step": 34317, "epoch": 288, "lr": 5.361256123524674e-05} +{"train_loss": 0.003651332575827837, "global_step": 34318, "epoch": 288, "lr": 5.361035151238425e-05} +{"train_loss": 0.003022428136318922, "global_step": 34319, "epoch": 288, "lr": 5.360814178243323e-05} +{"train_loss": 0.0017438550712540746, "global_step": 34320, "epoch": 288, "lr": 5.3605932045398e-05} +{"train_loss": 0.00200745090842247, "global_step": 34321, "epoch": 288, "lr": 5.360372230128291e-05} +{"train_loss": 0.0024321218952536583, "global_step": 34322, "epoch": 288, "lr": 5.3601512550092305e-05} +{"train_loss": 0.004342431202530861, "global_step": 34323, "epoch": 288, "lr": 5.359930279183051e-05} +{"train_loss": 0.002424012403935194, "global_step": 34324, "epoch": 288, "lr": 5.359709302650187e-05} +{"train_loss": 0.001896493136882782, "global_step": 34325, "epoch": 288, "lr": 5.3594883254110715e-05} +{"train_loss": 0.0021927407942712307, "global_step": 34326, "epoch": 288, "lr": 5.359267347466139e-05} +{"train_loss": 0.002648213179782033, "global_step": 34327, "epoch": 288, "lr": 5.3590463688158244e-05} +{"train_loss": 0.0022207768633961678, "global_step": 34328, "epoch": 288, "lr": 5.35882538946056e-05} +{"train_loss": 0.0028398693539202213, "global_step": 34329, "epoch": 288, "lr": 5.35860440940078e-05} +{"train_loss": 0.003045642515644431, "global_step": 34330, "epoch": 288, "lr": 5.358383428636921e-05} +{"train_loss": 0.002525370568037033, "global_step": 34331, "epoch": 288, "lr": 5.358162447169412e-05} +{"train_loss": 0.0017862921813502908, "global_step": 34332, "epoch": 288, "lr": 5.35794146499869e-05} +{"train_loss": 0.002458604983985424, "global_step": 34333, "epoch": 288, "lr": 5.3577204821251884e-05} +{"train_loss": 0.003556131385266781, "global_step": 34334, "epoch": 288, "lr": 5.3574994985493396e-05} +{"train_loss": 0.00208536465652287, "global_step": 34335, "epoch": 288, "lr": 5.35727851427158e-05} +{"train_loss": 0.002743133343756199, "global_step": 34336, "epoch": 288, "lr": 5.357057529292342e-05} +{"train_loss": 0.002469243947416544, "global_step": 34337, "epoch": 288, "lr": 5.356836543612059e-05} +{"train_loss": 0.00285351718775928, "global_step": 34338, "epoch": 288, "lr": 5.3566155572311674e-05} +{"train_loss": 0.0030526199843734503, "global_step": 34339, "epoch": 288, "lr": 5.356394570150097e-05} +{"train_loss": 0.004306911490857601, "global_step": 34340, "epoch": 288, "lr": 5.356173582369285e-05} +{"train_loss": 0.001577561255544424, "global_step": 34341, "epoch": 288, "lr": 5.355952593889164e-05} +{"train_loss": 0.0027960643637925386, "global_step": 34342, "epoch": 288, "lr": 5.355731604710168e-05} +{"train_loss": 0.0035389915574342012, "global_step": 34343, "epoch": 288, "lr": 5.355510614832731e-05} +{"train_loss": 0.0025281028356403112, "global_step": 34344, "epoch": 288, "lr": 5.355289624257287e-05} +{"train_loss": 0.0017067564185708761, "global_step": 34345, "epoch": 288, "lr": 5.3550686329842704e-05} +{"train_loss": 0.0032730461098253727, "global_step": 34346, "epoch": 288, "lr": 5.354847641014114e-05} +{"train_loss": 0.0036001973785459995, "global_step": 34347, "epoch": 288, "lr": 5.354626648347251e-05} +{"train_loss": 0.002239958383142948, "global_step": 34348, "epoch": 288, "lr": 5.354405654984118e-05} +{"train_loss": 0.0023754192516207695, "global_step": 34349, "epoch": 288, "lr": 5.3541846609251475e-05} +{"train_loss": 0.0027650105766952038, "global_step": 34350, "epoch": 288, "lr": 5.3539636661707725e-05} +{"train_loss": 0.0014278375310823321, "global_step": 34351, "epoch": 288, "lr": 5.353742670721428e-05} +{"train_loss": 0.0043605598621070385, "global_step": 34352, "epoch": 288, "lr": 5.353521674577548e-05} +{"train_loss": 0.0028341072611510754, "global_step": 34353, "epoch": 288, "lr": 5.3533006777395645e-05} +{"train_loss": 0.0034329653717577457, "global_step": 34354, "epoch": 288, "lr": 5.353079680207913e-05} +{"train_loss": 0.0019332143710926175, "global_step": 34355, "epoch": 288, "lr": 5.3528586819830284e-05} +{"train_loss": 0.002853550249710679, "global_step": 34356, "epoch": 288, "lr": 5.352637683065342e-05} +{"train_loss": 0.00247472757473588, "global_step": 34357, "epoch": 288, "lr": 5.352416683455291e-05} +{"train_loss": 0.0026822155341506004, "global_step": 34358, "epoch": 288, "lr": 5.352195683153307e-05} +{"train_loss": 0.0026996047236025333, "global_step": 34359, "epoch": 288, "lr": 5.3519746821598236e-05} +{"train_loss": 0.003919837065041065, "global_step": 34360, "epoch": 288, "lr": 5.3517536804752765e-05} +{"train_loss": 0.004802937153726816, "global_step": 34361, "epoch": 288, "lr": 5.3515326781000986e-05} +{"train_loss": 0.002351251896470785, "global_step": 34362, "epoch": 288, "lr": 5.351311675034724e-05} +{"train_loss": 0.003068668069317937, "global_step": 34363, "epoch": 288, "lr": 5.351090671279585e-05} +{"train_loss": 0.0043943580240011215, "global_step": 34364, "epoch": 288, "lr": 5.350869666835118e-05} +{"train_loss": 0.004377158358693123, "global_step": 34365, "epoch": 288, "lr": 5.350648661701756e-05} +{"train_loss": 0.003369345096871257, "global_step": 34366, "epoch": 288, "lr": 5.350427655879933e-05} +{"train_loss": 0.0013718047412112355, "global_step": 34367, "epoch": 288, "lr": 5.350206649370082e-05} +{"train_loss": 0.0025589941069483757, "global_step": 34368, "epoch": 288, "lr": 5.349985642172638e-05} +{"train_loss": 0.0032892869785428047, "global_step": 34369, "epoch": 288, "lr": 5.3497646342880347e-05} +{"train_loss": 0.004094169940799475, "global_step": 34370, "epoch": 288, "lr": 5.349543625716705e-05} +{"train_loss": 0.002982886740937829, "global_step": 34371, "epoch": 288, "lr": 5.349322616459085e-05} +{"train_loss": 0.0024537108838558197, "global_step": 34372, "epoch": 288, "lr": 5.349101606515606e-05} +{"train_loss": 0.005267483647912741, "global_step": 34373, "epoch": 288, "lr": 5.348880595886705e-05} +{"train_loss": 0.0022171633318066597, "global_step": 34374, "epoch": 288, "lr": 5.348659584572813e-05} +{"train_loss": 0.0026103074196726084, "global_step": 34375, "epoch": 288, "lr": 5.3484385725743655e-05} +{"train_loss": 0.0016620255773887038, "global_step": 34376, "epoch": 288, "lr": 5.348217559891796e-05} +{"train_loss": 0.0035637107212096453, "global_step": 34377, "epoch": 288, "lr": 5.347996546525539e-05} +{"train_loss": 0.00325013417750597, "global_step": 34378, "epoch": 288, "lr": 5.347775532476027e-05} +{"train_loss": 0.0032310732640326023, "global_step": 34379, "epoch": 288, "lr": 5.3475545177436946e-05} +{"train_loss": 0.0042571499943733215, "global_step": 34380, "epoch": 288, "lr": 5.3473335023289785e-05} +{"train_loss": 0.003476249286904931, "global_step": 34381, "epoch": 288, "lr": 5.347112486232309e-05} +{"train_loss": 0.003238256089389324, "global_step": 34382, "epoch": 288, "lr": 5.34689146945412e-05} +{"train_loss": 0.00381238991394639, "global_step": 34383, "epoch": 288, "lr": 5.3466704519948476e-05} +{"train_loss": 0.002830932382494211, "global_step": 34384, "epoch": 288, "lr": 5.346449433854924e-05} +{"train_loss": 0.002311561955139041, "global_step": 34385, "epoch": 288, "lr": 5.3462284150347854e-05} +{"train_loss": 0.002348099835216999, "global_step": 34386, "epoch": 288, "lr": 5.346007395534865e-05} +{"train_loss": 0.002873224439099431, "global_step": 34387, "epoch": 288, "lr": 5.345786375355594e-05} +{"train_loss": 0.0036497460678219795, "global_step": 34388, "epoch": 288, "lr": 5.345565354497408e-05} +{"train_loss": 0.0032117506489157677, "global_step": 34389, "epoch": 288, "lr": 5.3453443329607425e-05} +{"train_loss": 0.0028972633382571594, "global_step": 34390, "epoch": 288, "lr": 5.3451233107460296e-05, "val_loss": 0.02019275724887848} +{"train_loss": 0.003930520266294479, "global_step": 34391, "epoch": 289, "lr": 5.344902287853703e-05} +{"train_loss": 0.003214366501197219, "global_step": 34392, "epoch": 289, "lr": 5.344681264284199e-05} +{"train_loss": 0.0028872783295810223, "global_step": 34393, "epoch": 289, "lr": 5.3444602400379517e-05} +{"train_loss": 0.002656861674040556, "global_step": 34394, "epoch": 289, "lr": 5.344239215115392e-05} +{"train_loss": 0.0027391903568059206, "global_step": 34395, "epoch": 289, "lr": 5.344018189516955e-05} +{"train_loss": 0.0035578450188040733, "global_step": 34396, "epoch": 289, "lr": 5.343797163243076e-05} +{"train_loss": 0.002284768270328641, "global_step": 34397, "epoch": 289, "lr": 5.343576136294187e-05} +{"train_loss": 0.00477907620370388, "global_step": 34398, "epoch": 289, "lr": 5.3433551086707235e-05} +{"train_loss": 0.002894048346206546, "global_step": 34399, "epoch": 289, "lr": 5.34313408037312e-05} +{"train_loss": 0.003387665841728449, "global_step": 34400, "epoch": 289, "lr": 5.342913051401808e-05} +{"train_loss": 0.0025985173415392637, "global_step": 34401, "epoch": 289, "lr": 5.342692021757223e-05} +{"train_loss": 0.002821281785145402, "global_step": 34402, "epoch": 289, "lr": 5.342470991439799e-05} +{"train_loss": 0.003533910494297743, "global_step": 34403, "epoch": 289, "lr": 5.3422499604499696e-05} +{"train_loss": 0.002947448752820492, "global_step": 34404, "epoch": 289, "lr": 5.342028928788169e-05} +{"train_loss": 0.0018322705291211605, "global_step": 34405, "epoch": 289, "lr": 5.3418078964548315e-05} +{"train_loss": 0.002826214535161853, "global_step": 34406, "epoch": 289, "lr": 5.3415868634503894e-05} +{"train_loss": 0.002120236400514841, "global_step": 34407, "epoch": 289, "lr": 5.341365829775279e-05} +{"train_loss": 0.0036162198521196842, "global_step": 34408, "epoch": 289, "lr": 5.341144795429933e-05} +{"train_loss": 0.001994253369048238, "global_step": 34409, "epoch": 289, "lr": 5.340923760414787e-05} +{"train_loss": 0.005294150672852993, "global_step": 34410, "epoch": 289, "lr": 5.340702724730271e-05} +{"train_loss": 0.003091961843892932, "global_step": 34411, "epoch": 289, "lr": 5.340481688376825e-05} +{"train_loss": 0.004310886841267347, "global_step": 34412, "epoch": 289, "lr": 5.340260651354877e-05} +{"train_loss": 0.0024855583906173706, "global_step": 34413, "epoch": 289, "lr": 5.340039613664865e-05} +{"train_loss": 0.004627238027751446, "global_step": 34414, "epoch": 289, "lr": 5.3398185753072205e-05} +{"train_loss": 0.0026590528432279825, "global_step": 34415, "epoch": 289, "lr": 5.339597536282378e-05} +{"train_loss": 0.002885947935283184, "global_step": 34416, "epoch": 289, "lr": 5.339376496590773e-05} +{"train_loss": 0.0016876518493518233, "global_step": 34417, "epoch": 289, "lr": 5.339155456232838e-05} +{"train_loss": 0.0021443767473101616, "global_step": 34418, "epoch": 289, "lr": 5.338934415209009e-05} +{"train_loss": 0.0015671964501962066, "global_step": 34419, "epoch": 289, "lr": 5.338713373519717e-05} +{"train_loss": 0.0019582833629101515, "global_step": 34420, "epoch": 289, "lr": 5.3384923311653976e-05} +{"train_loss": 0.0029714065603911877, "global_step": 34421, "epoch": 289, "lr": 5.3382712881464856e-05} +{"train_loss": 0.001956744585186243, "global_step": 34422, "epoch": 289, "lr": 5.338050244463413e-05} +{"train_loss": 0.0018800689140334725, "global_step": 34423, "epoch": 289, "lr": 5.337829200116615e-05} +{"train_loss": 0.0018253338057547808, "global_step": 34424, "epoch": 289, "lr": 5.337608155106526e-05} +{"train_loss": 0.003347221063449979, "global_step": 34425, "epoch": 289, "lr": 5.3373871094335795e-05} +{"train_loss": 0.00210791127756238, "global_step": 34426, "epoch": 289, "lr": 5.3371660630982076e-05} +{"train_loss": 0.003440484870225191, "global_step": 34427, "epoch": 289, "lr": 5.336945016100848e-05} +{"train_loss": 0.001807994325645268, "global_step": 34428, "epoch": 289, "lr": 5.3367239684419324e-05} +{"train_loss": 0.0028478975873440504, "global_step": 34429, "epoch": 289, "lr": 5.336502920121895e-05} +{"train_loss": 0.003025070298463106, "global_step": 34430, "epoch": 289, "lr": 5.336281871141172e-05} +{"train_loss": 0.002208855701610446, "global_step": 34431, "epoch": 289, "lr": 5.336060821500194e-05} +{"train_loss": 0.003118629101663828, "global_step": 34432, "epoch": 289, "lr": 5.335839771199396e-05} +{"train_loss": 0.00236578774638474, "global_step": 34433, "epoch": 289, "lr": 5.3356187202392126e-05} +{"train_loss": 0.00511721009388566, "global_step": 34434, "epoch": 289, "lr": 5.3353976686200776e-05} +{"train_loss": 0.0017206703778356314, "global_step": 34435, "epoch": 289, "lr": 5.335176616342425e-05} +{"train_loss": 0.0022007105872035027, "global_step": 34436, "epoch": 289, "lr": 5.3349555634066914e-05} +{"train_loss": 0.0029644430615007877, "global_step": 34437, "epoch": 289, "lr": 5.334734509813306e-05} +{"train_loss": 0.0018181942868977785, "global_step": 34438, "epoch": 289, "lr": 5.3345134555627055e-05} +{"train_loss": 0.0038894438184797764, "global_step": 34439, "epoch": 289, "lr": 5.3342924006553216e-05} +{"train_loss": 0.0017871499294415116, "global_step": 34440, "epoch": 289, "lr": 5.334071345091593e-05} +{"train_loss": 0.0027106557972729206, "global_step": 34441, "epoch": 289, "lr": 5.33385028887195e-05} +{"train_loss": 0.0027413838542997837, "global_step": 34442, "epoch": 289, "lr": 5.333629231996827e-05} +{"train_loss": 0.0024958262220025063, "global_step": 34443, "epoch": 289, "lr": 5.3334081744666606e-05} +{"train_loss": 0.0017784005030989647, "global_step": 34444, "epoch": 289, "lr": 5.3331871162818825e-05} +{"train_loss": 0.003504635766148567, "global_step": 34445, "epoch": 289, "lr": 5.332966057442926e-05} +{"train_loss": 0.004172089509665966, "global_step": 34446, "epoch": 289, "lr": 5.332744997950227e-05} +{"train_loss": 0.004034582059830427, "global_step": 34447, "epoch": 289, "lr": 5.332523937804218e-05} +{"train_loss": 0.002197169465944171, "global_step": 34448, "epoch": 289, "lr": 5.332302877005334e-05} +{"train_loss": 0.0030678927432745695, "global_step": 34449, "epoch": 289, "lr": 5.33208181555401e-05} +{"train_loss": 0.0013352337991818786, "global_step": 34450, "epoch": 289, "lr": 5.331860753450677e-05} +{"train_loss": 0.0012573220301419497, "global_step": 34451, "epoch": 289, "lr": 5.331639690695772e-05} +{"train_loss": 0.004201720934361219, "global_step": 34452, "epoch": 289, "lr": 5.331418627289727e-05} +{"train_loss": 0.0020783867221325636, "global_step": 34453, "epoch": 289, "lr": 5.331197563232978e-05} +{"train_loss": 0.0031378373969346285, "global_step": 34454, "epoch": 289, "lr": 5.330976498525957e-05} +{"train_loss": 0.0016409358941018581, "global_step": 34455, "epoch": 289, "lr": 5.330755433169099e-05} +{"train_loss": 0.001958767417818308, "global_step": 34456, "epoch": 289, "lr": 5.3305343671628386e-05} +{"train_loss": 0.002001645276322961, "global_step": 34457, "epoch": 289, "lr": 5.330313300507609e-05} +{"train_loss": 0.0017911208560690284, "global_step": 34458, "epoch": 289, "lr": 5.330092233203845e-05} +{"train_loss": 0.0023606771137565374, "global_step": 34459, "epoch": 289, "lr": 5.3298711652519795e-05} +{"train_loss": 0.0027481308206915855, "global_step": 34460, "epoch": 289, "lr": 5.3296500966524475e-05} +{"train_loss": 0.0021614839788526297, "global_step": 34461, "epoch": 289, "lr": 5.3294290274056834e-05} +{"train_loss": 0.0025101315695792437, "global_step": 34462, "epoch": 289, "lr": 5.32920795751212e-05} +{"train_loss": 0.002820354886353016, "global_step": 34463, "epoch": 289, "lr": 5.3289868869721916e-05} +{"train_loss": 0.0020112963393330574, "global_step": 34464, "epoch": 289, "lr": 5.328765815786333e-05} +{"train_loss": 0.001445324975065887, "global_step": 34465, "epoch": 289, "lr": 5.3285447439549776e-05} +{"train_loss": 0.003498147241771221, "global_step": 34466, "epoch": 289, "lr": 5.32832367147856e-05} +{"train_loss": 0.002992527326568961, "global_step": 34467, "epoch": 289, "lr": 5.328102598357514e-05} +{"train_loss": 0.0012758177472278476, "global_step": 34468, "epoch": 289, "lr": 5.3278815245922745e-05} +{"train_loss": 0.0034071647096425295, "global_step": 34469, "epoch": 289, "lr": 5.327660450183273e-05} +{"train_loss": 0.0017348366091027856, "global_step": 34470, "epoch": 289, "lr": 5.3274393751309456e-05} +{"train_loss": 0.00218869186937809, "global_step": 34471, "epoch": 289, "lr": 5.3272182994357265e-05} +{"train_loss": 0.0013147228164598346, "global_step": 34472, "epoch": 289, "lr": 5.326997223098049e-05} +{"train_loss": 0.001949465018697083, "global_step": 34473, "epoch": 289, "lr": 5.3267761461183465e-05} +{"train_loss": 0.0023082862608134747, "global_step": 34474, "epoch": 289, "lr": 5.3265550684970544e-05} +{"train_loss": 0.0025148550048470497, "global_step": 34475, "epoch": 289, "lr": 5.3263339902346064e-05} +{"train_loss": 0.001784204738214612, "global_step": 34476, "epoch": 289, "lr": 5.326112911331437e-05} +{"train_loss": 0.0019508611876517534, "global_step": 34477, "epoch": 289, "lr": 5.325891831787979e-05} +{"train_loss": 0.004886480513960123, "global_step": 34478, "epoch": 289, "lr": 5.325670751604668e-05} +{"train_loss": 0.0019362014718353748, "global_step": 34479, "epoch": 289, "lr": 5.325449670781937e-05} +{"train_loss": 0.002698509721085429, "global_step": 34480, "epoch": 289, "lr": 5.325228589320222e-05} +{"train_loss": 0.002937811426818371, "global_step": 34481, "epoch": 289, "lr": 5.325007507219952e-05} +{"train_loss": 0.0015242251101881266, "global_step": 34482, "epoch": 289, "lr": 5.324786424481567e-05} +{"train_loss": 0.001677618594840169, "global_step": 34483, "epoch": 289, "lr": 5.3245653411054975e-05} +{"train_loss": 0.002521219663321972, "global_step": 34484, "epoch": 289, "lr": 5.324344257092179e-05} +{"train_loss": 0.0015932269161567092, "global_step": 34485, "epoch": 289, "lr": 5.324123172442045e-05} +{"train_loss": 0.0017538636457175016, "global_step": 34486, "epoch": 289, "lr": 5.323902087155529e-05} +{"train_loss": 0.0035185597371309996, "global_step": 34487, "epoch": 289, "lr": 5.3236810012330684e-05} +{"train_loss": 0.0019927984103560448, "global_step": 34488, "epoch": 289, "lr": 5.323459914675091e-05} +{"train_loss": 0.0012514969566836953, "global_step": 34489, "epoch": 289, "lr": 5.3232388274820364e-05} +{"train_loss": 0.0027444656006991863, "global_step": 34490, "epoch": 289, "lr": 5.323017739654338e-05} +{"train_loss": 0.0034879478625953197, "global_step": 34491, "epoch": 289, "lr": 5.322796651192428e-05} +{"train_loss": 0.0018028536578640342, "global_step": 34492, "epoch": 289, "lr": 5.32257556209674e-05} +{"train_loss": 0.00191432423889637, "global_step": 34493, "epoch": 289, "lr": 5.322354472367712e-05} +{"train_loss": 0.0024346427526324987, "global_step": 34494, "epoch": 289, "lr": 5.322133382005774e-05} +{"train_loss": 0.0028366034384816885, "global_step": 34495, "epoch": 289, "lr": 5.3219122910113605e-05} +{"train_loss": 0.0031201534438878298, "global_step": 34496, "epoch": 289, "lr": 5.3216911993849085e-05} +{"train_loss": 0.0024627260863780975, "global_step": 34497, "epoch": 289, "lr": 5.321470107126849e-05} +{"train_loss": 0.0024791655596345663, "global_step": 34498, "epoch": 289, "lr": 5.321249014237617e-05} +{"train_loss": 0.002635034266859293, "global_step": 34499, "epoch": 289, "lr": 5.3210279207176483e-05} +{"train_loss": 0.0015815370716154575, "global_step": 34500, "epoch": 289, "lr": 5.320806826567375e-05} +{"train_loss": 0.0027103431057184935, "global_step": 34501, "epoch": 289, "lr": 5.320585731787231e-05} +{"train_loss": 0.0027468327898532152, "global_step": 34502, "epoch": 289, "lr": 5.320364636377651e-05} +{"train_loss": 0.0023293637204915285, "global_step": 34503, "epoch": 289, "lr": 5.320143540339071e-05} +{"train_loss": 0.0016798870638012886, "global_step": 34504, "epoch": 289, "lr": 5.319922443671922e-05} +{"train_loss": 0.002611087867990136, "global_step": 34505, "epoch": 289, "lr": 5.319701346376639e-05} +{"train_loss": 0.0024464763700962067, "global_step": 34506, "epoch": 289, "lr": 5.319480248453658e-05} +{"train_loss": 0.0022225389257073402, "global_step": 34507, "epoch": 289, "lr": 5.319259149903411e-05} +{"train_loss": 0.0018355591455474496, "global_step": 34508, "epoch": 289, "lr": 5.3190380507263316e-05} +{"train_loss": 0.0025753152366931073, "global_step": 34509, "epoch": 289, "lr": 5.318816950922856e-05, "val_loss": 0.013266334310173988} +{"train_loss": 0.002989682601764798, "global_step": 34510, "epoch": 290, "lr": 5.3185958504934175e-05} +{"train_loss": 0.0009553426061756909, "global_step": 34511, "epoch": 290, "lr": 5.318374749438451e-05} +{"train_loss": 0.004032752942293882, "global_step": 34512, "epoch": 290, "lr": 5.318153647758389e-05} +{"train_loss": 0.002286491682752967, "global_step": 34513, "epoch": 290, "lr": 5.3179325454536666e-05} +{"train_loss": 0.0019511089194566011, "global_step": 34514, "epoch": 290, "lr": 5.3177114425247166e-05} +{"train_loss": 0.0019256017403677106, "global_step": 34515, "epoch": 290, "lr": 5.3174903389719743e-05} +{"train_loss": 0.00135040155146271, "global_step": 34516, "epoch": 290, "lr": 5.317269234795874e-05} +{"train_loss": 0.0037589995190501213, "global_step": 34517, "epoch": 290, "lr": 5.31704812999685e-05} +{"train_loss": 0.0024223034270107746, "global_step": 34518, "epoch": 290, "lr": 5.316827024575336e-05} +{"train_loss": 0.002260727109387517, "global_step": 34519, "epoch": 290, "lr": 5.316605918531765e-05} +{"train_loss": 0.002742169192060828, "global_step": 34520, "epoch": 290, "lr": 5.316384811866573e-05} +{"train_loss": 0.0033286099787801504, "global_step": 34521, "epoch": 290, "lr": 5.3161637045801915e-05} +{"train_loss": 0.0026630691718310118, "global_step": 34522, "epoch": 290, "lr": 5.315942596673058e-05} +{"train_loss": 0.0030439672991633415, "global_step": 34523, "epoch": 290, "lr": 5.315721488145603e-05} +{"train_loss": 0.0031676767393946648, "global_step": 34524, "epoch": 290, "lr": 5.315500378998265e-05} +{"train_loss": 0.0016554984031245112, "global_step": 34525, "epoch": 290, "lr": 5.3152792692314744e-05} +{"train_loss": 0.003541982965543866, "global_step": 34526, "epoch": 290, "lr": 5.315058158845667e-05} +{"train_loss": 0.0021131448447704315, "global_step": 34527, "epoch": 290, "lr": 5.3148370478412766e-05} +{"train_loss": 0.0035561206750571728, "global_step": 34528, "epoch": 290, "lr": 5.3146159362187376e-05} +{"train_loss": 0.001620147260837257, "global_step": 34529, "epoch": 290, "lr": 5.314394823978484e-05} +{"train_loss": 0.004330878145992756, "global_step": 34530, "epoch": 290, "lr": 5.314173711120949e-05} +{"train_loss": 0.004372084513306618, "global_step": 34531, "epoch": 290, "lr": 5.313952597646568e-05} +{"train_loss": 0.002731091110035777, "global_step": 34532, "epoch": 290, "lr": 5.313731483555774e-05} +{"train_loss": 0.0016635763458907604, "global_step": 34533, "epoch": 290, "lr": 5.3135103688490017e-05} +{"train_loss": 0.0027417426463216543, "global_step": 34534, "epoch": 290, "lr": 5.313289253526685e-05} +{"train_loss": 0.003755138488486409, "global_step": 34535, "epoch": 290, "lr": 5.31306813758926e-05} +{"train_loss": 0.003604693803936243, "global_step": 34536, "epoch": 290, "lr": 5.312847021037157e-05} +{"train_loss": 0.0036713960580527782, "global_step": 34537, "epoch": 290, "lr": 5.312625903870814e-05} +{"train_loss": 0.0021225037053227425, "global_step": 34538, "epoch": 290, "lr": 5.312404786090663e-05} +{"train_loss": 0.002083035185933113, "global_step": 34539, "epoch": 290, "lr": 5.312183667697138e-05} +{"train_loss": 0.0025899563916027546, "global_step": 34540, "epoch": 290, "lr": 5.3119625486906746e-05} +{"train_loss": 0.002761576557531953, "global_step": 34541, "epoch": 290, "lr": 5.311741429071705e-05} +{"train_loss": 0.002075495198369026, "global_step": 34542, "epoch": 290, "lr": 5.311520308840665e-05} +{"train_loss": 0.002072104951366782, "global_step": 34543, "epoch": 290, "lr": 5.311299187997989e-05} +{"train_loss": 0.002578064799308777, "global_step": 34544, "epoch": 290, "lr": 5.3110780665441096e-05} +{"train_loss": 0.0024593323469161987, "global_step": 34545, "epoch": 290, "lr": 5.310856944479462e-05} +{"train_loss": 0.00487099913880229, "global_step": 34546, "epoch": 290, "lr": 5.3106358218044795e-05} +{"train_loss": 0.002850135089829564, "global_step": 34547, "epoch": 290, "lr": 5.310414698519596e-05} +{"train_loss": 0.0014741414925083518, "global_step": 34548, "epoch": 290, "lr": 5.3101935746252476e-05} +{"train_loss": 0.0018787359585985541, "global_step": 34549, "epoch": 290, "lr": 5.309972450121867e-05} +{"train_loss": 0.0017682292964309454, "global_step": 34550, "epoch": 290, "lr": 5.3097513250098885e-05} +{"train_loss": 0.0023565262090414762, "global_step": 34551, "epoch": 290, "lr": 5.3095301992897465e-05} +{"train_loss": 0.0028097212780267, "global_step": 34552, "epoch": 290, "lr": 5.3093090729618745e-05} +{"train_loss": 0.001742371590808034, "global_step": 34553, "epoch": 290, "lr": 5.309087946026707e-05} +{"train_loss": 0.0023259357549250126, "global_step": 34554, "epoch": 290, "lr": 5.308866818484679e-05} +{"train_loss": 0.0038707652129232883, "global_step": 34555, "epoch": 290, "lr": 5.3086456903362245e-05} +{"train_loss": 0.004880035761743784, "global_step": 34556, "epoch": 290, "lr": 5.308424561581776e-05} +{"train_loss": 0.0017806543037295341, "global_step": 34557, "epoch": 290, "lr": 5.30820343222177e-05} +{"train_loss": 0.002085241489112377, "global_step": 34558, "epoch": 290, "lr": 5.3079823022566376e-05} +{"train_loss": 0.0034846924245357513, "global_step": 34559, "epoch": 290, "lr": 5.307761171686817e-05} +{"train_loss": 0.0031497315503656864, "global_step": 34560, "epoch": 290, "lr": 5.3075400405127385e-05} +{"train_loss": 0.0018570568645372987, "global_step": 34561, "epoch": 290, "lr": 5.3073189087348384e-05} +{"train_loss": 0.0021386495791375637, "global_step": 34562, "epoch": 290, "lr": 5.307097776353552e-05} +{"train_loss": 0.0028539083432406187, "global_step": 34563, "epoch": 290, "lr": 5.306876643369311e-05} +{"train_loss": 0.003591654123738408, "global_step": 34564, "epoch": 290, "lr": 5.30665550978255e-05} +{"train_loss": 0.002831400139257312, "global_step": 34565, "epoch": 290, "lr": 5.306434375593704e-05} +{"train_loss": 0.004164816811680794, "global_step": 34566, "epoch": 290, "lr": 5.306213240803207e-05} +{"train_loss": 0.0017117849783971906, "global_step": 34567, "epoch": 290, "lr": 5.305992105411492e-05} +{"train_loss": 0.0028808501083403826, "global_step": 34568, "epoch": 290, "lr": 5.305770969418996e-05} +{"train_loss": 0.002695648930966854, "global_step": 34569, "epoch": 290, "lr": 5.305549832826151e-05} +{"train_loss": 0.002539584180340171, "global_step": 34570, "epoch": 290, "lr": 5.30532869563339e-05} +{"train_loss": 0.001670059165917337, "global_step": 34571, "epoch": 290, "lr": 5.30510755784115e-05} +{"train_loss": 0.0034061623737215996, "global_step": 34572, "epoch": 290, "lr": 5.304886419449863e-05} +{"train_loss": 0.0029040996450930834, "global_step": 34573, "epoch": 290, "lr": 5.3046652804599636e-05} +{"train_loss": 0.0024320860393345356, "global_step": 34574, "epoch": 290, "lr": 5.304444140871889e-05} +{"train_loss": 0.0034128364641219378, "global_step": 34575, "epoch": 290, "lr": 5.3042230006860696e-05} +{"train_loss": 0.0025498017203062773, "global_step": 34576, "epoch": 290, "lr": 5.3040018599029394e-05} +{"train_loss": 0.002603297820314765, "global_step": 34577, "epoch": 290, "lr": 5.303780718522936e-05} +{"train_loss": 0.0018921010196208954, "global_step": 34578, "epoch": 290, "lr": 5.3035595765464905e-05} +{"train_loss": 0.002423695055767894, "global_step": 34579, "epoch": 290, "lr": 5.303338433974039e-05} +{"train_loss": 0.0024713061284273863, "global_step": 34580, "epoch": 290, "lr": 5.3031172908060145e-05} +{"train_loss": 0.001499140984378755, "global_step": 34581, "epoch": 290, "lr": 5.3028961470428516e-05} +{"train_loss": 0.0024588266387581825, "global_step": 34582, "epoch": 290, "lr": 5.302675002684985e-05} +{"train_loss": 0.0029828636907041073, "global_step": 34583, "epoch": 290, "lr": 5.3024538577328466e-05} +{"train_loss": 0.0017237237188965082, "global_step": 34584, "epoch": 290, "lr": 5.3022327121868745e-05} +{"train_loss": 0.0028898988384753466, "global_step": 34585, "epoch": 290, "lr": 5.302011566047499e-05} +{"train_loss": 0.0029565198346972466, "global_step": 34586, "epoch": 290, "lr": 5.301790419315157e-05} +{"train_loss": 0.0025102279614657164, "global_step": 34587, "epoch": 290, "lr": 5.301569271990281e-05} +{"train_loss": 0.002979239681735635, "global_step": 34588, "epoch": 290, "lr": 5.3013481240733063e-05} +{"train_loss": 0.002922461600974202, "global_step": 34589, "epoch": 290, "lr": 5.301126975564668e-05} +{"train_loss": 0.0014338677283376455, "global_step": 34590, "epoch": 290, "lr": 5.300905826464797e-05} +{"train_loss": 0.002382420003414154, "global_step": 34591, "epoch": 290, "lr": 5.30068467677413e-05} +{"train_loss": 0.0021655382588505745, "global_step": 34592, "epoch": 290, "lr": 5.3004635264931014e-05} +{"train_loss": 0.00146996951662004, "global_step": 34593, "epoch": 290, "lr": 5.300242375622146e-05} +{"train_loss": 0.0024827751331031322, "global_step": 34594, "epoch": 290, "lr": 5.3000212241616955e-05} +{"train_loss": 0.0010318574495613575, "global_step": 34595, "epoch": 290, "lr": 5.2998000721121855e-05} +{"train_loss": 0.003099512541666627, "global_step": 34596, "epoch": 290, "lr": 5.29957891947405e-05} +{"train_loss": 0.0021542690228670835, "global_step": 34597, "epoch": 290, "lr": 5.2993577662477225e-05} +{"train_loss": 0.002005083253607154, "global_step": 34598, "epoch": 290, "lr": 5.2991366124336396e-05} +{"train_loss": 0.0017628757050260901, "global_step": 34599, "epoch": 290, "lr": 5.298915458032233e-05} +{"train_loss": 0.002155996859073639, "global_step": 34600, "epoch": 290, "lr": 5.2986943030439386e-05} +{"train_loss": 0.001695845858193934, "global_step": 34601, "epoch": 290, "lr": 5.2984731474691886e-05} +{"train_loss": 0.00236262078396976, "global_step": 34602, "epoch": 290, "lr": 5.298251991308419e-05} +{"train_loss": 0.0021486671175807714, "global_step": 34603, "epoch": 290, "lr": 5.2980308345620634e-05} +{"train_loss": 0.00275676348246634, "global_step": 34604, "epoch": 290, "lr": 5.297809677230556e-05} +{"train_loss": 0.0016877059824764729, "global_step": 34605, "epoch": 290, "lr": 5.297588519314331e-05} +{"train_loss": 0.0029084321577101946, "global_step": 34606, "epoch": 290, "lr": 5.297367360813823e-05} +{"train_loss": 0.0018845864105969667, "global_step": 34607, "epoch": 290, "lr": 5.297146201729466e-05} +{"train_loss": 0.0014674466801807284, "global_step": 34608, "epoch": 290, "lr": 5.296925042061694e-05} +{"train_loss": 0.0018538427539169788, "global_step": 34609, "epoch": 290, "lr": 5.2967038818109415e-05} +{"train_loss": 0.0031157766934484243, "global_step": 34610, "epoch": 290, "lr": 5.296482720977642e-05} +{"train_loss": 0.001387680764310062, "global_step": 34611, "epoch": 290, "lr": 5.296261559562232e-05} +{"train_loss": 0.0017346196109429002, "global_step": 34612, "epoch": 290, "lr": 5.296040397565144e-05} +{"train_loss": 0.001894890796393156, "global_step": 34613, "epoch": 290, "lr": 5.2958192349868106e-05} +{"train_loss": 0.0019814856350421906, "global_step": 34614, "epoch": 290, "lr": 5.2955980718276686e-05} +{"train_loss": 0.0016025896184146404, "global_step": 34615, "epoch": 290, "lr": 5.295376908088152e-05} +{"train_loss": 0.002453179331496358, "global_step": 34616, "epoch": 290, "lr": 5.295155743768694e-05} +{"train_loss": 0.002064419910311699, "global_step": 34617, "epoch": 290, "lr": 5.294934578869728e-05} +{"train_loss": 0.0021087198983877897, "global_step": 34618, "epoch": 290, "lr": 5.294713413391692e-05} +{"train_loss": 0.0029864120297133923, "global_step": 34619, "epoch": 290, "lr": 5.2944922473350155e-05} +{"train_loss": 0.002912397962063551, "global_step": 34620, "epoch": 290, "lr": 5.294271080700136e-05} +{"train_loss": 0.002032064599916339, "global_step": 34621, "epoch": 290, "lr": 5.294049913487484e-05} +{"train_loss": 0.002242287155240774, "global_step": 34622, "epoch": 290, "lr": 5.293828745697499e-05} +{"train_loss": 0.002117966301739216, "global_step": 34623, "epoch": 290, "lr": 5.293607577330612e-05} +{"train_loss": 0.001258855452761054, "global_step": 34624, "epoch": 290, "lr": 5.29338640838726e-05} +{"train_loss": 0.002188656013458967, "global_step": 34625, "epoch": 290, "lr": 5.293165238867873e-05} +{"train_loss": 0.002502600895240903, "global_step": 34626, "epoch": 290, "lr": 5.292944068772887e-05} +{"train_loss": 0.0021654576994478703, "global_step": 34627, "epoch": 290, "lr": 5.292722898102738e-05} +{"train_loss": 0.002490257937754622, "global_step": 34628, "epoch": 290, "lr": 5.292501726857858e-05, "val_loss": 0.031057139858603477, "train_action_mse_error": 4.777108915732242e-05} +{"train_loss": 0.0010145982960239053, "global_step": 34629, "epoch": 291, "lr": 5.2922805550386825e-05} +{"train_loss": 0.0018675867468118668, "global_step": 34630, "epoch": 291, "lr": 5.292059382645645e-05} +{"train_loss": 0.004301394335925579, "global_step": 34631, "epoch": 291, "lr": 5.2918382096791806e-05} +{"train_loss": 0.0022229193709790707, "global_step": 34632, "epoch": 291, "lr": 5.291617036139722e-05} +{"train_loss": 0.0038600305560976267, "global_step": 34633, "epoch": 291, "lr": 5.291395862027706e-05} +{"train_loss": 0.0014869965380057693, "global_step": 34634, "epoch": 291, "lr": 5.2911746873435645e-05} +{"train_loss": 0.0025785472244024277, "global_step": 34635, "epoch": 291, "lr": 5.2909535120877315e-05} +{"train_loss": 0.00398572813719511, "global_step": 34636, "epoch": 291, "lr": 5.290732336260644e-05} +{"train_loss": 0.003371218917891383, "global_step": 34637, "epoch": 291, "lr": 5.290511159862734e-05} +{"train_loss": 0.002128035994246602, "global_step": 34638, "epoch": 291, "lr": 5.2902899828944364e-05} +{"train_loss": 0.0021918793208897114, "global_step": 34639, "epoch": 291, "lr": 5.290068805356185e-05} +{"train_loss": 0.0033586849458515644, "global_step": 34640, "epoch": 291, "lr": 5.289847627248415e-05} +{"train_loss": 0.0014672507531940937, "global_step": 34641, "epoch": 291, "lr": 5.2896264485715606e-05} +{"train_loss": 0.003412744728848338, "global_step": 34642, "epoch": 291, "lr": 5.2894052693260554e-05} +{"train_loss": 0.0013661135453730822, "global_step": 34643, "epoch": 291, "lr": 5.289184089512335e-05} +{"train_loss": 0.0015548962401226163, "global_step": 34644, "epoch": 291, "lr": 5.2889629091308304e-05} +{"train_loss": 0.0019128484418615699, "global_step": 34645, "epoch": 291, "lr": 5.2887417281819785e-05} +{"train_loss": 0.0031089300755411386, "global_step": 34646, "epoch": 291, "lr": 5.2885205466662137e-05} +{"train_loss": 0.0020538722164928913, "global_step": 34647, "epoch": 291, "lr": 5.2882993645839694e-05} +{"train_loss": 0.0017441831296309829, "global_step": 34648, "epoch": 291, "lr": 5.2880781819356795e-05} +{"train_loss": 0.0019359312718734145, "global_step": 34649, "epoch": 291, "lr": 5.287856998721781e-05} +{"train_loss": 0.0026601175777614117, "global_step": 34650, "epoch": 291, "lr": 5.287635814942704e-05} +{"train_loss": 0.0027658354956656694, "global_step": 34651, "epoch": 291, "lr": 5.2874146305988845e-05} +{"train_loss": 0.002746504032984376, "global_step": 34652, "epoch": 291, "lr": 5.287193445690758e-05} +{"train_loss": 0.0020360222551971674, "global_step": 34653, "epoch": 291, "lr": 5.286972260218758e-05} +{"train_loss": 0.002030902775004506, "global_step": 34654, "epoch": 291, "lr": 5.286751074183318e-05} +{"train_loss": 0.0033591222018003464, "global_step": 34655, "epoch": 291, "lr": 5.286529887584872e-05} +{"train_loss": 0.0022056789603084326, "global_step": 34656, "epoch": 291, "lr": 5.2863087004238576e-05} +{"train_loss": 0.0021660104393959045, "global_step": 34657, "epoch": 291, "lr": 5.2860875127007046e-05} +{"train_loss": 0.0010728382039815187, "global_step": 34658, "epoch": 291, "lr": 5.28586632441585e-05} +{"train_loss": 0.00281791971065104, "global_step": 34659, "epoch": 291, "lr": 5.285645135569728e-05} +{"train_loss": 0.001883351942524314, "global_step": 34660, "epoch": 291, "lr": 5.285423946162772e-05} +{"train_loss": 0.002111740643158555, "global_step": 34661, "epoch": 291, "lr": 5.285202756195415e-05} +{"train_loss": 0.0027671807911247015, "global_step": 34662, "epoch": 291, "lr": 5.284981565668096e-05} +{"train_loss": 0.002465474419295788, "global_step": 34663, "epoch": 291, "lr": 5.284760374581245e-05} +{"train_loss": 0.0015052163507789373, "global_step": 34664, "epoch": 291, "lr": 5.284539182935297e-05} +{"train_loss": 0.0028304182924330235, "global_step": 34665, "epoch": 291, "lr": 5.284317990730685e-05} +{"train_loss": 0.0011477614752948284, "global_step": 34666, "epoch": 291, "lr": 5.284096797967847e-05} +{"train_loss": 0.0017762236529961228, "global_step": 34667, "epoch": 291, "lr": 5.283875604647215e-05} +{"train_loss": 0.002740135882049799, "global_step": 34668, "epoch": 291, "lr": 5.2836544107692245e-05} +{"train_loss": 0.0025187432765960693, "global_step": 34669, "epoch": 291, "lr": 5.283433216334306e-05} +{"train_loss": 0.0017854401376098394, "global_step": 34670, "epoch": 291, "lr": 5.283212021342898e-05} +{"train_loss": 0.003927973099052906, "global_step": 34671, "epoch": 291, "lr": 5.282990825795434e-05} +{"train_loss": 0.002707270672544837, "global_step": 34672, "epoch": 291, "lr": 5.282769629692348e-05} +{"train_loss": 0.003378012217581272, "global_step": 34673, "epoch": 291, "lr": 5.2825484330340736e-05} +{"train_loss": 0.0018712363671511412, "global_step": 34674, "epoch": 291, "lr": 5.282327235821046e-05} +{"train_loss": 0.0029829279519617558, "global_step": 34675, "epoch": 291, "lr": 5.282106038053699e-05} +{"train_loss": 0.001789282076060772, "global_step": 34676, "epoch": 291, "lr": 5.281884839732466e-05} +{"train_loss": 0.0019392359536141157, "global_step": 34677, "epoch": 291, "lr": 5.281663640857784e-05} +{"train_loss": 0.0027298624627292156, "global_step": 34678, "epoch": 291, "lr": 5.2814424414300836e-05} +{"train_loss": 0.0023173566441982985, "global_step": 34679, "epoch": 291, "lr": 5.281221241449802e-05} +{"train_loss": 0.0029524166602641344, "global_step": 34680, "epoch": 291, "lr": 5.281000040917372e-05} +{"train_loss": 0.004602690692991018, "global_step": 34681, "epoch": 291, "lr": 5.2807788398332294e-05} +{"train_loss": 0.0028391003143042326, "global_step": 34682, "epoch": 291, "lr": 5.2805576381978075e-05} +{"train_loss": 0.0014921171823516488, "global_step": 34683, "epoch": 291, "lr": 5.280336436011539e-05} +{"train_loss": 0.002729988656938076, "global_step": 34684, "epoch": 291, "lr": 5.280115233274861e-05} +{"train_loss": 0.0037227850407361984, "global_step": 34685, "epoch": 291, "lr": 5.279894029988207e-05} +{"train_loss": 0.003661057446151972, "global_step": 34686, "epoch": 291, "lr": 5.27967282615201e-05} +{"train_loss": 0.002123664366081357, "global_step": 34687, "epoch": 291, "lr": 5.279451621766706e-05} +{"train_loss": 0.001808809582144022, "global_step": 34688, "epoch": 291, "lr": 5.279230416832728e-05} +{"train_loss": 0.004106923006474972, "global_step": 34689, "epoch": 291, "lr": 5.279009211350512e-05} +{"train_loss": 0.0032640628051012754, "global_step": 34690, "epoch": 291, "lr": 5.27878800532049e-05} +{"train_loss": 0.00480499817058444, "global_step": 34691, "epoch": 291, "lr": 5.278566798743098e-05} +{"train_loss": 0.002128788735717535, "global_step": 34692, "epoch": 291, "lr": 5.2783455916187696e-05} +{"train_loss": 0.002276955172419548, "global_step": 34693, "epoch": 291, "lr": 5.278124383947941e-05} +{"train_loss": 0.0032059834338724613, "global_step": 34694, "epoch": 291, "lr": 5.2779031757310436e-05} +{"train_loss": 0.0030065590981394053, "global_step": 34695, "epoch": 291, "lr": 5.277681966968513e-05} +{"train_loss": 0.003297071671113372, "global_step": 34696, "epoch": 291, "lr": 5.2774607576607826e-05} +{"train_loss": 0.002404552884399891, "global_step": 34697, "epoch": 291, "lr": 5.2772395478082895e-05} +{"train_loss": 0.0028306529857218266, "global_step": 34698, "epoch": 291, "lr": 5.2770183374114644e-05} +{"train_loss": 0.003750622970983386, "global_step": 34699, "epoch": 291, "lr": 5.276797126470744e-05} +{"train_loss": 0.00314858416095376, "global_step": 34700, "epoch": 291, "lr": 5.276575914986564e-05} +{"train_loss": 0.0019995940383523703, "global_step": 34701, "epoch": 291, "lr": 5.276354702959354e-05} +{"train_loss": 0.001706691924482584, "global_step": 34702, "epoch": 291, "lr": 5.276133490389552e-05} +{"train_loss": 0.001218110672198236, "global_step": 34703, "epoch": 291, "lr": 5.2759122772775915e-05} +{"train_loss": 0.005117753986269236, "global_step": 34704, "epoch": 291, "lr": 5.2756910636239065e-05} +{"train_loss": 0.0030702853109687567, "global_step": 34705, "epoch": 291, "lr": 5.2754698494289315e-05} +{"train_loss": 0.0028270287439227104, "global_step": 34706, "epoch": 291, "lr": 5.2752486346931016e-05} +{"train_loss": 0.0034361989237368107, "global_step": 34707, "epoch": 291, "lr": 5.275027419416849e-05} +{"train_loss": 0.002109760884195566, "global_step": 34708, "epoch": 291, "lr": 5.274806203600611e-05} +{"train_loss": 0.0036028616596013308, "global_step": 34709, "epoch": 291, "lr": 5.274584987244819e-05} +{"train_loss": 0.0019174051703885198, "global_step": 34710, "epoch": 291, "lr": 5.2743637703499097e-05} +{"train_loss": 0.0032120109535753727, "global_step": 34711, "epoch": 291, "lr": 5.274142552916316e-05} +{"train_loss": 0.005099437199532986, "global_step": 34712, "epoch": 291, "lr": 5.273921334944474e-05} +{"train_loss": 0.002663831692188978, "global_step": 34713, "epoch": 291, "lr": 5.273700116434815e-05} +{"train_loss": 0.001531541463918984, "global_step": 34714, "epoch": 291, "lr": 5.273478897387776e-05} +{"train_loss": 0.004886633716523647, "global_step": 34715, "epoch": 291, "lr": 5.2732576778037904e-05} +{"train_loss": 0.0017487314762547612, "global_step": 34716, "epoch": 291, "lr": 5.2730364576832914e-05} +{"train_loss": 0.002820705296471715, "global_step": 34717, "epoch": 291, "lr": 5.272815237026716e-05} +{"train_loss": 0.0033417807426303625, "global_step": 34718, "epoch": 291, "lr": 5.2725940158344955e-05} +{"train_loss": 0.0023478777147829533, "global_step": 34719, "epoch": 291, "lr": 5.2723727941070666e-05} +{"train_loss": 0.0038279748987406492, "global_step": 34720, "epoch": 291, "lr": 5.272151571844863e-05} +{"train_loss": 0.004103730898350477, "global_step": 34721, "epoch": 291, "lr": 5.2719303490483187e-05} +{"train_loss": 0.0023327316157519817, "global_step": 34722, "epoch": 291, "lr": 5.271709125717868e-05} +{"train_loss": 0.002467550802975893, "global_step": 34723, "epoch": 291, "lr": 5.271487901853945e-05} +{"train_loss": 0.0016136955237016082, "global_step": 34724, "epoch": 291, "lr": 5.271266677456985e-05} +{"train_loss": 0.002291738986968994, "global_step": 34725, "epoch": 291, "lr": 5.271045452527423e-05} +{"train_loss": 0.0037282307166606188, "global_step": 34726, "epoch": 291, "lr": 5.2708242270656916e-05} +{"train_loss": 0.0022628046572208405, "global_step": 34727, "epoch": 291, "lr": 5.270603001072225e-05} +{"train_loss": 0.0024722833186388016, "global_step": 34728, "epoch": 291, "lr": 5.270381774547459e-05} +{"train_loss": 0.0035152616910636425, "global_step": 34729, "epoch": 291, "lr": 5.270160547491827e-05} +{"train_loss": 0.0027878631372004747, "global_step": 34730, "epoch": 291, "lr": 5.2699393199057635e-05} +{"train_loss": 0.002906956011429429, "global_step": 34731, "epoch": 291, "lr": 5.269718091789704e-05} +{"train_loss": 0.003796761855483055, "global_step": 34732, "epoch": 291, "lr": 5.269496863144081e-05} +{"train_loss": 0.0028344884049147367, "global_step": 34733, "epoch": 291, "lr": 5.269275633969329e-05} +{"train_loss": 0.0016152593307197094, "global_step": 34734, "epoch": 291, "lr": 5.269054404265884e-05} +{"train_loss": 0.002093506045639515, "global_step": 34735, "epoch": 291, "lr": 5.268833174034179e-05} +{"train_loss": 0.004316005390137434, "global_step": 34736, "epoch": 291, "lr": 5.2686119432746486e-05} +{"train_loss": 0.0015949406661093235, "global_step": 34737, "epoch": 291, "lr": 5.268390711987727e-05} +{"train_loss": 0.00240249908529222, "global_step": 34738, "epoch": 291, "lr": 5.26816948017385e-05} +{"train_loss": 0.002803381998091936, "global_step": 34739, "epoch": 291, "lr": 5.2679482478334495e-05} +{"train_loss": 0.0031604415271431208, "global_step": 34740, "epoch": 291, "lr": 5.2677270149669633e-05} +{"train_loss": 0.002685988089069724, "global_step": 34741, "epoch": 291, "lr": 5.267505781574822e-05} +{"train_loss": 0.0025412023533135653, "global_step": 34742, "epoch": 291, "lr": 5.2672845476574615e-05} +{"train_loss": 0.0028860862366855145, "global_step": 34743, "epoch": 291, "lr": 5.267063313215319e-05} +{"train_loss": 0.002922492567449808, "global_step": 34744, "epoch": 291, "lr": 5.266842078248824e-05} +{"train_loss": 0.003585490398108959, "global_step": 34745, "epoch": 291, "lr": 5.266620842758413e-05} +{"train_loss": 0.0015062862075865269, "global_step": 34746, "epoch": 291, "lr": 5.266399606744521e-05} +{"train_loss": 0.00267456316275663, "global_step": 34747, "epoch": 291, "lr": 5.266178370207582e-05, "val_loss": 0.019238028675317764} +{"train_loss": 0.0014920186949893832, "global_step": 34748, "epoch": 292, "lr": 5.265957133148029e-05} +{"train_loss": 0.002542741596698761, "global_step": 34749, "epoch": 292, "lr": 5.2657358955662985e-05} +{"train_loss": 0.0019282714929431677, "global_step": 34750, "epoch": 292, "lr": 5.265514657462826e-05} +{"train_loss": 0.002998956711962819, "global_step": 34751, "epoch": 292, "lr": 5.265293418838041e-05} +{"train_loss": 0.0016646857839077711, "global_step": 34752, "epoch": 292, "lr": 5.2650721796923804e-05} +{"train_loss": 0.0029594325460493565, "global_step": 34753, "epoch": 292, "lr": 5.264850940026279e-05} +{"train_loss": 0.0029887112323194742, "global_step": 34754, "epoch": 292, "lr": 5.2646296998401726e-05} +{"train_loss": 0.0012791143963113427, "global_step": 34755, "epoch": 292, "lr": 5.2644084591344935e-05} +{"train_loss": 0.004260695073753595, "global_step": 34756, "epoch": 292, "lr": 5.2641872179096773e-05} +{"train_loss": 0.002921839477494359, "global_step": 34757, "epoch": 292, "lr": 5.263965976166157e-05} +{"train_loss": 0.003436069004237652, "global_step": 34758, "epoch": 292, "lr": 5.2637447339043674e-05} +{"train_loss": 0.0016274233348667622, "global_step": 34759, "epoch": 292, "lr": 5.2635234911247443e-05} +{"train_loss": 0.00272631854750216, "global_step": 34760, "epoch": 292, "lr": 5.26330224782772e-05} +{"train_loss": 0.002251686528325081, "global_step": 34761, "epoch": 292, "lr": 5.2630810040137305e-05} +{"train_loss": 0.002121414290741086, "global_step": 34762, "epoch": 292, "lr": 5.26285975968321e-05} +{"train_loss": 0.003599907737225294, "global_step": 34763, "epoch": 292, "lr": 5.262638514836591e-05} +{"train_loss": 0.0022601147647947073, "global_step": 34764, "epoch": 292, "lr": 5.26241726947431e-05} +{"train_loss": 0.0028453334234654903, "global_step": 34765, "epoch": 292, "lr": 5.2621960235968006e-05} +{"train_loss": 0.00291417702101171, "global_step": 34766, "epoch": 292, "lr": 5.261974777204497e-05} +{"train_loss": 0.0016826860373839736, "global_step": 34767, "epoch": 292, "lr": 5.261753530297834e-05} +{"train_loss": 0.0023695200216025114, "global_step": 34768, "epoch": 292, "lr": 5.261532282877246e-05} +{"train_loss": 0.0020515150390565395, "global_step": 34769, "epoch": 292, "lr": 5.2613110349431686e-05} +{"train_loss": 0.0015505930641666055, "global_step": 34770, "epoch": 292, "lr": 5.261089786496033e-05} +{"train_loss": 0.00196602800861001, "global_step": 34771, "epoch": 292, "lr": 5.260868537536277e-05} +{"train_loss": 0.0021900131832808256, "global_step": 34772, "epoch": 292, "lr": 5.260647288064332e-05} +{"train_loss": 0.0026853950694203377, "global_step": 34773, "epoch": 292, "lr": 5.2604260380806346e-05} +{"train_loss": 0.0032130854669958353, "global_step": 34774, "epoch": 292, "lr": 5.260204787585619e-05} +{"train_loss": 0.0018680186476558447, "global_step": 34775, "epoch": 292, "lr": 5.259983536579719e-05} +{"train_loss": 0.0013706969330087304, "global_step": 34776, "epoch": 292, "lr": 5.259762285063369e-05} +{"train_loss": 0.0022837978322058916, "global_step": 34777, "epoch": 292, "lr": 5.259541033037003e-05} +{"train_loss": 0.0021489658392965794, "global_step": 34778, "epoch": 292, "lr": 5.259319780501056e-05} +{"train_loss": 0.0037655974738299847, "global_step": 34779, "epoch": 292, "lr": 5.259098527455962e-05} +{"train_loss": 0.0023080334067344666, "global_step": 34780, "epoch": 292, "lr": 5.2588772739021566e-05} +{"train_loss": 0.0014536493690684438, "global_step": 34781, "epoch": 292, "lr": 5.258656019840074e-05} +{"train_loss": 0.0022314880043268204, "global_step": 34782, "epoch": 292, "lr": 5.258434765270147e-05} +{"train_loss": 0.0027038983535021544, "global_step": 34783, "epoch": 292, "lr": 5.258213510192811e-05} +{"train_loss": 0.002269129268825054, "global_step": 34784, "epoch": 292, "lr": 5.2579922546085e-05} +{"train_loss": 0.0018686583498492837, "global_step": 34785, "epoch": 292, "lr": 5.2577709985176494e-05} +{"train_loss": 0.0018461474683135748, "global_step": 34786, "epoch": 292, "lr": 5.257549741920692e-05} +{"train_loss": 0.003438880667090416, "global_step": 34787, "epoch": 292, "lr": 5.257328484818064e-05} +{"train_loss": 0.0016133160097524524, "global_step": 34788, "epoch": 292, "lr": 5.257107227210199e-05} +{"train_loss": 0.002465622266754508, "global_step": 34789, "epoch": 292, "lr": 5.2568859690975304e-05} +{"train_loss": 0.002352853072807193, "global_step": 34790, "epoch": 292, "lr": 5.2566647104804946e-05} +{"train_loss": 0.003245267551392317, "global_step": 34791, "epoch": 292, "lr": 5.256443451359525e-05} +{"train_loss": 0.002003944478929043, "global_step": 34792, "epoch": 292, "lr": 5.256222191735055e-05} +{"train_loss": 0.0026493093464523554, "global_step": 34793, "epoch": 292, "lr": 5.256000931607521e-05} +{"train_loss": 0.002300599589943886, "global_step": 34794, "epoch": 292, "lr": 5.255779670977358e-05} +{"train_loss": 0.003820448648184538, "global_step": 34795, "epoch": 292, "lr": 5.2555584098449974e-05} +{"train_loss": 0.0013236101949587464, "global_step": 34796, "epoch": 292, "lr": 5.255337148210875e-05} +{"train_loss": 0.002233851468190551, "global_step": 34797, "epoch": 292, "lr": 5.2551158860754255e-05} +{"train_loss": 0.001685775350779295, "global_step": 34798, "epoch": 292, "lr": 5.254894623439084e-05} +{"train_loss": 0.002888366114348173, "global_step": 34799, "epoch": 292, "lr": 5.254673360302283e-05} +{"train_loss": 0.0033341008238494396, "global_step": 34800, "epoch": 292, "lr": 5.25445209666546e-05} +{"train_loss": 0.0020340504124760628, "global_step": 34801, "epoch": 292, "lr": 5.2542308325290456e-05} +{"train_loss": 0.0021465979516506195, "global_step": 34802, "epoch": 292, "lr": 5.2540095678934754e-05} +{"train_loss": 0.0016825271304696798, "global_step": 34803, "epoch": 292, "lr": 5.253788302759186e-05} +{"train_loss": 0.003574058646336198, "global_step": 34804, "epoch": 292, "lr": 5.25356703712661e-05} +{"train_loss": 0.0026888938155025244, "global_step": 34805, "epoch": 292, "lr": 5.253345770996183e-05} +{"train_loss": 0.0017538589891046286, "global_step": 34806, "epoch": 292, "lr": 5.2531245043683386e-05} +{"train_loss": 0.001805096515454352, "global_step": 34807, "epoch": 292, "lr": 5.252903237243511e-05} +{"train_loss": 0.002791882725432515, "global_step": 34808, "epoch": 292, "lr": 5.252681969622134e-05} +{"train_loss": 0.003336318302899599, "global_step": 34809, "epoch": 292, "lr": 5.252460701504644e-05} +{"train_loss": 0.002464501652866602, "global_step": 34810, "epoch": 292, "lr": 5.252239432891474e-05} +{"train_loss": 0.0020498279482126236, "global_step": 34811, "epoch": 292, "lr": 5.252018163783058e-05} +{"train_loss": 0.0022420508321374655, "global_step": 34812, "epoch": 292, "lr": 5.2517968941798336e-05} +{"train_loss": 0.003737299470230937, "global_step": 34813, "epoch": 292, "lr": 5.251575624082231e-05} +{"train_loss": 0.002486469689756632, "global_step": 34814, "epoch": 292, "lr": 5.2513543534906865e-05} +{"train_loss": 0.002658701501786709, "global_step": 34815, "epoch": 292, "lr": 5.251133082405635e-05} +{"train_loss": 0.003661646042019129, "global_step": 34816, "epoch": 292, "lr": 5.25091181082751e-05} +{"train_loss": 0.0026023013051599264, "global_step": 34817, "epoch": 292, "lr": 5.250690538756747e-05} +{"train_loss": 0.0021890848875045776, "global_step": 34818, "epoch": 292, "lr": 5.250469266193781e-05} +{"train_loss": 0.002871795790269971, "global_step": 34819, "epoch": 292, "lr": 5.250247993139044e-05} +{"train_loss": 0.0021828189492225647, "global_step": 34820, "epoch": 292, "lr": 5.250026719592971e-05} +{"train_loss": 0.001258249394595623, "global_step": 34821, "epoch": 292, "lr": 5.2498054455559986e-05} +{"train_loss": 0.0016723680309951305, "global_step": 34822, "epoch": 292, "lr": 5.249584171028559e-05} +{"train_loss": 0.002508580219000578, "global_step": 34823, "epoch": 292, "lr": 5.2493628960110875e-05} +{"train_loss": 0.0018074112012982368, "global_step": 34824, "epoch": 292, "lr": 5.24914162050402e-05} +{"train_loss": 0.002078488003462553, "global_step": 34825, "epoch": 292, "lr": 5.2489203445077894e-05} +{"train_loss": 0.0028157485648989677, "global_step": 34826, "epoch": 292, "lr": 5.24869906802283e-05} +{"train_loss": 0.0020945253781974316, "global_step": 34827, "epoch": 292, "lr": 5.248477791049575e-05} +{"train_loss": 0.0017896912759169936, "global_step": 34828, "epoch": 292, "lr": 5.248256513588462e-05} +{"train_loss": 0.0028982616495341063, "global_step": 34829, "epoch": 292, "lr": 5.248035235639923e-05} +{"train_loss": 0.0018885559402406216, "global_step": 34830, "epoch": 292, "lr": 5.247813957204394e-05} +{"train_loss": 0.002940773032605648, "global_step": 34831, "epoch": 292, "lr": 5.2475926782823094e-05} +{"train_loss": 0.0014889038866385818, "global_step": 34832, "epoch": 292, "lr": 5.2473713988741025e-05} +{"train_loss": 0.0036547696217894554, "global_step": 34833, "epoch": 292, "lr": 5.2471501189802076e-05} +{"train_loss": 0.0018405250739306211, "global_step": 34834, "epoch": 292, "lr": 5.2469288386010596e-05} +{"train_loss": 0.0009357570670545101, "global_step": 34835, "epoch": 292, "lr": 5.246707557737094e-05} +{"train_loss": 0.0019345973851159215, "global_step": 34836, "epoch": 292, "lr": 5.2464862763887444e-05} +{"train_loss": 0.0028020378667861223, "global_step": 34837, "epoch": 292, "lr": 5.246264994556444e-05} +{"train_loss": 0.0020160628482699394, "global_step": 34838, "epoch": 292, "lr": 5.24604371224063e-05} +{"train_loss": 0.0017351285787299275, "global_step": 34839, "epoch": 292, "lr": 5.245822429441736e-05} +{"train_loss": 0.002235806081444025, "global_step": 34840, "epoch": 292, "lr": 5.245601146160195e-05} +{"train_loss": 0.0018422151915729046, "global_step": 34841, "epoch": 292, "lr": 5.2453798623964426e-05} +{"train_loss": 0.002724767429754138, "global_step": 34842, "epoch": 292, "lr": 5.2451585781509125e-05} +{"train_loss": 0.002722088946029544, "global_step": 34843, "epoch": 292, "lr": 5.2449372934240407e-05} +{"train_loss": 0.0015322464751079679, "global_step": 34844, "epoch": 292, "lr": 5.244716008216261e-05} +{"train_loss": 0.0019550276920199394, "global_step": 34845, "epoch": 292, "lr": 5.244494722528006e-05} +{"train_loss": 0.002101925667375326, "global_step": 34846, "epoch": 292, "lr": 5.2442734363597124e-05} +{"train_loss": 0.002530646976083517, "global_step": 34847, "epoch": 292, "lr": 5.2440521497118146e-05} +{"train_loss": 0.003387891221791506, "global_step": 34848, "epoch": 292, "lr": 5.2438308625847455e-05} +{"train_loss": 0.002403993858024478, "global_step": 34849, "epoch": 292, "lr": 5.2436095749789415e-05} +{"train_loss": 0.0015179418260231614, "global_step": 34850, "epoch": 292, "lr": 5.243388286894837e-05} +{"train_loss": 0.0016446284716948867, "global_step": 34851, "epoch": 292, "lr": 5.243166998332862e-05} +{"train_loss": 0.0023569974582642317, "global_step": 34852, "epoch": 292, "lr": 5.242945709293458e-05} +{"train_loss": 0.0013538800412788987, "global_step": 34853, "epoch": 292, "lr": 5.2427244197770544e-05} +{"train_loss": 0.0019122489029541612, "global_step": 34854, "epoch": 292, "lr": 5.242503129784088e-05} +{"train_loss": 0.0027029456105083227, "global_step": 34855, "epoch": 292, "lr": 5.242281839314992e-05} +{"train_loss": 0.00268495618365705, "global_step": 34856, "epoch": 292, "lr": 5.2420605483702025e-05} +{"train_loss": 0.0020833497401326895, "global_step": 34857, "epoch": 292, "lr": 5.241839256950153e-05} +{"train_loss": 0.0011522517306730151, "global_step": 34858, "epoch": 292, "lr": 5.241617965055276e-05} +{"train_loss": 0.0017340952763333917, "global_step": 34859, "epoch": 292, "lr": 5.24139667268601e-05} +{"train_loss": 0.0016959293279796839, "global_step": 34860, "epoch": 292, "lr": 5.241175379842786e-05} +{"train_loss": 0.002716834656894207, "global_step": 34861, "epoch": 292, "lr": 5.240954086526041e-05} +{"train_loss": 0.002070845803245902, "global_step": 34862, "epoch": 292, "lr": 5.240732792736209e-05} +{"train_loss": 0.0020400627981871367, "global_step": 34863, "epoch": 292, "lr": 5.240511498473724e-05} +{"train_loss": 0.0025204941630363464, "global_step": 34864, "epoch": 292, "lr": 5.240290203739018e-05} +{"train_loss": 0.002158102113753557, "global_step": 34865, "epoch": 292, "lr": 5.240068908532529e-05} +{"train_loss": 0.002324903740923257, "global_step": 34866, "epoch": 292, "lr": 5.2398476128546903e-05, "val_loss": 0.010012878105044365} +{"train_loss": 0.0019525995012372732, "global_step": 34867, "epoch": 293, "lr": 5.239626316705937e-05} +{"train_loss": 0.0015376120572909713, "global_step": 34868, "epoch": 293, "lr": 5.239405020086703e-05} +{"train_loss": 0.0016322453739121556, "global_step": 34869, "epoch": 293, "lr": 5.239183722997422e-05} +{"train_loss": 0.0015707899583503604, "global_step": 34870, "epoch": 293, "lr": 5.2389624254385295e-05} +{"train_loss": 0.0022458569146692753, "global_step": 34871, "epoch": 293, "lr": 5.23874112741046e-05} +{"train_loss": 0.002559301210567355, "global_step": 34872, "epoch": 293, "lr": 5.2385198289136474e-05} +{"train_loss": 0.0037490944378077984, "global_step": 34873, "epoch": 293, "lr": 5.238298529948528e-05} +{"train_loss": 0.004406984895467758, "global_step": 34874, "epoch": 293, "lr": 5.238077230515534e-05} +{"train_loss": 0.0012816727394238114, "global_step": 34875, "epoch": 293, "lr": 5.237855930615101e-05} +{"train_loss": 0.0023254193365573883, "global_step": 34876, "epoch": 293, "lr": 5.237634630247663e-05} +{"train_loss": 0.0022298120893538, "global_step": 34877, "epoch": 293, "lr": 5.237413329413655e-05} +{"train_loss": 0.0022514553274959326, "global_step": 34878, "epoch": 293, "lr": 5.2371920281135115e-05} +{"train_loss": 0.0020199192222207785, "global_step": 34879, "epoch": 293, "lr": 5.236970726347665e-05} +{"train_loss": 0.0017162645235657692, "global_step": 34880, "epoch": 293, "lr": 5.236749424116554e-05} +{"train_loss": 0.0013014315627515316, "global_step": 34881, "epoch": 293, "lr": 5.236528121420611e-05} +{"train_loss": 0.0025431551039218903, "global_step": 34882, "epoch": 293, "lr": 5.236306818260269e-05} +{"train_loss": 0.002027517417445779, "global_step": 34883, "epoch": 293, "lr": 5.236085514635964e-05} +{"train_loss": 0.0025898267049342394, "global_step": 34884, "epoch": 293, "lr": 5.23586421054813e-05} +{"train_loss": 0.0026668431237339973, "global_step": 34885, "epoch": 293, "lr": 5.2356429059972025e-05} +{"train_loss": 0.0019307313486933708, "global_step": 34886, "epoch": 293, "lr": 5.2354216009836144e-05} +{"train_loss": 0.0018494741525501013, "global_step": 34887, "epoch": 293, "lr": 5.235200295507802e-05} +{"train_loss": 0.004432254005223513, "global_step": 34888, "epoch": 293, "lr": 5.2349789895702e-05} +{"train_loss": 0.001423272187821567, "global_step": 34889, "epoch": 293, "lr": 5.23475768317124e-05} +{"train_loss": 0.0019042467465624213, "global_step": 34890, "epoch": 293, "lr": 5.2345363763113586e-05} +{"train_loss": 0.003041391260921955, "global_step": 34891, "epoch": 293, "lr": 5.23431506899099e-05} +{"train_loss": 0.001567200175486505, "global_step": 34892, "epoch": 293, "lr": 5.23409376121057e-05} +{"train_loss": 0.0012203715741634369, "global_step": 34893, "epoch": 293, "lr": 5.233872452970531e-05} +{"train_loss": 0.0021146961953490973, "global_step": 34894, "epoch": 293, "lr": 5.23365114427131e-05} +{"train_loss": 0.0016893367283046246, "global_step": 34895, "epoch": 293, "lr": 5.233429835113338e-05} +{"train_loss": 0.0032481530215591192, "global_step": 34896, "epoch": 293, "lr": 5.233208525497052e-05} +{"train_loss": 0.0023548526223748922, "global_step": 34897, "epoch": 293, "lr": 5.2329872154228855e-05} +{"train_loss": 0.0027987079229205847, "global_step": 34898, "epoch": 293, "lr": 5.2327659048912736e-05} +{"train_loss": 0.0036528087221086025, "global_step": 34899, "epoch": 293, "lr": 5.232544593902652e-05} +{"train_loss": 0.003150650067254901, "global_step": 34900, "epoch": 293, "lr": 5.232323282457452e-05} +{"train_loss": 0.0026253932155668736, "global_step": 34901, "epoch": 293, "lr": 5.232101970556111e-05} +{"train_loss": 0.0032681291922926903, "global_step": 34902, "epoch": 293, "lr": 5.2318806581990633e-05} +{"train_loss": 0.00298661389388144, "global_step": 34903, "epoch": 293, "lr": 5.231659345386741e-05} +{"train_loss": 0.003351422492414713, "global_step": 34904, "epoch": 293, "lr": 5.231438032119582e-05} +{"train_loss": 0.0011785299284383655, "global_step": 34905, "epoch": 293, "lr": 5.2312167183980184e-05} +{"train_loss": 0.0029588311444967985, "global_step": 34906, "epoch": 293, "lr": 5.230995404222486e-05} +{"train_loss": 0.002870063064619899, "global_step": 34907, "epoch": 293, "lr": 5.230774089593419e-05} +{"train_loss": 0.0036584092304110527, "global_step": 34908, "epoch": 293, "lr": 5.230552774511251e-05} +{"train_loss": 0.0021140086464583874, "global_step": 34909, "epoch": 293, "lr": 5.2303314589764175e-05} +{"train_loss": 0.0031433128751814365, "global_step": 34910, "epoch": 293, "lr": 5.230110142989353e-05} +{"train_loss": 0.0020408835262060165, "global_step": 34911, "epoch": 293, "lr": 5.2298888265504905e-05} +{"train_loss": 0.0019471296109259129, "global_step": 34912, "epoch": 293, "lr": 5.229667509660268e-05} +{"train_loss": 0.0017993043875321746, "global_step": 34913, "epoch": 293, "lr": 5.2294461923191176e-05} +{"train_loss": 0.0017180234426632524, "global_step": 34914, "epoch": 293, "lr": 5.229224874527473e-05} +{"train_loss": 0.002153734676539898, "global_step": 34915, "epoch": 293, "lr": 5.2290035562857695e-05} +{"train_loss": 0.0017152032814919949, "global_step": 34916, "epoch": 293, "lr": 5.228782237594443e-05} +{"train_loss": 0.003855411196127534, "global_step": 34917, "epoch": 293, "lr": 5.2285609184539264e-05} +{"train_loss": 0.0012621444184333086, "global_step": 34918, "epoch": 293, "lr": 5.2283395988646544e-05} +{"train_loss": 0.003291006665676832, "global_step": 34919, "epoch": 293, "lr": 5.2281182788270634e-05} +{"train_loss": 0.002850291086360812, "global_step": 34920, "epoch": 293, "lr": 5.227896958341585e-05} +{"train_loss": 0.0018223098013550043, "global_step": 34921, "epoch": 293, "lr": 5.227675637408656e-05} +{"train_loss": 0.0023362403735518456, "global_step": 34922, "epoch": 293, "lr": 5.22745431602871e-05} +{"train_loss": 0.0021500876173377037, "global_step": 34923, "epoch": 293, "lr": 5.227232994202183e-05} +{"train_loss": 0.0029946540016680956, "global_step": 34924, "epoch": 293, "lr": 5.2270116719295056e-05} +{"train_loss": 0.0025720749981701374, "global_step": 34925, "epoch": 293, "lr": 5.2267903492111183e-05} +{"train_loss": 0.0012735493946820498, "global_step": 34926, "epoch": 293, "lr": 5.2265690260474506e-05} +{"train_loss": 0.0022125770337879658, "global_step": 34927, "epoch": 293, "lr": 5.2263477024389395e-05} +{"train_loss": 0.0018653830047696829, "global_step": 34928, "epoch": 293, "lr": 5.226126378386018e-05} +{"train_loss": 0.0023874961771070957, "global_step": 34929, "epoch": 293, "lr": 5.225905053889122e-05} +{"train_loss": 0.003557243151590228, "global_step": 34930, "epoch": 293, "lr": 5.225683728948685e-05} +{"train_loss": 0.00278186472132802, "global_step": 34931, "epoch": 293, "lr": 5.2254624035651446e-05} +{"train_loss": 0.0025439828168600798, "global_step": 34932, "epoch": 293, "lr": 5.2252410777389304e-05} +{"train_loss": 0.0018124490743502975, "global_step": 34933, "epoch": 293, "lr": 5.225019751470479e-05} +{"train_loss": 0.0030260926578193903, "global_step": 34934, "epoch": 293, "lr": 5.224798424760227e-05} +{"train_loss": 0.00213408749550581, "global_step": 34935, "epoch": 293, "lr": 5.224577097608605e-05} +{"train_loss": 0.0024518684949725866, "global_step": 34936, "epoch": 293, "lr": 5.2243557700160515e-05} +{"train_loss": 0.0018063385505229235, "global_step": 34937, "epoch": 293, "lr": 5.224134441982999e-05} +{"train_loss": 0.0025922853965312243, "global_step": 34938, "epoch": 293, "lr": 5.223913113509884e-05} +{"train_loss": 0.003043130971491337, "global_step": 34939, "epoch": 293, "lr": 5.223691784597138e-05} +{"train_loss": 0.0018761049723252654, "global_step": 34940, "epoch": 293, "lr": 5.223470455245197e-05} +{"train_loss": 0.001796140568330884, "global_step": 34941, "epoch": 293, "lr": 5.2232491254544955e-05} +{"train_loss": 0.0025840343441814184, "global_step": 34942, "epoch": 293, "lr": 5.223027795225469e-05} +{"train_loss": 0.002497429959475994, "global_step": 34943, "epoch": 293, "lr": 5.2228064645585504e-05} +{"train_loss": 0.002051341813057661, "global_step": 34944, "epoch": 293, "lr": 5.222585133454178e-05} +{"train_loss": 0.0026782306376844645, "global_step": 34945, "epoch": 293, "lr": 5.222363801912781e-05} +{"train_loss": 0.003359529422596097, "global_step": 34946, "epoch": 293, "lr": 5.2221424699347955e-05} +{"train_loss": 0.0034379709977656603, "global_step": 34947, "epoch": 293, "lr": 5.221921137520658e-05} +{"train_loss": 0.00173160620033741, "global_step": 34948, "epoch": 293, "lr": 5.221699804670802e-05} +{"train_loss": 0.002409596461802721, "global_step": 34949, "epoch": 293, "lr": 5.221478471385662e-05} +{"train_loss": 0.0018804949941113591, "global_step": 34950, "epoch": 293, "lr": 5.221257137665674e-05} +{"train_loss": 0.002091726753860712, "global_step": 34951, "epoch": 293, "lr": 5.2210358035112696e-05} +{"train_loss": 0.002685246290639043, "global_step": 34952, "epoch": 293, "lr": 5.220814468922885e-05} +{"train_loss": 0.0016535884933546185, "global_step": 34953, "epoch": 293, "lr": 5.220593133900955e-05} +{"train_loss": 0.001759146573022008, "global_step": 34954, "epoch": 293, "lr": 5.2203717984459147e-05} +{"train_loss": 0.0020695021376013756, "global_step": 34955, "epoch": 293, "lr": 5.220150462558198e-05} +{"train_loss": 0.002170132240280509, "global_step": 34956, "epoch": 293, "lr": 5.2199291262382396e-05} +{"train_loss": 0.0017591915093362331, "global_step": 34957, "epoch": 293, "lr": 5.2197077894864734e-05} +{"train_loss": 0.001684584654867649, "global_step": 34958, "epoch": 293, "lr": 5.219486452303334e-05} +{"train_loss": 0.0032662299927324057, "global_step": 34959, "epoch": 293, "lr": 5.2192651146892554e-05} +{"train_loss": 0.0023687221109867096, "global_step": 34960, "epoch": 293, "lr": 5.2190437766446757e-05} +{"train_loss": 0.0030199321918189526, "global_step": 34961, "epoch": 293, "lr": 5.218822438170025e-05} +{"train_loss": 0.0025043224450200796, "global_step": 34962, "epoch": 293, "lr": 5.21860109926574e-05} +{"train_loss": 0.0011579105630517006, "global_step": 34963, "epoch": 293, "lr": 5.218379759932257e-05} +{"train_loss": 0.0026147926691919565, "global_step": 34964, "epoch": 293, "lr": 5.218158420170007e-05} +{"train_loss": 0.0024398001842200756, "global_step": 34965, "epoch": 293, "lr": 5.217937079979426e-05} +{"train_loss": 0.003200179897248745, "global_step": 34966, "epoch": 293, "lr": 5.217715739360949e-05} +{"train_loss": 0.00301925977692008, "global_step": 34967, "epoch": 293, "lr": 5.2174943983150104e-05} +{"train_loss": 0.0019122911617159843, "global_step": 34968, "epoch": 293, "lr": 5.217273056842046e-05} +{"train_loss": 0.0018530536908656359, "global_step": 34969, "epoch": 293, "lr": 5.217051714942488e-05} +{"train_loss": 0.002445447724312544, "global_step": 34970, "epoch": 293, "lr": 5.2168303726167724e-05} +{"train_loss": 0.0025709134060889482, "global_step": 34971, "epoch": 293, "lr": 5.216609029865332e-05} +{"train_loss": 0.0015306345885619521, "global_step": 34972, "epoch": 293, "lr": 5.216387686688605e-05} +{"train_loss": 0.0015711220912635326, "global_step": 34973, "epoch": 293, "lr": 5.2161663430870235e-05} +{"train_loss": 0.002958358032628894, "global_step": 34974, "epoch": 293, "lr": 5.2159449990610224e-05} +{"train_loss": 0.0022770827636122704, "global_step": 34975, "epoch": 293, "lr": 5.2157236546110365e-05} +{"train_loss": 0.0029992207419127226, "global_step": 34976, "epoch": 293, "lr": 5.2155023097374997e-05} +{"train_loss": 0.0014647352509200573, "global_step": 34977, "epoch": 293, "lr": 5.215280964440848e-05} +{"train_loss": 0.0022756834514439106, "global_step": 34978, "epoch": 293, "lr": 5.215059618721515e-05} +{"train_loss": 0.0014974805526435375, "global_step": 34979, "epoch": 293, "lr": 5.214838272579935e-05} +{"train_loss": 0.0015714939218014479, "global_step": 34980, "epoch": 293, "lr": 5.2146169260165425e-05} +{"train_loss": 0.003160610096529126, "global_step": 34981, "epoch": 293, "lr": 5.2143955790317747e-05} +{"train_loss": 0.002320149913430214, "global_step": 34982, "epoch": 293, "lr": 5.214174231626061e-05} +{"train_loss": 0.0016858219169080257, "global_step": 34983, "epoch": 293, "lr": 5.21395288379984e-05} +{"train_loss": 0.0017258557491004467, "global_step": 34984, "epoch": 293, "lr": 5.213731535553545e-05} +{"train_loss": 0.002353684715496204, "global_step": 34985, "epoch": 293, "lr": 5.213510186887612e-05, "val_loss": 0.012635220773518085} +{"train_loss": 0.002029955154284835, "global_step": 34986, "epoch": 294, "lr": 5.2132888378024744e-05} +{"train_loss": 0.0022695097140967846, "global_step": 34987, "epoch": 294, "lr": 5.2130674882985675e-05} +{"train_loss": 0.0013108575949445367, "global_step": 34988, "epoch": 294, "lr": 5.212846138376326e-05} +{"train_loss": 0.0025722715072333813, "global_step": 34989, "epoch": 294, "lr": 5.212624788036182e-05} +{"train_loss": 0.0013119981158524752, "global_step": 34990, "epoch": 294, "lr": 5.212403437278572e-05} +{"train_loss": 0.003576428396627307, "global_step": 34991, "epoch": 294, "lr": 5.2121820861039316e-05} +{"train_loss": 0.0024890468921512365, "global_step": 34992, "epoch": 294, "lr": 5.211960734512694e-05} +{"train_loss": 0.0034428806975483894, "global_step": 34993, "epoch": 294, "lr": 5.211739382505294e-05} +{"train_loss": 0.001841670018620789, "global_step": 34994, "epoch": 294, "lr": 5.2115180300821675e-05} +{"train_loss": 0.0023606542963534594, "global_step": 34995, "epoch": 294, "lr": 5.211296677243747e-05} +{"train_loss": 0.0013996998313814402, "global_step": 34996, "epoch": 294, "lr": 5.2110753239904675e-05} +{"train_loss": 0.0036817402578890324, "global_step": 34997, "epoch": 294, "lr": 5.210853970322764e-05} +{"train_loss": 0.0017693222034722567, "global_step": 34998, "epoch": 294, "lr": 5.2106326162410725e-05} +{"train_loss": 0.0019176427740603685, "global_step": 34999, "epoch": 294, "lr": 5.2104112617458254e-05} +{"train_loss": 0.0019910275004804134, "global_step": 35000, "epoch": 294, "lr": 5.210189906837458e-05} +{"train_loss": 0.0021986921783536673, "global_step": 35001, "epoch": 294, "lr": 5.209968551516407e-05} +{"train_loss": 0.0019093435257673264, "global_step": 35002, "epoch": 294, "lr": 5.2097471957831024e-05} +{"train_loss": 0.0032581735868006945, "global_step": 35003, "epoch": 294, "lr": 5.209525839637983e-05} +{"train_loss": 0.0017266646027565002, "global_step": 35004, "epoch": 294, "lr": 5.209304483081482e-05} +{"train_loss": 0.002519164700061083, "global_step": 35005, "epoch": 294, "lr": 5.2090831261140336e-05} +{"train_loss": 0.003839548211544752, "global_step": 35006, "epoch": 294, "lr": 5.208861768736074e-05} +{"train_loss": 0.001365878852084279, "global_step": 35007, "epoch": 294, "lr": 5.208640410948037e-05} +{"train_loss": 0.00347869168035686, "global_step": 35008, "epoch": 294, "lr": 5.208419052750355e-05} +{"train_loss": 0.0018754337215796113, "global_step": 35009, "epoch": 294, "lr": 5.208197694143466e-05} +{"train_loss": 0.0034301162231713533, "global_step": 35010, "epoch": 294, "lr": 5.207976335127802e-05} +{"train_loss": 0.0030134322587400675, "global_step": 35011, "epoch": 294, "lr": 5.207754975703799e-05} +{"train_loss": 0.0012446101754903793, "global_step": 35012, "epoch": 294, "lr": 5.2075336158718915e-05} +{"train_loss": 0.0033494923263788223, "global_step": 35013, "epoch": 294, "lr": 5.2073122556325136e-05} +{"train_loss": 0.0035224154125899076, "global_step": 35014, "epoch": 294, "lr": 5.207090894986101e-05} +{"train_loss": 0.0017551922937855124, "global_step": 35015, "epoch": 294, "lr": 5.206869533933086e-05} +{"train_loss": 0.0025949273258447647, "global_step": 35016, "epoch": 294, "lr": 5.206648172473906e-05} +{"train_loss": 0.004446676000952721, "global_step": 35017, "epoch": 294, "lr": 5.206426810608994e-05} +{"train_loss": 0.002906164387241006, "global_step": 35018, "epoch": 294, "lr": 5.206205448338784e-05} +{"train_loss": 0.0013464224757626653, "global_step": 35019, "epoch": 294, "lr": 5.205984085663713e-05} +{"train_loss": 0.0027505261823534966, "global_step": 35020, "epoch": 294, "lr": 5.205762722584214e-05} +{"train_loss": 0.0019400098826736212, "global_step": 35021, "epoch": 294, "lr": 5.2055413591007215e-05} +{"train_loss": 0.0020079759415239096, "global_step": 35022, "epoch": 294, "lr": 5.205319995213671e-05} +{"train_loss": 0.00179380364716053, "global_step": 35023, "epoch": 294, "lr": 5.205098630923497e-05} +{"train_loss": 0.003395606065168977, "global_step": 35024, "epoch": 294, "lr": 5.2048772662306336e-05} +{"train_loss": 0.003243716200813651, "global_step": 35025, "epoch": 294, "lr": 5.204655901135515e-05} +{"train_loss": 0.0022031154949218035, "global_step": 35026, "epoch": 294, "lr": 5.2044345356385774e-05} +{"train_loss": 0.0023668543435633183, "global_step": 35027, "epoch": 294, "lr": 5.204213169740253e-05} +{"train_loss": 0.0024130658712238073, "global_step": 35028, "epoch": 294, "lr": 5.2039918034409784e-05} +{"train_loss": 0.005139009561389685, "global_step": 35029, "epoch": 294, "lr": 5.203770436741188e-05} +{"train_loss": 0.002750869607552886, "global_step": 35030, "epoch": 294, "lr": 5.2035490696413155e-05} +{"train_loss": 0.0027442281134426594, "global_step": 35031, "epoch": 294, "lr": 5.203327702141797e-05} +{"train_loss": 0.001318452414125204, "global_step": 35032, "epoch": 294, "lr": 5.203106334243065e-05} +{"train_loss": 0.0018648020923137665, "global_step": 35033, "epoch": 294, "lr": 5.2028849659455556e-05} +{"train_loss": 0.003334341337904334, "global_step": 35034, "epoch": 294, "lr": 5.202663597249704e-05} +{"train_loss": 0.0018629210535436869, "global_step": 35035, "epoch": 294, "lr": 5.202442228155944e-05} +{"train_loss": 0.0024213579017668962, "global_step": 35036, "epoch": 294, "lr": 5.2022208586647105e-05} +{"train_loss": 0.002223944291472435, "global_step": 35037, "epoch": 294, "lr": 5.201999488776438e-05} +{"train_loss": 0.0027790332678705454, "global_step": 35038, "epoch": 294, "lr": 5.201778118491562e-05} +{"train_loss": 0.003933676518499851, "global_step": 35039, "epoch": 294, "lr": 5.2015567478105145e-05} +{"train_loss": 0.0018141448963433504, "global_step": 35040, "epoch": 294, "lr": 5.201335376733732e-05} +{"train_loss": 0.0021750517189502716, "global_step": 35041, "epoch": 294, "lr": 5.201114005261649e-05} +{"train_loss": 0.0023674487601965666, "global_step": 35042, "epoch": 294, "lr": 5.200892633394701e-05} +{"train_loss": 0.002100195037201047, "global_step": 35043, "epoch": 294, "lr": 5.2006712611333206e-05} +{"train_loss": 0.0024297249037772417, "global_step": 35044, "epoch": 294, "lr": 5.2004498884779454e-05} +{"train_loss": 0.0017018356593325734, "global_step": 35045, "epoch": 294, "lr": 5.2002285154290074e-05} +{"train_loss": 0.0011563855223357677, "global_step": 35046, "epoch": 294, "lr": 5.200007141986941e-05} +{"train_loss": 0.0036037475802004337, "global_step": 35047, "epoch": 294, "lr": 5.1997857681521837e-05} +{"train_loss": 0.0029522294644266367, "global_step": 35048, "epoch": 294, "lr": 5.199564393925167e-05} +{"train_loss": 0.0023369358386844397, "global_step": 35049, "epoch": 294, "lr": 5.1993430193063276e-05} +{"train_loss": 0.001380088971927762, "global_step": 35050, "epoch": 294, "lr": 5.199121644296099e-05} +{"train_loss": 0.0030563732143491507, "global_step": 35051, "epoch": 294, "lr": 5.198900268894916e-05} +{"train_loss": 0.0024169012904167175, "global_step": 35052, "epoch": 294, "lr": 5.198678893103215e-05} +{"train_loss": 0.0028151085134595633, "global_step": 35053, "epoch": 294, "lr": 5.198457516921428e-05} +{"train_loss": 0.002096465788781643, "global_step": 35054, "epoch": 294, "lr": 5.198236140349991e-05} +{"train_loss": 0.0026432941667735577, "global_step": 35055, "epoch": 294, "lr": 5.1980147633893385e-05} +{"train_loss": 0.001973872072994709, "global_step": 35056, "epoch": 294, "lr": 5.197793386039905e-05} +{"train_loss": 0.0022157151252031326, "global_step": 35057, "epoch": 294, "lr": 5.1975720083021276e-05} +{"train_loss": 0.0019083573715761304, "global_step": 35058, "epoch": 294, "lr": 5.197350630176436e-05} +{"train_loss": 0.003419002750888467, "global_step": 35059, "epoch": 294, "lr": 5.197129251663269e-05} +{"train_loss": 0.002984466264024377, "global_step": 35060, "epoch": 294, "lr": 5.1969078727630585e-05} +{"train_loss": 0.0015253305900841951, "global_step": 35061, "epoch": 294, "lr": 5.196686493476241e-05} +{"train_loss": 0.0010425401851534843, "global_step": 35062, "epoch": 294, "lr": 5.19646511380325e-05} +{"train_loss": 0.0024244398809969425, "global_step": 35063, "epoch": 294, "lr": 5.196243733744524e-05} +{"train_loss": 0.002230099169537425, "global_step": 35064, "epoch": 294, "lr": 5.19602235330049e-05} +{"train_loss": 0.0021084528416395187, "global_step": 35065, "epoch": 294, "lr": 5.195800972471589e-05} +{"train_loss": 0.002298787236213684, "global_step": 35066, "epoch": 294, "lr": 5.195579591258254e-05} +{"train_loss": 0.0022140606306493282, "global_step": 35067, "epoch": 294, "lr": 5.195358209660918e-05} +{"train_loss": 0.001509615103714168, "global_step": 35068, "epoch": 294, "lr": 5.1951368276800173e-05} +{"train_loss": 0.002903902204707265, "global_step": 35069, "epoch": 294, "lr": 5.194915445315988e-05} +{"train_loss": 0.001547010033391416, "global_step": 35070, "epoch": 294, "lr": 5.194694062569262e-05} +{"train_loss": 0.00247393362224102, "global_step": 35071, "epoch": 294, "lr": 5.194472679440274e-05} +{"train_loss": 0.0019991635344922543, "global_step": 35072, "epoch": 294, "lr": 5.194251295929461e-05} +{"train_loss": 0.0023355756420642138, "global_step": 35073, "epoch": 294, "lr": 5.194029912037256e-05} +{"train_loss": 0.004573761951178312, "global_step": 35074, "epoch": 294, "lr": 5.193808527764095e-05} +{"train_loss": 0.0017983608413487673, "global_step": 35075, "epoch": 294, "lr": 5.193587143110411e-05} +{"train_loss": 0.0016287117032334208, "global_step": 35076, "epoch": 294, "lr": 5.193365758076638e-05} +{"train_loss": 0.00268960022367537, "global_step": 35077, "epoch": 294, "lr": 5.193144372663213e-05} +{"train_loss": 0.0016677206149324775, "global_step": 35078, "epoch": 294, "lr": 5.19292298687057e-05} +{"train_loss": 0.002307617338374257, "global_step": 35079, "epoch": 294, "lr": 5.192701600699143e-05} +{"train_loss": 0.0026708533987402916, "global_step": 35080, "epoch": 294, "lr": 5.192480214149367e-05} +{"train_loss": 0.0023435931652784348, "global_step": 35081, "epoch": 294, "lr": 5.192258827221676e-05} +{"train_loss": 0.0019657807424664497, "global_step": 35082, "epoch": 294, "lr": 5.192037439916506e-05} +{"train_loss": 0.0018561752513051033, "global_step": 35083, "epoch": 294, "lr": 5.191816052234291e-05} +{"train_loss": 0.002302010776475072, "global_step": 35084, "epoch": 294, "lr": 5.1915946641754656e-05} +{"train_loss": 0.0016257480019703507, "global_step": 35085, "epoch": 294, "lr": 5.191373275740464e-05} +{"train_loss": 0.0021223360672593117, "global_step": 35086, "epoch": 294, "lr": 5.1911518869297224e-05} +{"train_loss": 0.0019747193437069654, "global_step": 35087, "epoch": 294, "lr": 5.190930497743674e-05} +{"train_loss": 0.0018247164553031325, "global_step": 35088, "epoch": 294, "lr": 5.1907091081827555e-05} +{"train_loss": 0.0009341348195448518, "global_step": 35089, "epoch": 294, "lr": 5.190487718247398e-05} +{"train_loss": 0.0044528706930577755, "global_step": 35090, "epoch": 294, "lr": 5.190266327938038e-05} +{"train_loss": 0.001996344421058893, "global_step": 35091, "epoch": 294, "lr": 5.190044937255112e-05} +{"train_loss": 0.0034300778061151505, "global_step": 35092, "epoch": 294, "lr": 5.189823546199052e-05} +{"train_loss": 0.0023031258024275303, "global_step": 35093, "epoch": 294, "lr": 5.189602154770293e-05} +{"train_loss": 0.0026822485961019993, "global_step": 35094, "epoch": 294, "lr": 5.189380762969272e-05} +{"train_loss": 0.0018559308955445886, "global_step": 35095, "epoch": 294, "lr": 5.189159370796422e-05} +{"train_loss": 0.003041283693164587, "global_step": 35096, "epoch": 294, "lr": 5.1889379782521774e-05} +{"train_loss": 0.0022382852621376514, "global_step": 35097, "epoch": 294, "lr": 5.1887165853369734e-05} +{"train_loss": 0.00151209463365376, "global_step": 35098, "epoch": 294, "lr": 5.1884951920512433e-05} +{"train_loss": 0.002041249768808484, "global_step": 35099, "epoch": 294, "lr": 5.188273798395424e-05} +{"train_loss": 0.0017204384785145521, "global_step": 35100, "epoch": 294, "lr": 5.18805240436995e-05} +{"train_loss": 0.0012814677320420742, "global_step": 35101, "epoch": 294, "lr": 5.1878310099752544e-05} +{"train_loss": 0.003964865580201149, "global_step": 35102, "epoch": 294, "lr": 5.1876096152117724e-05} +{"train_loss": 0.002588993404060602, "global_step": 35103, "epoch": 294, "lr": 5.1873882200799395e-05} +{"train_loss": 0.002378636788177703, "global_step": 35104, "epoch": 294, "lr": 5.18716682458019e-05, "val_loss": 0.015054414980113506} +{"train_loss": 0.0017724235076457262, "global_step": 35105, "epoch": 295, "lr": 5.186945428712957e-05} +{"train_loss": 0.002194628119468689, "global_step": 35106, "epoch": 295, "lr": 5.186724032478678e-05} +{"train_loss": 0.001582391676492989, "global_step": 35107, "epoch": 295, "lr": 5.186502635877787e-05} +{"train_loss": 0.0025403499603271484, "global_step": 35108, "epoch": 295, "lr": 5.186281238910718e-05} +{"train_loss": 0.002028432209044695, "global_step": 35109, "epoch": 295, "lr": 5.1860598415779035e-05} +{"train_loss": 0.0023140106350183487, "global_step": 35110, "epoch": 295, "lr": 5.1858384438797816e-05} +{"train_loss": 0.002647955669090152, "global_step": 35111, "epoch": 295, "lr": 5.185617045816785e-05} +{"train_loss": 0.0026281392201781273, "global_step": 35112, "epoch": 295, "lr": 5.185395647389351e-05} +{"train_loss": 0.002281229244545102, "global_step": 35113, "epoch": 295, "lr": 5.1851742485979114e-05} +{"train_loss": 0.001492618815973401, "global_step": 35114, "epoch": 295, "lr": 5.1849528494429024e-05} +{"train_loss": 0.0031726243905723095, "global_step": 35115, "epoch": 295, "lr": 5.184731449924757e-05} +{"train_loss": 0.002514416119083762, "global_step": 35116, "epoch": 295, "lr": 5.1845100500439116e-05} +{"train_loss": 0.0024223809596151114, "global_step": 35117, "epoch": 295, "lr": 5.1842886498008e-05} +{"train_loss": 0.001807168242521584, "global_step": 35118, "epoch": 295, "lr": 5.1840672491958575e-05} +{"train_loss": 0.0019488404504954815, "global_step": 35119, "epoch": 295, "lr": 5.183845848229521e-05} +{"train_loss": 0.001678748638369143, "global_step": 35120, "epoch": 295, "lr": 5.18362444690222e-05} +{"train_loss": 0.0018030714709311724, "global_step": 35121, "epoch": 295, "lr": 5.183403045214393e-05} +{"train_loss": 0.0028842883184552193, "global_step": 35122, "epoch": 295, "lr": 5.183181643166474e-05} +{"train_loss": 0.0019433395937085152, "global_step": 35123, "epoch": 295, "lr": 5.1829602407588976e-05} +{"train_loss": 0.003060565795749426, "global_step": 35124, "epoch": 295, "lr": 5.1827388379920974e-05} +{"train_loss": 0.0011437700595706701, "global_step": 35125, "epoch": 295, "lr": 5.1825174348665096e-05} +{"train_loss": 0.0034435447305440903, "global_step": 35126, "epoch": 295, "lr": 5.1822960313825686e-05} +{"train_loss": 0.0031935477163642645, "global_step": 35127, "epoch": 295, "lr": 5.182074627540709e-05} +{"train_loss": 0.0017485120333731174, "global_step": 35128, "epoch": 295, "lr": 5.181853223341364e-05} +{"train_loss": 0.002013210440054536, "global_step": 35129, "epoch": 295, "lr": 5.18163181878497e-05} +{"train_loss": 0.0022601496893912554, "global_step": 35130, "epoch": 295, "lr": 5.181410413871962e-05} +{"train_loss": 0.0038490956649184227, "global_step": 35131, "epoch": 295, "lr": 5.181189008602774e-05} +{"train_loss": 0.0018881208961829543, "global_step": 35132, "epoch": 295, "lr": 5.18096760297784e-05} +{"train_loss": 0.003333853790536523, "global_step": 35133, "epoch": 295, "lr": 5.180746196997596e-05} +{"train_loss": 0.0026913511101156473, "global_step": 35134, "epoch": 295, "lr": 5.1805247906624756e-05} +{"train_loss": 0.0031701247207820415, "global_step": 35135, "epoch": 295, "lr": 5.180303383972914e-05} +{"train_loss": 0.002595246536657214, "global_step": 35136, "epoch": 295, "lr": 5.180081976929346e-05} +{"train_loss": 0.0018989661475643516, "global_step": 35137, "epoch": 295, "lr": 5.1798605695322065e-05} +{"train_loss": 0.002868455136194825, "global_step": 35138, "epoch": 295, "lr": 5.179639161781932e-05} +{"train_loss": 0.0020217658020555973, "global_step": 35139, "epoch": 295, "lr": 5.1794177536789536e-05} +{"train_loss": 0.0023662985768169165, "global_step": 35140, "epoch": 295, "lr": 5.179196345223707e-05} +{"train_loss": 0.0023874451871961355, "global_step": 35141, "epoch": 295, "lr": 5.1789749364166275e-05} +{"train_loss": 0.0020868030842393637, "global_step": 35142, "epoch": 295, "lr": 5.17875352725815e-05} +{"train_loss": 0.002857838524505496, "global_step": 35143, "epoch": 295, "lr": 5.17853211774871e-05} +{"train_loss": 0.0027893218211829662, "global_step": 35144, "epoch": 295, "lr": 5.178310707888742e-05} +{"train_loss": 0.0012305889977142215, "global_step": 35145, "epoch": 295, "lr": 5.1780892976786776e-05} +{"train_loss": 0.003966327290982008, "global_step": 35146, "epoch": 295, "lr": 5.177867887118955e-05} +{"train_loss": 0.002391181653365493, "global_step": 35147, "epoch": 295, "lr": 5.1776464762100076e-05} +{"train_loss": 0.0033673366997390985, "global_step": 35148, "epoch": 295, "lr": 5.1774250649522706e-05} +{"train_loss": 0.002381098223850131, "global_step": 35149, "epoch": 295, "lr": 5.1772036533461774e-05} +{"train_loss": 0.002611317904666066, "global_step": 35150, "epoch": 295, "lr": 5.1769822413921644e-05} +{"train_loss": 0.002778794150799513, "global_step": 35151, "epoch": 295, "lr": 5.176760829090665e-05} +{"train_loss": 0.0025227628648281097, "global_step": 35152, "epoch": 295, "lr": 5.1765394164421165e-05} +{"train_loss": 0.003275039605796337, "global_step": 35153, "epoch": 295, "lr": 5.17631800344695e-05} +{"train_loss": 0.00188964803237468, "global_step": 35154, "epoch": 295, "lr": 5.176096590105602e-05} +{"train_loss": 0.0032497704960405827, "global_step": 35155, "epoch": 295, "lr": 5.1758751764185084e-05} +{"train_loss": 0.0023532193154096603, "global_step": 35156, "epoch": 295, "lr": 5.175653762386102e-05} +{"train_loss": 0.0018001166172325611, "global_step": 35157, "epoch": 295, "lr": 5.1754323480088195e-05} +{"train_loss": 0.0018073839601129293, "global_step": 35158, "epoch": 295, "lr": 5.1752109332870924e-05} +{"train_loss": 0.002266290131956339, "global_step": 35159, "epoch": 295, "lr": 5.174989518221358e-05} +{"train_loss": 0.0015780263347551227, "global_step": 35160, "epoch": 295, "lr": 5.174768102812051e-05} +{"train_loss": 0.0028499653562903404, "global_step": 35161, "epoch": 295, "lr": 5.174546687059605e-05} +{"train_loss": 0.0028332762885838747, "global_step": 35162, "epoch": 295, "lr": 5.174325270964454e-05} +{"train_loss": 0.004238214809447527, "global_step": 35163, "epoch": 295, "lr": 5.174103854527036e-05} +{"train_loss": 0.0028559481725096703, "global_step": 35164, "epoch": 295, "lr": 5.173882437747783e-05} +{"train_loss": 0.0023936545476317406, "global_step": 35165, "epoch": 295, "lr": 5.173661020627128e-05} +{"train_loss": 0.0037971220444887877, "global_step": 35166, "epoch": 295, "lr": 5.1734396031655105e-05} +{"train_loss": 0.0027732711751013994, "global_step": 35167, "epoch": 295, "lr": 5.173218185363363e-05} +{"train_loss": 0.0011429502628743649, "global_step": 35168, "epoch": 295, "lr": 5.17299676722112e-05} +{"train_loss": 0.003070117672905326, "global_step": 35169, "epoch": 295, "lr": 5.172775348739217e-05} +{"train_loss": 0.0017417380586266518, "global_step": 35170, "epoch": 295, "lr": 5.172553929918087e-05} +{"train_loss": 0.002777633024379611, "global_step": 35171, "epoch": 295, "lr": 5.172332510758166e-05} +{"train_loss": 0.0034078520257025957, "global_step": 35172, "epoch": 295, "lr": 5.172111091259888e-05} +{"train_loss": 0.0044944146648049355, "global_step": 35173, "epoch": 295, "lr": 5.171889671423688e-05} +{"train_loss": 0.0026385050732642412, "global_step": 35174, "epoch": 295, "lr": 5.1716682512500026e-05} +{"train_loss": 0.002375097945332527, "global_step": 35175, "epoch": 295, "lr": 5.171446830739264e-05} +{"train_loss": 0.002159407828003168, "global_step": 35176, "epoch": 295, "lr": 5.1712254098919086e-05} +{"train_loss": 0.0024350930470973253, "global_step": 35177, "epoch": 295, "lr": 5.1710039887083705e-05} +{"train_loss": 0.0022327927872538567, "global_step": 35178, "epoch": 295, "lr": 5.170782567189083e-05} +{"train_loss": 0.0017396326875314116, "global_step": 35179, "epoch": 295, "lr": 5.1705611453344825e-05} +{"train_loss": 0.002661244012415409, "global_step": 35180, "epoch": 295, "lr": 5.1703397231450034e-05} +{"train_loss": 0.002314957557246089, "global_step": 35181, "epoch": 295, "lr": 5.1701183006210804e-05} +{"train_loss": 0.003185535315424204, "global_step": 35182, "epoch": 295, "lr": 5.169896877763149e-05} +{"train_loss": 0.002692353678867221, "global_step": 35183, "epoch": 295, "lr": 5.169675454571643e-05} +{"train_loss": 0.0015266772825270891, "global_step": 35184, "epoch": 295, "lr": 5.169454031046997e-05} +{"train_loss": 0.002297669416293502, "global_step": 35185, "epoch": 295, "lr": 5.169232607189646e-05} +{"train_loss": 0.001348835532553494, "global_step": 35186, "epoch": 295, "lr": 5.169011183000025e-05} +{"train_loss": 0.002345794579014182, "global_step": 35187, "epoch": 295, "lr": 5.1687897584785694e-05} +{"train_loss": 0.0024604841601103544, "global_step": 35188, "epoch": 295, "lr": 5.168568333625713e-05} +{"train_loss": 0.0032415720634162426, "global_step": 35189, "epoch": 295, "lr": 5.16834690844189e-05} +{"train_loss": 0.0029425243847072124, "global_step": 35190, "epoch": 295, "lr": 5.168125482927536e-05} +{"train_loss": 0.0028060670010745525, "global_step": 35191, "epoch": 295, "lr": 5.167904057083085e-05} +{"train_loss": 0.0017434126930311322, "global_step": 35192, "epoch": 295, "lr": 5.167682630908973e-05} +{"train_loss": 0.0028579006902873516, "global_step": 35193, "epoch": 295, "lr": 5.1674612044056346e-05} +{"train_loss": 0.004688338842242956, "global_step": 35194, "epoch": 295, "lr": 5.167239777573503e-05} +{"train_loss": 0.0024490440264344215, "global_step": 35195, "epoch": 295, "lr": 5.167018350413016e-05} +{"train_loss": 0.0013158029178157449, "global_step": 35196, "epoch": 295, "lr": 5.166796922924604e-05} +{"train_loss": 0.002068652305752039, "global_step": 35197, "epoch": 295, "lr": 5.1665754951087045e-05} +{"train_loss": 0.003477959893643856, "global_step": 35198, "epoch": 295, "lr": 5.166354066965752e-05} +{"train_loss": 0.0017151945503428578, "global_step": 35199, "epoch": 295, "lr": 5.166132638496181e-05} +{"train_loss": 0.0018645278178155422, "global_step": 35200, "epoch": 295, "lr": 5.165911209700425e-05} +{"train_loss": 0.0023908012080937624, "global_step": 35201, "epoch": 295, "lr": 5.165689780578923e-05} +{"train_loss": 0.0019168092403560877, "global_step": 35202, "epoch": 295, "lr": 5.165468351132105e-05} +{"train_loss": 0.00334200169891119, "global_step": 35203, "epoch": 295, "lr": 5.165246921360408e-05} +{"train_loss": 0.0029163684230297804, "global_step": 35204, "epoch": 295, "lr": 5.165025491264266e-05} +{"train_loss": 0.003301517805084586, "global_step": 35205, "epoch": 295, "lr": 5.164804060844114e-05} +{"train_loss": 0.0014456998324021697, "global_step": 35206, "epoch": 295, "lr": 5.1645826301003875e-05} +{"train_loss": 0.002064960775896907, "global_step": 35207, "epoch": 295, "lr": 5.1643611990335206e-05} +{"train_loss": 0.0031276443041861057, "global_step": 35208, "epoch": 295, "lr": 5.164139767643948e-05} +{"train_loss": 0.002089973771944642, "global_step": 35209, "epoch": 295, "lr": 5.1639183359321045e-05} +{"train_loss": 0.0020569271873682737, "global_step": 35210, "epoch": 295, "lr": 5.163696903898424e-05} +{"train_loss": 0.0017040559323504567, "global_step": 35211, "epoch": 295, "lr": 5.163475471543342e-05} +{"train_loss": 0.004741469398140907, "global_step": 35212, "epoch": 295, "lr": 5.163254038867295e-05} +{"train_loss": 0.002408812288194895, "global_step": 35213, "epoch": 295, "lr": 5.1630326058707146e-05} +{"train_loss": 0.002365828724578023, "global_step": 35214, "epoch": 295, "lr": 5.1628111725540374e-05} +{"train_loss": 0.0022533582523465157, "global_step": 35215, "epoch": 295, "lr": 5.162589738917698e-05} +{"train_loss": 0.0025749290362000465, "global_step": 35216, "epoch": 295, "lr": 5.162368304962131e-05} +{"train_loss": 0.0013087366241961718, "global_step": 35217, "epoch": 295, "lr": 5.1621468706877705e-05} +{"train_loss": 0.0032924271654337645, "global_step": 35218, "epoch": 295, "lr": 5.161925436095053e-05} +{"train_loss": 0.002750053070485592, "global_step": 35219, "epoch": 295, "lr": 5.161704001184412e-05} +{"train_loss": 0.003452954115346074, "global_step": 35220, "epoch": 295, "lr": 5.161482565956284e-05} +{"train_loss": 0.002469670958817005, "global_step": 35221, "epoch": 295, "lr": 5.1612611304111e-05} +{"train_loss": 0.0020197604317218065, "global_step": 35222, "epoch": 295, "lr": 5.161039694549298e-05} +{"train_loss": 0.0025018984031229584, "global_step": 35223, "epoch": 295, "lr": 5.160818258371311e-05, "val_loss": 0.02455991320312023, "train_action_mse_error": 4.639411417883821e-05} +{"train_loss": 0.0019025127403438091, "global_step": 35224, "epoch": 296, "lr": 5.160596821877575e-05} +{"train_loss": 0.0015279398066923022, "global_step": 35225, "epoch": 296, "lr": 5.1603753850685245e-05} +{"train_loss": 0.0033869228791445494, "global_step": 35226, "epoch": 296, "lr": 5.1601539479445934e-05} +{"train_loss": 0.002482945565134287, "global_step": 35227, "epoch": 296, "lr": 5.159932510506218e-05} +{"train_loss": 0.0022360109724104404, "global_step": 35228, "epoch": 296, "lr": 5.1597110727538325e-05} +{"train_loss": 0.0020171143114566803, "global_step": 35229, "epoch": 296, "lr": 5.159489634687869e-05} +{"train_loss": 0.0023924699053168297, "global_step": 35230, "epoch": 296, "lr": 5.1592681963087675e-05} +{"train_loss": 0.0019960501231253147, "global_step": 35231, "epoch": 296, "lr": 5.1590467576169575e-05} +{"train_loss": 0.0026346344966441393, "global_step": 35232, "epoch": 296, "lr": 5.1588253186128775e-05} +{"train_loss": 0.0021294557955116034, "global_step": 35233, "epoch": 296, "lr": 5.1586038792969614e-05} +{"train_loss": 0.003444218309596181, "global_step": 35234, "epoch": 296, "lr": 5.158382439669642e-05} +{"train_loss": 0.003201340092346072, "global_step": 35235, "epoch": 296, "lr": 5.158160999731357e-05} +{"train_loss": 0.002351670525968075, "global_step": 35236, "epoch": 296, "lr": 5.1579395594825386e-05} +{"train_loss": 0.002362340223044157, "global_step": 35237, "epoch": 296, "lr": 5.157718118923623e-05} +{"train_loss": 0.001640154398046434, "global_step": 35238, "epoch": 296, "lr": 5.157496678055047e-05} +{"train_loss": 0.0027872463688254356, "global_step": 35239, "epoch": 296, "lr": 5.157275236877241e-05} +{"train_loss": 0.0017089530592784286, "global_step": 35240, "epoch": 296, "lr": 5.157053795390642e-05} +{"train_loss": 0.001153022050857544, "global_step": 35241, "epoch": 296, "lr": 5.1568323535956853e-05} +{"train_loss": 0.0020275525748729706, "global_step": 35242, "epoch": 296, "lr": 5.156610911492804e-05} +{"train_loss": 0.0021460314746946096, "global_step": 35243, "epoch": 296, "lr": 5.1563894690824344e-05} +{"train_loss": 0.0018740949453786016, "global_step": 35244, "epoch": 296, "lr": 5.15616802636501e-05} +{"train_loss": 0.0012375008082017303, "global_step": 35245, "epoch": 296, "lr": 5.1559465833409694e-05} +{"train_loss": 0.0024120458401739597, "global_step": 35246, "epoch": 296, "lr": 5.155725140010742e-05} +{"train_loss": 0.00159563182387501, "global_step": 35247, "epoch": 296, "lr": 5.155503696374765e-05} +{"train_loss": 0.001960095949470997, "global_step": 35248, "epoch": 296, "lr": 5.155282252433472e-05} +{"train_loss": 0.002547129523009062, "global_step": 35249, "epoch": 296, "lr": 5.1550608081872994e-05} +{"train_loss": 0.0012073256075382233, "global_step": 35250, "epoch": 296, "lr": 5.1548393636366824e-05} +{"train_loss": 0.0012652641162276268, "global_step": 35251, "epoch": 296, "lr": 5.154617918782055e-05} +{"train_loss": 0.003449699841439724, "global_step": 35252, "epoch": 296, "lr": 5.154396473623851e-05} +{"train_loss": 0.0019981765653938055, "global_step": 35253, "epoch": 296, "lr": 5.154175028162507e-05} +{"train_loss": 0.0013092149747535586, "global_step": 35254, "epoch": 296, "lr": 5.153953582398456e-05} +{"train_loss": 0.0025438040029257536, "global_step": 35255, "epoch": 296, "lr": 5.1537321363321335e-05} +{"train_loss": 0.0017195900436490774, "global_step": 35256, "epoch": 296, "lr": 5.153510689963975e-05} +{"train_loss": 0.0016379423905164003, "global_step": 35257, "epoch": 296, "lr": 5.153289243294415e-05} +{"train_loss": 0.002828742377460003, "global_step": 35258, "epoch": 296, "lr": 5.153067796323887e-05} +{"train_loss": 0.003245963715016842, "global_step": 35259, "epoch": 296, "lr": 5.1528463490528264e-05} +{"train_loss": 0.0012617572210729122, "global_step": 35260, "epoch": 296, "lr": 5.1526249014816695e-05} +{"train_loss": 0.00265022786334157, "global_step": 35261, "epoch": 296, "lr": 5.152403453610849e-05} +{"train_loss": 0.0014495900832116604, "global_step": 35262, "epoch": 296, "lr": 5.152182005440801e-05} +{"train_loss": 0.0014847255079075694, "global_step": 35263, "epoch": 296, "lr": 5.15196055697196e-05} +{"train_loss": 0.00253197830170393, "global_step": 35264, "epoch": 296, "lr": 5.151739108204761e-05} +{"train_loss": 0.0026950067840516567, "global_step": 35265, "epoch": 296, "lr": 5.1515176591396376e-05} +{"train_loss": 0.0012177990283817053, "global_step": 35266, "epoch": 296, "lr": 5.151296209777026e-05} +{"train_loss": 0.0026429477147758007, "global_step": 35267, "epoch": 296, "lr": 5.15107476011736e-05} +{"train_loss": 0.002437584800645709, "global_step": 35268, "epoch": 296, "lr": 5.150853310161074e-05} +{"train_loss": 0.004249860532581806, "global_step": 35269, "epoch": 296, "lr": 5.1506318599086056e-05} +{"train_loss": 0.002068668371066451, "global_step": 35270, "epoch": 296, "lr": 5.150410409360388e-05} +{"train_loss": 0.002067240886390209, "global_step": 35271, "epoch": 296, "lr": 5.1501889585168536e-05} +{"train_loss": 0.0021180305629968643, "global_step": 35272, "epoch": 296, "lr": 5.1499675073784406e-05} +{"train_loss": 0.0023350187111645937, "global_step": 35273, "epoch": 296, "lr": 5.1497460559455826e-05} +{"train_loss": 0.0031453121919184923, "global_step": 35274, "epoch": 296, "lr": 5.149524604218713e-05} +{"train_loss": 0.0013750592479482293, "global_step": 35275, "epoch": 296, "lr": 5.149303152198268e-05} +{"train_loss": 0.0022302258294075727, "global_step": 35276, "epoch": 296, "lr": 5.1490816998846834e-05} +{"train_loss": 0.0025631594471633434, "global_step": 35277, "epoch": 296, "lr": 5.148860247278392e-05} +{"train_loss": 0.0032592667266726494, "global_step": 35278, "epoch": 296, "lr": 5.1486387943798296e-05} +{"train_loss": 0.0034408648498356342, "global_step": 35279, "epoch": 296, "lr": 5.14841734118943e-05} +{"train_loss": 0.0016902899369597435, "global_step": 35280, "epoch": 296, "lr": 5.1481958877076296e-05} +{"train_loss": 0.0034779312554746866, "global_step": 35281, "epoch": 296, "lr": 5.147974433934862e-05} +{"train_loss": 0.0025384228210896254, "global_step": 35282, "epoch": 296, "lr": 5.147752979871563e-05} +{"train_loss": 0.0033397276420146227, "global_step": 35283, "epoch": 296, "lr": 5.147531525518166e-05} +{"train_loss": 0.003163203364238143, "global_step": 35284, "epoch": 296, "lr": 5.1473100708751065e-05} +{"train_loss": 0.0027049260679632425, "global_step": 35285, "epoch": 296, "lr": 5.14708861594282e-05} +{"train_loss": 0.001245636842213571, "global_step": 35286, "epoch": 296, "lr": 5.146867160721741e-05} +{"train_loss": 0.0030713018495589495, "global_step": 35287, "epoch": 296, "lr": 5.146645705212303e-05} +{"train_loss": 0.003553622169420123, "global_step": 35288, "epoch": 296, "lr": 5.146424249414944e-05} +{"train_loss": 0.0020283726043999195, "global_step": 35289, "epoch": 296, "lr": 5.146202793330095e-05} +{"train_loss": 0.0018921134760603309, "global_step": 35290, "epoch": 296, "lr": 5.145981336958192e-05} +{"train_loss": 0.0023589604534208775, "global_step": 35291, "epoch": 296, "lr": 5.145759880299671e-05} +{"train_loss": 0.002011653734371066, "global_step": 35292, "epoch": 296, "lr": 5.1455384233549655e-05} +{"train_loss": 0.001881724689155817, "global_step": 35293, "epoch": 296, "lr": 5.145316966124511e-05} +{"train_loss": 0.0044386498630046844, "global_step": 35294, "epoch": 296, "lr": 5.1450955086087424e-05} +{"train_loss": 0.0016081928042694926, "global_step": 35295, "epoch": 296, "lr": 5.1448740508080954e-05} +{"train_loss": 0.001426540082320571, "global_step": 35296, "epoch": 296, "lr": 5.1446525927230025e-05} +{"train_loss": 0.002701342571526766, "global_step": 35297, "epoch": 296, "lr": 5.144431134353899e-05} +{"train_loss": 0.0023943623527884483, "global_step": 35298, "epoch": 296, "lr": 5.1442096757012206e-05} +{"train_loss": 0.002960256766527891, "global_step": 35299, "epoch": 296, "lr": 5.143988216765402e-05} +{"train_loss": 0.0024342755787074566, "global_step": 35300, "epoch": 296, "lr": 5.1437667575468784e-05} +{"train_loss": 0.002158315386623144, "global_step": 35301, "epoch": 296, "lr": 5.143545298046085e-05} +{"train_loss": 0.002740514697507024, "global_step": 35302, "epoch": 296, "lr": 5.1433238382634555e-05} +{"train_loss": 0.002646933775395155, "global_step": 35303, "epoch": 296, "lr": 5.143102378199424e-05} +{"train_loss": 0.002721501048654318, "global_step": 35304, "epoch": 296, "lr": 5.1428809178544255e-05} +{"train_loss": 0.0024644089862704277, "global_step": 35305, "epoch": 296, "lr": 5.1426594572288965e-05} +{"train_loss": 0.0034576798789203167, "global_step": 35306, "epoch": 296, "lr": 5.142437996323272e-05} +{"train_loss": 0.0015351783949881792, "global_step": 35307, "epoch": 296, "lr": 5.142216535137985e-05} +{"train_loss": 0.0029164934530854225, "global_step": 35308, "epoch": 296, "lr": 5.141995073673471e-05} +{"train_loss": 0.0015782297123223543, "global_step": 35309, "epoch": 296, "lr": 5.141773611930164e-05} +{"train_loss": 0.001902932533994317, "global_step": 35310, "epoch": 296, "lr": 5.1415521499085006e-05} +{"train_loss": 0.005286470986902714, "global_step": 35311, "epoch": 296, "lr": 5.141330687608914e-05} +{"train_loss": 0.002572861034423113, "global_step": 35312, "epoch": 296, "lr": 5.141109225031841e-05} +{"train_loss": 0.0013429163955152035, "global_step": 35313, "epoch": 296, "lr": 5.140887762177713e-05} +{"train_loss": 0.002275412902235985, "global_step": 35314, "epoch": 296, "lr": 5.1406662990469676e-05} +{"train_loss": 0.0018267289269715548, "global_step": 35315, "epoch": 296, "lr": 5.1404448356400405e-05} +{"train_loss": 0.003048770362511277, "global_step": 35316, "epoch": 296, "lr": 5.1402233719573636e-05} +{"train_loss": 0.0027500547003000975, "global_step": 35317, "epoch": 296, "lr": 5.140001907999373e-05} +{"train_loss": 0.002792603336274624, "global_step": 35318, "epoch": 296, "lr": 5.139780443766504e-05} +{"train_loss": 0.0032669466454535723, "global_step": 35319, "epoch": 296, "lr": 5.13955897925919e-05} +{"train_loss": 0.002603589091449976, "global_step": 35320, "epoch": 296, "lr": 5.13933751447787e-05} +{"train_loss": 0.0036745339166373014, "global_step": 35321, "epoch": 296, "lr": 5.1391160494229726e-05} +{"train_loss": 0.0024918015114963055, "global_step": 35322, "epoch": 296, "lr": 5.138894584094936e-05} +{"train_loss": 0.00297888764180243, "global_step": 35323, "epoch": 296, "lr": 5.138673118494196e-05} +{"train_loss": 0.002832868369296193, "global_step": 35324, "epoch": 296, "lr": 5.138451652621186e-05} +{"train_loss": 0.0017871764721348882, "global_step": 35325, "epoch": 296, "lr": 5.138230186476341e-05} +{"train_loss": 0.0027009553741663694, "global_step": 35326, "epoch": 296, "lr": 5.138008720060096e-05} +{"train_loss": 0.0015263870591297746, "global_step": 35327, "epoch": 296, "lr": 5.137787253372884e-05} +{"train_loss": 0.002299371873959899, "global_step": 35328, "epoch": 296, "lr": 5.137565786415143e-05} +{"train_loss": 0.002082881983369589, "global_step": 35329, "epoch": 296, "lr": 5.137344319187305e-05} +{"train_loss": 0.0015687418635934591, "global_step": 35330, "epoch": 296, "lr": 5.1371228516898065e-05} +{"train_loss": 0.0035682718735188246, "global_step": 35331, "epoch": 296, "lr": 5.1369013839230816e-05} +{"train_loss": 0.0024494321551173925, "global_step": 35332, "epoch": 296, "lr": 5.136679915887567e-05} +{"train_loss": 0.00200364226475358, "global_step": 35333, "epoch": 296, "lr": 5.136458447583694e-05} +{"train_loss": 0.0040064300410449505, "global_step": 35334, "epoch": 296, "lr": 5.1362369790119004e-05} +{"train_loss": 0.002909422153607011, "global_step": 35335, "epoch": 296, "lr": 5.1360155101726204e-05} +{"train_loss": 0.002410659333691001, "global_step": 35336, "epoch": 296, "lr": 5.1357940410662885e-05} +{"train_loss": 0.0022989576682448387, "global_step": 35337, "epoch": 296, "lr": 5.135572571693339e-05} +{"train_loss": 0.003631941508501768, "global_step": 35338, "epoch": 296, "lr": 5.1353511020542066e-05} +{"train_loss": 0.0011693652486428618, "global_step": 35339, "epoch": 296, "lr": 5.135129632149329e-05} +{"train_loss": 0.002695351140573621, "global_step": 35340, "epoch": 296, "lr": 5.1349081619791376e-05} +{"train_loss": 0.0030345390550792217, "global_step": 35341, "epoch": 296, "lr": 5.134686691544067e-05} +{"train_loss": 0.0024096308962809816, "global_step": 35342, "epoch": 296, "lr": 5.134465220844556e-05, "val_loss": 0.017127666622400284} +{"train_loss": 0.0021841078996658325, "global_step": 35343, "epoch": 297, "lr": 5.134243749881035e-05} +{"train_loss": 0.0025447465013712645, "global_step": 35344, "epoch": 297, "lr": 5.1340222786539406e-05} +{"train_loss": 0.00411522900685668, "global_step": 35345, "epoch": 297, "lr": 5.13380080716371e-05} +{"train_loss": 0.003252069465816021, "global_step": 35346, "epoch": 297, "lr": 5.133579335410773e-05} +{"train_loss": 0.002803435316309333, "global_step": 35347, "epoch": 297, "lr": 5.133357863395568e-05} +{"train_loss": 0.002774846041575074, "global_step": 35348, "epoch": 297, "lr": 5.1331363911185305e-05} +{"train_loss": 0.002971749985590577, "global_step": 35349, "epoch": 297, "lr": 5.132914918580093e-05} +{"train_loss": 0.003231433220207691, "global_step": 35350, "epoch": 297, "lr": 5.1326934457806906e-05} +{"train_loss": 0.003348174737766385, "global_step": 35351, "epoch": 297, "lr": 5.1324719727207606e-05} +{"train_loss": 0.0020405477844178677, "global_step": 35352, "epoch": 297, "lr": 5.1322504994007346e-05} +{"train_loss": 0.002093793358653784, "global_step": 35353, "epoch": 297, "lr": 5.132029025821049e-05} +{"train_loss": 0.0022217142395675182, "global_step": 35354, "epoch": 297, "lr": 5.1318075519821386e-05} +{"train_loss": 0.0017123566940426826, "global_step": 35355, "epoch": 297, "lr": 5.131586077884438e-05} +{"train_loss": 0.002344164066016674, "global_step": 35356, "epoch": 297, "lr": 5.1313646035283823e-05} +{"train_loss": 0.0018680111970752478, "global_step": 35357, "epoch": 297, "lr": 5.1311431289144085e-05} +{"train_loss": 0.002765111858025193, "global_step": 35358, "epoch": 297, "lr": 5.130921654042946e-05} +{"train_loss": 0.001968889031559229, "global_step": 35359, "epoch": 297, "lr": 5.130700178914435e-05} +{"train_loss": 0.0021504031028598547, "global_step": 35360, "epoch": 297, "lr": 5.1304787035293066e-05} +{"train_loss": 0.0019234451465308666, "global_step": 35361, "epoch": 297, "lr": 5.130257227887997e-05} +{"train_loss": 0.0022175954654812813, "global_step": 35362, "epoch": 297, "lr": 5.130035751990942e-05} +{"train_loss": 0.0023801110219210386, "global_step": 35363, "epoch": 297, "lr": 5.1298142758385756e-05} +{"train_loss": 0.0010822162730619311, "global_step": 35364, "epoch": 297, "lr": 5.1295927994313334e-05} +{"train_loss": 0.002210126258432865, "global_step": 35365, "epoch": 297, "lr": 5.1293713227696485e-05} +{"train_loss": 0.0019678580574691296, "global_step": 35366, "epoch": 297, "lr": 5.129149845853957e-05} +{"train_loss": 0.0036151097156107426, "global_step": 35367, "epoch": 297, "lr": 5.128928368684693e-05} +{"train_loss": 0.0023105540312826633, "global_step": 35368, "epoch": 297, "lr": 5.1287068912622935e-05} +{"train_loss": 0.002370092086493969, "global_step": 35369, "epoch": 297, "lr": 5.1284854135871906e-05} +{"train_loss": 0.0017164885066449642, "global_step": 35370, "epoch": 297, "lr": 5.128263935659822e-05} +{"train_loss": 0.0016533688176423311, "global_step": 35371, "epoch": 297, "lr": 5.12804245748062e-05} +{"train_loss": 0.0017902968684211373, "global_step": 35372, "epoch": 297, "lr": 5.1278209790500184e-05} +{"train_loss": 0.002291829790920019, "global_step": 35373, "epoch": 297, "lr": 5.127599500368456e-05} +{"train_loss": 0.004213366191834211, "global_step": 35374, "epoch": 297, "lr": 5.127378021436365e-05} +{"train_loss": 0.0020305037032812834, "global_step": 35375, "epoch": 297, "lr": 5.127156542254181e-05} +{"train_loss": 0.0016189224552363157, "global_step": 35376, "epoch": 297, "lr": 5.12693506282234e-05} +{"train_loss": 0.0020774127915501595, "global_step": 35377, "epoch": 297, "lr": 5.1267135831412736e-05} +{"train_loss": 0.0009798671817407012, "global_step": 35378, "epoch": 297, "lr": 5.12649210321142e-05} +{"train_loss": 0.0030108292121440172, "global_step": 35379, "epoch": 297, "lr": 5.1262706230332114e-05} +{"train_loss": 0.0022929466795176268, "global_step": 35380, "epoch": 297, "lr": 5.1260491426070844e-05} +{"train_loss": 0.002523507922887802, "global_step": 35381, "epoch": 297, "lr": 5.125827661933472e-05} +{"train_loss": 0.0021729813888669014, "global_step": 35382, "epoch": 297, "lr": 5.1256061810128134e-05} +{"train_loss": 0.0019961760845035315, "global_step": 35383, "epoch": 297, "lr": 5.125384699845538e-05} +{"train_loss": 0.0021984572522342205, "global_step": 35384, "epoch": 297, "lr": 5.1251632184320844e-05} +{"train_loss": 0.001915360800921917, "global_step": 35385, "epoch": 297, "lr": 5.1249417367728855e-05} +{"train_loss": 0.003993837162852287, "global_step": 35386, "epoch": 297, "lr": 5.124720254868377e-05} +{"train_loss": 0.0018884819000959396, "global_step": 35387, "epoch": 297, "lr": 5.124498772718994e-05} +{"train_loss": 0.0020749212708324194, "global_step": 35388, "epoch": 297, "lr": 5.124277290325171e-05} +{"train_loss": 0.002270181430503726, "global_step": 35389, "epoch": 297, "lr": 5.1240558076873434e-05} +{"train_loss": 0.0014113617362454534, "global_step": 35390, "epoch": 297, "lr": 5.123834324805945e-05} +{"train_loss": 0.0022636577486991882, "global_step": 35391, "epoch": 297, "lr": 5.12361284168141e-05} +{"train_loss": 0.003524257568642497, "global_step": 35392, "epoch": 297, "lr": 5.123391358314176e-05} +{"train_loss": 0.002457638271152973, "global_step": 35393, "epoch": 297, "lr": 5.123169874704675e-05} +{"train_loss": 0.002004481852054596, "global_step": 35394, "epoch": 297, "lr": 5.1229483908533436e-05} +{"train_loss": 0.002408628584817052, "global_step": 35395, "epoch": 297, "lr": 5.122726906760616e-05} +{"train_loss": 0.001383829629048705, "global_step": 35396, "epoch": 297, "lr": 5.1225054224269265e-05} +{"train_loss": 0.0037638572975993156, "global_step": 35397, "epoch": 297, "lr": 5.122283937852712e-05} +{"train_loss": 0.002697699936106801, "global_step": 35398, "epoch": 297, "lr": 5.1220624530384054e-05} +{"train_loss": 0.002318731276318431, "global_step": 35399, "epoch": 297, "lr": 5.121840967984443e-05} +{"train_loss": 0.0027011570055037737, "global_step": 35400, "epoch": 297, "lr": 5.121619482691258e-05} +{"train_loss": 0.002970194211229682, "global_step": 35401, "epoch": 297, "lr": 5.121397997159287e-05} +{"train_loss": 0.004480366595089436, "global_step": 35402, "epoch": 297, "lr": 5.121176511388963e-05} +{"train_loss": 0.0026894425973296165, "global_step": 35403, "epoch": 297, "lr": 5.1209550253807224e-05} +{"train_loss": 0.0018440823769196868, "global_step": 35404, "epoch": 297, "lr": 5.120733539135e-05} +{"train_loss": 0.0019970231223851442, "global_step": 35405, "epoch": 297, "lr": 5.120512052652229e-05} +{"train_loss": 0.0021200852934271097, "global_step": 35406, "epoch": 297, "lr": 5.120290565932846e-05} +{"train_loss": 0.003001820994541049, "global_step": 35407, "epoch": 297, "lr": 5.1200690789772854e-05} +{"train_loss": 0.0015015446115285158, "global_step": 35408, "epoch": 297, "lr": 5.1198475917859836e-05} +{"train_loss": 0.002204285003244877, "global_step": 35409, "epoch": 297, "lr": 5.119626104359372e-05} +{"train_loss": 0.0022057187743484974, "global_step": 35410, "epoch": 297, "lr": 5.119404616697887e-05} +{"train_loss": 0.0015605514636263251, "global_step": 35411, "epoch": 297, "lr": 5.119183128801964e-05} +{"train_loss": 0.0027846985030919313, "global_step": 35412, "epoch": 297, "lr": 5.1189616406720385e-05} +{"train_loss": 0.0027809208258986473, "global_step": 35413, "epoch": 297, "lr": 5.1187401523085434e-05} +{"train_loss": 0.002626581583172083, "global_step": 35414, "epoch": 297, "lr": 5.1185186637119156e-05} +{"train_loss": 0.0036043457221239805, "global_step": 35415, "epoch": 297, "lr": 5.118297174882589e-05} +{"train_loss": 0.002740585943683982, "global_step": 35416, "epoch": 297, "lr": 5.1180756858209977e-05} +{"train_loss": 0.0023084967397153378, "global_step": 35417, "epoch": 297, "lr": 5.117854196527578e-05} +{"train_loss": 0.0019438373856246471, "global_step": 35418, "epoch": 297, "lr": 5.117632707002764e-05} +{"train_loss": 0.004805652424693108, "global_step": 35419, "epoch": 297, "lr": 5.117411217246991e-05} +{"train_loss": 0.003196043660864234, "global_step": 35420, "epoch": 297, "lr": 5.117189727260695e-05} +{"train_loss": 0.0017545167356729507, "global_step": 35421, "epoch": 297, "lr": 5.1169682370443086e-05} +{"train_loss": 0.001496726181358099, "global_step": 35422, "epoch": 297, "lr": 5.1167467465982664e-05} +{"train_loss": 0.0033418885432183743, "global_step": 35423, "epoch": 297, "lr": 5.116525255923005e-05} +{"train_loss": 0.001310862717218697, "global_step": 35424, "epoch": 297, "lr": 5.1163037650189584e-05} +{"train_loss": 0.0011951660271734, "global_step": 35425, "epoch": 297, "lr": 5.116082273886562e-05} +{"train_loss": 0.0016453351126983762, "global_step": 35426, "epoch": 297, "lr": 5.1158607825262514e-05} +{"train_loss": 0.004200746305286884, "global_step": 35427, "epoch": 297, "lr": 5.1156392909384596e-05} +{"train_loss": 0.003544182749465108, "global_step": 35428, "epoch": 297, "lr": 5.115417799123623e-05} +{"train_loss": 0.001875363988801837, "global_step": 35429, "epoch": 297, "lr": 5.115196307082175e-05} +{"train_loss": 0.002112068235874176, "global_step": 35430, "epoch": 297, "lr": 5.114974814814551e-05} +{"train_loss": 0.0019224273273721337, "global_step": 35431, "epoch": 297, "lr": 5.114753322321187e-05} +{"train_loss": 0.002014191821217537, "global_step": 35432, "epoch": 297, "lr": 5.114531829602517e-05} +{"train_loss": 0.002941144397482276, "global_step": 35433, "epoch": 297, "lr": 5.114310336658977e-05} +{"train_loss": 0.0026557014789432287, "global_step": 35434, "epoch": 297, "lr": 5.1140888434910006e-05} +{"train_loss": 0.0031444106716662645, "global_step": 35435, "epoch": 297, "lr": 5.113867350099022e-05} +{"train_loss": 0.0017904180567711592, "global_step": 35436, "epoch": 297, "lr": 5.1136458564834765e-05} +{"train_loss": 0.0047877817414700985, "global_step": 35437, "epoch": 297, "lr": 5.113424362644801e-05} +{"train_loss": 0.0018296331400051713, "global_step": 35438, "epoch": 297, "lr": 5.113202868583428e-05} +{"train_loss": 0.0013988750288262963, "global_step": 35439, "epoch": 297, "lr": 5.1129813742997943e-05} +{"train_loss": 0.0015773597406223416, "global_step": 35440, "epoch": 297, "lr": 5.112759879794333e-05} +{"train_loss": 0.00289649935439229, "global_step": 35441, "epoch": 297, "lr": 5.11253838506748e-05} +{"train_loss": 0.0032693909015506506, "global_step": 35442, "epoch": 297, "lr": 5.11231689011967e-05} +{"train_loss": 0.0017108058091253042, "global_step": 35443, "epoch": 297, "lr": 5.112095394951336e-05} +{"train_loss": 0.0012337504886090755, "global_step": 35444, "epoch": 297, "lr": 5.111873899562917e-05} +{"train_loss": 0.0015638696495443583, "global_step": 35445, "epoch": 297, "lr": 5.111652403954844e-05} +{"train_loss": 0.0025638833176344633, "global_step": 35446, "epoch": 297, "lr": 5.111430908127553e-05} +{"train_loss": 0.002635036129504442, "global_step": 35447, "epoch": 297, "lr": 5.1112094120814815e-05} +{"train_loss": 0.0018820606637746096, "global_step": 35448, "epoch": 297, "lr": 5.11098791581706e-05} +{"train_loss": 0.0019376177806407213, "global_step": 35449, "epoch": 297, "lr": 5.110766419334727e-05} +{"train_loss": 0.003096997970715165, "global_step": 35450, "epoch": 297, "lr": 5.110544922634915e-05} +{"train_loss": 0.0023806686513125896, "global_step": 35451, "epoch": 297, "lr": 5.110323425718062e-05} +{"train_loss": 0.0019723670557141304, "global_step": 35452, "epoch": 297, "lr": 5.1101019285845996e-05} +{"train_loss": 0.002009875373914838, "global_step": 35453, "epoch": 297, "lr": 5.109880431234964e-05} +{"train_loss": 0.0026111083570867777, "global_step": 35454, "epoch": 297, "lr": 5.1096589336695886e-05} +{"train_loss": 0.0029711334500461817, "global_step": 35455, "epoch": 297, "lr": 5.10943743588891e-05} +{"train_loss": 0.0025906087830662727, "global_step": 35456, "epoch": 297, "lr": 5.1092159378933626e-05} +{"train_loss": 0.002852168632671237, "global_step": 35457, "epoch": 297, "lr": 5.1089944396833825e-05} +{"train_loss": 0.0013940047938376665, "global_step": 35458, "epoch": 297, "lr": 5.108772941259403e-05} +{"train_loss": 0.002462560310959816, "global_step": 35459, "epoch": 297, "lr": 5.108551442621859e-05} +{"train_loss": 0.0024835714139044285, "global_step": 35460, "epoch": 297, "lr": 5.108329943771186e-05} +{"train_loss": 0.002406632498360607, "global_step": 35461, "epoch": 297, "lr": 5.108108444707819e-05, "val_loss": 0.011655006557703018} +{"train_loss": 0.0013358664000406861, "global_step": 35462, "epoch": 298, "lr": 5.107886945432192e-05} +{"train_loss": 0.0014890169259160757, "global_step": 35463, "epoch": 298, "lr": 5.1076654459447414e-05} +{"train_loss": 0.0025195458438247442, "global_step": 35464, "epoch": 298, "lr": 5.1074439462459e-05} +{"train_loss": 0.0015251539880409837, "global_step": 35465, "epoch": 298, "lr": 5.1072224463361054e-05} +{"train_loss": 0.0012994760181754827, "global_step": 35466, "epoch": 298, "lr": 5.1070009462157895e-05} +{"train_loss": 0.003138936823233962, "global_step": 35467, "epoch": 298, "lr": 5.106779445885389e-05} +{"train_loss": 0.004068294074386358, "global_step": 35468, "epoch": 298, "lr": 5.106557945345339e-05} +{"train_loss": 0.0009160802001133561, "global_step": 35469, "epoch": 298, "lr": 5.106336444596074e-05} +{"train_loss": 0.0031088136602193117, "global_step": 35470, "epoch": 298, "lr": 5.1061149436380294e-05} +{"train_loss": 0.002770465798676014, "global_step": 35471, "epoch": 298, "lr": 5.1058934424716373e-05} +{"train_loss": 0.004014735110104084, "global_step": 35472, "epoch": 298, "lr": 5.1056719410973366e-05} +{"train_loss": 0.002111826092004776, "global_step": 35473, "epoch": 298, "lr": 5.105450439515559e-05} +{"train_loss": 0.0020512198098003864, "global_step": 35474, "epoch": 298, "lr": 5.105228937726741e-05} +{"train_loss": 0.003936518914997578, "global_step": 35475, "epoch": 298, "lr": 5.105007435731318e-05} +{"train_loss": 0.003419573651626706, "global_step": 35476, "epoch": 298, "lr": 5.104785933529726e-05} +{"train_loss": 0.002757276874035597, "global_step": 35477, "epoch": 298, "lr": 5.104564431122395e-05} +{"train_loss": 0.002359697362408042, "global_step": 35478, "epoch": 298, "lr": 5.1043429285097635e-05} +{"train_loss": 0.0021369163878262043, "global_step": 35479, "epoch": 298, "lr": 5.1041214256922644e-05} +{"train_loss": 0.0030613052658736706, "global_step": 35480, "epoch": 298, "lr": 5.1038999226703355e-05} +{"train_loss": 0.0028003056067973375, "global_step": 35481, "epoch": 298, "lr": 5.10367841944441e-05} +{"train_loss": 0.0018838607938960195, "global_step": 35482, "epoch": 298, "lr": 5.103456916014924e-05} +{"train_loss": 0.0036431208718568087, "global_step": 35483, "epoch": 298, "lr": 5.103235412382311e-05} +{"train_loss": 0.002720457734540105, "global_step": 35484, "epoch": 298, "lr": 5.1030139085470054e-05} +{"train_loss": 0.002419303171336651, "global_step": 35485, "epoch": 298, "lr": 5.1027924045094434e-05} +{"train_loss": 0.0018729879520833492, "global_step": 35486, "epoch": 298, "lr": 5.102570900270059e-05} +{"train_loss": 0.002974804025143385, "global_step": 35487, "epoch": 298, "lr": 5.102349395829289e-05} +{"train_loss": 0.001793085946701467, "global_step": 35488, "epoch": 298, "lr": 5.1021278911875656e-05} +{"train_loss": 0.0023652203381061554, "global_step": 35489, "epoch": 298, "lr": 5.101906386345328e-05} +{"train_loss": 0.0020086835138499737, "global_step": 35490, "epoch": 298, "lr": 5.101684881303005e-05} +{"train_loss": 0.0018273472087457776, "global_step": 35491, "epoch": 298, "lr": 5.101463376061034e-05} +{"train_loss": 0.0015874671516939998, "global_step": 35492, "epoch": 298, "lr": 5.101241870619853e-05} +{"train_loss": 0.003607640042901039, "global_step": 35493, "epoch": 298, "lr": 5.101020364979893e-05} +{"train_loss": 0.002840283792465925, "global_step": 35494, "epoch": 298, "lr": 5.10079885914159e-05} +{"train_loss": 0.002079999540001154, "global_step": 35495, "epoch": 298, "lr": 5.100577353105379e-05} +{"train_loss": 0.0029643247835338116, "global_step": 35496, "epoch": 298, "lr": 5.100355846871696e-05} +{"train_loss": 0.003236620919778943, "global_step": 35497, "epoch": 298, "lr": 5.100134340440974e-05} +{"train_loss": 0.0018459407147020102, "global_step": 35498, "epoch": 298, "lr": 5.09991283381365e-05} +{"train_loss": 0.0019488385878503323, "global_step": 35499, "epoch": 298, "lr": 5.099691326990158e-05} +{"train_loss": 0.0022893277928233147, "global_step": 35500, "epoch": 298, "lr": 5.099469819970931e-05} +{"train_loss": 0.0021483309101313353, "global_step": 35501, "epoch": 298, "lr": 5.0992483127564074e-05} +{"train_loss": 0.0039846100844442844, "global_step": 35502, "epoch": 298, "lr": 5.099026805347021e-05} +{"train_loss": 0.0026317837182432413, "global_step": 35503, "epoch": 298, "lr": 5.0988052977432046e-05} +{"train_loss": 0.0016606706194579601, "global_step": 35504, "epoch": 298, "lr": 5.098583789945395e-05} +{"train_loss": 0.0016767410561442375, "global_step": 35505, "epoch": 298, "lr": 5.098362281954027e-05} +{"train_loss": 0.0014363557565957308, "global_step": 35506, "epoch": 298, "lr": 5.0981407737695344e-05} +{"train_loss": 0.002566433511674404, "global_step": 35507, "epoch": 298, "lr": 5.097919265392352e-05} +{"train_loss": 0.0031469136010855436, "global_step": 35508, "epoch": 298, "lr": 5.097697756822918e-05} +{"train_loss": 0.0013454451691359282, "global_step": 35509, "epoch": 298, "lr": 5.097476248061663e-05} +{"train_loss": 0.0027989791706204414, "global_step": 35510, "epoch": 298, "lr": 5.097254739109025e-05} +{"train_loss": 0.0018711333395913243, "global_step": 35511, "epoch": 298, "lr": 5.097033229965437e-05} +{"train_loss": 0.0038674543611705303, "global_step": 35512, "epoch": 298, "lr": 5.096811720631335e-05} +{"train_loss": 0.001725405571050942, "global_step": 35513, "epoch": 298, "lr": 5.096590211107153e-05} +{"train_loss": 0.001554820453748107, "global_step": 35514, "epoch": 298, "lr": 5.096368701393326e-05} +{"train_loss": 0.0043273745104670525, "global_step": 35515, "epoch": 298, "lr": 5.09614719149029e-05} +{"train_loss": 0.003004259429872036, "global_step": 35516, "epoch": 298, "lr": 5.095925681398479e-05} +{"train_loss": 0.0026426634285598993, "global_step": 35517, "epoch": 298, "lr": 5.095704171118328e-05} +{"train_loss": 0.0035979377571493387, "global_step": 35518, "epoch": 298, "lr": 5.0954826606502736e-05} +{"train_loss": 0.003425409086048603, "global_step": 35519, "epoch": 298, "lr": 5.0952611499947476e-05} +{"train_loss": 0.0036256362218409777, "global_step": 35520, "epoch": 298, "lr": 5.095039639152188e-05} +{"train_loss": 0.002820908557623625, "global_step": 35521, "epoch": 298, "lr": 5.0948181281230276e-05} +{"train_loss": 0.004132436588406563, "global_step": 35522, "epoch": 298, "lr": 5.094596616907702e-05} +{"train_loss": 0.0030876125674694777, "global_step": 35523, "epoch": 298, "lr": 5.094375105506645e-05} +{"train_loss": 0.003165149362757802, "global_step": 35524, "epoch": 298, "lr": 5.0941535939202935e-05} +{"train_loss": 0.0024181611370295286, "global_step": 35525, "epoch": 298, "lr": 5.093932082149081e-05} +{"train_loss": 0.0018331544706597924, "global_step": 35526, "epoch": 298, "lr": 5.0937105701934426e-05} +{"train_loss": 0.0049783410504460335, "global_step": 35527, "epoch": 298, "lr": 5.093489058053814e-05} +{"train_loss": 0.002828138181939721, "global_step": 35528, "epoch": 298, "lr": 5.09326754573063e-05} +{"train_loss": 0.003576446557417512, "global_step": 35529, "epoch": 298, "lr": 5.0930460332243246e-05} +{"train_loss": 0.003721937770023942, "global_step": 35530, "epoch": 298, "lr": 5.0928245205353334e-05} +{"train_loss": 0.004116498865187168, "global_step": 35531, "epoch": 298, "lr": 5.0926030076640905e-05} +{"train_loss": 0.002394973300397396, "global_step": 35532, "epoch": 298, "lr": 5.0923814946110324e-05} +{"train_loss": 0.003276183269917965, "global_step": 35533, "epoch": 298, "lr": 5.092159981376594e-05} +{"train_loss": 0.0019280195701867342, "global_step": 35534, "epoch": 298, "lr": 5.091938467961208e-05} +{"train_loss": 0.002352144569158554, "global_step": 35535, "epoch": 298, "lr": 5.091716954365311e-05} +{"train_loss": 0.002412910107523203, "global_step": 35536, "epoch": 298, "lr": 5.091495440589337e-05} +{"train_loss": 0.002965920139104128, "global_step": 35537, "epoch": 298, "lr": 5.0912739266337216e-05} +{"train_loss": 0.0021166051737964153, "global_step": 35538, "epoch": 298, "lr": 5.0910524124989e-05} +{"train_loss": 0.002900706371292472, "global_step": 35539, "epoch": 298, "lr": 5.0908308981853085e-05} +{"train_loss": 0.0014227359788492322, "global_step": 35540, "epoch": 298, "lr": 5.090609383693378e-05} +{"train_loss": 0.003473487216979265, "global_step": 35541, "epoch": 298, "lr": 5.090387869023545e-05} +{"train_loss": 0.003855739952996373, "global_step": 35542, "epoch": 298, "lr": 5.090166354176247e-05} +{"train_loss": 0.002031370997428894, "global_step": 35543, "epoch": 298, "lr": 5.0899448391519154e-05} +{"train_loss": 0.002640951657667756, "global_step": 35544, "epoch": 298, "lr": 5.089723323950988e-05} +{"train_loss": 0.0038607600145041943, "global_step": 35545, "epoch": 298, "lr": 5.089501808573897e-05} +{"train_loss": 0.0034232018515467644, "global_step": 35546, "epoch": 298, "lr": 5.089280293021079e-05} +{"train_loss": 0.004513246472924948, "global_step": 35547, "epoch": 298, "lr": 5.08905877729297e-05} +{"train_loss": 0.00417097145691514, "global_step": 35548, "epoch": 298, "lr": 5.0888372613900026e-05} +{"train_loss": 0.0033851678017526865, "global_step": 35549, "epoch": 298, "lr": 5.0886157453126126e-05} +{"train_loss": 0.0011096530361101031, "global_step": 35550, "epoch": 298, "lr": 5.088394229061235e-05} +{"train_loss": 0.0030772949103266, "global_step": 35551, "epoch": 298, "lr": 5.088172712636306e-05} +{"train_loss": 0.0032890653237700462, "global_step": 35552, "epoch": 298, "lr": 5.087951196038259e-05} +{"train_loss": 0.003741384716704488, "global_step": 35553, "epoch": 298, "lr": 5.087729679267529e-05} +{"train_loss": 0.0028402928728610277, "global_step": 35554, "epoch": 298, "lr": 5.08750816232455e-05} +{"train_loss": 0.0016151127638295293, "global_step": 35555, "epoch": 298, "lr": 5.08728664520976e-05} +{"train_loss": 0.0018189114052802324, "global_step": 35556, "epoch": 298, "lr": 5.0870651279235904e-05} +{"train_loss": 0.0018776865908876061, "global_step": 35557, "epoch": 298, "lr": 5.0868436104664786e-05} +{"train_loss": 0.005654488690197468, "global_step": 35558, "epoch": 298, "lr": 5.0866220928388584e-05} +{"train_loss": 0.0013010147958993912, "global_step": 35559, "epoch": 298, "lr": 5.086400575041166e-05} +{"train_loss": 0.003631924046203494, "global_step": 35560, "epoch": 298, "lr": 5.086179057073833e-05} +{"train_loss": 0.0031704739667475224, "global_step": 35561, "epoch": 298, "lr": 5.0859575389372984e-05} +{"train_loss": 0.003080687951296568, "global_step": 35562, "epoch": 298, "lr": 5.0857360206319936e-05} +{"train_loss": 0.002475353889167309, "global_step": 35563, "epoch": 298, "lr": 5.085514502158356e-05} +{"train_loss": 0.0030517331324517727, "global_step": 35564, "epoch": 298, "lr": 5.085292983516822e-05} +{"train_loss": 0.002109955996274948, "global_step": 35565, "epoch": 298, "lr": 5.0850714647078226e-05} +{"train_loss": 0.003582725301384926, "global_step": 35566, "epoch": 298, "lr": 5.0848499457317943e-05} +{"train_loss": 0.002078836318105459, "global_step": 35567, "epoch": 298, "lr": 5.084628426589172e-05} +{"train_loss": 0.0029638686683028936, "global_step": 35568, "epoch": 298, "lr": 5.084406907280391e-05} +{"train_loss": 0.0018630243139341474, "global_step": 35569, "epoch": 298, "lr": 5.0841853878058866e-05} +{"train_loss": 0.0023330736439675093, "global_step": 35570, "epoch": 298, "lr": 5.083963868166094e-05} +{"train_loss": 0.004801984876394272, "global_step": 35571, "epoch": 298, "lr": 5.0837423483614456e-05} +{"train_loss": 0.0018471060320734978, "global_step": 35572, "epoch": 298, "lr": 5.083520828392378e-05} +{"train_loss": 0.0027855669613927603, "global_step": 35573, "epoch": 298, "lr": 5.0832993082593275e-05} +{"train_loss": 0.0011944337747991085, "global_step": 35574, "epoch": 298, "lr": 5.083077787962727e-05} +{"train_loss": 0.0012626040261238813, "global_step": 35575, "epoch": 298, "lr": 5.082856267503011e-05} +{"train_loss": 0.0017898411024361849, "global_step": 35576, "epoch": 298, "lr": 5.082634746880617e-05} +{"train_loss": 0.00206012069247663, "global_step": 35577, "epoch": 298, "lr": 5.0824132260959786e-05} +{"train_loss": 0.001473529846407473, "global_step": 35578, "epoch": 298, "lr": 5.08219170514953e-05} +{"train_loss": 0.0029424852691590786, "global_step": 35579, "epoch": 298, "lr": 5.0819701840417064e-05} +{"train_loss": 0.002686827490497537, "global_step": 35580, "epoch": 298, "lr": 5.081748662772944e-05, "val_loss": 0.01189245656132698} +{"train_loss": 0.0024569209199398756, "global_step": 35581, "epoch": 299, "lr": 5.081527141343676e-05} +{"train_loss": 0.004428320564329624, "global_step": 35582, "epoch": 299, "lr": 5.0813056197543394e-05} +{"train_loss": 0.0024709117133170366, "global_step": 35583, "epoch": 299, "lr": 5.081084098005368e-05} +{"train_loss": 0.0016392600955441594, "global_step": 35584, "epoch": 299, "lr": 5.080862576097196e-05} +{"train_loss": 0.004619725048542023, "global_step": 35585, "epoch": 299, "lr": 5.080641054030259e-05} +{"train_loss": 0.0025536371394991875, "global_step": 35586, "epoch": 299, "lr": 5.0804195318049905e-05} +{"train_loss": 0.0021651179995387793, "global_step": 35587, "epoch": 299, "lr": 5.0801980094218285e-05} +{"train_loss": 0.001936685061082244, "global_step": 35588, "epoch": 299, "lr": 5.079976486881206e-05} +{"train_loss": 0.0011477820808067918, "global_step": 35589, "epoch": 299, "lr": 5.079754964183559e-05} +{"train_loss": 0.0021338120568543673, "global_step": 35590, "epoch": 299, "lr": 5.0795334413293204e-05} +{"train_loss": 0.001751112169586122, "global_step": 35591, "epoch": 299, "lr": 5.0793119183189264e-05} +{"train_loss": 0.0026267312932759523, "global_step": 35592, "epoch": 299, "lr": 5.0790903951528126e-05} +{"train_loss": 0.0013033229624852538, "global_step": 35593, "epoch": 299, "lr": 5.0788688718314125e-05} +{"train_loss": 0.00207413244061172, "global_step": 35594, "epoch": 299, "lr": 5.078647348355162e-05} +{"train_loss": 0.002760095288977027, "global_step": 35595, "epoch": 299, "lr": 5.0784258247244966e-05} +{"train_loss": 0.003334929933771491, "global_step": 35596, "epoch": 299, "lr": 5.0782043009398495e-05} +{"train_loss": 0.002181556774303317, "global_step": 35597, "epoch": 299, "lr": 5.077982777001656e-05} +{"train_loss": 0.0026060312520712614, "global_step": 35598, "epoch": 299, "lr": 5.0777612529103534e-05} +{"train_loss": 0.0028613212052732706, "global_step": 35599, "epoch": 299, "lr": 5.077539728666374e-05} +{"train_loss": 0.0016901124035939574, "global_step": 35600, "epoch": 299, "lr": 5.077318204270154e-05} +{"train_loss": 0.002039210870862007, "global_step": 35601, "epoch": 299, "lr": 5.077096679722128e-05} +{"train_loss": 0.0011670331005007029, "global_step": 35602, "epoch": 299, "lr": 5.076875155022731e-05} +{"train_loss": 0.0012772602494806051, "global_step": 35603, "epoch": 299, "lr": 5.076653630172398e-05} +{"train_loss": 0.002493390580639243, "global_step": 35604, "epoch": 299, "lr": 5.0764321051715626e-05} +{"train_loss": 0.001400130451656878, "global_step": 35605, "epoch": 299, "lr": 5.0762105800206615e-05} +{"train_loss": 0.0022444711066782475, "global_step": 35606, "epoch": 299, "lr": 5.0759890547201296e-05} +{"train_loss": 0.0027169736567884684, "global_step": 35607, "epoch": 299, "lr": 5.0757675292704e-05} +{"train_loss": 0.0031882154289633036, "global_step": 35608, "epoch": 299, "lr": 5.0755460036719105e-05} +{"train_loss": 0.0025260550901293755, "global_step": 35609, "epoch": 299, "lr": 5.075324477925094e-05} +{"train_loss": 0.0013175082858651876, "global_step": 35610, "epoch": 299, "lr": 5.075102952030386e-05} +{"train_loss": 0.00190801452845335, "global_step": 35611, "epoch": 299, "lr": 5.074881425988219e-05} +{"train_loss": 0.0017474221531301737, "global_step": 35612, "epoch": 299, "lr": 5.074659899799033e-05} +{"train_loss": 0.0021658327896147966, "global_step": 35613, "epoch": 299, "lr": 5.074438373463259e-05} +{"train_loss": 0.0025587992276996374, "global_step": 35614, "epoch": 299, "lr": 5.074216846981336e-05} +{"train_loss": 0.0034814313985407352, "global_step": 35615, "epoch": 299, "lr": 5.073995320353694e-05} +{"train_loss": 0.001883306773379445, "global_step": 35616, "epoch": 299, "lr": 5.0737737935807694e-05} +{"train_loss": 0.0023096115328371525, "global_step": 35617, "epoch": 299, "lr": 5.073552266662999e-05} +{"train_loss": 0.002391387475654483, "global_step": 35618, "epoch": 299, "lr": 5.0733307396008154e-05} +{"train_loss": 0.002091757021844387, "global_step": 35619, "epoch": 299, "lr": 5.073109212394655e-05} +{"train_loss": 0.0023469803854823112, "global_step": 35620, "epoch": 299, "lr": 5.0728876850449535e-05} +{"train_loss": 0.003299280069768429, "global_step": 35621, "epoch": 299, "lr": 5.072666157552145e-05} +{"train_loss": 0.0019790104124695063, "global_step": 35622, "epoch": 299, "lr": 5.072444629916664e-05} +{"train_loss": 0.002676317235454917, "global_step": 35623, "epoch": 299, "lr": 5.072223102138946e-05} +{"train_loss": 0.0017795340390875936, "global_step": 35624, "epoch": 299, "lr": 5.072001574219424e-05} +{"train_loss": 0.0017165588214993477, "global_step": 35625, "epoch": 299, "lr": 5.071780046158535e-05} +{"train_loss": 0.0013356987619772553, "global_step": 35626, "epoch": 299, "lr": 5.071558517956714e-05} +{"train_loss": 0.002090353285893798, "global_step": 35627, "epoch": 299, "lr": 5.071336989614396e-05} +{"train_loss": 0.0014250774402171373, "global_step": 35628, "epoch": 299, "lr": 5.071115461132014e-05} +{"train_loss": 0.0031949442345649004, "global_step": 35629, "epoch": 299, "lr": 5.070893932510006e-05} +{"train_loss": 0.0028907163068652153, "global_step": 35630, "epoch": 299, "lr": 5.070672403748804e-05} +{"train_loss": 0.002554940991103649, "global_step": 35631, "epoch": 299, "lr": 5.0704508748488454e-05} +{"train_loss": 0.0026650861836969852, "global_step": 35632, "epoch": 299, "lr": 5.070229345810563e-05} +{"train_loss": 0.002510455437004566, "global_step": 35633, "epoch": 299, "lr": 5.0700078166343955e-05} +{"train_loss": 0.0024969473015516996, "global_step": 35634, "epoch": 299, "lr": 5.0697862873207726e-05} +{"train_loss": 0.003133772872388363, "global_step": 35635, "epoch": 299, "lr": 5.0695647578701324e-05} +{"train_loss": 0.0016908850520849228, "global_step": 35636, "epoch": 299, "lr": 5.069343228282909e-05} +{"train_loss": 0.0023253944236785173, "global_step": 35637, "epoch": 299, "lr": 5.069121698559537e-05} +{"train_loss": 0.0018379915272817016, "global_step": 35638, "epoch": 299, "lr": 5.068900168700452e-05} +{"train_loss": 0.0023716387804597616, "global_step": 35639, "epoch": 299, "lr": 5.068678638706091e-05} +{"train_loss": 0.0032108535524457693, "global_step": 35640, "epoch": 299, "lr": 5.068457108576885e-05} +{"train_loss": 0.0024353698827326298, "global_step": 35641, "epoch": 299, "lr": 5.068235578313272e-05} +{"train_loss": 0.0017383979866281152, "global_step": 35642, "epoch": 299, "lr": 5.068014047915685e-05} +{"train_loss": 0.0014629862271249294, "global_step": 35643, "epoch": 299, "lr": 5.0677925173845584e-05} +{"train_loss": 0.0026322761550545692, "global_step": 35644, "epoch": 299, "lr": 5.067570986720329e-05} +{"train_loss": 0.0024203923530876637, "global_step": 35645, "epoch": 299, "lr": 5.0673494559234325e-05} +{"train_loss": 0.0025816666893661022, "global_step": 35646, "epoch": 299, "lr": 5.067127924994302e-05} +{"train_loss": 0.001217774348333478, "global_step": 35647, "epoch": 299, "lr": 5.066906393933372e-05} +{"train_loss": 0.0021353834308683872, "global_step": 35648, "epoch": 299, "lr": 5.066684862741079e-05} +{"train_loss": 0.002722474979236722, "global_step": 35649, "epoch": 299, "lr": 5.066463331417858e-05} +{"train_loss": 0.002668654080480337, "global_step": 35650, "epoch": 299, "lr": 5.066241799964142e-05} +{"train_loss": 0.0017095102230086923, "global_step": 35651, "epoch": 299, "lr": 5.066020268380368e-05} +{"train_loss": 0.004190374165773392, "global_step": 35652, "epoch": 299, "lr": 5.065798736666972e-05} +{"train_loss": 0.0033579906448721886, "global_step": 35653, "epoch": 299, "lr": 5.065577204824385e-05} +{"train_loss": 0.0021829893812537193, "global_step": 35654, "epoch": 299, "lr": 5.065355672853045e-05} +{"train_loss": 0.0031290636397898197, "global_step": 35655, "epoch": 299, "lr": 5.0651341407533856e-05} +{"train_loss": 0.003345207078382373, "global_step": 35656, "epoch": 299, "lr": 5.0649126085258434e-05} +{"train_loss": 0.002214918378740549, "global_step": 35657, "epoch": 299, "lr": 5.064691076170851e-05} +{"train_loss": 0.002436400856822729, "global_step": 35658, "epoch": 299, "lr": 5.064469543688847e-05} +{"train_loss": 0.0031797185074537992, "global_step": 35659, "epoch": 299, "lr": 5.0642480110802616e-05} +{"train_loss": 0.0022264677099883556, "global_step": 35660, "epoch": 299, "lr": 5.06402647834553e-05} +{"train_loss": 0.002138093812391162, "global_step": 35661, "epoch": 299, "lr": 5.0638049454850925e-05} +{"train_loss": 0.0025009927339851856, "global_step": 35662, "epoch": 299, "lr": 5.06358341249938e-05} +{"train_loss": 0.0035863202065229416, "global_step": 35663, "epoch": 299, "lr": 5.063361879388828e-05} +{"train_loss": 0.0013217921368777752, "global_step": 35664, "epoch": 299, "lr": 5.063140346153873e-05} +{"train_loss": 0.004342336673289537, "global_step": 35665, "epoch": 299, "lr": 5.062918812794948e-05} +{"train_loss": 0.0028902667108923197, "global_step": 35666, "epoch": 299, "lr": 5.062697279312488e-05} +{"train_loss": 0.002249295823276043, "global_step": 35667, "epoch": 299, "lr": 5.062475745706929e-05} +{"train_loss": 0.0011422679526731372, "global_step": 35668, "epoch": 299, "lr": 5.0622542119787054e-05} +{"train_loss": 0.001334115513600409, "global_step": 35669, "epoch": 299, "lr": 5.062032678128252e-05} +{"train_loss": 0.0028688767924904823, "global_step": 35670, "epoch": 299, "lr": 5.061811144156004e-05} +{"train_loss": 0.002294496400281787, "global_step": 35671, "epoch": 299, "lr": 5.0615896100623984e-05} +{"train_loss": 0.0014783915830776095, "global_step": 35672, "epoch": 299, "lr": 5.0613680758478666e-05} +{"train_loss": 0.0021483979653567076, "global_step": 35673, "epoch": 299, "lr": 5.061146541512845e-05} +{"train_loss": 0.0024833213537931442, "global_step": 35674, "epoch": 299, "lr": 5.0609250070577685e-05} +{"train_loss": 0.002867126604542136, "global_step": 35675, "epoch": 299, "lr": 5.060703472483073e-05} +{"train_loss": 0.0027402432169765234, "global_step": 35676, "epoch": 299, "lr": 5.0604819377891924e-05} +{"train_loss": 0.004041607957333326, "global_step": 35677, "epoch": 299, "lr": 5.060260402976562e-05} +{"train_loss": 0.002558372914791107, "global_step": 35678, "epoch": 299, "lr": 5.060038868045616e-05} +{"train_loss": 0.0011634797556325793, "global_step": 35679, "epoch": 299, "lr": 5.059817332996791e-05} +{"train_loss": 0.0038230852223932743, "global_step": 35680, "epoch": 299, "lr": 5.059595797830521e-05} +{"train_loss": 0.0014724141219630837, "global_step": 35681, "epoch": 299, "lr": 5.059374262547241e-05} +{"train_loss": 0.001362721319310367, "global_step": 35682, "epoch": 299, "lr": 5.059152727147385e-05} +{"train_loss": 0.0025143565144389868, "global_step": 35683, "epoch": 299, "lr": 5.058931191631391e-05} +{"train_loss": 0.002533361781388521, "global_step": 35684, "epoch": 299, "lr": 5.0587096559996905e-05} +{"train_loss": 0.0024998646695166826, "global_step": 35685, "epoch": 299, "lr": 5.05848812025272e-05} +{"train_loss": 0.001835753209888935, "global_step": 35686, "epoch": 299, "lr": 5.058266584390914e-05} +{"train_loss": 0.002714479574933648, "global_step": 35687, "epoch": 299, "lr": 5.0580450484147076e-05} +{"train_loss": 0.0017403612146154046, "global_step": 35688, "epoch": 299, "lr": 5.0578235123245366e-05} +{"train_loss": 0.003984674345701933, "global_step": 35689, "epoch": 299, "lr": 5.057601976120837e-05} +{"train_loss": 0.003073385450989008, "global_step": 35690, "epoch": 299, "lr": 5.0573804398040404e-05} +{"train_loss": 0.0012335242936387658, "global_step": 35691, "epoch": 299, "lr": 5.0571589033745825e-05} +{"train_loss": 0.0026056079659610987, "global_step": 35692, "epoch": 299, "lr": 5.0569373668329e-05} +{"train_loss": 0.0020489131566137075, "global_step": 35693, "epoch": 299, "lr": 5.056715830179427e-05} +{"train_loss": 0.0024778966326266527, "global_step": 35694, "epoch": 299, "lr": 5.0564942934145986e-05} +{"train_loss": 0.0018966903444379568, "global_step": 35695, "epoch": 299, "lr": 5.056272756538848e-05} +{"train_loss": 0.00284249777905643, "global_step": 35696, "epoch": 299, "lr": 5.0560512195526156e-05} +{"train_loss": 0.003987085539847612, "global_step": 35697, "epoch": 299, "lr": 5.05582968245633e-05} +{"train_loss": 0.0020401878282427788, "global_step": 35698, "epoch": 299, "lr": 5.055608145250429e-05} +{"train_loss": 0.0023862783740345042, "global_step": 35699, "epoch": 299, "lr": 5.055386607935347e-05, "val_loss": 0.02008252963423729} +{"train_loss": 0.003228261135518551, "global_step": 35700, "epoch": 300, "lr": 5.055165070511521e-05} +{"train_loss": 0.0018310241866856813, "global_step": 35701, "epoch": 300, "lr": 5.0549435329793826e-05} +{"train_loss": 0.002641037805005908, "global_step": 35702, "epoch": 300, "lr": 5.05472199533937e-05} +{"train_loss": 0.0031343039590865374, "global_step": 35703, "epoch": 300, "lr": 5.0545004575919164e-05} +{"train_loss": 0.0025222753174602985, "global_step": 35704, "epoch": 300, "lr": 5.0542789197374564e-05} +{"train_loss": 0.0038776893634349108, "global_step": 35705, "epoch": 300, "lr": 5.054057381776425e-05} +{"train_loss": 0.0029457516502588987, "global_step": 35706, "epoch": 300, "lr": 5.0538358437092584e-05} +{"train_loss": 0.002030792413279414, "global_step": 35707, "epoch": 300, "lr": 5.0536143055363906e-05} +{"train_loss": 0.0017974047223106027, "global_step": 35708, "epoch": 300, "lr": 5.053392767258257e-05} +{"train_loss": 0.001689401688054204, "global_step": 35709, "epoch": 300, "lr": 5.053171228875291e-05} +{"train_loss": 0.0020797657780349255, "global_step": 35710, "epoch": 300, "lr": 5.05294969038793e-05} +{"train_loss": 0.002781218383461237, "global_step": 35711, "epoch": 300, "lr": 5.052728151796608e-05} +{"train_loss": 0.002525071147829294, "global_step": 35712, "epoch": 300, "lr": 5.052506613101761e-05} +{"train_loss": 0.0029235759284347296, "global_step": 35713, "epoch": 300, "lr": 5.052285074303822e-05} +{"train_loss": 0.002228613942861557, "global_step": 35714, "epoch": 300, "lr": 5.052063535403226e-05} +{"train_loss": 0.0020543753635138273, "global_step": 35715, "epoch": 300, "lr": 5.0518419964004104e-05} +{"train_loss": 0.0034742727875709534, "global_step": 35716, "epoch": 300, "lr": 5.051620457295808e-05} +{"train_loss": 0.0026246763300150633, "global_step": 35717, "epoch": 300, "lr": 5.0513989180898544e-05} +{"train_loss": 0.003045453689992428, "global_step": 35718, "epoch": 300, "lr": 5.051177378782984e-05} +{"train_loss": 0.0035245444159954786, "global_step": 35719, "epoch": 300, "lr": 5.050955839375633e-05} +{"train_loss": 0.0023250719532370567, "global_step": 35720, "epoch": 300, "lr": 5.050734299868235e-05} +{"train_loss": 0.0023489580489695072, "global_step": 35721, "epoch": 300, "lr": 5.0505127602612265e-05} +{"train_loss": 0.0031089549884200096, "global_step": 35722, "epoch": 300, "lr": 5.05029122055504e-05} +{"train_loss": 0.0028615042101591825, "global_step": 35723, "epoch": 300, "lr": 5.050069680750114e-05} +{"train_loss": 0.002159582218155265, "global_step": 35724, "epoch": 300, "lr": 5.0498481408468804e-05} +{"train_loss": 0.0029883231036365032, "global_step": 35725, "epoch": 300, "lr": 5.0496266008457746e-05} +{"train_loss": 0.0015380870318040252, "global_step": 35726, "epoch": 300, "lr": 5.049405060747233e-05} +{"train_loss": 0.001971400110051036, "global_step": 35727, "epoch": 300, "lr": 5.0491835205516904e-05} +{"train_loss": 0.0030351958703249693, "global_step": 35728, "epoch": 300, "lr": 5.04896198025958e-05} +{"train_loss": 0.0030305131804198027, "global_step": 35729, "epoch": 300, "lr": 5.048740439871339e-05} +{"train_loss": 0.0023040510714054108, "global_step": 35730, "epoch": 300, "lr": 5.048518899387401e-05} +{"train_loss": 0.0027676369063556194, "global_step": 35731, "epoch": 300, "lr": 5.0482973588082016e-05} +{"train_loss": 0.0025450338143855333, "global_step": 35732, "epoch": 300, "lr": 5.048075818134175e-05} +{"train_loss": 0.0027032915968447924, "global_step": 35733, "epoch": 300, "lr": 5.0478542773657576e-05} +{"train_loss": 0.0036702114157378674, "global_step": 35734, "epoch": 300, "lr": 5.0476327365033826e-05} +{"train_loss": 0.002238305751234293, "global_step": 35735, "epoch": 300, "lr": 5.047411195547486e-05} +{"train_loss": 0.002077495213598013, "global_step": 35736, "epoch": 300, "lr": 5.047189654498503e-05} +{"train_loss": 0.003177837934345007, "global_step": 35737, "epoch": 300, "lr": 5.046968113356867e-05} +{"train_loss": 0.003249888075515628, "global_step": 35738, "epoch": 300, "lr": 5.0467465721230145e-05} +{"train_loss": 0.0017396858893334866, "global_step": 35739, "epoch": 300, "lr": 5.046525030797381e-05} +{"train_loss": 0.0031708970200270414, "global_step": 35740, "epoch": 300, "lr": 5.046303489380401e-05} +{"train_loss": 0.003005016129463911, "global_step": 35741, "epoch": 300, "lr": 5.046081947872507e-05} +{"train_loss": 0.001955383224412799, "global_step": 35742, "epoch": 300, "lr": 5.045860406274138e-05} +{"train_loss": 0.00244328286498785, "global_step": 35743, "epoch": 300, "lr": 5.0456388645857256e-05} +{"train_loss": 0.0020259858574718237, "global_step": 35744, "epoch": 300, "lr": 5.045417322807706e-05} +{"train_loss": 0.0019067063694819808, "global_step": 35745, "epoch": 300, "lr": 5.045195780940515e-05} +{"train_loss": 0.0015748274745419621, "global_step": 35746, "epoch": 300, "lr": 5.044974238984588e-05} +{"train_loss": 0.002669519279152155, "global_step": 35747, "epoch": 300, "lr": 5.044752696940357e-05} +{"train_loss": 0.0020898343063890934, "global_step": 35748, "epoch": 300, "lr": 5.0445311548082595e-05} +{"train_loss": 0.0019519372144713998, "global_step": 35749, "epoch": 300, "lr": 5.0443096125887304e-05} +{"train_loss": 0.003075741697102785, "global_step": 35750, "epoch": 300, "lr": 5.0440880702822036e-05} +{"train_loss": 0.0016903768992051482, "global_step": 35751, "epoch": 300, "lr": 5.043866527889115e-05} +{"train_loss": 0.0012372840428724885, "global_step": 35752, "epoch": 300, "lr": 5.0436449854099e-05} +{"train_loss": 0.0023065616842359304, "global_step": 35753, "epoch": 300, "lr": 5.043423442844991e-05} +{"train_loss": 0.0022281643468886614, "global_step": 35754, "epoch": 300, "lr": 5.043201900194825e-05} +{"train_loss": 0.001860738848336041, "global_step": 35755, "epoch": 300, "lr": 5.0429803574598364e-05} +{"train_loss": 0.0020728649105876684, "global_step": 35756, "epoch": 300, "lr": 5.0427588146404616e-05} +{"train_loss": 0.0023998741526156664, "global_step": 35757, "epoch": 300, "lr": 5.0425372717371336e-05} +{"train_loss": 0.0028721108101308346, "global_step": 35758, "epoch": 300, "lr": 5.042315728750289e-05} +{"train_loss": 0.0035870603751391172, "global_step": 35759, "epoch": 300, "lr": 5.0420941856803604e-05} +{"train_loss": 0.0022932197898626328, "global_step": 35760, "epoch": 300, "lr": 5.0418726425277865e-05} +{"train_loss": 0.0015029975911602378, "global_step": 35761, "epoch": 300, "lr": 5.0416510992929976e-05} +{"train_loss": 0.0016214733477681875, "global_step": 35762, "epoch": 300, "lr": 5.0414295559764335e-05} +{"train_loss": 0.0018774019554257393, "global_step": 35763, "epoch": 300, "lr": 5.041208012578526e-05} +{"train_loss": 0.0025257286615669727, "global_step": 35764, "epoch": 300, "lr": 5.040986469099711e-05} +{"train_loss": 0.002397498581558466, "global_step": 35765, "epoch": 300, "lr": 5.040764925540424e-05} +{"train_loss": 0.0027713526505976915, "global_step": 35766, "epoch": 300, "lr": 5.0405433819011e-05} +{"train_loss": 0.003786162007600069, "global_step": 35767, "epoch": 300, "lr": 5.040321838182171e-05} +{"train_loss": 0.0018605474615469575, "global_step": 35768, "epoch": 300, "lr": 5.0401002943840756e-05} +{"train_loss": 0.0018317998619750142, "global_step": 35769, "epoch": 300, "lr": 5.039878750507248e-05} +{"train_loss": 0.0035088853910565376, "global_step": 35770, "epoch": 300, "lr": 5.039657206552122e-05} +{"train_loss": 0.0009183273650705814, "global_step": 35771, "epoch": 300, "lr": 5.039435662519135e-05} +{"train_loss": 0.0024826412554830313, "global_step": 35772, "epoch": 300, "lr": 5.039214118408718e-05} +{"train_loss": 0.001898772781714797, "global_step": 35773, "epoch": 300, "lr": 5.038992574221309e-05} +{"train_loss": 0.0027870472986251116, "global_step": 35774, "epoch": 300, "lr": 5.0387710299573435e-05} +{"train_loss": 0.0018802911508828402, "global_step": 35775, "epoch": 300, "lr": 5.0385494856172545e-05} +{"train_loss": 0.0022089341655373573, "global_step": 35776, "epoch": 300, "lr": 5.0383279412014774e-05} +{"train_loss": 0.0018070173682644963, "global_step": 35777, "epoch": 300, "lr": 5.038106396710447e-05} +{"train_loss": 0.0013798651052638888, "global_step": 35778, "epoch": 300, "lr": 5.037884852144599e-05} +{"train_loss": 0.0017691474640741944, "global_step": 35779, "epoch": 300, "lr": 5.037663307504369e-05} +{"train_loss": 0.0016471485141664743, "global_step": 35780, "epoch": 300, "lr": 5.0374417627901895e-05} +{"train_loss": 0.002338835271075368, "global_step": 35781, "epoch": 300, "lr": 5.0372202180024985e-05} +{"train_loss": 0.0011602062731981277, "global_step": 35782, "epoch": 300, "lr": 5.036998673141728e-05} +{"train_loss": 0.0016675281804054976, "global_step": 35783, "epoch": 300, "lr": 5.036777128208318e-05} +{"train_loss": 0.003800473175942898, "global_step": 35784, "epoch": 300, "lr": 5.036555583202698e-05} +{"train_loss": 0.002124019432812929, "global_step": 35785, "epoch": 300, "lr": 5.036334038125304e-05} +{"train_loss": 0.002186630852520466, "global_step": 35786, "epoch": 300, "lr": 5.0361124929765725e-05} +{"train_loss": 0.002374348696321249, "global_step": 35787, "epoch": 300, "lr": 5.035890947756938e-05} +{"train_loss": 0.002275807084515691, "global_step": 35788, "epoch": 300, "lr": 5.035669402466836e-05} +{"train_loss": 0.0022565205581486225, "global_step": 35789, "epoch": 300, "lr": 5.035447857106701e-05} +{"train_loss": 0.0028508934192359447, "global_step": 35790, "epoch": 300, "lr": 5.035226311676968e-05} +{"train_loss": 0.002421565121039748, "global_step": 35791, "epoch": 300, "lr": 5.035004766178072e-05} +{"train_loss": 0.0016970885917544365, "global_step": 35792, "epoch": 300, "lr": 5.0347832206104475e-05} +{"train_loss": 0.0023067083675414324, "global_step": 35793, "epoch": 300, "lr": 5.034561674974528e-05} +{"train_loss": 0.0015042198356240988, "global_step": 35794, "epoch": 300, "lr": 5.034340129270753e-05} +{"train_loss": 0.0021689031273126602, "global_step": 35795, "epoch": 300, "lr": 5.034118583499553e-05} +{"train_loss": 0.0022068293765187263, "global_step": 35796, "epoch": 300, "lr": 5.033897037661367e-05} +{"train_loss": 0.0032381811179220676, "global_step": 35797, "epoch": 300, "lr": 5.0336754917566265e-05} +{"train_loss": 0.002767396392300725, "global_step": 35798, "epoch": 300, "lr": 5.0334539457857673e-05} +{"train_loss": 0.0021699031349271536, "global_step": 35799, "epoch": 300, "lr": 5.033232399749226e-05} +{"train_loss": 0.002379754325374961, "global_step": 35800, "epoch": 300, "lr": 5.033010853647435e-05} +{"train_loss": 0.004442266188561916, "global_step": 35801, "epoch": 300, "lr": 5.032789307480832e-05} +{"train_loss": 0.0016050186241045594, "global_step": 35802, "epoch": 300, "lr": 5.032567761249851e-05} +{"train_loss": 0.0023781333584338427, "global_step": 35803, "epoch": 300, "lr": 5.032346214954926e-05} +{"train_loss": 0.003964140545576811, "global_step": 35804, "epoch": 300, "lr": 5.032124668596492e-05} +{"train_loss": 0.0012957421131432056, "global_step": 35805, "epoch": 300, "lr": 5.031903122174986e-05} +{"train_loss": 0.004290354438126087, "global_step": 35806, "epoch": 300, "lr": 5.03168157569084e-05} +{"train_loss": 0.0032834778539836407, "global_step": 35807, "epoch": 300, "lr": 5.0314600291444916e-05} +{"train_loss": 0.002188027137890458, "global_step": 35808, "epoch": 300, "lr": 5.031238482536374e-05} +{"train_loss": 0.002006117021664977, "global_step": 35809, "epoch": 300, "lr": 5.031016935866924e-05} +{"train_loss": 0.0016328237252309918, "global_step": 35810, "epoch": 300, "lr": 5.030795389136574e-05} +{"train_loss": 0.0026207626797258854, "global_step": 35811, "epoch": 300, "lr": 5.030573842345763e-05} +{"train_loss": 0.003838865552097559, "global_step": 35812, "epoch": 300, "lr": 5.030352295494921e-05} +{"train_loss": 0.0028732840437442064, "global_step": 35813, "epoch": 300, "lr": 5.0301307485844876e-05} +{"train_loss": 0.0024252296425402164, "global_step": 35814, "epoch": 300, "lr": 5.029909201614894e-05} +{"train_loss": 0.0015927567146718502, "global_step": 35815, "epoch": 300, "lr": 5.029687654586579e-05} +{"train_loss": 0.00122781191021204, "global_step": 35816, "epoch": 300, "lr": 5.029466107499974e-05} +{"train_loss": 0.002605198184028268, "global_step": 35817, "epoch": 300, "lr": 5.029244560355516e-05} +{"train_loss": 0.0024214882438830217, "global_step": 35818, "epoch": 300, "lr": 5.029023013153639e-05, "val_loss": 0.037264786660671234, "train_action_mse_error": 4.51011183031369e-05} +{"train_loss": 0.003341280622407794, "global_step": 35819, "epoch": 301, "lr": 5.028801465894778e-05} +{"train_loss": 0.002716867486014962, "global_step": 35820, "epoch": 301, "lr": 5.028579918579368e-05} +{"train_loss": 0.0017050366150215268, "global_step": 35821, "epoch": 301, "lr": 5.028358371207846e-05} +{"train_loss": 0.0030223920475691557, "global_step": 35822, "epoch": 301, "lr": 5.028136823780646e-05} +{"train_loss": 0.003113037906587124, "global_step": 35823, "epoch": 301, "lr": 5.027915276298201e-05} +{"train_loss": 0.003556110430508852, "global_step": 35824, "epoch": 301, "lr": 5.027693728760946e-05} +{"train_loss": 0.0025306311435997486, "global_step": 35825, "epoch": 301, "lr": 5.0274721811693194e-05} +{"train_loss": 0.002238919958472252, "global_step": 35826, "epoch": 301, "lr": 5.027250633523752e-05} +{"train_loss": 0.00198997906409204, "global_step": 35827, "epoch": 301, "lr": 5.027029085824683e-05} +{"train_loss": 0.0016119217034429312, "global_step": 35828, "epoch": 301, "lr": 5.0268075380725446e-05} +{"train_loss": 0.0029981532134115696, "global_step": 35829, "epoch": 301, "lr": 5.026585990267772e-05} +{"train_loss": 0.003305498044937849, "global_step": 35830, "epoch": 301, "lr": 5.026364442410801e-05} +{"train_loss": 0.0016061965143308043, "global_step": 35831, "epoch": 301, "lr": 5.026142894502066e-05} +{"train_loss": 0.0033773542381823063, "global_step": 35832, "epoch": 301, "lr": 5.025921346542003e-05} +{"train_loss": 0.0021726747509092093, "global_step": 35833, "epoch": 301, "lr": 5.025699798531045e-05} +{"train_loss": 0.003163120709359646, "global_step": 35834, "epoch": 301, "lr": 5.02547825046963e-05} +{"train_loss": 0.003052076091989875, "global_step": 35835, "epoch": 301, "lr": 5.0252567023581896e-05} +{"train_loss": 0.001760221435688436, "global_step": 35836, "epoch": 301, "lr": 5.025035154197161e-05} +{"train_loss": 0.0034446842037141323, "global_step": 35837, "epoch": 301, "lr": 5.0248136059869775e-05} +{"train_loss": 0.0025210443418473005, "global_step": 35838, "epoch": 301, "lr": 5.024592057728077e-05} +{"train_loss": 0.0022393192630261183, "global_step": 35839, "epoch": 301, "lr": 5.024370509420892e-05} +{"train_loss": 0.0016445998335257173, "global_step": 35840, "epoch": 301, "lr": 5.024148961065858e-05} +{"train_loss": 0.002387122018262744, "global_step": 35841, "epoch": 301, "lr": 5.023927412663408e-05} +{"train_loss": 0.003344512078911066, "global_step": 35842, "epoch": 301, "lr": 5.023705864213981e-05} +{"train_loss": 0.002713787602260709, "global_step": 35843, "epoch": 301, "lr": 5.02348431571801e-05} +{"train_loss": 0.0021478564012795687, "global_step": 35844, "epoch": 301, "lr": 5.0232627671759304e-05} +{"train_loss": 0.001873012981377542, "global_step": 35845, "epoch": 301, "lr": 5.023041218588176e-05} +{"train_loss": 0.0019569091964513063, "global_step": 35846, "epoch": 301, "lr": 5.022819669955184e-05} +{"train_loss": 0.0022883517667651176, "global_step": 35847, "epoch": 301, "lr": 5.0225981212773875e-05} +{"train_loss": 0.0027600463945418596, "global_step": 35848, "epoch": 301, "lr": 5.022376572555221e-05} +{"train_loss": 0.0024376935325562954, "global_step": 35849, "epoch": 301, "lr": 5.022155023789121e-05} +{"train_loss": 0.002602132735773921, "global_step": 35850, "epoch": 301, "lr": 5.021933474979522e-05} +{"train_loss": 0.001193279167637229, "global_step": 35851, "epoch": 301, "lr": 5.021711926126859e-05} +{"train_loss": 0.002788935089483857, "global_step": 35852, "epoch": 301, "lr": 5.021490377231568e-05} +{"train_loss": 0.002469083061441779, "global_step": 35853, "epoch": 301, "lr": 5.021268828294082e-05} +{"train_loss": 0.0037197519559413195, "global_step": 35854, "epoch": 301, "lr": 5.0210472793148363e-05} +{"train_loss": 0.002072179690003395, "global_step": 35855, "epoch": 301, "lr": 5.0208257302942676e-05} +{"train_loss": 0.0024454998783767223, "global_step": 35856, "epoch": 301, "lr": 5.020604181232809e-05} +{"train_loss": 0.0012551476247608662, "global_step": 35857, "epoch": 301, "lr": 5.0203826321308965e-05} +{"train_loss": 0.0030562197789549828, "global_step": 35858, "epoch": 301, "lr": 5.020161082988964e-05} +{"train_loss": 0.0020974911749362946, "global_step": 35859, "epoch": 301, "lr": 5.0199395338074484e-05} +{"train_loss": 0.003689222037792206, "global_step": 35860, "epoch": 301, "lr": 5.0197179845867833e-05} +{"train_loss": 0.002639985177665949, "global_step": 35861, "epoch": 301, "lr": 5.0194964353274055e-05} +{"train_loss": 0.002114619594067335, "global_step": 35862, "epoch": 301, "lr": 5.0192748860297466e-05} +{"train_loss": 0.0030908065382391214, "global_step": 35863, "epoch": 301, "lr": 5.0190533366942435e-05} +{"train_loss": 0.0032440917566418648, "global_step": 35864, "epoch": 301, "lr": 5.018831787321333e-05} +{"train_loss": 0.0024342755787074566, "global_step": 35865, "epoch": 301, "lr": 5.0186102379114474e-05} +{"train_loss": 0.0022809389047324657, "global_step": 35866, "epoch": 301, "lr": 5.018388688465023e-05} +{"train_loss": 0.003793492214754224, "global_step": 35867, "epoch": 301, "lr": 5.0181671389824933e-05} +{"train_loss": 0.0038006152026355267, "global_step": 35868, "epoch": 301, "lr": 5.017945589464295e-05} +{"train_loss": 0.003399865934625268, "global_step": 35869, "epoch": 301, "lr": 5.017724039910863e-05} +{"train_loss": 0.0022859685122966766, "global_step": 35870, "epoch": 301, "lr": 5.017502490322631e-05} +{"train_loss": 0.0024919905699789524, "global_step": 35871, "epoch": 301, "lr": 5.0172809407000354e-05} +{"train_loss": 0.005255826283246279, "global_step": 35872, "epoch": 301, "lr": 5.0170593910435096e-05} +{"train_loss": 0.0015814841026440263, "global_step": 35873, "epoch": 301, "lr": 5.01683784135349e-05} +{"train_loss": 0.003137588035315275, "global_step": 35874, "epoch": 301, "lr": 5.0166162916304105e-05} +{"train_loss": 0.0029139297548681498, "global_step": 35875, "epoch": 301, "lr": 5.016394741874707e-05} +{"train_loss": 0.002371671376749873, "global_step": 35876, "epoch": 301, "lr": 5.016173192086814e-05} +{"train_loss": 0.002010608557611704, "global_step": 35877, "epoch": 301, "lr": 5.0159516422671674e-05} +{"train_loss": 0.0033137958962470293, "global_step": 35878, "epoch": 301, "lr": 5.015730092416201e-05} +{"train_loss": 0.0028968665283173323, "global_step": 35879, "epoch": 301, "lr": 5.015508542534349e-05} +{"train_loss": 0.002234111772850156, "global_step": 35880, "epoch": 301, "lr": 5.01528699262205e-05} +{"train_loss": 0.0011622455203905702, "global_step": 35881, "epoch": 301, "lr": 5.015065442679735e-05} +{"train_loss": 0.0037043748889118433, "global_step": 35882, "epoch": 301, "lr": 5.0148438927078414e-05} +{"train_loss": 0.004744734615087509, "global_step": 35883, "epoch": 301, "lr": 5.014622342706803e-05} +{"train_loss": 0.0026206462644040585, "global_step": 35884, "epoch": 301, "lr": 5.014400792677056e-05} +{"train_loss": 0.002018612576648593, "global_step": 35885, "epoch": 301, "lr": 5.014179242619034e-05} +{"train_loss": 0.003275779075920582, "global_step": 35886, "epoch": 301, "lr": 5.013957692533172e-05} +{"train_loss": 0.0014885037671774626, "global_step": 35887, "epoch": 301, "lr": 5.013736142419907e-05} +{"train_loss": 0.0017506997101008892, "global_step": 35888, "epoch": 301, "lr": 5.0135145922796714e-05} +{"train_loss": 0.0024329898878932, "global_step": 35889, "epoch": 301, "lr": 5.013293042112901e-05} +{"train_loss": 0.0031798251438885927, "global_step": 35890, "epoch": 301, "lr": 5.013071491920032e-05} +{"train_loss": 0.0029366284143179655, "global_step": 35891, "epoch": 301, "lr": 5.012849941701497e-05} +{"train_loss": 0.002393115311861038, "global_step": 35892, "epoch": 301, "lr": 5.012628391457734e-05} +{"train_loss": 0.0021603209897875786, "global_step": 35893, "epoch": 301, "lr": 5.012406841189177e-05} +{"train_loss": 0.0019517051987349987, "global_step": 35894, "epoch": 301, "lr": 5.0121852908962596e-05} +{"train_loss": 0.0026390079874545336, "global_step": 35895, "epoch": 301, "lr": 5.0119637405794174e-05} +{"train_loss": 0.004401728045195341, "global_step": 35896, "epoch": 301, "lr": 5.011742190239087e-05} +{"train_loss": 0.003928366117179394, "global_step": 35897, "epoch": 301, "lr": 5.011520639875701e-05} +{"train_loss": 0.0023043379187583923, "global_step": 35898, "epoch": 301, "lr": 5.011299089489695e-05} +{"train_loss": 0.002971625654026866, "global_step": 35899, "epoch": 301, "lr": 5.011077539081506e-05} +{"train_loss": 0.0025388142094016075, "global_step": 35900, "epoch": 301, "lr": 5.010855988651566e-05} +{"train_loss": 0.0017498735105618834, "global_step": 35901, "epoch": 301, "lr": 5.010634438200311e-05} +{"train_loss": 0.002580563072115183, "global_step": 35902, "epoch": 301, "lr": 5.010412887728178e-05} +{"train_loss": 0.0034747826866805553, "global_step": 35903, "epoch": 301, "lr": 5.0101913372356e-05} +{"train_loss": 0.002186750527471304, "global_step": 35904, "epoch": 301, "lr": 5.0099697867230125e-05} +{"train_loss": 0.0035513360053300858, "global_step": 35905, "epoch": 301, "lr": 5.00974823619085e-05} +{"train_loss": 0.0035281318705528975, "global_step": 35906, "epoch": 301, "lr": 5.0095266856395475e-05} +{"train_loss": 0.0034722615964710712, "global_step": 35907, "epoch": 301, "lr": 5.009305135069541e-05} +{"train_loss": 0.0025828112848103046, "global_step": 35908, "epoch": 301, "lr": 5.0090835844812644e-05} +{"train_loss": 0.0023042275570333004, "global_step": 35909, "epoch": 301, "lr": 5.008862033875154e-05} +{"train_loss": 0.0018758773803710938, "global_step": 35910, "epoch": 301, "lr": 5.008640483251642e-05} +{"train_loss": 0.003337954403832555, "global_step": 35911, "epoch": 301, "lr": 5.0084189326111676e-05} +{"train_loss": 0.001621172297745943, "global_step": 35912, "epoch": 301, "lr": 5.008197381954162e-05} +{"train_loss": 0.0035379771143198013, "global_step": 35913, "epoch": 301, "lr": 5.007975831281062e-05} +{"train_loss": 0.0031946797389537096, "global_step": 35914, "epoch": 301, "lr": 5.007754280592303e-05} +{"train_loss": 0.0022725570015609264, "global_step": 35915, "epoch": 301, "lr": 5.007532729888319e-05} +{"train_loss": 0.0021075657568871975, "global_step": 35916, "epoch": 301, "lr": 5.007311179169546e-05} +{"train_loss": 0.0021746524143964052, "global_step": 35917, "epoch": 301, "lr": 5.0070896284364164e-05} +{"train_loss": 0.002757269423455, "global_step": 35918, "epoch": 301, "lr": 5.006868077689368e-05} +{"train_loss": 0.0011474820785224438, "global_step": 35919, "epoch": 301, "lr": 5.006646526928835e-05} +{"train_loss": 0.003856718773022294, "global_step": 35920, "epoch": 301, "lr": 5.006424976155253e-05} +{"train_loss": 0.0019670953042805195, "global_step": 35921, "epoch": 301, "lr": 5.006203425369056e-05} +{"train_loss": 0.0018584835343062878, "global_step": 35922, "epoch": 301, "lr": 5.005981874570679e-05} +{"train_loss": 0.0017302252817898989, "global_step": 35923, "epoch": 301, "lr": 5.0057603237605564e-05} +{"train_loss": 0.0026613541413098574, "global_step": 35924, "epoch": 301, "lr": 5.0055387729391245e-05} +{"train_loss": 0.00221981736831367, "global_step": 35925, "epoch": 301, "lr": 5.0053172221068166e-05} +{"train_loss": 0.003344756318256259, "global_step": 35926, "epoch": 301, "lr": 5.0050956712640706e-05} +{"train_loss": 0.0020070266909897327, "global_step": 35927, "epoch": 301, "lr": 5.0048741204113195e-05} +{"train_loss": 0.0028319486882537603, "global_step": 35928, "epoch": 301, "lr": 5.004652569548999e-05} +{"train_loss": 0.0027931786607950926, "global_step": 35929, "epoch": 301, "lr": 5.004431018677543e-05} +{"train_loss": 0.0025397364515811205, "global_step": 35930, "epoch": 301, "lr": 5.0042094677973875e-05} +{"train_loss": 0.003952513914555311, "global_step": 35931, "epoch": 301, "lr": 5.003987916908967e-05} +{"train_loss": 0.0022330954670906067, "global_step": 35932, "epoch": 301, "lr": 5.003766366012717e-05} +{"train_loss": 0.002644679509103298, "global_step": 35933, "epoch": 301, "lr": 5.003544815109071e-05} +{"train_loss": 0.0021464477758854628, "global_step": 35934, "epoch": 301, "lr": 5.003323264198467e-05} +{"train_loss": 0.0026063856203109026, "global_step": 35935, "epoch": 301, "lr": 5.0031017132813366e-05} +{"train_loss": 0.0013559807557612658, "global_step": 35936, "epoch": 301, "lr": 5.002880162358117e-05} +{"train_loss": 0.0026225025605159896, "global_step": 35937, "epoch": 301, "lr": 5.002658611429242e-05, "val_loss": 0.0169900543987751} +{"train_loss": 0.0021748554427176714, "global_step": 35938, "epoch": 302, "lr": 5.002437060495147e-05} +{"train_loss": 0.0025179507210850716, "global_step": 35939, "epoch": 302, "lr": 5.002215509556267e-05} +{"train_loss": 0.0023777310270816088, "global_step": 35940, "epoch": 302, "lr": 5.001993958613038e-05} +{"train_loss": 0.002208616118878126, "global_step": 35941, "epoch": 302, "lr": 5.0017724076658934e-05} +{"train_loss": 0.0030353027395904064, "global_step": 35942, "epoch": 302, "lr": 5.001550856715269e-05} +{"train_loss": 0.00318419118411839, "global_step": 35943, "epoch": 302, "lr": 5.001329305761599e-05} +{"train_loss": 0.0018055879045277834, "global_step": 35944, "epoch": 302, "lr": 5.001107754805321e-05} +{"train_loss": 0.002712795278057456, "global_step": 35945, "epoch": 302, "lr": 5.000886203846866e-05} +{"train_loss": 0.002309752395376563, "global_step": 35946, "epoch": 302, "lr": 5.000664652886673e-05} +{"train_loss": 0.0021713459864258766, "global_step": 35947, "epoch": 302, "lr": 5.000443101925174e-05} +{"train_loss": 0.002339884638786316, "global_step": 35948, "epoch": 302, "lr": 5.000221550962805e-05} +{"train_loss": 0.0019000229658558965, "global_step": 35949, "epoch": 302, "lr": 5e-05} +{"train_loss": 0.002755732974037528, "global_step": 35950, "epoch": 302, "lr": 4.999778449037197e-05} +{"train_loss": 0.0042463126592338085, "global_step": 35951, "epoch": 302, "lr": 4.999556898074827e-05} +{"train_loss": 0.0015616790624335408, "global_step": 35952, "epoch": 302, "lr": 4.999335347113329e-05} +{"train_loss": 0.0018990692915394902, "global_step": 35953, "epoch": 302, "lr": 4.9991137961531335e-05} +{"train_loss": 0.004711764864623547, "global_step": 35954, "epoch": 302, "lr": 4.998892245194681e-05} +{"train_loss": 0.003313568653538823, "global_step": 35955, "epoch": 302, "lr": 4.9986706942384005e-05} +{"train_loss": 0.002779946895316243, "global_step": 35956, "epoch": 302, "lr": 4.998449143284732e-05} +{"train_loss": 0.0023041374515742064, "global_step": 35957, "epoch": 302, "lr": 4.998227592334108e-05} +{"train_loss": 0.002174780471250415, "global_step": 35958, "epoch": 302, "lr": 4.9980060413869626e-05} +{"train_loss": 0.002396377269178629, "global_step": 35959, "epoch": 302, "lr": 4.9977844904437334e-05} +{"train_loss": 0.0014425088884308934, "global_step": 35960, "epoch": 302, "lr": 4.997562939504853e-05} +{"train_loss": 0.0018885827157646418, "global_step": 35961, "epoch": 302, "lr": 4.997341388570759e-05} +{"train_loss": 0.0016809231601655483, "global_step": 35962, "epoch": 302, "lr": 4.9971198376418855e-05} +{"train_loss": 0.0020438593346625566, "global_step": 35963, "epoch": 302, "lr": 4.996898286718664e-05} +{"train_loss": 0.0017399495700374246, "global_step": 35964, "epoch": 302, "lr": 4.9966767358015355e-05} +{"train_loss": 0.0021714726462960243, "global_step": 35965, "epoch": 302, "lr": 4.996455184890929e-05} +{"train_loss": 0.002491803839802742, "global_step": 35966, "epoch": 302, "lr": 4.996233633987285e-05} +{"train_loss": 0.0022863559424877167, "global_step": 35967, "epoch": 302, "lr": 4.996012083091034e-05} +{"train_loss": 0.0025338183622807264, "global_step": 35968, "epoch": 302, "lr": 4.9957905322026136e-05} +{"train_loss": 0.001885768724605441, "global_step": 35969, "epoch": 302, "lr": 4.995568981322459e-05} +{"train_loss": 0.0023978552781045437, "global_step": 35970, "epoch": 302, "lr": 4.995347430451002e-05} +{"train_loss": 0.0020595728419721127, "global_step": 35971, "epoch": 302, "lr": 4.995125879588682e-05} +{"train_loss": 0.0020753866992890835, "global_step": 35972, "epoch": 302, "lr": 4.99490432873593e-05} +{"train_loss": 0.0013209792086854577, "global_step": 35973, "epoch": 302, "lr": 4.9946827778931845e-05} +{"train_loss": 0.003138092579320073, "global_step": 35974, "epoch": 302, "lr": 4.994461227060877e-05} +{"train_loss": 0.0021041734144091606, "global_step": 35975, "epoch": 302, "lr": 4.994239676239445e-05} +{"train_loss": 0.003124051261693239, "global_step": 35976, "epoch": 302, "lr": 4.994018125429323e-05} +{"train_loss": 0.003327453974634409, "global_step": 35977, "epoch": 302, "lr": 4.9937965746309454e-05} +{"train_loss": 0.0025852308608591557, "global_step": 35978, "epoch": 302, "lr": 4.9935750238447486e-05} +{"train_loss": 0.0025729842018336058, "global_step": 35979, "epoch": 302, "lr": 4.9933534730711646e-05} +{"train_loss": 0.002679145196452737, "global_step": 35980, "epoch": 302, "lr": 4.993131922310633e-05} +{"train_loss": 0.0023666711058467627, "global_step": 35981, "epoch": 302, "lr": 4.9929103715635854e-05} +{"train_loss": 0.0018452791264280677, "global_step": 35982, "epoch": 302, "lr": 4.992688820830456e-05} +{"train_loss": 0.0020674169063568115, "global_step": 35983, "epoch": 302, "lr": 4.992467270111683e-05} +{"train_loss": 0.003271366935223341, "global_step": 35984, "epoch": 302, "lr": 4.992245719407698e-05} +{"train_loss": 0.002984634367749095, "global_step": 35985, "epoch": 302, "lr": 4.992024168718939e-05} +{"train_loss": 0.002282440662384033, "global_step": 35986, "epoch": 302, "lr": 4.991802618045838e-05} +{"train_loss": 0.002129662549123168, "global_step": 35987, "epoch": 302, "lr": 4.991581067388834e-05} +{"train_loss": 0.002528458135202527, "global_step": 35988, "epoch": 302, "lr": 4.991359516748358e-05} +{"train_loss": 0.002078048652037978, "global_step": 35989, "epoch": 302, "lr": 4.991137966124848e-05} +{"train_loss": 0.0031772933434695005, "global_step": 35990, "epoch": 302, "lr": 4.990916415518737e-05} +{"train_loss": 0.0028875034768134356, "global_step": 35991, "epoch": 302, "lr": 4.9906948649304605e-05} +{"train_loss": 0.0024597416631877422, "global_step": 35992, "epoch": 302, "lr": 4.990473314360453e-05} +{"train_loss": 0.001671587466262281, "global_step": 35993, "epoch": 302, "lr": 4.990251763809152e-05} +{"train_loss": 0.002031288342550397, "global_step": 35994, "epoch": 302, "lr": 4.9900302132769886e-05} +{"train_loss": 0.0017937023658305407, "global_step": 35995, "epoch": 302, "lr": 4.989808662764402e-05} +{"train_loss": 0.0013198292581364512, "global_step": 35996, "epoch": 302, "lr": 4.989587112271823e-05} +{"train_loss": 0.0033422624692320824, "global_step": 35997, "epoch": 302, "lr": 4.9893655617996895e-05} +{"train_loss": 0.0022055162116885185, "global_step": 35998, "epoch": 302, "lr": 4.989144011348435e-05} +{"train_loss": 0.0014214256079867482, "global_step": 35999, "epoch": 302, "lr": 4.988922460918496e-05} +{"train_loss": 0.0018351639155298471, "global_step": 36000, "epoch": 302, "lr": 4.988700910510306e-05} +{"train_loss": 0.0030099309515208006, "global_step": 36001, "epoch": 302, "lr": 4.9884793601243e-05} +{"train_loss": 0.002688248408958316, "global_step": 36002, "epoch": 302, "lr": 4.988257809760915e-05} +{"train_loss": 0.0023374627344310284, "global_step": 36003, "epoch": 302, "lr": 4.9880362594205824e-05} +{"train_loss": 0.0020348327234387398, "global_step": 36004, "epoch": 302, "lr": 4.987814709103742e-05} +{"train_loss": 0.00200301269069314, "global_step": 36005, "epoch": 302, "lr": 4.987593158810823e-05} +{"train_loss": 0.0025248853489756584, "global_step": 36006, "epoch": 302, "lr": 4.987371608542267e-05} +{"train_loss": 0.0021703706588596106, "global_step": 36007, "epoch": 302, "lr": 4.9871500582985034e-05} +{"train_loss": 0.003669144120067358, "global_step": 36008, "epoch": 302, "lr": 4.986928508079969e-05} +{"train_loss": 0.0043145837262272835, "global_step": 36009, "epoch": 302, "lr": 4.9867069578871e-05} +{"train_loss": 0.002602766267955303, "global_step": 36010, "epoch": 302, "lr": 4.986485407720329e-05} +{"train_loss": 0.004236185923218727, "global_step": 36011, "epoch": 302, "lr": 4.9862638575800946e-05} +{"train_loss": 0.0014686438953503966, "global_step": 36012, "epoch": 302, "lr": 4.9860423074668296e-05} +{"train_loss": 0.002705433638766408, "global_step": 36013, "epoch": 302, "lr": 4.9858207573809665e-05} +{"train_loss": 0.0023889681324362755, "global_step": 36014, "epoch": 302, "lr": 4.985599207322946e-05} +{"train_loss": 0.0023947476875036955, "global_step": 36015, "epoch": 302, "lr": 4.985377657293197e-05} +{"train_loss": 0.003982430789619684, "global_step": 36016, "epoch": 302, "lr": 4.98515610729216e-05} +{"train_loss": 0.0017570933559909463, "global_step": 36017, "epoch": 302, "lr": 4.984934557320265e-05} +{"train_loss": 0.0019598212093114853, "global_step": 36018, "epoch": 302, "lr": 4.984713007377951e-05} +{"train_loss": 0.001857462339103222, "global_step": 36019, "epoch": 302, "lr": 4.984491457465652e-05} +{"train_loss": 0.0022479684557765722, "global_step": 36020, "epoch": 302, "lr": 4.9842699075838e-05} +{"train_loss": 0.0022519954945892096, "global_step": 36021, "epoch": 302, "lr": 4.984048357732835e-05} +{"train_loss": 0.0016234525246545672, "global_step": 36022, "epoch": 302, "lr": 4.9838268079131864e-05} +{"train_loss": 0.0032174817752093077, "global_step": 36023, "epoch": 302, "lr": 4.983605258125294e-05} +{"train_loss": 0.0022859126329421997, "global_step": 36024, "epoch": 302, "lr": 4.983383708369591e-05} +{"train_loss": 0.001897356123663485, "global_step": 36025, "epoch": 302, "lr": 4.983162158646511e-05} +{"train_loss": 0.003601063508540392, "global_step": 36026, "epoch": 302, "lr": 4.982940608956492e-05} +{"train_loss": 0.0015119266463443637, "global_step": 36027, "epoch": 302, "lr": 4.982719059299966e-05} +{"train_loss": 0.0023632978554815054, "global_step": 36028, "epoch": 302, "lr": 4.982497509677371e-05} +{"train_loss": 0.003103759838268161, "global_step": 36029, "epoch": 302, "lr": 4.9822759600891374e-05} +{"train_loss": 0.002084208419546485, "global_step": 36030, "epoch": 302, "lr": 4.982054410535706e-05} +{"train_loss": 0.001109729870222509, "global_step": 36031, "epoch": 302, "lr": 4.9818328610175085e-05} +{"train_loss": 0.0035270480439066887, "global_step": 36032, "epoch": 302, "lr": 4.981611311534978e-05} +{"train_loss": 0.0017243546899408102, "global_step": 36033, "epoch": 302, "lr": 4.9813897620885544e-05} +{"train_loss": 0.0025408188812434673, "global_step": 36034, "epoch": 302, "lr": 4.981168212678668e-05} +{"train_loss": 0.0033406023867428303, "global_step": 36035, "epoch": 302, "lr": 4.980946663305757e-05} +{"train_loss": 0.002151038497686386, "global_step": 36036, "epoch": 302, "lr": 4.980725113970253e-05} +{"train_loss": 0.0013742835726588964, "global_step": 36037, "epoch": 302, "lr": 4.980503564672596e-05} +{"train_loss": 0.0017577969701960683, "global_step": 36038, "epoch": 302, "lr": 4.980282015413217e-05} +{"train_loss": 0.0029527891892939806, "global_step": 36039, "epoch": 302, "lr": 4.980060466192552e-05} +{"train_loss": 0.0029210809152573347, "global_step": 36040, "epoch": 302, "lr": 4.979838917011036e-05} +{"train_loss": 0.003035586792975664, "global_step": 36041, "epoch": 302, "lr": 4.9796173678691047e-05} +{"train_loss": 0.0030177098233252764, "global_step": 36042, "epoch": 302, "lr": 4.979395818767192e-05} +{"train_loss": 0.004682091064751148, "global_step": 36043, "epoch": 302, "lr": 4.979174269705735e-05} +{"train_loss": 0.00267957616597414, "global_step": 36044, "epoch": 302, "lr": 4.978952720685164e-05} +{"train_loss": 0.0015400891425088048, "global_step": 36045, "epoch": 302, "lr": 4.9787311717059204e-05} +{"train_loss": 0.0025435849092900753, "global_step": 36046, "epoch": 302, "lr": 4.978509622768433e-05} +{"train_loss": 0.001975899562239647, "global_step": 36047, "epoch": 302, "lr": 4.9782880738731416e-05} +{"train_loss": 0.0011384716490283608, "global_step": 36048, "epoch": 302, "lr": 4.978066525020478e-05} +{"train_loss": 0.0057580964639782906, "global_step": 36049, "epoch": 302, "lr": 4.97784497621088e-05} +{"train_loss": 0.0026763868518173695, "global_step": 36050, "epoch": 302, "lr": 4.9776234274447815e-05} +{"train_loss": 0.0013555445475503802, "global_step": 36051, "epoch": 302, "lr": 4.977401878722614e-05} +{"train_loss": 0.0033282586373388767, "global_step": 36052, "epoch": 302, "lr": 4.977180330044818e-05} +{"train_loss": 0.002259067492559552, "global_step": 36053, "epoch": 302, "lr": 4.976958781411824e-05} +{"train_loss": 0.0020238712895661592, "global_step": 36054, "epoch": 302, "lr": 4.9767372328240714e-05} +{"train_loss": 0.0025764084421098232, "global_step": 36055, "epoch": 302, "lr": 4.9765156842819896e-05} +{"train_loss": 0.002456361332031734, "global_step": 36056, "epoch": 302, "lr": 4.97629413578602e-05, "val_loss": 0.028761040419340134} +{"train_loss": 0.0017472372855991125, "global_step": 36057, "epoch": 303, "lr": 4.976072587336593e-05} +{"train_loss": 0.002422390040010214, "global_step": 36058, "epoch": 303, "lr": 4.9758510389341434e-05} +{"train_loss": 0.00404183566570282, "global_step": 36059, "epoch": 303, "lr": 4.97562949057911e-05} +{"train_loss": 0.003364497097209096, "global_step": 36060, "epoch": 303, "lr": 4.9754079422719234e-05} +{"train_loss": 0.0029887782875448465, "global_step": 36061, "epoch": 303, "lr": 4.975186394013023e-05} +{"train_loss": 0.002216267166659236, "global_step": 36062, "epoch": 303, "lr": 4.974964845802841e-05} +{"train_loss": 0.0015029811765998602, "global_step": 36063, "epoch": 303, "lr": 4.974743297641811e-05} +{"train_loss": 0.0020336750894784927, "global_step": 36064, "epoch": 303, "lr": 4.974521749530373e-05} +{"train_loss": 0.0027748150750994682, "global_step": 36065, "epoch": 303, "lr": 4.974300201468955e-05} +{"train_loss": 0.004627901595085859, "global_step": 36066, "epoch": 303, "lr": 4.974078653457999e-05} +{"train_loss": 0.0036320947110652924, "global_step": 36067, "epoch": 303, "lr": 4.9738571054979336e-05} +{"train_loss": 0.001741797081194818, "global_step": 36068, "epoch": 303, "lr": 4.9736355575892e-05} +{"train_loss": 0.0048810685984790325, "global_step": 36069, "epoch": 303, "lr": 4.97341400973223e-05} +{"train_loss": 0.0029947860166430473, "global_step": 36070, "epoch": 303, "lr": 4.9731924619274566e-05} +{"train_loss": 0.0026734613347798586, "global_step": 36071, "epoch": 303, "lr": 4.9729709141753183e-05} +{"train_loss": 0.0036475248634815216, "global_step": 36072, "epoch": 303, "lr": 4.9727493664762484e-05} +{"train_loss": 0.002186845988035202, "global_step": 36073, "epoch": 303, "lr": 4.9725278188306825e-05} +{"train_loss": 0.004407402593642473, "global_step": 36074, "epoch": 303, "lr": 4.972306271239054e-05} +{"train_loss": 0.0032997133675962687, "global_step": 36075, "epoch": 303, "lr": 4.972084723701801e-05} +{"train_loss": 0.0032316423021256924, "global_step": 36076, "epoch": 303, "lr": 4.9718631762193565e-05} +{"train_loss": 0.002339850412681699, "global_step": 36077, "epoch": 303, "lr": 4.971641628792154e-05} +{"train_loss": 0.002940839622169733, "global_step": 36078, "epoch": 303, "lr": 4.971420081420633e-05} +{"train_loss": 0.002532174112275243, "global_step": 36079, "epoch": 303, "lr": 4.971198534105222e-05} +{"train_loss": 0.004441023804247379, "global_step": 36080, "epoch": 303, "lr": 4.9709769868463624e-05} +{"train_loss": 0.0043306476436555386, "global_step": 36081, "epoch": 303, "lr": 4.9707554396444866e-05} +{"train_loss": 0.0017837408231571317, "global_step": 36082, "epoch": 303, "lr": 4.9705338925000274e-05} +{"train_loss": 0.0032573339994996786, "global_step": 36083, "epoch": 303, "lr": 4.970312345413423e-05} +{"train_loss": 0.0025621585082262754, "global_step": 36084, "epoch": 303, "lr": 4.970090798385106e-05} +{"train_loss": 0.0046065812930464745, "global_step": 36085, "epoch": 303, "lr": 4.969869251415514e-05} +{"train_loss": 0.003671756014227867, "global_step": 36086, "epoch": 303, "lr": 4.969647704505079e-05} +{"train_loss": 0.002513900399208069, "global_step": 36087, "epoch": 303, "lr": 4.969426157654239e-05} +{"train_loss": 0.003798999357968569, "global_step": 36088, "epoch": 303, "lr": 4.969204610863426e-05} +{"train_loss": 0.00243283249437809, "global_step": 36089, "epoch": 303, "lr": 4.9689830641330774e-05} +{"train_loss": 0.0024328846484422684, "global_step": 36090, "epoch": 303, "lr": 4.968761517463627e-05} +{"train_loss": 0.0021581612527370453, "global_step": 36091, "epoch": 303, "lr": 4.9685399708555096e-05} +{"train_loss": 0.0038832668215036392, "global_step": 36092, "epoch": 303, "lr": 4.9683184243091614e-05} +{"train_loss": 0.0027747834101319313, "global_step": 36093, "epoch": 303, "lr": 4.9680968778250145e-05} +{"train_loss": 0.005379574839025736, "global_step": 36094, "epoch": 303, "lr": 4.9678753314035094e-05} +{"train_loss": 0.0019048667745664716, "global_step": 36095, "epoch": 303, "lr": 4.9676537850450765e-05} +{"train_loss": 0.00175300776027143, "global_step": 36096, "epoch": 303, "lr": 4.967432238750151e-05} +{"train_loss": 0.003354616928845644, "global_step": 36097, "epoch": 303, "lr": 4.96721069251917e-05} +{"train_loss": 0.0023939264938235283, "global_step": 36098, "epoch": 303, "lr": 4.966989146352565e-05} +{"train_loss": 0.003935317043215036, "global_step": 36099, "epoch": 303, "lr": 4.966767600250776e-05} +{"train_loss": 0.002729665255174041, "global_step": 36100, "epoch": 303, "lr": 4.9665460542142345e-05} +{"train_loss": 0.0017363490769639611, "global_step": 36101, "epoch": 303, "lr": 4.966324508243375e-05} +{"train_loss": 0.002622624160721898, "global_step": 36102, "epoch": 303, "lr": 4.966102962338635e-05} +{"train_loss": 0.003309813095256686, "global_step": 36103, "epoch": 303, "lr": 4.965881416500447e-05} +{"train_loss": 0.003125672461465001, "global_step": 36104, "epoch": 303, "lr": 4.965659870729249e-05} +{"train_loss": 0.0032880580984055996, "global_step": 36105, "epoch": 303, "lr": 4.9654383250254716e-05} +{"train_loss": 0.0038974329363554716, "global_step": 36106, "epoch": 303, "lr": 4.9652167793895537e-05} +{"train_loss": 0.0020995517261326313, "global_step": 36107, "epoch": 303, "lr": 4.96499523382193e-05} +{"train_loss": 0.002007963601499796, "global_step": 36108, "epoch": 303, "lr": 4.9647736883230325e-05} +{"train_loss": 0.002382917795330286, "global_step": 36109, "epoch": 303, "lr": 4.9645521428933e-05} +{"train_loss": 0.00246588047593832, "global_step": 36110, "epoch": 303, "lr": 4.964330597533164e-05} +{"train_loss": 0.003958366811275482, "global_step": 36111, "epoch": 303, "lr": 4.9641090522430624e-05} +{"train_loss": 0.0017342105275020003, "global_step": 36112, "epoch": 303, "lr": 4.963887507023429e-05} +{"train_loss": 0.0025062758941203356, "global_step": 36113, "epoch": 303, "lr": 4.963665961874697e-05} +{"train_loss": 0.00392888905480504, "global_step": 36114, "epoch": 303, "lr": 4.963444416797305e-05} +{"train_loss": 0.0017561394488438964, "global_step": 36115, "epoch": 303, "lr": 4.9632228717916834e-05} +{"train_loss": 0.002426762133836746, "global_step": 36116, "epoch": 303, "lr": 4.963001326858272e-05} +{"train_loss": 0.0024830305483192205, "global_step": 36117, "epoch": 303, "lr": 4.962779781997502e-05} +{"train_loss": 0.002129257656633854, "global_step": 36118, "epoch": 303, "lr": 4.962558237209811e-05} +{"train_loss": 0.003012514440342784, "global_step": 36119, "epoch": 303, "lr": 4.9623366924956336e-05} +{"train_loss": 0.0030096066184341908, "global_step": 36120, "epoch": 303, "lr": 4.962115147855402e-05} +{"train_loss": 0.0029435507021844387, "global_step": 36121, "epoch": 303, "lr": 4.961893603289554e-05} +{"train_loss": 0.0022875305730849504, "global_step": 36122, "epoch": 303, "lr": 4.9616720587985244e-05} +{"train_loss": 0.0018881672294810414, "global_step": 36123, "epoch": 303, "lr": 4.961450514382747e-05} +{"train_loss": 0.0030068422202020884, "global_step": 36124, "epoch": 303, "lr": 4.9612289700426576e-05} +{"train_loss": 0.004126705229282379, "global_step": 36125, "epoch": 303, "lr": 4.961007425778691e-05} +{"train_loss": 0.002395785879343748, "global_step": 36126, "epoch": 303, "lr": 4.9607858815912836e-05} +{"train_loss": 0.0020503951236605644, "global_step": 36127, "epoch": 303, "lr": 4.9605643374808666e-05} +{"train_loss": 0.0032261169981211424, "global_step": 36128, "epoch": 303, "lr": 4.960342793447879e-05} +{"train_loss": 0.0027034501545131207, "global_step": 36129, "epoch": 303, "lr": 4.9601212494927526e-05} +{"train_loss": 0.003035446861758828, "global_step": 36130, "epoch": 303, "lr": 4.959899705615925e-05} +{"train_loss": 0.0021438770927488804, "global_step": 36131, "epoch": 303, "lr": 4.959678161817831e-05} +{"train_loss": 0.0036812222097069025, "global_step": 36132, "epoch": 303, "lr": 4.959456618098902e-05} +{"train_loss": 0.002925136359408498, "global_step": 36133, "epoch": 303, "lr": 4.959235074459578e-05} +{"train_loss": 0.0020937034860253334, "global_step": 36134, "epoch": 303, "lr": 4.959013530900289e-05} +{"train_loss": 0.00341884046792984, "global_step": 36135, "epoch": 303, "lr": 4.9587919874214755e-05} +{"train_loss": 0.0019269735785201192, "global_step": 36136, "epoch": 303, "lr": 4.958570444023567e-05} +{"train_loss": 0.0023779578041285276, "global_step": 36137, "epoch": 303, "lr": 4.958348900707003e-05} +{"train_loss": 0.003914395347237587, "global_step": 36138, "epoch": 303, "lr": 4.958127357472215e-05} +{"train_loss": 0.0023918473161756992, "global_step": 36139, "epoch": 303, "lr": 4.957905814319641e-05} +{"train_loss": 0.0021460417192429304, "global_step": 36140, "epoch": 303, "lr": 4.957684271249713e-05} +{"train_loss": 0.0019983965903520584, "global_step": 36141, "epoch": 303, "lr": 4.957462728262867e-05} +{"train_loss": 0.0022826166823506355, "global_step": 36142, "epoch": 303, "lr": 4.9572411853595396e-05} +{"train_loss": 0.0024775646161288023, "global_step": 36143, "epoch": 303, "lr": 4.9570196425401634e-05} +{"train_loss": 0.002442737342789769, "global_step": 36144, "epoch": 303, "lr": 4.956798099805176e-05} +{"train_loss": 0.0036481251008808613, "global_step": 36145, "epoch": 303, "lr": 4.9565765571550114e-05} +{"train_loss": 0.0036038330290466547, "global_step": 36146, "epoch": 303, "lr": 4.9563550145901016e-05} +{"train_loss": 0.0028985529206693172, "global_step": 36147, "epoch": 303, "lr": 4.9561334721108864e-05} +{"train_loss": 0.002751145279034972, "global_step": 36148, "epoch": 303, "lr": 4.955911929717796e-05} +{"train_loss": 0.0024195180740207434, "global_step": 36149, "epoch": 303, "lr": 4.955690387411271e-05} +{"train_loss": 0.0024340152740478516, "global_step": 36150, "epoch": 303, "lr": 4.955468845191742e-05} +{"train_loss": 0.0030406401492655277, "global_step": 36151, "epoch": 303, "lr": 4.955247303059643e-05} +{"train_loss": 0.002186698140576482, "global_step": 36152, "epoch": 303, "lr": 4.955025761015414e-05} +{"train_loss": 0.0013846891233697534, "global_step": 36153, "epoch": 303, "lr": 4.954804219059485e-05} +{"train_loss": 0.002710866741836071, "global_step": 36154, "epoch": 303, "lr": 4.954582677192295e-05} +{"train_loss": 0.002914592856541276, "global_step": 36155, "epoch": 303, "lr": 4.954361135414275e-05} +{"train_loss": 0.0034724059514701366, "global_step": 36156, "epoch": 303, "lr": 4.954139593725863e-05} +{"train_loss": 0.0020455252379179, "global_step": 36157, "epoch": 303, "lr": 4.953918052127494e-05} +{"train_loss": 0.0036184382624924183, "global_step": 36158, "epoch": 303, "lr": 4.9536965106196005e-05} +{"train_loss": 0.0018506122287362814, "global_step": 36159, "epoch": 303, "lr": 4.95347496920262e-05} +{"train_loss": 0.002394285751506686, "global_step": 36160, "epoch": 303, "lr": 4.9532534278769846e-05} +{"train_loss": 0.002795363776385784, "global_step": 36161, "epoch": 303, "lr": 4.953031886643134e-05} +{"train_loss": 0.004219914320856333, "global_step": 36162, "epoch": 303, "lr": 4.952810345501497e-05} +{"train_loss": 0.0013492872240021825, "global_step": 36163, "epoch": 303, "lr": 4.952588804452515e-05} +{"train_loss": 0.0017936879303306341, "global_step": 36164, "epoch": 303, "lr": 4.952367263496619e-05} +{"train_loss": 0.0026932689361274242, "global_step": 36165, "epoch": 303, "lr": 4.9521457226342436e-05} +{"train_loss": 0.0013005962828174233, "global_step": 36166, "epoch": 303, "lr": 4.951924181865826e-05} +{"train_loss": 0.0027603893540799618, "global_step": 36167, "epoch": 303, "lr": 4.951702641191799e-05} +{"train_loss": 0.00356359058059752, "global_step": 36168, "epoch": 303, "lr": 4.9514811006126006e-05} +{"train_loss": 0.0010326781775802374, "global_step": 36169, "epoch": 303, "lr": 4.951259560128662e-05} +{"train_loss": 0.0015522029716521502, "global_step": 36170, "epoch": 303, "lr": 4.951038019740421e-05} +{"train_loss": 0.00358555163256824, "global_step": 36171, "epoch": 303, "lr": 4.950816479448311e-05} +{"train_loss": 0.0024109145160764456, "global_step": 36172, "epoch": 303, "lr": 4.9505949392527676e-05} +{"train_loss": 0.002045150613412261, "global_step": 36173, "epoch": 303, "lr": 4.950373399154226e-05} +{"train_loss": 0.0028839048463851213, "global_step": 36174, "epoch": 303, "lr": 4.950151859153121e-05} +{"train_loss": 0.002788864986916237, "global_step": 36175, "epoch": 303, "lr": 4.949930319249887e-05, "val_loss": 0.02053392119705677} +{"train_loss": 0.002749483799561858, "global_step": 36176, "epoch": 304, "lr": 4.949708779444961e-05} +{"train_loss": 0.001953922910615802, "global_step": 36177, "epoch": 304, "lr": 4.9494872397387746e-05} +{"train_loss": 0.0019782097078859806, "global_step": 36178, "epoch": 304, "lr": 4.949265700131767e-05} +{"train_loss": 0.001474545570090413, "global_step": 36179, "epoch": 304, "lr": 4.9490441606243674e-05} +{"train_loss": 0.002503172727301717, "global_step": 36180, "epoch": 304, "lr": 4.9488226212170175e-05} +{"train_loss": 0.0028326837345957756, "global_step": 36181, "epoch": 304, "lr": 4.948601081910148e-05} +{"train_loss": 0.0016409538220614195, "global_step": 36182, "epoch": 304, "lr": 4.948379542704193e-05} +{"train_loss": 0.001188793801702559, "global_step": 36183, "epoch": 304, "lr": 4.9481580035995915e-05} +{"train_loss": 0.0021812710911035538, "global_step": 36184, "epoch": 304, "lr": 4.947936464596774e-05} +{"train_loss": 0.002177631016820669, "global_step": 36185, "epoch": 304, "lr": 4.94771492569618e-05} +{"train_loss": 0.001902684336528182, "global_step": 36186, "epoch": 304, "lr": 4.947493386898239e-05} +{"train_loss": 0.0025013803970068693, "global_step": 36187, "epoch": 304, "lr": 4.947271848203393e-05} +{"train_loss": 0.0016723738517612219, "global_step": 36188, "epoch": 304, "lr": 4.9470503096120704e-05} +{"train_loss": 0.0014358385233208537, "global_step": 36189, "epoch": 304, "lr": 4.9468287711247094e-05} +{"train_loss": 0.0013096702750772238, "global_step": 36190, "epoch": 304, "lr": 4.946607232741745e-05} +{"train_loss": 0.0024546512868255377, "global_step": 36191, "epoch": 304, "lr": 4.94638569446361e-05} +{"train_loss": 0.0019624445121735334, "global_step": 36192, "epoch": 304, "lr": 4.9461641562907434e-05} +{"train_loss": 0.0018948984798043966, "global_step": 36193, "epoch": 304, "lr": 4.945942618223575e-05} +{"train_loss": 0.0027853448409587145, "global_step": 36194, "epoch": 304, "lr": 4.9457210802625455e-05} +{"train_loss": 0.0019749198108911514, "global_step": 36195, "epoch": 304, "lr": 4.945499542408086e-05} +{"train_loss": 0.0023908549919724464, "global_step": 36196, "epoch": 304, "lr": 4.945278004660631e-05} +{"train_loss": 0.0020601521246135235, "global_step": 36197, "epoch": 304, "lr": 4.9450564670206185e-05} +{"train_loss": 0.002451519016176462, "global_step": 36198, "epoch": 304, "lr": 4.9448349294884796e-05} +{"train_loss": 0.0013787008356302977, "global_step": 36199, "epoch": 304, "lr": 4.944613392064653e-05} +{"train_loss": 0.0021192922722548246, "global_step": 36200, "epoch": 304, "lr": 4.944391854749573e-05} +{"train_loss": 0.001982215093448758, "global_step": 36201, "epoch": 304, "lr": 4.944170317543671e-05} +{"train_loss": 0.0012226541293784976, "global_step": 36202, "epoch": 304, "lr": 4.943948780447387e-05} +{"train_loss": 0.0019487326499074697, "global_step": 36203, "epoch": 304, "lr": 4.943727243461151e-05} +{"train_loss": 0.0016299497801810503, "global_step": 36204, "epoch": 304, "lr": 4.9435057065854026e-05} +{"train_loss": 0.0012706387788057327, "global_step": 36205, "epoch": 304, "lr": 4.943284169820574e-05} +{"train_loss": 0.0013785575283691287, "global_step": 36206, "epoch": 304, "lr": 4.943062633167101e-05} +{"train_loss": 0.004245865624397993, "global_step": 36207, "epoch": 304, "lr": 4.942841096625419e-05} +{"train_loss": 0.0023801131173968315, "global_step": 36208, "epoch": 304, "lr": 4.9426195601959615e-05} +{"train_loss": 0.0025114447344094515, "global_step": 36209, "epoch": 304, "lr": 4.942398023879166e-05} +{"train_loss": 0.0020095310173928738, "global_step": 36210, "epoch": 304, "lr": 4.9421764876754625e-05} +{"train_loss": 0.0018834223737940192, "global_step": 36211, "epoch": 304, "lr": 4.941954951585293e-05} +{"train_loss": 0.0021083273459225893, "global_step": 36212, "epoch": 304, "lr": 4.9417334156090864e-05} +{"train_loss": 0.002011865144595504, "global_step": 36213, "epoch": 304, "lr": 4.9415118797472816e-05} +{"train_loss": 0.0011769324773922563, "global_step": 36214, "epoch": 304, "lr": 4.9412903440003113e-05} +{"train_loss": 0.002054032636806369, "global_step": 36215, "epoch": 304, "lr": 4.94106880836861e-05} +{"train_loss": 0.0020742022898048162, "global_step": 36216, "epoch": 304, "lr": 4.940847272852616e-05} +{"train_loss": 0.00196373020298779, "global_step": 36217, "epoch": 304, "lr": 4.9406257374527595e-05} +{"train_loss": 0.0012085170019418001, "global_step": 36218, "epoch": 304, "lr": 4.940404202169481e-05} +{"train_loss": 0.0017999523552134633, "global_step": 36219, "epoch": 304, "lr": 4.94018266700321e-05} +{"train_loss": 0.001702506560832262, "global_step": 36220, "epoch": 304, "lr": 4.939961131954385e-05} +{"train_loss": 0.003439611289650202, "global_step": 36221, "epoch": 304, "lr": 4.939739597023439e-05} +{"train_loss": 0.001361642382107675, "global_step": 36222, "epoch": 304, "lr": 4.939518062210809e-05} +{"train_loss": 0.0024374977219849825, "global_step": 36223, "epoch": 304, "lr": 4.939296527516928e-05} +{"train_loss": 0.0019500594353303313, "global_step": 36224, "epoch": 304, "lr": 4.939074992942232e-05} +{"train_loss": 0.0012954722624272108, "global_step": 36225, "epoch": 304, "lr": 4.938853458487156e-05} +{"train_loss": 0.003931168466806412, "global_step": 36226, "epoch": 304, "lr": 4.938631924152136e-05} +{"train_loss": 0.0012871426297351718, "global_step": 36227, "epoch": 304, "lr": 4.938410389937603e-05} +{"train_loss": 0.0023482751566916704, "global_step": 36228, "epoch": 304, "lr": 4.938188855843996e-05} +{"train_loss": 0.0015804042341187596, "global_step": 36229, "epoch": 304, "lr": 4.937967321871748e-05} +{"train_loss": 0.002219078131020069, "global_step": 36230, "epoch": 304, "lr": 4.937745788021296e-05} +{"train_loss": 0.002417173935100436, "global_step": 36231, "epoch": 304, "lr": 4.9375242542930734e-05} +{"train_loss": 0.0015784037532284856, "global_step": 36232, "epoch": 304, "lr": 4.9373027206875136e-05} +{"train_loss": 0.0016889258986338973, "global_step": 36233, "epoch": 304, "lr": 4.937081187205054e-05} +{"train_loss": 0.0010135264601558447, "global_step": 36234, "epoch": 304, "lr": 4.936859653846128e-05} +{"train_loss": 0.0012570623075589538, "global_step": 36235, "epoch": 304, "lr": 4.936638120611173e-05} +{"train_loss": 0.004001813009381294, "global_step": 36236, "epoch": 304, "lr": 4.9364165875006205e-05} +{"train_loss": 0.002024630084633827, "global_step": 36237, "epoch": 304, "lr": 4.9361950545149086e-05} +{"train_loss": 0.0024221157655119896, "global_step": 36238, "epoch": 304, "lr": 4.93597352165447e-05} +{"train_loss": 0.0013871771516278386, "global_step": 36239, "epoch": 304, "lr": 4.93575198891974e-05} +{"train_loss": 0.0018867016769945621, "global_step": 36240, "epoch": 304, "lr": 4.935530456311156e-05} +{"train_loss": 0.001492121140472591, "global_step": 36241, "epoch": 304, "lr": 4.9353089238291486e-05} +{"train_loss": 0.0013908382970839739, "global_step": 36242, "epoch": 304, "lr": 4.935087391474158e-05} +{"train_loss": 0.0023530160542577505, "global_step": 36243, "epoch": 304, "lr": 4.934865859246614e-05} +{"train_loss": 0.001399736269377172, "global_step": 36244, "epoch": 304, "lr": 4.934644327146956e-05} +{"train_loss": 0.001722637563943863, "global_step": 36245, "epoch": 304, "lr": 4.9344227951756165e-05} +{"train_loss": 0.0026132853236049414, "global_step": 36246, "epoch": 304, "lr": 4.934201263333029e-05} +{"train_loss": 0.0015788638265803456, "global_step": 36247, "epoch": 304, "lr": 4.933979731619633e-05} +{"train_loss": 0.0019941050559282303, "global_step": 36248, "epoch": 304, "lr": 4.933758200035858e-05} +{"train_loss": 0.002018118044361472, "global_step": 36249, "epoch": 304, "lr": 4.933536668582144e-05} +{"train_loss": 0.0020972415804862976, "global_step": 36250, "epoch": 304, "lr": 4.933315137258923e-05} +{"train_loss": 0.0020109470933675766, "global_step": 36251, "epoch": 304, "lr": 4.933093606066629e-05} +{"train_loss": 0.0019380804151296616, "global_step": 36252, "epoch": 304, "lr": 4.9328720750057015e-05} +{"train_loss": 0.001943620853126049, "global_step": 36253, "epoch": 304, "lr": 4.932650544076569e-05} +{"train_loss": 0.0034683411940932274, "global_step": 36254, "epoch": 304, "lr": 4.932429013279671e-05} +{"train_loss": 0.002525710267946124, "global_step": 36255, "epoch": 304, "lr": 4.932207482615442e-05} +{"train_loss": 0.0015290408628061414, "global_step": 36256, "epoch": 304, "lr": 4.931985952084317e-05} +{"train_loss": 0.002794772619381547, "global_step": 36257, "epoch": 304, "lr": 4.9317644216867306e-05} +{"train_loss": 0.0040629226714372635, "global_step": 36258, "epoch": 304, "lr": 4.9315428914231156e-05} +{"train_loss": 0.0034016829449683428, "global_step": 36259, "epoch": 304, "lr": 4.9313213612939105e-05} +{"train_loss": 0.0026278456207364798, "global_step": 36260, "epoch": 304, "lr": 4.931099831299547e-05} +{"train_loss": 0.003197761019691825, "global_step": 36261, "epoch": 304, "lr": 4.9308783014404634e-05} +{"train_loss": 0.0028083554934710264, "global_step": 36262, "epoch": 304, "lr": 4.9306567717170914e-05} +{"train_loss": 0.0019561664666980505, "global_step": 36263, "epoch": 304, "lr": 4.930435242129869e-05} +{"train_loss": 0.0016343421302735806, "global_step": 36264, "epoch": 304, "lr": 4.93021371267923e-05} +{"train_loss": 0.0024234966840595007, "global_step": 36265, "epoch": 304, "lr": 4.929992183365606e-05} +{"train_loss": 0.0022882716730237007, "global_step": 36266, "epoch": 304, "lr": 4.929770654189437e-05} +{"train_loss": 0.0019574579782783985, "global_step": 36267, "epoch": 304, "lr": 4.9295491251511544e-05} +{"train_loss": 0.002715473063290119, "global_step": 36268, "epoch": 304, "lr": 4.929327596251197e-05} +{"train_loss": 0.004555439576506615, "global_step": 36269, "epoch": 304, "lr": 4.929106067489995e-05} +{"train_loss": 0.001903143129311502, "global_step": 36270, "epoch": 304, "lr": 4.928884538867986e-05} +{"train_loss": 0.0033468010369688272, "global_step": 36271, "epoch": 304, "lr": 4.928663010385605e-05} +{"train_loss": 0.002139536663889885, "global_step": 36272, "epoch": 304, "lr": 4.9284414820432864e-05} +{"train_loss": 0.0022282449062913656, "global_step": 36273, "epoch": 304, "lr": 4.928219953841466e-05} +{"train_loss": 0.0017491747858002782, "global_step": 36274, "epoch": 304, "lr": 4.927998425780576e-05} +{"train_loss": 0.0015619733603671193, "global_step": 36275, "epoch": 304, "lr": 4.927776897861056e-05} +{"train_loss": 0.004602409899234772, "global_step": 36276, "epoch": 304, "lr": 4.9275553700833385e-05} +{"train_loss": 0.0018765414133667946, "global_step": 36277, "epoch": 304, "lr": 4.927333842447855e-05} +{"train_loss": 0.001610508537851274, "global_step": 36278, "epoch": 304, "lr": 4.9271123149550476e-05} +{"train_loss": 0.001689206575974822, "global_step": 36279, "epoch": 304, "lr": 4.9268907876053446e-05} +{"train_loss": 0.002252985490486026, "global_step": 36280, "epoch": 304, "lr": 4.926669260399185e-05} +{"train_loss": 0.00303631741553545, "global_step": 36281, "epoch": 304, "lr": 4.9264477333370016e-05} +{"train_loss": 0.0026921636890619993, "global_step": 36282, "epoch": 304, "lr": 4.926226206419232e-05} +{"train_loss": 0.0037586658727377653, "global_step": 36283, "epoch": 304, "lr": 4.9260046796463087e-05} +{"train_loss": 0.0018952247919514775, "global_step": 36284, "epoch": 304, "lr": 4.925783153018665e-05} +{"train_loss": 0.0034807513002306223, "global_step": 36285, "epoch": 304, "lr": 4.925561626536741e-05} +{"train_loss": 0.001563945203088224, "global_step": 36286, "epoch": 304, "lr": 4.925340100200967e-05} +{"train_loss": 0.0018390030600130558, "global_step": 36287, "epoch": 304, "lr": 4.925118574011782e-05} +{"train_loss": 0.004033992532640696, "global_step": 36288, "epoch": 304, "lr": 4.9248970479696164e-05} +{"train_loss": 0.0015060331206768751, "global_step": 36289, "epoch": 304, "lr": 4.9246755220749066e-05} +{"train_loss": 0.0029638195410370827, "global_step": 36290, "epoch": 304, "lr": 4.9244539963280914e-05} +{"train_loss": 0.002528971992433071, "global_step": 36291, "epoch": 304, "lr": 4.9242324707296e-05} +{"train_loss": 0.0033645061776041985, "global_step": 36292, "epoch": 304, "lr": 4.924010945279872e-05} +{"train_loss": 0.002532039536163211, "global_step": 36293, "epoch": 304, "lr": 4.923789419979339e-05} +{"train_loss": 0.0021977507648206934, "global_step": 36294, "epoch": 304, "lr": 4.9235678948284386e-05, "val_loss": 0.021633010357618332} +{"train_loss": 0.0016598773654550314, "global_step": 36295, "epoch": 305, "lr": 4.923346369827605e-05} +{"train_loss": 0.0038769450038671494, "global_step": 36296, "epoch": 305, "lr": 4.92312484497727e-05} +{"train_loss": 0.0013538056518882513, "global_step": 36297, "epoch": 305, "lr": 4.922903320277874e-05} +{"train_loss": 0.003776346566155553, "global_step": 36298, "epoch": 305, "lr": 4.9226817957298464e-05} +{"train_loss": 0.0027507164049893618, "global_step": 36299, "epoch": 305, "lr": 4.922460271333627e-05} +{"train_loss": 0.002070431364700198, "global_step": 36300, "epoch": 305, "lr": 4.9222387470896484e-05} +{"train_loss": 0.0028455695137381554, "global_step": 36301, "epoch": 305, "lr": 4.922017222998344e-05} +{"train_loss": 0.00191611354239285, "global_step": 36302, "epoch": 305, "lr": 4.921795699060152e-05} +{"train_loss": 0.0023994569201022387, "global_step": 36303, "epoch": 305, "lr": 4.921574175275505e-05} +{"train_loss": 0.0013038881588727236, "global_step": 36304, "epoch": 305, "lr": 4.9213526516448385e-05} +{"train_loss": 0.0020739659667015076, "global_step": 36305, "epoch": 305, "lr": 4.9211311281685886e-05} +{"train_loss": 0.0022971732541918755, "global_step": 36306, "epoch": 305, "lr": 4.9209096048471886e-05} +{"train_loss": 0.0016528696287423372, "global_step": 36307, "epoch": 305, "lr": 4.9206880816810754e-05} +{"train_loss": 0.0027248382102698088, "global_step": 36308, "epoch": 305, "lr": 4.920466558670681e-05} +{"train_loss": 0.0030280468054115772, "global_step": 36309, "epoch": 305, "lr": 4.920245035816443e-05} +{"train_loss": 0.00247150007635355, "global_step": 36310, "epoch": 305, "lr": 4.920023513118794e-05} +{"train_loss": 0.0018354002386331558, "global_step": 36311, "epoch": 305, "lr": 4.919801990578172e-05} +{"train_loss": 0.0021481080912053585, "global_step": 36312, "epoch": 305, "lr": 4.919580468195009e-05} +{"train_loss": 0.0033571398817002773, "global_step": 36313, "epoch": 305, "lr": 4.9193589459697424e-05} +{"train_loss": 0.001677567488513887, "global_step": 36314, "epoch": 305, "lr": 4.919137423902806e-05} +{"train_loss": 0.003347355406731367, "global_step": 36315, "epoch": 305, "lr": 4.9189159019946326e-05} +{"train_loss": 0.002286304486915469, "global_step": 36316, "epoch": 305, "lr": 4.918694380245662e-05} +{"train_loss": 0.001992868958041072, "global_step": 36317, "epoch": 305, "lr": 4.9184728586563235e-05} +{"train_loss": 0.0014405400725081563, "global_step": 36318, "epoch": 305, "lr": 4.9182513372270575e-05} +{"train_loss": 0.002305482281371951, "global_step": 36319, "epoch": 305, "lr": 4.918029815958294e-05} +{"train_loss": 0.0032894941978156567, "global_step": 36320, "epoch": 305, "lr": 4.917808294850471e-05} +{"train_loss": 0.002797348191961646, "global_step": 36321, "epoch": 305, "lr": 4.9175867739040225e-05} +{"train_loss": 0.002670590067282319, "global_step": 36322, "epoch": 305, "lr": 4.917365253119384e-05} +{"train_loss": 0.001598911825567484, "global_step": 36323, "epoch": 305, "lr": 4.917143732496989e-05} +{"train_loss": 0.0024490950163453817, "global_step": 36324, "epoch": 305, "lr": 4.916922212037273e-05} +{"train_loss": 0.0020469813607633114, "global_step": 36325, "epoch": 305, "lr": 4.916700691740674e-05} +{"train_loss": 0.001255777315236628, "global_step": 36326, "epoch": 305, "lr": 4.9164791716076235e-05} +{"train_loss": 0.0015355241484940052, "global_step": 36327, "epoch": 305, "lr": 4.9162576516385556e-05} +{"train_loss": 0.0022348843049257994, "global_step": 36328, "epoch": 305, "lr": 4.916036131833909e-05} +{"train_loss": 0.002684841165319085, "global_step": 36329, "epoch": 305, "lr": 4.915814612194114e-05} +{"train_loss": 0.002108546905219555, "global_step": 36330, "epoch": 305, "lr": 4.91559309271961e-05} +{"train_loss": 0.003564257640391588, "global_step": 36331, "epoch": 305, "lr": 4.915371573410828e-05} +{"train_loss": 0.003962029702961445, "global_step": 36332, "epoch": 305, "lr": 4.9151500542682075e-05} +{"train_loss": 0.0014778461772948503, "global_step": 36333, "epoch": 305, "lr": 4.9149285352921806e-05} +{"train_loss": 0.0032591905910521746, "global_step": 36334, "epoch": 305, "lr": 4.914707016483179e-05} +{"train_loss": 0.0017248941585421562, "global_step": 36335, "epoch": 305, "lr": 4.914485497841645e-05} +{"train_loss": 0.0031381419394165277, "global_step": 36336, "epoch": 305, "lr": 4.914263979368007e-05} +{"train_loss": 0.0012993112904950976, "global_step": 36337, "epoch": 305, "lr": 4.914042461062703e-05} +{"train_loss": 0.0027433400973677635, "global_step": 36338, "epoch": 305, "lr": 4.913820942926169e-05} +{"train_loss": 0.002249431796371937, "global_step": 36339, "epoch": 305, "lr": 4.913599424958836e-05} +{"train_loss": 0.0020872685126960278, "global_step": 36340, "epoch": 305, "lr": 4.913377907161143e-05} +{"train_loss": 0.0018633344443514943, "global_step": 36341, "epoch": 305, "lr": 4.913156389533522e-05} +{"train_loss": 0.0027513906825333834, "global_step": 36342, "epoch": 305, "lr": 4.912934872076411e-05} +{"train_loss": 0.00232297508046031, "global_step": 36343, "epoch": 305, "lr": 4.9127133547902404e-05} +{"train_loss": 0.004070041701197624, "global_step": 36344, "epoch": 305, "lr": 4.9124918376754506e-05} +{"train_loss": 0.0016861787298694253, "global_step": 36345, "epoch": 305, "lr": 4.9122703207324736e-05} +{"train_loss": 0.0023798923939466476, "global_step": 36346, "epoch": 305, "lr": 4.912048803961742e-05} +{"train_loss": 0.001955257263034582, "global_step": 36347, "epoch": 305, "lr": 4.9118272873636955e-05} +{"train_loss": 0.002596707548946142, "global_step": 36348, "epoch": 305, "lr": 4.9116057709387645e-05} +{"train_loss": 0.003359236055985093, "global_step": 36349, "epoch": 305, "lr": 4.9113842546873885e-05} +{"train_loss": 0.002632859395816922, "global_step": 36350, "epoch": 305, "lr": 4.9111627386099986e-05} +{"train_loss": 0.0028892725240439177, "global_step": 36351, "epoch": 305, "lr": 4.910941222707031e-05} +{"train_loss": 0.0035949202720075846, "global_step": 36352, "epoch": 305, "lr": 4.910719706978922e-05} +{"train_loss": 0.002579685766249895, "global_step": 36353, "epoch": 305, "lr": 4.910498191426104e-05} +{"train_loss": 0.005932034458965063, "global_step": 36354, "epoch": 305, "lr": 4.9102766760490135e-05} +{"train_loss": 0.002671548631042242, "global_step": 36355, "epoch": 305, "lr": 4.910055160848086e-05} +{"train_loss": 0.0022850660607218742, "global_step": 36356, "epoch": 305, "lr": 4.909833645823755e-05} +{"train_loss": 0.00152976147364825, "global_step": 36357, "epoch": 305, "lr": 4.909612130976457e-05} +{"train_loss": 0.003432303899899125, "global_step": 36358, "epoch": 305, "lr": 4.9093906163066234e-05} +{"train_loss": 0.0026849585119634867, "global_step": 36359, "epoch": 305, "lr": 4.909169101814695e-05} +{"train_loss": 0.0021923913154751062, "global_step": 36360, "epoch": 305, "lr": 4.9089475875011e-05} +{"train_loss": 0.0033315839245915413, "global_step": 36361, "epoch": 305, "lr": 4.9087260733662796e-05} +{"train_loss": 0.0035182361025363207, "global_step": 36362, "epoch": 305, "lr": 4.9085045594106624e-05} +{"train_loss": 0.0017663479084149003, "global_step": 36363, "epoch": 305, "lr": 4.90828304563469e-05} +{"train_loss": 0.0034545487724244595, "global_step": 36364, "epoch": 305, "lr": 4.908061532038794e-05} +{"train_loss": 0.0016900200862437487, "global_step": 36365, "epoch": 305, "lr": 4.907840018623407e-05} +{"train_loss": 0.0022236600052565336, "global_step": 36366, "epoch": 305, "lr": 4.907618505388968e-05} +{"train_loss": 0.0021152570843696594, "global_step": 36367, "epoch": 305, "lr": 4.907396992335909e-05} +{"train_loss": 0.002866625552996993, "global_step": 36368, "epoch": 305, "lr": 4.907175479464668e-05} +{"train_loss": 0.0027696078177541494, "global_step": 36369, "epoch": 305, "lr": 4.906953966775677e-05} +{"train_loss": 0.0014739636098966002, "global_step": 36370, "epoch": 305, "lr": 4.9067324542693714e-05} +{"train_loss": 0.0019371930975466967, "global_step": 36371, "epoch": 305, "lr": 4.9065109419461866e-05} +{"train_loss": 0.0016113410238176584, "global_step": 36372, "epoch": 305, "lr": 4.906289429806557e-05} +{"train_loss": 0.0031605204567313194, "global_step": 36373, "epoch": 305, "lr": 4.90606791785092e-05} +{"train_loss": 0.0017361612990498543, "global_step": 36374, "epoch": 305, "lr": 4.905846406079706e-05} +{"train_loss": 0.0022002384066581726, "global_step": 36375, "epoch": 305, "lr": 4.9056248944933555e-05} +{"train_loss": 0.0033392549958080053, "global_step": 36376, "epoch": 305, "lr": 4.905403383092301e-05} +{"train_loss": 0.0025394868571311235, "global_step": 36377, "epoch": 305, "lr": 4.9051818718769736e-05} +{"train_loss": 0.001920161535963416, "global_step": 36378, "epoch": 305, "lr": 4.904960360847814e-05} +{"train_loss": 0.004238783847540617, "global_step": 36379, "epoch": 305, "lr": 4.904738850005252e-05} +{"train_loss": 0.003050575964152813, "global_step": 36380, "epoch": 305, "lr": 4.9045173393497276e-05} +{"train_loss": 0.0023795024026185274, "global_step": 36381, "epoch": 305, "lr": 4.904295828881671e-05} +{"train_loss": 0.0012811388587579131, "global_step": 36382, "epoch": 305, "lr": 4.9040743186015215e-05} +{"train_loss": 0.0018985343631356955, "global_step": 36383, "epoch": 305, "lr": 4.9038528085097116e-05} +{"train_loss": 0.0016265757149085402, "global_step": 36384, "epoch": 305, "lr": 4.903631298606675e-05} +{"train_loss": 0.0023171945940703154, "global_step": 36385, "epoch": 305, "lr": 4.903409788892848e-05} +{"train_loss": 0.0017145893070846796, "global_step": 36386, "epoch": 305, "lr": 4.903188279368667e-05} +{"train_loss": 0.0017600638093426824, "global_step": 36387, "epoch": 305, "lr": 4.9029667700345644e-05} +{"train_loss": 0.0019422690384089947, "global_step": 36388, "epoch": 305, "lr": 4.902745260890977e-05} +{"train_loss": 0.0023337751626968384, "global_step": 36389, "epoch": 305, "lr": 4.902523751938338e-05} +{"train_loss": 0.0016849137609824538, "global_step": 36390, "epoch": 305, "lr": 4.9023022431770845e-05} +{"train_loss": 0.0016741822473704815, "global_step": 36391, "epoch": 305, "lr": 4.9020807346076475e-05} +{"train_loss": 0.003406854812055826, "global_step": 36392, "epoch": 305, "lr": 4.9018592262304674e-05} +{"train_loss": 0.0025916562881320715, "global_step": 36393, "epoch": 305, "lr": 4.901637718045974e-05} +{"train_loss": 0.0013226793380454183, "global_step": 36394, "epoch": 305, "lr": 4.901416210054606e-05} +{"train_loss": 0.0019826372154057026, "global_step": 36395, "epoch": 305, "lr": 4.901194702256797e-05} +{"train_loss": 0.0010167097207158804, "global_step": 36396, "epoch": 305, "lr": 4.9009731946529805e-05} +{"train_loss": 0.0021347394213080406, "global_step": 36397, "epoch": 305, "lr": 4.900751687243594e-05} +{"train_loss": 0.0032822617795318365, "global_step": 36398, "epoch": 305, "lr": 4.900530180029068e-05} +{"train_loss": 0.0025425280909985304, "global_step": 36399, "epoch": 305, "lr": 4.9003086730098436e-05} +{"train_loss": 0.002738366834819317, "global_step": 36400, "epoch": 305, "lr": 4.90008716618635e-05} +{"train_loss": 0.0016966217663139105, "global_step": 36401, "epoch": 305, "lr": 4.899865659559026e-05} +{"train_loss": 0.003078969893977046, "global_step": 36402, "epoch": 305, "lr": 4.8996441531283055e-05} +{"train_loss": 0.0024725934490561485, "global_step": 36403, "epoch": 305, "lr": 4.899422646894622e-05} +{"train_loss": 0.004560703877359629, "global_step": 36404, "epoch": 305, "lr": 4.8992011408584114e-05} +{"train_loss": 0.0029857633635401726, "global_step": 36405, "epoch": 305, "lr": 4.898979635020109e-05} +{"train_loss": 0.001737077021971345, "global_step": 36406, "epoch": 305, "lr": 4.898758129380149e-05} +{"train_loss": 0.001485229004174471, "global_step": 36407, "epoch": 305, "lr": 4.898536623938967e-05} +{"train_loss": 0.0025746221654117107, "global_step": 36408, "epoch": 305, "lr": 4.898315118696997e-05} +{"train_loss": 0.005428567994385958, "global_step": 36409, "epoch": 305, "lr": 4.898093613654675e-05} +{"train_loss": 0.0015955900307744741, "global_step": 36410, "epoch": 305, "lr": 4.897872108812434e-05} +{"train_loss": 0.0012201876379549503, "global_step": 36411, "epoch": 305, "lr": 4.897650604170712e-05} +{"train_loss": 0.004047691356390715, "global_step": 36412, "epoch": 305, "lr": 4.89742909972994e-05} +{"train_loss": 0.0024471517883147263, "global_step": 36413, "epoch": 305, "lr": 4.897207595490557e-05, "val_loss": 0.019992005079984665, "train_action_mse_error": 3.695753912325017e-05} +{"train_loss": 0.003505538683384657, "global_step": 36414, "epoch": 306, "lr": 4.8969860914529964e-05} +{"train_loss": 0.00268114753998816, "global_step": 36415, "epoch": 306, "lr": 4.89676458761769e-05} +{"train_loss": 0.002135812770575285, "global_step": 36416, "epoch": 306, "lr": 4.896543083985078e-05} +{"train_loss": 0.001848307903856039, "global_step": 36417, "epoch": 306, "lr": 4.89632158055559e-05} +{"train_loss": 0.0025001601316034794, "global_step": 36418, "epoch": 306, "lr": 4.896100077329666e-05} +{"train_loss": 0.00387717061676085, "global_step": 36419, "epoch": 306, "lr": 4.895878574307737e-05} +{"train_loss": 0.0017469009617343545, "global_step": 36420, "epoch": 306, "lr": 4.8956570714902376e-05} +{"train_loss": 0.0033235247246921062, "global_step": 36421, "epoch": 306, "lr": 4.895435568877608e-05} +{"train_loss": 0.001673425198532641, "global_step": 36422, "epoch": 306, "lr": 4.895214066470276e-05} +{"train_loss": 0.0017915521748363972, "global_step": 36423, "epoch": 306, "lr": 4.894992564268683e-05} +{"train_loss": 0.002262669615447521, "global_step": 36424, "epoch": 306, "lr": 4.8947710622732585e-05} +{"train_loss": 0.002461993368342519, "global_step": 36425, "epoch": 306, "lr": 4.8945495604844415e-05} +{"train_loss": 0.0027377898804843426, "global_step": 36426, "epoch": 306, "lr": 4.894328058902666e-05} +{"train_loss": 0.002080356003716588, "global_step": 36427, "epoch": 306, "lr": 4.894106557528363e-05} +{"train_loss": 0.002166228834539652, "global_step": 36428, "epoch": 306, "lr": 4.893885056361973e-05} +{"train_loss": 0.0023658666759729385, "global_step": 36429, "epoch": 306, "lr": 4.893663555403926e-05} +{"train_loss": 0.002024021465331316, "global_step": 36430, "epoch": 306, "lr": 4.8934420546546625e-05} +{"train_loss": 0.0026608784683048725, "global_step": 36431, "epoch": 306, "lr": 4.8932205541146107e-05} +{"train_loss": 0.0016637176740914583, "global_step": 36432, "epoch": 306, "lr": 4.8929990537842117e-05} +{"train_loss": 0.0016341524897143245, "global_step": 36433, "epoch": 306, "lr": 4.892777553663898e-05} +{"train_loss": 0.0025955913588404655, "global_step": 36434, "epoch": 306, "lr": 4.892556053754101e-05} +{"train_loss": 0.002055724151432514, "global_step": 36435, "epoch": 306, "lr": 4.89233455405526e-05} +{"train_loss": 0.002220344264060259, "global_step": 36436, "epoch": 306, "lr": 4.892113054567809e-05} +{"train_loss": 0.004318954888731241, "global_step": 36437, "epoch": 306, "lr": 4.891891555292182e-05} +{"train_loss": 0.0021956840064376593, "global_step": 36438, "epoch": 306, "lr": 4.891670056228816e-05} +{"train_loss": 0.002543789567425847, "global_step": 36439, "epoch": 306, "lr": 4.891448557378141e-05} +{"train_loss": 0.0017345261294394732, "global_step": 36440, "epoch": 306, "lr": 4.891227058740599e-05} +{"train_loss": 0.0020575018133968115, "global_step": 36441, "epoch": 306, "lr": 4.891005560316618e-05} +{"train_loss": 0.002210192149505019, "global_step": 36442, "epoch": 306, "lr": 4.890784062106638e-05} +{"train_loss": 0.002444328274577856, "global_step": 36443, "epoch": 306, "lr": 4.89056256411109e-05} +{"train_loss": 0.0021607792004942894, "global_step": 36444, "epoch": 306, "lr": 4.8903410663304126e-05} +{"train_loss": 0.0016272987704724073, "global_step": 36445, "epoch": 306, "lr": 4.8901195687650395e-05} +{"train_loss": 0.003538368735462427, "global_step": 36446, "epoch": 306, "lr": 4.8898980714154016e-05} +{"train_loss": 0.0026758420281112194, "global_step": 36447, "epoch": 306, "lr": 4.88967657428194e-05} +{"train_loss": 0.0016959365457296371, "global_step": 36448, "epoch": 306, "lr": 4.8894550773650845e-05} +{"train_loss": 0.002929294714704156, "global_step": 36449, "epoch": 306, "lr": 4.889233580665274e-05} +{"train_loss": 0.0031796458642929792, "global_step": 36450, "epoch": 306, "lr": 4.8890120841829396e-05} +{"train_loss": 0.0015610115369781852, "global_step": 36451, "epoch": 306, "lr": 4.88879058791852e-05} +{"train_loss": 0.0033880015835165977, "global_step": 36452, "epoch": 306, "lr": 4.888569091872447e-05} +{"train_loss": 0.0024255127646028996, "global_step": 36453, "epoch": 306, "lr": 4.888347596045157e-05} +{"train_loss": 0.00332090281881392, "global_step": 36454, "epoch": 306, "lr": 4.888126100437085e-05} +{"train_loss": 0.0009245586697943509, "global_step": 36455, "epoch": 306, "lr": 4.887904605048664e-05} +{"train_loss": 0.002612214768305421, "global_step": 36456, "epoch": 306, "lr": 4.8876831098803314e-05} +{"train_loss": 0.0029360970947891474, "global_step": 36457, "epoch": 306, "lr": 4.8874616149325226e-05} +{"train_loss": 0.0017564422450959682, "global_step": 36458, "epoch": 306, "lr": 4.887240120205668e-05} +{"train_loss": 0.0017916886135935783, "global_step": 36459, "epoch": 306, "lr": 4.8870186257002075e-05} +{"train_loss": 0.0026686920318752527, "global_step": 36460, "epoch": 306, "lr": 4.8867971314165714e-05} +{"train_loss": 0.0020953118801116943, "global_step": 36461, "epoch": 306, "lr": 4.8865756373552e-05} +{"train_loss": 0.0025889305397868156, "global_step": 36462, "epoch": 306, "lr": 4.8863541435165226e-05} +{"train_loss": 0.0021839060354977846, "global_step": 36463, "epoch": 306, "lr": 4.886132649900979e-05} +{"train_loss": 0.001782487495802343, "global_step": 36464, "epoch": 306, "lr": 4.885911156509002e-05} +{"train_loss": 0.0025985874235630035, "global_step": 36465, "epoch": 306, "lr": 4.885689663341024e-05} +{"train_loss": 0.002530770841985941, "global_step": 36466, "epoch": 306, "lr": 4.885468170397484e-05} +{"train_loss": 0.0017416584305465221, "global_step": 36467, "epoch": 306, "lr": 4.885246677678813e-05} +{"train_loss": 0.0019357391865924, "global_step": 36468, "epoch": 306, "lr": 4.88502518518545e-05} +{"train_loss": 0.0017980133416131139, "global_step": 36469, "epoch": 306, "lr": 4.884803692917826e-05} +{"train_loss": 0.001992021920159459, "global_step": 36470, "epoch": 306, "lr": 4.884582200876378e-05} +{"train_loss": 0.0022804751060903072, "global_step": 36471, "epoch": 306, "lr": 4.884360709061542e-05} +{"train_loss": 0.003734196536242962, "global_step": 36472, "epoch": 306, "lr": 4.884139217473749e-05} +{"train_loss": 0.0022163460962474346, "global_step": 36473, "epoch": 306, "lr": 4.883917726113439e-05} +{"train_loss": 0.0030074354726821184, "global_step": 36474, "epoch": 306, "lr": 4.8836962349810414e-05} +{"train_loss": 0.0030613024719059467, "global_step": 36475, "epoch": 306, "lr": 4.883474744076996e-05} +{"train_loss": 0.002112865913659334, "global_step": 36476, "epoch": 306, "lr": 4.883253253401736e-05} +{"train_loss": 0.0018586382502689958, "global_step": 36477, "epoch": 306, "lr": 4.883031762955693e-05} +{"train_loss": 0.004056189209222794, "global_step": 36478, "epoch": 306, "lr": 4.8828102727393074e-05} +{"train_loss": 0.0018861193675547838, "global_step": 36479, "epoch": 306, "lr": 4.882588782753009e-05} +{"train_loss": 0.0020514195784926414, "global_step": 36480, "epoch": 306, "lr": 4.882367292997237e-05} +{"train_loss": 0.001734062796458602, "global_step": 36481, "epoch": 306, "lr": 4.8821458034724216e-05} +{"train_loss": 0.002041308907791972, "global_step": 36482, "epoch": 306, "lr": 4.8819243141790035e-05} +{"train_loss": 0.0016753098461776972, "global_step": 36483, "epoch": 306, "lr": 4.881702825117412e-05} +{"train_loss": 0.0019016670994460583, "global_step": 36484, "epoch": 306, "lr": 4.8814813362880856e-05} +{"train_loss": 0.002003937028348446, "global_step": 36485, "epoch": 306, "lr": 4.881259847691457e-05} +{"train_loss": 0.00374432560056448, "global_step": 36486, "epoch": 306, "lr": 4.8810383593279626e-05} +{"train_loss": 0.002335120690986514, "global_step": 36487, "epoch": 306, "lr": 4.8808168711980365e-05} +{"train_loss": 0.003023536643013358, "global_step": 36488, "epoch": 306, "lr": 4.880595383302115e-05} +{"train_loss": 0.0022621965035796165, "global_step": 36489, "epoch": 306, "lr": 4.88037389564063e-05} +{"train_loss": 0.0018759112572297454, "global_step": 36490, "epoch": 306, "lr": 4.8801524082140196e-05} +{"train_loss": 0.004737903364002705, "global_step": 36491, "epoch": 306, "lr": 4.8799309210227144e-05} +{"train_loss": 0.0031360064167529345, "global_step": 36492, "epoch": 306, "lr": 4.879709434067155e-05} +{"train_loss": 0.003635713830590248, "global_step": 36493, "epoch": 306, "lr": 4.8794879473477714e-05} +{"train_loss": 0.0025567312259227037, "global_step": 36494, "epoch": 306, "lr": 4.879266460865002e-05} +{"train_loss": 0.002416186034679413, "global_step": 36495, "epoch": 306, "lr": 4.8790449746192794e-05} +{"train_loss": 0.003750524017959833, "global_step": 36496, "epoch": 306, "lr": 4.878823488611038e-05} +{"train_loss": 0.002270540688186884, "global_step": 36497, "epoch": 306, "lr": 4.878602002840715e-05} +{"train_loss": 0.002338114660233259, "global_step": 36498, "epoch": 306, "lr": 4.878380517308743e-05} +{"train_loss": 0.002392493886873126, "global_step": 36499, "epoch": 306, "lr": 4.8781590320155584e-05} +{"train_loss": 0.003983804024755955, "global_step": 36500, "epoch": 306, "lr": 4.8779375469615944e-05} +{"train_loss": 0.0018192464485764503, "global_step": 36501, "epoch": 306, "lr": 4.8777160621472886e-05} +{"train_loss": 0.0026599883567541838, "global_step": 36502, "epoch": 306, "lr": 4.877494577573074e-05} +{"train_loss": 0.0018315846100449562, "global_step": 36503, "epoch": 306, "lr": 4.877273093239385e-05} +{"train_loss": 0.0009476622799411416, "global_step": 36504, "epoch": 306, "lr": 4.8770516091466575e-05} +{"train_loss": 0.0022247096057981253, "global_step": 36505, "epoch": 306, "lr": 4.876830125295325e-05} +{"train_loss": 0.001158671802841127, "global_step": 36506, "epoch": 306, "lr": 4.876608641685826e-05} +{"train_loss": 0.0016171940369531512, "global_step": 36507, "epoch": 306, "lr": 4.8763871583185914e-05} +{"train_loss": 0.0017428438877686858, "global_step": 36508, "epoch": 306, "lr": 4.876165675194057e-05} +{"train_loss": 0.0023328035604208708, "global_step": 36509, "epoch": 306, "lr": 4.8759441923126584e-05} +{"train_loss": 0.0021950961090624332, "global_step": 36510, "epoch": 306, "lr": 4.8757227096748295e-05} +{"train_loss": 0.0033196168951690197, "global_step": 36511, "epoch": 306, "lr": 4.875501227281007e-05} +{"train_loss": 0.0032097327057272196, "global_step": 36512, "epoch": 306, "lr": 4.875279745131622e-05} +{"train_loss": 0.002426450839266181, "global_step": 36513, "epoch": 306, "lr": 4.875058263227115e-05} +{"train_loss": 0.002172746229916811, "global_step": 36514, "epoch": 306, "lr": 4.874836781567918e-05} +{"train_loss": 0.0029960155952721834, "global_step": 36515, "epoch": 306, "lr": 4.8746153001544625e-05} +{"train_loss": 0.002586349844932556, "global_step": 36516, "epoch": 306, "lr": 4.874393818987189e-05} +{"train_loss": 0.0032455616164952517, "global_step": 36517, "epoch": 306, "lr": 4.874172338066528e-05} +{"train_loss": 0.002583763562142849, "global_step": 36518, "epoch": 306, "lr": 4.873950857392917e-05} +{"train_loss": 0.0029242003802210093, "global_step": 36519, "epoch": 306, "lr": 4.87372937696679e-05} +{"train_loss": 0.003013267181813717, "global_step": 36520, "epoch": 306, "lr": 4.873507896788582e-05} +{"train_loss": 0.002987782470881939, "global_step": 36521, "epoch": 306, "lr": 4.873286416858728e-05} +{"train_loss": 0.002458258531987667, "global_step": 36522, "epoch": 306, "lr": 4.8730649371776616e-05} +{"train_loss": 0.0019113654270768166, "global_step": 36523, "epoch": 306, "lr": 4.87284345774582e-05} +{"train_loss": 0.004450971260666847, "global_step": 36524, "epoch": 306, "lr": 4.8726219785636347e-05} +{"train_loss": 0.001609409344382584, "global_step": 36525, "epoch": 306, "lr": 4.872400499631545e-05} +{"train_loss": 0.0021371706388890743, "global_step": 36526, "epoch": 306, "lr": 4.872179020949983e-05} +{"train_loss": 0.002458651317283511, "global_step": 36527, "epoch": 306, "lr": 4.871957542519382e-05} +{"train_loss": 0.0009210704592987895, "global_step": 36528, "epoch": 306, "lr": 4.871736064340181e-05} +{"train_loss": 0.0031560861971229315, "global_step": 36529, "epoch": 306, "lr": 4.871514586412809e-05} +{"train_loss": 0.0028549341950565577, "global_step": 36530, "epoch": 306, "lr": 4.871293108737708e-05} +{"train_loss": 0.0013064916711300611, "global_step": 36531, "epoch": 306, "lr": 4.8710716313153066e-05} +{"train_loss": 0.0024256127922670494, "global_step": 36532, "epoch": 306, "lr": 4.8708501541460444e-05, "val_loss": 0.028337134048342705} +{"train_loss": 0.0013647725572809577, "global_step": 36533, "epoch": 307, "lr": 4.8706286772303526e-05} +{"train_loss": 0.003381613874807954, "global_step": 36534, "epoch": 307, "lr": 4.8704072005686685e-05} +{"train_loss": 0.002085519954562187, "global_step": 36535, "epoch": 307, "lr": 4.870185724161425e-05} +{"train_loss": 0.0013327992055565119, "global_step": 36536, "epoch": 307, "lr": 4.869964248009059e-05} +{"train_loss": 0.0019364445470273495, "global_step": 36537, "epoch": 307, "lr": 4.8697427721120035e-05} +{"train_loss": 0.0020345065277069807, "global_step": 36538, "epoch": 307, "lr": 4.869521296470696e-05} +{"train_loss": 0.0016151999589055777, "global_step": 36539, "epoch": 307, "lr": 4.869299821085567e-05} +{"train_loss": 0.0014038305962458253, "global_step": 36540, "epoch": 307, "lr": 4.869078345957056e-05} +{"train_loss": 0.003172626020386815, "global_step": 36541, "epoch": 307, "lr": 4.8688568710855934e-05} +{"train_loss": 0.002191545208916068, "global_step": 36542, "epoch": 307, "lr": 4.868635396471618e-05} +{"train_loss": 0.003196301171556115, "global_step": 36543, "epoch": 307, "lr": 4.868413922115561e-05} +{"train_loss": 0.0027166595682501793, "global_step": 36544, "epoch": 307, "lr": 4.868192448017862e-05} +{"train_loss": 0.002365348394960165, "global_step": 36545, "epoch": 307, "lr": 4.867970974178953e-05} +{"train_loss": 0.0035476116463541985, "global_step": 36546, "epoch": 307, "lr": 4.8677495005992666e-05} +{"train_loss": 0.002001747488975525, "global_step": 36547, "epoch": 307, "lr": 4.867528027279242e-05} +{"train_loss": 0.0009174945298582315, "global_step": 36548, "epoch": 307, "lr": 4.867306554219309e-05} +{"train_loss": 0.002637953031808138, "global_step": 36549, "epoch": 307, "lr": 4.867085081419909e-05} +{"train_loss": 0.0016937755281105638, "global_step": 36550, "epoch": 307, "lr": 4.86686360888147e-05} +{"train_loss": 0.003966460004448891, "global_step": 36551, "epoch": 307, "lr": 4.866642136604433e-05} +{"train_loss": 0.0032528555020689964, "global_step": 36552, "epoch": 307, "lr": 4.866420664589228e-05} +{"train_loss": 0.0023478460498154163, "global_step": 36553, "epoch": 307, "lr": 4.866199192836291e-05} +{"train_loss": 0.00261854799464345, "global_step": 36554, "epoch": 307, "lr": 4.86597772134606e-05} +{"train_loss": 0.0026425763498991728, "global_step": 36555, "epoch": 307, "lr": 4.8657562501189655e-05} +{"train_loss": 0.001951264450326562, "global_step": 36556, "epoch": 307, "lr": 4.8655347791554454e-05} +{"train_loss": 0.0017537178937345743, "global_step": 36557, "epoch": 307, "lr": 4.865313308455935e-05} +{"train_loss": 0.0024647549726068974, "global_step": 36558, "epoch": 307, "lr": 4.8650918380208636e-05} +{"train_loss": 0.0019256534287706017, "global_step": 36559, "epoch": 307, "lr": 4.864870367850673e-05} +{"train_loss": 0.0015295316698029637, "global_step": 36560, "epoch": 307, "lr": 4.864648897945793e-05} +{"train_loss": 0.001182728330604732, "global_step": 36561, "epoch": 307, "lr": 4.864427428306663e-05} +{"train_loss": 0.001962883397936821, "global_step": 36562, "epoch": 307, "lr": 4.864205958933712e-05} +{"train_loss": 0.0016445994842797518, "global_step": 36563, "epoch": 307, "lr": 4.863984489827381e-05} +{"train_loss": 0.002672092290595174, "global_step": 36564, "epoch": 307, "lr": 4.8637630209881014e-05} +{"train_loss": 0.004337362013757229, "global_step": 36565, "epoch": 307, "lr": 4.863541552416306e-05} +{"train_loss": 0.001898966496810317, "global_step": 36566, "epoch": 307, "lr": 4.863320084112436e-05} +{"train_loss": 0.0027053682133555412, "global_step": 36567, "epoch": 307, "lr": 4.863098616076919e-05} +{"train_loss": 0.0034749130718410015, "global_step": 36568, "epoch": 307, "lr": 4.862877148310194e-05} +{"train_loss": 0.00217285193502903, "global_step": 36569, "epoch": 307, "lr": 4.862655680812696e-05} +{"train_loss": 0.003924518823623657, "global_step": 36570, "epoch": 307, "lr": 4.862434213584859e-05} +{"train_loss": 0.00329317688010633, "global_step": 36571, "epoch": 307, "lr": 4.862212746627118e-05} +{"train_loss": 0.002087001921609044, "global_step": 36572, "epoch": 307, "lr": 4.861991279939906e-05} +{"train_loss": 0.0026125640142709017, "global_step": 36573, "epoch": 307, "lr": 4.861769813523661e-05} +{"train_loss": 0.0025308982003480196, "global_step": 36574, "epoch": 307, "lr": 4.8615483473788146e-05} +{"train_loss": 0.0022095663007348776, "global_step": 36575, "epoch": 307, "lr": 4.8613268815058046e-05} +{"train_loss": 0.002182736061513424, "global_step": 36576, "epoch": 307, "lr": 4.861105415905065e-05} +{"train_loss": 0.0031483841594308615, "global_step": 36577, "epoch": 307, "lr": 4.860883950577028e-05} +{"train_loss": 0.0019455289002507925, "global_step": 36578, "epoch": 307, "lr": 4.8606624855221325e-05} +{"train_loss": 0.0019354789983481169, "global_step": 36579, "epoch": 307, "lr": 4.860441020740809e-05} +{"train_loss": 0.0016672017518430948, "global_step": 36580, "epoch": 307, "lr": 4.8602195562334975e-05} +{"train_loss": 0.002175691071897745, "global_step": 36581, "epoch": 307, "lr": 4.859998092000627e-05} +{"train_loss": 0.0023545001167804003, "global_step": 36582, "epoch": 307, "lr": 4.8597766280426376e-05} +{"train_loss": 0.002258972730487585, "global_step": 36583, "epoch": 307, "lr": 4.859555164359961e-05} +{"train_loss": 0.002219301648437977, "global_step": 36584, "epoch": 307, "lr": 4.859333700953033e-05} +{"train_loss": 0.0027198249008506536, "global_step": 36585, "epoch": 307, "lr": 4.859112237822288e-05} +{"train_loss": 0.004067919682711363, "global_step": 36586, "epoch": 307, "lr": 4.858890774968161e-05} +{"train_loss": 0.001557437120936811, "global_step": 36587, "epoch": 307, "lr": 4.858669312391087e-05} +{"train_loss": 0.0024603058118373156, "global_step": 36588, "epoch": 307, "lr": 4.858447850091499e-05} +{"train_loss": 0.0022511009592562914, "global_step": 36589, "epoch": 307, "lr": 4.858226388069836e-05} +{"train_loss": 0.002184835262596607, "global_step": 36590, "epoch": 307, "lr": 4.8580049263265314e-05} +{"train_loss": 0.003730272874236107, "global_step": 36591, "epoch": 307, "lr": 4.8577834648620156e-05} +{"train_loss": 0.001619574730284512, "global_step": 36592, "epoch": 307, "lr": 4.857562003676729e-05} +{"train_loss": 0.0027669041883200407, "global_step": 36593, "epoch": 307, "lr": 4.857340542771103e-05} +{"train_loss": 0.0029488010331988335, "global_step": 36594, "epoch": 307, "lr": 4.857119082145575e-05} +{"train_loss": 0.0019225227879360318, "global_step": 36595, "epoch": 307, "lr": 4.8568976218005785e-05} +{"train_loss": 0.0026215401012450457, "global_step": 36596, "epoch": 307, "lr": 4.8566761617365456e-05} +{"train_loss": 0.002820040797814727, "global_step": 36597, "epoch": 307, "lr": 4.856454701953917e-05} +{"train_loss": 0.0025843398179858923, "global_step": 36598, "epoch": 307, "lr": 4.8562332424531214e-05} +{"train_loss": 0.005635703913867474, "global_step": 36599, "epoch": 307, "lr": 4.856011783234599e-05} +{"train_loss": 0.0025010774843394756, "global_step": 36600, "epoch": 307, "lr": 4.855790324298779e-05} +{"train_loss": 0.0031979200430214405, "global_step": 36601, "epoch": 307, "lr": 4.8555688656461024e-05} +{"train_loss": 0.0015953812981024384, "global_step": 36602, "epoch": 307, "lr": 4.8553474072769994e-05} +{"train_loss": 0.0019824421033263206, "global_step": 36603, "epoch": 307, "lr": 4.855125949191905e-05} +{"train_loss": 0.0025196343194693327, "global_step": 36604, "epoch": 307, "lr": 4.854904491391258e-05} +{"train_loss": 0.0032177206594496965, "global_step": 36605, "epoch": 307, "lr": 4.8546830338754886e-05} +{"train_loss": 0.0015184269286692142, "global_step": 36606, "epoch": 307, "lr": 4.854461576645035e-05} +{"train_loss": 0.0028575791511684656, "global_step": 36607, "epoch": 307, "lr": 4.854240119700331e-05} +{"train_loss": 0.0045072222128510475, "global_step": 36608, "epoch": 307, "lr": 4.854018663041809e-05} +{"train_loss": 0.0017442216631025076, "global_step": 36609, "epoch": 307, "lr": 4.853797206669907e-05} +{"train_loss": 0.0019443692872300744, "global_step": 36610, "epoch": 307, "lr": 4.853575750585057e-05} +{"train_loss": 0.0031610799487680197, "global_step": 36611, "epoch": 307, "lr": 4.853354294787698e-05} +{"train_loss": 0.0018347392324358225, "global_step": 36612, "epoch": 307, "lr": 4.853132839278259e-05} +{"train_loss": 0.002438205061480403, "global_step": 36613, "epoch": 307, "lr": 4.852911384057181e-05} +{"train_loss": 0.001273261965252459, "global_step": 36614, "epoch": 307, "lr": 4.8526899291248954e-05} +{"train_loss": 0.0029855510219931602, "global_step": 36615, "epoch": 307, "lr": 4.852468474481835e-05} +{"train_loss": 0.0017949106404557824, "global_step": 36616, "epoch": 307, "lr": 4.852247020128439e-05} +{"train_loss": 0.0014516828814521432, "global_step": 36617, "epoch": 307, "lr": 4.852025566065139e-05} +{"train_loss": 0.003593819448724389, "global_step": 36618, "epoch": 307, "lr": 4.8518041122923716e-05} +{"train_loss": 0.0027151298709213734, "global_step": 36619, "epoch": 307, "lr": 4.851582658810571e-05} +{"train_loss": 0.0025783770252019167, "global_step": 36620, "epoch": 307, "lr": 4.8513612056201715e-05} +{"train_loss": 0.0026481659151613712, "global_step": 36621, "epoch": 307, "lr": 4.8511397527216105e-05} +{"train_loss": 0.0023494206834584475, "global_step": 36622, "epoch": 307, "lr": 4.850918300115318e-05} +{"train_loss": 0.0020634266547858715, "global_step": 36623, "epoch": 307, "lr": 4.850696847801733e-05} +{"train_loss": 0.0018833335489034653, "global_step": 36624, "epoch": 307, "lr": 4.850475395781287e-05} +{"train_loss": 0.00373410084284842, "global_step": 36625, "epoch": 307, "lr": 4.850253944054419e-05} +{"train_loss": 0.0017474369378760457, "global_step": 36626, "epoch": 307, "lr": 4.850032492621562e-05} +{"train_loss": 0.0020598184783011675, "global_step": 36627, "epoch": 307, "lr": 4.849811041483147e-05} +{"train_loss": 0.0030475256498903036, "global_step": 36628, "epoch": 307, "lr": 4.8495895906396144e-05} +{"train_loss": 0.002758482936769724, "global_step": 36629, "epoch": 307, "lr": 4.849368140091394e-05} +{"train_loss": 0.0028753841761499643, "global_step": 36630, "epoch": 307, "lr": 4.849146689838926e-05} +{"train_loss": 0.0021217502653598785, "global_step": 36631, "epoch": 307, "lr": 4.8489252398826404e-05} +{"train_loss": 0.0025143586099147797, "global_step": 36632, "epoch": 307, "lr": 4.8487037902229754e-05} +{"train_loss": 0.002278275787830353, "global_step": 36633, "epoch": 307, "lr": 4.8484823408603635e-05} +{"train_loss": 0.0024069445207715034, "global_step": 36634, "epoch": 307, "lr": 4.8482608917952405e-05} +{"train_loss": 0.0023450483568012714, "global_step": 36635, "epoch": 307, "lr": 4.848039443028041e-05} +{"train_loss": 0.0022507766261696815, "global_step": 36636, "epoch": 307, "lr": 4.8478179945592e-05} +{"train_loss": 0.0017097912495955825, "global_step": 36637, "epoch": 307, "lr": 4.847596546389152e-05} +{"train_loss": 0.001882110838778317, "global_step": 36638, "epoch": 307, "lr": 4.84737509851833e-05} +{"train_loss": 0.0015251787845045328, "global_step": 36639, "epoch": 307, "lr": 4.847153650947174e-05} +{"train_loss": 0.0024604196660220623, "global_step": 36640, "epoch": 307, "lr": 4.846932203676115e-05} +{"train_loss": 0.00291581847704947, "global_step": 36641, "epoch": 307, "lr": 4.846710756705586e-05} +{"train_loss": 0.0014605593169108033, "global_step": 36642, "epoch": 307, "lr": 4.846489310036026e-05} +{"train_loss": 0.0010373303666710854, "global_step": 36643, "epoch": 307, "lr": 4.846267863667866e-05} +{"train_loss": 0.0019651195034384727, "global_step": 36644, "epoch": 307, "lr": 4.8460464176015455e-05} +{"train_loss": 0.0011037664953619242, "global_step": 36645, "epoch": 307, "lr": 4.8458249718374955e-05} +{"train_loss": 0.00322973495349288, "global_step": 36646, "epoch": 307, "lr": 4.845603526376149e-05} +{"train_loss": 0.0029893340542912483, "global_step": 36647, "epoch": 307, "lr": 4.845382081217947e-05} +{"train_loss": 0.00136956584174186, "global_step": 36648, "epoch": 307, "lr": 4.845160636363318e-05} +{"train_loss": 0.0014860776718705893, "global_step": 36649, "epoch": 307, "lr": 4.844939191812702e-05} +{"train_loss": 0.0019503330113366246, "global_step": 36650, "epoch": 307, "lr": 4.8447177475665287e-05} +{"train_loss": 0.002384648937145013, "global_step": 36651, "epoch": 307, "lr": 4.8444963036252366e-05, "val_loss": 0.010598491877317429} +{"train_loss": 0.0011286389781162143, "global_step": 36652, "epoch": 308, "lr": 4.844274859989261e-05} +{"train_loss": 0.0017659447621554136, "global_step": 36653, "epoch": 308, "lr": 4.8440534166590325e-05} +{"train_loss": 0.0014483644627034664, "global_step": 36654, "epoch": 308, "lr": 4.8438319736349904e-05} +{"train_loss": 0.0017309242393821478, "global_step": 36655, "epoch": 308, "lr": 4.8436105309175654e-05} +{"train_loss": 0.0014679634477943182, "global_step": 36656, "epoch": 308, "lr": 4.843389088507197e-05} +{"train_loss": 0.001847709994763136, "global_step": 36657, "epoch": 308, "lr": 4.843167646404317e-05} +{"train_loss": 0.0021949440706521273, "global_step": 36658, "epoch": 308, "lr": 4.8429462046093585e-05} +{"train_loss": 0.002016263548284769, "global_step": 36659, "epoch": 308, "lr": 4.842724763122761e-05} +{"train_loss": 0.002907771850004792, "global_step": 36660, "epoch": 308, "lr": 4.842503321944954e-05} +{"train_loss": 0.0030599134042859077, "global_step": 36661, "epoch": 308, "lr": 4.842281881076377e-05} +{"train_loss": 0.001944101182743907, "global_step": 36662, "epoch": 308, "lr": 4.8420604405174605e-05} +{"train_loss": 0.0016553866444155574, "global_step": 36663, "epoch": 308, "lr": 4.841839000268644e-05} +{"train_loss": 0.001343087526038289, "global_step": 36664, "epoch": 308, "lr": 4.8416175603303585e-05} +{"train_loss": 0.002180368173867464, "global_step": 36665, "epoch": 308, "lr": 4.84139612070304e-05} +{"train_loss": 0.0012933405814692378, "global_step": 36666, "epoch": 308, "lr": 4.8411746813871237e-05} +{"train_loss": 0.002737437142059207, "global_step": 36667, "epoch": 308, "lr": 4.840953242383043e-05} +{"train_loss": 0.0021411129273474216, "global_step": 36668, "epoch": 308, "lr": 4.840731803691234e-05} +{"train_loss": 0.0025235048960894346, "global_step": 36669, "epoch": 308, "lr": 4.840510365312131e-05} +{"train_loss": 0.0024224254302680492, "global_step": 36670, "epoch": 308, "lr": 4.8402889272461694e-05} +{"train_loss": 0.0016506087267771363, "global_step": 36671, "epoch": 308, "lr": 4.840067489493784e-05} +{"train_loss": 0.001510515110567212, "global_step": 36672, "epoch": 308, "lr": 4.839846052055407e-05} +{"train_loss": 0.0012280704686418176, "global_step": 36673, "epoch": 308, "lr": 4.839624614931477e-05} +{"train_loss": 0.0014262365875765681, "global_step": 36674, "epoch": 308, "lr": 4.839403178122425e-05} +{"train_loss": 0.0020625253673642874, "global_step": 36675, "epoch": 308, "lr": 4.83918174162869e-05} +{"train_loss": 0.0013481642818078399, "global_step": 36676, "epoch": 308, "lr": 4.838960305450705e-05} +{"train_loss": 0.0011229976080358028, "global_step": 36677, "epoch": 308, "lr": 4.8387388695889016e-05} +{"train_loss": 0.00240833917632699, "global_step": 36678, "epoch": 308, "lr": 4.8385174340437186e-05} +{"train_loss": 0.001670291880145669, "global_step": 36679, "epoch": 308, "lr": 4.838295998815588e-05} +{"train_loss": 0.001319731236435473, "global_step": 36680, "epoch": 308, "lr": 4.838074563904948e-05} +{"train_loss": 0.0017203321913257241, "global_step": 36681, "epoch": 308, "lr": 4.8378531293122286e-05} +{"train_loss": 0.0018629172118380666, "global_step": 36682, "epoch": 308, "lr": 4.83763169503787e-05} +{"train_loss": 0.002181150484830141, "global_step": 36683, "epoch": 308, "lr": 4.837410261082304e-05} +{"train_loss": 0.0012186249950900674, "global_step": 36684, "epoch": 308, "lr": 4.837188827445964e-05} +{"train_loss": 0.0010174032067880034, "global_step": 36685, "epoch": 308, "lr": 4.836967394129287e-05} +{"train_loss": 0.001972706289961934, "global_step": 36686, "epoch": 308, "lr": 4.836745961132706e-05} +{"train_loss": 0.0009784427238628268, "global_step": 36687, "epoch": 308, "lr": 4.8365245284566586e-05} +{"train_loss": 0.0011923365527763963, "global_step": 36688, "epoch": 308, "lr": 4.836303096101576e-05} +{"train_loss": 0.0020191846415400505, "global_step": 36689, "epoch": 308, "lr": 4.8360816640678974e-05} +{"train_loss": 0.0015040942234918475, "global_step": 36690, "epoch": 308, "lr": 4.835860232356054e-05} +{"train_loss": 0.0021754379849880934, "global_step": 36691, "epoch": 308, "lr": 4.8356388009664806e-05} +{"train_loss": 0.0016795855481177568, "global_step": 36692, "epoch": 308, "lr": 4.835417369899614e-05} +{"train_loss": 0.00107061886228621, "global_step": 36693, "epoch": 308, "lr": 4.835195939155886e-05} +{"train_loss": 0.0019751363433897495, "global_step": 36694, "epoch": 308, "lr": 4.834974508735735e-05} +{"train_loss": 0.0013055859599262476, "global_step": 36695, "epoch": 308, "lr": 4.8347530786395945e-05} +{"train_loss": 0.001061582239344716, "global_step": 36696, "epoch": 308, "lr": 4.834531648867896e-05} +{"train_loss": 0.0012800645781680942, "global_step": 36697, "epoch": 308, "lr": 4.834310219421079e-05} +{"train_loss": 0.0020419354550540447, "global_step": 36698, "epoch": 308, "lr": 4.8340887902995744e-05} +{"train_loss": 0.003056237008422613, "global_step": 36699, "epoch": 308, "lr": 4.83386736150382e-05} +{"train_loss": 0.0015397615497931838, "global_step": 36700, "epoch": 308, "lr": 4.833645933034249e-05} +{"train_loss": 0.00091199716553092, "global_step": 36701, "epoch": 308, "lr": 4.833424504891296e-05} +{"train_loss": 0.0012815173249691725, "global_step": 36702, "epoch": 308, "lr": 4.8332030770753984e-05} +{"train_loss": 0.0023362741339951754, "global_step": 36703, "epoch": 308, "lr": 4.8329816495869855e-05} +{"train_loss": 0.001258430304005742, "global_step": 36704, "epoch": 308, "lr": 4.8327602224264976e-05} +{"train_loss": 0.002000052947551012, "global_step": 36705, "epoch": 308, "lr": 4.832538795594366e-05} +{"train_loss": 0.0029961192049086094, "global_step": 36706, "epoch": 308, "lr": 4.832317369091028e-05} +{"train_loss": 0.001987447729334235, "global_step": 36707, "epoch": 308, "lr": 4.8320959429169146e-05} +{"train_loss": 0.0013601743848994374, "global_step": 36708, "epoch": 308, "lr": 4.831874517072465e-05} +{"train_loss": 0.002010723575949669, "global_step": 36709, "epoch": 308, "lr": 4.831653091558112e-05} +{"train_loss": 0.0015771448379382491, "global_step": 36710, "epoch": 308, "lr": 4.831431666374288e-05} +{"train_loss": 0.002771079773083329, "global_step": 36711, "epoch": 308, "lr": 4.8312102415214324e-05} +{"train_loss": 0.0013528583804145455, "global_step": 36712, "epoch": 308, "lr": 4.830988816999975e-05} +{"train_loss": 0.002141432836651802, "global_step": 36713, "epoch": 308, "lr": 4.8307673928103546e-05} +{"train_loss": 0.00216434127651155, "global_step": 36714, "epoch": 308, "lr": 4.830545968953004e-05} +{"train_loss": 0.0025991410948336124, "global_step": 36715, "epoch": 308, "lr": 4.830324545428359e-05} +{"train_loss": 0.002198395784944296, "global_step": 36716, "epoch": 308, "lr": 4.830103122236852e-05} +{"train_loss": 0.001734949997626245, "global_step": 36717, "epoch": 308, "lr": 4.82988169937892e-05} +{"train_loss": 0.0016732857329770923, "global_step": 36718, "epoch": 308, "lr": 4.829660276854998e-05} +{"train_loss": 0.0028236687649041414, "global_step": 36719, "epoch": 308, "lr": 4.8294388546655186e-05} +{"train_loss": 0.00198411475867033, "global_step": 36720, "epoch": 308, "lr": 4.8292174328109177e-05} +{"train_loss": 0.0016426804941147566, "global_step": 36721, "epoch": 308, "lr": 4.828996011291632e-05} +{"train_loss": 0.0024458980187773705, "global_step": 36722, "epoch": 308, "lr": 4.8287745901080925e-05} +{"train_loss": 0.0026177153922617435, "global_step": 36723, "epoch": 308, "lr": 4.828553169260737e-05} +{"train_loss": 0.0014857158530503511, "global_step": 36724, "epoch": 308, "lr": 4.828331748749997e-05} +{"train_loss": 0.0017372892471030354, "global_step": 36725, "epoch": 308, "lr": 4.828110328576312e-05} +{"train_loss": 0.0021266033872962, "global_step": 36726, "epoch": 308, "lr": 4.8278889087401135e-05} +{"train_loss": 0.002601772313937545, "global_step": 36727, "epoch": 308, "lr": 4.827667489241835e-05} +{"train_loss": 0.0015263204695656896, "global_step": 36728, "epoch": 308, "lr": 4.8274460700819154e-05} +{"train_loss": 0.0024035514798015356, "global_step": 36729, "epoch": 308, "lr": 4.827224651260784e-05} +{"train_loss": 0.002179123228415847, "global_step": 36730, "epoch": 308, "lr": 4.827003232778881e-05} +{"train_loss": 0.0020011470187455416, "global_step": 36731, "epoch": 308, "lr": 4.8267818146366366e-05} +{"train_loss": 0.002406021114438772, "global_step": 36732, "epoch": 308, "lr": 4.82656039683449e-05} +{"train_loss": 0.0030655215959995985, "global_step": 36733, "epoch": 308, "lr": 4.826338979372872e-05} +{"train_loss": 0.002476360648870468, "global_step": 36734, "epoch": 308, "lr": 4.826117562252218e-05} +{"train_loss": 0.002488597994670272, "global_step": 36735, "epoch": 308, "lr": 4.825896145472966e-05} +{"train_loss": 0.0017419375944882631, "global_step": 36736, "epoch": 308, "lr": 4.825674729035546e-05} +{"train_loss": 0.004678788129240274, "global_step": 36737, "epoch": 308, "lr": 4.825453312940397e-05} +{"train_loss": 0.0027552051469683647, "global_step": 36738, "epoch": 308, "lr": 4.825231897187949e-05} +{"train_loss": 0.0017743561184033751, "global_step": 36739, "epoch": 308, "lr": 4.825010481778643e-05} +{"train_loss": 0.0014724801294505596, "global_step": 36740, "epoch": 308, "lr": 4.8247890667129094e-05} +{"train_loss": 0.002553586382418871, "global_step": 36741, "epoch": 308, "lr": 4.824567651991182e-05} +{"train_loss": 0.0014252348337322474, "global_step": 36742, "epoch": 308, "lr": 4.824346237613899e-05} +{"train_loss": 0.0016145273111760616, "global_step": 36743, "epoch": 308, "lr": 4.824124823581492e-05} +{"train_loss": 0.0028881581965833902, "global_step": 36744, "epoch": 308, "lr": 4.823903409894398e-05} +{"train_loss": 0.0019672594498842955, "global_step": 36745, "epoch": 308, "lr": 4.8236819965530516e-05} +{"train_loss": 0.0035846568644046783, "global_step": 36746, "epoch": 308, "lr": 4.823460583557885e-05} +{"train_loss": 0.0020648143254220486, "global_step": 36747, "epoch": 308, "lr": 4.823239170909336e-05} +{"train_loss": 0.003255981020629406, "global_step": 36748, "epoch": 308, "lr": 4.823017758607837e-05} +{"train_loss": 0.004136641975492239, "global_step": 36749, "epoch": 308, "lr": 4.822796346653823e-05} +{"train_loss": 0.0020809315610677004, "global_step": 36750, "epoch": 308, "lr": 4.822574935047731e-05} +{"train_loss": 0.0020915463101118803, "global_step": 36751, "epoch": 308, "lr": 4.8223535237899936e-05} +{"train_loss": 0.002495693974196911, "global_step": 36752, "epoch": 308, "lr": 4.822132112881048e-05} +{"train_loss": 0.0024335214402526617, "global_step": 36753, "epoch": 308, "lr": 4.8219107023213236e-05} +{"train_loss": 0.0024283442180603743, "global_step": 36754, "epoch": 308, "lr": 4.821689292111261e-05} +{"train_loss": 0.0020514612551778555, "global_step": 36755, "epoch": 308, "lr": 4.8214678822512906e-05} +{"train_loss": 0.0023590971250087023, "global_step": 36756, "epoch": 308, "lr": 4.8212464727418506e-05} +{"train_loss": 0.002248986391350627, "global_step": 36757, "epoch": 308, "lr": 4.821025063583372e-05} +{"train_loss": 0.0018592007691040635, "global_step": 36758, "epoch": 308, "lr": 4.820803654776294e-05} +{"train_loss": 0.001555454102344811, "global_step": 36759, "epoch": 308, "lr": 4.820582246321049e-05} +{"train_loss": 0.0012696473859250546, "global_step": 36760, "epoch": 308, "lr": 4.820360838218069e-05} +{"train_loss": 0.0024199699983000755, "global_step": 36761, "epoch": 308, "lr": 4.820139430467794e-05} +{"train_loss": 0.0027455331292003393, "global_step": 36762, "epoch": 308, "lr": 4.8199180230706536e-05} +{"train_loss": 0.002168220467865467, "global_step": 36763, "epoch": 308, "lr": 4.8196966160270865e-05} +{"train_loss": 0.0021338199730962515, "global_step": 36764, "epoch": 308, "lr": 4.8194752093375255e-05} +{"train_loss": 0.004022396169602871, "global_step": 36765, "epoch": 308, "lr": 4.819253803002406e-05} +{"train_loss": 0.0026206437032669783, "global_step": 36766, "epoch": 308, "lr": 4.819032397022161e-05} +{"train_loss": 0.001735732308588922, "global_step": 36767, "epoch": 308, "lr": 4.818810991397228e-05} +{"train_loss": 0.0033615052234381437, "global_step": 36768, "epoch": 308, "lr": 4.8185895861280396e-05} +{"train_loss": 0.0025056221056729555, "global_step": 36769, "epoch": 308, "lr": 4.818368181215031e-05} +{"train_loss": 0.00204013502949207, "global_step": 36770, "epoch": 308, "lr": 4.8181467766586375e-05, "val_loss": 0.02247617207467556} +{"train_loss": 0.0019493013387545943, "global_step": 36771, "epoch": 309, "lr": 4.817925372459294e-05} +{"train_loss": 0.002999289194121957, "global_step": 36772, "epoch": 309, "lr": 4.8177039686174326e-05} +{"train_loss": 0.0011857416247949004, "global_step": 36773, "epoch": 309, "lr": 4.817482565133492e-05} +{"train_loss": 0.0018000586424022913, "global_step": 36774, "epoch": 309, "lr": 4.817261162007903e-05} +{"train_loss": 0.0028216198552399874, "global_step": 36775, "epoch": 309, "lr": 4.817039759241104e-05} +{"train_loss": 0.00167192576918751, "global_step": 36776, "epoch": 309, "lr": 4.816818356833526e-05} +{"train_loss": 0.0028833451215177774, "global_step": 36777, "epoch": 309, "lr": 4.816596954785608e-05} +{"train_loss": 0.0018566359067335725, "global_step": 36778, "epoch": 309, "lr": 4.8163755530977814e-05} +{"train_loss": 0.0014849529834464192, "global_step": 36779, "epoch": 309, "lr": 4.8161541517704804e-05} +{"train_loss": 0.001928259851410985, "global_step": 36780, "epoch": 309, "lr": 4.815932750804143e-05} +{"train_loss": 0.0013700752751901746, "global_step": 36781, "epoch": 309, "lr": 4.8157113501992005e-05} +{"train_loss": 0.0022601012606173754, "global_step": 36782, "epoch": 309, "lr": 4.81548994995609e-05} +{"train_loss": 0.0011926450533792377, "global_step": 36783, "epoch": 309, "lr": 4.815268550075245e-05} +{"train_loss": 0.0023959290701895952, "global_step": 36784, "epoch": 309, "lr": 4.8150471505570995e-05} +{"train_loss": 0.0015178864123299718, "global_step": 36785, "epoch": 309, "lr": 4.8148257514020904e-05} +{"train_loss": 0.0019762376323342323, "global_step": 36786, "epoch": 309, "lr": 4.8146043526106496e-05} +{"train_loss": 0.003641844727098942, "global_step": 36787, "epoch": 309, "lr": 4.814382954183216e-05} +{"train_loss": 0.001632423372939229, "global_step": 36788, "epoch": 309, "lr": 4.814161556120219e-05} +{"train_loss": 0.0022124506067484617, "global_step": 36789, "epoch": 309, "lr": 4.8139401584220977e-05} +{"train_loss": 0.0024482039734721184, "global_step": 36790, "epoch": 309, "lr": 4.8137187610892855e-05} +{"train_loss": 0.0014585333410650492, "global_step": 36791, "epoch": 309, "lr": 4.813497364122214e-05} +{"train_loss": 0.002062619663774967, "global_step": 36792, "epoch": 309, "lr": 4.813275967521324e-05} +{"train_loss": 0.001394512946717441, "global_step": 36793, "epoch": 309, "lr": 4.813054571287043e-05} +{"train_loss": 0.0026521258987486362, "global_step": 36794, "epoch": 309, "lr": 4.812833175419812e-05} +{"train_loss": 0.0020176495891064405, "global_step": 36795, "epoch": 309, "lr": 4.812611779920063e-05} +{"train_loss": 0.002896872814744711, "global_step": 36796, "epoch": 309, "lr": 4.812390384788229e-05} +{"train_loss": 0.0016645126743242145, "global_step": 36797, "epoch": 309, "lr": 4.812168990024747e-05} +{"train_loss": 0.001899384893476963, "global_step": 36798, "epoch": 309, "lr": 4.811947595630051e-05} +{"train_loss": 0.0015948211075738072, "global_step": 36799, "epoch": 309, "lr": 4.811726201604576e-05} +{"train_loss": 0.003609053324908018, "global_step": 36800, "epoch": 309, "lr": 4.811504807948757e-05} +{"train_loss": 0.0009190663695335388, "global_step": 36801, "epoch": 309, "lr": 4.8112834146630284e-05} +{"train_loss": 0.0018976839492097497, "global_step": 36802, "epoch": 309, "lr": 4.8110620217478245e-05} +{"train_loss": 0.001146815251559019, "global_step": 36803, "epoch": 309, "lr": 4.810840629203578e-05} +{"train_loss": 0.0019342045998200774, "global_step": 36804, "epoch": 309, "lr": 4.810619237030729e-05} +{"train_loss": 0.0019869941752403975, "global_step": 36805, "epoch": 309, "lr": 4.8103978452297066e-05} +{"train_loss": 0.0021642278879880905, "global_step": 36806, "epoch": 309, "lr": 4.81017645380095e-05} +{"train_loss": 0.0025653610937297344, "global_step": 36807, "epoch": 309, "lr": 4.8099550627448884e-05} +{"train_loss": 0.0025606462731957436, "global_step": 36808, "epoch": 309, "lr": 4.809733672061963e-05} +{"train_loss": 0.0024472144432365894, "global_step": 36809, "epoch": 309, "lr": 4.8095122817526046e-05} +{"train_loss": 0.0014679544838145375, "global_step": 36810, "epoch": 309, "lr": 4.809290891817246e-05} +{"train_loss": 0.001315740286372602, "global_step": 36811, "epoch": 309, "lr": 4.8090695022563274e-05} +{"train_loss": 0.0024190067779272795, "global_step": 36812, "epoch": 309, "lr": 4.808848113070278e-05} +{"train_loss": 0.0019113026792183518, "global_step": 36813, "epoch": 309, "lr": 4.808626724259537e-05} +{"train_loss": 0.0019012382254004478, "global_step": 36814, "epoch": 309, "lr": 4.8084053358245355e-05} +{"train_loss": 0.0036979876458644867, "global_step": 36815, "epoch": 309, "lr": 4.80818394776571e-05} +{"train_loss": 0.001900667673908174, "global_step": 36816, "epoch": 309, "lr": 4.807962560083495e-05} +{"train_loss": 0.0011766294483095407, "global_step": 36817, "epoch": 309, "lr": 4.807741172778325e-05} +{"train_loss": 0.003022477263584733, "global_step": 36818, "epoch": 309, "lr": 4.807519785850634e-05} +{"train_loss": 0.0014451420865952969, "global_step": 36819, "epoch": 309, "lr": 4.807298399300857e-05} +{"train_loss": 0.003095475258305669, "global_step": 36820, "epoch": 309, "lr": 4.8070770131294313e-05} +{"train_loss": 0.001944062882103026, "global_step": 36821, "epoch": 309, "lr": 4.8068556273367885e-05} +{"train_loss": 0.001949946628883481, "global_step": 36822, "epoch": 309, "lr": 4.8066342419233623e-05} +{"train_loss": 0.0016214767238125205, "global_step": 36823, "epoch": 309, "lr": 4.806412856889592e-05} +{"train_loss": 0.0028265579603612423, "global_step": 36824, "epoch": 309, "lr": 4.8061914722359055e-05} +{"train_loss": 0.0025571142323315144, "global_step": 36825, "epoch": 309, "lr": 4.805970087962745e-05} +{"train_loss": 0.002939515979960561, "global_step": 36826, "epoch": 309, "lr": 4.8057487040705384e-05} +{"train_loss": 0.003230360336601734, "global_step": 36827, "epoch": 309, "lr": 4.8055273205597265e-05} +{"train_loss": 0.0019241470145061612, "global_step": 36828, "epoch": 309, "lr": 4.80530593743074e-05} +{"train_loss": 0.0022508760448545218, "global_step": 36829, "epoch": 309, "lr": 4.805084554684013e-05} +{"train_loss": 0.0016767625929787755, "global_step": 36830, "epoch": 309, "lr": 4.804863172319984e-05} +{"train_loss": 0.0020796828903257847, "global_step": 36831, "epoch": 309, "lr": 4.804641790339082e-05} +{"train_loss": 0.0023282133042812347, "global_step": 36832, "epoch": 309, "lr": 4.8044204087417474e-05} +{"train_loss": 0.00288340519182384, "global_step": 36833, "epoch": 309, "lr": 4.804199027528413e-05} +{"train_loss": 0.0017298373859375715, "global_step": 36834, "epoch": 309, "lr": 4.80397764669951e-05} +{"train_loss": 0.00171372399199754, "global_step": 36835, "epoch": 309, "lr": 4.8037562662554794e-05} +{"train_loss": 0.002202624222263694, "global_step": 36836, "epoch": 309, "lr": 4.8035348861967495e-05} +{"train_loss": 0.0018301261588931084, "global_step": 36837, "epoch": 309, "lr": 4.80331350652376e-05} +{"train_loss": 0.0013316178228706121, "global_step": 36838, "epoch": 309, "lr": 4.803092127236941e-05} +{"train_loss": 0.0029976810328662395, "global_step": 36839, "epoch": 309, "lr": 4.802870748336732e-05} +{"train_loss": 0.0028657845687121153, "global_step": 36840, "epoch": 309, "lr": 4.802649369823566e-05} +{"train_loss": 0.0013967803679406643, "global_step": 36841, "epoch": 309, "lr": 4.8024279916978735e-05} +{"train_loss": 0.0017733467975631356, "global_step": 36842, "epoch": 309, "lr": 4.802206613960096e-05} +{"train_loss": 0.0027394595090299845, "global_step": 36843, "epoch": 309, "lr": 4.801985236610661e-05} +{"train_loss": 0.0028846573550254107, "global_step": 36844, "epoch": 309, "lr": 4.80176385965001e-05} +{"train_loss": 0.002221127739176154, "global_step": 36845, "epoch": 309, "lr": 4.801542483078573e-05} +{"train_loss": 0.001555669354274869, "global_step": 36846, "epoch": 309, "lr": 4.801321106896787e-05} +{"train_loss": 0.0024532368406653404, "global_step": 36847, "epoch": 309, "lr": 4.801099731105085e-05} +{"train_loss": 0.002712146146222949, "global_step": 36848, "epoch": 309, "lr": 4.800878355703902e-05} +{"train_loss": 0.001566327759064734, "global_step": 36849, "epoch": 309, "lr": 4.800656980693674e-05} +{"train_loss": 0.0021323533728718758, "global_step": 36850, "epoch": 309, "lr": 4.800435606074834e-05} +{"train_loss": 0.0023388145491480827, "global_step": 36851, "epoch": 309, "lr": 4.8002142318478175e-05} +{"train_loss": 0.002008122857660055, "global_step": 36852, "epoch": 309, "lr": 4.799992858013061e-05} +{"train_loss": 0.0016831544926390052, "global_step": 36853, "epoch": 309, "lr": 4.799771484570994e-05} +{"train_loss": 0.003185607260093093, "global_step": 36854, "epoch": 309, "lr": 4.7995501115220565e-05} +{"train_loss": 0.0018798259552568197, "global_step": 36855, "epoch": 309, "lr": 4.799328738866679e-05} +{"train_loss": 0.0019723116420209408, "global_step": 36856, "epoch": 309, "lr": 4.7991073666053e-05} +{"train_loss": 0.0026298274751752615, "global_step": 36857, "epoch": 309, "lr": 4.798885994738351e-05} +{"train_loss": 0.0035600478295236826, "global_step": 36858, "epoch": 309, "lr": 4.798664623266269e-05} +{"train_loss": 0.0031801501754671335, "global_step": 36859, "epoch": 309, "lr": 4.798443252189488e-05} +{"train_loss": 0.0024841707199811935, "global_step": 36860, "epoch": 309, "lr": 4.7982218815084395e-05} +{"train_loss": 0.002008009236305952, "global_step": 36861, "epoch": 309, "lr": 4.798000511223564e-05} +{"train_loss": 0.0024389601312577724, "global_step": 36862, "epoch": 309, "lr": 4.7977791413352893e-05} +{"train_loss": 0.0017369542038068175, "global_step": 36863, "epoch": 309, "lr": 4.7975577718440565e-05} +{"train_loss": 0.0020081799011677504, "global_step": 36864, "epoch": 309, "lr": 4.797336402750296e-05} +{"train_loss": 0.0028826729394495487, "global_step": 36865, "epoch": 309, "lr": 4.797115034054445e-05} +{"train_loss": 0.0015305948909372091, "global_step": 36866, "epoch": 309, "lr": 4.7968936657569355e-05} +{"train_loss": 0.002432728186249733, "global_step": 36867, "epoch": 309, "lr": 4.796672297858203e-05} +{"train_loss": 0.001393705839291215, "global_step": 36868, "epoch": 309, "lr": 4.796450930358686e-05} +{"train_loss": 0.0013511209981516004, "global_step": 36869, "epoch": 309, "lr": 4.7962295632588125e-05} +{"train_loss": 0.0015777659136801958, "global_step": 36870, "epoch": 309, "lr": 4.796008196559023e-05} +{"train_loss": 0.0015061168232932687, "global_step": 36871, "epoch": 309, "lr": 4.795786830259749e-05} +{"train_loss": 0.0011905275750905275, "global_step": 36872, "epoch": 309, "lr": 4.795565464361424e-05} +{"train_loss": 0.0034394816029816866, "global_step": 36873, "epoch": 309, "lr": 4.7953440988644866e-05} +{"train_loss": 0.0024886312894523144, "global_step": 36874, "epoch": 309, "lr": 4.795122733769367e-05} +{"train_loss": 0.0012380275875329971, "global_step": 36875, "epoch": 309, "lr": 4.7949013690765045e-05} +{"train_loss": 0.0017904663691297174, "global_step": 36876, "epoch": 309, "lr": 4.7946800047863284e-05} +{"train_loss": 0.001011166488751769, "global_step": 36877, "epoch": 309, "lr": 4.794458640899279e-05} +{"train_loss": 0.0029315236024558544, "global_step": 36878, "epoch": 309, "lr": 4.794237277415788e-05} +{"train_loss": 0.0020742190536111593, "global_step": 36879, "epoch": 309, "lr": 4.7940159143362874e-05} +{"train_loss": 0.0016124197281897068, "global_step": 36880, "epoch": 309, "lr": 4.793794551661217e-05} +{"train_loss": 0.0024078143760561943, "global_step": 36881, "epoch": 309, "lr": 4.793573189391007e-05} +{"train_loss": 0.0012251953594386578, "global_step": 36882, "epoch": 309, "lr": 4.793351827526095e-05} +{"train_loss": 0.004253779537975788, "global_step": 36883, "epoch": 309, "lr": 4.7931304660669155e-05} +{"train_loss": 0.0010184459388256073, "global_step": 36884, "epoch": 309, "lr": 4.7929091050139e-05} +{"train_loss": 0.0013468220131471753, "global_step": 36885, "epoch": 309, "lr": 4.7926877443674876e-05} +{"train_loss": 0.0018556384602561593, "global_step": 36886, "epoch": 309, "lr": 4.792466384128109e-05} +{"train_loss": 0.0020328573882579803, "global_step": 36887, "epoch": 309, "lr": 4.7922450242962027e-05} +{"train_loss": 0.0026814534794539213, "global_step": 36888, "epoch": 309, "lr": 4.792023664872198e-05} +{"train_loss": 0.0021135983411457483, "global_step": 36889, "epoch": 309, "lr": 4.7918023058565356e-05, "val_loss": 0.0359991230070591} +{"train_loss": 0.0029805065132677555, "global_step": 36890, "epoch": 310, "lr": 4.791580947249646e-05} +{"train_loss": 0.0016994659090414643, "global_step": 36891, "epoch": 310, "lr": 4.791359589051964e-05} +{"train_loss": 0.002864147536456585, "global_step": 36892, "epoch": 310, "lr": 4.791138231263927e-05} +{"train_loss": 0.001889589475467801, "global_step": 36893, "epoch": 310, "lr": 4.7909168738859655e-05} +{"train_loss": 0.0032457145862281322, "global_step": 36894, "epoch": 310, "lr": 4.7906955169185186e-05} +{"train_loss": 0.004141294397413731, "global_step": 36895, "epoch": 310, "lr": 4.790474160362017e-05} +{"train_loss": 0.0029925438575446606, "global_step": 36896, "epoch": 310, "lr": 4.790252804216898e-05} +{"train_loss": 0.002572482917457819, "global_step": 36897, "epoch": 310, "lr": 4.790031448483595e-05} +{"train_loss": 0.00124006113037467, "global_step": 36898, "epoch": 310, "lr": 4.789810093162543e-05} +{"train_loss": 0.002434018300846219, "global_step": 36899, "epoch": 310, "lr": 4.789588738254176e-05} +{"train_loss": 0.0022996007464826107, "global_step": 36900, "epoch": 310, "lr": 4.789367383758929e-05} +{"train_loss": 0.0019540367648005486, "global_step": 36901, "epoch": 310, "lr": 4.789146029677237e-05} +{"train_loss": 0.002601476153358817, "global_step": 36902, "epoch": 310, "lr": 4.7889246760095344e-05} +{"train_loss": 0.0016840414609760046, "global_step": 36903, "epoch": 310, "lr": 4.7887033227562545e-05} +{"train_loss": 0.0014187645865604281, "global_step": 36904, "epoch": 310, "lr": 4.788481969917834e-05} +{"train_loss": 0.0029554415959864855, "global_step": 36905, "epoch": 310, "lr": 4.788260617494706e-05} +{"train_loss": 0.002309947507455945, "global_step": 36906, "epoch": 310, "lr": 4.788039265487307e-05} +{"train_loss": 0.003927235491573811, "global_step": 36907, "epoch": 310, "lr": 4.787817913896068e-05} +{"train_loss": 0.0029192371293902397, "global_step": 36908, "epoch": 310, "lr": 4.787596562721428e-05} +{"train_loss": 0.002369058784097433, "global_step": 36909, "epoch": 310, "lr": 4.78737521196382e-05} +{"train_loss": 0.0041102198883891106, "global_step": 36910, "epoch": 310, "lr": 4.787153861623676e-05} +{"train_loss": 0.0015680965734645724, "global_step": 36911, "epoch": 310, "lr": 4.7869325117014336e-05} +{"train_loss": 0.0023103756830096245, "global_step": 36912, "epoch": 310, "lr": 4.7867111621975254e-05} +{"train_loss": 0.0016393755795434117, "global_step": 36913, "epoch": 310, "lr": 4.786489813112389e-05} +{"train_loss": 0.003204993437975645, "global_step": 36914, "epoch": 310, "lr": 4.786268464446455e-05} +{"train_loss": 0.002401812467724085, "global_step": 36915, "epoch": 310, "lr": 4.786047116200161e-05} +{"train_loss": 0.0021929312497377396, "global_step": 36916, "epoch": 310, "lr": 4.7858257683739406e-05} +{"train_loss": 0.0011599978897720575, "global_step": 36917, "epoch": 310, "lr": 4.785604420968227e-05} +{"train_loss": 0.002270191442221403, "global_step": 36918, "epoch": 310, "lr": 4.7853830739834586e-05} +{"train_loss": 0.0016808533109724522, "global_step": 36919, "epoch": 310, "lr": 4.785161727420065e-05} +{"train_loss": 0.001490372815169394, "global_step": 36920, "epoch": 310, "lr": 4.784940381278487e-05} +{"train_loss": 0.0009180819615721703, "global_step": 36921, "epoch": 310, "lr": 4.7847190355591544e-05} +{"train_loss": 0.0021816398948431015, "global_step": 36922, "epoch": 310, "lr": 4.784497690262501e-05} +{"train_loss": 0.0029216234106570482, "global_step": 36923, "epoch": 310, "lr": 4.784276345388965e-05} +{"train_loss": 0.0034335190430283546, "global_step": 36924, "epoch": 310, "lr": 4.784055000938978e-05} +{"train_loss": 0.0018644870724529028, "global_step": 36925, "epoch": 310, "lr": 4.7838336569129776e-05} +{"train_loss": 0.0023555560037493706, "global_step": 36926, "epoch": 310, "lr": 4.783612313311395e-05} +{"train_loss": 0.004745754413306713, "global_step": 36927, "epoch": 310, "lr": 4.783390970134668e-05} +{"train_loss": 0.0034585734829306602, "global_step": 36928, "epoch": 310, "lr": 4.783169627383231e-05} +{"train_loss": 0.001347396639175713, "global_step": 36929, "epoch": 310, "lr": 4.7829482850575135e-05} +{"train_loss": 0.00243035308085382, "global_step": 36930, "epoch": 310, "lr": 4.782726943157956e-05} +{"train_loss": 0.0033523915335536003, "global_step": 36931, "epoch": 310, "lr": 4.78250560168499e-05} +{"train_loss": 0.002241733716800809, "global_step": 36932, "epoch": 310, "lr": 4.7822842606390515e-05} +{"train_loss": 0.001735116820782423, "global_step": 36933, "epoch": 310, "lr": 4.782062920020576e-05} +{"train_loss": 0.00133120350074023, "global_step": 36934, "epoch": 310, "lr": 4.781841579829994e-05} +{"train_loss": 0.0021435434464365244, "global_step": 36935, "epoch": 310, "lr": 4.7816202400677453e-05} +{"train_loss": 0.0016822433099150658, "global_step": 36936, "epoch": 310, "lr": 4.78139890073426e-05} +{"train_loss": 0.0024194277357310057, "global_step": 36937, "epoch": 310, "lr": 4.7811775618299764e-05} +{"train_loss": 0.002944495063275099, "global_step": 36938, "epoch": 310, "lr": 4.780956223355325e-05} +{"train_loss": 0.00227171229198575, "global_step": 36939, "epoch": 310, "lr": 4.780734885310745e-05} +{"train_loss": 0.002774452557787299, "global_step": 36940, "epoch": 310, "lr": 4.780513547696668e-05} +{"train_loss": 0.0021670360583812, "global_step": 36941, "epoch": 310, "lr": 4.7802922105135284e-05} +{"train_loss": 0.001987155992537737, "global_step": 36942, "epoch": 310, "lr": 4.780070873761763e-05} +{"train_loss": 0.0024753331672400236, "global_step": 36943, "epoch": 310, "lr": 4.7798495374418025e-05} +{"train_loss": 0.0014320564223453403, "global_step": 36944, "epoch": 310, "lr": 4.779628201554086e-05} +{"train_loss": 0.0017143824370577931, "global_step": 36945, "epoch": 310, "lr": 4.7794068660990444e-05} +{"train_loss": 0.0012409469345584512, "global_step": 36946, "epoch": 310, "lr": 4.779185531077115e-05} +{"train_loss": 0.001955114072188735, "global_step": 36947, "epoch": 310, "lr": 4.7789641964887315e-05} +{"train_loss": 0.0026258928701281548, "global_step": 36948, "epoch": 310, "lr": 4.7787428623343275e-05} +{"train_loss": 0.0011582034640014172, "global_step": 36949, "epoch": 310, "lr": 4.778521528614339e-05} +{"train_loss": 0.0017984170699492097, "global_step": 36950, "epoch": 310, "lr": 4.7783001953291986e-05} +{"train_loss": 0.0023978380486369133, "global_step": 36951, "epoch": 310, "lr": 4.7780788624793425e-05} +{"train_loss": 0.002944209845736623, "global_step": 36952, "epoch": 310, "lr": 4.777857530065206e-05} +{"train_loss": 0.0016287827165797353, "global_step": 36953, "epoch": 310, "lr": 4.777636198087221e-05} +{"train_loss": 0.0021834259387105703, "global_step": 36954, "epoch": 310, "lr": 4.777414866545825e-05} +{"train_loss": 0.001957374159246683, "global_step": 36955, "epoch": 310, "lr": 4.777193535441449e-05} +{"train_loss": 0.0012174617731943727, "global_step": 36956, "epoch": 310, "lr": 4.776972204774532e-05} +{"train_loss": 0.0016580016817897558, "global_step": 36957, "epoch": 310, "lr": 4.7767508745455037e-05} +{"train_loss": 0.0029149691108614206, "global_step": 36958, "epoch": 310, "lr": 4.776529544754804e-05} +{"train_loss": 0.0022016987204551697, "global_step": 36959, "epoch": 310, "lr": 4.7763082154028646e-05} +{"train_loss": 0.0030834281351417303, "global_step": 36960, "epoch": 310, "lr": 4.776086886490117e-05} +{"train_loss": 0.0010820693569257855, "global_step": 36961, "epoch": 310, "lr": 4.775865558017002e-05} +{"train_loss": 0.001987460535019636, "global_step": 36962, "epoch": 310, "lr": 4.775644229983949e-05} +{"train_loss": 0.0032167350873351097, "global_step": 36963, "epoch": 310, "lr": 4.775422902391396e-05} +{"train_loss": 0.001453970791772008, "global_step": 36964, "epoch": 310, "lr": 4.7752015752397745e-05} +{"train_loss": 0.002708837855607271, "global_step": 36965, "epoch": 310, "lr": 4.7749802485295215e-05} +{"train_loss": 0.0025508664548397064, "global_step": 36966, "epoch": 310, "lr": 4.774758922261072e-05} +{"train_loss": 0.0018162756459787488, "global_step": 36967, "epoch": 310, "lr": 4.774537596434857e-05} +{"train_loss": 0.0027934478130191565, "global_step": 36968, "epoch": 310, "lr": 4.7743162710513154e-05} +{"train_loss": 0.002169843763113022, "global_step": 36969, "epoch": 310, "lr": 4.774094946110878e-05} +{"train_loss": 0.0018972614780068398, "global_step": 36970, "epoch": 310, "lr": 4.7738736216139826e-05} +{"train_loss": 0.002368408953770995, "global_step": 36971, "epoch": 310, "lr": 4.773652297561063e-05} +{"train_loss": 0.0023602170404046774, "global_step": 36972, "epoch": 310, "lr": 4.77343097395255e-05} +{"train_loss": 0.0013062101788818836, "global_step": 36973, "epoch": 310, "lr": 4.7732096507888835e-05} +{"train_loss": 0.002795417793095112, "global_step": 36974, "epoch": 310, "lr": 4.7729883280704935e-05} +{"train_loss": 0.002449723891913891, "global_step": 36975, "epoch": 310, "lr": 4.772767005797819e-05} +{"train_loss": 0.002676838543266058, "global_step": 36976, "epoch": 310, "lr": 4.77254568397129e-05} +{"train_loss": 0.0012213537702336907, "global_step": 36977, "epoch": 310, "lr": 4.7723243625913446e-05} +{"train_loss": 0.0026519906241446733, "global_step": 36978, "epoch": 310, "lr": 4.772103041658416e-05} +{"train_loss": 0.0016743158921599388, "global_step": 36979, "epoch": 310, "lr": 4.7718817211729385e-05} +{"train_loss": 0.002520202659070492, "global_step": 36980, "epoch": 310, "lr": 4.771660401135347e-05} +{"train_loss": 0.0009257928468286991, "global_step": 36981, "epoch": 310, "lr": 4.7714390815460754e-05} +{"train_loss": 0.0020808973349630833, "global_step": 36982, "epoch": 310, "lr": 4.771217762405559e-05} +{"train_loss": 0.0011298076715320349, "global_step": 36983, "epoch": 310, "lr": 4.7709964437142324e-05} +{"train_loss": 0.0029971995390951633, "global_step": 36984, "epoch": 310, "lr": 4.770775125472529e-05} +{"train_loss": 0.0018228287808597088, "global_step": 36985, "epoch": 310, "lr": 4.7705538076808856e-05} +{"train_loss": 0.0013773082755506039, "global_step": 36986, "epoch": 310, "lr": 4.7703324903397325e-05} +{"train_loss": 0.0044664316810667515, "global_step": 36987, "epoch": 310, "lr": 4.77011117344951e-05} +{"train_loss": 0.0026278547011315823, "global_step": 36988, "epoch": 310, "lr": 4.7698898570106475e-05} +{"train_loss": 0.0025968856643885374, "global_step": 36989, "epoch": 310, "lr": 4.7696685410235836e-05} +{"train_loss": 0.002653784118592739, "global_step": 36990, "epoch": 310, "lr": 4.7694472254887514e-05} +{"train_loss": 0.0014586042379960418, "global_step": 36991, "epoch": 310, "lr": 4.769225910406582e-05} +{"train_loss": 0.0031798365525901318, "global_step": 36992, "epoch": 310, "lr": 4.7690045957775155e-05} +{"train_loss": 0.0013454456347972155, "global_step": 36993, "epoch": 310, "lr": 4.768783281601982e-05} +{"train_loss": 0.0025693816132843494, "global_step": 36994, "epoch": 310, "lr": 4.768561967880419e-05} +{"train_loss": 0.0035620350390672684, "global_step": 36995, "epoch": 310, "lr": 4.768340654613258e-05} +{"train_loss": 0.002554235514253378, "global_step": 36996, "epoch": 310, "lr": 4.768119341800938e-05} +{"train_loss": 0.002233902458101511, "global_step": 36997, "epoch": 310, "lr": 4.76789802944389e-05} +{"train_loss": 0.002125862520188093, "global_step": 36998, "epoch": 310, "lr": 4.7676767175425484e-05} +{"train_loss": 0.0025381052400916815, "global_step": 36999, "epoch": 310, "lr": 4.76745540609735e-05} +{"train_loss": 0.0016724917804822326, "global_step": 37000, "epoch": 310, "lr": 4.7672340951087256e-05} +{"train_loss": 0.0017027690773829818, "global_step": 37001, "epoch": 310, "lr": 4.767012784577115e-05} +{"train_loss": 0.0016231947811320424, "global_step": 37002, "epoch": 310, "lr": 4.76679147450295e-05} +{"train_loss": 0.0020723759662359953, "global_step": 37003, "epoch": 310, "lr": 4.766570164886663e-05} +{"train_loss": 0.0018840422853827477, "global_step": 37004, "epoch": 310, "lr": 4.7663488557286926e-05} +{"train_loss": 0.0020332629792392254, "global_step": 37005, "epoch": 310, "lr": 4.766127547029469e-05} +{"train_loss": 0.0031274459324777126, "global_step": 37006, "epoch": 310, "lr": 4.7659062387894315e-05} +{"train_loss": 0.0022075395099818707, "global_step": 37007, "epoch": 310, "lr": 4.76568493100901e-05} +{"train_loss": 0.0022682082719960007, "global_step": 37008, "epoch": 310, "lr": 4.7654636236886426e-05, "val_loss": 0.02378096431493759, "train_action_mse_error": 3.886795821017586e-05} +{"train_loss": 0.0019981605000793934, "global_step": 37009, "epoch": 311, "lr": 4.7652423168287626e-05} +{"train_loss": 0.0026049816515296698, "global_step": 37010, "epoch": 311, "lr": 4.765021010429802e-05} +{"train_loss": 0.002992224181070924, "global_step": 37011, "epoch": 311, "lr": 4.7647997044922e-05} +{"train_loss": 0.0027497352566570044, "global_step": 37012, "epoch": 311, "lr": 4.764578399016386e-05} +{"train_loss": 0.0021674258168786764, "global_step": 37013, "epoch": 311, "lr": 4.764357094002798e-05} +{"train_loss": 0.005227609537541866, "global_step": 37014, "epoch": 311, "lr": 4.764135789451871e-05} +{"train_loss": 0.0016043123323470354, "global_step": 37015, "epoch": 311, "lr": 4.763914485364037e-05} +{"train_loss": 0.0018791200127452612, "global_step": 37016, "epoch": 311, "lr": 4.7636931817397334e-05} +{"train_loss": 0.0018163116183131933, "global_step": 37017, "epoch": 311, "lr": 4.7634718785793904e-05} +{"train_loss": 0.0019529779674485326, "global_step": 37018, "epoch": 311, "lr": 4.763250575883447e-05} +{"train_loss": 0.002678930526599288, "global_step": 37019, "epoch": 311, "lr": 4.763029273652334e-05} +{"train_loss": 0.003060359740629792, "global_step": 37020, "epoch": 311, "lr": 4.7628079718864904e-05} +{"train_loss": 0.0029231435619294643, "global_step": 37021, "epoch": 311, "lr": 4.7625866705863476e-05} +{"train_loss": 0.0032908881548792124, "global_step": 37022, "epoch": 311, "lr": 4.762365369752338e-05} +{"train_loss": 0.001633624779060483, "global_step": 37023, "epoch": 311, "lr": 4.762144069384901e-05} +{"train_loss": 0.002818494103848934, "global_step": 37024, "epoch": 311, "lr": 4.761922769484467e-05} +{"train_loss": 0.0022221137769520283, "global_step": 37025, "epoch": 311, "lr": 4.761701470051474e-05} +{"train_loss": 0.0017046043649315834, "global_step": 37026, "epoch": 311, "lr": 4.7614801710863524e-05} +{"train_loss": 0.0034465293865650892, "global_step": 37027, "epoch": 311, "lr": 4.761258872589541e-05} +{"train_loss": 0.0029424054082483053, "global_step": 37028, "epoch": 311, "lr": 4.761037574561472e-05} +{"train_loss": 0.00210260646417737, "global_step": 37029, "epoch": 311, "lr": 4.760816277002579e-05} +{"train_loss": 0.0019408260704949498, "global_step": 37030, "epoch": 311, "lr": 4.760594979913299e-05} +{"train_loss": 0.0025534103624522686, "global_step": 37031, "epoch": 311, "lr": 4.760373683294064e-05} +{"train_loss": 0.0027258924674242735, "global_step": 37032, "epoch": 311, "lr": 4.76015238714531e-05} +{"train_loss": 0.002043904270976782, "global_step": 37033, "epoch": 311, "lr": 4.7599310914674726e-05} +{"train_loss": 0.00213065673597157, "global_step": 37034, "epoch": 311, "lr": 4.7597097962609824e-05} +{"train_loss": 0.002038209466263652, "global_step": 37035, "epoch": 311, "lr": 4.759488501526279e-05} +{"train_loss": 0.002097048331052065, "global_step": 37036, "epoch": 311, "lr": 4.759267207263792e-05} +{"train_loss": 0.002162831136956811, "global_step": 37037, "epoch": 311, "lr": 4.7590459134739603e-05} +{"train_loss": 0.002226106123998761, "global_step": 37038, "epoch": 311, "lr": 4.7588246201572136e-05} +{"train_loss": 0.0023707044310867786, "global_step": 37039, "epoch": 311, "lr": 4.7586033273139914e-05} +{"train_loss": 0.0027712855953723192, "global_step": 37040, "epoch": 311, "lr": 4.7583820349447255e-05} +{"train_loss": 0.002467273734509945, "global_step": 37041, "epoch": 311, "lr": 4.758160743049849e-05} +{"train_loss": 0.0033401199616491795, "global_step": 37042, "epoch": 311, "lr": 4.7579394516297994e-05} +{"train_loss": 0.0024236643221229315, "global_step": 37043, "epoch": 311, "lr": 4.7577181606850084e-05} +{"train_loss": 0.002648679306730628, "global_step": 37044, "epoch": 311, "lr": 4.757496870215914e-05} +{"train_loss": 0.0023491191677749157, "global_step": 37045, "epoch": 311, "lr": 4.7572755802229454e-05} +{"train_loss": 0.0032921484671533108, "global_step": 37046, "epoch": 311, "lr": 4.757054290706544e-05} +{"train_loss": 0.0018536146963015199, "global_step": 37047, "epoch": 311, "lr": 4.756833001667139e-05} +{"train_loss": 0.003154647769406438, "global_step": 37048, "epoch": 311, "lr": 4.756611713105165e-05} +{"train_loss": 0.0023509752936661243, "global_step": 37049, "epoch": 311, "lr": 4.75639042502106e-05} +{"train_loss": 0.0024251234717667103, "global_step": 37050, "epoch": 311, "lr": 4.7561691374152536e-05} +{"train_loss": 0.002614707453176379, "global_step": 37051, "epoch": 311, "lr": 4.7559478502881866e-05} +{"train_loss": 0.003040773095563054, "global_step": 37052, "epoch": 311, "lr": 4.7557265636402894e-05} +{"train_loss": 0.0023229210637509823, "global_step": 37053, "epoch": 311, "lr": 4.7555052774719946e-05} +{"train_loss": 0.0023338692262768745, "global_step": 37054, "epoch": 311, "lr": 4.755283991783742e-05} +{"train_loss": 0.0027933758683502674, "global_step": 37055, "epoch": 311, "lr": 4.75506270657596e-05} +{"train_loss": 0.003119220258668065, "global_step": 37056, "epoch": 311, "lr": 4.754841421849088e-05} +{"train_loss": 0.003646119963377714, "global_step": 37057, "epoch": 311, "lr": 4.754620137603558e-05} +{"train_loss": 0.001008795341476798, "global_step": 37058, "epoch": 311, "lr": 4.754398853839806e-05} +{"train_loss": 0.0022109101992100477, "global_step": 37059, "epoch": 311, "lr": 4.7541775705582664e-05} +{"train_loss": 0.0024272273294627666, "global_step": 37060, "epoch": 311, "lr": 4.7539562877593704e-05} +{"train_loss": 0.004553151782602072, "global_step": 37061, "epoch": 311, "lr": 4.753735005443557e-05} +{"train_loss": 0.002429508138448, "global_step": 37062, "epoch": 311, "lr": 4.753513723611257e-05} +{"train_loss": 0.002412739908322692, "global_step": 37063, "epoch": 311, "lr": 4.7532924422629074e-05} +{"train_loss": 0.0024403955321758986, "global_step": 37064, "epoch": 311, "lr": 4.753071161398941e-05} +{"train_loss": 0.0015418364200741053, "global_step": 37065, "epoch": 311, "lr": 4.7528498810197936e-05} +{"train_loss": 0.003197623649612069, "global_step": 37066, "epoch": 311, "lr": 4.7526286011259e-05} +{"train_loss": 0.0019194423221051693, "global_step": 37067, "epoch": 311, "lr": 4.752407321717692e-05} +{"train_loss": 0.0020824670791625977, "global_step": 37068, "epoch": 311, "lr": 4.752186042795607e-05} +{"train_loss": 0.0038076946511864662, "global_step": 37069, "epoch": 311, "lr": 4.7519647643600767e-05} +{"train_loss": 0.0022401264868676662, "global_step": 37070, "epoch": 311, "lr": 4.751743486411539e-05} +{"train_loss": 0.002315153367817402, "global_step": 37071, "epoch": 311, "lr": 4.7515222089504266e-05} +{"train_loss": 0.0024192926939576864, "global_step": 37072, "epoch": 311, "lr": 4.751300931977172e-05} +{"train_loss": 0.0033871070481836796, "global_step": 37073, "epoch": 311, "lr": 4.7510796554922124e-05} +{"train_loss": 0.0024146363139152527, "global_step": 37074, "epoch": 311, "lr": 4.75085837949598e-05} +{"train_loss": 0.0019172963220626116, "global_step": 37075, "epoch": 311, "lr": 4.750637103988913e-05} +{"train_loss": 0.0016013392014428973, "global_step": 37076, "epoch": 311, "lr": 4.750415828971441e-05} +{"train_loss": 0.0023900873493403196, "global_step": 37077, "epoch": 311, "lr": 4.750194554444003e-05} +{"train_loss": 0.0018984877970069647, "global_step": 37078, "epoch": 311, "lr": 4.74997328040703e-05} +{"train_loss": 0.002872689161449671, "global_step": 37079, "epoch": 311, "lr": 4.749752006860958e-05} +{"train_loss": 0.002345124026760459, "global_step": 37080, "epoch": 311, "lr": 4.749530733806221e-05} +{"train_loss": 0.002802301663905382, "global_step": 37081, "epoch": 311, "lr": 4.749309461243254e-05} +{"train_loss": 0.0016816752031445503, "global_step": 37082, "epoch": 311, "lr": 4.749088189172491e-05} +{"train_loss": 0.00215520360507071, "global_step": 37083, "epoch": 311, "lr": 4.7488669175943665e-05} +{"train_loss": 0.003551274770870805, "global_step": 37084, "epoch": 311, "lr": 4.748645646509314e-05} +{"train_loss": 0.0021218026522547007, "global_step": 37085, "epoch": 311, "lr": 4.7484243759177714e-05} +{"train_loss": 0.0033048095647245646, "global_step": 37086, "epoch": 311, "lr": 4.748203105820168e-05} +{"train_loss": 0.0033304423559457064, "global_step": 37087, "epoch": 311, "lr": 4.747981836216943e-05} +{"train_loss": 0.002904537133872509, "global_step": 37088, "epoch": 311, "lr": 4.7477605671085266e-05} +{"train_loss": 0.002257277024909854, "global_step": 37089, "epoch": 311, "lr": 4.7475392984953575e-05} +{"train_loss": 0.002394037786871195, "global_step": 37090, "epoch": 311, "lr": 4.747318030377868e-05} +{"train_loss": 0.003100821515545249, "global_step": 37091, "epoch": 311, "lr": 4.7470967627564904e-05} +{"train_loss": 0.0025006080977618694, "global_step": 37092, "epoch": 311, "lr": 4.746875495631663e-05} +{"train_loss": 0.002247881842777133, "global_step": 37093, "epoch": 311, "lr": 4.7466542290038174e-05} +{"train_loss": 0.0023355025332421064, "global_step": 37094, "epoch": 311, "lr": 4.7464329628733913e-05} +{"train_loss": 0.0032271132804453373, "global_step": 37095, "epoch": 311, "lr": 4.746211697240814e-05} +{"train_loss": 0.0015445374883711338, "global_step": 37096, "epoch": 311, "lr": 4.745990432106525e-05} +{"train_loss": 0.0016295126406475902, "global_step": 37097, "epoch": 311, "lr": 4.745769167470956e-05} +{"train_loss": 0.002232098486274481, "global_step": 37098, "epoch": 311, "lr": 4.745547903334541e-05} +{"train_loss": 0.0021190247498452663, "global_step": 37099, "epoch": 311, "lr": 4.745326639697717e-05} +{"train_loss": 0.0033396717626601458, "global_step": 37100, "epoch": 311, "lr": 4.745105376560916e-05} +{"train_loss": 0.00234795268625021, "global_step": 37101, "epoch": 311, "lr": 4.7448841139245756e-05} +{"train_loss": 0.0030150392558425665, "global_step": 37102, "epoch": 311, "lr": 4.744662851789127e-05} +{"train_loss": 0.0026060710661113262, "global_step": 37103, "epoch": 311, "lr": 4.744441590155004e-05} +{"train_loss": 0.0017589781200513244, "global_step": 37104, "epoch": 311, "lr": 4.744220329022644e-05} +{"train_loss": 0.0022757702972739935, "global_step": 37105, "epoch": 311, "lr": 4.7439990683924785e-05} +{"train_loss": 0.001165467081591487, "global_step": 37106, "epoch": 311, "lr": 4.743777808264946e-05} +{"train_loss": 0.0028041310142725706, "global_step": 37107, "epoch": 311, "lr": 4.7435565486404755e-05} +{"train_loss": 0.0021371468901634216, "global_step": 37108, "epoch": 311, "lr": 4.7433352895195065e-05} +{"train_loss": 0.0020784910302609205, "global_step": 37109, "epoch": 311, "lr": 4.743114030902472e-05} +{"train_loss": 0.0014452715404331684, "global_step": 37110, "epoch": 311, "lr": 4.7428927727898024e-05} +{"train_loss": 0.0015789273893460631, "global_step": 37111, "epoch": 311, "lr": 4.742671515181937e-05} +{"train_loss": 0.0027622508350759745, "global_step": 37112, "epoch": 311, "lr": 4.742450258079309e-05} +{"train_loss": 0.0034581590443849564, "global_step": 37113, "epoch": 311, "lr": 4.7422290014823525e-05} +{"train_loss": 0.0025275449734181166, "global_step": 37114, "epoch": 311, "lr": 4.742007745391501e-05} +{"train_loss": 0.0022679539397358894, "global_step": 37115, "epoch": 311, "lr": 4.74178648980719e-05} +{"train_loss": 0.0022406368516385555, "global_step": 37116, "epoch": 311, "lr": 4.741565234729855e-05} +{"train_loss": 0.0030811734031885862, "global_step": 37117, "epoch": 311, "lr": 4.741343980159927e-05} +{"train_loss": 0.002062990330159664, "global_step": 37118, "epoch": 311, "lr": 4.741122726097844e-05} +{"train_loss": 0.0020981726702302694, "global_step": 37119, "epoch": 311, "lr": 4.7409014725440376e-05} +{"train_loss": 0.00155174289830029, "global_step": 37120, "epoch": 311, "lr": 4.7406802194989445e-05} +{"train_loss": 0.001641616108827293, "global_step": 37121, "epoch": 311, "lr": 4.740458966962999e-05} +{"train_loss": 0.0014866857090964913, "global_step": 37122, "epoch": 311, "lr": 4.740237714936632e-05} +{"train_loss": 0.00264759105630219, "global_step": 37123, "epoch": 311, "lr": 4.740016463420283e-05} +{"train_loss": 0.002981505123898387, "global_step": 37124, "epoch": 311, "lr": 4.7397952124143816e-05} +{"train_loss": 0.0032279430888593197, "global_step": 37125, "epoch": 311, "lr": 4.7395739619193666e-05} +{"train_loss": 0.0017215381376445293, "global_step": 37126, "epoch": 311, "lr": 4.739352711935668e-05} +{"train_loss": 0.002462365880741605, "global_step": 37127, "epoch": 311, "lr": 4.739131462463725e-05, "val_loss": 0.0087156742811203} +{"train_loss": 0.001512073096819222, "global_step": 37128, "epoch": 312, "lr": 4.738910213503968e-05} +{"train_loss": 0.0030966459307819605, "global_step": 37129, "epoch": 312, "lr": 4.738688965056833e-05} +{"train_loss": 0.0030603227205574512, "global_step": 37130, "epoch": 312, "lr": 4.7384677171227545e-05} +{"train_loss": 0.002310545649379492, "global_step": 37131, "epoch": 312, "lr": 4.738246469702167e-05} +{"train_loss": 0.0016090036369860172, "global_step": 37132, "epoch": 312, "lr": 4.738025222795504e-05} +{"train_loss": 0.0025407634675502777, "global_step": 37133, "epoch": 312, "lr": 4.7378039764032e-05} +{"train_loss": 0.0010539194336161017, "global_step": 37134, "epoch": 312, "lr": 4.7375827305256913e-05} +{"train_loss": 0.001965999836102128, "global_step": 37135, "epoch": 312, "lr": 4.737361485163411e-05} +{"train_loss": 0.0023554253857582808, "global_step": 37136, "epoch": 312, "lr": 4.7371402403167914e-05} +{"train_loss": 0.0019909623079001904, "global_step": 37137, "epoch": 312, "lr": 4.736918995986271e-05} +{"train_loss": 0.0028738444671034813, "global_step": 37138, "epoch": 312, "lr": 4.73669775217228e-05} +{"train_loss": 0.0020219397265464067, "global_step": 37139, "epoch": 312, "lr": 4.7364765088752575e-05} +{"train_loss": 0.00133030884899199, "global_step": 37140, "epoch": 312, "lr": 4.7362552660956344e-05} +{"train_loss": 0.0032344034407287836, "global_step": 37141, "epoch": 312, "lr": 4.736034023833844e-05} +{"train_loss": 0.0026982086710631847, "global_step": 37142, "epoch": 312, "lr": 4.7358127820903245e-05} +{"train_loss": 0.002601810498163104, "global_step": 37143, "epoch": 312, "lr": 4.735591540865506e-05} +{"train_loss": 0.002361980965360999, "global_step": 37144, "epoch": 312, "lr": 4.7353703001598285e-05} +{"train_loss": 0.0016696464736014605, "global_step": 37145, "epoch": 312, "lr": 4.73514905997372e-05} +{"train_loss": 0.0016006628284230828, "global_step": 37146, "epoch": 312, "lr": 4.73492782030762e-05} +{"train_loss": 0.0030719495844095945, "global_step": 37147, "epoch": 312, "lr": 4.7347065811619615e-05} +{"train_loss": 0.003071317682042718, "global_step": 37148, "epoch": 312, "lr": 4.734485342537176e-05} +{"train_loss": 0.00336004002019763, "global_step": 37149, "epoch": 312, "lr": 4.734264104433702e-05} +{"train_loss": 0.001986643997952342, "global_step": 37150, "epoch": 312, "lr": 4.7340428668519705e-05} +{"train_loss": 0.0015088435029610991, "global_step": 37151, "epoch": 312, "lr": 4.73382162979242e-05} +{"train_loss": 0.0028909945394843817, "global_step": 37152, "epoch": 312, "lr": 4.733600393255481e-05} +{"train_loss": 0.00331413303501904, "global_step": 37153, "epoch": 312, "lr": 4.733379157241588e-05} +{"train_loss": 0.0014370718272402883, "global_step": 37154, "epoch": 312, "lr": 4.733157921751178e-05} +{"train_loss": 0.0025879070162773132, "global_step": 37155, "epoch": 312, "lr": 4.7329366867846825e-05} +{"train_loss": 0.0032922099344432354, "global_step": 37156, "epoch": 312, "lr": 4.732715452342539e-05} +{"train_loss": 0.0014580499846488237, "global_step": 37157, "epoch": 312, "lr": 4.7324942184251783e-05} +{"train_loss": 0.0018968927906826138, "global_step": 37158, "epoch": 312, "lr": 4.7322729850330385e-05} +{"train_loss": 0.0012251506559550762, "global_step": 37159, "epoch": 312, "lr": 4.732051752166551e-05} +{"train_loss": 0.0019959500059485435, "global_step": 37160, "epoch": 312, "lr": 4.7318305198261517e-05} +{"train_loss": 0.002086228458210826, "global_step": 37161, "epoch": 312, "lr": 4.7316092880122734e-05} +{"train_loss": 0.001914135878905654, "global_step": 37162, "epoch": 312, "lr": 4.7313880567253526e-05} +{"train_loss": 0.001841261750087142, "global_step": 37163, "epoch": 312, "lr": 4.731166825965822e-05} +{"train_loss": 0.0013766863849014044, "global_step": 37164, "epoch": 312, "lr": 4.7309455957341176e-05} +{"train_loss": 0.003267312655225396, "global_step": 37165, "epoch": 312, "lr": 4.730724366030672e-05} +{"train_loss": 0.0021803430281579494, "global_step": 37166, "epoch": 312, "lr": 4.7305031368559214e-05} +{"train_loss": 0.0013511603465303779, "global_step": 37167, "epoch": 312, "lr": 4.7302819082102974e-05} +{"train_loss": 0.0022516967728734016, "global_step": 37168, "epoch": 312, "lr": 4.730060680094238e-05} +{"train_loss": 0.001818594173528254, "global_step": 37169, "epoch": 312, "lr": 4.729839452508173e-05} +{"train_loss": 0.0021915738470852375, "global_step": 37170, "epoch": 312, "lr": 4.7296182254525425e-05} +{"train_loss": 0.0021721809171140194, "global_step": 37171, "epoch": 312, "lr": 4.729396998927777e-05} +{"train_loss": 0.0029174790252000093, "global_step": 37172, "epoch": 312, "lr": 4.7291757729343095e-05} +{"train_loss": 0.0021815579384565353, "global_step": 37173, "epoch": 312, "lr": 4.728954547472579e-05} +{"train_loss": 0.0028552233707159758, "global_step": 37174, "epoch": 312, "lr": 4.728733322543015e-05} +{"train_loss": 0.0016784886829555035, "global_step": 37175, "epoch": 312, "lr": 4.728512098146056e-05} +{"train_loss": 0.0019844903144985437, "global_step": 37176, "epoch": 312, "lr": 4.728290874282132e-05} +{"train_loss": 0.0020458493381738663, "global_step": 37177, "epoch": 312, "lr": 4.7280696509516825e-05} +{"train_loss": 0.0021235886961221695, "global_step": 37178, "epoch": 312, "lr": 4.727848428155138e-05} +{"train_loss": 0.0010024766670539975, "global_step": 37179, "epoch": 312, "lr": 4.7276272058929346e-05} +{"train_loss": 0.0015946601051837206, "global_step": 37180, "epoch": 312, "lr": 4.727405984165506e-05} +{"train_loss": 0.0011659027077257633, "global_step": 37181, "epoch": 312, "lr": 4.7271847629732844e-05} +{"train_loss": 0.00336119020357728, "global_step": 37182, "epoch": 312, "lr": 4.726963542316709e-05} +{"train_loss": 0.001504132291302085, "global_step": 37183, "epoch": 312, "lr": 4.72674232219621e-05} +{"train_loss": 0.0014530260814353824, "global_step": 37184, "epoch": 312, "lr": 4.7265211026122245e-05} +{"train_loss": 0.0016039804322645068, "global_step": 37185, "epoch": 312, "lr": 4.7262998835651866e-05} +{"train_loss": 0.0016753457020968199, "global_step": 37186, "epoch": 312, "lr": 4.7260786650555275e-05} +{"train_loss": 0.002302035689353943, "global_step": 37187, "epoch": 312, "lr": 4.725857447083685e-05} +{"train_loss": 0.0012891344958916306, "global_step": 37188, "epoch": 312, "lr": 4.72563622965009e-05} +{"train_loss": 0.002795132575556636, "global_step": 37189, "epoch": 312, "lr": 4.7254150127551814e-05} +{"train_loss": 0.0014330859994515777, "global_step": 37190, "epoch": 312, "lr": 4.7251937963993915e-05} +{"train_loss": 0.0031941274646669626, "global_step": 37191, "epoch": 312, "lr": 4.7249725805831514e-05} +{"train_loss": 0.0011635466944426298, "global_step": 37192, "epoch": 312, "lr": 4.724751365306901e-05} +{"train_loss": 0.001696689403615892, "global_step": 37193, "epoch": 312, "lr": 4.724530150571069e-05} +{"train_loss": 0.0020143575966358185, "global_step": 37194, "epoch": 312, "lr": 4.724308936376095e-05} +{"train_loss": 0.0021281694062054157, "global_step": 37195, "epoch": 312, "lr": 4.72408772272241e-05} +{"train_loss": 0.0014871120220050216, "global_step": 37196, "epoch": 312, "lr": 4.723866509610448e-05} +{"train_loss": 0.0015984359197318554, "global_step": 37197, "epoch": 312, "lr": 4.723645297040648e-05} +{"train_loss": 0.0017917666118592024, "global_step": 37198, "epoch": 312, "lr": 4.7234240850134374e-05} +{"train_loss": 0.0011680539464578032, "global_step": 37199, "epoch": 312, "lr": 4.7232028735292565e-05} +{"train_loss": 0.003835586830973625, "global_step": 37200, "epoch": 312, "lr": 4.7229816625885354e-05} +{"train_loss": 0.0016352887032553554, "global_step": 37201, "epoch": 312, "lr": 4.7227604521917124e-05} +{"train_loss": 0.0014046666910871863, "global_step": 37202, "epoch": 312, "lr": 4.7225392423392165e-05} +{"train_loss": 0.002983186626806855, "global_step": 37203, "epoch": 312, "lr": 4.722318033031489e-05} +{"train_loss": 0.0016097163315862417, "global_step": 37204, "epoch": 312, "lr": 4.722096824268959e-05} +{"train_loss": 0.0015200480120256543, "global_step": 37205, "epoch": 312, "lr": 4.7218756160520606e-05} +{"train_loss": 0.0011236760765314102, "global_step": 37206, "epoch": 312, "lr": 4.7216544083812316e-05} +{"train_loss": 0.0020608208142220974, "global_step": 37207, "epoch": 312, "lr": 4.721433201256902e-05} +{"train_loss": 0.0007981854723766446, "global_step": 37208, "epoch": 312, "lr": 4.721211994679511e-05} +{"train_loss": 0.0017815796891227365, "global_step": 37209, "epoch": 312, "lr": 4.72099078864949e-05} +{"train_loss": 0.0022330405190587044, "global_step": 37210, "epoch": 312, "lr": 4.720769583167273e-05} +{"train_loss": 0.001875980058684945, "global_step": 37211, "epoch": 312, "lr": 4.720548378233295e-05} +{"train_loss": 0.0033542991150170565, "global_step": 37212, "epoch": 312, "lr": 4.720327173847991e-05} +{"train_loss": 0.002464007120579481, "global_step": 37213, "epoch": 312, "lr": 4.720105970011794e-05} +{"train_loss": 0.0018334940541535616, "global_step": 37214, "epoch": 312, "lr": 4.71988476672514e-05} +{"train_loss": 0.001733048353344202, "global_step": 37215, "epoch": 312, "lr": 4.719663563988462e-05} +{"train_loss": 0.0034177780617028475, "global_step": 37216, "epoch": 312, "lr": 4.719442361802196e-05} +{"train_loss": 0.0014415333280339837, "global_step": 37217, "epoch": 312, "lr": 4.719221160166772e-05} +{"train_loss": 0.0015268006827682257, "global_step": 37218, "epoch": 312, "lr": 4.7189999590826295e-05} +{"train_loss": 0.002695885021239519, "global_step": 37219, "epoch": 312, "lr": 4.7187787585501984e-05} +{"train_loss": 0.0017035383498296142, "global_step": 37220, "epoch": 312, "lr": 4.7185575585699176e-05} +{"train_loss": 0.0020206421613693237, "global_step": 37221, "epoch": 312, "lr": 4.7183363591422194e-05} +{"train_loss": 0.0026427058037370443, "global_step": 37222, "epoch": 312, "lr": 4.718115160267535e-05} +{"train_loss": 0.0013844065833836794, "global_step": 37223, "epoch": 312, "lr": 4.717893961946303e-05} +{"train_loss": 0.0011728066019713879, "global_step": 37224, "epoch": 312, "lr": 4.7176727641789545e-05} +{"train_loss": 0.0012725625419989228, "global_step": 37225, "epoch": 312, "lr": 4.7174515669659276e-05} +{"train_loss": 0.0009666230180300772, "global_step": 37226, "epoch": 312, "lr": 4.717230370307652e-05} +{"train_loss": 0.0011874351184815168, "global_step": 37227, "epoch": 312, "lr": 4.7170091742045666e-05} +{"train_loss": 0.0017454377375543118, "global_step": 37228, "epoch": 312, "lr": 4.7167879786571026e-05} +{"train_loss": 0.0019630249589681625, "global_step": 37229, "epoch": 312, "lr": 4.7165667836656954e-05} +{"train_loss": 0.0037828467320650816, "global_step": 37230, "epoch": 312, "lr": 4.716345589230779e-05} +{"train_loss": 0.0017080196412280202, "global_step": 37231, "epoch": 312, "lr": 4.7161243953527855e-05} +{"train_loss": 0.0023893301840871572, "global_step": 37232, "epoch": 312, "lr": 4.715903202032154e-05} +{"train_loss": 0.0012208044063299894, "global_step": 37233, "epoch": 312, "lr": 4.715682009269314e-05} +{"train_loss": 0.0019184383563697338, "global_step": 37234, "epoch": 312, "lr": 4.715460817064705e-05} +{"train_loss": 0.003910158760845661, "global_step": 37235, "epoch": 312, "lr": 4.715239625418758e-05} +{"train_loss": 0.00291850115172565, "global_step": 37236, "epoch": 312, "lr": 4.7150184343319046e-05} +{"train_loss": 0.0018726888811215758, "global_step": 37237, "epoch": 312, "lr": 4.714797243804585e-05} +{"train_loss": 0.0017334773438051343, "global_step": 37238, "epoch": 312, "lr": 4.714576053837229e-05} +{"train_loss": 0.0014175765682011843, "global_step": 37239, "epoch": 312, "lr": 4.714354864430273e-05} +{"train_loss": 0.0019196879584342241, "global_step": 37240, "epoch": 312, "lr": 4.714133675584152e-05} +{"train_loss": 0.0024719382636249065, "global_step": 37241, "epoch": 312, "lr": 4.7139124872992965e-05} +{"train_loss": 0.001727823750115931, "global_step": 37242, "epoch": 312, "lr": 4.713691299576145e-05} +{"train_loss": 0.0036716763861477375, "global_step": 37243, "epoch": 312, "lr": 4.713470112415128e-05} +{"train_loss": 0.0017888855654746294, "global_step": 37244, "epoch": 312, "lr": 4.713248925816683e-05} +{"train_loss": 0.0021490331273525953, "global_step": 37245, "epoch": 312, "lr": 4.7130277397812434e-05} +{"train_loss": 0.0020806275336502293, "global_step": 37246, "epoch": 312, "lr": 4.712806554309243e-05, "val_loss": 0.03775549307465553} +{"train_loss": 0.0018951896345242858, "global_step": 37247, "epoch": 313, "lr": 4.7125853694011174e-05} +{"train_loss": 0.00370733137242496, "global_step": 37248, "epoch": 313, "lr": 4.712364185057297e-05} +{"train_loss": 0.002043073531240225, "global_step": 37249, "epoch": 313, "lr": 4.7121430012782216e-05} +{"train_loss": 0.0017293099081143737, "global_step": 37250, "epoch": 313, "lr": 4.7119218180643204e-05} +{"train_loss": 0.0017457338981330395, "global_step": 37251, "epoch": 313, "lr": 4.711700635416032e-05} +{"train_loss": 0.0017167495097965002, "global_step": 37252, "epoch": 313, "lr": 4.711479453333786e-05} +{"train_loss": 0.001968377036973834, "global_step": 37253, "epoch": 313, "lr": 4.711258271818022e-05} +{"train_loss": 0.0014708226080983877, "global_step": 37254, "epoch": 313, "lr": 4.7110370908691715e-05} +{"train_loss": 0.002034643664956093, "global_step": 37255, "epoch": 313, "lr": 4.7108159104876664e-05} +{"train_loss": 0.0011990948114544153, "global_step": 37256, "epoch": 313, "lr": 4.710594730673946e-05} +{"train_loss": 0.0011527147144079208, "global_step": 37257, "epoch": 313, "lr": 4.710373551428439e-05} +{"train_loss": 0.0029036500491201878, "global_step": 37258, "epoch": 313, "lr": 4.710152372751586e-05} +{"train_loss": 0.002551755867898464, "global_step": 37259, "epoch": 313, "lr": 4.7099311946438154e-05} +{"train_loss": 0.0023696226999163628, "global_step": 37260, "epoch": 313, "lr": 4.709710017105564e-05} +{"train_loss": 0.0009944842895492911, "global_step": 37261, "epoch": 313, "lr": 4.709488840137266e-05} +{"train_loss": 0.002242530230432749, "global_step": 37262, "epoch": 313, "lr": 4.7092676637393565e-05} +{"train_loss": 0.0016501982463523746, "global_step": 37263, "epoch": 313, "lr": 4.709046487912269e-05} +{"train_loss": 0.0017759189940989017, "global_step": 37264, "epoch": 313, "lr": 4.708825312656437e-05} +{"train_loss": 0.002581111155450344, "global_step": 37265, "epoch": 313, "lr": 4.7086041379722954e-05} +{"train_loss": 0.0015733317704871297, "global_step": 37266, "epoch": 313, "lr": 4.7083829638602795e-05} +{"train_loss": 0.0030255853198468685, "global_step": 37267, "epoch": 313, "lr": 4.7081617903208206e-05} +{"train_loss": 0.0020230128429830074, "global_step": 37268, "epoch": 313, "lr": 4.7079406173543564e-05} +{"train_loss": 0.003116379724815488, "global_step": 37269, "epoch": 313, "lr": 4.707719444961318e-05} +{"train_loss": 0.0014010010054334998, "global_step": 37270, "epoch": 313, "lr": 4.707498273142144e-05} +{"train_loss": 0.002935259137302637, "global_step": 37271, "epoch": 313, "lr": 4.7072771018972625e-05} +{"train_loss": 0.0026227342896163464, "global_step": 37272, "epoch": 313, "lr": 4.7070559312271135e-05} +{"train_loss": 0.0016699919942766428, "global_step": 37273, "epoch": 313, "lr": 4.7068347611321296e-05} +{"train_loss": 0.0008028885931707919, "global_step": 37274, "epoch": 313, "lr": 4.706613591612741e-05} +{"train_loss": 0.003059637499973178, "global_step": 37275, "epoch": 313, "lr": 4.706392422669388e-05} +{"train_loss": 0.0019220156827941537, "global_step": 37276, "epoch": 313, "lr": 4.7061712543025006e-05} +{"train_loss": 0.002175896428525448, "global_step": 37277, "epoch": 313, "lr": 4.705950086512516e-05} +{"train_loss": 0.0026801025960594416, "global_step": 37278, "epoch": 313, "lr": 4.7057289192998664e-05} +{"train_loss": 0.00173799111507833, "global_step": 37279, "epoch": 313, "lr": 4.705507752664986e-05} +{"train_loss": 0.0015324312262237072, "global_step": 37280, "epoch": 313, "lr": 4.705286586608311e-05} +{"train_loss": 0.0018297635251656175, "global_step": 37281, "epoch": 313, "lr": 4.705065421130272e-05} +{"train_loss": 0.0021282294765114784, "global_step": 37282, "epoch": 313, "lr": 4.704844256231308e-05} +{"train_loss": 0.001764637534506619, "global_step": 37283, "epoch": 313, "lr": 4.7046230919118486e-05} +{"train_loss": 0.0015176818706095219, "global_step": 37284, "epoch": 313, "lr": 4.704401928172332e-05} +{"train_loss": 0.0018611479317769408, "global_step": 37285, "epoch": 313, "lr": 4.7041807650131905e-05} +{"train_loss": 0.00364126730710268, "global_step": 37286, "epoch": 313, "lr": 4.703959602434857e-05} +{"train_loss": 0.0017087864689528942, "global_step": 37287, "epoch": 313, "lr": 4.703738440437769e-05} +{"train_loss": 0.002807484706863761, "global_step": 37288, "epoch": 313, "lr": 4.703517279022357e-05} +{"train_loss": 0.0019512419821694493, "global_step": 37289, "epoch": 313, "lr": 4.7032961181890597e-05} +{"train_loss": 0.0019672911148518324, "global_step": 37290, "epoch": 313, "lr": 4.703074957938308e-05} +{"train_loss": 0.0015621761558577418, "global_step": 37291, "epoch": 313, "lr": 4.702853798270535e-05} +{"train_loss": 0.002403012476861477, "global_step": 37292, "epoch": 313, "lr": 4.702632639186178e-05} +{"train_loss": 0.0016680605476722121, "global_step": 37293, "epoch": 313, "lr": 4.70241148068567e-05} +{"train_loss": 0.0023276926949620247, "global_step": 37294, "epoch": 313, "lr": 4.702190322769445e-05} +{"train_loss": 0.0013020538026466966, "global_step": 37295, "epoch": 313, "lr": 4.701969165437938e-05} +{"train_loss": 0.002220697235316038, "global_step": 37296, "epoch": 313, "lr": 4.701748008691582e-05} +{"train_loss": 0.00331094884313643, "global_step": 37297, "epoch": 313, "lr": 4.701526852530814e-05} +{"train_loss": 0.0011993185617029667, "global_step": 37298, "epoch": 313, "lr": 4.701305696956063e-05} +{"train_loss": 0.002867975039407611, "global_step": 37299, "epoch": 313, "lr": 4.701084541967769e-05} +{"train_loss": 0.00241855438798666, "global_step": 37300, "epoch": 313, "lr": 4.700863387566361e-05} +{"train_loss": 0.0025355215184390545, "global_step": 37301, "epoch": 313, "lr": 4.700642233752278e-05} +{"train_loss": 0.001627989811822772, "global_step": 37302, "epoch": 313, "lr": 4.7004210805259505e-05} +{"train_loss": 0.0021314078476279974, "global_step": 37303, "epoch": 313, "lr": 4.7001999278878156e-05} +{"train_loss": 0.002078218152746558, "global_step": 37304, "epoch": 313, "lr": 4.699978775838307e-05} +{"train_loss": 0.002532988553866744, "global_step": 37305, "epoch": 313, "lr": 4.699757624377855e-05} +{"train_loss": 0.0023885308764874935, "global_step": 37306, "epoch": 313, "lr": 4.699536473506899e-05} +{"train_loss": 0.0018340634414926171, "global_step": 37307, "epoch": 313, "lr": 4.69931532322587e-05} +{"train_loss": 0.00107965141069144, "global_step": 37308, "epoch": 313, "lr": 4.699094173535204e-05} +{"train_loss": 0.0023206656333059072, "global_step": 37309, "epoch": 313, "lr": 4.698873024435334e-05} +{"train_loss": 0.003410665551200509, "global_step": 37310, "epoch": 313, "lr": 4.698651875926695e-05} +{"train_loss": 0.0013601592509076, "global_step": 37311, "epoch": 313, "lr": 4.69843072800972e-05} +{"train_loss": 0.0019106533145532012, "global_step": 37312, "epoch": 313, "lr": 4.698209580684845e-05} +{"train_loss": 0.001252029906027019, "global_step": 37313, "epoch": 313, "lr": 4.697988433952502e-05} +{"train_loss": 0.0024013561196625233, "global_step": 37314, "epoch": 313, "lr": 4.697767287813126e-05} +{"train_loss": 0.0019458606839179993, "global_step": 37315, "epoch": 313, "lr": 4.697546142267154e-05} +{"train_loss": 0.0016358296852558851, "global_step": 37316, "epoch": 313, "lr": 4.697324997315018e-05} +{"train_loss": 0.0017907738219946623, "global_step": 37317, "epoch": 313, "lr": 4.6971038529571496e-05} +{"train_loss": 0.0016929705161601305, "global_step": 37318, "epoch": 313, "lr": 4.6968827091939874e-05} +{"train_loss": 0.0021055866964161396, "global_step": 37319, "epoch": 313, "lr": 4.6966615660259614e-05} +{"train_loss": 0.0029932979959994555, "global_step": 37320, "epoch": 313, "lr": 4.696440423453511e-05} +{"train_loss": 0.0014524605358019471, "global_step": 37321, "epoch": 313, "lr": 4.696219281477064e-05} +{"train_loss": 0.0016033980064094067, "global_step": 37322, "epoch": 313, "lr": 4.695998140097061e-05} +{"train_loss": 0.0032981138210743666, "global_step": 37323, "epoch": 313, "lr": 4.6957769993139336e-05} +{"train_loss": 0.0019864500500261784, "global_step": 37324, "epoch": 313, "lr": 4.695555859128113e-05} +{"train_loss": 0.0019707130268216133, "global_step": 37325, "epoch": 313, "lr": 4.695334719540037e-05} +{"train_loss": 0.002268742071464658, "global_step": 37326, "epoch": 313, "lr": 4.695113580550138e-05} +{"train_loss": 0.0010996974306181073, "global_step": 37327, "epoch": 313, "lr": 4.694892442158851e-05} +{"train_loss": 0.0014981452841311693, "global_step": 37328, "epoch": 313, "lr": 4.694671304366612e-05} +{"train_loss": 0.0016888990066945553, "global_step": 37329, "epoch": 313, "lr": 4.69445016717385e-05} +{"train_loss": 0.0024692267179489136, "global_step": 37330, "epoch": 313, "lr": 4.694229030581006e-05} +{"train_loss": 0.002117398427799344, "global_step": 37331, "epoch": 313, "lr": 4.6940078945885075e-05} +{"train_loss": 0.0027565895579755306, "global_step": 37332, "epoch": 313, "lr": 4.693786759196794e-05} +{"train_loss": 0.0029762459453195333, "global_step": 37333, "epoch": 313, "lr": 4.693565624406296e-05} +{"train_loss": 0.0025224213022738695, "global_step": 37334, "epoch": 313, "lr": 4.693344490217451e-05} +{"train_loss": 0.0021385271102190018, "global_step": 37335, "epoch": 313, "lr": 4.693123356630691e-05} +{"train_loss": 0.004018278792500496, "global_step": 37336, "epoch": 313, "lr": 4.6929022236464485e-05} +{"train_loss": 0.0011415258049964905, "global_step": 37337, "epoch": 313, "lr": 4.692681091265162e-05} +{"train_loss": 0.001536452560685575, "global_step": 37338, "epoch": 313, "lr": 4.6924599594872606e-05} +{"train_loss": 0.0029522518161684275, "global_step": 37339, "epoch": 313, "lr": 4.6922388283131846e-05} +{"train_loss": 0.0030694615561515093, "global_step": 37340, "epoch": 313, "lr": 4.692017697743364e-05} +{"train_loss": 0.0016350509831681848, "global_step": 37341, "epoch": 313, "lr": 4.691796567778232e-05} +{"train_loss": 0.003730212803930044, "global_step": 37342, "epoch": 313, "lr": 4.6915754384182245e-05} +{"train_loss": 0.0032242091838270426, "global_step": 37343, "epoch": 313, "lr": 4.691354309663777e-05} +{"train_loss": 0.0025125674437731504, "global_step": 37344, "epoch": 313, "lr": 4.691133181515321e-05} +{"train_loss": 0.0021989771630614996, "global_step": 37345, "epoch": 313, "lr": 4.6909120539732934e-05} +{"train_loss": 0.001929919933900237, "global_step": 37346, "epoch": 313, "lr": 4.690690927038126e-05} +{"train_loss": 0.002779910108074546, "global_step": 37347, "epoch": 313, "lr": 4.6904698007102554e-05} +{"train_loss": 0.0020232705865055323, "global_step": 37348, "epoch": 313, "lr": 4.690248674990112e-05} +{"train_loss": 0.0023371726274490356, "global_step": 37349, "epoch": 313, "lr": 4.690027549878135e-05} +{"train_loss": 0.0014993618242442608, "global_step": 37350, "epoch": 313, "lr": 4.689806425374752e-05} +{"train_loss": 0.0021572851110249758, "global_step": 37351, "epoch": 313, "lr": 4.6895853014804046e-05} +{"train_loss": 0.0027604985516518354, "global_step": 37352, "epoch": 313, "lr": 4.689364178195521e-05} +{"train_loss": 0.002425949554890394, "global_step": 37353, "epoch": 313, "lr": 4.6891430555205396e-05} +{"train_loss": 0.001590777887031436, "global_step": 37354, "epoch": 313, "lr": 4.688921933455893e-05} +{"train_loss": 0.0020542109850794077, "global_step": 37355, "epoch": 313, "lr": 4.688700812002011e-05} +{"train_loss": 0.0030331125017255545, "global_step": 37356, "epoch": 313, "lr": 4.688479691159336e-05} +{"train_loss": 0.00222203996963799, "global_step": 37357, "epoch": 313, "lr": 4.688258570928295e-05} +{"train_loss": 0.0017461362294852734, "global_step": 37358, "epoch": 313, "lr": 4.6880374513093265e-05} +{"train_loss": 0.0027395919896662235, "global_step": 37359, "epoch": 313, "lr": 4.687816332302863e-05} +{"train_loss": 0.001996006816625595, "global_step": 37360, "epoch": 313, "lr": 4.687595213909338e-05} +{"train_loss": 0.0031916580628603697, "global_step": 37361, "epoch": 313, "lr": 4.6873740961291865e-05} +{"train_loss": 0.002902220468968153, "global_step": 37362, "epoch": 313, "lr": 4.687152978962842e-05} +{"train_loss": 0.001181735540740192, "global_step": 37363, "epoch": 313, "lr": 4.686931862410741e-05} +{"train_loss": 0.0012054478283971548, "global_step": 37364, "epoch": 313, "lr": 4.686710746473314e-05} +{"train_loss": 0.0021629203898448717, "global_step": 37365, "epoch": 313, "lr": 4.6864896311509995e-05, "val_loss": 0.02304876782000065} +{"train_loss": 0.003720187582075596, "global_step": 37366, "epoch": 314, "lr": 4.6862685164442285e-05} +{"train_loss": 0.0024711000733077526, "global_step": 37367, "epoch": 314, "lr": 4.6860474023534335e-05} +{"train_loss": 0.004349307157099247, "global_step": 37368, "epoch": 314, "lr": 4.685826288879053e-05} +{"train_loss": 0.001554080517962575, "global_step": 37369, "epoch": 314, "lr": 4.6856051760215166e-05} +{"train_loss": 0.0020713508129119873, "global_step": 37370, "epoch": 314, "lr": 4.685384063781264e-05} +{"train_loss": 0.002282319124788046, "global_step": 37371, "epoch": 314, "lr": 4.685162952158723e-05} +{"train_loss": 0.0020287230145186186, "global_step": 37372, "epoch": 314, "lr": 4.684941841154334e-05} +{"train_loss": 0.001452305936254561, "global_step": 37373, "epoch": 314, "lr": 4.6847207307685274e-05} +{"train_loss": 0.002483564196154475, "global_step": 37374, "epoch": 314, "lr": 4.684499621001736e-05} +{"train_loss": 0.004392855800688267, "global_step": 37375, "epoch": 314, "lr": 4.684278511854398e-05} +{"train_loss": 0.0029302758630365133, "global_step": 37376, "epoch": 314, "lr": 4.684057403326944e-05} +{"train_loss": 0.0036056842654943466, "global_step": 37377, "epoch": 314, "lr": 4.683836295419809e-05} +{"train_loss": 0.0017177609261125326, "global_step": 37378, "epoch": 314, "lr": 4.68361518813343e-05} +{"train_loss": 0.0018267405685037374, "global_step": 37379, "epoch": 314, "lr": 4.683394081468236e-05} +{"train_loss": 0.0025012055411934853, "global_step": 37380, "epoch": 314, "lr": 4.683172975424666e-05} +{"train_loss": 0.0023280158638954163, "global_step": 37381, "epoch": 314, "lr": 4.68295187000315e-05} +{"train_loss": 0.0021562809124588966, "global_step": 37382, "epoch": 314, "lr": 4.682730765204127e-05} +{"train_loss": 0.003640461713075638, "global_step": 37383, "epoch": 314, "lr": 4.6825096610280255e-05} +{"train_loss": 0.0011402410455048084, "global_step": 37384, "epoch": 314, "lr": 4.6822885574752845e-05} +{"train_loss": 0.0016169962473213673, "global_step": 37385, "epoch": 314, "lr": 4.682067454546336e-05} +{"train_loss": 0.003260830184444785, "global_step": 37386, "epoch": 314, "lr": 4.681846352241612e-05} +{"train_loss": 0.0027690508868545294, "global_step": 37387, "epoch": 314, "lr": 4.681625250561551e-05} +{"train_loss": 0.0034293397329747677, "global_step": 37388, "epoch": 314, "lr": 4.681404149506582e-05} +{"train_loss": 0.0016329464269801974, "global_step": 37389, "epoch": 314, "lr": 4.6811830490771445e-05} +{"train_loss": 0.001776877325028181, "global_step": 37390, "epoch": 314, "lr": 4.680961949273668e-05} +{"train_loss": 0.001175956684164703, "global_step": 37391, "epoch": 314, "lr": 4.680740850096591e-05} +{"train_loss": 0.0026215454563498497, "global_step": 37392, "epoch": 314, "lr": 4.680519751546344e-05} +{"train_loss": 0.0013703341828659177, "global_step": 37393, "epoch": 314, "lr": 4.6802986536233615e-05} +{"train_loss": 0.0017875065095722675, "global_step": 37394, "epoch": 314, "lr": 4.68007755632808e-05} +{"train_loss": 0.0027551972307264805, "global_step": 37395, "epoch": 314, "lr": 4.679856459660931e-05} +{"train_loss": 0.002487348159775138, "global_step": 37396, "epoch": 314, "lr": 4.679635363622349e-05} +{"train_loss": 0.0012334805214777589, "global_step": 37397, "epoch": 314, "lr": 4.679414268212771e-05} +{"train_loss": 0.0014333246508613229, "global_step": 37398, "epoch": 314, "lr": 4.679193173432627e-05} +{"train_loss": 0.0019881445914506912, "global_step": 37399, "epoch": 314, "lr": 4.6789720792823535e-05} +{"train_loss": 0.002604962093755603, "global_step": 37400, "epoch": 314, "lr": 4.678750985762383e-05} +{"train_loss": 0.0022634207271039486, "global_step": 37401, "epoch": 314, "lr": 4.678529892873153e-05} +{"train_loss": 0.0018660399364307523, "global_step": 37402, "epoch": 314, "lr": 4.678308800615092e-05} +{"train_loss": 0.0013032786082476377, "global_step": 37403, "epoch": 314, "lr": 4.67808770898864e-05} +{"train_loss": 0.001301945187151432, "global_step": 37404, "epoch": 314, "lr": 4.677866617994229e-05} +{"train_loss": 0.0024706050753593445, "global_step": 37405, "epoch": 314, "lr": 4.6776455276322895e-05} +{"train_loss": 0.004216086119413376, "global_step": 37406, "epoch": 314, "lr": 4.6774244379032604e-05} +{"train_loss": 0.003176930360496044, "global_step": 37407, "epoch": 314, "lr": 4.677203348807573e-05} +{"train_loss": 0.003083819290623069, "global_step": 37408, "epoch": 314, "lr": 4.676982260345664e-05} +{"train_loss": 0.0020992315839976072, "global_step": 37409, "epoch": 314, "lr": 4.676761172517965e-05} +{"train_loss": 0.003390758763998747, "global_step": 37410, "epoch": 314, "lr": 4.6765400853249096e-05} +{"train_loss": 0.0015147554222494364, "global_step": 37411, "epoch": 314, "lr": 4.676318998766934e-05} +{"train_loss": 0.0023667984642088413, "global_step": 37412, "epoch": 314, "lr": 4.6760979128444704e-05} +{"train_loss": 0.0020197476260364056, "global_step": 37413, "epoch": 314, "lr": 4.675876827557957e-05} +{"train_loss": 0.0030112366657704115, "global_step": 37414, "epoch": 314, "lr": 4.6756557429078215e-05} +{"train_loss": 0.003949877806007862, "global_step": 37415, "epoch": 314, "lr": 4.675434658894504e-05} +{"train_loss": 0.0032167318277060986, "global_step": 37416, "epoch": 314, "lr": 4.675213575518436e-05} +{"train_loss": 0.001629894133657217, "global_step": 37417, "epoch": 314, "lr": 4.674992492780048e-05} +{"train_loss": 0.0025103348307311535, "global_step": 37418, "epoch": 314, "lr": 4.6747714106797815e-05} +{"train_loss": 0.0013979023788124323, "global_step": 37419, "epoch": 314, "lr": 4.674550329218063e-05} +{"train_loss": 0.0021450361236929893, "global_step": 37420, "epoch": 314, "lr": 4.6743292483953326e-05} +{"train_loss": 0.002215880434960127, "global_step": 37421, "epoch": 314, "lr": 4.67410816821202e-05} +{"train_loss": 0.0022916540037840605, "global_step": 37422, "epoch": 314, "lr": 4.6738870886685635e-05} +{"train_loss": 0.0012491330271586776, "global_step": 37423, "epoch": 314, "lr": 4.673666009765395e-05} +{"train_loss": 0.004242182243615389, "global_step": 37424, "epoch": 314, "lr": 4.673444931502946e-05} +{"train_loss": 0.0024411403574049473, "global_step": 37425, "epoch": 314, "lr": 4.673223853881654e-05} +{"train_loss": 0.001303533441387117, "global_step": 37426, "epoch": 314, "lr": 4.673002776901953e-05} +{"train_loss": 0.002204394433647394, "global_step": 37427, "epoch": 314, "lr": 4.672781700564275e-05} +{"train_loss": 0.0026755838189274073, "global_step": 37428, "epoch": 314, "lr": 4.672560624869056e-05} +{"train_loss": 0.00323047349229455, "global_step": 37429, "epoch": 314, "lr": 4.6723395498167276e-05} +{"train_loss": 0.0015460551949217916, "global_step": 37430, "epoch": 314, "lr": 4.672118475407728e-05} +{"train_loss": 0.0036004811991006136, "global_step": 37431, "epoch": 314, "lr": 4.671897401642486e-05} +{"train_loss": 0.002183058299124241, "global_step": 37432, "epoch": 314, "lr": 4.671676328521441e-05} +{"train_loss": 0.002059809397906065, "global_step": 37433, "epoch": 314, "lr": 4.671455256045022e-05} +{"train_loss": 0.002224863274022937, "global_step": 37434, "epoch": 314, "lr": 4.671234184213668e-05} +{"train_loss": 0.0014870933955535293, "global_step": 37435, "epoch": 314, "lr": 4.67101311302781e-05} +{"train_loss": 0.0017305200453847647, "global_step": 37436, "epoch": 314, "lr": 4.670792042487881e-05} +{"train_loss": 0.0036004972644150257, "global_step": 37437, "epoch": 314, "lr": 4.6705709725943184e-05} +{"train_loss": 0.0022720880806446075, "global_step": 37438, "epoch": 314, "lr": 4.670349903347553e-05} +{"train_loss": 0.004109307192265987, "global_step": 37439, "epoch": 314, "lr": 4.670128834748022e-05} +{"train_loss": 0.0027914405800402164, "global_step": 37440, "epoch": 314, "lr": 4.6699077667961555e-05} +{"train_loss": 0.0022859997116029263, "global_step": 37441, "epoch": 314, "lr": 4.669686699492392e-05} +{"train_loss": 0.001691067824140191, "global_step": 37442, "epoch": 314, "lr": 4.669465632837162e-05} +{"train_loss": 0.0018899828428402543, "global_step": 37443, "epoch": 314, "lr": 4.669244566830901e-05} +{"train_loss": 0.004107700660824776, "global_step": 37444, "epoch": 314, "lr": 4.669023501474044e-05} +{"train_loss": 0.002414598362520337, "global_step": 37445, "epoch": 314, "lr": 4.668802436767023e-05} +{"train_loss": 0.00276388181373477, "global_step": 37446, "epoch": 314, "lr": 4.668581372710274e-05} +{"train_loss": 0.003306426340714097, "global_step": 37447, "epoch": 314, "lr": 4.66836030930423e-05} +{"train_loss": 0.0022231382317841053, "global_step": 37448, "epoch": 314, "lr": 4.668139246549323e-05} +{"train_loss": 0.0034216500353068113, "global_step": 37449, "epoch": 314, "lr": 4.6679181844459925e-05} +{"train_loss": 0.0018433532677590847, "global_step": 37450, "epoch": 314, "lr": 4.667697122994666e-05} +{"train_loss": 0.002210304606705904, "global_step": 37451, "epoch": 314, "lr": 4.667476062195783e-05} +{"train_loss": 0.0008288205717690289, "global_step": 37452, "epoch": 314, "lr": 4.667255002049774e-05} +{"train_loss": 0.0023805005475878716, "global_step": 37453, "epoch": 314, "lr": 4.667033942557075e-05} +{"train_loss": 0.0024823620915412903, "global_step": 37454, "epoch": 314, "lr": 4.66681288371812e-05} +{"train_loss": 0.0014807545812800527, "global_step": 37455, "epoch": 314, "lr": 4.66659182553334e-05} +{"train_loss": 0.0021288383286446333, "global_step": 37456, "epoch": 314, "lr": 4.666370768003173e-05} +{"train_loss": 0.0020816472824662924, "global_step": 37457, "epoch": 314, "lr": 4.66614971112805e-05} +{"train_loss": 0.0032385250087827444, "global_step": 37458, "epoch": 314, "lr": 4.665928654908408e-05} +{"train_loss": 0.0015826750313863158, "global_step": 37459, "epoch": 314, "lr": 4.665707599344679e-05} +{"train_loss": 0.002046995796263218, "global_step": 37460, "epoch": 314, "lr": 4.6654865444372956e-05} +{"train_loss": 0.00208953651599586, "global_step": 37461, "epoch": 314, "lr": 4.665265490186696e-05} +{"train_loss": 0.002259289612993598, "global_step": 37462, "epoch": 314, "lr": 4.66504443659331e-05} +{"train_loss": 0.002078654710203409, "global_step": 37463, "epoch": 314, "lr": 4.664823383657576e-05} +{"train_loss": 0.002815527142956853, "global_step": 37464, "epoch": 314, "lr": 4.664602331379922e-05} +{"train_loss": 0.0033568202052265406, "global_step": 37465, "epoch": 314, "lr": 4.6643812797607885e-05} +{"train_loss": 0.0020852768793702126, "global_step": 37466, "epoch": 314, "lr": 4.6641602288006065e-05} +{"train_loss": 0.0017495661741122603, "global_step": 37467, "epoch": 314, "lr": 4.663939178499808e-05} +{"train_loss": 0.002213106257840991, "global_step": 37468, "epoch": 314, "lr": 4.66371812885883e-05} +{"train_loss": 0.0017987493192777038, "global_step": 37469, "epoch": 314, "lr": 4.6634970798781046e-05} +{"train_loss": 0.003902639262378216, "global_step": 37470, "epoch": 314, "lr": 4.663276031558069e-05} +{"train_loss": 0.0019038015743717551, "global_step": 37471, "epoch": 314, "lr": 4.6630549838991516e-05} +{"train_loss": 0.0022329322528094053, "global_step": 37472, "epoch": 314, "lr": 4.662833936901793e-05} +{"train_loss": 0.0031508905813097954, "global_step": 37473, "epoch": 314, "lr": 4.662612890566422e-05} +{"train_loss": 0.0017263884656131268, "global_step": 37474, "epoch": 314, "lr": 4.6623918448934755e-05} +{"train_loss": 0.004514304921030998, "global_step": 37475, "epoch": 314, "lr": 4.6621707998833856e-05} +{"train_loss": 0.002034152625128627, "global_step": 37476, "epoch": 314, "lr": 4.661949755536588e-05} +{"train_loss": 0.002210071077570319, "global_step": 37477, "epoch": 314, "lr": 4.6617287118535156e-05} +{"train_loss": 0.003283127211034298, "global_step": 37478, "epoch": 314, "lr": 4.6615076688346035e-05} +{"train_loss": 0.001568861654959619, "global_step": 37479, "epoch": 314, "lr": 4.661286626480284e-05} +{"train_loss": 0.0024050865322351456, "global_step": 37480, "epoch": 314, "lr": 4.6610655847909926e-05} +{"train_loss": 0.0023675491102039814, "global_step": 37481, "epoch": 314, "lr": 4.6608445437671616e-05} +{"train_loss": 0.002858742605894804, "global_step": 37482, "epoch": 314, "lr": 4.660623503409228e-05} +{"train_loss": 0.0018000418785959482, "global_step": 37483, "epoch": 314, "lr": 4.660402463717622e-05} +{"train_loss": 0.0024026290972388406, "global_step": 37484, "epoch": 314, "lr": 4.6601814246927814e-05, "val_loss": 0.013721590861678123} +{"train_loss": 0.0016849864041432738, "global_step": 37485, "epoch": 315, "lr": 4.659960386335138e-05} +{"train_loss": 0.001194869983009994, "global_step": 37486, "epoch": 315, "lr": 4.659739348645124e-05} +{"train_loss": 0.003306387923657894, "global_step": 37487, "epoch": 315, "lr": 4.6595183116231776e-05} +{"train_loss": 0.002096116077154875, "global_step": 37488, "epoch": 315, "lr": 4.6592972752697285e-05} +{"train_loss": 0.0027196137234568596, "global_step": 37489, "epoch": 315, "lr": 4.659076239585215e-05} +{"train_loss": 0.0019496639724820852, "global_step": 37490, "epoch": 315, "lr": 4.6588552045700665e-05} +{"train_loss": 0.001101012690924108, "global_step": 37491, "epoch": 315, "lr": 4.6586341702247224e-05} +{"train_loss": 0.002070601098239422, "global_step": 37492, "epoch": 315, "lr": 4.658413136549612e-05} +{"train_loss": 0.001998881809413433, "global_step": 37493, "epoch": 315, "lr": 4.65819210354517e-05} +{"train_loss": 0.0019556100014597178, "global_step": 37494, "epoch": 315, "lr": 4.657971071211832e-05} +{"train_loss": 0.0015035155229270458, "global_step": 37495, "epoch": 315, "lr": 4.657750039550031e-05} +{"train_loss": 0.0012057519052177668, "global_step": 37496, "epoch": 315, "lr": 4.6575290085602024e-05} +{"train_loss": 0.002048888010904193, "global_step": 37497, "epoch": 315, "lr": 4.657307978242779e-05} +{"train_loss": 0.0032463925890624523, "global_step": 37498, "epoch": 315, "lr": 4.6570869485981935e-05} +{"train_loss": 0.0017478062072768807, "global_step": 37499, "epoch": 315, "lr": 4.6568659196268825e-05} +{"train_loss": 0.0017185978358611465, "global_step": 37500, "epoch": 315, "lr": 4.6566448913292763e-05} +{"train_loss": 0.0023153983056545258, "global_step": 37501, "epoch": 315, "lr": 4.6564238637058136e-05} +{"train_loss": 0.0017156362300738692, "global_step": 37502, "epoch": 315, "lr": 4.6562028367569245e-05} +{"train_loss": 0.0027526384219527245, "global_step": 37503, "epoch": 315, "lr": 4.6559818104830455e-05} +{"train_loss": 0.001445409026928246, "global_step": 37504, "epoch": 315, "lr": 4.65576078488461e-05} +{"train_loss": 0.0013673797948285937, "global_step": 37505, "epoch": 315, "lr": 4.6555397599620495e-05} +{"train_loss": 0.002004993613809347, "global_step": 37506, "epoch": 315, "lr": 4.655318735715801e-05} +{"train_loss": 0.0011914620408788323, "global_step": 37507, "epoch": 315, "lr": 4.6550977121462965e-05} +{"train_loss": 0.0024749101139605045, "global_step": 37508, "epoch": 315, "lr": 4.654876689253971e-05} +{"train_loss": 0.002390926005318761, "global_step": 37509, "epoch": 315, "lr": 4.654655667039258e-05} +{"train_loss": 0.0015638030599802732, "global_step": 37510, "epoch": 315, "lr": 4.654434645502593e-05} +{"train_loss": 0.0014508686726912856, "global_step": 37511, "epoch": 315, "lr": 4.654213624644408e-05} +{"train_loss": 0.001997999846935272, "global_step": 37512, "epoch": 315, "lr": 4.653992604465137e-05} +{"train_loss": 0.0016316965920850635, "global_step": 37513, "epoch": 315, "lr": 4.653771584965216e-05} +{"train_loss": 0.0014774218434467912, "global_step": 37514, "epoch": 315, "lr": 4.653550566145075e-05} +{"train_loss": 0.003932006657123566, "global_step": 37515, "epoch": 315, "lr": 4.6533295480051535e-05} +{"train_loss": 0.0026831331197172403, "global_step": 37516, "epoch": 315, "lr": 4.653108530545882e-05} +{"train_loss": 0.0007815337157808244, "global_step": 37517, "epoch": 315, "lr": 4.6528875137676924e-05} +{"train_loss": 0.0024794968776404858, "global_step": 37518, "epoch": 315, "lr": 4.652666497671024e-05} +{"train_loss": 0.0018617413006722927, "global_step": 37519, "epoch": 315, "lr": 4.6524454822563045e-05} +{"train_loss": 0.0019926715176552534, "global_step": 37520, "epoch": 315, "lr": 4.652224467523974e-05} +{"train_loss": 0.0023579527623951435, "global_step": 37521, "epoch": 315, "lr": 4.652003453474461e-05} +{"train_loss": 0.0017975466325879097, "global_step": 37522, "epoch": 315, "lr": 4.651782440108205e-05} +{"train_loss": 0.0011467705480754375, "global_step": 37523, "epoch": 315, "lr": 4.651561427425636e-05} +{"train_loss": 0.003285417566075921, "global_step": 37524, "epoch": 315, "lr": 4.651340415427188e-05} +{"train_loss": 0.0028884545899927616, "global_step": 37525, "epoch": 315, "lr": 4.651119404113296e-05} +{"train_loss": 0.001947028678841889, "global_step": 37526, "epoch": 315, "lr": 4.650898393484394e-05} +{"train_loss": 0.0023177005350589752, "global_step": 37527, "epoch": 315, "lr": 4.650677383540916e-05} +{"train_loss": 0.0030101092997938395, "global_step": 37528, "epoch": 315, "lr": 4.650456374283296e-05} +{"train_loss": 0.004340033978223801, "global_step": 37529, "epoch": 315, "lr": 4.6502353657119665e-05} +{"train_loss": 0.00253856903873384, "global_step": 37530, "epoch": 315, "lr": 4.6500143578273645e-05} +{"train_loss": 0.00203466578386724, "global_step": 37531, "epoch": 315, "lr": 4.649793350629918e-05} +{"train_loss": 0.0028059189207851887, "global_step": 37532, "epoch": 315, "lr": 4.649572344120069e-05} +{"train_loss": 0.0015918392455205321, "global_step": 37533, "epoch": 315, "lr": 4.6493513382982444e-05} +{"train_loss": 0.0027091563679277897, "global_step": 37534, "epoch": 315, "lr": 4.6491303331648827e-05} +{"train_loss": 0.0024098732974380255, "global_step": 37535, "epoch": 315, "lr": 4.648909328720417e-05} +{"train_loss": 0.003757922910153866, "global_step": 37536, "epoch": 315, "lr": 4.6486883249652774e-05} +{"train_loss": 0.0021306793205440044, "global_step": 37537, "epoch": 315, "lr": 4.648467321899904e-05} +{"train_loss": 0.004044846631586552, "global_step": 37538, "epoch": 315, "lr": 4.648246319524724e-05} +{"train_loss": 0.003974525257945061, "global_step": 37539, "epoch": 315, "lr": 4.6480253178401775e-05} +{"train_loss": 0.002285906346514821, "global_step": 37540, "epoch": 315, "lr": 4.6478043168466934e-05} +{"train_loss": 0.001624777098186314, "global_step": 37541, "epoch": 315, "lr": 4.64758331654471e-05} +{"train_loss": 0.002833607140928507, "global_step": 37542, "epoch": 315, "lr": 4.6473623169346584e-05} +{"train_loss": 0.00267200474627316, "global_step": 37543, "epoch": 315, "lr": 4.647141318016973e-05} +{"train_loss": 0.0012547054793685675, "global_step": 37544, "epoch": 315, "lr": 4.646920319792088e-05} +{"train_loss": 0.00217262445949018, "global_step": 37545, "epoch": 315, "lr": 4.646699322260435e-05} +{"train_loss": 0.00280979136005044, "global_step": 37546, "epoch": 315, "lr": 4.646478325422454e-05} +{"train_loss": 0.001529988250695169, "global_step": 37547, "epoch": 315, "lr": 4.6462573292785745e-05} +{"train_loss": 0.0019805256742984056, "global_step": 37548, "epoch": 315, "lr": 4.6460363338292286e-05} +{"train_loss": 0.0032489525619894266, "global_step": 37549, "epoch": 315, "lr": 4.645815339074855e-05} +{"train_loss": 0.0024480209685862064, "global_step": 37550, "epoch": 315, "lr": 4.6455943450158826e-05} +{"train_loss": 0.0017853961326181889, "global_step": 37551, "epoch": 315, "lr": 4.64537335165275e-05} +{"train_loss": 0.0021859966218471527, "global_step": 37552, "epoch": 315, "lr": 4.645152358985887e-05} +{"train_loss": 0.0029920144006609917, "global_step": 37553, "epoch": 315, "lr": 4.6449313670157314e-05} +{"train_loss": 0.0017445912817493081, "global_step": 37554, "epoch": 315, "lr": 4.6447103757427154e-05} +{"train_loss": 0.0025800212752074003, "global_step": 37555, "epoch": 315, "lr": 4.6444893851672696e-05} +{"train_loss": 0.0023188870400190353, "global_step": 37556, "epoch": 315, "lr": 4.644268395289834e-05} +{"train_loss": 0.002681811572983861, "global_step": 37557, "epoch": 315, "lr": 4.644047406110837e-05} +{"train_loss": 0.0031391207594424486, "global_step": 37558, "epoch": 315, "lr": 4.6438264176307164e-05} +{"train_loss": 0.0025612444151192904, "global_step": 37559, "epoch": 315, "lr": 4.643605429849904e-05} +{"train_loss": 0.002104719402268529, "global_step": 37560, "epoch": 315, "lr": 4.6433844427688344e-05} +{"train_loss": 0.002410746645182371, "global_step": 37561, "epoch": 315, "lr": 4.6431634563879426e-05} +{"train_loss": 0.004809588193893433, "global_step": 37562, "epoch": 315, "lr": 4.642942470707659e-05} +{"train_loss": 0.002508104545995593, "global_step": 37563, "epoch": 315, "lr": 4.642721485728422e-05} +{"train_loss": 0.0019352352246642113, "global_step": 37564, "epoch": 315, "lr": 4.64250050145066e-05} +{"train_loss": 0.0036396582145243883, "global_step": 37565, "epoch": 315, "lr": 4.6422795178748135e-05} +{"train_loss": 0.0022748273331671953, "global_step": 37566, "epoch": 315, "lr": 4.642058535001312e-05} +{"train_loss": 0.0031796940602362156, "global_step": 37567, "epoch": 315, "lr": 4.641837552830589e-05} +{"train_loss": 0.002989885164424777, "global_step": 37568, "epoch": 315, "lr": 4.641616571363082e-05} +{"train_loss": 0.0044054025784134865, "global_step": 37569, "epoch": 315, "lr": 4.64139559059922e-05} +{"train_loss": 0.0018832063069567084, "global_step": 37570, "epoch": 315, "lr": 4.641174610539441e-05} +{"train_loss": 0.0025078963954001665, "global_step": 37571, "epoch": 315, "lr": 4.6409536311841754e-05} +{"train_loss": 0.002006930997595191, "global_step": 37572, "epoch": 315, "lr": 4.640732652533862e-05} +{"train_loss": 0.0023394355084747076, "global_step": 37573, "epoch": 315, "lr": 4.6405116745889296e-05} +{"train_loss": 0.002562417881563306, "global_step": 37574, "epoch": 315, "lr": 4.640290697349815e-05} +{"train_loss": 0.003097285283729434, "global_step": 37575, "epoch": 315, "lr": 4.640069720816951e-05} +{"train_loss": 0.0023353651631623507, "global_step": 37576, "epoch": 315, "lr": 4.639848744990771e-05} +{"train_loss": 0.004240019246935844, "global_step": 37577, "epoch": 315, "lr": 4.63962776987171e-05} +{"train_loss": 0.0035367875825613737, "global_step": 37578, "epoch": 315, "lr": 4.639406795460201e-05} +{"train_loss": 0.0015685458201915026, "global_step": 37579, "epoch": 315, "lr": 4.6391858217566786e-05} +{"train_loss": 0.0023722797632217407, "global_step": 37580, "epoch": 315, "lr": 4.638964848761577e-05} +{"train_loss": 0.0025027720257639885, "global_step": 37581, "epoch": 315, "lr": 4.638743876475328e-05} +{"train_loss": 0.002600844018161297, "global_step": 37582, "epoch": 315, "lr": 4.638522904898368e-05} +{"train_loss": 0.0026620300486683846, "global_step": 37583, "epoch": 315, "lr": 4.638301934031129e-05} +{"train_loss": 0.002702052239328623, "global_step": 37584, "epoch": 315, "lr": 4.638080963874046e-05} +{"train_loss": 0.002416865201666951, "global_step": 37585, "epoch": 315, "lr": 4.637859994427552e-05} +{"train_loss": 0.0034303630236536264, "global_step": 37586, "epoch": 315, "lr": 4.637639025692081e-05} +{"train_loss": 0.0014449324226006866, "global_step": 37587, "epoch": 315, "lr": 4.6374180576680684e-05} +{"train_loss": 0.0037063362542539835, "global_step": 37588, "epoch": 315, "lr": 4.637197090355944e-05} +{"train_loss": 0.0015605028020218015, "global_step": 37589, "epoch": 315, "lr": 4.6369761237561474e-05} +{"train_loss": 0.001967035699635744, "global_step": 37590, "epoch": 315, "lr": 4.636755157869106e-05} +{"train_loss": 0.003099672729149461, "global_step": 37591, "epoch": 315, "lr": 4.63653419269526e-05} +{"train_loss": 0.0018612855346873403, "global_step": 37592, "epoch": 315, "lr": 4.6363132282350394e-05} +{"train_loss": 0.002191288163885474, "global_step": 37593, "epoch": 315, "lr": 4.636092264488878e-05} +{"train_loss": 0.0037000980228185654, "global_step": 37594, "epoch": 315, "lr": 4.635871301457212e-05} +{"train_loss": 0.00177636684384197, "global_step": 37595, "epoch": 315, "lr": 4.635650339140471e-05} +{"train_loss": 0.001954283332452178, "global_step": 37596, "epoch": 315, "lr": 4.635429377539095e-05} +{"train_loss": 0.0031474244315177202, "global_step": 37597, "epoch": 315, "lr": 4.635208416653515e-05} +{"train_loss": 0.002048888709396124, "global_step": 37598, "epoch": 315, "lr": 4.6349874564841614e-05} +{"train_loss": 0.00245582964271307, "global_step": 37599, "epoch": 315, "lr": 4.634766497031472e-05} +{"train_loss": 0.0013835289282724261, "global_step": 37600, "epoch": 315, "lr": 4.634545538295879e-05} +{"train_loss": 0.0023286016657948494, "global_step": 37601, "epoch": 315, "lr": 4.634324580277818e-05} +{"train_loss": 0.0022081034258008003, "global_step": 37602, "epoch": 315, "lr": 4.6341036229777203e-05} +{"train_loss": 0.0023831985054435915, "global_step": 37603, "epoch": 315, "lr": 4.633882666396023e-05, "val_loss": 0.01935475505888462, "train_action_mse_error": 3.363796349731274e-05} +{"train_loss": 0.0030233622528612614, "global_step": 37604, "epoch": 316, "lr": 4.6336617105331575e-05} +{"train_loss": 0.00564684858545661, "global_step": 37605, "epoch": 316, "lr": 4.6334407553895567e-05} +{"train_loss": 0.0019743938464671373, "global_step": 37606, "epoch": 316, "lr": 4.633219800965656e-05} +{"train_loss": 0.0023855334147810936, "global_step": 37607, "epoch": 316, "lr": 4.632998847261889e-05} +{"train_loss": 0.005262457299977541, "global_step": 37608, "epoch": 316, "lr": 4.6327778942786905e-05} +{"train_loss": 0.003300644923001528, "global_step": 37609, "epoch": 316, "lr": 4.6325569420164924e-05} +{"train_loss": 0.002084453357383609, "global_step": 37610, "epoch": 316, "lr": 4.63233599047573e-05} +{"train_loss": 0.0019654855132102966, "global_step": 37611, "epoch": 316, "lr": 4.6321150396568374e-05} +{"train_loss": 0.0026327925734221935, "global_step": 37612, "epoch": 316, "lr": 4.631894089560246e-05} +{"train_loss": 0.0016974906902760267, "global_step": 37613, "epoch": 316, "lr": 4.631673140186393e-05} +{"train_loss": 0.0026381080970168114, "global_step": 37614, "epoch": 316, "lr": 4.631452191535709e-05} +{"train_loss": 0.0025860206224024296, "global_step": 37615, "epoch": 316, "lr": 4.63123124360863e-05} +{"train_loss": 0.0024779450614005327, "global_step": 37616, "epoch": 316, "lr": 4.6310102964055897e-05} +{"train_loss": 0.0019160584779456258, "global_step": 37617, "epoch": 316, "lr": 4.630789349927019e-05} +{"train_loss": 0.002033982193097472, "global_step": 37618, "epoch": 316, "lr": 4.6305684041733566e-05} +{"train_loss": 0.0022832071408629417, "global_step": 37619, "epoch": 316, "lr": 4.6303474591450314e-05} +{"train_loss": 0.002361153019592166, "global_step": 37620, "epoch": 316, "lr": 4.630126514842481e-05} +{"train_loss": 0.0036916055250912905, "global_step": 37621, "epoch": 316, "lr": 4.629905571266136e-05} +{"train_loss": 0.0026590083725750446, "global_step": 37622, "epoch": 316, "lr": 4.629684628416434e-05} +{"train_loss": 0.0014264866476878524, "global_step": 37623, "epoch": 316, "lr": 4.629463686293806e-05} +{"train_loss": 0.0027847776655107737, "global_step": 37624, "epoch": 316, "lr": 4.629242744898686e-05} +{"train_loss": 0.0029133292846381664, "global_step": 37625, "epoch": 316, "lr": 4.629021804231508e-05} +{"train_loss": 0.0011770061682909727, "global_step": 37626, "epoch": 316, "lr": 4.628800864292707e-05} +{"train_loss": 0.0018585888901725411, "global_step": 37627, "epoch": 316, "lr": 4.628579925082715e-05} +{"train_loss": 0.0022639979142695665, "global_step": 37628, "epoch": 316, "lr": 4.628358986601965e-05} +{"train_loss": 0.0014388908166438341, "global_step": 37629, "epoch": 316, "lr": 4.628138048850896e-05} +{"train_loss": 0.0014476452488452196, "global_step": 37630, "epoch": 316, "lr": 4.6279171118299376e-05} +{"train_loss": 0.0014439848018810153, "global_step": 37631, "epoch": 316, "lr": 4.627696175539522e-05} +{"train_loss": 0.002061353763565421, "global_step": 37632, "epoch": 316, "lr": 4.6274752399800874e-05} +{"train_loss": 0.0022721863351762295, "global_step": 37633, "epoch": 316, "lr": 4.627254305152063e-05} +{"train_loss": 0.002784754615277052, "global_step": 37634, "epoch": 316, "lr": 4.627033371055887e-05} +{"train_loss": 0.005059509072452784, "global_step": 37635, "epoch": 316, "lr": 4.626812437691992e-05} +{"train_loss": 0.0013147162972018123, "global_step": 37636, "epoch": 316, "lr": 4.626591505060808e-05} +{"train_loss": 0.0022463302593678236, "global_step": 37637, "epoch": 316, "lr": 4.626370573162774e-05} +{"train_loss": 0.0018051418010145426, "global_step": 37638, "epoch": 316, "lr": 4.6261496419983194e-05} +{"train_loss": 0.003972742240875959, "global_step": 37639, "epoch": 316, "lr": 4.625928711567882e-05} +{"train_loss": 0.0018716498743742704, "global_step": 37640, "epoch": 316, "lr": 4.625707781871891e-05} +{"train_loss": 0.0013801134191453457, "global_step": 37641, "epoch": 316, "lr": 4.625486852910785e-05} +{"train_loss": 0.0028804766479879618, "global_step": 37642, "epoch": 316, "lr": 4.625265924684996e-05} +{"train_loss": 0.0015757051296532154, "global_step": 37643, "epoch": 316, "lr": 4.625044997194955e-05} +{"train_loss": 0.001954038394615054, "global_step": 37644, "epoch": 316, "lr": 4.624824070441101e-05} +{"train_loss": 0.0013981976080685854, "global_step": 37645, "epoch": 316, "lr": 4.624603144423862e-05} +{"train_loss": 0.0015400308184325695, "global_step": 37646, "epoch": 316, "lr": 4.624382219143677e-05} +{"train_loss": 0.003417191095650196, "global_step": 37647, "epoch": 316, "lr": 4.624161294600977e-05} +{"train_loss": 0.0024771932512521744, "global_step": 37648, "epoch": 316, "lr": 4.623940370796194e-05} +{"train_loss": 0.001277648494578898, "global_step": 37649, "epoch": 316, "lr": 4.623719447729767e-05} +{"train_loss": 0.0042248982936143875, "global_step": 37650, "epoch": 316, "lr": 4.6234985254021236e-05} +{"train_loss": 0.0016446539666503668, "global_step": 37651, "epoch": 316, "lr": 4.623277603813703e-05} +{"train_loss": 0.0025958078913390636, "global_step": 37652, "epoch": 316, "lr": 4.623056682964935e-05} +{"train_loss": 0.001489314716309309, "global_step": 37653, "epoch": 316, "lr": 4.6228357628562566e-05} +{"train_loss": 0.0023278805892914534, "global_step": 37654, "epoch": 316, "lr": 4.622614843488099e-05} +{"train_loss": 0.0015892493538558483, "global_step": 37655, "epoch": 316, "lr": 4.6223939248608964e-05} +{"train_loss": 0.001522229751572013, "global_step": 37656, "epoch": 316, "lr": 4.622173006975083e-05} +{"train_loss": 0.002150357933714986, "global_step": 37657, "epoch": 316, "lr": 4.621952089831093e-05} +{"train_loss": 0.0014880654634907842, "global_step": 37658, "epoch": 316, "lr": 4.6217311734293586e-05} +{"train_loss": 0.0030363542027771473, "global_step": 37659, "epoch": 316, "lr": 4.621510257770316e-05} +{"train_loss": 0.001916257431730628, "global_step": 37660, "epoch": 316, "lr": 4.621289342854397e-05} +{"train_loss": 0.0027032094076275826, "global_step": 37661, "epoch": 316, "lr": 4.621068428682036e-05} +{"train_loss": 0.00177003163844347, "global_step": 37662, "epoch": 316, "lr": 4.620847515253666e-05} +{"train_loss": 0.002489810111001134, "global_step": 37663, "epoch": 316, "lr": 4.620626602569723e-05} +{"train_loss": 0.0033873433712869883, "global_step": 37664, "epoch": 316, "lr": 4.6204056906306375e-05} +{"train_loss": 0.0022672037594020367, "global_step": 37665, "epoch": 316, "lr": 4.620184779436846e-05} +{"train_loss": 0.0017353123985230923, "global_step": 37666, "epoch": 316, "lr": 4.6199638689887825e-05} +{"train_loss": 0.005205641966313124, "global_step": 37667, "epoch": 316, "lr": 4.6197429592868763e-05} +{"train_loss": 0.0011547990143299103, "global_step": 37668, "epoch": 316, "lr": 4.619522050331566e-05} +{"train_loss": 0.0031645966228097677, "global_step": 37669, "epoch": 316, "lr": 4.619301142123282e-05} +{"train_loss": 0.00180872343480587, "global_step": 37670, "epoch": 316, "lr": 4.619080234662461e-05} +{"train_loss": 0.001184012508019805, "global_step": 37671, "epoch": 316, "lr": 4.618859327949534e-05} +{"train_loss": 0.0018044456373900175, "global_step": 37672, "epoch": 316, "lr": 4.618638421984938e-05} +{"train_loss": 0.0014930791221559048, "global_step": 37673, "epoch": 316, "lr": 4.618417516769103e-05} +{"train_loss": 0.0025029685348272324, "global_step": 37674, "epoch": 316, "lr": 4.618196612302465e-05} +{"train_loss": 0.001994050107896328, "global_step": 37675, "epoch": 316, "lr": 4.617975708585457e-05} +{"train_loss": 0.001562593737617135, "global_step": 37676, "epoch": 316, "lr": 4.617754805618511e-05} +{"train_loss": 0.0024132586549967527, "global_step": 37677, "epoch": 316, "lr": 4.6175339034020656e-05} +{"train_loss": 0.0013556984486058354, "global_step": 37678, "epoch": 316, "lr": 4.617313001936549e-05} +{"train_loss": 0.0021536860149353743, "global_step": 37679, "epoch": 316, "lr": 4.6170921012224006e-05} +{"train_loss": 0.0032570476178079844, "global_step": 37680, "epoch": 316, "lr": 4.61687120126005e-05} +{"train_loss": 0.001996445469558239, "global_step": 37681, "epoch": 316, "lr": 4.61665030204993e-05} +{"train_loss": 0.002096722135320306, "global_step": 37682, "epoch": 316, "lr": 4.616429403592478e-05} +{"train_loss": 0.002369299530982971, "global_step": 37683, "epoch": 316, "lr": 4.616208505888125e-05} +{"train_loss": 0.00224303244613111, "global_step": 37684, "epoch": 316, "lr": 4.615987608937306e-05} +{"train_loss": 0.0023557001259177923, "global_step": 37685, "epoch": 316, "lr": 4.615766712740455e-05} +{"train_loss": 0.001373408129438758, "global_step": 37686, "epoch": 316, "lr": 4.615545817298003e-05} +{"train_loss": 0.001790954964235425, "global_step": 37687, "epoch": 316, "lr": 4.6153249226103876e-05} +{"train_loss": 0.002238336717709899, "global_step": 37688, "epoch": 316, "lr": 4.615104028678039e-05} +{"train_loss": 0.0025980777572840452, "global_step": 37689, "epoch": 316, "lr": 4.6148831355013944e-05} +{"train_loss": 0.0025923498906195164, "global_step": 37690, "epoch": 316, "lr": 4.6146622430808834e-05} +{"train_loss": 0.002795238746330142, "global_step": 37691, "epoch": 316, "lr": 4.614441351416943e-05} +{"train_loss": 0.0019332480151206255, "global_step": 37692, "epoch": 316, "lr": 4.614220460510007e-05} +{"train_loss": 0.00241463677957654, "global_step": 37693, "epoch": 316, "lr": 4.6139995703605057e-05} +{"train_loss": 0.003372438717633486, "global_step": 37694, "epoch": 316, "lr": 4.613778680968877e-05} +{"train_loss": 0.0015210724668577313, "global_step": 37695, "epoch": 316, "lr": 4.61355779233555e-05} +{"train_loss": 0.0017890920862555504, "global_step": 37696, "epoch": 316, "lr": 4.613336904460964e-05} +{"train_loss": 0.001438760431483388, "global_step": 37697, "epoch": 316, "lr": 4.613116017345547e-05} +{"train_loss": 0.0018223453080281615, "global_step": 37698, "epoch": 316, "lr": 4.6128951309897376e-05} +{"train_loss": 0.002154688350856304, "global_step": 37699, "epoch": 316, "lr": 4.6126742453939676e-05} +{"train_loss": 0.0021404612343758345, "global_step": 37700, "epoch": 316, "lr": 4.612453360558668e-05} +{"train_loss": 0.0011220461456105113, "global_step": 37701, "epoch": 316, "lr": 4.612232476484277e-05} +{"train_loss": 0.0018829734763130546, "global_step": 37702, "epoch": 316, "lr": 4.612011593171224e-05} +{"train_loss": 0.003385160816833377, "global_step": 37703, "epoch": 316, "lr": 4.6117907106199466e-05} +{"train_loss": 0.0012426389148458838, "global_step": 37704, "epoch": 316, "lr": 4.6115698288308756e-05} +{"train_loss": 0.0027801645919680595, "global_step": 37705, "epoch": 316, "lr": 4.611348947804446e-05} +{"train_loss": 0.0028744342271238565, "global_step": 37706, "epoch": 316, "lr": 4.611128067541091e-05} +{"train_loss": 0.002370893256738782, "global_step": 37707, "epoch": 316, "lr": 4.6109071880412445e-05} +{"train_loss": 0.002440550597384572, "global_step": 37708, "epoch": 316, "lr": 4.610686309305341e-05} +{"train_loss": 0.0011221987660974264, "global_step": 37709, "epoch": 316, "lr": 4.610465431333813e-05} +{"train_loss": 0.0023347006645053625, "global_step": 37710, "epoch": 316, "lr": 4.610244554127093e-05} +{"train_loss": 0.002301805652678013, "global_step": 37711, "epoch": 316, "lr": 4.610023677685619e-05} +{"train_loss": 0.0018403963185846806, "global_step": 37712, "epoch": 316, "lr": 4.6098028020098196e-05} +{"train_loss": 0.002070465823635459, "global_step": 37713, "epoch": 316, "lr": 4.609581927100132e-05} +{"train_loss": 0.002719075186178088, "global_step": 37714, "epoch": 316, "lr": 4.609361052956987e-05} +{"train_loss": 0.0025844338815659285, "global_step": 37715, "epoch": 316, "lr": 4.6091401795808216e-05} +{"train_loss": 0.0018432147335261106, "global_step": 37716, "epoch": 316, "lr": 4.6089193069720685e-05} +{"train_loss": 0.0015820827102288604, "global_step": 37717, "epoch": 316, "lr": 4.6086984351311574e-05} +{"train_loss": 0.0027757587376981974, "global_step": 37718, "epoch": 316, "lr": 4.6084775640585276e-05} +{"train_loss": 0.0019625197164714336, "global_step": 37719, "epoch": 316, "lr": 4.608256693754608e-05} +{"train_loss": 0.003444560104981065, "global_step": 37720, "epoch": 316, "lr": 4.608035824219837e-05} +{"train_loss": 0.0009378489339724183, "global_step": 37721, "epoch": 316, "lr": 4.6078149554546436e-05} +{"train_loss": 0.0022730398365539035, "global_step": 37722, "epoch": 316, "lr": 4.607594087459466e-05, "val_loss": 0.010397644713521004} +{"train_loss": 0.002384469611570239, "global_step": 37723, "epoch": 317, "lr": 4.6073732202347335e-05} +{"train_loss": 0.002410131972283125, "global_step": 37724, "epoch": 317, "lr": 4.607152353780882e-05} +{"train_loss": 0.0018313052132725716, "global_step": 37725, "epoch": 317, "lr": 4.606931488098346e-05} +{"train_loss": 0.0014138504629954696, "global_step": 37726, "epoch": 317, "lr": 4.606710623187556e-05} +{"train_loss": 0.0007764108013361692, "global_step": 37727, "epoch": 317, "lr": 4.60648975904895e-05} +{"train_loss": 0.002333629410713911, "global_step": 37728, "epoch": 317, "lr": 4.6062688956829575e-05} +{"train_loss": 0.0029705192428082228, "global_step": 37729, "epoch": 317, "lr": 4.606048033090016e-05} +{"train_loss": 0.0019723577424883842, "global_step": 37730, "epoch": 317, "lr": 4.605827171270556e-05} +{"train_loss": 0.002587745664641261, "global_step": 37731, "epoch": 317, "lr": 4.605606310225011e-05} +{"train_loss": 0.0022332218941301107, "global_step": 37732, "epoch": 317, "lr": 4.6053854499538186e-05} +{"train_loss": 0.0014555006055161357, "global_step": 37733, "epoch": 317, "lr": 4.605164590457407e-05} +{"train_loss": 0.0019916994497179985, "global_step": 37734, "epoch": 317, "lr": 4.6049437317362145e-05} +{"train_loss": 0.002173281740397215, "global_step": 37735, "epoch": 317, "lr": 4.604722873790674e-05} +{"train_loss": 0.0018998500891029835, "global_step": 37736, "epoch": 317, "lr": 4.6045020166212135e-05} +{"train_loss": 0.0017552380450069904, "global_step": 37737, "epoch": 317, "lr": 4.6042811602282746e-05} +{"train_loss": 0.0016788386274129152, "global_step": 37738, "epoch": 317, "lr": 4.604060304612285e-05} +{"train_loss": 0.0024733603931963444, "global_step": 37739, "epoch": 317, "lr": 4.603839449773682e-05} +{"train_loss": 0.0012506382772698998, "global_step": 37740, "epoch": 317, "lr": 4.603618595712897e-05} +{"train_loss": 0.002385457744821906, "global_step": 37741, "epoch": 317, "lr": 4.603397742430366e-05} +{"train_loss": 0.002216937718912959, "global_step": 37742, "epoch": 317, "lr": 4.6031768899265215e-05} +{"train_loss": 0.0025323897134512663, "global_step": 37743, "epoch": 317, "lr": 4.6029560382017945e-05} +{"train_loss": 0.0021299973595887423, "global_step": 37744, "epoch": 317, "lr": 4.602735187256623e-05} +{"train_loss": 0.0018740235827863216, "global_step": 37745, "epoch": 317, "lr": 4.6025143370914364e-05} +{"train_loss": 0.002448495477437973, "global_step": 37746, "epoch": 317, "lr": 4.6022934877066725e-05} +{"train_loss": 0.0010127455461770296, "global_step": 37747, "epoch": 317, "lr": 4.602072639102761e-05} +{"train_loss": 0.0025676568038761616, "global_step": 37748, "epoch": 317, "lr": 4.6018517912801396e-05} +{"train_loss": 0.002354988595470786, "global_step": 37749, "epoch": 317, "lr": 4.60163094423924e-05} +{"train_loss": 0.0014053458580747247, "global_step": 37750, "epoch": 317, "lr": 4.6014100979804925e-05} +{"train_loss": 0.0012436375254765153, "global_step": 37751, "epoch": 317, "lr": 4.601189252504336e-05} +{"train_loss": 0.002450519008561969, "global_step": 37752, "epoch": 317, "lr": 4.6009684078112e-05} +{"train_loss": 0.002190537052229047, "global_step": 37753, "epoch": 317, "lr": 4.6007475639015216e-05} +{"train_loss": 0.0025332211516797543, "global_step": 37754, "epoch": 317, "lr": 4.600526720775732e-05} +{"train_loss": 0.001000216230750084, "global_step": 37755, "epoch": 317, "lr": 4.6003058784342655e-05} +{"train_loss": 0.0017725109355524182, "global_step": 37756, "epoch": 317, "lr": 4.600085036877556e-05} +{"train_loss": 0.0020799010526388884, "global_step": 37757, "epoch": 317, "lr": 4.5998641961060356e-05} +{"train_loss": 0.0018366931471973658, "global_step": 37758, "epoch": 317, "lr": 4.5996433561201404e-05} +{"train_loss": 0.0010562526294961572, "global_step": 37759, "epoch": 317, "lr": 4.599422516920302e-05} +{"train_loss": 0.001275460934266448, "global_step": 37760, "epoch": 317, "lr": 4.5992016785069546e-05} +{"train_loss": 0.0020816263277083635, "global_step": 37761, "epoch": 317, "lr": 4.5989808408805334e-05} +{"train_loss": 0.0016657330561429262, "global_step": 37762, "epoch": 317, "lr": 4.5987600040414686e-05} +{"train_loss": 0.0017363883089274168, "global_step": 37763, "epoch": 317, "lr": 4.5985391679901973e-05} +{"train_loss": 0.0014209680957719684, "global_step": 37764, "epoch": 317, "lr": 4.59831833272715e-05} +{"train_loss": 0.004196261987090111, "global_step": 37765, "epoch": 317, "lr": 4.5980974982527625e-05} +{"train_loss": 0.0014914496568962932, "global_step": 37766, "epoch": 317, "lr": 4.5978766645674684e-05} +{"train_loss": 0.0012190267443656921, "global_step": 37767, "epoch": 317, "lr": 4.5976558316716984e-05} +{"train_loss": 0.0013333059614524245, "global_step": 37768, "epoch": 317, "lr": 4.59743499956589e-05} +{"train_loss": 0.001988067524507642, "global_step": 37769, "epoch": 317, "lr": 4.597214168250474e-05} +{"train_loss": 0.0027745359111577272, "global_step": 37770, "epoch": 317, "lr": 4.596993337725886e-05} +{"train_loss": 0.002146637300029397, "global_step": 37771, "epoch": 317, "lr": 4.596772507992556e-05} +{"train_loss": 0.002154379151761532, "global_step": 37772, "epoch": 317, "lr": 4.5965516790509235e-05} +{"train_loss": 0.002129447413608432, "global_step": 37773, "epoch": 317, "lr": 4.5963308509014166e-05} +{"train_loss": 0.002122645266354084, "global_step": 37774, "epoch": 317, "lr": 4.59611002354447e-05} +{"train_loss": 0.0012775417417287827, "global_step": 37775, "epoch": 317, "lr": 4.595889196980521e-05} +{"train_loss": 0.0035793581046164036, "global_step": 37776, "epoch": 317, "lr": 4.595668371209998e-05} +{"train_loss": 0.002183441771194339, "global_step": 37777, "epoch": 317, "lr": 4.595447546233339e-05} +{"train_loss": 0.0019865052308887243, "global_step": 37778, "epoch": 317, "lr": 4.5952267220509734e-05} +{"train_loss": 0.0018078408902511, "global_step": 37779, "epoch": 317, "lr": 4.595005898663339e-05} +{"train_loss": 0.001470229821279645, "global_step": 37780, "epoch": 317, "lr": 4.594785076070867e-05} +{"train_loss": 0.002752402564510703, "global_step": 37781, "epoch": 317, "lr": 4.594564254273989e-05} +{"train_loss": 0.0021908485796302557, "global_step": 37782, "epoch": 317, "lr": 4.594343433273143e-05} +{"train_loss": 0.0020876929629594088, "global_step": 37783, "epoch": 317, "lr": 4.5941226130687586e-05} +{"train_loss": 0.002058200305327773, "global_step": 37784, "epoch": 317, "lr": 4.5939017936612734e-05} +{"train_loss": 0.0033443167340010405, "global_step": 37785, "epoch": 317, "lr": 4.5936809750511186e-05} +{"train_loss": 0.0017148631159216166, "global_step": 37786, "epoch": 317, "lr": 4.5934601572387246e-05} +{"train_loss": 0.0032119506504386663, "global_step": 37787, "epoch": 317, "lr": 4.59323934022453e-05} +{"train_loss": 0.00328113348223269, "global_step": 37788, "epoch": 317, "lr": 4.593018524008967e-05} +{"train_loss": 0.002439668867737055, "global_step": 37789, "epoch": 317, "lr": 4.592797708592468e-05} +{"train_loss": 0.002489923033863306, "global_step": 37790, "epoch": 317, "lr": 4.592576893975467e-05} +{"train_loss": 0.0016165048582479358, "global_step": 37791, "epoch": 317, "lr": 4.5923560801583984e-05} +{"train_loss": 0.0013916261959820986, "global_step": 37792, "epoch": 317, "lr": 4.5921352671416955e-05} +{"train_loss": 0.00239941175095737, "global_step": 37793, "epoch": 317, "lr": 4.591914454925789e-05} +{"train_loss": 0.0013798701111227274, "global_step": 37794, "epoch": 317, "lr": 4.591693643511118e-05} +{"train_loss": 0.0016040198970586061, "global_step": 37795, "epoch": 317, "lr": 4.5914728328981104e-05} +{"train_loss": 0.0017571907956153154, "global_step": 37796, "epoch": 317, "lr": 4.591252023087204e-05} +{"train_loss": 0.002012865152209997, "global_step": 37797, "epoch": 317, "lr": 4.591031214078829e-05} +{"train_loss": 0.0023309881798923016, "global_step": 37798, "epoch": 317, "lr": 4.5908104058734226e-05} +{"train_loss": 0.0024013405200093985, "global_step": 37799, "epoch": 317, "lr": 4.590589598471416e-05} +{"train_loss": 0.0015521117020398378, "global_step": 37800, "epoch": 317, "lr": 4.5903687918732406e-05} +{"train_loss": 0.003150917822495103, "global_step": 37801, "epoch": 317, "lr": 4.590147986079335e-05} +{"train_loss": 0.0009089431841857731, "global_step": 37802, "epoch": 317, "lr": 4.5899271810901276e-05} +{"train_loss": 0.0025916132144629955, "global_step": 37803, "epoch": 317, "lr": 4.5897063769060566e-05} +{"train_loss": 0.00232766498811543, "global_step": 37804, "epoch": 317, "lr": 4.5894855735275525e-05} +{"train_loss": 0.0029178832191973925, "global_step": 37805, "epoch": 317, "lr": 4.58926477095505e-05} +{"train_loss": 0.002087644301354885, "global_step": 37806, "epoch": 317, "lr": 4.589043969188981e-05} +{"train_loss": 0.0018693783786147833, "global_step": 37807, "epoch": 317, "lr": 4.588823168229781e-05} +{"train_loss": 0.0015117148868739605, "global_step": 37808, "epoch": 317, "lr": 4.588602368077882e-05} +{"train_loss": 0.0015836585080251098, "global_step": 37809, "epoch": 317, "lr": 4.588381568733718e-05} +{"train_loss": 0.002862835768610239, "global_step": 37810, "epoch": 317, "lr": 4.588160770197725e-05} +{"train_loss": 0.001588856102898717, "global_step": 37811, "epoch": 317, "lr": 4.587939972470334e-05} +{"train_loss": 0.0013258106773719192, "global_step": 37812, "epoch": 317, "lr": 4.587719175551977e-05} +{"train_loss": 0.0010051928693428636, "global_step": 37813, "epoch": 317, "lr": 4.587498379443092e-05} +{"train_loss": 0.0018000041600316763, "global_step": 37814, "epoch": 317, "lr": 4.587277584144106e-05} +{"train_loss": 0.002140494529157877, "global_step": 37815, "epoch": 317, "lr": 4.5870567896554604e-05} +{"train_loss": 0.0029241761658340693, "global_step": 37816, "epoch": 317, "lr": 4.5868359959775815e-05} +{"train_loss": 0.002199205569922924, "global_step": 37817, "epoch": 317, "lr": 4.586615203110908e-05} +{"train_loss": 0.0023659002035856247, "global_step": 37818, "epoch": 317, "lr": 4.586394411055872e-05} +{"train_loss": 0.0015521821333095431, "global_step": 37819, "epoch": 317, "lr": 4.586173619812904e-05} +{"train_loss": 0.0012016756227239966, "global_step": 37820, "epoch": 317, "lr": 4.585952829382441e-05} +{"train_loss": 0.0017739159520715475, "global_step": 37821, "epoch": 317, "lr": 4.585732039764915e-05} +{"train_loss": 0.002075737342238426, "global_step": 37822, "epoch": 317, "lr": 4.58551125096076e-05} +{"train_loss": 0.001883148797787726, "global_step": 37823, "epoch": 317, "lr": 4.585290462970411e-05} +{"train_loss": 0.001511912327259779, "global_step": 37824, "epoch": 317, "lr": 4.585069675794297e-05} +{"train_loss": 0.0027604354545474052, "global_step": 37825, "epoch": 317, "lr": 4.584848889432857e-05} +{"train_loss": 0.001705292146652937, "global_step": 37826, "epoch": 317, "lr": 4.5846281038865195e-05} +{"train_loss": 0.0014909239253029227, "global_step": 37827, "epoch": 317, "lr": 4.584407319155723e-05} +{"train_loss": 0.0032899240031838417, "global_step": 37828, "epoch": 317, "lr": 4.5841865352408955e-05} +{"train_loss": 0.0033904763404279947, "global_step": 37829, "epoch": 317, "lr": 4.5839657521424765e-05} +{"train_loss": 0.001462325919419527, "global_step": 37830, "epoch": 317, "lr": 4.5837449698608946e-05} +{"train_loss": 0.0015529138036072254, "global_step": 37831, "epoch": 317, "lr": 4.5835241883965844e-05} +{"train_loss": 0.0010723051382228732, "global_step": 37832, "epoch": 317, "lr": 4.583303407749981e-05} +{"train_loss": 0.0020855036564171314, "global_step": 37833, "epoch": 317, "lr": 4.583082627921515e-05} +{"train_loss": 0.003086859593167901, "global_step": 37834, "epoch": 317, "lr": 4.582861848911624e-05} +{"train_loss": 0.002165338024497032, "global_step": 37835, "epoch": 317, "lr": 4.58264107072074e-05} +{"train_loss": 0.002449972089380026, "global_step": 37836, "epoch": 317, "lr": 4.582420293349292e-05} +{"train_loss": 0.0012758866650983691, "global_step": 37837, "epoch": 317, "lr": 4.582199516797719e-05} +{"train_loss": 0.002870737574994564, "global_step": 37838, "epoch": 317, "lr": 4.5819787410664526e-05} +{"train_loss": 0.002199347596615553, "global_step": 37839, "epoch": 317, "lr": 4.581757966155926e-05} +{"train_loss": 0.0014152727089822292, "global_step": 37840, "epoch": 317, "lr": 4.5815371920665734e-05} +{"train_loss": 0.002040923073664777, "global_step": 37841, "epoch": 317, "lr": 4.5813164187988275e-05, "val_loss": 0.020865444093942642} +{"train_loss": 0.0015152947744354606, "global_step": 37842, "epoch": 318, "lr": 4.581095646353124e-05} +{"train_loss": 0.0019650638569146395, "global_step": 37843, "epoch": 318, "lr": 4.5808748747298916e-05} +{"train_loss": 0.0012817200040444732, "global_step": 37844, "epoch": 318, "lr": 4.580654103929568e-05} +{"train_loss": 0.0027504796162247658, "global_step": 37845, "epoch": 318, "lr": 4.580433333952584e-05} +{"train_loss": 0.0028260413091629744, "global_step": 37846, "epoch": 318, "lr": 4.5802125647993765e-05} +{"train_loss": 0.0020528724417090416, "global_step": 37847, "epoch": 318, "lr": 4.579991796470374e-05} +{"train_loss": 0.0020805164240300655, "global_step": 37848, "epoch": 318, "lr": 4.579771028966016e-05} +{"train_loss": 0.0033093474339693785, "global_step": 37849, "epoch": 318, "lr": 4.5795502622867315e-05} +{"train_loss": 0.0015013519441708922, "global_step": 37850, "epoch": 318, "lr": 4.579329496432954e-05} +{"train_loss": 0.0034147603437304497, "global_step": 37851, "epoch": 318, "lr": 4.5791087314051194e-05} +{"train_loss": 0.002561334054917097, "global_step": 37852, "epoch": 318, "lr": 4.578887967203658e-05} +{"train_loss": 0.0021572699770331383, "global_step": 37853, "epoch": 318, "lr": 4.5786672038290074e-05} +{"train_loss": 0.002773182699456811, "global_step": 37854, "epoch": 318, "lr": 4.578446441281598e-05} +{"train_loss": 0.0013110643485561013, "global_step": 37855, "epoch": 318, "lr": 4.578225679561863e-05} +{"train_loss": 0.003072321880608797, "global_step": 37856, "epoch": 318, "lr": 4.578004918670237e-05} +{"train_loss": 0.001993529498577118, "global_step": 37857, "epoch": 318, "lr": 4.577784158607154e-05} +{"train_loss": 0.0034534528385847807, "global_step": 37858, "epoch": 318, "lr": 4.577563399373046e-05} +{"train_loss": 0.000873781566042453, "global_step": 37859, "epoch": 318, "lr": 4.5773426409683466e-05} +{"train_loss": 0.002961938502267003, "global_step": 37860, "epoch": 318, "lr": 4.577121883393491e-05} +{"train_loss": 0.0026975402142852545, "global_step": 37861, "epoch": 318, "lr": 4.576901126648913e-05} +{"train_loss": 0.003019311698153615, "global_step": 37862, "epoch": 318, "lr": 4.576680370735041e-05} +{"train_loss": 0.0017840617801994085, "global_step": 37863, "epoch": 318, "lr": 4.5764596156523145e-05} +{"train_loss": 0.0018741318490356207, "global_step": 37864, "epoch": 318, "lr": 4.5762388614011617e-05} +{"train_loss": 0.002561626024544239, "global_step": 37865, "epoch": 318, "lr": 4.5760181079820215e-05} +{"train_loss": 0.002323295921087265, "global_step": 37866, "epoch": 318, "lr": 4.5757973553953216e-05} +{"train_loss": 0.0021705026738345623, "global_step": 37867, "epoch": 318, "lr": 4.575576603641501e-05} +{"train_loss": 0.001618078676983714, "global_step": 37868, "epoch": 318, "lr": 4.57535585272099e-05} +{"train_loss": 0.0014435389311984181, "global_step": 37869, "epoch": 318, "lr": 4.5751351026342206e-05} +{"train_loss": 0.0015881265280768275, "global_step": 37870, "epoch": 318, "lr": 4.5749143533816294e-05} +{"train_loss": 0.0033056072425097227, "global_step": 37871, "epoch": 318, "lr": 4.5746936049636475e-05} +{"train_loss": 0.002233730396255851, "global_step": 37872, "epoch": 318, "lr": 4.5744728573807094e-05} +{"train_loss": 0.002651914721354842, "global_step": 37873, "epoch": 318, "lr": 4.57425211063325e-05} +{"train_loss": 0.0023028538562357426, "global_step": 37874, "epoch": 318, "lr": 4.574031364721699e-05} +{"train_loss": 0.0012061467859894037, "global_step": 37875, "epoch": 318, "lr": 4.573810619646493e-05} +{"train_loss": 0.0018392375204712152, "global_step": 37876, "epoch": 318, "lr": 4.573589875408063e-05} +{"train_loss": 0.0034427500795572996, "global_step": 37877, "epoch": 318, "lr": 4.573369132006846e-05} +{"train_loss": 0.003253272036090493, "global_step": 37878, "epoch": 318, "lr": 4.573148389443271e-05} +{"train_loss": 0.0023370073176920414, "global_step": 37879, "epoch": 318, "lr": 4.572927647717775e-05} +{"train_loss": 0.003546573221683502, "global_step": 37880, "epoch": 318, "lr": 4.572706906830791e-05} +{"train_loss": 0.0023317928425967693, "global_step": 37881, "epoch": 318, "lr": 4.572486166782749e-05} +{"train_loss": 0.0015737840440124273, "global_step": 37882, "epoch": 318, "lr": 4.572265427574086e-05} +{"train_loss": 0.001902040676213801, "global_step": 37883, "epoch": 318, "lr": 4.5720446892052324e-05} +{"train_loss": 0.002401751698926091, "global_step": 37884, "epoch": 318, "lr": 4.5718239516766255e-05} +{"train_loss": 0.0017491474281996489, "global_step": 37885, "epoch": 318, "lr": 4.571603214988695e-05} +{"train_loss": 0.002392606809735298, "global_step": 37886, "epoch": 318, "lr": 4.571382479141877e-05} +{"train_loss": 0.0020851034205406904, "global_step": 37887, "epoch": 318, "lr": 4.571161744136603e-05} +{"train_loss": 0.0011827992275357246, "global_step": 37888, "epoch": 318, "lr": 4.5709410099733075e-05} +{"train_loss": 0.0021803267300128937, "global_step": 37889, "epoch": 318, "lr": 4.570720276652423e-05} +{"train_loss": 0.0017074467614293098, "global_step": 37890, "epoch": 318, "lr": 4.570499544174383e-05} +{"train_loss": 0.0018866336904466152, "global_step": 37891, "epoch": 318, "lr": 4.570278812539622e-05} +{"train_loss": 0.0015016172546893358, "global_step": 37892, "epoch": 318, "lr": 4.570058081748574e-05} +{"train_loss": 0.0024409641046077013, "global_step": 37893, "epoch": 318, "lr": 4.569837351801668e-05} +{"train_loss": 0.0017624400788918138, "global_step": 37894, "epoch": 318, "lr": 4.569616622699343e-05} +{"train_loss": 0.0025605312548577785, "global_step": 37895, "epoch": 318, "lr": 4.5693958944420274e-05} +{"train_loss": 0.0035366909578442574, "global_step": 37896, "epoch": 318, "lr": 4.569175167030159e-05} +{"train_loss": 0.0021731562446802855, "global_step": 37897, "epoch": 318, "lr": 4.5689544404641677e-05} +{"train_loss": 0.001301631098613143, "global_step": 37898, "epoch": 318, "lr": 4.5687337147444895e-05} +{"train_loss": 0.0019592116586863995, "global_step": 37899, "epoch": 318, "lr": 4.568512989871557e-05} +{"train_loss": 0.002477676374837756, "global_step": 37900, "epoch": 318, "lr": 4.568292265845802e-05} +{"train_loss": 0.0020802058279514313, "global_step": 37901, "epoch": 318, "lr": 4.5680715426676597e-05} +{"train_loss": 0.0012586263474076986, "global_step": 37902, "epoch": 318, "lr": 4.5678508203375614e-05} +{"train_loss": 0.0011479046661406755, "global_step": 37903, "epoch": 318, "lr": 4.5676300988559435e-05} +{"train_loss": 0.0014927010051906109, "global_step": 37904, "epoch": 318, "lr": 4.567409378223237e-05} +{"train_loss": 0.0027432742062956095, "global_step": 37905, "epoch": 318, "lr": 4.567188658439876e-05} +{"train_loss": 0.0022881783079355955, "global_step": 37906, "epoch": 318, "lr": 4.566967939506294e-05} +{"train_loss": 0.0017537414096295834, "global_step": 37907, "epoch": 318, "lr": 4.566747221422922e-05} +{"train_loss": 0.002907965099439025, "global_step": 37908, "epoch": 318, "lr": 4.566526504190199e-05} +{"train_loss": 0.003335781628265977, "global_step": 37909, "epoch": 318, "lr": 4.5663057878085516e-05} +{"train_loss": 0.002275927923619747, "global_step": 37910, "epoch": 318, "lr": 4.5660850722784197e-05} +{"train_loss": 0.0020861562807112932, "global_step": 37911, "epoch": 318, "lr": 4.565864357600233e-05} +{"train_loss": 0.0017527177697047591, "global_step": 37912, "epoch": 318, "lr": 4.565643643774423e-05} +{"train_loss": 0.0026364491786807775, "global_step": 37913, "epoch": 318, "lr": 4.5654229308014275e-05} +{"train_loss": 0.0018178719328716397, "global_step": 37914, "epoch": 318, "lr": 4.565202218681676e-05} +{"train_loss": 0.0018056943081319332, "global_step": 37915, "epoch": 318, "lr": 4.5649815074156046e-05} +{"train_loss": 0.0015141053590923548, "global_step": 37916, "epoch": 318, "lr": 4.564760797003644e-05} +{"train_loss": 0.0016252048080787063, "global_step": 37917, "epoch": 318, "lr": 4.5645400874462315e-05} +{"train_loss": 0.0030742918606847525, "global_step": 37918, "epoch": 318, "lr": 4.564319378743798e-05} +{"train_loss": 0.0017759513575583696, "global_step": 37919, "epoch": 318, "lr": 4.5640986708967736e-05} +{"train_loss": 0.002717384370043874, "global_step": 37920, "epoch": 318, "lr": 4.563877963905597e-05} +{"train_loss": 0.0015045130858197808, "global_step": 37921, "epoch": 318, "lr": 4.563657257770699e-05} +{"train_loss": 0.002044468652456999, "global_step": 37922, "epoch": 318, "lr": 4.563436552492514e-05} +{"train_loss": 0.0021723357494920492, "global_step": 37923, "epoch": 318, "lr": 4.563215848071475e-05} +{"train_loss": 0.002705435734242201, "global_step": 37924, "epoch": 318, "lr": 4.562995144508013e-05} +{"train_loss": 0.0025949617847800255, "global_step": 37925, "epoch": 318, "lr": 4.562774441802566e-05} +{"train_loss": 0.0019725433085113764, "global_step": 37926, "epoch": 318, "lr": 4.562553739955562e-05} +{"train_loss": 0.002390496898442507, "global_step": 37927, "epoch": 318, "lr": 4.562333038967439e-05} +{"train_loss": 0.0025176811031997204, "global_step": 37928, "epoch": 318, "lr": 4.562112338838627e-05} +{"train_loss": 0.0035066227428615093, "global_step": 37929, "epoch": 318, "lr": 4.5618916395695624e-05} +{"train_loss": 0.0011767856776714325, "global_step": 37930, "epoch": 318, "lr": 4.561670941160676e-05} +{"train_loss": 0.00203425670042634, "global_step": 37931, "epoch": 318, "lr": 4.5614502436124004e-05} +{"train_loss": 0.0029491735622286797, "global_step": 37932, "epoch": 318, "lr": 4.561229546925173e-05} +{"train_loss": 0.005025721620768309, "global_step": 37933, "epoch": 318, "lr": 4.561008851099422e-05} +{"train_loss": 0.0017745988443493843, "global_step": 37934, "epoch": 318, "lr": 4.5607881561355855e-05} +{"train_loss": 0.0016312053194269538, "global_step": 37935, "epoch": 318, "lr": 4.5605674620340915e-05} +{"train_loss": 0.0026282216422259808, "global_step": 37936, "epoch": 318, "lr": 4.560346768795379e-05} +{"train_loss": 0.002157837152481079, "global_step": 37937, "epoch": 318, "lr": 4.560126076419878e-05} +{"train_loss": 0.0023733172565698624, "global_step": 37938, "epoch": 318, "lr": 4.559905384908022e-05} +{"train_loss": 0.001549531240016222, "global_step": 37939, "epoch": 318, "lr": 4.559684694260245e-05} +{"train_loss": 0.003035231027752161, "global_step": 37940, "epoch": 318, "lr": 4.5594640044769806e-05} +{"train_loss": 0.0022392261307686567, "global_step": 37941, "epoch": 318, "lr": 4.559243315558661e-05} +{"train_loss": 0.0020045232959091663, "global_step": 37942, "epoch": 318, "lr": 4.5590226275057206e-05} +{"train_loss": 0.0026095479261130095, "global_step": 37943, "epoch": 318, "lr": 4.5588019403185904e-05} +{"train_loss": 0.0008340322528965771, "global_step": 37944, "epoch": 318, "lr": 4.558581253997708e-05} +{"train_loss": 0.0019448541570454836, "global_step": 37945, "epoch": 318, "lr": 4.5583605685435014e-05} +{"train_loss": 0.001852003624662757, "global_step": 37946, "epoch": 318, "lr": 4.5581398839564094e-05} +{"train_loss": 0.0036449667531996965, "global_step": 37947, "epoch": 318, "lr": 4.55791920023686e-05} +{"train_loss": 0.0023230176884680986, "global_step": 37948, "epoch": 318, "lr": 4.557698517385291e-05} +{"train_loss": 0.0017135334201157093, "global_step": 37949, "epoch": 318, "lr": 4.557477835402134e-05} +{"train_loss": 0.0028185320552438498, "global_step": 37950, "epoch": 318, "lr": 4.55725715428782e-05} +{"train_loss": 0.0016961210640147328, "global_step": 37951, "epoch": 318, "lr": 4.557036474042786e-05} +{"train_loss": 0.0017800733912736177, "global_step": 37952, "epoch": 318, "lr": 4.5568157946674614e-05} +{"train_loss": 0.002083406550809741, "global_step": 37953, "epoch": 318, "lr": 4.556595116162284e-05} +{"train_loss": 0.0017573018558323383, "global_step": 37954, "epoch": 318, "lr": 4.556374438527684e-05} +{"train_loss": 0.000965854327660054, "global_step": 37955, "epoch": 318, "lr": 4.556153761764094e-05} +{"train_loss": 0.0032096640206873417, "global_step": 37956, "epoch": 318, "lr": 4.5559330858719506e-05} +{"train_loss": 0.0016271464992314577, "global_step": 37957, "epoch": 318, "lr": 4.555712410851684e-05} +{"train_loss": 0.004429623018950224, "global_step": 37958, "epoch": 318, "lr": 4.555491736703729e-05} +{"train_loss": 0.0024395931977778673, "global_step": 37959, "epoch": 318, "lr": 4.5552710634285175e-05} +{"train_loss": 0.0022355032260060123, "global_step": 37960, "epoch": 318, "lr": 4.5550503910264857e-05, "val_loss": 0.015609062276780605} +{"train_loss": 0.0009465116891078651, "global_step": 37961, "epoch": 319, "lr": 4.5548297194980646e-05} +{"train_loss": 0.002287243725731969, "global_step": 37962, "epoch": 319, "lr": 4.554609048843687e-05} +{"train_loss": 0.0030006044544279575, "global_step": 37963, "epoch": 319, "lr": 4.5543883790637876e-05} +{"train_loss": 0.0009761858964338899, "global_step": 37964, "epoch": 319, "lr": 4.554167710158798e-05} +{"train_loss": 0.001549420179799199, "global_step": 37965, "epoch": 319, "lr": 4.553947042129153e-05} +{"train_loss": 0.002814890118315816, "global_step": 37966, "epoch": 319, "lr": 4.553726374975285e-05} +{"train_loss": 0.0023406685795634985, "global_step": 37967, "epoch": 319, "lr": 4.5535057086976283e-05} +{"train_loss": 0.0016391415847465396, "global_step": 37968, "epoch": 319, "lr": 4.5532850432966165e-05} +{"train_loss": 0.002079678699374199, "global_step": 37969, "epoch": 319, "lr": 4.553064378772678e-05} +{"train_loss": 0.0010859140893444419, "global_step": 37970, "epoch": 319, "lr": 4.5528437151262524e-05} +{"train_loss": 0.0018423805013298988, "global_step": 37971, "epoch": 319, "lr": 4.552623052357771e-05} +{"train_loss": 0.0023182437289506197, "global_step": 37972, "epoch": 319, "lr": 4.552402390467665e-05} +{"train_loss": 0.00255398266017437, "global_step": 37973, "epoch": 319, "lr": 4.5521817294563705e-05} +{"train_loss": 0.0016264155274257064, "global_step": 37974, "epoch": 319, "lr": 4.5519610693243176e-05} +{"train_loss": 0.0010760793229565024, "global_step": 37975, "epoch": 319, "lr": 4.551740410071943e-05} +{"train_loss": 0.000982203520834446, "global_step": 37976, "epoch": 319, "lr": 4.5515197516996764e-05} +{"train_loss": 0.0013241029810160398, "global_step": 37977, "epoch": 319, "lr": 4.5512990942079546e-05} +{"train_loss": 0.0017561987042427063, "global_step": 37978, "epoch": 319, "lr": 4.551078437597207e-05} +{"train_loss": 0.0014986397000029683, "global_step": 37979, "epoch": 319, "lr": 4.550857781867871e-05} +{"train_loss": 0.0017660228768363595, "global_step": 37980, "epoch": 319, "lr": 4.5506371270203784e-05} +{"train_loss": 0.003994063474237919, "global_step": 37981, "epoch": 319, "lr": 4.55041647305516e-05} +{"train_loss": 0.002616346348077059, "global_step": 37982, "epoch": 319, "lr": 4.550195819972652e-05} +{"train_loss": 0.0008530963095836341, "global_step": 37983, "epoch": 319, "lr": 4.549975167773284e-05} +{"train_loss": 0.0015388663159683347, "global_step": 37984, "epoch": 319, "lr": 4.549754516457494e-05} +{"train_loss": 0.002561531262472272, "global_step": 37985, "epoch": 319, "lr": 4.5495338660257116e-05} +{"train_loss": 0.0007874371949583292, "global_step": 37986, "epoch": 319, "lr": 4.549313216478373e-05} +{"train_loss": 0.001614863402210176, "global_step": 37987, "epoch": 319, "lr": 4.5490925678159084e-05} +{"train_loss": 0.001214808551594615, "global_step": 37988, "epoch": 319, "lr": 4.548871920038753e-05} +{"train_loss": 0.0015452930238097906, "global_step": 37989, "epoch": 319, "lr": 4.548651273147339e-05} +{"train_loss": 0.0031260093674063683, "global_step": 37990, "epoch": 319, "lr": 4.548430627142099e-05} +{"train_loss": 0.0017349949339404702, "global_step": 37991, "epoch": 319, "lr": 4.548209982023469e-05} +{"train_loss": 0.0018340949900448322, "global_step": 37992, "epoch": 319, "lr": 4.547989337791881e-05} +{"train_loss": 0.0023137156385928392, "global_step": 37993, "epoch": 319, "lr": 4.547768694447765e-05} +{"train_loss": 0.0032434300519526005, "global_step": 37994, "epoch": 319, "lr": 4.54754805199156e-05} +{"train_loss": 0.0021898197010159492, "global_step": 37995, "epoch": 319, "lr": 4.547327410423693e-05} +{"train_loss": 0.0022951753344386816, "global_step": 37996, "epoch": 319, "lr": 4.547106769744602e-05} +{"train_loss": 0.0017044995911419392, "global_step": 37997, "epoch": 319, "lr": 4.546886129954717e-05} +{"train_loss": 0.0025953210424631834, "global_step": 37998, "epoch": 319, "lr": 4.5466654910544755e-05} +{"train_loss": 0.00257723405957222, "global_step": 37999, "epoch": 319, "lr": 4.546444853044307e-05} +{"train_loss": 0.001744039705954492, "global_step": 38000, "epoch": 319, "lr": 4.546224215924643e-05} +{"train_loss": 0.0018763976404443383, "global_step": 38001, "epoch": 319, "lr": 4.546003579695922e-05} +{"train_loss": 0.0020736209116876125, "global_step": 38002, "epoch": 319, "lr": 4.545782944358572e-05} +{"train_loss": 0.0019346065819263458, "global_step": 38003, "epoch": 319, "lr": 4.545562309913032e-05} +{"train_loss": 0.002379039768129587, "global_step": 38004, "epoch": 319, "lr": 4.5453416763597286e-05} +{"train_loss": 0.0015850297641009092, "global_step": 38005, "epoch": 319, "lr": 4.5451210436990996e-05} +{"train_loss": 0.0021143637131899595, "global_step": 38006, "epoch": 319, "lr": 4.544900411931578e-05} +{"train_loss": 0.003963612951338291, "global_step": 38007, "epoch": 319, "lr": 4.544679781057593e-05} +{"train_loss": 0.002643168903887272, "global_step": 38008, "epoch": 319, "lr": 4.544459151077583e-05} +{"train_loss": 0.0023137300740927458, "global_step": 38009, "epoch": 319, "lr": 4.5442385219919775e-05} +{"train_loss": 0.001979522407054901, "global_step": 38010, "epoch": 319, "lr": 4.5440178938012125e-05} +{"train_loss": 0.0022389867808669806, "global_step": 38011, "epoch": 319, "lr": 4.54379726650572e-05} +{"train_loss": 0.0014639305882155895, "global_step": 38012, "epoch": 319, "lr": 4.5435766401059296e-05} +{"train_loss": 0.002267408650368452, "global_step": 38013, "epoch": 319, "lr": 4.543356014602281e-05} +{"train_loss": 0.002077357843518257, "global_step": 38014, "epoch": 319, "lr": 4.543135389995202e-05} +{"train_loss": 0.0012500142911449075, "global_step": 38015, "epoch": 319, "lr": 4.542914766285129e-05} +{"train_loss": 0.0015220673521980643, "global_step": 38016, "epoch": 319, "lr": 4.542694143472493e-05} +{"train_loss": 0.001303472905419767, "global_step": 38017, "epoch": 319, "lr": 4.54247352155773e-05} +{"train_loss": 0.002698334399610758, "global_step": 38018, "epoch": 319, "lr": 4.5422529005412697e-05} +{"train_loss": 0.0017049928428605199, "global_step": 38019, "epoch": 319, "lr": 4.542032280423547e-05} +{"train_loss": 0.0014840561198070645, "global_step": 38020, "epoch": 319, "lr": 4.5418116612049957e-05} +{"train_loss": 0.00292394170537591, "global_step": 38021, "epoch": 319, "lr": 4.541591042886047e-05} +{"train_loss": 0.0014196214033290744, "global_step": 38022, "epoch": 319, "lr": 4.541370425467137e-05} +{"train_loss": 0.0009478356223553419, "global_step": 38023, "epoch": 319, "lr": 4.541149808948697e-05} +{"train_loss": 0.0015635791933164, "global_step": 38024, "epoch": 319, "lr": 4.540929193331159e-05} +{"train_loss": 0.002752730157226324, "global_step": 38025, "epoch": 319, "lr": 4.540708578614959e-05} +{"train_loss": 0.001422865898348391, "global_step": 38026, "epoch": 319, "lr": 4.540487964800527e-05} +{"train_loss": 0.0018997216830030084, "global_step": 38027, "epoch": 319, "lr": 4.5402673518882996e-05} +{"train_loss": 0.0032777399756014347, "global_step": 38028, "epoch": 319, "lr": 4.540046739878706e-05} +{"train_loss": 0.0012665630783885717, "global_step": 38029, "epoch": 319, "lr": 4.5398261287721834e-05} +{"train_loss": 0.0008931547636166215, "global_step": 38030, "epoch": 319, "lr": 4.539605518569163e-05} +{"train_loss": 0.001200393307954073, "global_step": 38031, "epoch": 319, "lr": 4.539384909270076e-05} +{"train_loss": 0.0021872238721698523, "global_step": 38032, "epoch": 319, "lr": 4.5391643008753596e-05} +{"train_loss": 0.0016852801200002432, "global_step": 38033, "epoch": 319, "lr": 4.5389436933854436e-05} +{"train_loss": 0.0029110340401530266, "global_step": 38034, "epoch": 319, "lr": 4.538723086800764e-05} +{"train_loss": 0.0011426352430135012, "global_step": 38035, "epoch": 319, "lr": 4.53850248112175e-05} +{"train_loss": 0.0027225306257605553, "global_step": 38036, "epoch": 319, "lr": 4.538281876348839e-05} +{"train_loss": 0.003378175897523761, "global_step": 38037, "epoch": 319, "lr": 4.538061272482461e-05} +{"train_loss": 0.0020802204962819815, "global_step": 38038, "epoch": 319, "lr": 4.537840669523051e-05} +{"train_loss": 0.0016458421014249325, "global_step": 38039, "epoch": 319, "lr": 4.537620067471041e-05} +{"train_loss": 0.0022167921997606754, "global_step": 38040, "epoch": 319, "lr": 4.5373994663268634e-05} +{"train_loss": 0.0025498447939753532, "global_step": 38041, "epoch": 319, "lr": 4.537178866090955e-05} +{"train_loss": 0.0015452656662091613, "global_step": 38042, "epoch": 319, "lr": 4.536958266763747e-05} +{"train_loss": 0.002434544265270233, "global_step": 38043, "epoch": 319, "lr": 4.536737668345669e-05} +{"train_loss": 0.0018080698791891336, "global_step": 38044, "epoch": 319, "lr": 4.53651707083716e-05} +{"train_loss": 0.002955735893920064, "global_step": 38045, "epoch": 319, "lr": 4.536296474238648e-05} +{"train_loss": 0.0022857259027659893, "global_step": 38046, "epoch": 319, "lr": 4.53607587855057e-05} +{"train_loss": 0.0013860604958608747, "global_step": 38047, "epoch": 319, "lr": 4.535855283773355e-05} +{"train_loss": 0.0017038773512467742, "global_step": 38048, "epoch": 319, "lr": 4.535634689907441e-05} +{"train_loss": 0.0012979954481124878, "global_step": 38049, "epoch": 319, "lr": 4.535414096953259e-05} +{"train_loss": 0.0019121574005112052, "global_step": 38050, "epoch": 319, "lr": 4.535193504911239e-05} +{"train_loss": 0.0016829990781843662, "global_step": 38051, "epoch": 319, "lr": 4.53497291378182e-05} +{"train_loss": 0.0023016699124127626, "global_step": 38052, "epoch": 319, "lr": 4.5347523235654285e-05} +{"train_loss": 0.0012124336790293455, "global_step": 38053, "epoch": 319, "lr": 4.534531734262504e-05} +{"train_loss": 0.002389285247772932, "global_step": 38054, "epoch": 319, "lr": 4.5343111458734755e-05} +{"train_loss": 0.0010056080063804984, "global_step": 38055, "epoch": 319, "lr": 4.534090558398777e-05} +{"train_loss": 0.0019592433236539364, "global_step": 38056, "epoch": 319, "lr": 4.533869971838844e-05} +{"train_loss": 0.002098855096846819, "global_step": 38057, "epoch": 319, "lr": 4.533649386194105e-05} +{"train_loss": 0.0017715288558974862, "global_step": 38058, "epoch": 319, "lr": 4.5334288014649975e-05} +{"train_loss": 0.0013878491008654237, "global_step": 38059, "epoch": 319, "lr": 4.53320821765195e-05} +{"train_loss": 0.0010342957684770226, "global_step": 38060, "epoch": 319, "lr": 4.532987634755402e-05} +{"train_loss": 0.0014290624530985951, "global_step": 38061, "epoch": 319, "lr": 4.532767052775782e-05} +{"train_loss": 0.0012858365662395954, "global_step": 38062, "epoch": 319, "lr": 4.532546471713521e-05} +{"train_loss": 0.002358076861128211, "global_step": 38063, "epoch": 319, "lr": 4.5323258915690584e-05} +{"train_loss": 0.0024740532971918583, "global_step": 38064, "epoch": 319, "lr": 4.532105312342821e-05} +{"train_loss": 0.0020822135265916586, "global_step": 38065, "epoch": 319, "lr": 4.5318847340352474e-05} +{"train_loss": 0.0013449431862682104, "global_step": 38066, "epoch": 319, "lr": 4.531664156646767e-05} +{"train_loss": 0.0018620730843394995, "global_step": 38067, "epoch": 319, "lr": 4.531443580177815e-05} +{"train_loss": 0.0016263170400634408, "global_step": 38068, "epoch": 319, "lr": 4.531223004628822e-05} +{"train_loss": 0.0014102400746196508, "global_step": 38069, "epoch": 319, "lr": 4.5310024300002235e-05} +{"train_loss": 0.001029890845529735, "global_step": 38070, "epoch": 319, "lr": 4.5307818562924506e-05} +{"train_loss": 0.0015538649167865515, "global_step": 38071, "epoch": 319, "lr": 4.5305612835059386e-05} +{"train_loss": 0.0014782599173486233, "global_step": 38072, "epoch": 319, "lr": 4.5303407116411183e-05} +{"train_loss": 0.001518536009825766, "global_step": 38073, "epoch": 319, "lr": 4.5301201406984256e-05} +{"train_loss": 0.0012970268726348877, "global_step": 38074, "epoch": 319, "lr": 4.529899570678289e-05} +{"train_loss": 0.0015030610375106335, "global_step": 38075, "epoch": 319, "lr": 4.529679001581147e-05} +{"train_loss": 0.0012053532991558313, "global_step": 38076, "epoch": 319, "lr": 4.529458433407429e-05} +{"train_loss": 0.0011316839372739196, "global_step": 38077, "epoch": 319, "lr": 4.529237866157569e-05} +{"train_loss": 0.0027997023425996304, "global_step": 38078, "epoch": 319, "lr": 4.5290172998319997e-05} +{"train_loss": 0.0018963583406577465, "global_step": 38079, "epoch": 319, "lr": 4.528796734431156e-05, "val_loss": 0.02003331296145916} +{"train_loss": 0.0008874976774677634, "global_step": 38080, "epoch": 320, "lr": 4.52857616995547e-05} +{"train_loss": 0.0009443148737773299, "global_step": 38081, "epoch": 320, "lr": 4.5283556064053717e-05} +{"train_loss": 0.0030477577820420265, "global_step": 38082, "epoch": 320, "lr": 4.5281350437812994e-05} +{"train_loss": 0.0016382720787078142, "global_step": 38083, "epoch": 320, "lr": 4.5279144820836805e-05} +{"train_loss": 0.0013318655546754599, "global_step": 38084, "epoch": 320, "lr": 4.527693921312954e-05} +{"train_loss": 0.0022609818261116743, "global_step": 38085, "epoch": 320, "lr": 4.527473361469548e-05} +{"train_loss": 0.0014906361466273665, "global_step": 38086, "epoch": 320, "lr": 4.527252802553899e-05} +{"train_loss": 0.00115316198207438, "global_step": 38087, "epoch": 320, "lr": 4.527032244566438e-05} +{"train_loss": 0.0026288803201168776, "global_step": 38088, "epoch": 320, "lr": 4.526811687507598e-05} +{"train_loss": 0.0022703553549945354, "global_step": 38089, "epoch": 320, "lr": 4.5265911313778144e-05} +{"train_loss": 0.0019040288170799613, "global_step": 38090, "epoch": 320, "lr": 4.526370576177516e-05} +{"train_loss": 0.001139991800300777, "global_step": 38091, "epoch": 320, "lr": 4.526150021907141e-05} +{"train_loss": 0.0023129270412027836, "global_step": 38092, "epoch": 320, "lr": 4.52592946856712e-05} +{"train_loss": 0.0011076753726229072, "global_step": 38093, "epoch": 320, "lr": 4.5257089161578833e-05} +{"train_loss": 0.0015515655977651477, "global_step": 38094, "epoch": 320, "lr": 4.525488364679869e-05} +{"train_loss": 0.0026205899193882942, "global_step": 38095, "epoch": 320, "lr": 4.5252678141335045e-05} +{"train_loss": 0.0025924176443368196, "global_step": 38096, "epoch": 320, "lr": 4.5250472645192294e-05} +{"train_loss": 0.0020251793321222067, "global_step": 38097, "epoch": 320, "lr": 4.5248267158374705e-05} +{"train_loss": 0.0012129625538364053, "global_step": 38098, "epoch": 320, "lr": 4.5246061680886656e-05} +{"train_loss": 0.0018698174972087145, "global_step": 38099, "epoch": 320, "lr": 4.524385621273246e-05} +{"train_loss": 0.001384587725624442, "global_step": 38100, "epoch": 320, "lr": 4.524165075391642e-05} +{"train_loss": 0.0011828672140836716, "global_step": 38101, "epoch": 320, "lr": 4.52394453044429e-05} +{"train_loss": 0.001497362507507205, "global_step": 38102, "epoch": 320, "lr": 4.523723986431622e-05} +{"train_loss": 0.001210640650242567, "global_step": 38103, "epoch": 320, "lr": 4.523503443354072e-05} +{"train_loss": 0.0010472950525581837, "global_step": 38104, "epoch": 320, "lr": 4.523282901212071e-05} +{"train_loss": 0.0013383910991251469, "global_step": 38105, "epoch": 320, "lr": 4.523062360006053e-05} +{"train_loss": 0.0018703608075156808, "global_step": 38106, "epoch": 320, "lr": 4.522841819736453e-05} +{"train_loss": 0.0029830769635736942, "global_step": 38107, "epoch": 320, "lr": 4.5226212804036996e-05} +{"train_loss": 0.0018108744407072663, "global_step": 38108, "epoch": 320, "lr": 4.522400742008231e-05} +{"train_loss": 0.0021773912012577057, "global_step": 38109, "epoch": 320, "lr": 4.5221802045504745e-05} +{"train_loss": 0.0018474528333172202, "global_step": 38110, "epoch": 320, "lr": 4.521959668030869e-05} +{"train_loss": 0.0014082712586969137, "global_step": 38111, "epoch": 320, "lr": 4.5217391324498445e-05} +{"train_loss": 0.003510952228680253, "global_step": 38112, "epoch": 320, "lr": 4.521518597807831e-05} +{"train_loss": 0.0019134992035105824, "global_step": 38113, "epoch": 320, "lr": 4.5212980641052675e-05} +{"train_loss": 0.0018574479036033154, "global_step": 38114, "epoch": 320, "lr": 4.521077531342582e-05} +{"train_loss": 0.002044587628915906, "global_step": 38115, "epoch": 320, "lr": 4.520856999520212e-05} +{"train_loss": 0.0029415751341730356, "global_step": 38116, "epoch": 320, "lr": 4.5206364686385854e-05} +{"train_loss": 0.001670817960985005, "global_step": 38117, "epoch": 320, "lr": 4.5204159386981406e-05} +{"train_loss": 0.0016803466714918613, "global_step": 38118, "epoch": 320, "lr": 4.5201954096993065e-05} +{"train_loss": 0.0013154526241123676, "global_step": 38119, "epoch": 320, "lr": 4.519974881642517e-05} +{"train_loss": 0.0012799713294953108, "global_step": 38120, "epoch": 320, "lr": 4.519754354528206e-05} +{"train_loss": 0.003322057891637087, "global_step": 38121, "epoch": 320, "lr": 4.519533828356806e-05} +{"train_loss": 0.001726628514006734, "global_step": 38122, "epoch": 320, "lr": 4.51931330312875e-05} +{"train_loss": 0.001623470918275416, "global_step": 38123, "epoch": 320, "lr": 4.51909277884447e-05} +{"train_loss": 0.0015403464203700423, "global_step": 38124, "epoch": 320, "lr": 4.5188722555044024e-05} +{"train_loss": 0.001964289927855134, "global_step": 38125, "epoch": 320, "lr": 4.5186517331089775e-05} +{"train_loss": 0.0022851049434393644, "global_step": 38126, "epoch": 320, "lr": 4.518431211658626e-05} +{"train_loss": 0.00296520977281034, "global_step": 38127, "epoch": 320, "lr": 4.518210691153786e-05} +{"train_loss": 0.0020853367168456316, "global_step": 38128, "epoch": 320, "lr": 4.5179901715948846e-05} +{"train_loss": 0.001909311511553824, "global_step": 38129, "epoch": 320, "lr": 4.517769652982361e-05} +{"train_loss": 0.0024026581086218357, "global_step": 38130, "epoch": 320, "lr": 4.5175491353166454e-05} +{"train_loss": 0.003099947702139616, "global_step": 38131, "epoch": 320, "lr": 4.517328618598168e-05} +{"train_loss": 0.0013036648742854595, "global_step": 38132, "epoch": 320, "lr": 4.517108102827367e-05} +{"train_loss": 0.002375456038862467, "global_step": 38133, "epoch": 320, "lr": 4.51688758800467e-05} +{"train_loss": 0.0019511687569320202, "global_step": 38134, "epoch": 320, "lr": 4.516667074130514e-05} +{"train_loss": 0.0023226768244057894, "global_step": 38135, "epoch": 320, "lr": 4.51644656120533e-05} +{"train_loss": 0.0019416194409132004, "global_step": 38136, "epoch": 320, "lr": 4.516226049229551e-05} +{"train_loss": 0.0015494351973757148, "global_step": 38137, "epoch": 320, "lr": 4.516005538203612e-05} +{"train_loss": 0.0013883569044992328, "global_step": 38138, "epoch": 320, "lr": 4.515785028127943e-05} +{"train_loss": 0.0014248593943193555, "global_step": 38139, "epoch": 320, "lr": 4.5155645190029804e-05} +{"train_loss": 0.002599545521661639, "global_step": 38140, "epoch": 320, "lr": 4.5153440108291526e-05} +{"train_loss": 0.002386484295129776, "global_step": 38141, "epoch": 320, "lr": 4.515123503606897e-05} +{"train_loss": 0.0019151319283992052, "global_step": 38142, "epoch": 320, "lr": 4.514902997336645e-05} +{"train_loss": 0.003096472704783082, "global_step": 38143, "epoch": 320, "lr": 4.514682492018827e-05} +{"train_loss": 0.0024860084522515535, "global_step": 38144, "epoch": 320, "lr": 4.5144619876538805e-05} +{"train_loss": 0.0010950518772006035, "global_step": 38145, "epoch": 320, "lr": 4.514241484242233e-05} +{"train_loss": 0.003424298018217087, "global_step": 38146, "epoch": 320, "lr": 4.514020981784323e-05} +{"train_loss": 0.0009222871158272028, "global_step": 38147, "epoch": 320, "lr": 4.513800480280579e-05} +{"train_loss": 0.002455121837556362, "global_step": 38148, "epoch": 320, "lr": 4.5135799797314376e-05} +{"train_loss": 0.0021911778021603823, "global_step": 38149, "epoch": 320, "lr": 4.5133594801373305e-05} +{"train_loss": 0.0018178236205130816, "global_step": 38150, "epoch": 320, "lr": 4.513138981498687e-05} +{"train_loss": 0.0027677298057824373, "global_step": 38151, "epoch": 320, "lr": 4.512918483815945e-05} +{"train_loss": 0.0021026935428380966, "global_step": 38152, "epoch": 320, "lr": 4.512697987089535e-05} +{"train_loss": 0.0020530615001916885, "global_step": 38153, "epoch": 320, "lr": 4.5124774913198907e-05} +{"train_loss": 0.0017418109346181154, "global_step": 38154, "epoch": 320, "lr": 4.5122569965074445e-05} +{"train_loss": 0.001987540628761053, "global_step": 38155, "epoch": 320, "lr": 4.51203650265263e-05} +{"train_loss": 0.0011732986895367503, "global_step": 38156, "epoch": 320, "lr": 4.5118160097558804e-05} +{"train_loss": 0.002306706737726927, "global_step": 38157, "epoch": 320, "lr": 4.5115955178176264e-05} +{"train_loss": 0.002014159457758069, "global_step": 38158, "epoch": 320, "lr": 4.511375026838304e-05} +{"train_loss": 0.0011187817435711622, "global_step": 38159, "epoch": 320, "lr": 4.511154536818342e-05} +{"train_loss": 0.003065187716856599, "global_step": 38160, "epoch": 320, "lr": 4.510934047758179e-05} +{"train_loss": 0.0018522292375564575, "global_step": 38161, "epoch": 320, "lr": 4.510713559658244e-05} +{"train_loss": 0.0017697702860459685, "global_step": 38162, "epoch": 320, "lr": 4.510493072518969e-05} +{"train_loss": 0.0014785020612180233, "global_step": 38163, "epoch": 320, "lr": 4.51027258634079e-05} +{"train_loss": 0.0012002207804471254, "global_step": 38164, "epoch": 320, "lr": 4.510052101124137e-05} +{"train_loss": 0.003060834249481559, "global_step": 38165, "epoch": 320, "lr": 4.509831616869446e-05} +{"train_loss": 0.001805102452635765, "global_step": 38166, "epoch": 320, "lr": 4.5096111335771463e-05} +{"train_loss": 0.0022257862146943808, "global_step": 38167, "epoch": 320, "lr": 4.509390651247675e-05} +{"train_loss": 0.0011377992341294885, "global_step": 38168, "epoch": 320, "lr": 4.509170169881461e-05} +{"train_loss": 0.001288948580622673, "global_step": 38169, "epoch": 320, "lr": 4.50894968947894e-05} +{"train_loss": 0.002327215624973178, "global_step": 38170, "epoch": 320, "lr": 4.508729210040544e-05} +{"train_loss": 0.0012480750447139144, "global_step": 38171, "epoch": 320, "lr": 4.5085087315667046e-05} +{"train_loss": 0.0019364176550880075, "global_step": 38172, "epoch": 320, "lr": 4.508288254057856e-05} +{"train_loss": 0.0016215593786910176, "global_step": 38173, "epoch": 320, "lr": 4.5080677775144306e-05} +{"train_loss": 0.00171681959182024, "global_step": 38174, "epoch": 320, "lr": 4.5078473019368626e-05} +{"train_loss": 0.0022107118275016546, "global_step": 38175, "epoch": 320, "lr": 4.507626827325585e-05} +{"train_loss": 0.002374026458710432, "global_step": 38176, "epoch": 320, "lr": 4.507406353681026e-05} +{"train_loss": 0.002006742637604475, "global_step": 38177, "epoch": 320, "lr": 4.507185881003625e-05} +{"train_loss": 0.0017083392012864351, "global_step": 38178, "epoch": 320, "lr": 4.50696540929381e-05} +{"train_loss": 0.0011597633128985763, "global_step": 38179, "epoch": 320, "lr": 4.506744938552018e-05} +{"train_loss": 0.0021227800752967596, "global_step": 38180, "epoch": 320, "lr": 4.506524468778679e-05} +{"train_loss": 0.0018344512209296227, "global_step": 38181, "epoch": 320, "lr": 4.5063039999742246e-05} +{"train_loss": 0.00230834586545825, "global_step": 38182, "epoch": 320, "lr": 4.5060835321390914e-05} +{"train_loss": 0.0025216450449079275, "global_step": 38183, "epoch": 320, "lr": 4.5058630652737085e-05} +{"train_loss": 0.0020706390496343374, "global_step": 38184, "epoch": 320, "lr": 4.505642599378513e-05} +{"train_loss": 0.0026083977427333593, "global_step": 38185, "epoch": 320, "lr": 4.5054221344539336e-05} +{"train_loss": 0.0023256940767169, "global_step": 38186, "epoch": 320, "lr": 4.5052016705004054e-05} +{"train_loss": 0.0025493085850030184, "global_step": 38187, "epoch": 320, "lr": 4.5049812075183616e-05} +{"train_loss": 0.0023174185771495104, "global_step": 38188, "epoch": 320, "lr": 4.5047607455082333e-05} +{"train_loss": 0.0011528637260198593, "global_step": 38189, "epoch": 320, "lr": 4.5045402844704555e-05} +{"train_loss": 0.001830192981287837, "global_step": 38190, "epoch": 320, "lr": 4.5043198244054584e-05} +{"train_loss": 0.0029934742487967014, "global_step": 38191, "epoch": 320, "lr": 4.5040993653136784e-05} +{"train_loss": 0.0012504911283031106, "global_step": 38192, "epoch": 320, "lr": 4.503878907195544e-05} +{"train_loss": 0.002430059015750885, "global_step": 38193, "epoch": 320, "lr": 4.5036584500514924e-05} +{"train_loss": 0.0018364312127232552, "global_step": 38194, "epoch": 320, "lr": 4.503437993881955e-05} +{"train_loss": 0.0017726393416523933, "global_step": 38195, "epoch": 320, "lr": 4.503217538687361e-05} +{"train_loss": 0.002542740199714899, "global_step": 38196, "epoch": 320, "lr": 4.502997084468149e-05} +{"train_loss": 0.0018358433153480291, "global_step": 38197, "epoch": 320, "lr": 4.502776631224747e-05} +{"train_loss": 0.001953149782767629, "global_step": 38198, "epoch": 320, "lr": 4.502556178957592e-05, "val_loss": 0.022757019847631454, "train_action_mse_error": 4.034278754261322e-05} +{"train_loss": 0.0015849522314965725, "global_step": 38199, "epoch": 321, "lr": 4.502335727667114e-05} +{"train_loss": 0.0019629818852990866, "global_step": 38200, "epoch": 321, "lr": 4.502115277353746e-05} +{"train_loss": 0.0015821210108697414, "global_step": 38201, "epoch": 321, "lr": 4.5018948280179215e-05} +{"train_loss": 0.001845765975303948, "global_step": 38202, "epoch": 321, "lr": 4.5016743796600744e-05} +{"train_loss": 0.00083064945647493, "global_step": 38203, "epoch": 321, "lr": 4.501453932280635e-05} +{"train_loss": 0.0027494619134813547, "global_step": 38204, "epoch": 321, "lr": 4.5012334858800385e-05} +{"train_loss": 0.0031786179170012474, "global_step": 38205, "epoch": 321, "lr": 4.5010130404587164e-05} +{"train_loss": 0.0022983700037002563, "global_step": 38206, "epoch": 321, "lr": 4.500792596017103e-05} +{"train_loss": 0.0020474211778491735, "global_step": 38207, "epoch": 321, "lr": 4.5005721525556275e-05} +{"train_loss": 0.0015805155271664262, "global_step": 38208, "epoch": 321, "lr": 4.500351710074728e-05} +{"train_loss": 0.001626603421755135, "global_step": 38209, "epoch": 321, "lr": 4.500131268574832e-05} +{"train_loss": 0.0015534876147285104, "global_step": 38210, "epoch": 321, "lr": 4.4999108280563776e-05} +{"train_loss": 0.0015514722326770425, "global_step": 38211, "epoch": 321, "lr": 4.4996903885197946e-05} +{"train_loss": 0.0014807881088927388, "global_step": 38212, "epoch": 321, "lr": 4.4994699499655136e-05} +{"train_loss": 0.002078601624816656, "global_step": 38213, "epoch": 321, "lr": 4.4992495123939724e-05} +{"train_loss": 0.002591395052149892, "global_step": 38214, "epoch": 321, "lr": 4.4990290758055986e-05} +{"train_loss": 0.001969420351088047, "global_step": 38215, "epoch": 321, "lr": 4.49880864020083e-05} +{"train_loss": 0.0023844835814088583, "global_step": 38216, "epoch": 321, "lr": 4.498588205580095e-05} +{"train_loss": 0.0012279143556952477, "global_step": 38217, "epoch": 321, "lr": 4.498367771943831e-05} +{"train_loss": 0.001135038211941719, "global_step": 38218, "epoch": 321, "lr": 4.498147339292467e-05} +{"train_loss": 0.0016617763321846724, "global_step": 38219, "epoch": 321, "lr": 4.4979269076264366e-05} +{"train_loss": 0.0011239382438361645, "global_step": 38220, "epoch": 321, "lr": 4.497706476946173e-05} +{"train_loss": 0.0022900253534317017, "global_step": 38221, "epoch": 321, "lr": 4.497486047252109e-05} +{"train_loss": 0.0024791446048766375, "global_step": 38222, "epoch": 321, "lr": 4.497265618544679e-05} +{"train_loss": 0.0021964507177472115, "global_step": 38223, "epoch": 321, "lr": 4.4970451908243124e-05} +{"train_loss": 0.0022329888306558132, "global_step": 38224, "epoch": 321, "lr": 4.4968247640914455e-05} +{"train_loss": 0.0018391722114756703, "global_step": 38225, "epoch": 321, "lr": 4.49660433834651e-05} +{"train_loss": 0.0021054609678685665, "global_step": 38226, "epoch": 321, "lr": 4.496383913589935e-05} +{"train_loss": 0.0013800051528960466, "global_step": 38227, "epoch": 321, "lr": 4.4961634898221594e-05} +{"train_loss": 0.0018426316091790795, "global_step": 38228, "epoch": 321, "lr": 4.495943067043611e-05} +{"train_loss": 0.001115769031457603, "global_step": 38229, "epoch": 321, "lr": 4.4957226452547256e-05} +{"train_loss": 0.001195533201098442, "global_step": 38230, "epoch": 321, "lr": 4.4955022244559357e-05} +{"train_loss": 0.0017685065977275372, "global_step": 38231, "epoch": 321, "lr": 4.4952818046476715e-05} +{"train_loss": 0.0017645112238824368, "global_step": 38232, "epoch": 321, "lr": 4.4950613858303695e-05} +{"train_loss": 0.0024274762254208326, "global_step": 38233, "epoch": 321, "lr": 4.494840968004457e-05} +{"train_loss": 0.0016234214417636395, "global_step": 38234, "epoch": 321, "lr": 4.494620551170373e-05} +{"train_loss": 0.0024084628093987703, "global_step": 38235, "epoch": 321, "lr": 4.494400135328547e-05} +{"train_loss": 0.0023103528656065464, "global_step": 38236, "epoch": 321, "lr": 4.4941797204794124e-05} +{"train_loss": 0.001210561254993081, "global_step": 38237, "epoch": 321, "lr": 4.493959306623403e-05} +{"train_loss": 0.002562479814514518, "global_step": 38238, "epoch": 321, "lr": 4.493738893760948e-05} +{"train_loss": 0.002261459594592452, "global_step": 38239, "epoch": 321, "lr": 4.493518481892485e-05} +{"train_loss": 0.001792333205230534, "global_step": 38240, "epoch": 321, "lr": 4.493298071018442e-05} +{"train_loss": 0.001595254521816969, "global_step": 38241, "epoch": 321, "lr": 4.4930776611392563e-05} +{"train_loss": 0.0024712192825973034, "global_step": 38242, "epoch": 321, "lr": 4.4928572522553564e-05} +{"train_loss": 0.0024432651698589325, "global_step": 38243, "epoch": 321, "lr": 4.4926368443671795e-05} +{"train_loss": 0.0018082811729982495, "global_step": 38244, "epoch": 321, "lr": 4.4924164374751554e-05} +{"train_loss": 0.001989792799577117, "global_step": 38245, "epoch": 321, "lr": 4.492196031579716e-05} +{"train_loss": 0.0010090690338984132, "global_step": 38246, "epoch": 321, "lr": 4.491975626681297e-05} +{"train_loss": 0.0012851294595748186, "global_step": 38247, "epoch": 321, "lr": 4.491755222780327e-05} +{"train_loss": 0.0027031381614506245, "global_step": 38248, "epoch": 321, "lr": 4.491534819877245e-05} +{"train_loss": 0.0013343167956918478, "global_step": 38249, "epoch": 321, "lr": 4.4913144179724775e-05} +{"train_loss": 0.001885251491330564, "global_step": 38250, "epoch": 321, "lr": 4.49109401706646e-05} +{"train_loss": 0.0022568311542272568, "global_step": 38251, "epoch": 321, "lr": 4.4908736171596255e-05} +{"train_loss": 0.002567920833826065, "global_step": 38252, "epoch": 321, "lr": 4.490653218252406e-05} +{"train_loss": 0.001288760220631957, "global_step": 38253, "epoch": 321, "lr": 4.490432820345235e-05} +{"train_loss": 0.0026914000045508146, "global_step": 38254, "epoch": 321, "lr": 4.490212423438544e-05} +{"train_loss": 0.0013078812044113874, "global_step": 38255, "epoch": 321, "lr": 4.489992027532767e-05} +{"train_loss": 0.0015930228400975466, "global_step": 38256, "epoch": 321, "lr": 4.4897716326283365e-05} +{"train_loss": 0.001535880845040083, "global_step": 38257, "epoch": 321, "lr": 4.489551238725684e-05} +{"train_loss": 0.0016403994522988796, "global_step": 38258, "epoch": 321, "lr": 4.489330845825244e-05} +{"train_loss": 0.002252155216410756, "global_step": 38259, "epoch": 321, "lr": 4.489110453927447e-05} +{"train_loss": 0.0021295289043337107, "global_step": 38260, "epoch": 321, "lr": 4.488890063032728e-05} +{"train_loss": 0.00234810053370893, "global_step": 38261, "epoch": 321, "lr": 4.48866967314152e-05} +{"train_loss": 0.00310497242026031, "global_step": 38262, "epoch": 321, "lr": 4.4884492842542526e-05} +{"train_loss": 0.0025199917145073414, "global_step": 38263, "epoch": 321, "lr": 4.4882288963713616e-05} +{"train_loss": 0.001145192887634039, "global_step": 38264, "epoch": 321, "lr": 4.4880085094932766e-05} +{"train_loss": 0.002319765044376254, "global_step": 38265, "epoch": 321, "lr": 4.487788123620435e-05} +{"train_loss": 0.0028094255831092596, "global_step": 38266, "epoch": 321, "lr": 4.4875677387532635e-05} +{"train_loss": 0.001579488511197269, "global_step": 38267, "epoch": 321, "lr": 4.4873473548922e-05} +{"train_loss": 0.0020573751535266638, "global_step": 38268, "epoch": 321, "lr": 4.4871269720376755e-05} +{"train_loss": 0.0017041594255715609, "global_step": 38269, "epoch": 321, "lr": 4.48690659019012e-05} +{"train_loss": 0.00303526665084064, "global_step": 38270, "epoch": 321, "lr": 4.486686209349971e-05} +{"train_loss": 0.001663587405346334, "global_step": 38271, "epoch": 321, "lr": 4.486465829517657e-05} +{"train_loss": 0.0017212084494531155, "global_step": 38272, "epoch": 321, "lr": 4.486245450693615e-05} +{"train_loss": 0.001763578038662672, "global_step": 38273, "epoch": 321, "lr": 4.486025072878272e-05} +{"train_loss": 0.0030993910040706396, "global_step": 38274, "epoch": 321, "lr": 4.485804696072067e-05} +{"train_loss": 0.0018919871654361486, "global_step": 38275, "epoch": 321, "lr": 4.4855843202754286e-05} +{"train_loss": 0.002782955067232251, "global_step": 38276, "epoch": 321, "lr": 4.485363945488789e-05} +{"train_loss": 0.0009855286916717887, "global_step": 38277, "epoch": 321, "lr": 4.485143571712584e-05} +{"train_loss": 0.0014448821311816573, "global_step": 38278, "epoch": 321, "lr": 4.484923198947243e-05} +{"train_loss": 0.0019507389515638351, "global_step": 38279, "epoch": 321, "lr": 4.4847028271932016e-05} +{"train_loss": 0.002123425714671612, "global_step": 38280, "epoch": 321, "lr": 4.4844824564508916e-05} +{"train_loss": 0.0013924813829362392, "global_step": 38281, "epoch": 321, "lr": 4.4842620867207434e-05} +{"train_loss": 0.00300037139095366, "global_step": 38282, "epoch": 321, "lr": 4.484041718003193e-05} +{"train_loss": 0.0023026156704872847, "global_step": 38283, "epoch": 321, "lr": 4.483821350298671e-05} +{"train_loss": 0.003565422259271145, "global_step": 38284, "epoch": 321, "lr": 4.4836009836076095e-05} +{"train_loss": 0.002236573491245508, "global_step": 38285, "epoch": 321, "lr": 4.4833806179304434e-05} +{"train_loss": 0.0019203746924176812, "global_step": 38286, "epoch": 321, "lr": 4.483160253267604e-05} +{"train_loss": 0.0018903486197814345, "global_step": 38287, "epoch": 321, "lr": 4.482939889619526e-05} +{"train_loss": 0.001777574187144637, "global_step": 38288, "epoch": 321, "lr": 4.4827195269866374e-05} +{"train_loss": 0.0012912830570712686, "global_step": 38289, "epoch": 321, "lr": 4.482499165369376e-05} +{"train_loss": 0.0015475848922505975, "global_step": 38290, "epoch": 321, "lr": 4.48227880476817e-05} +{"train_loss": 0.0023102827835828066, "global_step": 38291, "epoch": 321, "lr": 4.4820584451834566e-05} +{"train_loss": 0.0022583967074751854, "global_step": 38292, "epoch": 321, "lr": 4.481838086615664e-05} +{"train_loss": 0.003010146552696824, "global_step": 38293, "epoch": 321, "lr": 4.481617729065229e-05} +{"train_loss": 0.0029809349216520786, "global_step": 38294, "epoch": 321, "lr": 4.481397372532582e-05} +{"train_loss": 0.0021738088689744473, "global_step": 38295, "epoch": 321, "lr": 4.481177017018154e-05} +{"train_loss": 0.0017861822852864861, "global_step": 38296, "epoch": 321, "lr": 4.4809566625223817e-05} +{"train_loss": 0.0022410538513213396, "global_step": 38297, "epoch": 321, "lr": 4.480736309045693e-05} +{"train_loss": 0.0026014463510364294, "global_step": 38298, "epoch": 321, "lr": 4.480515956588526e-05} +{"train_loss": 0.0018417653627693653, "global_step": 38299, "epoch": 321, "lr": 4.4802956051513085e-05} +{"train_loss": 0.0010721480939537287, "global_step": 38300, "epoch": 321, "lr": 4.480075254734476e-05} +{"train_loss": 0.0022264569997787476, "global_step": 38301, "epoch": 321, "lr": 4.479854905338459e-05} +{"train_loss": 0.001227246131747961, "global_step": 38302, "epoch": 321, "lr": 4.479634556963692e-05} +{"train_loss": 0.0021428288891911507, "global_step": 38303, "epoch": 321, "lr": 4.4794142096106066e-05} +{"train_loss": 0.001176193356513977, "global_step": 38304, "epoch": 321, "lr": 4.479193863279635e-05} +{"train_loss": 0.0011072896886616945, "global_step": 38305, "epoch": 321, "lr": 4.4789735179712126e-05} +{"train_loss": 0.0019225483993068337, "global_step": 38306, "epoch": 321, "lr": 4.47875317368577e-05} +{"train_loss": 0.002364944200962782, "global_step": 38307, "epoch": 321, "lr": 4.4785328304237385e-05} +{"train_loss": 0.0023714059498161077, "global_step": 38308, "epoch": 321, "lr": 4.478312488185553e-05} +{"train_loss": 0.0020215788390487432, "global_step": 38309, "epoch": 321, "lr": 4.478092146971644e-05} +{"train_loss": 0.0008957918034866452, "global_step": 38310, "epoch": 321, "lr": 4.477871806782447e-05} +{"train_loss": 0.001876162365078926, "global_step": 38311, "epoch": 321, "lr": 4.4776514676183914e-05} +{"train_loss": 0.0023033502511680126, "global_step": 38312, "epoch": 321, "lr": 4.4774311294799124e-05} +{"train_loss": 0.0028144316747784615, "global_step": 38313, "epoch": 321, "lr": 4.477210792367442e-05} +{"train_loss": 0.0018081573070958257, "global_step": 38314, "epoch": 321, "lr": 4.476990456281411e-05} +{"train_loss": 0.002128945430740714, "global_step": 38315, "epoch": 321, "lr": 4.4767701212222544e-05} +{"train_loss": 0.002061461564153433, "global_step": 38316, "epoch": 321, "lr": 4.476549787190402e-05} +{"train_loss": 0.0019709693983064164, "global_step": 38317, "epoch": 321, "lr": 4.47632945418629e-05, "val_loss": 0.007996715605258942} +{"train_loss": 0.0013400926254689693, "global_step": 38318, "epoch": 322, "lr": 4.4761091222103494e-05} +{"train_loss": 0.0019027981907129288, "global_step": 38319, "epoch": 322, "lr": 4.47588879126301e-05} +{"train_loss": 0.002362635685130954, "global_step": 38320, "epoch": 322, "lr": 4.47566846134471e-05} +{"train_loss": 0.0018537917640060186, "global_step": 38321, "epoch": 322, "lr": 4.475448132455876e-05} +{"train_loss": 0.0020447680726647377, "global_step": 38322, "epoch": 322, "lr": 4.475227804596946e-05} +{"train_loss": 0.0014201918384060264, "global_step": 38323, "epoch": 322, "lr": 4.4750074777683486e-05} +{"train_loss": 0.002564893802627921, "global_step": 38324, "epoch": 322, "lr": 4.4747871519705196e-05} +{"train_loss": 0.0017128039617091417, "global_step": 38325, "epoch": 322, "lr": 4.47456682720389e-05} +{"train_loss": 0.002050672424957156, "global_step": 38326, "epoch": 322, "lr": 4.47434650346889e-05} +{"train_loss": 0.0023165959864854813, "global_step": 38327, "epoch": 322, "lr": 4.4741261807659574e-05} +{"train_loss": 0.0015707450220361352, "global_step": 38328, "epoch": 322, "lr": 4.473905859095519e-05} +{"train_loss": 0.002616231795400381, "global_step": 38329, "epoch": 322, "lr": 4.473685538458012e-05} +{"train_loss": 0.00340201030485332, "global_step": 38330, "epoch": 322, "lr": 4.473465218853868e-05} +{"train_loss": 0.002703026868402958, "global_step": 38331, "epoch": 322, "lr": 4.473244900283516e-05} +{"train_loss": 0.0012098482111468911, "global_step": 38332, "epoch": 322, "lr": 4.473024582747393e-05} +{"train_loss": 0.0014766642125323415, "global_step": 38333, "epoch": 322, "lr": 4.4728042662459295e-05} +{"train_loss": 0.0037174210883677006, "global_step": 38334, "epoch": 322, "lr": 4.4725839507795586e-05} +{"train_loss": 0.0014941660920158029, "global_step": 38335, "epoch": 322, "lr": 4.472363636348713e-05} +{"train_loss": 0.001887712744064629, "global_step": 38336, "epoch": 322, "lr": 4.472143322953825e-05} +{"train_loss": 0.0016020459588617086, "global_step": 38337, "epoch": 322, "lr": 4.4719230105953284e-05} +{"train_loss": 0.002508170437067747, "global_step": 38338, "epoch": 322, "lr": 4.471702699273652e-05} +{"train_loss": 0.0029576809611171484, "global_step": 38339, "epoch": 322, "lr": 4.471482388989233e-05} +{"train_loss": 0.0011096502421423793, "global_step": 38340, "epoch": 322, "lr": 4.4712620797425e-05} +{"train_loss": 0.0023347255773842335, "global_step": 38341, "epoch": 322, "lr": 4.47104177153389e-05} +{"train_loss": 0.003037748159840703, "global_step": 38342, "epoch": 322, "lr": 4.4708214643638305e-05} +{"train_loss": 0.0028512782882899046, "global_step": 38343, "epoch": 322, "lr": 4.470601158232758e-05} +{"train_loss": 0.0014090699842199683, "global_step": 38344, "epoch": 322, "lr": 4.470380853141104e-05} +{"train_loss": 0.0028893244452774525, "global_step": 38345, "epoch": 322, "lr": 4.4701605490892984e-05} +{"train_loss": 0.002406838582828641, "global_step": 38346, "epoch": 322, "lr": 4.4699402460777785e-05} +{"train_loss": 0.0013237952953204513, "global_step": 38347, "epoch": 322, "lr": 4.469719944106972e-05} +{"train_loss": 0.00208785617724061, "global_step": 38348, "epoch": 322, "lr": 4.4694996431773155e-05} +{"train_loss": 0.0021182752680033445, "global_step": 38349, "epoch": 322, "lr": 4.469279343289239e-05} +{"train_loss": 0.0014825707767158747, "global_step": 38350, "epoch": 322, "lr": 4.469059044443176e-05} +{"train_loss": 0.0014013723703101277, "global_step": 38351, "epoch": 322, "lr": 4.468838746639559e-05} +{"train_loss": 0.0015380459371954203, "global_step": 38352, "epoch": 322, "lr": 4.4686184498788194e-05} +{"train_loss": 0.0008802796946838498, "global_step": 38353, "epoch": 322, "lr": 4.468398154161391e-05} +{"train_loss": 0.002213321626186371, "global_step": 38354, "epoch": 322, "lr": 4.4681778594877056e-05} +{"train_loss": 0.0030184753704816103, "global_step": 38355, "epoch": 322, "lr": 4.467957565858198e-05} +{"train_loss": 0.001293593319132924, "global_step": 38356, "epoch": 322, "lr": 4.467737273273299e-05} +{"train_loss": 0.0014606890035793185, "global_step": 38357, "epoch": 322, "lr": 4.4675169817334384e-05} +{"train_loss": 0.0016438388265669346, "global_step": 38358, "epoch": 322, "lr": 4.467296691239054e-05} +{"train_loss": 0.0023546458687633276, "global_step": 38359, "epoch": 322, "lr": 4.467076401790573e-05} +{"train_loss": 0.002281242748722434, "global_step": 38360, "epoch": 322, "lr": 4.466856113388433e-05} +{"train_loss": 0.001070220721885562, "global_step": 38361, "epoch": 322, "lr": 4.466635826033062e-05} +{"train_loss": 0.001974757295101881, "global_step": 38362, "epoch": 322, "lr": 4.466415539724896e-05} +{"train_loss": 0.002480510389432311, "global_step": 38363, "epoch": 322, "lr": 4.466195254464367e-05} +{"train_loss": 0.0016917490866035223, "global_step": 38364, "epoch": 322, "lr": 4.4659749702519046e-05} +{"train_loss": 0.0010128077119588852, "global_step": 38365, "epoch": 322, "lr": 4.465754687087945e-05} +{"train_loss": 0.0020724174100905657, "global_step": 38366, "epoch": 322, "lr": 4.465534404972916e-05} +{"train_loss": 0.002298984443768859, "global_step": 38367, "epoch": 322, "lr": 4.4653141239072556e-05} +{"train_loss": 0.002187049714848399, "global_step": 38368, "epoch": 322, "lr": 4.465093843891394e-05} +{"train_loss": 0.0018069986253976822, "global_step": 38369, "epoch": 322, "lr": 4.464873564925762e-05} +{"train_loss": 0.0022555929608643055, "global_step": 38370, "epoch": 322, "lr": 4.464653287010795e-05} +{"train_loss": 0.0027295653708279133, "global_step": 38371, "epoch": 322, "lr": 4.4644330101469225e-05} +{"train_loss": 0.0013908924302086234, "global_step": 38372, "epoch": 322, "lr": 4.46421273433458e-05} +{"train_loss": 0.0019446026999503374, "global_step": 38373, "epoch": 322, "lr": 4.4639924595741973e-05} +{"train_loss": 0.0038662878796458244, "global_step": 38374, "epoch": 322, "lr": 4.46377218586621e-05} +{"train_loss": 0.004925421439111233, "global_step": 38375, "epoch": 322, "lr": 4.4635519132110484e-05} +{"train_loss": 0.0029893137980252504, "global_step": 38376, "epoch": 322, "lr": 4.463331641609143e-05} +{"train_loss": 0.001074681873433292, "global_step": 38377, "epoch": 322, "lr": 4.4631113710609315e-05} +{"train_loss": 0.002296058926731348, "global_step": 38378, "epoch": 322, "lr": 4.462891101566841e-05} +{"train_loss": 0.0018269295105710626, "global_step": 38379, "epoch": 322, "lr": 4.462670833127308e-05} +{"train_loss": 0.0025183947291225195, "global_step": 38380, "epoch": 322, "lr": 4.462450565742762e-05} +{"train_loss": 0.0017520006513223052, "global_step": 38381, "epoch": 322, "lr": 4.462230299413639e-05} +{"train_loss": 0.002226183656603098, "global_step": 38382, "epoch": 322, "lr": 4.462010034140368e-05} +{"train_loss": 0.0014011949533596635, "global_step": 38383, "epoch": 322, "lr": 4.4617897699233826e-05} +{"train_loss": 0.0028164403047412634, "global_step": 38384, "epoch": 322, "lr": 4.4615695067631156e-05} +{"train_loss": 0.002202806994318962, "global_step": 38385, "epoch": 322, "lr": 4.46134924466e-05} +{"train_loss": 0.002337152138352394, "global_step": 38386, "epoch": 322, "lr": 4.461128983614467e-05} +{"train_loss": 0.0020762276835739613, "global_step": 38387, "epoch": 322, "lr": 4.460908723626951e-05} +{"train_loss": 0.002954225055873394, "global_step": 38388, "epoch": 322, "lr": 4.4606884646978806e-05} +{"train_loss": 0.0009423604351468384, "global_step": 38389, "epoch": 322, "lr": 4.4604682068276935e-05} +{"train_loss": 0.002360378624871373, "global_step": 38390, "epoch": 322, "lr": 4.460247950016817e-05} +{"train_loss": 0.0027230794075876474, "global_step": 38391, "epoch": 322, "lr": 4.4600276942656883e-05} +{"train_loss": 0.0010843907948583364, "global_step": 38392, "epoch": 322, "lr": 4.4598074395747343e-05} +{"train_loss": 0.002101134043186903, "global_step": 38393, "epoch": 322, "lr": 4.4595871859443943e-05} +{"train_loss": 0.0014739584876224399, "global_step": 38394, "epoch": 322, "lr": 4.4593669333750966e-05} +{"train_loss": 0.0020018843933939934, "global_step": 38395, "epoch": 322, "lr": 4.459146681867272e-05} +{"train_loss": 0.002516162348911166, "global_step": 38396, "epoch": 322, "lr": 4.458926431421357e-05} +{"train_loss": 0.0032863097731024027, "global_step": 38397, "epoch": 322, "lr": 4.458706182037781e-05} +{"train_loss": 0.0039007235318422318, "global_step": 38398, "epoch": 322, "lr": 4.458485933716978e-05} +{"train_loss": 0.003338837530463934, "global_step": 38399, "epoch": 322, "lr": 4.45826568645938e-05} +{"train_loss": 0.0017374325543642044, "global_step": 38400, "epoch": 322, "lr": 4.45804544026542e-05} +{"train_loss": 0.002327369060367346, "global_step": 38401, "epoch": 322, "lr": 4.4578251951355286e-05} +{"train_loss": 0.002151996362954378, "global_step": 38402, "epoch": 322, "lr": 4.4576049510701394e-05} +{"train_loss": 0.0016012085834518075, "global_step": 38403, "epoch": 322, "lr": 4.457384708069687e-05} +{"train_loss": 0.0020295267459005117, "global_step": 38404, "epoch": 322, "lr": 4.457164466134599e-05} +{"train_loss": 0.0016046719392761588, "global_step": 38405, "epoch": 322, "lr": 4.456944225265313e-05} +{"train_loss": 0.0019410991808399558, "global_step": 38406, "epoch": 322, "lr": 4.4567239854622595e-05} +{"train_loss": 0.0017841114895418286, "global_step": 38407, "epoch": 322, "lr": 4.456503746725868e-05} +{"train_loss": 0.0014779415214434266, "global_step": 38408, "epoch": 322, "lr": 4.456283509056575e-05} +{"train_loss": 0.0027578414883464575, "global_step": 38409, "epoch": 322, "lr": 4.456063272454809e-05} +{"train_loss": 0.003061912255361676, "global_step": 38410, "epoch": 322, "lr": 4.455843036921007e-05} +{"train_loss": 0.0019680478144437075, "global_step": 38411, "epoch": 322, "lr": 4.455622802455598e-05} +{"train_loss": 0.0016545766266062856, "global_step": 38412, "epoch": 322, "lr": 4.455402569059016e-05} +{"train_loss": 0.002185395685955882, "global_step": 38413, "epoch": 322, "lr": 4.455182336731694e-05} +{"train_loss": 0.0011993714142590761, "global_step": 38414, "epoch": 322, "lr": 4.454962105474061e-05} +{"train_loss": 0.0012930745724588633, "global_step": 38415, "epoch": 322, "lr": 4.454741875286552e-05} +{"train_loss": 0.0024312851019203663, "global_step": 38416, "epoch": 322, "lr": 4.4545216461696e-05} +{"train_loss": 0.0012338454835116863, "global_step": 38417, "epoch": 322, "lr": 4.454301418123636e-05} +{"train_loss": 0.002489375416189432, "global_step": 38418, "epoch": 322, "lr": 4.454081191149094e-05} +{"train_loss": 0.0014280781615525484, "global_step": 38419, "epoch": 322, "lr": 4.453860965246403e-05} +{"train_loss": 0.0008729745750315487, "global_step": 38420, "epoch": 322, "lr": 4.453640740416e-05} +{"train_loss": 0.0016250823391601443, "global_step": 38421, "epoch": 322, "lr": 4.453420516658313e-05} +{"train_loss": 0.004597875755280256, "global_step": 38422, "epoch": 322, "lr": 4.453200293973778e-05} +{"train_loss": 0.001721177832223475, "global_step": 38423, "epoch": 322, "lr": 4.452980072362824e-05} +{"train_loss": 0.0024126560892909765, "global_step": 38424, "epoch": 322, "lr": 4.4527598518258876e-05} +{"train_loss": 0.0021213360596448183, "global_step": 38425, "epoch": 322, "lr": 4.4525396323633984e-05} +{"train_loss": 0.0026474683545529842, "global_step": 38426, "epoch": 322, "lr": 4.452319413975787e-05} +{"train_loss": 0.0019129394786432385, "global_step": 38427, "epoch": 322, "lr": 4.45209919666349e-05} +{"train_loss": 0.0017780149355530739, "global_step": 38428, "epoch": 322, "lr": 4.451878980426936e-05} +{"train_loss": 0.0011920490069314837, "global_step": 38429, "epoch": 322, "lr": 4.451658765266561e-05} +{"train_loss": 0.002255168976262212, "global_step": 38430, "epoch": 322, "lr": 4.451438551182793e-05} +{"train_loss": 0.001371800433844328, "global_step": 38431, "epoch": 322, "lr": 4.4512183381760694e-05} +{"train_loss": 0.0025069124531000853, "global_step": 38432, "epoch": 322, "lr": 4.450998126246819e-05} +{"train_loss": 0.003324656281620264, "global_step": 38433, "epoch": 322, "lr": 4.450777915395474e-05} +{"train_loss": 0.0013779879081994295, "global_step": 38434, "epoch": 322, "lr": 4.450557705622469e-05} +{"train_loss": 0.0011706538498401642, "global_step": 38435, "epoch": 322, "lr": 4.450337496928235e-05} +{"train_loss": 0.002092620820597503, "global_step": 38436, "epoch": 322, "lr": 4.450117289313204e-05, "val_loss": 0.017902253195643425} +{"train_loss": 0.0012505933409556746, "global_step": 38437, "epoch": 323, "lr": 4.4498970827778106e-05} +{"train_loss": 0.0025546064134687185, "global_step": 38438, "epoch": 323, "lr": 4.449676877322484e-05} +{"train_loss": 0.0013478838372975588, "global_step": 38439, "epoch": 323, "lr": 4.449456672947659e-05} +{"train_loss": 0.0028851055540144444, "global_step": 38440, "epoch": 323, "lr": 4.449236469653766e-05} +{"train_loss": 0.0022005471400916576, "global_step": 38441, "epoch": 323, "lr": 4.4490162674412395e-05} +{"train_loss": 0.002103846287354827, "global_step": 38442, "epoch": 323, "lr": 4.448796066310509e-05} +{"train_loss": 0.0017143847653642297, "global_step": 38443, "epoch": 323, "lr": 4.4485758662620104e-05} +{"train_loss": 0.0014901303220540285, "global_step": 38444, "epoch": 323, "lr": 4.448355667296175e-05} +{"train_loss": 0.001417455030605197, "global_step": 38445, "epoch": 323, "lr": 4.448135469413431e-05} +{"train_loss": 0.0014765638625249267, "global_step": 38446, "epoch": 323, "lr": 4.447915272614217e-05} +{"train_loss": 0.00198434223420918, "global_step": 38447, "epoch": 323, "lr": 4.44769507689896e-05} +{"train_loss": 0.0034132234286516905, "global_step": 38448, "epoch": 323, "lr": 4.447474882268097e-05} +{"train_loss": 0.0015177343739196658, "global_step": 38449, "epoch": 323, "lr": 4.4472546887220565e-05} +{"train_loss": 0.0013641933910548687, "global_step": 38450, "epoch": 323, "lr": 4.4470344962612714e-05} +{"train_loss": 0.0014827398117631674, "global_step": 38451, "epoch": 323, "lr": 4.446814304886178e-05} +{"train_loss": 0.002855083206668496, "global_step": 38452, "epoch": 323, "lr": 4.446594114597202e-05} +{"train_loss": 0.001724167144857347, "global_step": 38453, "epoch": 323, "lr": 4.446373925394782e-05} +{"train_loss": 0.0021396311931312084, "global_step": 38454, "epoch": 323, "lr": 4.446153737279346e-05} +{"train_loss": 0.0019166311249136925, "global_step": 38455, "epoch": 323, "lr": 4.44593355025133e-05} +{"train_loss": 0.0015676808543503284, "global_step": 38456, "epoch": 323, "lr": 4.4457133643111644e-05} +{"train_loss": 0.002334337681531906, "global_step": 38457, "epoch": 323, "lr": 4.445493179459279e-05} +{"train_loss": 0.0013178675435483456, "global_step": 38458, "epoch": 323, "lr": 4.445272995696111e-05} +{"train_loss": 0.0027708481065928936, "global_step": 38459, "epoch": 323, "lr": 4.4450528130220874e-05} +{"train_loss": 0.00269729970023036, "global_step": 38460, "epoch": 323, "lr": 4.444832631437646e-05} +{"train_loss": 0.001925165532156825, "global_step": 38461, "epoch": 323, "lr": 4.4446124509432144e-05} +{"train_loss": 0.0030959872528910637, "global_step": 38462, "epoch": 323, "lr": 4.444392271539228e-05} +{"train_loss": 0.0023560593836009502, "global_step": 38463, "epoch": 323, "lr": 4.4441720932261185e-05} +{"train_loss": 0.0015436363173648715, "global_step": 38464, "epoch": 323, "lr": 4.443951916004316e-05} +{"train_loss": 0.002220769878476858, "global_step": 38465, "epoch": 323, "lr": 4.443731739874256e-05} +{"train_loss": 0.0019144716206938028, "global_step": 38466, "epoch": 323, "lr": 4.4435115648363685e-05} +{"train_loss": 0.0012729261070489883, "global_step": 38467, "epoch": 323, "lr": 4.443291390891087e-05} +{"train_loss": 0.0022148345597088337, "global_step": 38468, "epoch": 323, "lr": 4.443071218038844e-05} +{"train_loss": 0.0018294730689376593, "global_step": 38469, "epoch": 323, "lr": 4.4428510462800693e-05} +{"train_loss": 0.0031775841489434242, "global_step": 38470, "epoch": 323, "lr": 4.442630875615199e-05} +{"train_loss": 0.0011474562343209982, "global_step": 38471, "epoch": 323, "lr": 4.4424107060446615e-05} +{"train_loss": 0.0031137524638324976, "global_step": 38472, "epoch": 323, "lr": 4.442190537568893e-05} +{"train_loss": 0.001960206311196089, "global_step": 38473, "epoch": 323, "lr": 4.441970370188322e-05} +{"train_loss": 0.0023582372814416885, "global_step": 38474, "epoch": 323, "lr": 4.4417502039033845e-05} +{"train_loss": 0.002241524402052164, "global_step": 38475, "epoch": 323, "lr": 4.4415300387145104e-05} +{"train_loss": 0.0015752359759062529, "global_step": 38476, "epoch": 323, "lr": 4.4413098746221306e-05} +{"train_loss": 0.0038226323667913675, "global_step": 38477, "epoch": 323, "lr": 4.4410897116266816e-05} +{"train_loss": 0.0036619030870497227, "global_step": 38478, "epoch": 323, "lr": 4.440869549728591e-05} +{"train_loss": 0.00171466707251966, "global_step": 38479, "epoch": 323, "lr": 4.4406493889282954e-05} +{"train_loss": 0.001358264940790832, "global_step": 38480, "epoch": 323, "lr": 4.440429229226222e-05} +{"train_loss": 0.0017798879416659474, "global_step": 38481, "epoch": 323, "lr": 4.440209070622809e-05} +{"train_loss": 0.0019599911756813526, "global_step": 38482, "epoch": 323, "lr": 4.439988913118485e-05} +{"train_loss": 0.0017896095523610711, "global_step": 38483, "epoch": 323, "lr": 4.439768756713682e-05} +{"train_loss": 0.002686513355001807, "global_step": 38484, "epoch": 323, "lr": 4.439548601408834e-05} +{"train_loss": 0.0021456375252455473, "global_step": 38485, "epoch": 323, "lr": 4.439328447204372e-05} +{"train_loss": 0.0012870188802480698, "global_step": 38486, "epoch": 323, "lr": 4.439108294100729e-05} +{"train_loss": 0.002468160353600979, "global_step": 38487, "epoch": 323, "lr": 4.438888142098338e-05} +{"train_loss": 0.0022249554749578238, "global_step": 38488, "epoch": 323, "lr": 4.438667991197627e-05} +{"train_loss": 0.0025426612701267004, "global_step": 38489, "epoch": 323, "lr": 4.438447841399035e-05} +{"train_loss": 0.001517389784567058, "global_step": 38490, "epoch": 323, "lr": 4.4382276927029874e-05} +{"train_loss": 0.0021672199945896864, "global_step": 38491, "epoch": 323, "lr": 4.4380075451099224e-05} +{"train_loss": 0.002505328506231308, "global_step": 38492, "epoch": 323, "lr": 4.4377873986202677e-05} +{"train_loss": 0.002677065087482333, "global_step": 38493, "epoch": 323, "lr": 4.4375672532344594e-05} +{"train_loss": 0.0014906068099662662, "global_step": 38494, "epoch": 323, "lr": 4.4373471089529274e-05} +{"train_loss": 0.001956123625859618, "global_step": 38495, "epoch": 323, "lr": 4.4371269657761025e-05} +{"train_loss": 0.001455969992093742, "global_step": 38496, "epoch": 323, "lr": 4.43690682370442e-05} +{"train_loss": 0.0029352116398513317, "global_step": 38497, "epoch": 323, "lr": 4.436686682738309e-05} +{"train_loss": 0.0022728540934622288, "global_step": 38498, "epoch": 323, "lr": 4.436466542878206e-05} +{"train_loss": 0.003027470549568534, "global_step": 38499, "epoch": 323, "lr": 4.4362464041245384e-05} +{"train_loss": 0.0009072772227227688, "global_step": 38500, "epoch": 323, "lr": 4.4360262664777416e-05} +{"train_loss": 0.0030713395681232214, "global_step": 38501, "epoch": 323, "lr": 4.4358061299382485e-05} +{"train_loss": 0.0020346094388514757, "global_step": 38502, "epoch": 323, "lr": 4.4355859945064876e-05} +{"train_loss": 0.0017128689214587212, "global_step": 38503, "epoch": 323, "lr": 4.435365860182895e-05} +{"train_loss": 0.0017624548636376858, "global_step": 38504, "epoch": 323, "lr": 4.4351457269679e-05} +{"train_loss": 0.002628110582008958, "global_step": 38505, "epoch": 323, "lr": 4.434925594861937e-05} +{"train_loss": 0.0013833158882334828, "global_step": 38506, "epoch": 323, "lr": 4.434705463865438e-05} +{"train_loss": 0.001621087547391653, "global_step": 38507, "epoch": 323, "lr": 4.4344853339788325e-05} +{"train_loss": 0.0016956399194896221, "global_step": 38508, "epoch": 323, "lr": 4.434265205202556e-05} +{"train_loss": 0.0020867176353931427, "global_step": 38509, "epoch": 323, "lr": 4.434045077537037e-05} +{"train_loss": 0.001770331640727818, "global_step": 38510, "epoch": 323, "lr": 4.433824950982713e-05} +{"train_loss": 0.0021623140200972557, "global_step": 38511, "epoch": 323, "lr": 4.433604825540011e-05} +{"train_loss": 0.0019859569147229195, "global_step": 38512, "epoch": 323, "lr": 4.433384701209367e-05} +{"train_loss": 0.002664684085175395, "global_step": 38513, "epoch": 323, "lr": 4.433164577991211e-05} +{"train_loss": 0.0008839692454785109, "global_step": 38514, "epoch": 323, "lr": 4.432944455885976e-05} +{"train_loss": 0.0015524575719609857, "global_step": 38515, "epoch": 323, "lr": 4.432724334894093e-05} +{"train_loss": 0.002560728695243597, "global_step": 38516, "epoch": 323, "lr": 4.432504215015996e-05} +{"train_loss": 0.0035590706393122673, "global_step": 38517, "epoch": 323, "lr": 4.4322840962521165e-05} +{"train_loss": 0.0018480506259948015, "global_step": 38518, "epoch": 323, "lr": 4.4320639786028866e-05} +{"train_loss": 0.0012500499142333865, "global_step": 38519, "epoch": 323, "lr": 4.4318438620687376e-05} +{"train_loss": 0.0011750500416383147, "global_step": 38520, "epoch": 323, "lr": 4.431623746650104e-05} +{"train_loss": 0.001689706346951425, "global_step": 38521, "epoch": 323, "lr": 4.431403632347414e-05} +{"train_loss": 0.0022609687875956297, "global_step": 38522, "epoch": 323, "lr": 4.4311835191611044e-05} +{"train_loss": 0.0022154399193823338, "global_step": 38523, "epoch": 323, "lr": 4.430963407091603e-05} +{"train_loss": 0.0015679356874898076, "global_step": 38524, "epoch": 323, "lr": 4.430743296139347e-05} +{"train_loss": 0.002404401544481516, "global_step": 38525, "epoch": 323, "lr": 4.4305231863047645e-05} +{"train_loss": 0.0011021316749975085, "global_step": 38526, "epoch": 323, "lr": 4.430303077588288e-05} +{"train_loss": 0.0011146378237754107, "global_step": 38527, "epoch": 323, "lr": 4.430082969990352e-05} +{"train_loss": 0.0015537373255938292, "global_step": 38528, "epoch": 323, "lr": 4.4298628635113855e-05} +{"train_loss": 0.0035079449880868196, "global_step": 38529, "epoch": 323, "lr": 4.429642758151824e-05} +{"train_loss": 0.0017922588158398867, "global_step": 38530, "epoch": 323, "lr": 4.4294226539120965e-05} +{"train_loss": 0.0020399431232362986, "global_step": 38531, "epoch": 323, "lr": 4.429202550792638e-05} +{"train_loss": 0.0016845008358359337, "global_step": 38532, "epoch": 323, "lr": 4.428982448793879e-05} +{"train_loss": 0.002776011126115918, "global_step": 38533, "epoch": 323, "lr": 4.4287623479162515e-05} +{"train_loss": 0.0021056681871414185, "global_step": 38534, "epoch": 323, "lr": 4.428542248160188e-05} +{"train_loss": 0.0017108182655647397, "global_step": 38535, "epoch": 323, "lr": 4.4283221495261195e-05} +{"train_loss": 0.0017813598969951272, "global_step": 38536, "epoch": 323, "lr": 4.428102052014482e-05} +{"train_loss": 0.0015576203586533666, "global_step": 38537, "epoch": 323, "lr": 4.427881955625705e-05} +{"train_loss": 0.001687730080448091, "global_step": 38538, "epoch": 323, "lr": 4.427661860360219e-05} +{"train_loss": 0.0014860533410683274, "global_step": 38539, "epoch": 323, "lr": 4.427441766218459e-05} +{"train_loss": 0.0032529481686651707, "global_step": 38540, "epoch": 323, "lr": 4.427221673200854e-05} +{"train_loss": 0.002661327365785837, "global_step": 38541, "epoch": 323, "lr": 4.427001581307841e-05} +{"train_loss": 0.0020873122848570347, "global_step": 38542, "epoch": 323, "lr": 4.426781490539846e-05} +{"train_loss": 0.0013253160286694765, "global_step": 38543, "epoch": 323, "lr": 4.4265614008973064e-05} +{"train_loss": 0.0018795221112668514, "global_step": 38544, "epoch": 323, "lr": 4.426341312380653e-05} +{"train_loss": 0.0021695620380342007, "global_step": 38545, "epoch": 323, "lr": 4.426121224990315e-05} +{"train_loss": 0.0017287575174123049, "global_step": 38546, "epoch": 323, "lr": 4.4259011387267286e-05} +{"train_loss": 0.0023913991171866655, "global_step": 38547, "epoch": 323, "lr": 4.425681053590322e-05} +{"train_loss": 0.0021672281436622143, "global_step": 38548, "epoch": 323, "lr": 4.42546096958153e-05} +{"train_loss": 0.0023197936825454235, "global_step": 38549, "epoch": 323, "lr": 4.425240886700783e-05} +{"train_loss": 0.0022646808065474033, "global_step": 38550, "epoch": 323, "lr": 4.4250208049485156e-05} +{"train_loss": 0.0011625804472714663, "global_step": 38551, "epoch": 323, "lr": 4.424800724325159e-05} +{"train_loss": 0.001880004769191146, "global_step": 38552, "epoch": 323, "lr": 4.424580644831143e-05} +{"train_loss": 0.0016988295828923583, "global_step": 38553, "epoch": 323, "lr": 4.424360566466903e-05} +{"train_loss": 0.0015584856737405062, "global_step": 38554, "epoch": 323, "lr": 4.4241404892328675e-05} +{"train_loss": 0.0020345054339899237, "global_step": 38555, "epoch": 323, "lr": 4.4239204131294734e-05, "val_loss": 0.016305267810821533} +{"train_loss": 0.0026807936374098063, "global_step": 38556, "epoch": 324, "lr": 4.4237003381571495e-05} +{"train_loss": 0.0019232719205319881, "global_step": 38557, "epoch": 324, "lr": 4.423480264316326e-05} +{"train_loss": 0.001690876903012395, "global_step": 38558, "epoch": 324, "lr": 4.42326019160744e-05} +{"train_loss": 0.001512856688350439, "global_step": 38559, "epoch": 324, "lr": 4.423040120030918e-05} +{"train_loss": 0.0024987156502902508, "global_step": 38560, "epoch": 324, "lr": 4.4228200495871984e-05} +{"train_loss": 0.0008620523731224239, "global_step": 38561, "epoch": 324, "lr": 4.422599980276708e-05} +{"train_loss": 0.0018702003872022033, "global_step": 38562, "epoch": 324, "lr": 4.422379912099882e-05} +{"train_loss": 0.0009661248186603189, "global_step": 38563, "epoch": 324, "lr": 4.4221598450571504e-05} +{"train_loss": 0.0028813977260142565, "global_step": 38564, "epoch": 324, "lr": 4.421939779148947e-05} +{"train_loss": 0.0018648331752046943, "global_step": 38565, "epoch": 324, "lr": 4.421719714375702e-05} +{"train_loss": 0.0025514147710055113, "global_step": 38566, "epoch": 324, "lr": 4.4214996507378494e-05} +{"train_loss": 0.0019786423072218895, "global_step": 38567, "epoch": 324, "lr": 4.4212795882358196e-05} +{"train_loss": 0.0032818750478327274, "global_step": 38568, "epoch": 324, "lr": 4.421059526870048e-05} +{"train_loss": 0.0019769605714827776, "global_step": 38569, "epoch": 324, "lr": 4.420839466640961e-05} +{"train_loss": 0.002130674198269844, "global_step": 38570, "epoch": 324, "lr": 4.420619407548996e-05} +{"train_loss": 0.0009851097129285336, "global_step": 38571, "epoch": 324, "lr": 4.420399349594581e-05} +{"train_loss": 0.0018635890446603298, "global_step": 38572, "epoch": 324, "lr": 4.420179292778152e-05} +{"train_loss": 0.002954707248136401, "global_step": 38573, "epoch": 324, "lr": 4.419959237100137e-05} +{"train_loss": 0.002987976185977459, "global_step": 38574, "epoch": 324, "lr": 4.4197391825609716e-05} +{"train_loss": 0.00140997557900846, "global_step": 38575, "epoch": 324, "lr": 4.419519129161087e-05} +{"train_loss": 0.002238825662061572, "global_step": 38576, "epoch": 324, "lr": 4.419299076900912e-05} +{"train_loss": 0.00125172920525074, "global_step": 38577, "epoch": 324, "lr": 4.419079025780883e-05} +{"train_loss": 0.005379881244152784, "global_step": 38578, "epoch": 324, "lr": 4.4188589758014286e-05} +{"train_loss": 0.0031929416581988335, "global_step": 38579, "epoch": 324, "lr": 4.418638926962985e-05} +{"train_loss": 0.0013870239490643144, "global_step": 38580, "epoch": 324, "lr": 4.418418879265979e-05} +{"train_loss": 0.0018983925692737103, "global_step": 38581, "epoch": 324, "lr": 4.418198832710848e-05} +{"train_loss": 0.001166459871456027, "global_step": 38582, "epoch": 324, "lr": 4.417978787298021e-05} +{"train_loss": 0.002541161375120282, "global_step": 38583, "epoch": 324, "lr": 4.417758743027928e-05} +{"train_loss": 0.002204151591286063, "global_step": 38584, "epoch": 324, "lr": 4.4175386999010064e-05} +{"train_loss": 0.0015369202010333538, "global_step": 38585, "epoch": 324, "lr": 4.417318657917684e-05} +{"train_loss": 0.0035063691902905703, "global_step": 38586, "epoch": 324, "lr": 4.417098617078394e-05} +{"train_loss": 0.0025524338707327843, "global_step": 38587, "epoch": 324, "lr": 4.416878577383571e-05} +{"train_loss": 0.001387882512062788, "global_step": 38588, "epoch": 324, "lr": 4.4166585388336414e-05} +{"train_loss": 0.002677375916391611, "global_step": 38589, "epoch": 324, "lr": 4.416438501429042e-05} +{"train_loss": 0.0018876140238717198, "global_step": 38590, "epoch": 324, "lr": 4.416218465170202e-05} +{"train_loss": 0.002091508125886321, "global_step": 38591, "epoch": 324, "lr": 4.415998430057557e-05} +{"train_loss": 0.0025253482162952423, "global_step": 38592, "epoch": 324, "lr": 4.415778396091534e-05} +{"train_loss": 0.0012882803566753864, "global_step": 38593, "epoch": 324, "lr": 4.41555836327257e-05} +{"train_loss": 0.0020095608197152615, "global_step": 38594, "epoch": 324, "lr": 4.415338331601094e-05} +{"train_loss": 0.0027884305454790592, "global_step": 38595, "epoch": 324, "lr": 4.4151183010775376e-05} +{"train_loss": 0.0013553404714912176, "global_step": 38596, "epoch": 324, "lr": 4.414898271702335e-05} +{"train_loss": 0.00226839748211205, "global_step": 38597, "epoch": 324, "lr": 4.414678243475916e-05} +{"train_loss": 0.004177646245807409, "global_step": 38598, "epoch": 324, "lr": 4.414458216398715e-05} +{"train_loss": 0.002796469023451209, "global_step": 38599, "epoch": 324, "lr": 4.414238190471163e-05} +{"train_loss": 0.0020965877920389175, "global_step": 38600, "epoch": 324, "lr": 4.414018165693691e-05} +{"train_loss": 0.002375206910073757, "global_step": 38601, "epoch": 324, "lr": 4.4137981420667324e-05} +{"train_loss": 0.002355175092816353, "global_step": 38602, "epoch": 324, "lr": 4.413578119590717e-05} +{"train_loss": 0.0021152750123292208, "global_step": 38603, "epoch": 324, "lr": 4.41335809826608e-05} +{"train_loss": 0.001826113322749734, "global_step": 38604, "epoch": 324, "lr": 4.4131380780932496e-05} +{"train_loss": 0.002021564869210124, "global_step": 38605, "epoch": 324, "lr": 4.412918059072663e-05} +{"train_loss": 0.0019876332953572273, "global_step": 38606, "epoch": 324, "lr": 4.412698041204748e-05} +{"train_loss": 0.0021475995890796185, "global_step": 38607, "epoch": 324, "lr": 4.4124780244899356e-05} +{"train_loss": 0.0024396884255111217, "global_step": 38608, "epoch": 324, "lr": 4.4122580089286626e-05} +{"train_loss": 0.0027184609789401293, "global_step": 38609, "epoch": 324, "lr": 4.4120379945213554e-05} +{"train_loss": 0.0010264411102980375, "global_step": 38610, "epoch": 324, "lr": 4.411817981268451e-05} +{"train_loss": 0.0016121220542117953, "global_step": 38611, "epoch": 324, "lr": 4.411597969170377e-05} +{"train_loss": 0.0014387377304956317, "global_step": 38612, "epoch": 324, "lr": 4.4113779582275697e-05} +{"train_loss": 0.0034088504035025835, "global_step": 38613, "epoch": 324, "lr": 4.4111579484404585e-05} +{"train_loss": 0.0007858174503780901, "global_step": 38614, "epoch": 324, "lr": 4.410937939809475e-05} +{"train_loss": 0.001379836699925363, "global_step": 38615, "epoch": 324, "lr": 4.4107179323350524e-05} +{"train_loss": 0.0012616146123036742, "global_step": 38616, "epoch": 324, "lr": 4.4104979260176213e-05} +{"train_loss": 0.0018644197843968868, "global_step": 38617, "epoch": 324, "lr": 4.4102779208576154e-05} +{"train_loss": 0.001954692183062434, "global_step": 38618, "epoch": 324, "lr": 4.410057916855465e-05} +{"train_loss": 0.002302099484950304, "global_step": 38619, "epoch": 324, "lr": 4.409837914011604e-05} +{"train_loss": 0.002229001373052597, "global_step": 38620, "epoch": 324, "lr": 4.409617912326464e-05} +{"train_loss": 0.0017290464602410793, "global_step": 38621, "epoch": 324, "lr": 4.409397911800474e-05} +{"train_loss": 0.001218073652125895, "global_step": 38622, "epoch": 324, "lr": 4.4091779124340696e-05} +{"train_loss": 0.0015711098676547408, "global_step": 38623, "epoch": 324, "lr": 4.4089579142276796e-05} +{"train_loss": 0.0012171769049018621, "global_step": 38624, "epoch": 324, "lr": 4.40873791718174e-05} +{"train_loss": 0.0013570112641900778, "global_step": 38625, "epoch": 324, "lr": 4.4085179212966796e-05} +{"train_loss": 0.0017769535770639777, "global_step": 38626, "epoch": 324, "lr": 4.408297926572929e-05} +{"train_loss": 0.003379856003448367, "global_step": 38627, "epoch": 324, "lr": 4.4080779330109254e-05} +{"train_loss": 0.0014145370805636048, "global_step": 38628, "epoch": 324, "lr": 4.407857940611094e-05} +{"train_loss": 0.0014525080332532525, "global_step": 38629, "epoch": 324, "lr": 4.407637949373874e-05} +{"train_loss": 0.002193954773247242, "global_step": 38630, "epoch": 324, "lr": 4.40741795929969e-05} +{"train_loss": 0.0012314331252127886, "global_step": 38631, "epoch": 324, "lr": 4.40719797038898e-05} +{"train_loss": 0.0014706227229908109, "global_step": 38632, "epoch": 324, "lr": 4.406977982642173e-05} +{"train_loss": 0.0007942951051518321, "global_step": 38633, "epoch": 324, "lr": 4.406757996059699e-05} +{"train_loss": 0.0013147459831088781, "global_step": 38634, "epoch": 324, "lr": 4.406538010641996e-05} +{"train_loss": 0.001578283729031682, "global_step": 38635, "epoch": 324, "lr": 4.406318026389489e-05} +{"train_loss": 0.0012009863276034594, "global_step": 38636, "epoch": 324, "lr": 4.406098043302616e-05} +{"train_loss": 0.0013359312433749437, "global_step": 38637, "epoch": 324, "lr": 4.4058780613818056e-05} +{"train_loss": 0.0021210387349128723, "global_step": 38638, "epoch": 324, "lr": 4.405658080627488e-05} +{"train_loss": 0.0015118787996470928, "global_step": 38639, "epoch": 324, "lr": 4.4054381010401e-05} +{"train_loss": 0.0018729633884504437, "global_step": 38640, "epoch": 324, "lr": 4.405218122620068e-05} +{"train_loss": 0.0015726449200883508, "global_step": 38641, "epoch": 324, "lr": 4.404998145367829e-05} +{"train_loss": 0.0023132101632654667, "global_step": 38642, "epoch": 324, "lr": 4.4047781692838104e-05} +{"train_loss": 0.00244781537912786, "global_step": 38643, "epoch": 324, "lr": 4.404558194368448e-05} +{"train_loss": 0.0010927491821348667, "global_step": 38644, "epoch": 324, "lr": 4.404338220622173e-05} +{"train_loss": 0.0014503574930131435, "global_step": 38645, "epoch": 324, "lr": 4.404118248045413e-05} +{"train_loss": 0.001317224116064608, "global_step": 38646, "epoch": 324, "lr": 4.403898276638605e-05} +{"train_loss": 0.0022322852164506912, "global_step": 38647, "epoch": 324, "lr": 4.4036783064021784e-05} +{"train_loss": 0.002719518495723605, "global_step": 38648, "epoch": 324, "lr": 4.403458337336566e-05} +{"train_loss": 0.001337189576588571, "global_step": 38649, "epoch": 324, "lr": 4.4032383694422e-05} +{"train_loss": 0.0020080783870071173, "global_step": 38650, "epoch": 324, "lr": 4.403018402719511e-05} +{"train_loss": 0.001291703782044351, "global_step": 38651, "epoch": 324, "lr": 4.402798437168933e-05} +{"train_loss": 0.001249571330845356, "global_step": 38652, "epoch": 324, "lr": 4.402578472790894e-05} +{"train_loss": 0.00201224721968174, "global_step": 38653, "epoch": 324, "lr": 4.402358509585831e-05} +{"train_loss": 0.0024840079713612795, "global_step": 38654, "epoch": 324, "lr": 4.402138547554171e-05} +{"train_loss": 0.00186020543333143, "global_step": 38655, "epoch": 324, "lr": 4.4019185866963496e-05} +{"train_loss": 0.0017587769543752074, "global_step": 38656, "epoch": 324, "lr": 4.401698627012798e-05} +{"train_loss": 0.0016634395578876138, "global_step": 38657, "epoch": 324, "lr": 4.401478668503945e-05} +{"train_loss": 0.002441881690174341, "global_step": 38658, "epoch": 324, "lr": 4.401258711170226e-05} +{"train_loss": 0.0013456280576065183, "global_step": 38659, "epoch": 324, "lr": 4.4010387550120705e-05} +{"train_loss": 0.0029980770777910948, "global_step": 38660, "epoch": 324, "lr": 4.400818800029912e-05} +{"train_loss": 0.0015999068273231387, "global_step": 38661, "epoch": 324, "lr": 4.400598846224181e-05} +{"train_loss": 0.002976988209411502, "global_step": 38662, "epoch": 324, "lr": 4.400378893595312e-05} +{"train_loss": 0.0009040178847499192, "global_step": 38663, "epoch": 324, "lr": 4.400158942143734e-05} +{"train_loss": 0.0010055293096229434, "global_step": 38664, "epoch": 324, "lr": 4.399938991869879e-05} +{"train_loss": 0.0018448291812092066, "global_step": 38665, "epoch": 324, "lr": 4.3997190427741805e-05} +{"train_loss": 0.00173747178632766, "global_step": 38666, "epoch": 324, "lr": 4.399499094857069e-05} +{"train_loss": 0.0014921355759724975, "global_step": 38667, "epoch": 324, "lr": 4.3992791481189773e-05} +{"train_loss": 0.0011165940668433905, "global_step": 38668, "epoch": 324, "lr": 4.399059202560336e-05} +{"train_loss": 0.001888059196062386, "global_step": 38669, "epoch": 324, "lr": 4.39883925818158e-05} +{"train_loss": 0.0029889182187616825, "global_step": 38670, "epoch": 324, "lr": 4.398619314983138e-05} +{"train_loss": 0.0010388776427134871, "global_step": 38671, "epoch": 324, "lr": 4.398399372965441e-05} +{"train_loss": 0.0012201484059914947, "global_step": 38672, "epoch": 324, "lr": 4.398179432128925e-05} +{"train_loss": 0.0015639285556972027, "global_step": 38673, "epoch": 324, "lr": 4.397959492474016e-05} +{"train_loss": 0.0019446170048498619, "global_step": 38674, "epoch": 324, "lr": 4.397739554001153e-05, "val_loss": 0.0220317579805851} +{"train_loss": 0.0009835195960476995, "global_step": 38675, "epoch": 325, "lr": 4.3975196167107635e-05} +{"train_loss": 0.0015042859595268965, "global_step": 38676, "epoch": 325, "lr": 4.3972996806032775e-05} +{"train_loss": 0.0014842209639027715, "global_step": 38677, "epoch": 325, "lr": 4.397079745679131e-05} +{"train_loss": 0.0014063314301893115, "global_step": 38678, "epoch": 325, "lr": 4.3968598119387524e-05} +{"train_loss": 0.0019229899626225233, "global_step": 38679, "epoch": 325, "lr": 4.3966398793825774e-05} +{"train_loss": 0.00233289273455739, "global_step": 38680, "epoch": 325, "lr": 4.3964199480110335e-05} +{"train_loss": 0.0018826820887625217, "global_step": 38681, "epoch": 325, "lr": 4.396200017824555e-05} +{"train_loss": 0.001052652602083981, "global_step": 38682, "epoch": 325, "lr": 4.3959800888235746e-05} +{"train_loss": 0.0020846836268901825, "global_step": 38683, "epoch": 325, "lr": 4.395760161008521e-05} +{"train_loss": 0.0015841011190786958, "global_step": 38684, "epoch": 325, "lr": 4.395540234379829e-05} +{"train_loss": 0.0018153423443436623, "global_step": 38685, "epoch": 325, "lr": 4.395320308937928e-05} +{"train_loss": 0.001453430624678731, "global_step": 38686, "epoch": 325, "lr": 4.395100384683253e-05} +{"train_loss": 0.0011999242706224322, "global_step": 38687, "epoch": 325, "lr": 4.3948804616162306e-05} +{"train_loss": 0.0021001920104026794, "global_step": 38688, "epoch": 325, "lr": 4.394660539737299e-05} +{"train_loss": 0.0022819004952907562, "global_step": 38689, "epoch": 325, "lr": 4.3944406190468865e-05} +{"train_loss": 0.002030924428254366, "global_step": 38690, "epoch": 325, "lr": 4.3942206995454225e-05} +{"train_loss": 0.0012745371786877513, "global_step": 38691, "epoch": 325, "lr": 4.394000781233344e-05} +{"train_loss": 0.002086516935378313, "global_step": 38692, "epoch": 325, "lr": 4.393780864111078e-05} +{"train_loss": 0.001794877927750349, "global_step": 38693, "epoch": 325, "lr": 4.393560948179061e-05} +{"train_loss": 0.0012047392083331943, "global_step": 38694, "epoch": 325, "lr": 4.393341033437721e-05} +{"train_loss": 0.0012645379174500704, "global_step": 38695, "epoch": 325, "lr": 4.3931211198874914e-05} +{"train_loss": 0.0008337803883478045, "global_step": 38696, "epoch": 325, "lr": 4.392901207528803e-05} +{"train_loss": 0.0019687251187860966, "global_step": 38697, "epoch": 325, "lr": 4.392681296362089e-05} +{"train_loss": 0.002646411070600152, "global_step": 38698, "epoch": 325, "lr": 4.392461386387779e-05} +{"train_loss": 0.0012134670978412032, "global_step": 38699, "epoch": 325, "lr": 4.392241477606307e-05} +{"train_loss": 0.001590998494066298, "global_step": 38700, "epoch": 325, "lr": 4.392021570018104e-05} +{"train_loss": 0.0010892795398831367, "global_step": 38701, "epoch": 325, "lr": 4.3918016636236024e-05} +{"train_loss": 0.002143769757822156, "global_step": 38702, "epoch": 325, "lr": 4.391581758423232e-05} +{"train_loss": 0.0017657430144026875, "global_step": 38703, "epoch": 325, "lr": 4.391361854417427e-05} +{"train_loss": 0.0025763255544006824, "global_step": 38704, "epoch": 325, "lr": 4.3911419516066166e-05} +{"train_loss": 0.0016693755751475692, "global_step": 38705, "epoch": 325, "lr": 4.390922049991235e-05} +{"train_loss": 0.0013991228770464659, "global_step": 38706, "epoch": 325, "lr": 4.390702149571714e-05} +{"train_loss": 0.001523687387816608, "global_step": 38707, "epoch": 325, "lr": 4.3904822503484814e-05} +{"train_loss": 0.0024621710181236267, "global_step": 38708, "epoch": 325, "lr": 4.3902623523219744e-05} +{"train_loss": 0.0021267018746584654, "global_step": 38709, "epoch": 325, "lr": 4.39004245549262e-05} +{"train_loss": 0.0021470196079462767, "global_step": 38710, "epoch": 325, "lr": 4.389822559860854e-05} +{"train_loss": 0.002109876833856106, "global_step": 38711, "epoch": 325, "lr": 4.3896026654271036e-05} +{"train_loss": 0.0025715925730764866, "global_step": 38712, "epoch": 325, "lr": 4.389382772191806e-05} +{"train_loss": 0.0020561369601637125, "global_step": 38713, "epoch": 325, "lr": 4.389162880155389e-05} +{"train_loss": 0.001615704270079732, "global_step": 38714, "epoch": 325, "lr": 4.388942989318285e-05} +{"train_loss": 0.0018302409444004297, "global_step": 38715, "epoch": 325, "lr": 4.388723099680926e-05} +{"train_loss": 0.0025394910480827093, "global_step": 38716, "epoch": 325, "lr": 4.3885032112437435e-05} +{"train_loss": 0.00177613808773458, "global_step": 38717, "epoch": 325, "lr": 4.388283324007172e-05} +{"train_loss": 0.001333122025243938, "global_step": 38718, "epoch": 325, "lr": 4.388063437971638e-05} +{"train_loss": 0.002004191279411316, "global_step": 38719, "epoch": 325, "lr": 4.3878435531375785e-05} +{"train_loss": 0.001729840412735939, "global_step": 38720, "epoch": 325, "lr": 4.387623669505423e-05} +{"train_loss": 0.002235904335975647, "global_step": 38721, "epoch": 325, "lr": 4.3874037870756e-05} +{"train_loss": 0.0010397431906312704, "global_step": 38722, "epoch": 325, "lr": 4.3871839058485466e-05} +{"train_loss": 0.0013204425340518355, "global_step": 38723, "epoch": 325, "lr": 4.38696402582469e-05} +{"train_loss": 0.002562388312071562, "global_step": 38724, "epoch": 325, "lr": 4.386744147004467e-05} +{"train_loss": 0.0012408546172082424, "global_step": 38725, "epoch": 325, "lr": 4.386524269388306e-05} +{"train_loss": 0.0016159663209691644, "global_step": 38726, "epoch": 325, "lr": 4.386304392976636e-05} +{"train_loss": 0.0009577899472787976, "global_step": 38727, "epoch": 325, "lr": 4.386084517769895e-05} +{"train_loss": 0.0016109556891024113, "global_step": 38728, "epoch": 325, "lr": 4.3858646437685085e-05} +{"train_loss": 0.0014665116323158145, "global_step": 38729, "epoch": 325, "lr": 4.3856447709729135e-05} +{"train_loss": 0.0019596097990870476, "global_step": 38730, "epoch": 325, "lr": 4.385424899383538e-05} +{"train_loss": 0.0017728107050061226, "global_step": 38731, "epoch": 325, "lr": 4.385205029000815e-05} +{"train_loss": 0.0020482733380049467, "global_step": 38732, "epoch": 325, "lr": 4.384985159825178e-05} +{"train_loss": 0.0014541026903316379, "global_step": 38733, "epoch": 325, "lr": 4.384765291857055e-05} +{"train_loss": 0.0024674590677022934, "global_step": 38734, "epoch": 325, "lr": 4.3845454250968815e-05} +{"train_loss": 0.001591921434737742, "global_step": 38735, "epoch": 325, "lr": 4.384325559545085e-05} +{"train_loss": 0.001623630290850997, "global_step": 38736, "epoch": 325, "lr": 4.384105695202102e-05} +{"train_loss": 0.001334930071607232, "global_step": 38737, "epoch": 325, "lr": 4.383885832068359e-05} +{"train_loss": 0.0033925019670277834, "global_step": 38738, "epoch": 325, "lr": 4.3836659701442926e-05} +{"train_loss": 0.0019276385428383946, "global_step": 38739, "epoch": 325, "lr": 4.3834461094303324e-05} +{"train_loss": 0.0026786704547703266, "global_step": 38740, "epoch": 325, "lr": 4.3832262499269076e-05} +{"train_loss": 0.002362999599426985, "global_step": 38741, "epoch": 325, "lr": 4.3830063916344547e-05} +{"train_loss": 0.001644363161176443, "global_step": 38742, "epoch": 325, "lr": 4.3827865345534004e-05} +{"train_loss": 0.0012955149868503213, "global_step": 38743, "epoch": 325, "lr": 4.3825666786841813e-05} +{"train_loss": 0.00196982454508543, "global_step": 38744, "epoch": 325, "lr": 4.382346824027225e-05} +{"train_loss": 0.002156935166567564, "global_step": 38745, "epoch": 325, "lr": 4.382126970582965e-05} +{"train_loss": 0.0029326551593840122, "global_step": 38746, "epoch": 325, "lr": 4.3819071183518324e-05} +{"train_loss": 0.002374710515141487, "global_step": 38747, "epoch": 325, "lr": 4.381687267334259e-05} +{"train_loss": 0.0018729050643742085, "global_step": 38748, "epoch": 325, "lr": 4.381467417530677e-05} +{"train_loss": 0.002271628938615322, "global_step": 38749, "epoch": 325, "lr": 4.381247568941518e-05} +{"train_loss": 0.0031224628910422325, "global_step": 38750, "epoch": 325, "lr": 4.3810277215672125e-05} +{"train_loss": 0.0015908335335552692, "global_step": 38751, "epoch": 325, "lr": 4.380807875408194e-05} +{"train_loss": 0.0015190268168225884, "global_step": 38752, "epoch": 325, "lr": 4.380588030464892e-05} +{"train_loss": 0.002409896580502391, "global_step": 38753, "epoch": 325, "lr": 4.380368186737741e-05} +{"train_loss": 0.0022749335039407015, "global_step": 38754, "epoch": 325, "lr": 4.380148344227168e-05} +{"train_loss": 0.002519160509109497, "global_step": 38755, "epoch": 325, "lr": 4.37992850293361e-05} +{"train_loss": 0.0025044307112693787, "global_step": 38756, "epoch": 325, "lr": 4.3797086628574954e-05} +{"train_loss": 0.0026625492610037327, "global_step": 38757, "epoch": 325, "lr": 4.379488823999256e-05} +{"train_loss": 0.0014090304030105472, "global_step": 38758, "epoch": 325, "lr": 4.379268986359325e-05} +{"train_loss": 0.002688076114282012, "global_step": 38759, "epoch": 325, "lr": 4.3790491499381314e-05} +{"train_loss": 0.002180566545575857, "global_step": 38760, "epoch": 325, "lr": 4.37882931473611e-05} +{"train_loss": 0.0018290772568434477, "global_step": 38761, "epoch": 325, "lr": 4.378609480753689e-05} +{"train_loss": 0.0016846939688548446, "global_step": 38762, "epoch": 325, "lr": 4.378389647991305e-05} +{"train_loss": 0.0017177551053464413, "global_step": 38763, "epoch": 325, "lr": 4.378169816449385e-05} +{"train_loss": 0.001354234991595149, "global_step": 38764, "epoch": 325, "lr": 4.37794998612836e-05} +{"train_loss": 0.0031258740928024054, "global_step": 38765, "epoch": 325, "lr": 4.3777301570286664e-05} +{"train_loss": 0.0019913320429623127, "global_step": 38766, "epoch": 325, "lr": 4.377510329150731e-05} +{"train_loss": 0.0011052221525460482, "global_step": 38767, "epoch": 325, "lr": 4.377290502494991e-05} +{"train_loss": 0.0012083423789590597, "global_step": 38768, "epoch": 325, "lr": 4.377070677061871e-05} +{"train_loss": 0.0012595977168530226, "global_step": 38769, "epoch": 325, "lr": 4.376850852851808e-05} +{"train_loss": 0.0030804506968706846, "global_step": 38770, "epoch": 325, "lr": 4.376631029865233e-05} +{"train_loss": 0.0017927981680259109, "global_step": 38771, "epoch": 325, "lr": 4.376411208102574e-05} +{"train_loss": 0.0017272033728659153, "global_step": 38772, "epoch": 325, "lr": 4.3761913875642665e-05} +{"train_loss": 0.0024022734723985195, "global_step": 38773, "epoch": 325, "lr": 4.375971568250738e-05} +{"train_loss": 0.002179773524403572, "global_step": 38774, "epoch": 325, "lr": 4.3757517501624264e-05} +{"train_loss": 0.001117329578846693, "global_step": 38775, "epoch": 325, "lr": 4.375531933299758e-05} +{"train_loss": 0.002099960343912244, "global_step": 38776, "epoch": 325, "lr": 4.375312117663165e-05} +{"train_loss": 0.0024257057812064886, "global_step": 38777, "epoch": 325, "lr": 4.375092303253081e-05} +{"train_loss": 0.002953767077997327, "global_step": 38778, "epoch": 325, "lr": 4.374872490069936e-05} +{"train_loss": 0.0015319661470130086, "global_step": 38779, "epoch": 325, "lr": 4.3746526781141614e-05} +{"train_loss": 0.0024597267620265484, "global_step": 38780, "epoch": 325, "lr": 4.37443286738619e-05} +{"train_loss": 0.0020647167693823576, "global_step": 38781, "epoch": 325, "lr": 4.374213057886453e-05} +{"train_loss": 0.0024813704658299685, "global_step": 38782, "epoch": 325, "lr": 4.373993249615383e-05} +{"train_loss": 0.0020704332273453474, "global_step": 38783, "epoch": 325, "lr": 4.373773442573408e-05} +{"train_loss": 0.002742596436291933, "global_step": 38784, "epoch": 325, "lr": 4.373553636760964e-05} +{"train_loss": 0.0022751425858587027, "global_step": 38785, "epoch": 325, "lr": 4.373333832178478e-05} +{"train_loss": 0.0016386640490964055, "global_step": 38786, "epoch": 325, "lr": 4.3731140288263874e-05} +{"train_loss": 0.003952528350055218, "global_step": 38787, "epoch": 325, "lr": 4.3728942267051174e-05} +{"train_loss": 0.002295027719810605, "global_step": 38788, "epoch": 325, "lr": 4.372674425815105e-05} +{"train_loss": 0.001453921664506197, "global_step": 38789, "epoch": 325, "lr": 4.372454626156779e-05} +{"train_loss": 0.0015108814695850015, "global_step": 38790, "epoch": 325, "lr": 4.3722348277305696e-05} +{"train_loss": 0.002491225488483906, "global_step": 38791, "epoch": 325, "lr": 4.3720150305369125e-05} +{"train_loss": 0.0023362257052212954, "global_step": 38792, "epoch": 325, "lr": 4.371795234576234e-05} +{"train_loss": 0.0019271929852054024, "global_step": 38793, "epoch": 325, "lr": 4.3715754398489706e-05, "val_loss": 0.023789087310433388, "train_action_mse_error": 3.296639260952361e-05} +{"train_loss": 0.002139089163392782, "global_step": 38794, "epoch": 326, "lr": 4.3713556463555505e-05} +{"train_loss": 0.0021305475383996964, "global_step": 38795, "epoch": 326, "lr": 4.3711358540964065e-05} +{"train_loss": 0.0013525098329409957, "global_step": 38796, "epoch": 326, "lr": 4.37091606307197e-05} +{"train_loss": 0.0023621597792953253, "global_step": 38797, "epoch": 326, "lr": 4.370696273282673e-05} +{"train_loss": 0.0020133720245212317, "global_step": 38798, "epoch": 326, "lr": 4.370476484728947e-05} +{"train_loss": 0.0020364688243716955, "global_step": 38799, "epoch": 326, "lr": 4.3702566974112214e-05} +{"train_loss": 0.001970648532733321, "global_step": 38800, "epoch": 326, "lr": 4.3700369113299325e-05} +{"train_loss": 0.0017923836130648851, "global_step": 38801, "epoch": 326, "lr": 4.3698171264855075e-05} +{"train_loss": 0.001485173823311925, "global_step": 38802, "epoch": 326, "lr": 4.3695973428783774e-05} +{"train_loss": 0.0021439206320792437, "global_step": 38803, "epoch": 326, "lr": 4.369377560508979e-05} +{"train_loss": 0.002394644310697913, "global_step": 38804, "epoch": 326, "lr": 4.3691577793777374e-05} +{"train_loss": 0.0019587294664233923, "global_step": 38805, "epoch": 326, "lr": 4.368937999485089e-05} +{"train_loss": 0.002029524417594075, "global_step": 38806, "epoch": 326, "lr": 4.368718220831461e-05} +{"train_loss": 0.002202901989221573, "global_step": 38807, "epoch": 326, "lr": 4.3684984434172896e-05} +{"train_loss": 0.0028424812480807304, "global_step": 38808, "epoch": 326, "lr": 4.368278667243005e-05} +{"train_loss": 0.0014006803976371884, "global_step": 38809, "epoch": 326, "lr": 4.368058892309035e-05} +{"train_loss": 0.0025778182316571474, "global_step": 38810, "epoch": 326, "lr": 4.367839118615816e-05} +{"train_loss": 0.002973308553919196, "global_step": 38811, "epoch": 326, "lr": 4.367619346163775e-05} +{"train_loss": 0.0021275351755321026, "global_step": 38812, "epoch": 326, "lr": 4.367399574953348e-05} +{"train_loss": 0.0024614138528704643, "global_step": 38813, "epoch": 326, "lr": 4.3671798049849636e-05} +{"train_loss": 0.0016847412334755063, "global_step": 38814, "epoch": 326, "lr": 4.3669600362590525e-05} +{"train_loss": 0.001117297331802547, "global_step": 38815, "epoch": 326, "lr": 4.3667402687760504e-05} +{"train_loss": 0.0013802493922412395, "global_step": 38816, "epoch": 326, "lr": 4.3665205025363836e-05} +{"train_loss": 0.0014114400837570429, "global_step": 38817, "epoch": 326, "lr": 4.3663007375404885e-05} +{"train_loss": 0.0032298078294843435, "global_step": 38818, "epoch": 326, "lr": 4.366080973788792e-05} +{"train_loss": 0.0019819678273051977, "global_step": 38819, "epoch": 326, "lr": 4.3658612112817296e-05} +{"train_loss": 0.0025440379977226257, "global_step": 38820, "epoch": 326, "lr": 4.365641450019732e-05} +{"train_loss": 0.0012170023983344436, "global_step": 38821, "epoch": 326, "lr": 4.365421690003226e-05} +{"train_loss": 0.0017978711985051632, "global_step": 38822, "epoch": 326, "lr": 4.3652019312326506e-05} +{"train_loss": 0.003886588616296649, "global_step": 38823, "epoch": 326, "lr": 4.3649821737084304e-05} +{"train_loss": 0.0018464319873601198, "global_step": 38824, "epoch": 326, "lr": 4.364762417431001e-05} +{"train_loss": 0.001196942524984479, "global_step": 38825, "epoch": 326, "lr": 4.364542662400794e-05} +{"train_loss": 0.0018677528714761138, "global_step": 38826, "epoch": 326, "lr": 4.364322908618237e-05} +{"train_loss": 0.0009762314148247242, "global_step": 38827, "epoch": 326, "lr": 4.3641031560837654e-05} +{"train_loss": 0.0026012782473117113, "global_step": 38828, "epoch": 326, "lr": 4.3638834047978094e-05} +{"train_loss": 0.002002433640882373, "global_step": 38829, "epoch": 326, "lr": 4.3636636547608e-05} +{"train_loss": 0.0015349764144048095, "global_step": 38830, "epoch": 326, "lr": 4.363443905973169e-05} +{"train_loss": 0.00250932271592319, "global_step": 38831, "epoch": 326, "lr": 4.363224158435348e-05} +{"train_loss": 0.002359328093007207, "global_step": 38832, "epoch": 326, "lr": 4.363004412147769e-05} +{"train_loss": 0.0033315278124064207, "global_step": 38833, "epoch": 326, "lr": 4.362784667110861e-05} +{"train_loss": 0.003218044526875019, "global_step": 38834, "epoch": 326, "lr": 4.36256492332506e-05} +{"train_loss": 0.001300473348237574, "global_step": 38835, "epoch": 326, "lr": 4.362345180790792e-05} +{"train_loss": 0.0022549116984009743, "global_step": 38836, "epoch": 326, "lr": 4.3621254395084935e-05} +{"train_loss": 0.0021821141708642244, "global_step": 38837, "epoch": 326, "lr": 4.361905699478591e-05} +{"train_loss": 0.0017131586791947484, "global_step": 38838, "epoch": 326, "lr": 4.3616859607015205e-05} +{"train_loss": 0.002910237992182374, "global_step": 38839, "epoch": 326, "lr": 4.361466223177711e-05} +{"train_loss": 0.0028995268512517214, "global_step": 38840, "epoch": 326, "lr": 4.3612464869075934e-05} +{"train_loss": 0.0023310179822146893, "global_step": 38841, "epoch": 326, "lr": 4.361026751891602e-05} +{"train_loss": 0.0013648250605911016, "global_step": 38842, "epoch": 326, "lr": 4.360807018130164e-05} +{"train_loss": 0.0014679089654237032, "global_step": 38843, "epoch": 326, "lr": 4.360587285623715e-05} +{"train_loss": 0.0024623009376227856, "global_step": 38844, "epoch": 326, "lr": 4.3603675543726836e-05} +{"train_loss": 0.0014085336588323116, "global_step": 38845, "epoch": 326, "lr": 4.3601478243775024e-05} +{"train_loss": 0.002169150160625577, "global_step": 38846, "epoch": 326, "lr": 4.3599280956386025e-05} +{"train_loss": 0.0014185153413563967, "global_step": 38847, "epoch": 326, "lr": 4.359708368156415e-05} +{"train_loss": 0.0033193316776305437, "global_step": 38848, "epoch": 326, "lr": 4.359488641931372e-05} +{"train_loss": 0.0022122494410723448, "global_step": 38849, "epoch": 326, "lr": 4.359268916963903e-05} +{"train_loss": 0.0020537818782031536, "global_step": 38850, "epoch": 326, "lr": 4.3590491932544444e-05} +{"train_loss": 0.002086251275613904, "global_step": 38851, "epoch": 326, "lr": 4.358829470803424e-05} +{"train_loss": 0.0020183115266263485, "global_step": 38852, "epoch": 326, "lr": 4.3586097496112704e-05} +{"train_loss": 0.001127417664974928, "global_step": 38853, "epoch": 326, "lr": 4.3583900296784205e-05} +{"train_loss": 0.0012397393584251404, "global_step": 38854, "epoch": 326, "lr": 4.358170311005302e-05} +{"train_loss": 0.0013914239825680852, "global_step": 38855, "epoch": 326, "lr": 4.3579505935923484e-05} +{"train_loss": 0.0007933739107102156, "global_step": 38856, "epoch": 326, "lr": 4.357730877439988e-05} +{"train_loss": 0.0016628603916615248, "global_step": 38857, "epoch": 326, "lr": 4.357511162548657e-05} +{"train_loss": 0.001861018594354391, "global_step": 38858, "epoch": 326, "lr": 4.357291448918785e-05} +{"train_loss": 0.0010934420861303806, "global_step": 38859, "epoch": 326, "lr": 4.3570717365508e-05} +{"train_loss": 0.0016363781178370118, "global_step": 38860, "epoch": 326, "lr": 4.356852025445138e-05} +{"train_loss": 0.0017841034568846226, "global_step": 38861, "epoch": 326, "lr": 4.356632315602226e-05} +{"train_loss": 0.0021538129076361656, "global_step": 38862, "epoch": 326, "lr": 4.3564126070224984e-05} +{"train_loss": 0.0022370980586856604, "global_step": 38863, "epoch": 326, "lr": 4.356192899706388e-05} +{"train_loss": 0.001510524656623602, "global_step": 38864, "epoch": 326, "lr": 4.355973193654321e-05} +{"train_loss": 0.0023520004469901323, "global_step": 38865, "epoch": 326, "lr": 4.355753488866734e-05} +{"train_loss": 0.0021522212773561478, "global_step": 38866, "epoch": 326, "lr": 4.355533785344055e-05} +{"train_loss": 0.0018053033854812384, "global_step": 38867, "epoch": 326, "lr": 4.355314083086718e-05} +{"train_loss": 0.0011859716614708304, "global_step": 38868, "epoch": 326, "lr": 4.355094382095151e-05} +{"train_loss": 0.0019470874685794115, "global_step": 38869, "epoch": 326, "lr": 4.354874682369789e-05} +{"train_loss": 0.0018867228645831347, "global_step": 38870, "epoch": 326, "lr": 4.3546549839110616e-05} +{"train_loss": 0.002533574588596821, "global_step": 38871, "epoch": 326, "lr": 4.354435286719398e-05} +{"train_loss": 0.003635881468653679, "global_step": 38872, "epoch": 326, "lr": 4.3542155907952344e-05} +{"train_loss": 0.0016181791434064507, "global_step": 38873, "epoch": 326, "lr": 4.353995896138997e-05} +{"train_loss": 0.0017860052175819874, "global_step": 38874, "epoch": 326, "lr": 4.353776202751123e-05} +{"train_loss": 0.002953128656372428, "global_step": 38875, "epoch": 326, "lr": 4.3535565106320376e-05} +{"train_loss": 0.002985558472573757, "global_step": 38876, "epoch": 326, "lr": 4.353336819782176e-05} +{"train_loss": 0.0011796586913987994, "global_step": 38877, "epoch": 326, "lr": 4.353117130201968e-05} +{"train_loss": 0.0009763866546563804, "global_step": 38878, "epoch": 326, "lr": 4.352897441891846e-05} +{"train_loss": 0.0015459469286724925, "global_step": 38879, "epoch": 326, "lr": 4.35267775485224e-05} +{"train_loss": 0.0015226172981783748, "global_step": 38880, "epoch": 326, "lr": 4.352458069083582e-05} +{"train_loss": 0.002077455399557948, "global_step": 38881, "epoch": 326, "lr": 4.3522383845863034e-05} +{"train_loss": 0.0013609501766040921, "global_step": 38882, "epoch": 326, "lr": 4.352018701360837e-05} +{"train_loss": 0.0017120251432061195, "global_step": 38883, "epoch": 326, "lr": 4.3517990194076104e-05} +{"train_loss": 0.0014915239298716187, "global_step": 38884, "epoch": 326, "lr": 4.3515793387270594e-05} +{"train_loss": 0.001565971877425909, "global_step": 38885, "epoch": 326, "lr": 4.351359659319611e-05} +{"train_loss": 0.0014622246380895376, "global_step": 38886, "epoch": 326, "lr": 4.3511399811857006e-05} +{"train_loss": 0.0021909631323069334, "global_step": 38887, "epoch": 326, "lr": 4.3509203043257554e-05} +{"train_loss": 0.0020041409879922867, "global_step": 38888, "epoch": 326, "lr": 4.3507006287402106e-05} +{"train_loss": 0.001250204280950129, "global_step": 38889, "epoch": 326, "lr": 4.3504809544294964e-05} +{"train_loss": 0.0021485574543476105, "global_step": 38890, "epoch": 326, "lr": 4.350261281394041e-05} +{"train_loss": 0.001147689763456583, "global_step": 38891, "epoch": 326, "lr": 4.3500416096342806e-05} +{"train_loss": 0.0035819702316075563, "global_step": 38892, "epoch": 326, "lr": 4.3498219391506416e-05} +{"train_loss": 0.0012497756397351623, "global_step": 38893, "epoch": 326, "lr": 4.34960226994356e-05} +{"train_loss": 0.0010015969164669514, "global_step": 38894, "epoch": 326, "lr": 4.3493826020134635e-05} +{"train_loss": 0.0014428164577111602, "global_step": 38895, "epoch": 326, "lr": 4.349162935360786e-05} +{"train_loss": 0.002038312144577503, "global_step": 38896, "epoch": 326, "lr": 4.348943269985956e-05} +{"train_loss": 0.0013726608594879508, "global_step": 38897, "epoch": 326, "lr": 4.348723605889406e-05} +{"train_loss": 0.0017226985655725002, "global_step": 38898, "epoch": 326, "lr": 4.34850394307157e-05} +{"train_loss": 0.001880634925328195, "global_step": 38899, "epoch": 326, "lr": 4.348284281532874e-05} +{"train_loss": 0.001799191813915968, "global_step": 38900, "epoch": 326, "lr": 4.348064621273755e-05} +{"train_loss": 0.0026004337705671787, "global_step": 38901, "epoch": 326, "lr": 4.3478449622946404e-05} +{"train_loss": 0.002241020556539297, "global_step": 38902, "epoch": 326, "lr": 4.3476253045959615e-05} +{"train_loss": 0.0012413475196808577, "global_step": 38903, "epoch": 326, "lr": 4.347405648178152e-05} +{"train_loss": 0.0030254675075411797, "global_step": 38904, "epoch": 326, "lr": 4.34718599304164e-05} +{"train_loss": 0.0008304959628731012, "global_step": 38905, "epoch": 326, "lr": 4.3469663391868606e-05} +{"train_loss": 0.0016523507656529546, "global_step": 38906, "epoch": 326, "lr": 4.3467466866142414e-05} +{"train_loss": 0.003171410644426942, "global_step": 38907, "epoch": 326, "lr": 4.346527035324217e-05} +{"train_loss": 0.0020587402395904064, "global_step": 38908, "epoch": 326, "lr": 4.3463073853172174e-05} +{"train_loss": 0.0014628440840169787, "global_step": 38909, "epoch": 326, "lr": 4.346087736593671e-05} +{"train_loss": 0.0012838082620874047, "global_step": 38910, "epoch": 326, "lr": 4.345868089154013e-05} +{"train_loss": 0.0015126076759770513, "global_step": 38911, "epoch": 326, "lr": 4.3456484429986724e-05} +{"train_loss": 0.0019552848588463953, "global_step": 38912, "epoch": 326, "lr": 4.345428798128081e-05, "val_loss": 0.007556971162557602} +{"train_loss": 0.0026918898802250624, "global_step": 38913, "epoch": 327, "lr": 4.345209154542671e-05} +{"train_loss": 0.0011740544578060508, "global_step": 38914, "epoch": 327, "lr": 4.344989512242872e-05} +{"train_loss": 0.0016861973563209176, "global_step": 38915, "epoch": 327, "lr": 4.3447698712291176e-05} +{"train_loss": 0.0013407591031864285, "global_step": 38916, "epoch": 327, "lr": 4.344550231501836e-05} +{"train_loss": 0.0018641476053744555, "global_step": 38917, "epoch": 327, "lr": 4.3443305930614606e-05} +{"train_loss": 0.0040623038075864315, "global_step": 38918, "epoch": 327, "lr": 4.3441109559084217e-05} +{"train_loss": 0.0017353682778775692, "global_step": 38919, "epoch": 327, "lr": 4.343891320043152e-05} +{"train_loss": 0.0015811969060450792, "global_step": 38920, "epoch": 327, "lr": 4.343671685466082e-05} +{"train_loss": 0.0009013070375658572, "global_step": 38921, "epoch": 327, "lr": 4.34345205217764e-05} +{"train_loss": 0.0026195270475000143, "global_step": 38922, "epoch": 327, "lr": 4.343232420178262e-05} +{"train_loss": 0.0014834427274763584, "global_step": 38923, "epoch": 327, "lr": 4.3430127894683745e-05} +{"train_loss": 0.0020165182650089264, "global_step": 38924, "epoch": 327, "lr": 4.342793160048414e-05} +{"train_loss": 0.0017963172867894173, "global_step": 38925, "epoch": 327, "lr": 4.3425735319188065e-05} +{"train_loss": 0.0011124220909550786, "global_step": 38926, "epoch": 327, "lr": 4.3423539050799875e-05} +{"train_loss": 0.0019032564014196396, "global_step": 38927, "epoch": 327, "lr": 4.342134279532386e-05} +{"train_loss": 0.0030923844315111637, "global_step": 38928, "epoch": 327, "lr": 4.3419146552764335e-05} +{"train_loss": 0.0032319400925189257, "global_step": 38929, "epoch": 327, "lr": 4.3416950323125605e-05} +{"train_loss": 0.0019603611435741186, "global_step": 38930, "epoch": 327, "lr": 4.3414754106411994e-05} +{"train_loss": 0.001893034321255982, "global_step": 38931, "epoch": 327, "lr": 4.3412557902627806e-05} +{"train_loss": 0.0016156398924067616, "global_step": 38932, "epoch": 327, "lr": 4.341036171177738e-05} +{"train_loss": 0.0017589048948138952, "global_step": 38933, "epoch": 327, "lr": 4.340816553386497e-05} +{"train_loss": 0.002717735478654504, "global_step": 38934, "epoch": 327, "lr": 4.340596936889495e-05} +{"train_loss": 0.0021318518556654453, "global_step": 38935, "epoch": 327, "lr": 4.340377321687158e-05} +{"train_loss": 0.00198824773542583, "global_step": 38936, "epoch": 327, "lr": 4.3401577077799216e-05} +{"train_loss": 0.0029824397061020136, "global_step": 38937, "epoch": 327, "lr": 4.3399380951682135e-05} +{"train_loss": 0.0016534009482711554, "global_step": 38938, "epoch": 327, "lr": 4.3397184838524686e-05} +{"train_loss": 0.002163716359063983, "global_step": 38939, "epoch": 327, "lr": 4.339498873833116e-05} +{"train_loss": 0.0015198045875877142, "global_step": 38940, "epoch": 327, "lr": 4.339279265110584e-05} +{"train_loss": 0.0015937254065647721, "global_step": 38941, "epoch": 327, "lr": 4.3390596576853086e-05} +{"train_loss": 0.0030521240551024675, "global_step": 38942, "epoch": 327, "lr": 4.338840051557718e-05} +{"train_loss": 0.0017330424161627889, "global_step": 38943, "epoch": 327, "lr": 4.3386204467282455e-05} +{"train_loss": 0.0009484007605351508, "global_step": 38944, "epoch": 327, "lr": 4.33840084319732e-05} +{"train_loss": 0.0015332790790125728, "global_step": 38945, "epoch": 327, "lr": 4.338181240965374e-05} +{"train_loss": 0.0013892928836867213, "global_step": 38946, "epoch": 327, "lr": 4.337961640032838e-05} +{"train_loss": 0.0023841538932174444, "global_step": 38947, "epoch": 327, "lr": 4.3377420404001435e-05} +{"train_loss": 0.002339686267077923, "global_step": 38948, "epoch": 327, "lr": 4.3375224420677236e-05} +{"train_loss": 0.0019302464788779616, "global_step": 38949, "epoch": 327, "lr": 4.337302845036005e-05} +{"train_loss": 0.0027743743266910315, "global_step": 38950, "epoch": 327, "lr": 4.3370832493054235e-05} +{"train_loss": 0.0026017609052360058, "global_step": 38951, "epoch": 327, "lr": 4.336863654876409e-05} +{"train_loss": 0.0026696512941271067, "global_step": 38952, "epoch": 327, "lr": 4.336644061749389e-05} +{"train_loss": 0.0022839398588985205, "global_step": 38953, "epoch": 327, "lr": 4.3364244699248e-05} +{"train_loss": 0.0018275559414178133, "global_step": 38954, "epoch": 327, "lr": 4.336204879403069e-05} +{"train_loss": 0.003712437581270933, "global_step": 38955, "epoch": 327, "lr": 4.33598529018463e-05} +{"train_loss": 0.001181205385364592, "global_step": 38956, "epoch": 327, "lr": 4.335765702269911e-05} +{"train_loss": 0.0017733101267367601, "global_step": 38957, "epoch": 327, "lr": 4.3355461156593476e-05} +{"train_loss": 0.0024364558048546314, "global_step": 38958, "epoch": 327, "lr": 4.335326530353369e-05} +{"train_loss": 0.0018029852071776986, "global_step": 38959, "epoch": 327, "lr": 4.3351069463524016e-05} +{"train_loss": 0.0026717677246779203, "global_step": 38960, "epoch": 327, "lr": 4.3348873636568835e-05} +{"train_loss": 0.001823993748985231, "global_step": 38961, "epoch": 327, "lr": 4.334667782267242e-05} +{"train_loss": 0.0011900789104402065, "global_step": 38962, "epoch": 327, "lr": 4.33444820218391e-05} +{"train_loss": 0.002460100222378969, "global_step": 38963, "epoch": 327, "lr": 4.3342286234073186e-05} +{"train_loss": 0.0018669964047148824, "global_step": 38964, "epoch": 327, "lr": 4.334009045937896e-05} +{"train_loss": 0.001866332022473216, "global_step": 38965, "epoch": 327, "lr": 4.3337894697760786e-05} +{"train_loss": 0.0018880559364333749, "global_step": 38966, "epoch": 327, "lr": 4.3335698949222905e-05} +{"train_loss": 0.002057506935670972, "global_step": 38967, "epoch": 327, "lr": 4.33335032137697e-05} +{"train_loss": 0.002125654835253954, "global_step": 38968, "epoch": 327, "lr": 4.333130749140543e-05} +{"train_loss": 0.0010936431353911757, "global_step": 38969, "epoch": 327, "lr": 4.3329111782134436e-05} +{"train_loss": 0.0015463449526578188, "global_step": 38970, "epoch": 327, "lr": 4.332691608596102e-05} +{"train_loss": 0.0021042018197476864, "global_step": 38971, "epoch": 327, "lr": 4.3324720402889477e-05} +{"train_loss": 0.0010963749373331666, "global_step": 38972, "epoch": 327, "lr": 4.3322524732924155e-05} +{"train_loss": 0.0015889335190877318, "global_step": 38973, "epoch": 327, "lr": 4.332032907606932e-05} +{"train_loss": 0.0020626066252589226, "global_step": 38974, "epoch": 327, "lr": 4.3318133432329314e-05} +{"train_loss": 0.002867776434868574, "global_step": 38975, "epoch": 327, "lr": 4.331593780170843e-05} +{"train_loss": 0.0015672051813453436, "global_step": 38976, "epoch": 327, "lr": 4.331374218421101e-05} +{"train_loss": 0.002176034962758422, "global_step": 38977, "epoch": 327, "lr": 4.331154657984133e-05} +{"train_loss": 0.002778570167720318, "global_step": 38978, "epoch": 327, "lr": 4.330935098860371e-05} +{"train_loss": 0.0013011886039748788, "global_step": 38979, "epoch": 327, "lr": 4.3307155410502464e-05} +{"train_loss": 0.001579433330334723, "global_step": 38980, "epoch": 327, "lr": 4.330495984554191e-05} +{"train_loss": 0.001824763836339116, "global_step": 38981, "epoch": 327, "lr": 4.330276429372634e-05} +{"train_loss": 0.0016919837798923254, "global_step": 38982, "epoch": 327, "lr": 4.33005687550601e-05} +{"train_loss": 0.001455600024200976, "global_step": 38983, "epoch": 327, "lr": 4.329837322954745e-05} +{"train_loss": 0.002510550431907177, "global_step": 38984, "epoch": 327, "lr": 4.3296177717192755e-05} +{"train_loss": 0.001178933773189783, "global_step": 38985, "epoch": 327, "lr": 4.329398221800027e-05} +{"train_loss": 0.0024693855084478855, "global_step": 38986, "epoch": 327, "lr": 4.329178673197436e-05} +{"train_loss": 0.001746898633427918, "global_step": 38987, "epoch": 327, "lr": 4.328959125911929e-05} +{"train_loss": 0.0034762914292514324, "global_step": 38988, "epoch": 327, "lr": 4.3287395799439414e-05} +{"train_loss": 0.001919776201248169, "global_step": 38989, "epoch": 327, "lr": 4.3285200352939015e-05} +{"train_loss": 0.0017079456010833383, "global_step": 38990, "epoch": 327, "lr": 4.3283004919622386e-05} +{"train_loss": 0.001503120525740087, "global_step": 38991, "epoch": 327, "lr": 4.3280809499493884e-05} +{"train_loss": 0.0024562987964600325, "global_step": 38992, "epoch": 327, "lr": 4.327861409255777e-05} +{"train_loss": 0.00262941000983119, "global_step": 38993, "epoch": 327, "lr": 4.3276418698818404e-05} +{"train_loss": 0.002235294785350561, "global_step": 38994, "epoch": 327, "lr": 4.327422331828005e-05} +{"train_loss": 0.0018415097147226334, "global_step": 38995, "epoch": 327, "lr": 4.3272027950947046e-05} +{"train_loss": 0.0013590666931122541, "global_step": 38996, "epoch": 327, "lr": 4.326983259682371e-05} +{"train_loss": 0.0016344471368938684, "global_step": 38997, "epoch": 327, "lr": 4.3267637255914315e-05} +{"train_loss": 0.002209221478551626, "global_step": 38998, "epoch": 327, "lr": 4.326544192822322e-05} +{"train_loss": 0.0026064650155603886, "global_step": 38999, "epoch": 327, "lr": 4.326324661375469e-05} +{"train_loss": 0.001705659320577979, "global_step": 39000, "epoch": 327, "lr": 4.3261051312513074e-05} +{"train_loss": 0.0027513981331139803, "global_step": 39001, "epoch": 327, "lr": 4.325885602450266e-05} +{"train_loss": 0.003734911559149623, "global_step": 39002, "epoch": 327, "lr": 4.3256660749727746e-05} +{"train_loss": 0.0025168494321405888, "global_step": 39003, "epoch": 327, "lr": 4.325446548819268e-05} +{"train_loss": 0.002821170026436448, "global_step": 39004, "epoch": 327, "lr": 4.3252270239901724e-05} +{"train_loss": 0.0022143935784697533, "global_step": 39005, "epoch": 327, "lr": 4.3250075004859244e-05} +{"train_loss": 0.0020639109425246716, "global_step": 39006, "epoch": 327, "lr": 4.324787978306949e-05} +{"train_loss": 0.0011874450137838721, "global_step": 39007, "epoch": 327, "lr": 4.3245684574536825e-05} +{"train_loss": 0.0016541002551093698, "global_step": 39008, "epoch": 327, "lr": 4.324348937926553e-05} +{"train_loss": 0.0013994470937177539, "global_step": 39009, "epoch": 327, "lr": 4.3241294197259925e-05} +{"train_loss": 0.0018789463210850954, "global_step": 39010, "epoch": 327, "lr": 4.323909902852431e-05} +{"train_loss": 0.002716574352234602, "global_step": 39011, "epoch": 327, "lr": 4.323690387306301e-05} +{"train_loss": 0.0026280859019607306, "global_step": 39012, "epoch": 327, "lr": 4.323470873088032e-05} +{"train_loss": 0.002854486694559455, "global_step": 39013, "epoch": 327, "lr": 4.323251360198057e-05} +{"train_loss": 0.0015025113243609667, "global_step": 39014, "epoch": 327, "lr": 4.3230318486368034e-05} +{"train_loss": 0.003825426334515214, "global_step": 39015, "epoch": 327, "lr": 4.3228123384047066e-05} +{"train_loss": 0.003657127730548382, "global_step": 39016, "epoch": 327, "lr": 4.322592829502193e-05} +{"train_loss": 0.0019887203816324472, "global_step": 39017, "epoch": 327, "lr": 4.322373321929699e-05} +{"train_loss": 0.0019788523204624653, "global_step": 39018, "epoch": 327, "lr": 4.3221538156876496e-05} +{"train_loss": 0.0013360850280150771, "global_step": 39019, "epoch": 327, "lr": 4.321934310776481e-05} +{"train_loss": 0.0019369684159755707, "global_step": 39020, "epoch": 327, "lr": 4.321714807196622e-05} +{"train_loss": 0.0017385142855346203, "global_step": 39021, "epoch": 327, "lr": 4.321495304948501e-05} +{"train_loss": 0.0024115638807415962, "global_step": 39022, "epoch": 327, "lr": 4.3212758040325544e-05} +{"train_loss": 0.0035005020909011364, "global_step": 39023, "epoch": 327, "lr": 4.321056304449208e-05} +{"train_loss": 0.00212337588891387, "global_step": 39024, "epoch": 327, "lr": 4.320836806198897e-05} +{"train_loss": 0.0015826087910681963, "global_step": 39025, "epoch": 327, "lr": 4.320617309282048e-05} +{"train_loss": 0.001127513125538826, "global_step": 39026, "epoch": 327, "lr": 4.3203978136990965e-05} +{"train_loss": 0.0017622383311390877, "global_step": 39027, "epoch": 327, "lr": 4.320178319450471e-05} +{"train_loss": 0.0018842240097001195, "global_step": 39028, "epoch": 327, "lr": 4.319958826536602e-05} +{"train_loss": 0.002337871817871928, "global_step": 39029, "epoch": 327, "lr": 4.3197393349579207e-05} +{"train_loss": 0.0009480706648901105, "global_step": 39030, "epoch": 327, "lr": 4.319519844714858e-05} +{"train_loss": 0.0020593073622112265, "global_step": 39031, "epoch": 327, "lr": 4.3193003558078485e-05, "val_loss": 0.013390910811722279} +{"train_loss": 0.0014512811321765184, "global_step": 39032, "epoch": 328, "lr": 4.3190808682373186e-05} +{"train_loss": 0.003924044314771891, "global_step": 39033, "epoch": 328, "lr": 4.3188613820036995e-05} +{"train_loss": 0.0010451114503666759, "global_step": 39034, "epoch": 328, "lr": 4.318641897107425e-05} +{"train_loss": 0.0014156915713101625, "global_step": 39035, "epoch": 328, "lr": 4.318422413548921e-05} +{"train_loss": 0.0015326327411457896, "global_step": 39036, "epoch": 328, "lr": 4.318202931328626e-05} +{"train_loss": 0.0020401643123477697, "global_step": 39037, "epoch": 328, "lr": 4.317983450446964e-05} +{"train_loss": 0.0012928087962791324, "global_step": 39038, "epoch": 328, "lr": 4.31776397090437e-05} +{"train_loss": 0.002007733564823866, "global_step": 39039, "epoch": 328, "lr": 4.317544492701274e-05} +{"train_loss": 0.0017746296944096684, "global_step": 39040, "epoch": 328, "lr": 4.3173250158381045e-05} +{"train_loss": 0.001640522968955338, "global_step": 39041, "epoch": 328, "lr": 4.317105540315297e-05} +{"train_loss": 0.003072167281061411, "global_step": 39042, "epoch": 328, "lr": 4.316886066133277e-05} +{"train_loss": 0.0011725700460374355, "global_step": 39043, "epoch": 328, "lr": 4.316666593292479e-05} +{"train_loss": 0.0017122008139267564, "global_step": 39044, "epoch": 328, "lr": 4.3164471217933335e-05} +{"train_loss": 0.0016237430972978473, "global_step": 39045, "epoch": 328, "lr": 4.316227651636271e-05} +{"train_loss": 0.0014539255062118173, "global_step": 39046, "epoch": 328, "lr": 4.316008182821724e-05} +{"train_loss": 0.002687138272449374, "global_step": 39047, "epoch": 328, "lr": 4.315788715350119e-05} +{"train_loss": 0.002269335091114044, "global_step": 39048, "epoch": 328, "lr": 4.3155692492218925e-05} +{"train_loss": 0.0026192967779934406, "global_step": 39049, "epoch": 328, "lr": 4.3153497844374705e-05} +{"train_loss": 0.0023170141503214836, "global_step": 39050, "epoch": 328, "lr": 4.315130320997287e-05} +{"train_loss": 0.0011300226906314492, "global_step": 39051, "epoch": 328, "lr": 4.314910858901773e-05} +{"train_loss": 0.0032400034833699465, "global_step": 39052, "epoch": 328, "lr": 4.314691398151356e-05} +{"train_loss": 0.002865266753360629, "global_step": 39053, "epoch": 328, "lr": 4.314471938746472e-05} +{"train_loss": 0.0013093181187286973, "global_step": 39054, "epoch": 328, "lr": 4.314252480687546e-05} +{"train_loss": 0.002562857698649168, "global_step": 39055, "epoch": 328, "lr": 4.314033023975015e-05} +{"train_loss": 0.003491076407954097, "global_step": 39056, "epoch": 328, "lr": 4.313813568609304e-05} +{"train_loss": 0.002747936639934778, "global_step": 39057, "epoch": 328, "lr": 4.313594114590849e-05} +{"train_loss": 0.002344283740967512, "global_step": 39058, "epoch": 328, "lr": 4.313374661920078e-05} +{"train_loss": 0.0018833607900887728, "global_step": 39059, "epoch": 328, "lr": 4.3131552105974224e-05} +{"train_loss": 0.0022508041001856327, "global_step": 39060, "epoch": 328, "lr": 4.3129357606233125e-05} +{"train_loss": 0.0037507247179746628, "global_step": 39061, "epoch": 328, "lr": 4.3127163119981805e-05} +{"train_loss": 0.002658511744812131, "global_step": 39062, "epoch": 328, "lr": 4.312496864722456e-05} +{"train_loss": 0.0034182185772806406, "global_step": 39063, "epoch": 328, "lr": 4.312277418796572e-05} +{"train_loss": 0.00184676016215235, "global_step": 39064, "epoch": 328, "lr": 4.312057974220956e-05} +{"train_loss": 0.00101923116017133, "global_step": 39065, "epoch": 328, "lr": 4.311838530996043e-05} +{"train_loss": 0.001741283806040883, "global_step": 39066, "epoch": 328, "lr": 4.311619089122258e-05} +{"train_loss": 0.0025186443235725164, "global_step": 39067, "epoch": 328, "lr": 4.311399648600038e-05} +{"train_loss": 0.0029413187876343727, "global_step": 39068, "epoch": 328, "lr": 4.31118020942981e-05} +{"train_loss": 0.0022148059215396643, "global_step": 39069, "epoch": 328, "lr": 4.310960771612008e-05} +{"train_loss": 0.0013244317378848791, "global_step": 39070, "epoch": 328, "lr": 4.31074133514706e-05} +{"train_loss": 0.0011230346281081438, "global_step": 39071, "epoch": 328, "lr": 4.310521900035396e-05} +{"train_loss": 0.002691976260393858, "global_step": 39072, "epoch": 328, "lr": 4.310302466277451e-05} +{"train_loss": 0.0014193715760484338, "global_step": 39073, "epoch": 328, "lr": 4.310083033873651e-05} +{"train_loss": 0.002096538431942463, "global_step": 39074, "epoch": 328, "lr": 4.309863602824431e-05} +{"train_loss": 0.002901986939832568, "global_step": 39075, "epoch": 328, "lr": 4.309644173130219e-05} +{"train_loss": 0.0017120410921052098, "global_step": 39076, "epoch": 328, "lr": 4.3094247447914485e-05} +{"train_loss": 0.0014975018566474319, "global_step": 39077, "epoch": 328, "lr": 4.309205317808548e-05} +{"train_loss": 0.001807178370654583, "global_step": 39078, "epoch": 328, "lr": 4.308985892181948e-05} +{"train_loss": 0.001751359086483717, "global_step": 39079, "epoch": 328, "lr": 4.308766467912082e-05} +{"train_loss": 0.0037874169647693634, "global_step": 39080, "epoch": 328, "lr": 4.308547044999377e-05} +{"train_loss": 0.002065122127532959, "global_step": 39081, "epoch": 328, "lr": 4.308327623444268e-05} +{"train_loss": 0.0026529852766543627, "global_step": 39082, "epoch": 328, "lr": 4.308108203247185e-05} +{"train_loss": 0.001820181729272008, "global_step": 39083, "epoch": 328, "lr": 4.307888784408555e-05} +{"train_loss": 0.0013905272353440523, "global_step": 39084, "epoch": 328, "lr": 4.3076693669288126e-05} +{"train_loss": 0.00155100307893008, "global_step": 39085, "epoch": 328, "lr": 4.3074499508083856e-05} +{"train_loss": 0.0023499091621488333, "global_step": 39086, "epoch": 328, "lr": 4.3072305360477095e-05} +{"train_loss": 0.002179431263357401, "global_step": 39087, "epoch": 328, "lr": 4.3070111226472097e-05} +{"train_loss": 0.002358119934797287, "global_step": 39088, "epoch": 328, "lr": 4.306791710607322e-05} +{"train_loss": 0.002441256772726774, "global_step": 39089, "epoch": 328, "lr": 4.3065722999284745e-05} +{"train_loss": 0.0015184053918346763, "global_step": 39090, "epoch": 328, "lr": 4.306352890611096e-05} +{"train_loss": 0.002172621665522456, "global_step": 39091, "epoch": 328, "lr": 4.306133482655622e-05} +{"train_loss": 0.0012832926586270332, "global_step": 39092, "epoch": 328, "lr": 4.305914076062478e-05} +{"train_loss": 0.0018588351085782051, "global_step": 39093, "epoch": 328, "lr": 4.3056946708320985e-05} +{"train_loss": 0.0024520852603018284, "global_step": 39094, "epoch": 328, "lr": 4.305475266964914e-05} +{"train_loss": 0.0011113386135548353, "global_step": 39095, "epoch": 328, "lr": 4.305255864461355e-05} +{"train_loss": 0.0013296965043991804, "global_step": 39096, "epoch": 328, "lr": 4.305036463321851e-05} +{"train_loss": 0.003259182209149003, "global_step": 39097, "epoch": 328, "lr": 4.304817063546833e-05} +{"train_loss": 0.003412791993469, "global_step": 39098, "epoch": 328, "lr": 4.304597665136735e-05} +{"train_loss": 0.0014830828877165914, "global_step": 39099, "epoch": 328, "lr": 4.304378268091982e-05} +{"train_loss": 0.003139867912977934, "global_step": 39100, "epoch": 328, "lr": 4.304158872413011e-05} +{"train_loss": 0.0014148507034406066, "global_step": 39101, "epoch": 328, "lr": 4.303939478100249e-05} +{"train_loss": 0.0017718957969918847, "global_step": 39102, "epoch": 328, "lr": 4.303720085154126e-05} +{"train_loss": 0.002047120127826929, "global_step": 39103, "epoch": 328, "lr": 4.303500693575075e-05} +{"train_loss": 0.0019632522016763687, "global_step": 39104, "epoch": 328, "lr": 4.303281303363525e-05} +{"train_loss": 0.0019582859240472317, "global_step": 39105, "epoch": 328, "lr": 4.3030619145199106e-05} +{"train_loss": 0.0014287346275523305, "global_step": 39106, "epoch": 328, "lr": 4.302842527044656e-05} +{"train_loss": 0.0022545685060322285, "global_step": 39107, "epoch": 328, "lr": 4.3026231409381984e-05} +{"train_loss": 0.001827543368563056, "global_step": 39108, "epoch": 328, "lr": 4.302403756200964e-05} +{"train_loss": 0.0012774913338944316, "global_step": 39109, "epoch": 328, "lr": 4.302184372833386e-05} +{"train_loss": 0.002103352453559637, "global_step": 39110, "epoch": 328, "lr": 4.301964990835895e-05} +{"train_loss": 0.0029350868426263332, "global_step": 39111, "epoch": 328, "lr": 4.301745610208921e-05} +{"train_loss": 0.001838656491599977, "global_step": 39112, "epoch": 328, "lr": 4.301526230952894e-05} +{"train_loss": 0.0018308007856830955, "global_step": 39113, "epoch": 328, "lr": 4.301306853068245e-05} +{"train_loss": 0.003717993851751089, "global_step": 39114, "epoch": 328, "lr": 4.301087476555408e-05} +{"train_loss": 0.0008316783350892365, "global_step": 39115, "epoch": 328, "lr": 4.30086810141481e-05} +{"train_loss": 0.0010051729623228312, "global_step": 39116, "epoch": 328, "lr": 4.300648727646881e-05} +{"train_loss": 0.0022631031461060047, "global_step": 39117, "epoch": 328, "lr": 4.300429355252056e-05} +{"train_loss": 0.0035549188032746315, "global_step": 39118, "epoch": 328, "lr": 4.300209984230761e-05} +{"train_loss": 0.0010548238642513752, "global_step": 39119, "epoch": 328, "lr": 4.299990614583431e-05} +{"train_loss": 0.002491987543180585, "global_step": 39120, "epoch": 328, "lr": 4.2997712463104947e-05} +{"train_loss": 0.002643843647092581, "global_step": 39121, "epoch": 328, "lr": 4.299551879412381e-05} +{"train_loss": 0.0027806484140455723, "global_step": 39122, "epoch": 328, "lr": 4.299332513889524e-05} +{"train_loss": 0.0013479393674060702, "global_step": 39123, "epoch": 328, "lr": 4.29911314974235e-05} +{"train_loss": 0.0022034316789358854, "global_step": 39124, "epoch": 328, "lr": 4.298893786971295e-05} +{"train_loss": 0.0015290755545720458, "global_step": 39125, "epoch": 328, "lr": 4.298674425576786e-05} +{"train_loss": 0.0017431828891858459, "global_step": 39126, "epoch": 328, "lr": 4.298455065559256e-05} +{"train_loss": 0.0016811012756079435, "global_step": 39127, "epoch": 328, "lr": 4.2982357069191336e-05} +{"train_loss": 0.002218585694208741, "global_step": 39128, "epoch": 328, "lr": 4.2980163496568496e-05} +{"train_loss": 0.0012355017242953181, "global_step": 39129, "epoch": 328, "lr": 4.297796993772837e-05} +{"train_loss": 0.0023856654297560453, "global_step": 39130, "epoch": 328, "lr": 4.2975776392675235e-05} +{"train_loss": 0.0023095912765711546, "global_step": 39131, "epoch": 328, "lr": 4.2973582861413434e-05} +{"train_loss": 0.0019006725633516908, "global_step": 39132, "epoch": 328, "lr": 4.297138934394725e-05} +{"train_loss": 0.0014125033048912883, "global_step": 39133, "epoch": 328, "lr": 4.296919584028097e-05} +{"train_loss": 0.0034340168349444866, "global_step": 39134, "epoch": 328, "lr": 4.296700235041895e-05} +{"train_loss": 0.0026144643779844046, "global_step": 39135, "epoch": 328, "lr": 4.296480887436544e-05} +{"train_loss": 0.0022274404764175415, "global_step": 39136, "epoch": 328, "lr": 4.2962615412124804e-05} +{"train_loss": 0.002446920843794942, "global_step": 39137, "epoch": 328, "lr": 4.29604219637013e-05} +{"train_loss": 0.0019347253255546093, "global_step": 39138, "epoch": 328, "lr": 4.295822852909927e-05} +{"train_loss": 0.0014067136216908693, "global_step": 39139, "epoch": 328, "lr": 4.2956035108323014e-05} +{"train_loss": 0.001676743384450674, "global_step": 39140, "epoch": 328, "lr": 4.29538417013768e-05} +{"train_loss": 0.0017354519804939628, "global_step": 39141, "epoch": 328, "lr": 4.295164830826498e-05} +{"train_loss": 0.002176903188228607, "global_step": 39142, "epoch": 328, "lr": 4.294945492899185e-05} +{"train_loss": 0.0011941570555791259, "global_step": 39143, "epoch": 328, "lr": 4.294726156356171e-05} +{"train_loss": 0.001051710918545723, "global_step": 39144, "epoch": 328, "lr": 4.294506821197886e-05} +{"train_loss": 0.0017157658003270626, "global_step": 39145, "epoch": 328, "lr": 4.294287487424762e-05} +{"train_loss": 0.001456915051676333, "global_step": 39146, "epoch": 328, "lr": 4.294068155037231e-05} +{"train_loss": 0.003104723058640957, "global_step": 39147, "epoch": 328, "lr": 4.293848824035719e-05} +{"train_loss": 0.0018316295463591814, "global_step": 39148, "epoch": 328, "lr": 4.2936294944206615e-05} +{"train_loss": 0.0021825237199664116, "global_step": 39149, "epoch": 328, "lr": 4.293410166192485e-05} +{"train_loss": 0.002062407580983019, "global_step": 39150, "epoch": 328, "lr": 4.293190839351624e-05, "val_loss": 0.010349627584218979} +{"train_loss": 0.0016381186433136463, "global_step": 39151, "epoch": 329, "lr": 4.2929715138985074e-05} +{"train_loss": 0.001903651049360633, "global_step": 39152, "epoch": 329, "lr": 4.2927521898335635e-05} +{"train_loss": 0.0020020506344735622, "global_step": 39153, "epoch": 329, "lr": 4.292532867157227e-05} +{"train_loss": 0.00187154789455235, "global_step": 39154, "epoch": 329, "lr": 4.2923135458699246e-05} +{"train_loss": 0.0011254693381488323, "global_step": 39155, "epoch": 329, "lr": 4.292094225972092e-05} +{"train_loss": 0.002158127957955003, "global_step": 39156, "epoch": 329, "lr": 4.291874907464154e-05} +{"train_loss": 0.0016912303399294615, "global_step": 39157, "epoch": 329, "lr": 4.291655590346546e-05} +{"train_loss": 0.00161185790784657, "global_step": 39158, "epoch": 329, "lr": 4.2914362746196954e-05} +{"train_loss": 0.0015197702450677752, "global_step": 39159, "epoch": 329, "lr": 4.291216960284034e-05} +{"train_loss": 0.001325288088992238, "global_step": 39160, "epoch": 329, "lr": 4.2909976473399926e-05} +{"train_loss": 0.0009878786513581872, "global_step": 39161, "epoch": 329, "lr": 4.2907783357880015e-05} +{"train_loss": 0.002129514468833804, "global_step": 39162, "epoch": 329, "lr": 4.290559025628491e-05} +{"train_loss": 0.0013703074073418975, "global_step": 39163, "epoch": 329, "lr": 4.290339716861892e-05} +{"train_loss": 0.0017669630469754338, "global_step": 39164, "epoch": 329, "lr": 4.290120409488636e-05} +{"train_loss": 0.002110046800225973, "global_step": 39165, "epoch": 329, "lr": 4.289901103509154e-05} +{"train_loss": 0.0029746193904429674, "global_step": 39166, "epoch": 329, "lr": 4.2896817989238726e-05} +{"train_loss": 0.0007730632205493748, "global_step": 39167, "epoch": 329, "lr": 4.289462495733227e-05} +{"train_loss": 0.0016778141725808382, "global_step": 39168, "epoch": 329, "lr": 4.289243193937644e-05} +{"train_loss": 0.0026703716721385717, "global_step": 39169, "epoch": 329, "lr": 4.289023893537558e-05} +{"train_loss": 0.0011328147957101464, "global_step": 39170, "epoch": 329, "lr": 4.288804594533398e-05} +{"train_loss": 0.0014662460889667273, "global_step": 39171, "epoch": 329, "lr": 4.2885852969255916e-05} +{"train_loss": 0.0020200915168970823, "global_step": 39172, "epoch": 329, "lr": 4.288366000714574e-05} +{"train_loss": 0.002765075536444783, "global_step": 39173, "epoch": 329, "lr": 4.288146705900772e-05} +{"train_loss": 0.0023278642911463976, "global_step": 39174, "epoch": 329, "lr": 4.28792741248462e-05} +{"train_loss": 0.0014137605903670192, "global_step": 39175, "epoch": 329, "lr": 4.2877081204665445e-05} +{"train_loss": 0.0013655420625582337, "global_step": 39176, "epoch": 329, "lr": 4.2874888298469785e-05} +{"train_loss": 0.0015099101001396775, "global_step": 39177, "epoch": 329, "lr": 4.287269540626354e-05} +{"train_loss": 0.0014266098150983453, "global_step": 39178, "epoch": 329, "lr": 4.2870502528050966e-05} +{"train_loss": 0.0021932211238890886, "global_step": 39179, "epoch": 329, "lr": 4.2868309663836426e-05} +{"train_loss": 0.002028262009844184, "global_step": 39180, "epoch": 329, "lr": 4.286611681362417e-05} +{"train_loss": 0.0021188657265156507, "global_step": 39181, "epoch": 329, "lr": 4.2863923977418556e-05} +{"train_loss": 0.0016633406048640609, "global_step": 39182, "epoch": 329, "lr": 4.2861731155223864e-05} +{"train_loss": 0.002788258483633399, "global_step": 39183, "epoch": 329, "lr": 4.285953834704439e-05} +{"train_loss": 0.0023749605752527714, "global_step": 39184, "epoch": 329, "lr": 4.2857345552884456e-05} +{"train_loss": 0.0017245231429114938, "global_step": 39185, "epoch": 329, "lr": 4.2855152772748345e-05} +{"train_loss": 0.0017502406844869256, "global_step": 39186, "epoch": 329, "lr": 4.28529600066404e-05} +{"train_loss": 0.0018472992815077305, "global_step": 39187, "epoch": 329, "lr": 4.2850767254564886e-05} +{"train_loss": 0.0016263601137325168, "global_step": 39188, "epoch": 329, "lr": 4.284857451652614e-05} +{"train_loss": 0.0018980109598487616, "global_step": 39189, "epoch": 329, "lr": 4.284638179252845e-05} +{"train_loss": 0.0021230680868029594, "global_step": 39190, "epoch": 329, "lr": 4.2844189082576126e-05} +{"train_loss": 0.0017707711085677147, "global_step": 39191, "epoch": 329, "lr": 4.2841996386673464e-05} +{"train_loss": 0.0033270271960645914, "global_step": 39192, "epoch": 329, "lr": 4.2839803704824787e-05} +{"train_loss": 0.0014733623247593641, "global_step": 39193, "epoch": 329, "lr": 4.283761103703439e-05} +{"train_loss": 0.002380657009780407, "global_step": 39194, "epoch": 329, "lr": 4.283541838330657e-05} +{"train_loss": 0.0022368119098246098, "global_step": 39195, "epoch": 329, "lr": 4.283322574364564e-05} +{"train_loss": 0.0012592487037181854, "global_step": 39196, "epoch": 329, "lr": 4.283103311805593e-05} +{"train_loss": 0.002638074103742838, "global_step": 39197, "epoch": 329, "lr": 4.282884050654169e-05} +{"train_loss": 0.0010239335242658854, "global_step": 39198, "epoch": 329, "lr": 4.282664790910728e-05} +{"train_loss": 0.001082034781575203, "global_step": 39199, "epoch": 329, "lr": 4.282445532575696e-05} +{"train_loss": 0.0021731783635914326, "global_step": 39200, "epoch": 329, "lr": 4.282226275649507e-05} +{"train_loss": 0.001896448084153235, "global_step": 39201, "epoch": 329, "lr": 4.28200702013259e-05} +{"train_loss": 0.0012683874228969216, "global_step": 39202, "epoch": 329, "lr": 4.281787766025374e-05} +{"train_loss": 0.0022181575186550617, "global_step": 39203, "epoch": 329, "lr": 4.281568513328293e-05} +{"train_loss": 0.0014345558593049645, "global_step": 39204, "epoch": 329, "lr": 4.2813492620417736e-05} +{"train_loss": 0.0016798082506284118, "global_step": 39205, "epoch": 329, "lr": 4.2811300121662494e-05} +{"train_loss": 0.002744044177234173, "global_step": 39206, "epoch": 329, "lr": 4.2809107637021484e-05} +{"train_loss": 0.0024427734315395355, "global_step": 39207, "epoch": 329, "lr": 4.2806915166499036e-05} +{"train_loss": 0.0019981693476438522, "global_step": 39208, "epoch": 329, "lr": 4.280472271009944e-05} +{"train_loss": 0.0013205636059865355, "global_step": 39209, "epoch": 329, "lr": 4.2802530267827e-05} +{"train_loss": 0.0024240848142653704, "global_step": 39210, "epoch": 329, "lr": 4.280033783968602e-05} +{"train_loss": 0.002384306164458394, "global_step": 39211, "epoch": 329, "lr": 4.2798145425680794e-05} +{"train_loss": 0.002687415573745966, "global_step": 39212, "epoch": 329, "lr": 4.2795953025815667e-05} +{"train_loss": 0.002803462790325284, "global_step": 39213, "epoch": 329, "lr": 4.2793760640094884e-05} +{"train_loss": 0.0012335211504250765, "global_step": 39214, "epoch": 329, "lr": 4.279156826852282e-05} +{"train_loss": 0.00217898259870708, "global_step": 39215, "epoch": 329, "lr": 4.278937591110374e-05} +{"train_loss": 0.0010267427423968911, "global_step": 39216, "epoch": 329, "lr": 4.278718356784191e-05} +{"train_loss": 0.0016189790330827236, "global_step": 39217, "epoch": 329, "lr": 4.278499123874171e-05} +{"train_loss": 0.002720448188483715, "global_step": 39218, "epoch": 329, "lr": 4.278279892380739e-05} +{"train_loss": 0.0012676753103733063, "global_step": 39219, "epoch": 329, "lr": 4.278060662304329e-05} +{"train_loss": 0.0008558142581023276, "global_step": 39220, "epoch": 329, "lr": 4.27784143364537e-05} +{"train_loss": 0.0013852114789187908, "global_step": 39221, "epoch": 329, "lr": 4.27762220640429e-05} +{"train_loss": 0.0013194683706387877, "global_step": 39222, "epoch": 329, "lr": 4.277402980581523e-05} +{"train_loss": 0.0018586250953376293, "global_step": 39223, "epoch": 329, "lr": 4.277183756177497e-05} +{"train_loss": 0.001905681099742651, "global_step": 39224, "epoch": 329, "lr": 4.2769645331926436e-05} +{"train_loss": 0.0018204267835244536, "global_step": 39225, "epoch": 329, "lr": 4.2767453116273946e-05} +{"train_loss": 0.002179789124056697, "global_step": 39226, "epoch": 329, "lr": 4.276526091482177e-05} +{"train_loss": 0.0032115518115460873, "global_step": 39227, "epoch": 329, "lr": 4.2763068727574254e-05} +{"train_loss": 0.002298804698511958, "global_step": 39228, "epoch": 329, "lr": 4.276087655453566e-05} +{"train_loss": 0.0027127256616950035, "global_step": 39229, "epoch": 329, "lr": 4.2758684395710324e-05} +{"train_loss": 0.002017553197219968, "global_step": 39230, "epoch": 329, "lr": 4.275649225110252e-05} +{"train_loss": 0.0024213148280978203, "global_step": 39231, "epoch": 329, "lr": 4.275430012071659e-05} +{"train_loss": 0.0012864088639616966, "global_step": 39232, "epoch": 329, "lr": 4.27521080045568e-05} +{"train_loss": 0.002306134905666113, "global_step": 39233, "epoch": 329, "lr": 4.274991590262749e-05} +{"train_loss": 0.0017189586069434881, "global_step": 39234, "epoch": 329, "lr": 4.274772381493295e-05} +{"train_loss": 0.0008472023764625192, "global_step": 39235, "epoch": 329, "lr": 4.2745531741477454e-05} +{"train_loss": 0.0023051192983984947, "global_step": 39236, "epoch": 329, "lr": 4.274333968226535e-05} +{"train_loss": 0.0013803646434098482, "global_step": 39237, "epoch": 329, "lr": 4.2741147637300906e-05} +{"train_loss": 0.0025803102180361748, "global_step": 39238, "epoch": 329, "lr": 4.273895560658846e-05} +{"train_loss": 0.001285783713683486, "global_step": 39239, "epoch": 329, "lr": 4.273676359013229e-05} +{"train_loss": 0.001332588610239327, "global_step": 39240, "epoch": 329, "lr": 4.273457158793671e-05} +{"train_loss": 0.0028929642867296934, "global_step": 39241, "epoch": 329, "lr": 4.273237960000602e-05} +{"train_loss": 0.0008434029878117144, "global_step": 39242, "epoch": 329, "lr": 4.2730187626344534e-05} +{"train_loss": 0.0015651962021365762, "global_step": 39243, "epoch": 329, "lr": 4.272799566695654e-05} +{"train_loss": 0.0015470178332179785, "global_step": 39244, "epoch": 329, "lr": 4.2725803721846355e-05} +{"train_loss": 0.001169017399661243, "global_step": 39245, "epoch": 329, "lr": 4.2723611791018274e-05} +{"train_loss": 0.0011517140083014965, "global_step": 39246, "epoch": 329, "lr": 4.272141987447662e-05} +{"train_loss": 0.001130365184508264, "global_step": 39247, "epoch": 329, "lr": 4.271922797222565e-05} +{"train_loss": 0.0018936574924737215, "global_step": 39248, "epoch": 329, "lr": 4.2717036084269725e-05} +{"train_loss": 0.0011944822035729885, "global_step": 39249, "epoch": 329, "lr": 4.2714844210613096e-05} +{"train_loss": 0.0012215611059218645, "global_step": 39250, "epoch": 329, "lr": 4.2712652351260115e-05} +{"train_loss": 0.002845261711627245, "global_step": 39251, "epoch": 329, "lr": 4.2710460506215066e-05} +{"train_loss": 0.0024789045564830303, "global_step": 39252, "epoch": 329, "lr": 4.2708268675482224e-05} +{"train_loss": 0.0017386568943038583, "global_step": 39253, "epoch": 329, "lr": 4.270607685906595e-05} +{"train_loss": 0.001484746695496142, "global_step": 39254, "epoch": 329, "lr": 4.2703885056970476e-05} +{"train_loss": 0.0009608193067833781, "global_step": 39255, "epoch": 329, "lr": 4.2701693269200175e-05} +{"train_loss": 0.0013262236025184393, "global_step": 39256, "epoch": 329, "lr": 4.26995014957593e-05} +{"train_loss": 0.0021923359017819166, "global_step": 39257, "epoch": 329, "lr": 4.2697309736652194e-05} +{"train_loss": 0.0022125584073364735, "global_step": 39258, "epoch": 329, "lr": 4.269511799188312e-05} +{"train_loss": 0.0008627987699583173, "global_step": 39259, "epoch": 329, "lr": 4.2692926261456415e-05} +{"train_loss": 0.0010558561189100146, "global_step": 39260, "epoch": 329, "lr": 4.269073454537636e-05} +{"train_loss": 0.0015546082286164165, "global_step": 39261, "epoch": 329, "lr": 4.268854284364725e-05} +{"train_loss": 0.000879238941706717, "global_step": 39262, "epoch": 329, "lr": 4.268635115627344e-05} +{"train_loss": 0.00264820852316916, "global_step": 39263, "epoch": 329, "lr": 4.268415948325917e-05} +{"train_loss": 0.00195248459931463, "global_step": 39264, "epoch": 329, "lr": 4.26819678246088e-05} +{"train_loss": 0.0013529520947486162, "global_step": 39265, "epoch": 329, "lr": 4.26797761803266e-05} +{"train_loss": 0.0017189980717375875, "global_step": 39266, "epoch": 329, "lr": 4.267758455041685e-05} +{"train_loss": 0.001190934213809669, "global_step": 39267, "epoch": 329, "lr": 4.2675392934883904e-05} +{"train_loss": 0.0017181189032271504, "global_step": 39268, "epoch": 329, "lr": 4.2673201333732024e-05} +{"train_loss": 0.0018046207333711453, "global_step": 39269, "epoch": 329, "lr": 4.2671009746965556e-05, "val_loss": 0.008023208938539028} +{"train_loss": 0.0017574565717950463, "global_step": 39270, "epoch": 330, "lr": 4.266881817458877e-05} +{"train_loss": 0.002970207016915083, "global_step": 39271, "epoch": 330, "lr": 4.266662661660596e-05} +{"train_loss": 0.001684775692410767, "global_step": 39272, "epoch": 330, "lr": 4.2664435073021464e-05} +{"train_loss": 0.0018663047812879086, "global_step": 39273, "epoch": 330, "lr": 4.266224354383954e-05} +{"train_loss": 0.0016686732415109873, "global_step": 39274, "epoch": 330, "lr": 4.266005202906454e-05} +{"train_loss": 0.0008601379231549799, "global_step": 39275, "epoch": 330, "lr": 4.265786052870073e-05} +{"train_loss": 0.002370267640799284, "global_step": 39276, "epoch": 330, "lr": 4.265566904275243e-05} +{"train_loss": 0.0022484485525637865, "global_step": 39277, "epoch": 330, "lr": 4.2653477571223954e-05} +{"train_loss": 0.0013973192544654012, "global_step": 39278, "epoch": 330, "lr": 4.265128611411957e-05} +{"train_loss": 0.0011391433654353023, "global_step": 39279, "epoch": 330, "lr": 4.2649094671443615e-05} +{"train_loss": 0.0006887068739160895, "global_step": 39280, "epoch": 330, "lr": 4.264690324320035e-05} +{"train_loss": 0.0020054862834513187, "global_step": 39281, "epoch": 330, "lr": 4.264471182939414e-05} +{"train_loss": 0.0010875245789065957, "global_step": 39282, "epoch": 330, "lr": 4.2642520430029234e-05} +{"train_loss": 0.0018371765036135912, "global_step": 39283, "epoch": 330, "lr": 4.2640329045109964e-05} +{"train_loss": 0.0016215489013120532, "global_step": 39284, "epoch": 330, "lr": 4.263813767464062e-05} +{"train_loss": 0.0017717186128720641, "global_step": 39285, "epoch": 330, "lr": 4.263594631862549e-05} +{"train_loss": 0.003401370020583272, "global_step": 39286, "epoch": 330, "lr": 4.2633754977068916e-05} +{"train_loss": 0.002907694550231099, "global_step": 39287, "epoch": 330, "lr": 4.2631563649975156e-05} +{"train_loss": 0.001717588515020907, "global_step": 39288, "epoch": 330, "lr": 4.262937233734855e-05} +{"train_loss": 0.0016867431113496423, "global_step": 39289, "epoch": 330, "lr": 4.262718103919338e-05} +{"train_loss": 0.0018639317713677883, "global_step": 39290, "epoch": 330, "lr": 4.262498975551395e-05} +{"train_loss": 0.001564083737321198, "global_step": 39291, "epoch": 330, "lr": 4.262279848631456e-05} +{"train_loss": 0.0020759578328579664, "global_step": 39292, "epoch": 330, "lr": 4.262060723159952e-05} +{"train_loss": 0.0021013787481933832, "global_step": 39293, "epoch": 330, "lr": 4.261841599137312e-05} +{"train_loss": 0.0022558248601853848, "global_step": 39294, "epoch": 330, "lr": 4.261622476563969e-05} +{"train_loss": 0.0009672187152318656, "global_step": 39295, "epoch": 330, "lr": 4.26140335544035e-05} +{"train_loss": 0.001758027938194573, "global_step": 39296, "epoch": 330, "lr": 4.261184235766888e-05} +{"train_loss": 0.0018768543377518654, "global_step": 39297, "epoch": 330, "lr": 4.26096511754401e-05} +{"train_loss": 0.0019174256594851613, "global_step": 39298, "epoch": 330, "lr": 4.26074600077215e-05} +{"train_loss": 0.0020698767621070147, "global_step": 39299, "epoch": 330, "lr": 4.260526885451734e-05} +{"train_loss": 0.0020981221459805965, "global_step": 39300, "epoch": 330, "lr": 4.260307771583197e-05} +{"train_loss": 0.0018907657358795404, "global_step": 39301, "epoch": 330, "lr": 4.260088659166964e-05} +{"train_loss": 0.0011722348863258958, "global_step": 39302, "epoch": 330, "lr": 4.25986954820347e-05} +{"train_loss": 0.0016122342785820365, "global_step": 39303, "epoch": 330, "lr": 4.2596504386931436e-05} +{"train_loss": 0.0016629326855763793, "global_step": 39304, "epoch": 330, "lr": 4.259431330636412e-05} +{"train_loss": 0.0011472818441689014, "global_step": 39305, "epoch": 330, "lr": 4.25921222403371e-05} +{"train_loss": 0.0018488401547074318, "global_step": 39306, "epoch": 330, "lr": 4.258993118885464e-05} +{"train_loss": 0.0027871420606970787, "global_step": 39307, "epoch": 330, "lr": 4.2587740151921066e-05} +{"train_loss": 0.0016289671184495091, "global_step": 39308, "epoch": 330, "lr": 4.2585549129540674e-05} +{"train_loss": 0.0023154080845415592, "global_step": 39309, "epoch": 330, "lr": 4.2583358121717755e-05} +{"train_loss": 0.001751244068145752, "global_step": 39310, "epoch": 330, "lr": 4.2581167128456634e-05} +{"train_loss": 0.0028849979862570763, "global_step": 39311, "epoch": 330, "lr": 4.257897614976158e-05} +{"train_loss": 0.00312464265152812, "global_step": 39312, "epoch": 330, "lr": 4.2576785185636934e-05} +{"train_loss": 0.0015013228403404355, "global_step": 39313, "epoch": 330, "lr": 4.2574594236086955e-05} +{"train_loss": 0.002128549851477146, "global_step": 39314, "epoch": 330, "lr": 4.257240330111599e-05} +{"train_loss": 0.002275566104799509, "global_step": 39315, "epoch": 330, "lr": 4.257021238072832e-05} +{"train_loss": 0.0024541388265788555, "global_step": 39316, "epoch": 330, "lr": 4.256802147492822e-05} +{"train_loss": 0.002445928053930402, "global_step": 39317, "epoch": 330, "lr": 4.256583058372004e-05} +{"train_loss": 0.0015355661744251847, "global_step": 39318, "epoch": 330, "lr": 4.256363970710803e-05} +{"train_loss": 0.0015636307653039694, "global_step": 39319, "epoch": 330, "lr": 4.256144884509655e-05} +{"train_loss": 0.0019637695513665676, "global_step": 39320, "epoch": 330, "lr": 4.255925799768986e-05} +{"train_loss": 0.0011087451130151749, "global_step": 39321, "epoch": 330, "lr": 4.255706716489226e-05} +{"train_loss": 0.002665875246748328, "global_step": 39322, "epoch": 330, "lr": 4.2554876346708064e-05} +{"train_loss": 0.0018478555139154196, "global_step": 39323, "epoch": 330, "lr": 4.255268554314158e-05} +{"train_loss": 0.0007340908632613719, "global_step": 39324, "epoch": 330, "lr": 4.25504947541971e-05} +{"train_loss": 0.0017990098567679524, "global_step": 39325, "epoch": 330, "lr": 4.2548303979878934e-05} +{"train_loss": 0.0016722220461815596, "global_step": 39326, "epoch": 330, "lr": 4.254611322019137e-05} +{"train_loss": 0.002479923190549016, "global_step": 39327, "epoch": 330, "lr": 4.2543922475138725e-05} +{"train_loss": 0.00101715256460011, "global_step": 39328, "epoch": 330, "lr": 4.254173174472528e-05} +{"train_loss": 0.002621928695589304, "global_step": 39329, "epoch": 330, "lr": 4.253954102895536e-05} +{"train_loss": 0.002206510631367564, "global_step": 39330, "epoch": 330, "lr": 4.253735032783323e-05} +{"train_loss": 0.0024021691642701626, "global_step": 39331, "epoch": 330, "lr": 4.253515964136325e-05} +{"train_loss": 0.0018554385751485825, "global_step": 39332, "epoch": 330, "lr": 4.2532968969549656e-05} +{"train_loss": 0.001889251172542572, "global_step": 39333, "epoch": 330, "lr": 4.25307783123968e-05} +{"train_loss": 0.0013954357709735632, "global_step": 39334, "epoch": 330, "lr": 4.252858766990897e-05} +{"train_loss": 0.0031137329060584307, "global_step": 39335, "epoch": 330, "lr": 4.2526397042090434e-05} +{"train_loss": 0.0016853648703545332, "global_step": 39336, "epoch": 330, "lr": 4.252420642894554e-05} +{"train_loss": 0.0010284802410751581, "global_step": 39337, "epoch": 330, "lr": 4.252201583047855e-05} +{"train_loss": 0.001593823079019785, "global_step": 39338, "epoch": 330, "lr": 4.25198252466938e-05} +{"train_loss": 0.0021106060594320297, "global_step": 39339, "epoch": 330, "lr": 4.251763467759556e-05} +{"train_loss": 0.0018305868143215775, "global_step": 39340, "epoch": 330, "lr": 4.251544412318815e-05} +{"train_loss": 0.0009079038281925023, "global_step": 39341, "epoch": 330, "lr": 4.2513253583475864e-05} +{"train_loss": 0.0016527078114449978, "global_step": 39342, "epoch": 330, "lr": 4.2511063058463006e-05} +{"train_loss": 0.0019462114432826638, "global_step": 39343, "epoch": 330, "lr": 4.2508872548153874e-05} +{"train_loss": 0.0021223374642431736, "global_step": 39344, "epoch": 330, "lr": 4.250668205255277e-05} +{"train_loss": 0.0023120110854506493, "global_step": 39345, "epoch": 330, "lr": 4.250449157166401e-05} +{"train_loss": 0.0012777817901223898, "global_step": 39346, "epoch": 330, "lr": 4.250230110549188e-05} +{"train_loss": 0.0029490410815924406, "global_step": 39347, "epoch": 330, "lr": 4.2500110654040655e-05} +{"train_loss": 0.0010422380873933434, "global_step": 39348, "epoch": 330, "lr": 4.2497920217314685e-05} +{"train_loss": 0.0010521324584260583, "global_step": 39349, "epoch": 330, "lr": 4.2495729795318225e-05} +{"train_loss": 0.0023136038798838854, "global_step": 39350, "epoch": 330, "lr": 4.249353938805562e-05} +{"train_loss": 0.002278008032590151, "global_step": 39351, "epoch": 330, "lr": 4.249134899553113e-05} +{"train_loss": 0.001997490180656314, "global_step": 39352, "epoch": 330, "lr": 4.248915861774909e-05} +{"train_loss": 0.0010412093251943588, "global_step": 39353, "epoch": 330, "lr": 4.2486968254713786e-05} +{"train_loss": 0.0030976668931543827, "global_step": 39354, "epoch": 330, "lr": 4.24847779064295e-05} +{"train_loss": 0.0014379500644281507, "global_step": 39355, "epoch": 330, "lr": 4.248258757290057e-05} +{"train_loss": 0.0012312852777540684, "global_step": 39356, "epoch": 330, "lr": 4.2480397254131256e-05} +{"train_loss": 0.00208448339253664, "global_step": 39357, "epoch": 330, "lr": 4.247820695012589e-05} +{"train_loss": 0.001804468920454383, "global_step": 39358, "epoch": 330, "lr": 4.2476016660888765e-05} +{"train_loss": 0.0016970012802630663, "global_step": 39359, "epoch": 330, "lr": 4.247382638642416e-05} +{"train_loss": 0.0015846517635509372, "global_step": 39360, "epoch": 330, "lr": 4.247163612673641e-05} +{"train_loss": 0.0012832473730668426, "global_step": 39361, "epoch": 330, "lr": 4.2469445881829786e-05} +{"train_loss": 0.003610794898122549, "global_step": 39362, "epoch": 330, "lr": 4.2467255651708616e-05} +{"train_loss": 0.0015049425419420004, "global_step": 39363, "epoch": 330, "lr": 4.246506543637716e-05} +{"train_loss": 0.0015846147434785962, "global_step": 39364, "epoch": 330, "lr": 4.246287523583977e-05} +{"train_loss": 0.0019241656409576535, "global_step": 39365, "epoch": 330, "lr": 4.2460685050100715e-05} +{"train_loss": 0.0025679597165435553, "global_step": 39366, "epoch": 330, "lr": 4.2458494879164285e-05} +{"train_loss": 0.002077685669064522, "global_step": 39367, "epoch": 330, "lr": 4.245630472303481e-05} +{"train_loss": 0.0008986404864117503, "global_step": 39368, "epoch": 330, "lr": 4.2454114581716555e-05} +{"train_loss": 0.004708831198513508, "global_step": 39369, "epoch": 330, "lr": 4.245192445521387e-05} +{"train_loss": 0.0014554659137502313, "global_step": 39370, "epoch": 330, "lr": 4.244973434353101e-05} +{"train_loss": 0.002125381724908948, "global_step": 39371, "epoch": 330, "lr": 4.2447544246672274e-05} +{"train_loss": 0.0016920348862186074, "global_step": 39372, "epoch": 330, "lr": 4.244535416464199e-05} +{"train_loss": 0.001467163790948689, "global_step": 39373, "epoch": 330, "lr": 4.244316409744444e-05} +{"train_loss": 0.0020040012896060944, "global_step": 39374, "epoch": 330, "lr": 4.2440974045083936e-05} +{"train_loss": 0.0015068623470142484, "global_step": 39375, "epoch": 330, "lr": 4.243878400756478e-05} +{"train_loss": 0.003280100878328085, "global_step": 39376, "epoch": 330, "lr": 4.2436593984891246e-05} +{"train_loss": 0.0016631109174340963, "global_step": 39377, "epoch": 330, "lr": 4.243440397706768e-05} +{"train_loss": 0.0030077011324465275, "global_step": 39378, "epoch": 330, "lr": 4.243221398409832e-05} +{"train_loss": 0.002861019689589739, "global_step": 39379, "epoch": 330, "lr": 4.2430024005987524e-05} +{"train_loss": 0.0025801127776503563, "global_step": 39380, "epoch": 330, "lr": 4.242783404273955e-05} +{"train_loss": 0.0015029769856482744, "global_step": 39381, "epoch": 330, "lr": 4.242564409435873e-05} +{"train_loss": 0.0012166679371148348, "global_step": 39382, "epoch": 330, "lr": 4.242345416084933e-05} +{"train_loss": 0.0015198325272649527, "global_step": 39383, "epoch": 330, "lr": 4.2421264242215686e-05} +{"train_loss": 0.002970858011394739, "global_step": 39384, "epoch": 330, "lr": 4.2419074338462084e-05} +{"train_loss": 0.0030249119736254215, "global_step": 39385, "epoch": 330, "lr": 4.2416884449592796e-05} +{"train_loss": 0.0027920370921492577, "global_step": 39386, "epoch": 330, "lr": 4.241469457561217e-05} +{"train_loss": 0.0018438431434333324, "global_step": 39387, "epoch": 330, "lr": 4.241250471652446e-05} +{"train_loss": 0.0019348604729821702, "global_step": 39388, "epoch": 330, "lr": 4.2410314872334005e-05, "val_loss": 0.02750237286090851, "train_action_mse_error": 3.2123527489602566e-05} +{"train_loss": 0.0024170230608433485, "global_step": 39389, "epoch": 331, "lr": 4.2408125043045076e-05} +{"train_loss": 0.0019935648888349533, "global_step": 39390, "epoch": 331, "lr": 4.240593522866199e-05} +{"train_loss": 0.002459523733705282, "global_step": 39391, "epoch": 331, "lr": 4.2403745429189025e-05} +{"train_loss": 0.0024556582793593407, "global_step": 39392, "epoch": 331, "lr": 4.240155564463049e-05} +{"train_loss": 0.0020347698591649532, "global_step": 39393, "epoch": 331, "lr": 4.239936587499071e-05} +{"train_loss": 0.0018108573276549578, "global_step": 39394, "epoch": 331, "lr": 4.239717612027394e-05} +{"train_loss": 0.00236045615747571, "global_step": 39395, "epoch": 331, "lr": 4.239498638048453e-05} +{"train_loss": 0.0014726610388606787, "global_step": 39396, "epoch": 331, "lr": 4.2392796655626745e-05} +{"train_loss": 0.0030067877378314734, "global_step": 39397, "epoch": 331, "lr": 4.239060694570487e-05} +{"train_loss": 0.0015794209903106093, "global_step": 39398, "epoch": 331, "lr": 4.2388417250723245e-05} +{"train_loss": 0.0024686483666300774, "global_step": 39399, "epoch": 331, "lr": 4.2386227570686136e-05} +{"train_loss": 0.0010395869612693787, "global_step": 39400, "epoch": 331, "lr": 4.238403790559787e-05} +{"train_loss": 0.0016680917469784617, "global_step": 39401, "epoch": 331, "lr": 4.238184825546272e-05} +{"train_loss": 0.002037367317825556, "global_step": 39402, "epoch": 331, "lr": 4.237965862028501e-05} +{"train_loss": 0.0021270678844302893, "global_step": 39403, "epoch": 331, "lr": 4.2377469000069024e-05} +{"train_loss": 0.0011941343545913696, "global_step": 39404, "epoch": 331, "lr": 4.237527939481905e-05} +{"train_loss": 0.0012004958698526025, "global_step": 39405, "epoch": 331, "lr": 4.237308980453941e-05} +{"train_loss": 0.002519455971196294, "global_step": 39406, "epoch": 331, "lr": 4.237090022923438e-05} +{"train_loss": 0.0014182132435962558, "global_step": 39407, "epoch": 331, "lr": 4.236871066890828e-05} +{"train_loss": 0.0022528613917529583, "global_step": 39408, "epoch": 331, "lr": 4.2366521123565416e-05} +{"train_loss": 0.0012710621813312173, "global_step": 39409, "epoch": 331, "lr": 4.236433159321005e-05} +{"train_loss": 0.0019570353906601667, "global_step": 39410, "epoch": 331, "lr": 4.236214207784653e-05} +{"train_loss": 0.001464189263060689, "global_step": 39411, "epoch": 331, "lr": 4.23599525774791e-05} +{"train_loss": 0.0017610084032639861, "global_step": 39412, "epoch": 331, "lr": 4.2357763092112104e-05} +{"train_loss": 0.0018223179504275322, "global_step": 39413, "epoch": 331, "lr": 4.2355573621749814e-05} +{"train_loss": 0.0033423358108848333, "global_step": 39414, "epoch": 331, "lr": 4.235338416639655e-05} +{"train_loss": 0.0016576239140704274, "global_step": 39415, "epoch": 331, "lr": 4.2351194726056604e-05} +{"train_loss": 0.0024084520991891623, "global_step": 39416, "epoch": 331, "lr": 4.234900530073425e-05} +{"train_loss": 0.0023994562216103077, "global_step": 39417, "epoch": 331, "lr": 4.2346815890433825e-05} +{"train_loss": 0.001373597769998014, "global_step": 39418, "epoch": 331, "lr": 4.234462649515958e-05} +{"train_loss": 0.001150767900981009, "global_step": 39419, "epoch": 331, "lr": 4.234243711491588e-05} +{"train_loss": 0.004500159528106451, "global_step": 39420, "epoch": 331, "lr": 4.234024774970695e-05} +{"train_loss": 0.0021026208996772766, "global_step": 39421, "epoch": 331, "lr": 4.233805839953715e-05} +{"train_loss": 0.002197242807596922, "global_step": 39422, "epoch": 331, "lr": 4.2335869064410754e-05} +{"train_loss": 0.0015772831393405795, "global_step": 39423, "epoch": 331, "lr": 4.233367974433205e-05} +{"train_loss": 0.002731123473495245, "global_step": 39424, "epoch": 331, "lr": 4.2331490439305356e-05} +{"train_loss": 0.002621913095936179, "global_step": 39425, "epoch": 331, "lr": 4.2329301149334955e-05} +{"train_loss": 0.0019698068499565125, "global_step": 39426, "epoch": 331, "lr": 4.232711187442515e-05} +{"train_loss": 0.0027082739397883415, "global_step": 39427, "epoch": 331, "lr": 4.232492261458026e-05} +{"train_loss": 0.0014714192366227508, "global_step": 39428, "epoch": 331, "lr": 4.232273336980453e-05} +{"train_loss": 0.0019341313745826483, "global_step": 39429, "epoch": 331, "lr": 4.232054414010232e-05} +{"train_loss": 0.0018455834360793233, "global_step": 39430, "epoch": 331, "lr": 4.231835492547789e-05} +{"train_loss": 0.001955368323251605, "global_step": 39431, "epoch": 331, "lr": 4.231616572593556e-05} +{"train_loss": 0.0027742621023207903, "global_step": 39432, "epoch": 331, "lr": 4.23139765414796e-05} +{"train_loss": 0.0010507437400519848, "global_step": 39433, "epoch": 331, "lr": 4.231178737211434e-05} +{"train_loss": 0.0021768747828900814, "global_step": 39434, "epoch": 331, "lr": 4.2309598217844074e-05} +{"train_loss": 0.0021417555399239063, "global_step": 39435, "epoch": 331, "lr": 4.230740907867306e-05} +{"train_loss": 0.0023453636094927788, "global_step": 39436, "epoch": 331, "lr": 4.230521995460566e-05} +{"train_loss": 0.0016981344670057297, "global_step": 39437, "epoch": 331, "lr": 4.230303084564611e-05} +{"train_loss": 0.0016251804772764444, "global_step": 39438, "epoch": 331, "lr": 4.230084175179876e-05} +{"train_loss": 0.00329257152043283, "global_step": 39439, "epoch": 331, "lr": 4.229865267306787e-05} +{"train_loss": 0.0018342577386647463, "global_step": 39440, "epoch": 331, "lr": 4.229646360945775e-05} +{"train_loss": 0.0023480611853301525, "global_step": 39441, "epoch": 331, "lr": 4.229427456097271e-05} +{"train_loss": 0.0018363511189818382, "global_step": 39442, "epoch": 331, "lr": 4.229208552761702e-05} +{"train_loss": 0.0019897716119885445, "global_step": 39443, "epoch": 331, "lr": 4.228989650939502e-05} +{"train_loss": 0.0019380019512027502, "global_step": 39444, "epoch": 331, "lr": 4.228770750631097e-05} +{"train_loss": 0.001995918806642294, "global_step": 39445, "epoch": 331, "lr": 4.228551851836919e-05} +{"train_loss": 0.00406797556206584, "global_step": 39446, "epoch": 331, "lr": 4.2283329545573984e-05} +{"train_loss": 0.0026436613406986, "global_step": 39447, "epoch": 331, "lr": 4.228114058792961e-05} +{"train_loss": 0.0019261948764324188, "global_step": 39448, "epoch": 331, "lr": 4.227895164544041e-05} +{"train_loss": 0.001346974866464734, "global_step": 39449, "epoch": 331, "lr": 4.227676271811065e-05} +{"train_loss": 0.0013904341030865908, "global_step": 39450, "epoch": 331, "lr": 4.227457380594465e-05} +{"train_loss": 0.0031568158883601427, "global_step": 39451, "epoch": 331, "lr": 4.227238490894669e-05} +{"train_loss": 0.0013402880867943168, "global_step": 39452, "epoch": 331, "lr": 4.227019602712109e-05} +{"train_loss": 0.0026772315613925457, "global_step": 39453, "epoch": 331, "lr": 4.2268007160472135e-05} +{"train_loss": 0.002869266550987959, "global_step": 39454, "epoch": 331, "lr": 4.2265818309004104e-05} +{"train_loss": 0.0020332317799329758, "global_step": 39455, "epoch": 331, "lr": 4.226362947272132e-05} +{"train_loss": 0.0023152069188654423, "global_step": 39456, "epoch": 331, "lr": 4.2261440651628075e-05} +{"train_loss": 0.0024599838070571423, "global_step": 39457, "epoch": 331, "lr": 4.225925184572866e-05} +{"train_loss": 0.0018859223928302526, "global_step": 39458, "epoch": 331, "lr": 4.22570630550274e-05} +{"train_loss": 0.0034017302095890045, "global_step": 39459, "epoch": 331, "lr": 4.225487427952854e-05} +{"train_loss": 0.00209942739456892, "global_step": 39460, "epoch": 331, "lr": 4.225268551923642e-05} +{"train_loss": 0.0012930394150316715, "global_step": 39461, "epoch": 331, "lr": 4.225049677415532e-05} +{"train_loss": 0.0010877774329856038, "global_step": 39462, "epoch": 331, "lr": 4.224830804428955e-05} +{"train_loss": 0.003476548008620739, "global_step": 39463, "epoch": 331, "lr": 4.2246119329643384e-05} +{"train_loss": 0.0014033929910510778, "global_step": 39464, "epoch": 331, "lr": 4.224393063022115e-05} +{"train_loss": 0.0014134044758975506, "global_step": 39465, "epoch": 331, "lr": 4.2241741946027136e-05} +{"train_loss": 0.002028412651270628, "global_step": 39466, "epoch": 331, "lr": 4.223955327706561e-05} +{"train_loss": 0.0020201820880174637, "global_step": 39467, "epoch": 331, "lr": 4.2237364623340915e-05} +{"train_loss": 0.0019161747768521309, "global_step": 39468, "epoch": 331, "lr": 4.22351759848573e-05} +{"train_loss": 0.0023988578468561172, "global_step": 39469, "epoch": 331, "lr": 4.2232987361619105e-05} +{"train_loss": 0.0018828186439350247, "global_step": 39470, "epoch": 331, "lr": 4.2230798753630594e-05} +{"train_loss": 0.0015783874550834298, "global_step": 39471, "epoch": 331, "lr": 4.2228610160896095e-05} +{"train_loss": 0.0017215259140357375, "global_step": 39472, "epoch": 331, "lr": 4.222642158341989e-05} +{"train_loss": 0.0023871916346251965, "global_step": 39473, "epoch": 331, "lr": 4.2224233021206274e-05} +{"train_loss": 0.0022404950577765703, "global_step": 39474, "epoch": 331, "lr": 4.222204447425954e-05} +{"train_loss": 0.0016920828493312001, "global_step": 39475, "epoch": 331, "lr": 4.221985594258399e-05} +{"train_loss": 0.0030572975520044565, "global_step": 39476, "epoch": 331, "lr": 4.2217667426183926e-05} +{"train_loss": 0.0018225442618131638, "global_step": 39477, "epoch": 331, "lr": 4.2215478925063644e-05} +{"train_loss": 0.0017934005009010434, "global_step": 39478, "epoch": 331, "lr": 4.221329043922743e-05} +{"train_loss": 0.002474418841302395, "global_step": 39479, "epoch": 331, "lr": 4.221110196867959e-05} +{"train_loss": 0.0016512534348294139, "global_step": 39480, "epoch": 331, "lr": 4.220891351342442e-05} +{"train_loss": 0.0023177252151072025, "global_step": 39481, "epoch": 331, "lr": 4.220672507346622e-05} +{"train_loss": 0.0028566208202391863, "global_step": 39482, "epoch": 331, "lr": 4.2204536648809264e-05} +{"train_loss": 0.0011642625322565436, "global_step": 39483, "epoch": 331, "lr": 4.2202348239457893e-05} +{"train_loss": 0.0022309867199510336, "global_step": 39484, "epoch": 331, "lr": 4.220015984541638e-05} +{"train_loss": 0.0018855435773730278, "global_step": 39485, "epoch": 331, "lr": 4.2197971466688996e-05} +{"train_loss": 0.0022056486923247576, "global_step": 39486, "epoch": 331, "lr": 4.219578310328008e-05} +{"train_loss": 0.0010371613316237926, "global_step": 39487, "epoch": 331, "lr": 4.2193594755193894e-05} +{"train_loss": 0.001933992258273065, "global_step": 39488, "epoch": 331, "lr": 4.219140642243477e-05} +{"train_loss": 0.00190680380910635, "global_step": 39489, "epoch": 331, "lr": 4.218921810500698e-05} +{"train_loss": 0.002086188644170761, "global_step": 39490, "epoch": 331, "lr": 4.21870298029148e-05} +{"train_loss": 0.0009113189298659563, "global_step": 39491, "epoch": 331, "lr": 4.218484151616259e-05} +{"train_loss": 0.0012945950729772449, "global_step": 39492, "epoch": 331, "lr": 4.218265324475458e-05} +{"train_loss": 0.0009323658305220306, "global_step": 39493, "epoch": 331, "lr": 4.218046498869511e-05} +{"train_loss": 0.0016074455343186855, "global_step": 39494, "epoch": 331, "lr": 4.2178276747988446e-05} +{"train_loss": 0.0013141795061528683, "global_step": 39495, "epoch": 331, "lr": 4.217608852263893e-05} +{"train_loss": 0.002297611441463232, "global_step": 39496, "epoch": 331, "lr": 4.217390031265082e-05} +{"train_loss": 0.0020690273959189653, "global_step": 39497, "epoch": 331, "lr": 4.21717121180284e-05} +{"train_loss": 0.0011317009339109063, "global_step": 39498, "epoch": 331, "lr": 4.216952393877601e-05} +{"train_loss": 0.0016744398744776845, "global_step": 39499, "epoch": 331, "lr": 4.21673357748979e-05} +{"train_loss": 0.002239500405266881, "global_step": 39500, "epoch": 331, "lr": 4.216514762639841e-05} +{"train_loss": 0.0025591375306248665, "global_step": 39501, "epoch": 331, "lr": 4.21629594932818e-05} +{"train_loss": 0.0013533438323065639, "global_step": 39502, "epoch": 331, "lr": 4.216077137555239e-05} +{"train_loss": 0.0012584691867232323, "global_step": 39503, "epoch": 331, "lr": 4.215858327321447e-05} +{"train_loss": 0.001254090340808034, "global_step": 39504, "epoch": 331, "lr": 4.2156395186272325e-05} +{"train_loss": 0.0017559718107804656, "global_step": 39505, "epoch": 331, "lr": 4.215420711473026e-05} +{"train_loss": 0.0017790759447962046, "global_step": 39506, "epoch": 331, "lr": 4.215201905859259e-05} +{"train_loss": 0.0020163885455680305, "global_step": 39507, "epoch": 331, "lr": 4.214983101786357e-05, "val_loss": 0.01610822044312954} +{"train_loss": 0.001534526702016592, "global_step": 39508, "epoch": 332, "lr": 4.214764299254754e-05} +{"train_loss": 0.0016979459905996919, "global_step": 39509, "epoch": 332, "lr": 4.214545498264875e-05} +{"train_loss": 0.0011218562722206116, "global_step": 39510, "epoch": 332, "lr": 4.2143266988171534e-05} +{"train_loss": 0.0015181557973846793, "global_step": 39511, "epoch": 332, "lr": 4.2141079009120164e-05} +{"train_loss": 0.0019266230519860983, "global_step": 39512, "epoch": 332, "lr": 4.2138891045498964e-05} +{"train_loss": 0.0016468401299789548, "global_step": 39513, "epoch": 332, "lr": 4.213670309731219e-05} +{"train_loss": 0.0011330817360430956, "global_step": 39514, "epoch": 332, "lr": 4.213451516456418e-05} +{"train_loss": 0.0011104311561211944, "global_step": 39515, "epoch": 332, "lr": 4.213232724725921e-05} +{"train_loss": 0.0014042293187230825, "global_step": 39516, "epoch": 332, "lr": 4.213013934540155e-05} +{"train_loss": 0.002720913849771023, "global_step": 39517, "epoch": 332, "lr": 4.212795145899554e-05} +{"train_loss": 0.0017856421181932092, "global_step": 39518, "epoch": 332, "lr": 4.212576358804544e-05} +{"train_loss": 0.0016978876665234566, "global_step": 39519, "epoch": 332, "lr": 4.212357573255558e-05} +{"train_loss": 0.0009365750011056662, "global_step": 39520, "epoch": 332, "lr": 4.212138789253022e-05} +{"train_loss": 0.002419819124042988, "global_step": 39521, "epoch": 332, "lr": 4.21192000679737e-05} +{"train_loss": 0.0013419087044894695, "global_step": 39522, "epoch": 332, "lr": 4.211701225889026e-05} +{"train_loss": 0.0015712775057181716, "global_step": 39523, "epoch": 332, "lr": 4.211482446528424e-05} +{"train_loss": 0.002833280013874173, "global_step": 39524, "epoch": 332, "lr": 4.2112636687159916e-05} +{"train_loss": 0.0010148201836273074, "global_step": 39525, "epoch": 332, "lr": 4.2110448924521575e-05} +{"train_loss": 0.0015967657091096044, "global_step": 39526, "epoch": 332, "lr": 4.210826117737355e-05} +{"train_loss": 0.0010592120233923197, "global_step": 39527, "epoch": 332, "lr": 4.210607344572011e-05} +{"train_loss": 0.0023217126727104187, "global_step": 39528, "epoch": 332, "lr": 4.2103885729565524e-05} +{"train_loss": 0.000974854570813477, "global_step": 39529, "epoch": 332, "lr": 4.210169802891414e-05} +{"train_loss": 0.001714825164526701, "global_step": 39530, "epoch": 332, "lr": 4.209951034377021e-05} +{"train_loss": 0.0012720212107524276, "global_step": 39531, "epoch": 332, "lr": 4.209732267413806e-05} +{"train_loss": 0.001399352797307074, "global_step": 39532, "epoch": 332, "lr": 4.209513502002196e-05} +{"train_loss": 0.0024268454872071743, "global_step": 39533, "epoch": 332, "lr": 4.209294738142624e-05} +{"train_loss": 0.0016382539179176092, "global_step": 39534, "epoch": 332, "lr": 4.209075975835517e-05} +{"train_loss": 0.0026434443425387144, "global_step": 39535, "epoch": 332, "lr": 4.208857215081302e-05} +{"train_loss": 0.0010407547233626246, "global_step": 39536, "epoch": 332, "lr": 4.208638455880414e-05} +{"train_loss": 0.002357532735913992, "global_step": 39537, "epoch": 332, "lr": 4.208419698233278e-05} +{"train_loss": 0.0017739314353093505, "global_step": 39538, "epoch": 332, "lr": 4.208200942140326e-05} +{"train_loss": 0.001219628844410181, "global_step": 39539, "epoch": 332, "lr": 4.207982187601988e-05} +{"train_loss": 0.002146851969882846, "global_step": 39540, "epoch": 332, "lr": 4.207763434618691e-05} +{"train_loss": 0.0024000098928809166, "global_step": 39541, "epoch": 332, "lr": 4.207544683190867e-05} +{"train_loss": 0.0016334598185494542, "global_step": 39542, "epoch": 332, "lr": 4.207325933318943e-05} +{"train_loss": 0.0010579269146546721, "global_step": 39543, "epoch": 332, "lr": 4.2071071850033516e-05} +{"train_loss": 0.0017929375171661377, "global_step": 39544, "epoch": 332, "lr": 4.2068884382445184e-05} +{"train_loss": 0.0009443701710551977, "global_step": 39545, "epoch": 332, "lr": 4.2066696930428766e-05} +{"train_loss": 0.0009670695872046053, "global_step": 39546, "epoch": 332, "lr": 4.2064509493988546e-05} +{"train_loss": 0.0014129114570096135, "global_step": 39547, "epoch": 332, "lr": 4.20623220731288e-05} +{"train_loss": 0.0032985589932650328, "global_step": 39548, "epoch": 332, "lr": 4.206013466785385e-05} +{"train_loss": 0.0013989645522087812, "global_step": 39549, "epoch": 332, "lr": 4.2057947278167956e-05} +{"train_loss": 0.0013190157478675246, "global_step": 39550, "epoch": 332, "lr": 4.205575990407545e-05} +{"train_loss": 0.002622639061883092, "global_step": 39551, "epoch": 332, "lr": 4.20535725455806e-05} +{"train_loss": 0.002379442797973752, "global_step": 39552, "epoch": 332, "lr": 4.205138520268773e-05} +{"train_loss": 0.0012303913244977593, "global_step": 39553, "epoch": 332, "lr": 4.2049197875401106e-05} +{"train_loss": 0.0031051302794367075, "global_step": 39554, "epoch": 332, "lr": 4.204701056372502e-05} +{"train_loss": 0.002281719818711281, "global_step": 39555, "epoch": 332, "lr": 4.204482326766379e-05} +{"train_loss": 0.0010499414056539536, "global_step": 39556, "epoch": 332, "lr": 4.20426359872217e-05} +{"train_loss": 0.0037981730420142412, "global_step": 39557, "epoch": 332, "lr": 4.204044872240304e-05} +{"train_loss": 0.00290649919770658, "global_step": 39558, "epoch": 332, "lr": 4.203826147321213e-05} +{"train_loss": 0.002274713246151805, "global_step": 39559, "epoch": 332, "lr": 4.203607423965321e-05} +{"train_loss": 0.0021033494267612696, "global_step": 39560, "epoch": 332, "lr": 4.203388702173063e-05} +{"train_loss": 0.003156001213937998, "global_step": 39561, "epoch": 332, "lr": 4.2031699819448645e-05} +{"train_loss": 0.0012384116416797042, "global_step": 39562, "epoch": 332, "lr": 4.202951263281159e-05} +{"train_loss": 0.0016719925915822387, "global_step": 39563, "epoch": 332, "lr": 4.2027325461823706e-05} +{"train_loss": 0.002525039715692401, "global_step": 39564, "epoch": 332, "lr": 4.202513830648934e-05} +{"train_loss": 0.0012332606129348278, "global_step": 39565, "epoch": 332, "lr": 4.2022951166812764e-05} +{"train_loss": 0.002540700137615204, "global_step": 39566, "epoch": 332, "lr": 4.202076404279825e-05} +{"train_loss": 0.0008504582801833749, "global_step": 39567, "epoch": 332, "lr": 4.201857693445014e-05} +{"train_loss": 0.002256623236462474, "global_step": 39568, "epoch": 332, "lr": 4.201638984177267e-05} +{"train_loss": 0.0009738694643601775, "global_step": 39569, "epoch": 332, "lr": 4.201420276477019e-05} +{"train_loss": 0.0009257893543690443, "global_step": 39570, "epoch": 332, "lr": 4.2012015703446956e-05} +{"train_loss": 0.0027352655306458473, "global_step": 39571, "epoch": 332, "lr": 4.2009828657807287e-05} +{"train_loss": 0.001616011606529355, "global_step": 39572, "epoch": 332, "lr": 4.200764162785547e-05} +{"train_loss": 0.004716539289802313, "global_step": 39573, "epoch": 332, "lr": 4.200545461359577e-05} +{"train_loss": 0.0024694439489394426, "global_step": 39574, "epoch": 332, "lr": 4.200326761503253e-05} +{"train_loss": 0.0016544657992199063, "global_step": 39575, "epoch": 332, "lr": 4.2001080632169995e-05} +{"train_loss": 0.0019215233623981476, "global_step": 39576, "epoch": 332, "lr": 4.199889366501251e-05} +{"train_loss": 0.0029015871696174145, "global_step": 39577, "epoch": 332, "lr": 4.1996706713564347e-05} +{"train_loss": 0.0032001580111682415, "global_step": 39578, "epoch": 332, "lr": 4.1994519777829764e-05} +{"train_loss": 0.0019806292839348316, "global_step": 39579, "epoch": 332, "lr": 4.199233285781311e-05} +{"train_loss": 0.0017466790741309524, "global_step": 39580, "epoch": 332, "lr": 4.199014595351864e-05} +{"train_loss": 0.0020301993936300278, "global_step": 39581, "epoch": 332, "lr": 4.1987959064950676e-05} +{"train_loss": 0.003211726201698184, "global_step": 39582, "epoch": 332, "lr": 4.198577219211348e-05} +{"train_loss": 0.0016892087878659368, "global_step": 39583, "epoch": 332, "lr": 4.198358533501139e-05} +{"train_loss": 0.0014722492778673768, "global_step": 39584, "epoch": 332, "lr": 4.198139849364867e-05} +{"train_loss": 0.0019742813892662525, "global_step": 39585, "epoch": 332, "lr": 4.197921166802959e-05} +{"train_loss": 0.002160992007702589, "global_step": 39586, "epoch": 332, "lr": 4.19770248581585e-05} +{"train_loss": 0.00200358172878623, "global_step": 39587, "epoch": 332, "lr": 4.197483806403965e-05} +{"train_loss": 0.001974927494302392, "global_step": 39588, "epoch": 332, "lr": 4.197265128567734e-05} +{"train_loss": 0.0024060835130512714, "global_step": 39589, "epoch": 332, "lr": 4.1970464523075895e-05} +{"train_loss": 0.002364289714023471, "global_step": 39590, "epoch": 332, "lr": 4.1968277776239566e-05} +{"train_loss": 0.0023061553947627544, "global_step": 39591, "epoch": 332, "lr": 4.196609104517269e-05} +{"train_loss": 0.0009620406781323254, "global_step": 39592, "epoch": 332, "lr": 4.19639043298795e-05} +{"train_loss": 0.001970551209524274, "global_step": 39593, "epoch": 332, "lr": 4.196171763036435e-05} +{"train_loss": 0.002003192435950041, "global_step": 39594, "epoch": 332, "lr": 4.195953094663149e-05} +{"train_loss": 0.001434089383110404, "global_step": 39595, "epoch": 332, "lr": 4.195734427868526e-05} +{"train_loss": 0.0032499623484909534, "global_step": 39596, "epoch": 332, "lr": 4.195515762652992e-05} +{"train_loss": 0.002803925657644868, "global_step": 39597, "epoch": 332, "lr": 4.1952970990169746e-05} +{"train_loss": 0.0018161149928346276, "global_step": 39598, "epoch": 332, "lr": 4.1950784369609075e-05} +{"train_loss": 0.002280142856761813, "global_step": 39599, "epoch": 332, "lr": 4.194859776485216e-05} +{"train_loss": 0.0029259591829031706, "global_step": 39600, "epoch": 332, "lr": 4.194641117590333e-05} +{"train_loss": 0.0021999143064022064, "global_step": 39601, "epoch": 332, "lr": 4.194422460276685e-05} +{"train_loss": 0.003619302297011018, "global_step": 39602, "epoch": 332, "lr": 4.1942038045447034e-05} +{"train_loss": 0.002818512497469783, "global_step": 39603, "epoch": 332, "lr": 4.1939851503948155e-05} +{"train_loss": 0.0021921368315815926, "global_step": 39604, "epoch": 332, "lr": 4.193766497827453e-05} +{"train_loss": 0.001648552599363029, "global_step": 39605, "epoch": 332, "lr": 4.193547846843042e-05} +{"train_loss": 0.0028568811248987913, "global_step": 39606, "epoch": 332, "lr": 4.193329197442015e-05} +{"train_loss": 0.0016419276362285018, "global_step": 39607, "epoch": 332, "lr": 4.1931105496248e-05} +{"train_loss": 0.002060951665043831, "global_step": 39608, "epoch": 332, "lr": 4.192891903391825e-05} +{"train_loss": 0.0010198462987318635, "global_step": 39609, "epoch": 332, "lr": 4.192673258743521e-05} +{"train_loss": 0.001898538670502603, "global_step": 39610, "epoch": 332, "lr": 4.192454615680319e-05} +{"train_loss": 0.0022723479196429253, "global_step": 39611, "epoch": 332, "lr": 4.192235974202643e-05} +{"train_loss": 0.0029909734148532152, "global_step": 39612, "epoch": 332, "lr": 4.192017334310927e-05} +{"train_loss": 0.0021041708532720804, "global_step": 39613, "epoch": 332, "lr": 4.191798696005598e-05} +{"train_loss": 0.0026279231533408165, "global_step": 39614, "epoch": 332, "lr": 4.191580059287087e-05} +{"train_loss": 0.0025577039923518896, "global_step": 39615, "epoch": 332, "lr": 4.191361424155822e-05} +{"train_loss": 0.0013012991985306144, "global_step": 39616, "epoch": 332, "lr": 4.1911427906122305e-05} +{"train_loss": 0.002673397772014141, "global_step": 39617, "epoch": 332, "lr": 4.190924158656746e-05} +{"train_loss": 0.0037298190873116255, "global_step": 39618, "epoch": 332, "lr": 4.190705528289793e-05} +{"train_loss": 0.0029065210837870836, "global_step": 39619, "epoch": 332, "lr": 4.190486899511806e-05} +{"train_loss": 0.0025902208872139454, "global_step": 39620, "epoch": 332, "lr": 4.1902682723232094e-05} +{"train_loss": 0.0025975359603762627, "global_step": 39621, "epoch": 332, "lr": 4.1900496467244365e-05} +{"train_loss": 0.0029226166661828756, "global_step": 39622, "epoch": 332, "lr": 4.189831022715913e-05} +{"train_loss": 0.0023611055221408606, "global_step": 39623, "epoch": 332, "lr": 4.189612400298069e-05} +{"train_loss": 0.0015084270853549242, "global_step": 39624, "epoch": 332, "lr": 4.1893937794713365e-05} +{"train_loss": 0.001636922126635909, "global_step": 39625, "epoch": 332, "lr": 4.189175160236141e-05} +{"train_loss": 0.002046306571578842, "global_step": 39626, "epoch": 332, "lr": 4.188956542592915e-05, "val_loss": 0.027172332629561424} +{"train_loss": 0.004410639405250549, "global_step": 39627, "epoch": 333, "lr": 4.188737926542087e-05} +{"train_loss": 0.002859801286831498, "global_step": 39628, "epoch": 333, "lr": 4.188519312084083e-05} +{"train_loss": 0.0015317477518692613, "global_step": 39629, "epoch": 333, "lr": 4.188300699219336e-05} +{"train_loss": 0.0022832192480564117, "global_step": 39630, "epoch": 333, "lr": 4.188082087948273e-05} +{"train_loss": 0.004465812351554632, "global_step": 39631, "epoch": 333, "lr": 4.187863478271325e-05} +{"train_loss": 0.003434075741097331, "global_step": 39632, "epoch": 333, "lr": 4.1876448701889185e-05} +{"train_loss": 0.0034731407649815083, "global_step": 39633, "epoch": 333, "lr": 4.187426263701487e-05} +{"train_loss": 0.0014074837090447545, "global_step": 39634, "epoch": 333, "lr": 4.187207658809457e-05} +{"train_loss": 0.0016031705308705568, "global_step": 39635, "epoch": 333, "lr": 4.1869890555132556e-05} +{"train_loss": 0.0030487256590276957, "global_step": 39636, "epoch": 333, "lr": 4.1867704538133154e-05} +{"train_loss": 0.004038440063595772, "global_step": 39637, "epoch": 333, "lr": 4.186551853710065e-05} +{"train_loss": 0.0020806838292628527, "global_step": 39638, "epoch": 333, "lr": 4.186333255203933e-05} +{"train_loss": 0.003323886776342988, "global_step": 39639, "epoch": 333, "lr": 4.186114658295349e-05} +{"train_loss": 0.0031804991886019707, "global_step": 39640, "epoch": 333, "lr": 4.185896062984741e-05} +{"train_loss": 0.0016850134124979377, "global_step": 39641, "epoch": 333, "lr": 4.185677469272541e-05} +{"train_loss": 0.0022876346483826637, "global_step": 39642, "epoch": 333, "lr": 4.185458877159174e-05} +{"train_loss": 0.0022453879937529564, "global_step": 39643, "epoch": 333, "lr": 4.1852402866450735e-05} +{"train_loss": 0.0013109225546941161, "global_step": 39644, "epoch": 333, "lr": 4.185021697730665e-05} +{"train_loss": 0.0021751669701188803, "global_step": 39645, "epoch": 333, "lr": 4.18480311041638e-05} +{"train_loss": 0.0021733888424932957, "global_step": 39646, "epoch": 333, "lr": 4.184584524702648e-05} +{"train_loss": 0.0029151244089007378, "global_step": 39647, "epoch": 333, "lr": 4.184365940589895e-05} +{"train_loss": 0.001626154175028205, "global_step": 39648, "epoch": 333, "lr": 4.1841473580785544e-05} +{"train_loss": 0.0013326837215572596, "global_step": 39649, "epoch": 333, "lr": 4.1839287771690514e-05} +{"train_loss": 0.0022867766674607992, "global_step": 39650, "epoch": 333, "lr": 4.183710197861819e-05} +{"train_loss": 0.0017840575892478228, "global_step": 39651, "epoch": 333, "lr": 4.183491620157282e-05} +{"train_loss": 0.0016603699186816812, "global_step": 39652, "epoch": 333, "lr": 4.183273044055875e-05} +{"train_loss": 0.0028970548883080482, "global_step": 39653, "epoch": 333, "lr": 4.183054469558022e-05} +{"train_loss": 0.001777931465767324, "global_step": 39654, "epoch": 333, "lr": 4.182835896664155e-05} +{"train_loss": 0.0022572199814021587, "global_step": 39655, "epoch": 333, "lr": 4.182617325374702e-05} +{"train_loss": 0.001910905702970922, "global_step": 39656, "epoch": 333, "lr": 4.182398755690093e-05} +{"train_loss": 0.0015829679323360324, "global_step": 39657, "epoch": 333, "lr": 4.182180187610756e-05} +{"train_loss": 0.0018927681958302855, "global_step": 39658, "epoch": 333, "lr": 4.18196162113712e-05} +{"train_loss": 0.0012391989585012197, "global_step": 39659, "epoch": 333, "lr": 4.1817430562696177e-05} +{"train_loss": 0.0017654497642070055, "global_step": 39660, "epoch": 333, "lr": 4.181524493008675e-05} +{"train_loss": 0.0031024995259940624, "global_step": 39661, "epoch": 333, "lr": 4.181305931354719e-05} +{"train_loss": 0.0022612237371504307, "global_step": 39662, "epoch": 333, "lr": 4.1810873713081845e-05} +{"train_loss": 0.0010684594744816422, "global_step": 39663, "epoch": 333, "lr": 4.1808688128694946e-05} +{"train_loss": 0.0019201966933906078, "global_step": 39664, "epoch": 333, "lr": 4.180650256039084e-05} +{"train_loss": 0.0014824564568698406, "global_step": 39665, "epoch": 333, "lr": 4.180431700817378e-05} +{"train_loss": 0.003830705303698778, "global_step": 39666, "epoch": 333, "lr": 4.1802131472048055e-05} +{"train_loss": 0.0021613980643451214, "global_step": 39667, "epoch": 333, "lr": 4.179994595201799e-05} +{"train_loss": 0.002063135150820017, "global_step": 39668, "epoch": 333, "lr": 4.179776044808783e-05} +{"train_loss": 0.001591867650859058, "global_step": 39669, "epoch": 333, "lr": 4.179557496026191e-05} +{"train_loss": 0.0012552014086395502, "global_step": 39670, "epoch": 333, "lr": 4.179338948854449e-05} +{"train_loss": 0.0011495680082589388, "global_step": 39671, "epoch": 333, "lr": 4.1791204032939876e-05} +{"train_loss": 0.0013306594919413328, "global_step": 39672, "epoch": 333, "lr": 4.178901859345237e-05} +{"train_loss": 0.0015736783389002085, "global_step": 39673, "epoch": 333, "lr": 4.178683317008622e-05} +{"train_loss": 0.0019032234558835626, "global_step": 39674, "epoch": 333, "lr": 4.178464776284578e-05} +{"train_loss": 0.002141581615433097, "global_step": 39675, "epoch": 333, "lr": 4.178246237173528e-05} +{"train_loss": 0.0015746509889140725, "global_step": 39676, "epoch": 333, "lr": 4.178027699675906e-05} +{"train_loss": 0.0016535712638869882, "global_step": 39677, "epoch": 333, "lr": 4.1778091637921385e-05} +{"train_loss": 0.0015405496815219522, "global_step": 39678, "epoch": 333, "lr": 4.177590629522653e-05} +{"train_loss": 0.0016192697221413255, "global_step": 39679, "epoch": 333, "lr": 4.177372096867882e-05} +{"train_loss": 0.0010826879879459739, "global_step": 39680, "epoch": 333, "lr": 4.177153565828251e-05} +{"train_loss": 0.0016876121517270803, "global_step": 39681, "epoch": 333, "lr": 4.176935036404194e-05} +{"train_loss": 0.0015193993458524346, "global_step": 39682, "epoch": 333, "lr": 4.176716508596134e-05} +{"train_loss": 0.0018338192021474242, "global_step": 39683, "epoch": 333, "lr": 4.1764979824045056e-05} +{"train_loss": 0.001128275878727436, "global_step": 39684, "epoch": 333, "lr": 4.176279457829735e-05} +{"train_loss": 0.003004898549988866, "global_step": 39685, "epoch": 333, "lr": 4.176060934872251e-05} +{"train_loss": 0.002252080710604787, "global_step": 39686, "epoch": 333, "lr": 4.175842413532483e-05} +{"train_loss": 0.0015153097920119762, "global_step": 39687, "epoch": 333, "lr": 4.175623893810861e-05} +{"train_loss": 0.0018259519711136818, "global_step": 39688, "epoch": 333, "lr": 4.1754053757078135e-05} +{"train_loss": 0.0022228199522942305, "global_step": 39689, "epoch": 333, "lr": 4.175186859223769e-05} +{"train_loss": 0.0036138570867478848, "global_step": 39690, "epoch": 333, "lr": 4.174968344359157e-05} +{"train_loss": 0.0014661304885521531, "global_step": 39691, "epoch": 333, "lr": 4.174749831114408e-05} +{"train_loss": 0.001704230671748519, "global_step": 39692, "epoch": 333, "lr": 4.174531319489947e-05} +{"train_loss": 0.002680861158296466, "global_step": 39693, "epoch": 333, "lr": 4.1743128094862086e-05} +{"train_loss": 0.0014614892425015569, "global_step": 39694, "epoch": 333, "lr": 4.174094301103615e-05} +{"train_loss": 0.001309323008172214, "global_step": 39695, "epoch": 333, "lr": 4.1738757943426025e-05} +{"train_loss": 0.0030793799087405205, "global_step": 39696, "epoch": 333, "lr": 4.173657289203596e-05} +{"train_loss": 0.002186967758461833, "global_step": 39697, "epoch": 333, "lr": 4.173438785687024e-05} +{"train_loss": 0.0023692555259913206, "global_step": 39698, "epoch": 333, "lr": 4.1732202837933176e-05} +{"train_loss": 0.001597739988937974, "global_step": 39699, "epoch": 333, "lr": 4.173001783522903e-05} +{"train_loss": 0.002498124958947301, "global_step": 39700, "epoch": 333, "lr": 4.172783284876213e-05} +{"train_loss": 0.0023556379601359367, "global_step": 39701, "epoch": 333, "lr": 4.172564787853673e-05} +{"train_loss": 0.00193502358160913, "global_step": 39702, "epoch": 333, "lr": 4.1723462924557154e-05} +{"train_loss": 0.0013277680845931172, "global_step": 39703, "epoch": 333, "lr": 4.1721277986827665e-05} +{"train_loss": 0.0028845013584941626, "global_step": 39704, "epoch": 333, "lr": 4.171909306535257e-05} +{"train_loss": 0.0013010593829676509, "global_step": 39705, "epoch": 333, "lr": 4.171690816013614e-05} +{"train_loss": 0.001920654671266675, "global_step": 39706, "epoch": 333, "lr": 4.171472327118267e-05} +{"train_loss": 0.001570476102642715, "global_step": 39707, "epoch": 333, "lr": 4.171253839849648e-05} +{"train_loss": 0.002558698644861579, "global_step": 39708, "epoch": 333, "lr": 4.1710353542081805e-05} +{"train_loss": 0.0013564523542299867, "global_step": 39709, "epoch": 333, "lr": 4.170816870194299e-05} +{"train_loss": 0.0007512022857554257, "global_step": 39710, "epoch": 333, "lr": 4.1705983878084305e-05} +{"train_loss": 0.002984566381201148, "global_step": 39711, "epoch": 333, "lr": 4.170379907051001e-05} +{"train_loss": 0.0021271775476634502, "global_step": 39712, "epoch": 333, "lr": 4.170161427922444e-05} +{"train_loss": 0.0017728075617924333, "global_step": 39713, "epoch": 333, "lr": 4.169942950423184e-05} +{"train_loss": 0.0015971221728250384, "global_step": 39714, "epoch": 333, "lr": 4.1697244745536545e-05} +{"train_loss": 0.0015412903157994151, "global_step": 39715, "epoch": 333, "lr": 4.169506000314283e-05} +{"train_loss": 0.0018700106302276254, "global_step": 39716, "epoch": 333, "lr": 4.169287527705495e-05} +{"train_loss": 0.0030310682486742735, "global_step": 39717, "epoch": 333, "lr": 4.1690690567277246e-05} +{"train_loss": 0.0011969972401857376, "global_step": 39718, "epoch": 333, "lr": 4.168850587381396e-05} +{"train_loss": 0.002401175908744335, "global_step": 39719, "epoch": 333, "lr": 4.168632119666943e-05} +{"train_loss": 0.0016919064801186323, "global_step": 39720, "epoch": 333, "lr": 4.16841365358479e-05} +{"train_loss": 0.002218985464423895, "global_step": 39721, "epoch": 333, "lr": 4.168195189135368e-05} +{"train_loss": 0.0014982762513682246, "global_step": 39722, "epoch": 333, "lr": 4.167976726319107e-05} +{"train_loss": 0.0016725215828046203, "global_step": 39723, "epoch": 333, "lr": 4.167758265136433e-05} +{"train_loss": 0.0022107509430497885, "global_step": 39724, "epoch": 333, "lr": 4.167539805587779e-05} +{"train_loss": 0.001969622215256095, "global_step": 39725, "epoch": 333, "lr": 4.16732134767357e-05} +{"train_loss": 0.0019705535378307104, "global_step": 39726, "epoch": 333, "lr": 4.167102891394238e-05} +{"train_loss": 0.0022664149291813374, "global_step": 39727, "epoch": 333, "lr": 4.1668844367502094e-05} +{"train_loss": 0.0016740445280447602, "global_step": 39728, "epoch": 333, "lr": 4.166665983741915e-05} +{"train_loss": 0.0020508801098912954, "global_step": 39729, "epoch": 333, "lr": 4.166447532369784e-05} +{"train_loss": 0.0026169808115810156, "global_step": 39730, "epoch": 333, "lr": 4.1662290826342414e-05} +{"train_loss": 0.0011745867086574435, "global_step": 39731, "epoch": 333, "lr": 4.1660106345357214e-05} +{"train_loss": 0.0017895500641316175, "global_step": 39732, "epoch": 333, "lr": 4.165792188074648e-05} +{"train_loss": 0.001945829251781106, "global_step": 39733, "epoch": 333, "lr": 4.165573743251455e-05} +{"train_loss": 0.00258325575850904, "global_step": 39734, "epoch": 333, "lr": 4.1653553000665675e-05} +{"train_loss": 0.001182064414024353, "global_step": 39735, "epoch": 333, "lr": 4.165136858520415e-05} +{"train_loss": 0.0010781437158584595, "global_step": 39736, "epoch": 333, "lr": 4.164918418613428e-05} +{"train_loss": 0.0020555942319333553, "global_step": 39737, "epoch": 333, "lr": 4.1646999803460346e-05} +{"train_loss": 0.002532867481932044, "global_step": 39738, "epoch": 333, "lr": 4.1644815437186636e-05} +{"train_loss": 0.0014874374028295279, "global_step": 39739, "epoch": 333, "lr": 4.164263108731743e-05} +{"train_loss": 0.0029602600261569023, "global_step": 39740, "epoch": 333, "lr": 4.1640446753857034e-05} +{"train_loss": 0.0023326869122684, "global_step": 39741, "epoch": 333, "lr": 4.1638262436809734e-05} +{"train_loss": 0.0014145452296361327, "global_step": 39742, "epoch": 333, "lr": 4.163607813617979e-05} +{"train_loss": 0.0017637514974921942, "global_step": 39743, "epoch": 333, "lr": 4.163389385197153e-05} +{"train_loss": 0.0015622933860868216, "global_step": 39744, "epoch": 333, "lr": 4.163170958418921e-05} +{"train_loss": 0.0020452211899565486, "global_step": 39745, "epoch": 333, "lr": 4.162952533283716e-05, "val_loss": 0.018804021179676056} +{"train_loss": 0.0020668222568929195, "global_step": 39746, "epoch": 334, "lr": 4.162734109791964e-05} +{"train_loss": 0.0014906934229657054, "global_step": 39747, "epoch": 334, "lr": 4.162515687944091e-05} +{"train_loss": 0.0012128406669944525, "global_step": 39748, "epoch": 334, "lr": 4.1622972677405324e-05} +{"train_loss": 0.0009488190989941359, "global_step": 39749, "epoch": 334, "lr": 4.162078849181711e-05} +{"train_loss": 0.0011339605553075671, "global_step": 39750, "epoch": 334, "lr": 4.16186043226806e-05} +{"train_loss": 0.002524096053093672, "global_step": 39751, "epoch": 334, "lr": 4.1616420170000046e-05} +{"train_loss": 0.001225487794727087, "global_step": 39752, "epoch": 334, "lr": 4.1614236033779786e-05} +{"train_loss": 0.003214087802916765, "global_step": 39753, "epoch": 334, "lr": 4.161205191402406e-05} +{"train_loss": 0.0018321165116503835, "global_step": 39754, "epoch": 334, "lr": 4.160986781073717e-05} +{"train_loss": 0.0017425828846171498, "global_step": 39755, "epoch": 334, "lr": 4.1607683723923415e-05} +{"train_loss": 0.0014063474955037236, "global_step": 39756, "epoch": 334, "lr": 4.160549965358705e-05} +{"train_loss": 0.0012553215492516756, "global_step": 39757, "epoch": 334, "lr": 4.160331559973243e-05} +{"train_loss": 0.0015285952249541879, "global_step": 39758, "epoch": 334, "lr": 4.1601131562363777e-05} +{"train_loss": 0.002959043253213167, "global_step": 39759, "epoch": 334, "lr": 4.159894754148542e-05} +{"train_loss": 0.002333352342247963, "global_step": 39760, "epoch": 334, "lr": 4.1596763537101634e-05} +{"train_loss": 0.001406577997840941, "global_step": 39761, "epoch": 334, "lr": 4.159457954921669e-05} +{"train_loss": 0.000837681582197547, "global_step": 39762, "epoch": 334, "lr": 4.159239557783491e-05} +{"train_loss": 0.0023696483112871647, "global_step": 39763, "epoch": 334, "lr": 4.1590211622960536e-05} +{"train_loss": 0.0013948468258604407, "global_step": 39764, "epoch": 334, "lr": 4.158802768459791e-05} +{"train_loss": 0.002814303617924452, "global_step": 39765, "epoch": 334, "lr": 4.158584376275129e-05} +{"train_loss": 0.0016924981027841568, "global_step": 39766, "epoch": 334, "lr": 4.1583659857424945e-05} +{"train_loss": 0.001179297687485814, "global_step": 39767, "epoch": 334, "lr": 4.1581475968623205e-05} +{"train_loss": 0.002020217478275299, "global_step": 39768, "epoch": 334, "lr": 4.157929209635032e-05} +{"train_loss": 0.0026895678602159023, "global_step": 39769, "epoch": 334, "lr": 4.1577108240610606e-05} +{"train_loss": 0.0015956026036292315, "global_step": 39770, "epoch": 334, "lr": 4.157492440140834e-05} +{"train_loss": 0.0016094965394586325, "global_step": 39771, "epoch": 334, "lr": 4.15727405787478e-05} +{"train_loss": 0.0009126181830652058, "global_step": 39772, "epoch": 334, "lr": 4.1570556772633305e-05} +{"train_loss": 0.0017305531073361635, "global_step": 39773, "epoch": 334, "lr": 4.1568372983069105e-05} +{"train_loss": 0.001802323735319078, "global_step": 39774, "epoch": 334, "lr": 4.1566189210059514e-05} +{"train_loss": 0.0011919753160327673, "global_step": 39775, "epoch": 334, "lr": 4.156400545360879e-05} +{"train_loss": 0.002307932823896408, "global_step": 39776, "epoch": 334, "lr": 4.156182171372127e-05} +{"train_loss": 0.0024071582593023777, "global_step": 39777, "epoch": 334, "lr": 4.155963799040118e-05} +{"train_loss": 0.002346296329051256, "global_step": 39778, "epoch": 334, "lr": 4.1557454283652866e-05} +{"train_loss": 0.001318916562013328, "global_step": 39779, "epoch": 334, "lr": 4.155527059348059e-05} +{"train_loss": 0.0014682954642921686, "global_step": 39780, "epoch": 334, "lr": 4.1553086919888604e-05} +{"train_loss": 0.0014981577405706048, "global_step": 39781, "epoch": 334, "lr": 4.1550903262881267e-05} +{"train_loss": 0.0013740877620875835, "global_step": 39782, "epoch": 334, "lr": 4.15487196224628e-05} +{"train_loss": 0.0013390743406489491, "global_step": 39783, "epoch": 334, "lr": 4.1546535998637535e-05} +{"train_loss": 0.0009964978089556098, "global_step": 39784, "epoch": 334, "lr": 4.154435239140974e-05} +{"train_loss": 0.0016513424925506115, "global_step": 39785, "epoch": 334, "lr": 4.154216880078371e-05} +{"train_loss": 0.0022788741625845432, "global_step": 39786, "epoch": 334, "lr": 4.153998522676372e-05} +{"train_loss": 0.0014254017733037472, "global_step": 39787, "epoch": 334, "lr": 4.153780166935407e-05} +{"train_loss": 0.0018432756187394261, "global_step": 39788, "epoch": 334, "lr": 4.153561812855904e-05} +{"train_loss": 0.0014330836711451411, "global_step": 39789, "epoch": 334, "lr": 4.1533434604382915e-05} +{"train_loss": 0.0030644091311842203, "global_step": 39790, "epoch": 334, "lr": 4.1531251096829994e-05} +{"train_loss": 0.0010595597559586167, "global_step": 39791, "epoch": 334, "lr": 4.1529067605904566e-05} +{"train_loss": 0.001571603468619287, "global_step": 39792, "epoch": 334, "lr": 4.152688413161088e-05} +{"train_loss": 0.0021282427478581667, "global_step": 39793, "epoch": 334, "lr": 4.152470067395328e-05} +{"train_loss": 0.002432161010801792, "global_step": 39794, "epoch": 334, "lr": 4.1522517232936006e-05} +{"train_loss": 0.0021144335623830557, "global_step": 39795, "epoch": 334, "lr": 4.152033380856338e-05} +{"train_loss": 0.001458358601666987, "global_step": 39796, "epoch": 334, "lr": 4.1518150400839675e-05} +{"train_loss": 0.0009219635394401848, "global_step": 39797, "epoch": 334, "lr": 4.151596700976915e-05} +{"train_loss": 0.0021915724501013756, "global_step": 39798, "epoch": 334, "lr": 4.151378363535614e-05} +{"train_loss": 0.0027852682396769524, "global_step": 39799, "epoch": 334, "lr": 4.1511600277604895e-05} +{"train_loss": 0.0017275518039241433, "global_step": 39800, "epoch": 334, "lr": 4.150941693651973e-05} +{"train_loss": 0.001361195812933147, "global_step": 39801, "epoch": 334, "lr": 4.15072336121049e-05} +{"train_loss": 0.0028120619244873524, "global_step": 39802, "epoch": 334, "lr": 4.1505050304364735e-05} +{"train_loss": 0.0009498855215497315, "global_step": 39803, "epoch": 334, "lr": 4.1502867013303474e-05} +{"train_loss": 0.0018942079041153193, "global_step": 39804, "epoch": 334, "lr": 4.150068373892542e-05} +{"train_loss": 0.002027237555012107, "global_step": 39805, "epoch": 334, "lr": 4.1498500481234894e-05} +{"train_loss": 0.0016586693236604333, "global_step": 39806, "epoch": 334, "lr": 4.1496317240236126e-05} +{"train_loss": 0.0020617216359823942, "global_step": 39807, "epoch": 334, "lr": 4.149413401593345e-05} +{"train_loss": 0.0023410823196172714, "global_step": 39808, "epoch": 334, "lr": 4.1491950808331116e-05} +{"train_loss": 0.0011724465293809772, "global_step": 39809, "epoch": 334, "lr": 4.1489767617433446e-05} +{"train_loss": 0.002081718295812607, "global_step": 39810, "epoch": 334, "lr": 4.1487584443244706e-05} +{"train_loss": 0.0024217271711677313, "global_step": 39811, "epoch": 334, "lr": 4.1485401285769174e-05} +{"train_loss": 0.002413395093753934, "global_step": 39812, "epoch": 334, "lr": 4.148321814501116e-05} +{"train_loss": 0.001292505650781095, "global_step": 39813, "epoch": 334, "lr": 4.1481035020974915e-05} +{"train_loss": 0.0016799713484942913, "global_step": 39814, "epoch": 334, "lr": 4.147885191366477e-05} +{"train_loss": 0.0031239488162100315, "global_step": 39815, "epoch": 334, "lr": 4.147666882308499e-05} +{"train_loss": 0.0022559508215636015, "global_step": 39816, "epoch": 334, "lr": 4.147448574923984e-05} +{"train_loss": 0.002138671465218067, "global_step": 39817, "epoch": 334, "lr": 4.147230269213364e-05} +{"train_loss": 0.002172882203012705, "global_step": 39818, "epoch": 334, "lr": 4.147011965177066e-05} +{"train_loss": 0.002691384870558977, "global_step": 39819, "epoch": 334, "lr": 4.1467936628155177e-05} +{"train_loss": 0.0016618467634543777, "global_step": 39820, "epoch": 334, "lr": 4.14657536212915e-05} +{"train_loss": 0.0013712916988879442, "global_step": 39821, "epoch": 334, "lr": 4.1463570631183906e-05} +{"train_loss": 0.0016576203051954508, "global_step": 39822, "epoch": 334, "lr": 4.146138765783669e-05} +{"train_loss": 0.0040880655869841576, "global_step": 39823, "epoch": 334, "lr": 4.14592047012541e-05} +{"train_loss": 0.0016423150664195418, "global_step": 39824, "epoch": 334, "lr": 4.1457021761440475e-05} +{"train_loss": 0.0022464829962700605, "global_step": 39825, "epoch": 334, "lr": 4.1454838838400054e-05} +{"train_loss": 0.002419077791273594, "global_step": 39826, "epoch": 334, "lr": 4.145265593213716e-05} +{"train_loss": 0.0013029251713305712, "global_step": 39827, "epoch": 334, "lr": 4.145047304265605e-05} +{"train_loss": 0.00147745490539819, "global_step": 39828, "epoch": 334, "lr": 4.144829016996104e-05} +{"train_loss": 0.002039000391960144, "global_step": 39829, "epoch": 334, "lr": 4.144610731405639e-05} +{"train_loss": 0.0020657628774642944, "global_step": 39830, "epoch": 334, "lr": 4.144392447494638e-05} +{"train_loss": 0.0011408708523958921, "global_step": 39831, "epoch": 334, "lr": 4.1441741652635334e-05} +{"train_loss": 0.0021313047036528587, "global_step": 39832, "epoch": 334, "lr": 4.143955884712749e-05} +{"train_loss": 0.004157132934778929, "global_step": 39833, "epoch": 334, "lr": 4.143737605842718e-05} +{"train_loss": 0.0017804832896217704, "global_step": 39834, "epoch": 334, "lr": 4.143519328653866e-05} +{"train_loss": 0.0026980156544595957, "global_step": 39835, "epoch": 334, "lr": 4.143301053146622e-05} +{"train_loss": 0.0012113123666495085, "global_step": 39836, "epoch": 334, "lr": 4.1430827793214144e-05} +{"train_loss": 0.0020602927543222904, "global_step": 39837, "epoch": 334, "lr": 4.142864507178673e-05} +{"train_loss": 0.0018914954271167517, "global_step": 39838, "epoch": 334, "lr": 4.142646236718825e-05} +{"train_loss": 0.0013390585081651807, "global_step": 39839, "epoch": 334, "lr": 4.142427967942298e-05} +{"train_loss": 0.0012082977918908, "global_step": 39840, "epoch": 334, "lr": 4.1422097008495255e-05} +{"train_loss": 0.001406213385052979, "global_step": 39841, "epoch": 334, "lr": 4.141991435440932e-05} +{"train_loss": 0.002336598467081785, "global_step": 39842, "epoch": 334, "lr": 4.141773171716945e-05} +{"train_loss": 0.0010258712572976947, "global_step": 39843, "epoch": 334, "lr": 4.141554909677996e-05} +{"train_loss": 0.0010245428420603275, "global_step": 39844, "epoch": 334, "lr": 4.14133664932451e-05} +{"train_loss": 0.002102284925058484, "global_step": 39845, "epoch": 334, "lr": 4.141118390656921e-05} +{"train_loss": 0.002006216673180461, "global_step": 39846, "epoch": 334, "lr": 4.140900133675651e-05} +{"train_loss": 0.001888576429337263, "global_step": 39847, "epoch": 334, "lr": 4.1406818783811344e-05} +{"train_loss": 0.001694856327958405, "global_step": 39848, "epoch": 334, "lr": 4.140463624773797e-05} +{"train_loss": 0.0019460893236100674, "global_step": 39849, "epoch": 334, "lr": 4.1402453728540655e-05} +{"train_loss": 0.0019605569541454315, "global_step": 39850, "epoch": 334, "lr": 4.140027122622372e-05} +{"train_loss": 0.002461559372022748, "global_step": 39851, "epoch": 334, "lr": 4.139808874079142e-05} +{"train_loss": 0.0014899392845109105, "global_step": 39852, "epoch": 334, "lr": 4.1395906272248056e-05} +{"train_loss": 0.0009687746642157435, "global_step": 39853, "epoch": 334, "lr": 4.139372382059793e-05} +{"train_loss": 0.0023949001915752888, "global_step": 39854, "epoch": 334, "lr": 4.139154138584528e-05} +{"train_loss": 0.0019364252220839262, "global_step": 39855, "epoch": 334, "lr": 4.138935896799444e-05} +{"train_loss": 0.0029270548839122057, "global_step": 39856, "epoch": 334, "lr": 4.138717656704966e-05} +{"train_loss": 0.002387627260759473, "global_step": 39857, "epoch": 334, "lr": 4.138499418301526e-05} +{"train_loss": 0.0026968896854668856, "global_step": 39858, "epoch": 334, "lr": 4.138281181589547e-05} +{"train_loss": 0.0009233184391632676, "global_step": 39859, "epoch": 334, "lr": 4.138062946569464e-05} +{"train_loss": 0.002773958258330822, "global_step": 39860, "epoch": 334, "lr": 4.137844713241702e-05} +{"train_loss": 0.001576912123709917, "global_step": 39861, "epoch": 334, "lr": 4.137626481606688e-05} +{"train_loss": 0.002989263040944934, "global_step": 39862, "epoch": 334, "lr": 4.137408251664854e-05} +{"train_loss": 0.0022246157750487328, "global_step": 39863, "epoch": 334, "lr": 4.1371900234166246e-05} +{"train_loss": 0.0018892448376903327, "global_step": 39864, "epoch": 334, "lr": 4.136971796862433e-05, "val_loss": 0.044888872653245926} +{"train_loss": 0.002340457635000348, "global_step": 39865, "epoch": 335, "lr": 4.136753572002705e-05} +{"train_loss": 0.0014709666138514876, "global_step": 39866, "epoch": 335, "lr": 4.136535348837866e-05} +{"train_loss": 0.0015369298635050654, "global_step": 39867, "epoch": 335, "lr": 4.136317127368349e-05} +{"train_loss": 0.0016247070161625743, "global_step": 39868, "epoch": 335, "lr": 4.1360989075945824e-05} +{"train_loss": 0.002534202765673399, "global_step": 39869, "epoch": 335, "lr": 4.135880689516992e-05} +{"train_loss": 0.0019884544890373945, "global_step": 39870, "epoch": 335, "lr": 4.135662473136008e-05} +{"train_loss": 0.001129913842305541, "global_step": 39871, "epoch": 335, "lr": 4.135444258452058e-05} +{"train_loss": 0.0018671242287382483, "global_step": 39872, "epoch": 335, "lr": 4.135226045465572e-05} +{"train_loss": 0.0017174078384414315, "global_step": 39873, "epoch": 335, "lr": 4.135007834176975e-05} +{"train_loss": 0.002142716897651553, "global_step": 39874, "epoch": 335, "lr": 4.134789624586701e-05} +{"train_loss": 0.0017988323234021664, "global_step": 39875, "epoch": 335, "lr": 4.134571416695172e-05} +{"train_loss": 0.0014615511754527688, "global_step": 39876, "epoch": 335, "lr": 4.134353210502822e-05} +{"train_loss": 0.0025268676690757275, "global_step": 39877, "epoch": 335, "lr": 4.134135006010075e-05} +{"train_loss": 0.0032310213427990675, "global_step": 39878, "epoch": 335, "lr": 4.133916803217363e-05} +{"train_loss": 0.0010979032376781106, "global_step": 39879, "epoch": 335, "lr": 4.133698602125113e-05} +{"train_loss": 0.002355786506086588, "global_step": 39880, "epoch": 335, "lr": 4.1334804027337514e-05} +{"train_loss": 0.0007310612709261477, "global_step": 39881, "epoch": 335, "lr": 4.1332622050437104e-05} +{"train_loss": 0.0019174115732312202, "global_step": 39882, "epoch": 335, "lr": 4.133044009055415e-05} +{"train_loss": 0.0014606104232370853, "global_step": 39883, "epoch": 335, "lr": 4.1328258147692955e-05} +{"train_loss": 0.0020534470677375793, "global_step": 39884, "epoch": 335, "lr": 4.13260762218578e-05} +{"train_loss": 0.0018740262603387237, "global_step": 39885, "epoch": 335, "lr": 4.132389431305297e-05} +{"train_loss": 0.0015667041298002005, "global_step": 39886, "epoch": 335, "lr": 4.132171242128275e-05} +{"train_loss": 0.0020485962741076946, "global_step": 39887, "epoch": 335, "lr": 4.1319530546551396e-05} +{"train_loss": 0.001298980787396431, "global_step": 39888, "epoch": 335, "lr": 4.131734868886324e-05} +{"train_loss": 0.0015611647395417094, "global_step": 39889, "epoch": 335, "lr": 4.131516684822253e-05} +{"train_loss": 0.0018575091380625963, "global_step": 39890, "epoch": 335, "lr": 4.1312985024633576e-05} +{"train_loss": 0.002103889361023903, "global_step": 39891, "epoch": 335, "lr": 4.131080321810065e-05} +{"train_loss": 0.0018199174664914608, "global_step": 39892, "epoch": 335, "lr": 4.1308621428628016e-05} +{"train_loss": 0.0012137017911300063, "global_step": 39893, "epoch": 335, "lr": 4.1306439656219994e-05} +{"train_loss": 0.00281562190502882, "global_step": 39894, "epoch": 335, "lr": 4.130425790088082e-05} +{"train_loss": 0.0017181627918034792, "global_step": 39895, "epoch": 335, "lr": 4.130207616261484e-05} +{"train_loss": 0.0018844574224203825, "global_step": 39896, "epoch": 335, "lr": 4.129989444142627e-05} +{"train_loss": 0.002694255905225873, "global_step": 39897, "epoch": 335, "lr": 4.129771273731946e-05} +{"train_loss": 0.0010823601623997092, "global_step": 39898, "epoch": 335, "lr": 4.129553105029866e-05} +{"train_loss": 0.0018234490416944027, "global_step": 39899, "epoch": 335, "lr": 4.129334938036813e-05} +{"train_loss": 0.002767048543319106, "global_step": 39900, "epoch": 335, "lr": 4.12911677275322e-05} +{"train_loss": 0.0009285193518735468, "global_step": 39901, "epoch": 335, "lr": 4.128898609179512e-05} +{"train_loss": 0.0010168071603402495, "global_step": 39902, "epoch": 335, "lr": 4.1286804473161187e-05} +{"train_loss": 0.0019993220921605825, "global_step": 39903, "epoch": 335, "lr": 4.1284622871634695e-05} +{"train_loss": 0.0022756801918148994, "global_step": 39904, "epoch": 335, "lr": 4.128244128721989e-05} +{"train_loss": 0.0019668382592499256, "global_step": 39905, "epoch": 335, "lr": 4.12802597199211e-05} +{"train_loss": 0.0012174767907708883, "global_step": 39906, "epoch": 335, "lr": 4.127807816974257e-05} +{"train_loss": 0.0024296455085277557, "global_step": 39907, "epoch": 335, "lr": 4.127589663668863e-05} +{"train_loss": 0.0019793231040239334, "global_step": 39908, "epoch": 335, "lr": 4.1273715120763505e-05} +{"train_loss": 0.0019305445021018386, "global_step": 39909, "epoch": 335, "lr": 4.127153362197153e-05} +{"train_loss": 0.0023078531958162785, "global_step": 39910, "epoch": 335, "lr": 4.1269352140316975e-05} +{"train_loss": 0.002210852690041065, "global_step": 39911, "epoch": 335, "lr": 4.1267170675804087e-05} +{"train_loss": 0.0035455855540931225, "global_step": 39912, "epoch": 335, "lr": 4.126498922843719e-05} +{"train_loss": 0.0014258184237405658, "global_step": 39913, "epoch": 335, "lr": 4.1262807798220546e-05} +{"train_loss": 0.001715375343337655, "global_step": 39914, "epoch": 335, "lr": 4.126062638515846e-05} +{"train_loss": 0.0013126966077834368, "global_step": 39915, "epoch": 335, "lr": 4.125844498925517e-05} +{"train_loss": 0.0024209183175116777, "global_step": 39916, "epoch": 335, "lr": 4.125626361051502e-05} +{"train_loss": 0.0016569022554904222, "global_step": 39917, "epoch": 335, "lr": 4.125408224894226e-05} +{"train_loss": 0.0011713069397956133, "global_step": 39918, "epoch": 335, "lr": 4.125190090454116e-05} +{"train_loss": 0.004296908620744944, "global_step": 39919, "epoch": 335, "lr": 4.1249719577316025e-05} +{"train_loss": 0.0027944224420934916, "global_step": 39920, "epoch": 335, "lr": 4.1247538267271135e-05} +{"train_loss": 0.001016975729726255, "global_step": 39921, "epoch": 335, "lr": 4.124535697441077e-05} +{"train_loss": 0.0017253935802727938, "global_step": 39922, "epoch": 335, "lr": 4.124317569873921e-05} +{"train_loss": 0.0016211036127060652, "global_step": 39923, "epoch": 335, "lr": 4.124099444026072e-05} +{"train_loss": 0.0026975409127771854, "global_step": 39924, "epoch": 335, "lr": 4.123881319897963e-05} +{"train_loss": 0.0018400393892079592, "global_step": 39925, "epoch": 335, "lr": 4.123663197490017e-05} +{"train_loss": 0.0020868079736828804, "global_step": 39926, "epoch": 335, "lr": 4.1234450768026664e-05} +{"train_loss": 0.0015300915110856295, "global_step": 39927, "epoch": 335, "lr": 4.1232269578363356e-05} +{"train_loss": 0.0016310772625729442, "global_step": 39928, "epoch": 335, "lr": 4.123008840591458e-05} +{"train_loss": 0.002303175628185272, "global_step": 39929, "epoch": 335, "lr": 4.122790725068458e-05} +{"train_loss": 0.0023283581249415874, "global_step": 39930, "epoch": 335, "lr": 4.1225726112677634e-05} +{"train_loss": 0.002432620618492365, "global_step": 39931, "epoch": 335, "lr": 4.1223544991898054e-05} +{"train_loss": 0.002085339743643999, "global_step": 39932, "epoch": 335, "lr": 4.1221363888350086e-05} +{"train_loss": 0.004279863554984331, "global_step": 39933, "epoch": 335, "lr": 4.1219182802038046e-05} +{"train_loss": 0.002571898978203535, "global_step": 39934, "epoch": 335, "lr": 4.12170017329662e-05} +{"train_loss": 0.0021090200170874596, "global_step": 39935, "epoch": 335, "lr": 4.121482068113883e-05} +{"train_loss": 0.0012423601001501083, "global_step": 39936, "epoch": 335, "lr": 4.1212639646560224e-05} +{"train_loss": 0.0019497661851346493, "global_step": 39937, "epoch": 335, "lr": 4.121045862923465e-05} +{"train_loss": 0.001336229732260108, "global_step": 39938, "epoch": 335, "lr": 4.120827762916642e-05} +{"train_loss": 0.0016803332837298512, "global_step": 39939, "epoch": 335, "lr": 4.120609664635978e-05} +{"train_loss": 0.0030565704219043255, "global_step": 39940, "epoch": 335, "lr": 4.120391568081904e-05} +{"train_loss": 0.003514358075335622, "global_step": 39941, "epoch": 335, "lr": 4.1201734732548484e-05} +{"train_loss": 0.0014556430978700519, "global_step": 39942, "epoch": 335, "lr": 4.119955380155236e-05} +{"train_loss": 0.001869868254289031, "global_step": 39943, "epoch": 335, "lr": 4.119737288783499e-05} +{"train_loss": 0.001782214385457337, "global_step": 39944, "epoch": 335, "lr": 4.1195191991400616e-05} +{"train_loss": 0.0019629187881946564, "global_step": 39945, "epoch": 335, "lr": 4.119301111225356e-05} +{"train_loss": 0.004599727224558592, "global_step": 39946, "epoch": 335, "lr": 4.119083025039807e-05} +{"train_loss": 0.0030238134786486626, "global_step": 39947, "epoch": 335, "lr": 4.1188649405838464e-05} +{"train_loss": 0.0022358715068548918, "global_step": 39948, "epoch": 335, "lr": 4.1186468578579e-05} +{"train_loss": 0.0026185933966189623, "global_step": 39949, "epoch": 335, "lr": 4.118428776862395e-05} +{"train_loss": 0.0029843614902347326, "global_step": 39950, "epoch": 335, "lr": 4.1182106975977616e-05} +{"train_loss": 0.002117627765983343, "global_step": 39951, "epoch": 335, "lr": 4.117992620064427e-05} +{"train_loss": 0.005293992348015308, "global_step": 39952, "epoch": 335, "lr": 4.1177745442628193e-05} +{"train_loss": 0.002459249459207058, "global_step": 39953, "epoch": 335, "lr": 4.117556470193369e-05} +{"train_loss": 0.0027195492293685675, "global_step": 39954, "epoch": 335, "lr": 4.1173383978564995e-05} +{"train_loss": 0.0023043914698064327, "global_step": 39955, "epoch": 335, "lr": 4.1171203272526445e-05} +{"train_loss": 0.001787578104995191, "global_step": 39956, "epoch": 335, "lr": 4.116902258382227e-05} +{"train_loss": 0.003722128225490451, "global_step": 39957, "epoch": 335, "lr": 4.1166841912456795e-05} +{"train_loss": 0.004606226924806833, "global_step": 39958, "epoch": 335, "lr": 4.116466125843426e-05} +{"train_loss": 0.003088735742494464, "global_step": 39959, "epoch": 335, "lr": 4.1162480621758995e-05} +{"train_loss": 0.002334948629140854, "global_step": 39960, "epoch": 335, "lr": 4.1160300002435246e-05} +{"train_loss": 0.0018930082442238927, "global_step": 39961, "epoch": 335, "lr": 4.115811940046729e-05} +{"train_loss": 0.002354220487177372, "global_step": 39962, "epoch": 335, "lr": 4.1155938815859445e-05} +{"train_loss": 0.002046238398179412, "global_step": 39963, "epoch": 335, "lr": 4.1153758248615944e-05} +{"train_loss": 0.0015684396494179964, "global_step": 39964, "epoch": 335, "lr": 4.115157769874112e-05} +{"train_loss": 0.001664070994593203, "global_step": 39965, "epoch": 335, "lr": 4.11493971662392e-05} +{"train_loss": 0.0026249652728438377, "global_step": 39966, "epoch": 335, "lr": 4.114721665111452e-05} +{"train_loss": 0.0018992065452039242, "global_step": 39967, "epoch": 335, "lr": 4.114503615337132e-05} +{"train_loss": 0.002120902528986335, "global_step": 39968, "epoch": 335, "lr": 4.114285567301389e-05} +{"train_loss": 0.0042655630968511105, "global_step": 39969, "epoch": 335, "lr": 4.114067521004653e-05} +{"train_loss": 0.00203142361715436, "global_step": 39970, "epoch": 335, "lr": 4.1138494764473496e-05} +{"train_loss": 0.0012744233245030046, "global_step": 39971, "epoch": 335, "lr": 4.113631433629909e-05} +{"train_loss": 0.0028210554737597704, "global_step": 39972, "epoch": 335, "lr": 4.1134133925527585e-05} +{"train_loss": 0.0018796755466610193, "global_step": 39973, "epoch": 335, "lr": 4.1131953532163245e-05} +{"train_loss": 0.0016842583427205682, "global_step": 39974, "epoch": 335, "lr": 4.1129773156210385e-05} +{"train_loss": 0.0015310462331399322, "global_step": 39975, "epoch": 335, "lr": 4.1127592797673255e-05} +{"train_loss": 0.0008194550755433738, "global_step": 39976, "epoch": 335, "lr": 4.112541245655616e-05} +{"train_loss": 0.0020276422146707773, "global_step": 39977, "epoch": 335, "lr": 4.112323213286335e-05} +{"train_loss": 0.001958053559064865, "global_step": 39978, "epoch": 335, "lr": 4.112105182659915e-05} +{"train_loss": 0.003202366176992655, "global_step": 39979, "epoch": 335, "lr": 4.111887153776782e-05} +{"train_loss": 0.001041894662193954, "global_step": 39980, "epoch": 335, "lr": 4.111669126637361e-05} +{"train_loss": 0.0026537880767136812, "global_step": 39981, "epoch": 335, "lr": 4.111451101242085e-05} +{"train_loss": 0.003151498967781663, "global_step": 39982, "epoch": 335, "lr": 4.1112330775913775e-05} +{"train_loss": 0.0021473330591351356, "global_step": 39983, "epoch": 335, "lr": 4.1110150556856707e-05, "val_loss": 0.015956753864884377, "train_action_mse_error": 2.4769566152826883e-05} +{"train_loss": 0.0015309759182855487, "global_step": 39984, "epoch": 336, "lr": 4.1107970355253903e-05} +{"train_loss": 0.0016927951946854591, "global_step": 39985, "epoch": 336, "lr": 4.110579017110964e-05} +{"train_loss": 0.0013283060397952795, "global_step": 39986, "epoch": 336, "lr": 4.1103610004428225e-05} +{"train_loss": 0.0040390207432210445, "global_step": 39987, "epoch": 336, "lr": 4.110142985521391e-05} +{"train_loss": 0.002099305856972933, "global_step": 39988, "epoch": 336, "lr": 4.1099249723471e-05} +{"train_loss": 0.003129693679511547, "global_step": 39989, "epoch": 336, "lr": 4.109706960920374e-05} +{"train_loss": 0.0015760187525302172, "global_step": 39990, "epoch": 336, "lr": 4.109488951241646e-05} +{"train_loss": 0.002329392358660698, "global_step": 39991, "epoch": 336, "lr": 4.10927094331134e-05} +{"train_loss": 0.002089201705530286, "global_step": 39992, "epoch": 336, "lr": 4.1090529371298846e-05} +{"train_loss": 0.002680930308997631, "global_step": 39993, "epoch": 336, "lr": 4.10883493269771e-05} +{"train_loss": 0.001416003447957337, "global_step": 39994, "epoch": 336, "lr": 4.108616930015241e-05} +{"train_loss": 0.0018321058014407754, "global_step": 39995, "epoch": 336, "lr": 4.108398929082909e-05} +{"train_loss": 0.0027379700914025307, "global_step": 39996, "epoch": 336, "lr": 4.1081809299011394e-05} +{"train_loss": 0.0024526563938707113, "global_step": 39997, "epoch": 336, "lr": 4.107962932470362e-05} +{"train_loss": 0.0014557399554178119, "global_step": 39998, "epoch": 336, "lr": 4.107744936791004e-05} +{"train_loss": 0.0020406499970704317, "global_step": 39999, "epoch": 336, "lr": 4.1075269428634936e-05} +{"train_loss": 0.002209471305832267, "global_step": 40000, "epoch": 336, "lr": 4.1073089506882576e-05} +{"train_loss": 0.002009475836530328, "global_step": 40001, "epoch": 336, "lr": 4.1070909602657265e-05} +{"train_loss": 0.0015974040143191814, "global_step": 40002, "epoch": 336, "lr": 4.106872971596326e-05} +{"train_loss": 0.0027638671454042196, "global_step": 40003, "epoch": 336, "lr": 4.106654984680486e-05} +{"train_loss": 0.002835306106135249, "global_step": 40004, "epoch": 336, "lr": 4.106436999518632e-05} +{"train_loss": 0.0010967068374156952, "global_step": 40005, "epoch": 336, "lr": 4.1062190161111956e-05} +{"train_loss": 0.0017968950560316443, "global_step": 40006, "epoch": 336, "lr": 4.1060010344586004e-05} +{"train_loss": 0.0020954550709575415, "global_step": 40007, "epoch": 336, "lr": 4.1057830545612784e-05} +{"train_loss": 0.0018069116631522775, "global_step": 40008, "epoch": 336, "lr": 4.105565076419654e-05} +{"train_loss": 0.003737794701009989, "global_step": 40009, "epoch": 336, "lr": 4.1053471000341595e-05} +{"train_loss": 0.002222041366621852, "global_step": 40010, "epoch": 336, "lr": 4.105129125405219e-05} +{"train_loss": 0.0018801080295816064, "global_step": 40011, "epoch": 336, "lr": 4.104911152533261e-05} +{"train_loss": 0.0019503443036228418, "global_step": 40012, "epoch": 336, "lr": 4.1046931814187164e-05} +{"train_loss": 0.002374245785176754, "global_step": 40013, "epoch": 336, "lr": 4.1044752120620086e-05} +{"train_loss": 0.0033847580198198557, "global_step": 40014, "epoch": 336, "lr": 4.1042572444635704e-05} +{"train_loss": 0.001295750611461699, "global_step": 40015, "epoch": 336, "lr": 4.1040392786238254e-05} +{"train_loss": 0.0018241917714476585, "global_step": 40016, "epoch": 336, "lr": 4.103821314543205e-05} +{"train_loss": 0.0009254536707885563, "global_step": 40017, "epoch": 336, "lr": 4.1036033522221353e-05} +{"train_loss": 0.0025999376084655523, "global_step": 40018, "epoch": 336, "lr": 4.103385391661045e-05} +{"train_loss": 0.0012370481854304671, "global_step": 40019, "epoch": 336, "lr": 4.103167432860361e-05} +{"train_loss": 0.0031428742222487926, "global_step": 40020, "epoch": 336, "lr": 4.102949475820511e-05} +{"train_loss": 0.0028361333534121513, "global_step": 40021, "epoch": 336, "lr": 4.102731520541926e-05} +{"train_loss": 0.0026374156586825848, "global_step": 40022, "epoch": 336, "lr": 4.102513567025032e-05} +{"train_loss": 0.0021858930122107267, "global_step": 40023, "epoch": 336, "lr": 4.102295615270254e-05} +{"train_loss": 0.0021941137965768576, "global_step": 40024, "epoch": 336, "lr": 4.102077665278026e-05} +{"train_loss": 0.0030120208393782377, "global_step": 40025, "epoch": 336, "lr": 4.1018597170487694e-05} +{"train_loss": 0.0017821169458329678, "global_step": 40026, "epoch": 336, "lr": 4.1016417705829176e-05} +{"train_loss": 0.0026661627925932407, "global_step": 40027, "epoch": 336, "lr": 4.101423825880894e-05} +{"train_loss": 0.002236171392723918, "global_step": 40028, "epoch": 336, "lr": 4.101205882943131e-05} +{"train_loss": 0.0013209780445322394, "global_step": 40029, "epoch": 336, "lr": 4.100987941770054e-05} +{"train_loss": 0.0021174082066863775, "global_step": 40030, "epoch": 336, "lr": 4.100770002362089e-05} +{"train_loss": 0.004393525421619415, "global_step": 40031, "epoch": 336, "lr": 4.1005520647196686e-05} +{"train_loss": 0.0020514214411377907, "global_step": 40032, "epoch": 336, "lr": 4.100334128843216e-05} +{"train_loss": 0.0023223599418997765, "global_step": 40033, "epoch": 336, "lr": 4.100116194733163e-05} +{"train_loss": 0.0016056254971772432, "global_step": 40034, "epoch": 336, "lr": 4.099898262389934e-05} +{"train_loss": 0.0019618174992501736, "global_step": 40035, "epoch": 336, "lr": 4.099680331813959e-05} +{"train_loss": 0.0030910144560039043, "global_step": 40036, "epoch": 336, "lr": 4.0994624030056674e-05} +{"train_loss": 0.0020190589129924774, "global_step": 40037, "epoch": 336, "lr": 4.099244475965482e-05} +{"train_loss": 0.0012745661661028862, "global_step": 40038, "epoch": 336, "lr": 4.099026550693837e-05} +{"train_loss": 0.00257127289660275, "global_step": 40039, "epoch": 336, "lr": 4.0988086271911545e-05} +{"train_loss": 0.0015741377137601376, "global_step": 40040, "epoch": 336, "lr": 4.098590705457867e-05} +{"train_loss": 0.0024562827311456203, "global_step": 40041, "epoch": 336, "lr": 4.098372785494401e-05} +{"train_loss": 0.002950855763629079, "global_step": 40042, "epoch": 336, "lr": 4.09815486730118e-05} +{"train_loss": 0.002089013112708926, "global_step": 40043, "epoch": 336, "lr": 4.09793695087864e-05} +{"train_loss": 0.003971824422478676, "global_step": 40044, "epoch": 336, "lr": 4.0977190362272004e-05} +{"train_loss": 0.0010253277141600847, "global_step": 40045, "epoch": 336, "lr": 4.097501123347296e-05} +{"train_loss": 0.0035074851475656033, "global_step": 40046, "epoch": 336, "lr": 4.097283212239349e-05} +{"train_loss": 0.001203681924380362, "global_step": 40047, "epoch": 336, "lr": 4.097065302903793e-05} +{"train_loss": 0.002667361171916127, "global_step": 40048, "epoch": 336, "lr": 4.096847395341051e-05} +{"train_loss": 0.0012154497671872377, "global_step": 40049, "epoch": 336, "lr": 4.096629489551553e-05} +{"train_loss": 0.0029294455889612436, "global_step": 40050, "epoch": 336, "lr": 4.096411585535727e-05} +{"train_loss": 0.0015111039392650127, "global_step": 40051, "epoch": 336, "lr": 4.0961936832939996e-05} +{"train_loss": 0.0016744207823649049, "global_step": 40052, "epoch": 336, "lr": 4.0959757828268e-05} +{"train_loss": 0.002296891761943698, "global_step": 40053, "epoch": 336, "lr": 4.095757884134556e-05} +{"train_loss": 0.0018027215264737606, "global_step": 40054, "epoch": 336, "lr": 4.0955399872176925e-05} +{"train_loss": 0.0016381723107770085, "global_step": 40055, "epoch": 336, "lr": 4.0953220920766414e-05} +{"train_loss": 0.001972232712432742, "global_step": 40056, "epoch": 336, "lr": 4.095104198711827e-05} +{"train_loss": 0.0015929288929328322, "global_step": 40057, "epoch": 336, "lr": 4.094886307123681e-05} +{"train_loss": 0.0015072128735482693, "global_step": 40058, "epoch": 336, "lr": 4.094668417312627e-05} +{"train_loss": 0.0027537415735423565, "global_step": 40059, "epoch": 336, "lr": 4.0944505292790966e-05} +{"train_loss": 0.003558854106813669, "global_step": 40060, "epoch": 336, "lr": 4.0942326430235167e-05} +{"train_loss": 0.0011848326539620757, "global_step": 40061, "epoch": 336, "lr": 4.0940147585463115e-05} +{"train_loss": 0.0028997950721532106, "global_step": 40062, "epoch": 336, "lr": 4.093796875847914e-05} +{"train_loss": 0.0020814421586692333, "global_step": 40063, "epoch": 336, "lr": 4.093578994928747e-05} +{"train_loss": 0.0015601037302985787, "global_step": 40064, "epoch": 336, "lr": 4.0933611157892424e-05} +{"train_loss": 0.0021904208697378635, "global_step": 40065, "epoch": 336, "lr": 4.093143238429825e-05} +{"train_loss": 0.002872900804504752, "global_step": 40066, "epoch": 336, "lr": 4.092925362850926e-05} +{"train_loss": 0.002184160752221942, "global_step": 40067, "epoch": 336, "lr": 4.092707489052971e-05} +{"train_loss": 0.0026611133944243193, "global_step": 40068, "epoch": 336, "lr": 4.0924896170363866e-05} +{"train_loss": 0.0015993877314031124, "global_step": 40069, "epoch": 336, "lr": 4.092271746801602e-05} +{"train_loss": 0.0011434978805482388, "global_step": 40070, "epoch": 336, "lr": 4.092053878349044e-05} +{"train_loss": 0.0009400174021720886, "global_step": 40071, "epoch": 336, "lr": 4.091836011679143e-05} +{"train_loss": 0.002546456176787615, "global_step": 40072, "epoch": 336, "lr": 4.091618146792326e-05} +{"train_loss": 0.0018960634479299188, "global_step": 40073, "epoch": 336, "lr": 4.091400283689017e-05} +{"train_loss": 0.002177528105676174, "global_step": 40074, "epoch": 336, "lr": 4.0911824223696484e-05} +{"train_loss": 0.002117806812748313, "global_step": 40075, "epoch": 336, "lr": 4.090964562834644e-05} +{"train_loss": 0.0023488691076636314, "global_step": 40076, "epoch": 336, "lr": 4.0907467050844356e-05} +{"train_loss": 0.0025115504395216703, "global_step": 40077, "epoch": 336, "lr": 4.090528849119447e-05} +{"train_loss": 0.003038461320102215, "global_step": 40078, "epoch": 336, "lr": 4.0903109949401097e-05} +{"train_loss": 0.0012476282427087426, "global_step": 40079, "epoch": 336, "lr": 4.09009314254685e-05} +{"train_loss": 0.0023058168590068817, "global_step": 40080, "epoch": 336, "lr": 4.0898752919400926e-05} +{"train_loss": 0.0012404626468196511, "global_step": 40081, "epoch": 336, "lr": 4.089657443120271e-05} +{"train_loss": 0.002130950801074505, "global_step": 40082, "epoch": 336, "lr": 4.0894395960878064e-05} +{"train_loss": 0.001426864881068468, "global_step": 40083, "epoch": 336, "lr": 4.089221750843131e-05} +{"train_loss": 0.0035226824693381786, "global_step": 40084, "epoch": 336, "lr": 4.089003907386672e-05} +{"train_loss": 0.002752052852883935, "global_step": 40085, "epoch": 336, "lr": 4.088786065718856e-05} +{"train_loss": 0.0017579036066308618, "global_step": 40086, "epoch": 336, "lr": 4.088568225840113e-05} +{"train_loss": 0.00166498648468405, "global_step": 40087, "epoch": 336, "lr": 4.088350387750866e-05} +{"train_loss": 0.000962807156611234, "global_step": 40088, "epoch": 336, "lr": 4.0881325514515486e-05} +{"train_loss": 0.002250435296446085, "global_step": 40089, "epoch": 336, "lr": 4.087914716942582e-05} +{"train_loss": 0.0016493522562086582, "global_step": 40090, "epoch": 336, "lr": 4.087696884224401e-05} +{"train_loss": 0.0014338108012452722, "global_step": 40091, "epoch": 336, "lr": 4.087479053297429e-05} +{"train_loss": 0.0023919506929814816, "global_step": 40092, "epoch": 336, "lr": 4.0872612241620924e-05} +{"train_loss": 0.002152002416551113, "global_step": 40093, "epoch": 336, "lr": 4.087043396818823e-05} +{"train_loss": 0.0024529004003852606, "global_step": 40094, "epoch": 336, "lr": 4.0868255712680444e-05} +{"train_loss": 0.003233908209949732, "global_step": 40095, "epoch": 336, "lr": 4.086607747510188e-05} +{"train_loss": 0.0018108022632077336, "global_step": 40096, "epoch": 336, "lr": 4.086389925545677e-05} +{"train_loss": 0.0012796460650861263, "global_step": 40097, "epoch": 336, "lr": 4.086172105374945e-05} +{"train_loss": 0.001845643506385386, "global_step": 40098, "epoch": 336, "lr": 4.085954286998415e-05} +{"train_loss": 0.0017663190374150872, "global_step": 40099, "epoch": 336, "lr": 4.085736470416516e-05} +{"train_loss": 0.0014075498329475522, "global_step": 40100, "epoch": 336, "lr": 4.0855186556296765e-05} +{"train_loss": 0.0016609053127467632, "global_step": 40101, "epoch": 336, "lr": 4.0853008426383225e-05} +{"train_loss": 0.0021383248615869078, "global_step": 40102, "epoch": 336, "lr": 4.085083031442883e-05, "val_loss": 0.015171671286225319} +{"train_loss": 0.0014353056903928518, "global_step": 40103, "epoch": 337, "lr": 4.084865222043785e-05} +{"train_loss": 0.0016578756039962173, "global_step": 40104, "epoch": 337, "lr": 4.084647414441456e-05} +{"train_loss": 0.0015360756078734994, "global_step": 40105, "epoch": 337, "lr": 4.084429608636326e-05} +{"train_loss": 0.002005048096179962, "global_step": 40106, "epoch": 337, "lr": 4.084211804628818e-05} +{"train_loss": 0.001941609662026167, "global_step": 40107, "epoch": 337, "lr": 4.0839940024193644e-05} +{"train_loss": 0.0018023168668150902, "global_step": 40108, "epoch": 337, "lr": 4.083776202008388e-05} +{"train_loss": 0.0016951682046055794, "global_step": 40109, "epoch": 337, "lr": 4.0835584033963225e-05} +{"train_loss": 0.0011576541000977159, "global_step": 40110, "epoch": 337, "lr": 4.0833406065835925e-05} +{"train_loss": 0.0025390591472387314, "global_step": 40111, "epoch": 337, "lr": 4.083122811570622e-05} +{"train_loss": 0.0027584971394389868, "global_step": 40112, "epoch": 337, "lr": 4.0829050183578435e-05} +{"train_loss": 0.002434689551591873, "global_step": 40113, "epoch": 337, "lr": 4.0826872269456824e-05} +{"train_loss": 0.0017682822654023767, "global_step": 40114, "epoch": 337, "lr": 4.082469437334568e-05} +{"train_loss": 0.0018172081327065825, "global_step": 40115, "epoch": 337, "lr": 4.082251649524925e-05} +{"train_loss": 0.0011503081768751144, "global_step": 40116, "epoch": 337, "lr": 4.082033863517185e-05} +{"train_loss": 0.0011426362907513976, "global_step": 40117, "epoch": 337, "lr": 4.081816079311773e-05} +{"train_loss": 0.001649036887101829, "global_step": 40118, "epoch": 337, "lr": 4.081598296909115e-05} +{"train_loss": 0.0019353536190465093, "global_step": 40119, "epoch": 337, "lr": 4.081380516309643e-05} +{"train_loss": 0.002298000268638134, "global_step": 40120, "epoch": 337, "lr": 4.08116273751378e-05} +{"train_loss": 0.003440535394474864, "global_step": 40121, "epoch": 337, "lr": 4.0809449605219586e-05} +{"train_loss": 0.0014138102997094393, "global_step": 40122, "epoch": 337, "lr": 4.080727185334603e-05} +{"train_loss": 0.00125880294945091, "global_step": 40123, "epoch": 337, "lr": 4.0805094119521394e-05} +{"train_loss": 0.0022341907024383545, "global_step": 40124, "epoch": 337, "lr": 4.080291640374999e-05} +{"train_loss": 0.002120980527251959, "global_step": 40125, "epoch": 337, "lr": 4.080073870603606e-05} +{"train_loss": 0.0013450016267597675, "global_step": 40126, "epoch": 337, "lr": 4.079856102638392e-05} +{"train_loss": 0.0018270921427756548, "global_step": 40127, "epoch": 337, "lr": 4.07963833647978e-05} +{"train_loss": 0.0031092145945876837, "global_step": 40128, "epoch": 337, "lr": 4.079420572128202e-05} +{"train_loss": 0.0014878858346492052, "global_step": 40129, "epoch": 337, "lr": 4.079202809584083e-05} +{"train_loss": 0.0019677295349538326, "global_step": 40130, "epoch": 337, "lr": 4.078985048847849e-05} +{"train_loss": 0.002199167385697365, "global_step": 40131, "epoch": 337, "lr": 4.078767289919931e-05} +{"train_loss": 0.0020868899300694466, "global_step": 40132, "epoch": 337, "lr": 4.0785495328007536e-05} +{"train_loss": 0.0016265485901385546, "global_step": 40133, "epoch": 337, "lr": 4.078331777490747e-05} +{"train_loss": 0.0009256736375391483, "global_step": 40134, "epoch": 337, "lr": 4.078114023990338e-05} +{"train_loss": 0.001336126122623682, "global_step": 40135, "epoch": 337, "lr": 4.077896272299952e-05} +{"train_loss": 0.0011154839303344488, "global_step": 40136, "epoch": 337, "lr": 4.077678522420021e-05} +{"train_loss": 0.002567049115896225, "global_step": 40137, "epoch": 337, "lr": 4.077460774350966e-05} +{"train_loss": 0.0018396064406260848, "global_step": 40138, "epoch": 337, "lr": 4.0772430280932204e-05} +{"train_loss": 0.0015008131740614772, "global_step": 40139, "epoch": 337, "lr": 4.077025283647208e-05} +{"train_loss": 0.0015709068393334746, "global_step": 40140, "epoch": 337, "lr": 4.07680754101336e-05} +{"train_loss": 0.0012301855022087693, "global_step": 40141, "epoch": 337, "lr": 4.076589800192101e-05} +{"train_loss": 0.002205745317041874, "global_step": 40142, "epoch": 337, "lr": 4.076372061183859e-05} +{"train_loss": 0.0012620544293895364, "global_step": 40143, "epoch": 337, "lr": 4.0761543239890624e-05} +{"train_loss": 0.002320137806236744, "global_step": 40144, "epoch": 337, "lr": 4.0759365886081355e-05} +{"train_loss": 0.0019572051241993904, "global_step": 40145, "epoch": 337, "lr": 4.075718855041512e-05} +{"train_loss": 0.002056104363873601, "global_step": 40146, "epoch": 337, "lr": 4.075501123289613e-05} +{"train_loss": 0.001525918603874743, "global_step": 40147, "epoch": 337, "lr": 4.0752833933528703e-05} +{"train_loss": 0.0033544881734997034, "global_step": 40148, "epoch": 337, "lr": 4.07506566523171e-05} +{"train_loss": 0.0018199487822130322, "global_step": 40149, "epoch": 337, "lr": 4.074847938926558e-05} +{"train_loss": 0.002031321171671152, "global_step": 40150, "epoch": 337, "lr": 4.0746302144378445e-05} +{"train_loss": 0.0019557487685233355, "global_step": 40151, "epoch": 337, "lr": 4.074412491765995e-05} +{"train_loss": 0.001746616791933775, "global_step": 40152, "epoch": 337, "lr": 4.074194770911438e-05} +{"train_loss": 0.0005204089102335274, "global_step": 40153, "epoch": 337, "lr": 4.073977051874599e-05} +{"train_loss": 0.0012512978864833713, "global_step": 40154, "epoch": 337, "lr": 4.073759334655911e-05} +{"train_loss": 0.0008834879845380783, "global_step": 40155, "epoch": 337, "lr": 4.073541619255796e-05} +{"train_loss": 0.0019330482464283705, "global_step": 40156, "epoch": 337, "lr": 4.073323905674681e-05} +{"train_loss": 0.001681094290688634, "global_step": 40157, "epoch": 337, "lr": 4.073106193912998e-05} +{"train_loss": 0.0037348936311900616, "global_step": 40158, "epoch": 337, "lr": 4.07288848397117e-05} +{"train_loss": 0.0022054840810596943, "global_step": 40159, "epoch": 337, "lr": 4.072670775849628e-05} +{"train_loss": 0.000879503961186856, "global_step": 40160, "epoch": 337, "lr": 4.072453069548798e-05} +{"train_loss": 0.0016014971770346165, "global_step": 40161, "epoch": 337, "lr": 4.0722353650691055e-05} +{"train_loss": 0.0018178706523030996, "global_step": 40162, "epoch": 337, "lr": 4.072017662410982e-05} +{"train_loss": 0.0018481607548892498, "global_step": 40163, "epoch": 337, "lr": 4.07179996157485e-05} +{"train_loss": 0.0010641849366948009, "global_step": 40164, "epoch": 337, "lr": 4.071582262561142e-05} +{"train_loss": 0.002215348184108734, "global_step": 40165, "epoch": 337, "lr": 4.071364565370281e-05} +{"train_loss": 0.0010737128322944045, "global_step": 40166, "epoch": 337, "lr": 4.0711468700026975e-05} +{"train_loss": 0.001490215421654284, "global_step": 40167, "epoch": 337, "lr": 4.070929176458818e-05} +{"train_loss": 0.0015775321517139673, "global_step": 40168, "epoch": 337, "lr": 4.0707114847390694e-05} +{"train_loss": 0.002906153444200754, "global_step": 40169, "epoch": 337, "lr": 4.070493794843881e-05} +{"train_loss": 0.0016127416165545583, "global_step": 40170, "epoch": 337, "lr": 4.070276106773676e-05} +{"train_loss": 0.0015714389737695456, "global_step": 40171, "epoch": 337, "lr": 4.0700584205288874e-05} +{"train_loss": 0.0011626312043517828, "global_step": 40172, "epoch": 337, "lr": 4.06984073610994e-05} +{"train_loss": 0.001842645462602377, "global_step": 40173, "epoch": 337, "lr": 4.069623053517258e-05} +{"train_loss": 0.0011947251623496413, "global_step": 40174, "epoch": 337, "lr": 4.0694053727512735e-05} +{"train_loss": 0.0016005749348551035, "global_step": 40175, "epoch": 337, "lr": 4.0691876938124114e-05} +{"train_loss": 0.0015018255217000842, "global_step": 40176, "epoch": 337, "lr": 4.068970016701101e-05} +{"train_loss": 0.0020168533083051443, "global_step": 40177, "epoch": 337, "lr": 4.068752341417767e-05} +{"train_loss": 0.0013405939098447561, "global_step": 40178, "epoch": 337, "lr": 4.068534667962839e-05} +{"train_loss": 0.0007796449353918433, "global_step": 40179, "epoch": 337, "lr": 4.068316996336745e-05} +{"train_loss": 0.0013441370101645589, "global_step": 40180, "epoch": 337, "lr": 4.0680993265399085e-05} +{"train_loss": 0.0022933888249099255, "global_step": 40181, "epoch": 337, "lr": 4.067881658572761e-05} +{"train_loss": 0.0011767768301069736, "global_step": 40182, "epoch": 337, "lr": 4.067663992435727e-05} +{"train_loss": 0.0012054177932441235, "global_step": 40183, "epoch": 337, "lr": 4.067446328129236e-05} +{"train_loss": 0.002164058154448867, "global_step": 40184, "epoch": 337, "lr": 4.067228665653715e-05} +{"train_loss": 0.0038891586009413004, "global_step": 40185, "epoch": 337, "lr": 4.06701100500959e-05} +{"train_loss": 0.002034015255048871, "global_step": 40186, "epoch": 337, "lr": 4.066793346197291e-05} +{"train_loss": 0.002039977815002203, "global_step": 40187, "epoch": 337, "lr": 4.066575689217241e-05} +{"train_loss": 0.0009912372333928943, "global_step": 40188, "epoch": 337, "lr": 4.066358034069872e-05} +{"train_loss": 0.0017340865451842546, "global_step": 40189, "epoch": 337, "lr": 4.066140380755607e-05} +{"train_loss": 0.001564412610605359, "global_step": 40190, "epoch": 337, "lr": 4.065922729274878e-05} +{"train_loss": 0.0017425433034077287, "global_step": 40191, "epoch": 337, "lr": 4.06570507962811e-05} +{"train_loss": 0.001411542878486216, "global_step": 40192, "epoch": 337, "lr": 4.0654874318157276e-05} +{"train_loss": 0.001520791556686163, "global_step": 40193, "epoch": 337, "lr": 4.065269785838164e-05} +{"train_loss": 0.0007070866995491087, "global_step": 40194, "epoch": 337, "lr": 4.0650521416958396e-05} +{"train_loss": 0.001489059766754508, "global_step": 40195, "epoch": 337, "lr": 4.064834499389189e-05} +{"train_loss": 0.0008848042343743145, "global_step": 40196, "epoch": 337, "lr": 4.0646168589186336e-05} +{"train_loss": 0.001966522540897131, "global_step": 40197, "epoch": 337, "lr": 4.064399220284605e-05} +{"train_loss": 0.0028573195450007915, "global_step": 40198, "epoch": 337, "lr": 4.064181583487527e-05} +{"train_loss": 0.001327458885498345, "global_step": 40199, "epoch": 337, "lr": 4.063963948527829e-05} +{"train_loss": 0.0011059073731303215, "global_step": 40200, "epoch": 337, "lr": 4.063746315405937e-05} +{"train_loss": 0.0017675255658105016, "global_step": 40201, "epoch": 337, "lr": 4.063528684122279e-05} +{"train_loss": 0.002137052360922098, "global_step": 40202, "epoch": 337, "lr": 4.063311054677285e-05} +{"train_loss": 0.002249599900096655, "global_step": 40203, "epoch": 337, "lr": 4.063093427071376e-05} +{"train_loss": 0.002692252164706588, "global_step": 40204, "epoch": 337, "lr": 4.062875801304986e-05} +{"train_loss": 0.0021099913865327835, "global_step": 40205, "epoch": 337, "lr": 4.062658177378539e-05} +{"train_loss": 0.0011589244240894914, "global_step": 40206, "epoch": 337, "lr": 4.0624405552924606e-05} +{"train_loss": 0.0009680174989625812, "global_step": 40207, "epoch": 337, "lr": 4.062222935047182e-05} +{"train_loss": 0.001312887528911233, "global_step": 40208, "epoch": 337, "lr": 4.062005316643126e-05} +{"train_loss": 0.0010124968830496073, "global_step": 40209, "epoch": 337, "lr": 4.0617877000807256e-05} +{"train_loss": 0.0019460218027234077, "global_step": 40210, "epoch": 337, "lr": 4.061570085360403e-05} +{"train_loss": 0.0021405357401818037, "global_step": 40211, "epoch": 337, "lr": 4.061352472482587e-05} +{"train_loss": 0.002798337023705244, "global_step": 40212, "epoch": 337, "lr": 4.061134861447706e-05} +{"train_loss": 0.0014936852967366576, "global_step": 40213, "epoch": 337, "lr": 4.060917252256185e-05} +{"train_loss": 0.0016412172699347138, "global_step": 40214, "epoch": 337, "lr": 4.0606996449084544e-05} +{"train_loss": 0.002065870678052306, "global_step": 40215, "epoch": 337, "lr": 4.060482039404938e-05} +{"train_loss": 0.0016212615882977843, "global_step": 40216, "epoch": 337, "lr": 4.0602644357460653e-05} +{"train_loss": 0.0023576708044856787, "global_step": 40217, "epoch": 337, "lr": 4.060046833932264e-05} +{"train_loss": 0.0014910477912053466, "global_step": 40218, "epoch": 337, "lr": 4.059829233963959e-05} +{"train_loss": 0.0017510709585621953, "global_step": 40219, "epoch": 337, "lr": 4.0596116358415804e-05} +{"train_loss": 0.0013572291936725378, "global_step": 40220, "epoch": 337, "lr": 4.0593940395655514e-05} +{"train_loss": 0.0017652225469340797, "global_step": 40221, "epoch": 337, "lr": 4.059176445136305e-05, "val_loss": 0.01138082891702652} +{"train_loss": 0.0017496959771960974, "global_step": 40222, "epoch": 338, "lr": 4.058958852554262e-05} +{"train_loss": 0.0015844301087781787, "global_step": 40223, "epoch": 338, "lr": 4.058741261819855e-05} +{"train_loss": 0.001338964095339179, "global_step": 40224, "epoch": 338, "lr": 4.0585236729335094e-05} +{"train_loss": 0.003000750672072172, "global_step": 40225, "epoch": 338, "lr": 4.058306085895649e-05} +{"train_loss": 0.002211853628978133, "global_step": 40226, "epoch": 338, "lr": 4.058088500706707e-05} +{"train_loss": 0.001750520197674632, "global_step": 40227, "epoch": 338, "lr": 4.057870917367105e-05} +{"train_loss": 0.0018690620781853795, "global_step": 40228, "epoch": 338, "lr": 4.057653335877275e-05} +{"train_loss": 0.001962321810424328, "global_step": 40229, "epoch": 338, "lr": 4.057435756237641e-05} +{"train_loss": 0.0011583165032789111, "global_step": 40230, "epoch": 338, "lr": 4.057218178448631e-05} +{"train_loss": 0.0021126316860318184, "global_step": 40231, "epoch": 338, "lr": 4.057000602510673e-05} +{"train_loss": 0.0009789838222786784, "global_step": 40232, "epoch": 338, "lr": 4.056783028424193e-05} +{"train_loss": 0.002201472409069538, "global_step": 40233, "epoch": 338, "lr": 4.056565456189619e-05} +{"train_loss": 0.0023160153068602085, "global_step": 40234, "epoch": 338, "lr": 4.0563478858073776e-05} +{"train_loss": 0.001891119871288538, "global_step": 40235, "epoch": 338, "lr": 4.056130317277897e-05} +{"train_loss": 0.0016775743570178747, "global_step": 40236, "epoch": 338, "lr": 4.055912750601604e-05} +{"train_loss": 0.0014063917333260179, "global_step": 40237, "epoch": 338, "lr": 4.055695185778924e-05} +{"train_loss": 0.002229839563369751, "global_step": 40238, "epoch": 338, "lr": 4.055477622810288e-05} +{"train_loss": 0.0021980861201882362, "global_step": 40239, "epoch": 338, "lr": 4.0552600616961176e-05} +{"train_loss": 0.0016342458548024297, "global_step": 40240, "epoch": 338, "lr": 4.055042502436845e-05} +{"train_loss": 0.0027730045840144157, "global_step": 40241, "epoch": 338, "lr": 4.054824945032897e-05} +{"train_loss": 0.0016539808129891753, "global_step": 40242, "epoch": 338, "lr": 4.054607389484696e-05} +{"train_loss": 0.0019017448648810387, "global_step": 40243, "epoch": 338, "lr": 4.0543898357926746e-05} +{"train_loss": 0.0027827927842736244, "global_step": 40244, "epoch": 338, "lr": 4.054172283957256e-05} +{"train_loss": 0.0015016949037089944, "global_step": 40245, "epoch": 338, "lr": 4.0539547339788706e-05} +{"train_loss": 0.002196453046053648, "global_step": 40246, "epoch": 338, "lr": 4.0537371858579426e-05} +{"train_loss": 0.0009082879987545311, "global_step": 40247, "epoch": 338, "lr": 4.053519639594903e-05} +{"train_loss": 0.0015890515642240644, "global_step": 40248, "epoch": 338, "lr": 4.0533020951901746e-05} +{"train_loss": 0.0027398548554629087, "global_step": 40249, "epoch": 338, "lr": 4.0530845526441864e-05} +{"train_loss": 0.001771636656485498, "global_step": 40250, "epoch": 338, "lr": 4.052867011957366e-05} +{"train_loss": 0.0021395396906882524, "global_step": 40251, "epoch": 338, "lr": 4.052649473130138e-05} +{"train_loss": 0.0012139281025156379, "global_step": 40252, "epoch": 338, "lr": 4.0524319361629346e-05} +{"train_loss": 0.001457338104955852, "global_step": 40253, "epoch": 338, "lr": 4.052214401056178e-05} +{"train_loss": 0.0023317912127822638, "global_step": 40254, "epoch": 338, "lr": 4.051996867810299e-05} +{"train_loss": 0.0010383902117609978, "global_step": 40255, "epoch": 338, "lr": 4.051779336425722e-05} +{"train_loss": 0.0016556932823732495, "global_step": 40256, "epoch": 338, "lr": 4.051561806902874e-05} +{"train_loss": 0.0012572467094287276, "global_step": 40257, "epoch": 338, "lr": 4.0513442792421845e-05} +{"train_loss": 0.001562112825922668, "global_step": 40258, "epoch": 338, "lr": 4.0511267534440774e-05} +{"train_loss": 0.0012310533784329891, "global_step": 40259, "epoch": 338, "lr": 4.050909229508983e-05} +{"train_loss": 0.0022535601165145636, "global_step": 40260, "epoch": 338, "lr": 4.050691707437328e-05} +{"train_loss": 0.002546572359278798, "global_step": 40261, "epoch": 338, "lr": 4.050474187229536e-05} +{"train_loss": 0.001792479888536036, "global_step": 40262, "epoch": 338, "lr": 4.0502566688860374e-05} +{"train_loss": 0.001061463262885809, "global_step": 40263, "epoch": 338, "lr": 4.050039152407258e-05} +{"train_loss": 0.0024663961958140135, "global_step": 40264, "epoch": 338, "lr": 4.049821637793625e-05} +{"train_loss": 0.0017564172158017755, "global_step": 40265, "epoch": 338, "lr": 4.049604125045566e-05} +{"train_loss": 0.0025710095651447773, "global_step": 40266, "epoch": 338, "lr": 4.0493866141635085e-05} +{"train_loss": 0.0013465554220601916, "global_step": 40267, "epoch": 338, "lr": 4.049169105147879e-05} +{"train_loss": 0.001342429663054645, "global_step": 40268, "epoch": 338, "lr": 4.0489515979991025e-05} +{"train_loss": 0.0014715234283357859, "global_step": 40269, "epoch": 338, "lr": 4.0487340927176105e-05} +{"train_loss": 0.002186134224757552, "global_step": 40270, "epoch": 338, "lr": 4.048516589303825e-05} +{"train_loss": 0.0031041924376040697, "global_step": 40271, "epoch": 338, "lr": 4.048299087758178e-05} +{"train_loss": 0.0011952616041526198, "global_step": 40272, "epoch": 338, "lr": 4.0480815880810915e-05} +{"train_loss": 0.0006817097892053425, "global_step": 40273, "epoch": 338, "lr": 4.047864090272997e-05} +{"train_loss": 0.002551102079451084, "global_step": 40274, "epoch": 338, "lr": 4.04764659433432e-05} +{"train_loss": 0.0012619018089026213, "global_step": 40275, "epoch": 338, "lr": 4.0474291002654854e-05} +{"train_loss": 0.0023714301642030478, "global_step": 40276, "epoch": 338, "lr": 4.047211608066923e-05} +{"train_loss": 0.002200942486524582, "global_step": 40277, "epoch": 338, "lr": 4.046994117739058e-05} +{"train_loss": 0.0011016393546015024, "global_step": 40278, "epoch": 338, "lr": 4.046776629282319e-05} +{"train_loss": 0.0021920939907431602, "global_step": 40279, "epoch": 338, "lr": 4.046559142697133e-05} +{"train_loss": 0.0018673191079869866, "global_step": 40280, "epoch": 338, "lr": 4.046341657983925e-05} +{"train_loss": 0.001237831311300397, "global_step": 40281, "epoch": 338, "lr": 4.0461241751431236e-05} +{"train_loss": 0.0026458720676600933, "global_step": 40282, "epoch": 338, "lr": 4.0459066941751547e-05} +{"train_loss": 0.0016914934385567904, "global_step": 40283, "epoch": 338, "lr": 4.045689215080447e-05} +{"train_loss": 0.001577926566824317, "global_step": 40284, "epoch": 338, "lr": 4.045471737859426e-05} +{"train_loss": 0.0015084632905200124, "global_step": 40285, "epoch": 338, "lr": 4.0452542625125203e-05} +{"train_loss": 0.002378396689891815, "global_step": 40286, "epoch": 338, "lr": 4.045036789040156e-05} +{"train_loss": 0.0012456501135602593, "global_step": 40287, "epoch": 338, "lr": 4.044819317442758e-05} +{"train_loss": 0.001904341857880354, "global_step": 40288, "epoch": 338, "lr": 4.0446018477207576e-05} +{"train_loss": 0.0010329707292839885, "global_step": 40289, "epoch": 338, "lr": 4.044384379874577e-05} +{"train_loss": 0.0024952623061835766, "global_step": 40290, "epoch": 338, "lr": 4.044166913904648e-05} +{"train_loss": 0.0014569323975592852, "global_step": 40291, "epoch": 338, "lr": 4.043949449811395e-05} +{"train_loss": 0.0018958394648507237, "global_step": 40292, "epoch": 338, "lr": 4.0437319875952426e-05} +{"train_loss": 0.0019464049255475402, "global_step": 40293, "epoch": 338, "lr": 4.043514527256623e-05} +{"train_loss": 0.0009750202880240977, "global_step": 40294, "epoch": 338, "lr": 4.043297068795958e-05} +{"train_loss": 0.001985123148187995, "global_step": 40295, "epoch": 338, "lr": 4.0430796122136786e-05} +{"train_loss": 0.0024954527616500854, "global_step": 40296, "epoch": 338, "lr": 4.0428621575102085e-05} +{"train_loss": 0.0013389915693551302, "global_step": 40297, "epoch": 338, "lr": 4.042644704685979e-05} +{"train_loss": 0.0015008043264970183, "global_step": 40298, "epoch": 338, "lr": 4.042427253741412e-05} +{"train_loss": 0.0016676170052960515, "global_step": 40299, "epoch": 338, "lr": 4.042209804676937e-05} +{"train_loss": 0.0018280852818861604, "global_step": 40300, "epoch": 338, "lr": 4.0419923574929825e-05} +{"train_loss": 0.0014576342655345798, "global_step": 40301, "epoch": 338, "lr": 4.0417749121899715e-05} +{"train_loss": 0.0029449767898768187, "global_step": 40302, "epoch": 338, "lr": 4.041557468768335e-05} +{"train_loss": 0.0013862453633919358, "global_step": 40303, "epoch": 338, "lr": 4.041340027228496e-05} +{"train_loss": 0.001443061395548284, "global_step": 40304, "epoch": 338, "lr": 4.041122587570886e-05} +{"train_loss": 0.0014651676174253225, "global_step": 40305, "epoch": 338, "lr": 4.0409051497959284e-05} +{"train_loss": 0.0023710387758910656, "global_step": 40306, "epoch": 338, "lr": 4.04068771390405e-05} +{"train_loss": 0.0018623443320393562, "global_step": 40307, "epoch": 338, "lr": 4.04047027989568e-05} +{"train_loss": 0.001924837357364595, "global_step": 40308, "epoch": 338, "lr": 4.040252847771242e-05} +{"train_loss": 0.002113542053848505, "global_step": 40309, "epoch": 338, "lr": 4.040035417531168e-05} +{"train_loss": 0.0015580205945298076, "global_step": 40310, "epoch": 338, "lr": 4.039817989175881e-05} +{"train_loss": 0.0016471112612634897, "global_step": 40311, "epoch": 338, "lr": 4.0396005627058075e-05} +{"train_loss": 0.0016783317551016808, "global_step": 40312, "epoch": 338, "lr": 4.039383138121376e-05} +{"train_loss": 0.0018887680489569902, "global_step": 40313, "epoch": 338, "lr": 4.0391657154230135e-05} +{"train_loss": 0.001329434453509748, "global_step": 40314, "epoch": 338, "lr": 4.038948294611146e-05} +{"train_loss": 0.0018076871056109667, "global_step": 40315, "epoch": 338, "lr": 4.0387308756862015e-05} +{"train_loss": 0.002017483813688159, "global_step": 40316, "epoch": 338, "lr": 4.038513458648606e-05} +{"train_loss": 0.0020635738037526608, "global_step": 40317, "epoch": 338, "lr": 4.0382960434987875e-05} +{"train_loss": 0.001080006710253656, "global_step": 40318, "epoch": 338, "lr": 4.03807863023717e-05} +{"train_loss": 0.0012327745789662004, "global_step": 40319, "epoch": 338, "lr": 4.0378612188641847e-05} +{"train_loss": 0.0026564402505755424, "global_step": 40320, "epoch": 338, "lr": 4.0376438093802535e-05} +{"train_loss": 0.0030254393350332975, "global_step": 40321, "epoch": 338, "lr": 4.037426401785808e-05} +{"train_loss": 0.0019139833748340607, "global_step": 40322, "epoch": 338, "lr": 4.037208996081271e-05} +{"train_loss": 0.0021472794469445944, "global_step": 40323, "epoch": 338, "lr": 4.036991592267073e-05} +{"train_loss": 0.0012529920786619186, "global_step": 40324, "epoch": 338, "lr": 4.03677419034364e-05} +{"train_loss": 0.0024239751510322094, "global_step": 40325, "epoch": 338, "lr": 4.036556790311396e-05} +{"train_loss": 0.001598112634383142, "global_step": 40326, "epoch": 338, "lr": 4.0363393921707705e-05} +{"train_loss": 0.0013387983199208975, "global_step": 40327, "epoch": 338, "lr": 4.0361219959221886e-05} +{"train_loss": 0.0014727808302268386, "global_step": 40328, "epoch": 338, "lr": 4.03590460156608e-05} +{"train_loss": 0.0014391072327271104, "global_step": 40329, "epoch": 338, "lr": 4.035687209102868e-05} +{"train_loss": 0.0007942093070596457, "global_step": 40330, "epoch": 338, "lr": 4.035469818532982e-05} +{"train_loss": 0.0014085754519328475, "global_step": 40331, "epoch": 338, "lr": 4.0352524298568485e-05} +{"train_loss": 0.0016042266506701708, "global_step": 40332, "epoch": 338, "lr": 4.035035043074893e-05} +{"train_loss": 0.0021004413720220327, "global_step": 40333, "epoch": 338, "lr": 4.034817658187543e-05} +{"train_loss": 0.0020347335375845432, "global_step": 40334, "epoch": 338, "lr": 4.034600275195225e-05} +{"train_loss": 0.0020239748992025852, "global_step": 40335, "epoch": 338, "lr": 4.0343828940983675e-05} +{"train_loss": 0.0011885010171681643, "global_step": 40336, "epoch": 338, "lr": 4.034165514897397e-05} +{"train_loss": 0.0015287495916709304, "global_step": 40337, "epoch": 338, "lr": 4.0339481375927354e-05} +{"train_loss": 0.001634749467484653, "global_step": 40338, "epoch": 338, "lr": 4.033730762184818e-05} +{"train_loss": 0.002685792278498411, "global_step": 40339, "epoch": 338, "lr": 4.033513388674063e-05} +{"train_loss": 0.0017994481942052913, "global_step": 40340, "epoch": 338, "lr": 4.033296017060904e-05, "val_loss": 0.02036312036216259} +{"train_loss": 0.0009531616815365851, "global_step": 40341, "epoch": 339, "lr": 4.033078647345763e-05} +{"train_loss": 0.003059969749301672, "global_step": 40342, "epoch": 339, "lr": 4.0328612795290705e-05} +{"train_loss": 0.0017194182146340609, "global_step": 40343, "epoch": 339, "lr": 4.0326439136112524e-05} +{"train_loss": 0.002888086484745145, "global_step": 40344, "epoch": 339, "lr": 4.0324265495927315e-05} +{"train_loss": 0.0026240695733577013, "global_step": 40345, "epoch": 339, "lr": 4.03220918747394e-05} +{"train_loss": 0.0017551607452332973, "global_step": 40346, "epoch": 339, "lr": 4.0319918272553006e-05} +{"train_loss": 0.00247814878821373, "global_step": 40347, "epoch": 339, "lr": 4.031774468937244e-05} +{"train_loss": 0.0011482380796223879, "global_step": 40348, "epoch": 339, "lr": 4.031557112520194e-05} +{"train_loss": 0.0016381634632125497, "global_step": 40349, "epoch": 339, "lr": 4.031339758004576e-05} +{"train_loss": 0.0017406584229320288, "global_step": 40350, "epoch": 339, "lr": 4.031122405390822e-05} +{"train_loss": 0.0007761701126582921, "global_step": 40351, "epoch": 339, "lr": 4.0309050546793533e-05} +{"train_loss": 0.0024242193903774023, "global_step": 40352, "epoch": 339, "lr": 4.0306877058706006e-05} +{"train_loss": 0.0016577766509726644, "global_step": 40353, "epoch": 339, "lr": 4.030470358964987e-05} +{"train_loss": 0.002212708815932274, "global_step": 40354, "epoch": 339, "lr": 4.030253013962944e-05} +{"train_loss": 0.002810476813465357, "global_step": 40355, "epoch": 339, "lr": 4.030035670864896e-05} +{"train_loss": 0.001476023462601006, "global_step": 40356, "epoch": 339, "lr": 4.029818329671266e-05} +{"train_loss": 0.0015934943221509457, "global_step": 40357, "epoch": 339, "lr": 4.029600990382487e-05} +{"train_loss": 0.001813743612729013, "global_step": 40358, "epoch": 339, "lr": 4.0293836529989805e-05} +{"train_loss": 0.002669947687536478, "global_step": 40359, "epoch": 339, "lr": 4.029166317521177e-05} +{"train_loss": 0.0016784729668870568, "global_step": 40360, "epoch": 339, "lr": 4.028948983949503e-05} +{"train_loss": 0.0025218171067535877, "global_step": 40361, "epoch": 339, "lr": 4.0287316522843806e-05} +{"train_loss": 0.0014011702733114362, "global_step": 40362, "epoch": 339, "lr": 4.028514322526241e-05} +{"train_loss": 0.0017711353721097112, "global_step": 40363, "epoch": 339, "lr": 4.02829699467551e-05} +{"train_loss": 0.001491898437961936, "global_step": 40364, "epoch": 339, "lr": 4.0280796687326143e-05} +{"train_loss": 0.0013095749309286475, "global_step": 40365, "epoch": 339, "lr": 4.02786234469798e-05} +{"train_loss": 0.0027046927716583014, "global_step": 40366, "epoch": 339, "lr": 4.0276450225720345e-05} +{"train_loss": 0.0016971550649031997, "global_step": 40367, "epoch": 339, "lr": 4.027427702355205e-05} +{"train_loss": 0.0016492382856085896, "global_step": 40368, "epoch": 339, "lr": 4.027210384047915e-05} +{"train_loss": 0.0019231535261496902, "global_step": 40369, "epoch": 339, "lr": 4.026993067650596e-05} +{"train_loss": 0.0023590761702507734, "global_step": 40370, "epoch": 339, "lr": 4.0267757531636695e-05} +{"train_loss": 0.0016315692337229848, "global_step": 40371, "epoch": 339, "lr": 4.026558440587567e-05} +{"train_loss": 0.001770451432093978, "global_step": 40372, "epoch": 339, "lr": 4.0263411299227116e-05} +{"train_loss": 0.003207689616829157, "global_step": 40373, "epoch": 339, "lr": 4.026123821169533e-05} +{"train_loss": 0.0011302795028313994, "global_step": 40374, "epoch": 339, "lr": 4.025906514328456e-05} +{"train_loss": 0.001693954225629568, "global_step": 40375, "epoch": 339, "lr": 4.025689209399906e-05} +{"train_loss": 0.0021142102777957916, "global_step": 40376, "epoch": 339, "lr": 4.025471906384313e-05} +{"train_loss": 0.001754874479956925, "global_step": 40377, "epoch": 339, "lr": 4.0252546052820995e-05} +{"train_loss": 0.002000828506425023, "global_step": 40378, "epoch": 339, "lr": 4.025037306093696e-05} +{"train_loss": 0.0022624717094004154, "global_step": 40379, "epoch": 339, "lr": 4.024820008819528e-05} +{"train_loss": 0.00200076075270772, "global_step": 40380, "epoch": 339, "lr": 4.0246027134600204e-05} +{"train_loss": 0.002303004963323474, "global_step": 40381, "epoch": 339, "lr": 4.024385420015602e-05} +{"train_loss": 0.0014941354747861624, "global_step": 40382, "epoch": 339, "lr": 4.024168128486698e-05} +{"train_loss": 0.0017603172454982996, "global_step": 40383, "epoch": 339, "lr": 4.023950838873736e-05} +{"train_loss": 0.0012053267564624548, "global_step": 40384, "epoch": 339, "lr": 4.023733551177141e-05} +{"train_loss": 0.0016735023818910122, "global_step": 40385, "epoch": 339, "lr": 4.023516265397343e-05} +{"train_loss": 0.0026949618477374315, "global_step": 40386, "epoch": 339, "lr": 4.023298981534766e-05} +{"train_loss": 0.002461520489305258, "global_step": 40387, "epoch": 339, "lr": 4.0230816995898356e-05} +{"train_loss": 0.0007587046129629016, "global_step": 40388, "epoch": 339, "lr": 4.0228644195629825e-05} +{"train_loss": 0.0016496677417308092, "global_step": 40389, "epoch": 339, "lr": 4.022647141454628e-05} +{"train_loss": 0.0015045510372146964, "global_step": 40390, "epoch": 339, "lr": 4.022429865265204e-05} +{"train_loss": 0.0012103170156478882, "global_step": 40391, "epoch": 339, "lr": 4.022212590995131e-05} +{"train_loss": 0.0015223755035549402, "global_step": 40392, "epoch": 339, "lr": 4.021995318644843e-05} +{"train_loss": 0.00118867470882833, "global_step": 40393, "epoch": 339, "lr": 4.021778048214762e-05} +{"train_loss": 0.0019999812357127666, "global_step": 40394, "epoch": 339, "lr": 4.0215607797053125e-05} +{"train_loss": 0.0018319736700505018, "global_step": 40395, "epoch": 339, "lr": 4.021343513116927e-05} +{"train_loss": 0.0014061563415452838, "global_step": 40396, "epoch": 339, "lr": 4.0211262484500266e-05} +{"train_loss": 0.0011971411295235157, "global_step": 40397, "epoch": 339, "lr": 4.020908985705041e-05} +{"train_loss": 0.0008453893242403865, "global_step": 40398, "epoch": 339, "lr": 4.0206917248823974e-05} +{"train_loss": 0.0014592338120564818, "global_step": 40399, "epoch": 339, "lr": 4.0204744659825186e-05} +{"train_loss": 0.0030318659264594316, "global_step": 40400, "epoch": 339, "lr": 4.020257209005836e-05} +{"train_loss": 0.0018063901225104928, "global_step": 40401, "epoch": 339, "lr": 4.020039953952771e-05} +{"train_loss": 0.0013045278610661626, "global_step": 40402, "epoch": 339, "lr": 4.0198227008237556e-05} +{"train_loss": 0.0010362433968111873, "global_step": 40403, "epoch": 339, "lr": 4.019605449619211e-05} +{"train_loss": 0.001088800490833819, "global_step": 40404, "epoch": 339, "lr": 4.0193882003395686e-05} +{"train_loss": 0.001722425571642816, "global_step": 40405, "epoch": 339, "lr": 4.019170952985253e-05} +{"train_loss": 0.00224090158008039, "global_step": 40406, "epoch": 339, "lr": 4.018953707556688e-05} +{"train_loss": 0.0017492002807557583, "global_step": 40407, "epoch": 339, "lr": 4.018736464054305e-05} +{"train_loss": 0.003014178713783622, "global_step": 40408, "epoch": 339, "lr": 4.018519222478526e-05} +{"train_loss": 0.0015700970543548465, "global_step": 40409, "epoch": 339, "lr": 4.0183019828297815e-05} +{"train_loss": 0.001500012120231986, "global_step": 40410, "epoch": 339, "lr": 4.018084745108494e-05} +{"train_loss": 0.0023656280245631933, "global_step": 40411, "epoch": 339, "lr": 4.0178675093150944e-05} +{"train_loss": 0.005596044007688761, "global_step": 40412, "epoch": 339, "lr": 4.017650275450006e-05} +{"train_loss": 0.0037667183205485344, "global_step": 40413, "epoch": 339, "lr": 4.017433043513657e-05} +{"train_loss": 0.0030709209386259317, "global_step": 40414, "epoch": 339, "lr": 4.0172158135064716e-05} +{"train_loss": 0.002778152236714959, "global_step": 40415, "epoch": 339, "lr": 4.0169985854288796e-05} +{"train_loss": 0.003267834894359112, "global_step": 40416, "epoch": 339, "lr": 4.016781359281305e-05} +{"train_loss": 0.0027324287220835686, "global_step": 40417, "epoch": 339, "lr": 4.016564135064176e-05} +{"train_loss": 0.0028190123848617077, "global_step": 40418, "epoch": 339, "lr": 4.0163469127779167e-05} +{"train_loss": 0.002391763497143984, "global_step": 40419, "epoch": 339, "lr": 4.016129692422957e-05} +{"train_loss": 0.0018224299419671297, "global_step": 40420, "epoch": 339, "lr": 4.01591247399972e-05} +{"train_loss": 0.0031347463373094797, "global_step": 40421, "epoch": 339, "lr": 4.0156952575086356e-05} +{"train_loss": 0.001832620007917285, "global_step": 40422, "epoch": 339, "lr": 4.015478042950126e-05} +{"train_loss": 0.001573010697029531, "global_step": 40423, "epoch": 339, "lr": 4.015260830324622e-05} +{"train_loss": 0.003399788634851575, "global_step": 40424, "epoch": 339, "lr": 4.0150436196325486e-05} +{"train_loss": 0.0021551272366195917, "global_step": 40425, "epoch": 339, "lr": 4.0148264108743294e-05} +{"train_loss": 0.0019410228123888373, "global_step": 40426, "epoch": 339, "lr": 4.014609204050396e-05} +{"train_loss": 0.002608642214909196, "global_step": 40427, "epoch": 339, "lr": 4.014391999161169e-05} +{"train_loss": 0.002802689326927066, "global_step": 40428, "epoch": 339, "lr": 4.014174796207081e-05} +{"train_loss": 0.0025190263986587524, "global_step": 40429, "epoch": 339, "lr": 4.0139575951885546e-05} +{"train_loss": 0.004311836790293455, "global_step": 40430, "epoch": 339, "lr": 4.013740396106016e-05} +{"train_loss": 0.0018257496412843466, "global_step": 40431, "epoch": 339, "lr": 4.013523198959894e-05} +{"train_loss": 0.002766102086752653, "global_step": 40432, "epoch": 339, "lr": 4.013306003750612e-05} +{"train_loss": 0.0023112152703106403, "global_step": 40433, "epoch": 339, "lr": 4.0130888104786005e-05} +{"train_loss": 0.002295711077749729, "global_step": 40434, "epoch": 339, "lr": 4.0128716191442814e-05} +{"train_loss": 0.0018716794438660145, "global_step": 40435, "epoch": 339, "lr": 4.012654429748086e-05} +{"train_loss": 0.0008946025627665222, "global_step": 40436, "epoch": 339, "lr": 4.0124372422904375e-05} +{"train_loss": 0.0016064905794337392, "global_step": 40437, "epoch": 339, "lr": 4.012220056771762e-05} +{"train_loss": 0.001895855413749814, "global_step": 40438, "epoch": 339, "lr": 4.012002873192488e-05} +{"train_loss": 0.0023756397422403097, "global_step": 40439, "epoch": 339, "lr": 4.011785691553039e-05} +{"train_loss": 0.0011158243287354708, "global_step": 40440, "epoch": 339, "lr": 4.011568511853845e-05} +{"train_loss": 0.0019934673327952623, "global_step": 40441, "epoch": 339, "lr": 4.011351334095329e-05} +{"train_loss": 0.0013777712592855096, "global_step": 40442, "epoch": 339, "lr": 4.01113415827792e-05} +{"train_loss": 0.002942353021353483, "global_step": 40443, "epoch": 339, "lr": 4.010916984402046e-05} +{"train_loss": 0.0029284609481692314, "global_step": 40444, "epoch": 339, "lr": 4.010699812468126e-05} +{"train_loss": 0.0015873172087594867, "global_step": 40445, "epoch": 339, "lr": 4.0104826424765936e-05} +{"train_loss": 0.002581895561888814, "global_step": 40446, "epoch": 339, "lr": 4.010265474427873e-05} +{"train_loss": 0.002266930416226387, "global_step": 40447, "epoch": 339, "lr": 4.0100483083223894e-05} +{"train_loss": 0.0021652213763445616, "global_step": 40448, "epoch": 339, "lr": 4.009831144160572e-05} +{"train_loss": 0.0034138367045670748, "global_step": 40449, "epoch": 339, "lr": 4.009613981942843e-05} +{"train_loss": 0.0034148157574236393, "global_step": 40450, "epoch": 339, "lr": 4.0093968216696336e-05} +{"train_loss": 0.002356684533879161, "global_step": 40451, "epoch": 339, "lr": 4.0091796633413654e-05} +{"train_loss": 0.002808657241985202, "global_step": 40452, "epoch": 339, "lr": 4.008962506958469e-05} +{"train_loss": 0.00249865441583097, "global_step": 40453, "epoch": 339, "lr": 4.008745352521367e-05} +{"train_loss": 0.0024658602196723223, "global_step": 40454, "epoch": 339, "lr": 4.008528200030489e-05} +{"train_loss": 0.0015480377478525043, "global_step": 40455, "epoch": 339, "lr": 4.008311049486261e-05} +{"train_loss": 0.0017971780616790056, "global_step": 40456, "epoch": 339, "lr": 4.008093900889106e-05} +{"train_loss": 0.0021299999207258224, "global_step": 40457, "epoch": 339, "lr": 4.007876754239454e-05} +{"train_loss": 0.0037504720967262983, "global_step": 40458, "epoch": 339, "lr": 4.007659609537728e-05} +{"train_loss": 0.0020957430271909203, "global_step": 40459, "epoch": 339, "lr": 4.007442466784359e-05, "val_loss": 0.029865765944123268} +{"train_loss": 0.0014615370891988277, "global_step": 40460, "epoch": 340, "lr": 4.007225325979769e-05} +{"train_loss": 0.0010262388968840241, "global_step": 40461, "epoch": 340, "lr": 4.0070081871243875e-05} +{"train_loss": 0.003178456099703908, "global_step": 40462, "epoch": 340, "lr": 4.006791050218638e-05} +{"train_loss": 0.0018071001395583153, "global_step": 40463, "epoch": 340, "lr": 4.006573915262949e-05} +{"train_loss": 0.002189348917454481, "global_step": 40464, "epoch": 340, "lr": 4.006356782257745e-05} +{"train_loss": 0.0025466452352702618, "global_step": 40465, "epoch": 340, "lr": 4.006139651203454e-05} +{"train_loss": 0.0009713403414934874, "global_step": 40466, "epoch": 340, "lr": 4.005922522100502e-05} +{"train_loss": 0.0008738656179048121, "global_step": 40467, "epoch": 340, "lr": 4.005705394949315e-05} +{"train_loss": 0.0032142524141818285, "global_step": 40468, "epoch": 340, "lr": 4.005488269750317e-05} +{"train_loss": 0.0022818208672106266, "global_step": 40469, "epoch": 340, "lr": 4.005271146503939e-05} +{"train_loss": 0.0016704904846847057, "global_step": 40470, "epoch": 340, "lr": 4.005054025210603e-05} +{"train_loss": 0.0025953815784305334, "global_step": 40471, "epoch": 340, "lr": 4.004836905870739e-05} +{"train_loss": 0.002283476060256362, "global_step": 40472, "epoch": 340, "lr": 4.004619788484769e-05} +{"train_loss": 0.0021748209837824106, "global_step": 40473, "epoch": 340, "lr": 4.0044026730531246e-05} +{"train_loss": 0.0014390432043001056, "global_step": 40474, "epoch": 340, "lr": 4.004185559576229e-05} +{"train_loss": 0.001278270734474063, "global_step": 40475, "epoch": 340, "lr": 4.003968448054506e-05} +{"train_loss": 0.003093993989750743, "global_step": 40476, "epoch": 340, "lr": 4.0037513384883877e-05} +{"train_loss": 0.002617430640384555, "global_step": 40477, "epoch": 340, "lr": 4.003534230878294e-05} +{"train_loss": 0.0013937641633674502, "global_step": 40478, "epoch": 340, "lr": 4.003317125224657e-05} +{"train_loss": 0.001099568558856845, "global_step": 40479, "epoch": 340, "lr": 4.003100021527899e-05} +{"train_loss": 0.0018207322573289275, "global_step": 40480, "epoch": 340, "lr": 4.0028829197884465e-05} +{"train_loss": 0.0017656655982136726, "global_step": 40481, "epoch": 340, "lr": 4.00266582000673e-05} +{"train_loss": 0.0022686764132231474, "global_step": 40482, "epoch": 340, "lr": 4.002448722183169e-05} +{"train_loss": 0.002969230990856886, "global_step": 40483, "epoch": 340, "lr": 4.002231626318196e-05} +{"train_loss": 0.002165525918826461, "global_step": 40484, "epoch": 340, "lr": 4.0020145324122324e-05} +{"train_loss": 0.0037385253235697746, "global_step": 40485, "epoch": 340, "lr": 4.00179744046571e-05} +{"train_loss": 0.0024782500695437193, "global_step": 40486, "epoch": 340, "lr": 4.0015803504790503e-05} +{"train_loss": 0.0014198130229488015, "global_step": 40487, "epoch": 340, "lr": 4.001363262452679e-05} +{"train_loss": 0.002537363674491644, "global_step": 40488, "epoch": 340, "lr": 4.0011461763870265e-05} +{"train_loss": 0.0025918257888406515, "global_step": 40489, "epoch": 340, "lr": 4.0009290922825146e-05} +{"train_loss": 0.0014027287252247334, "global_step": 40490, "epoch": 340, "lr": 4.0007120101395746e-05} +{"train_loss": 0.0011427138233557343, "global_step": 40491, "epoch": 340, "lr": 4.000494929958627e-05} +{"train_loss": 0.0014761917991563678, "global_step": 40492, "epoch": 340, "lr": 4.000277851740103e-05} +{"train_loss": 0.0038626466412097216, "global_step": 40493, "epoch": 340, "lr": 4.0000607754844263e-05} +{"train_loss": 0.001243807259015739, "global_step": 40494, "epoch": 340, "lr": 3.999843701192022e-05} +{"train_loss": 0.002399392891675234, "global_step": 40495, "epoch": 340, "lr": 3.999626628863318e-05} +{"train_loss": 0.0019917075987905264, "global_step": 40496, "epoch": 340, "lr": 3.999409558498741e-05} +{"train_loss": 0.0012382094282656908, "global_step": 40497, "epoch": 340, "lr": 3.999192490098716e-05} +{"train_loss": 0.0019482169300317764, "global_step": 40498, "epoch": 340, "lr": 3.998975423663671e-05} +{"train_loss": 0.0011198510183021426, "global_step": 40499, "epoch": 340, "lr": 3.998758359194028e-05} +{"train_loss": 0.0016172433970496058, "global_step": 40500, "epoch": 340, "lr": 3.998541296690219e-05} +{"train_loss": 0.0021317971404641867, "global_step": 40501, "epoch": 340, "lr": 3.998324236152665e-05} +{"train_loss": 0.0013108678394928575, "global_step": 40502, "epoch": 340, "lr": 3.998107177581796e-05} +{"train_loss": 0.002954561496153474, "global_step": 40503, "epoch": 340, "lr": 3.997890120978034e-05} +{"train_loss": 0.002073791343718767, "global_step": 40504, "epoch": 340, "lr": 3.997673066341811e-05} +{"train_loss": 0.002362742554396391, "global_step": 40505, "epoch": 340, "lr": 3.9974560136735484e-05} +{"train_loss": 0.0017938176169991493, "global_step": 40506, "epoch": 340, "lr": 3.997238962973673e-05} +{"train_loss": 0.002131788060069084, "global_step": 40507, "epoch": 340, "lr": 3.997021914242613e-05} +{"train_loss": 0.0017741640331223607, "global_step": 40508, "epoch": 340, "lr": 3.996804867480792e-05} +{"train_loss": 0.0026313969865441322, "global_step": 40509, "epoch": 340, "lr": 3.996587822688639e-05} +{"train_loss": 0.0008366931579075754, "global_step": 40510, "epoch": 340, "lr": 3.9963707798665764e-05} +{"train_loss": 0.0013843796914443374, "global_step": 40511, "epoch": 340, "lr": 3.996153739015035e-05} +{"train_loss": 0.0015948606887832284, "global_step": 40512, "epoch": 340, "lr": 3.9959367001344375e-05} +{"train_loss": 0.00236296933144331, "global_step": 40513, "epoch": 340, "lr": 3.995719663225211e-05} +{"train_loss": 0.0019895979203283787, "global_step": 40514, "epoch": 340, "lr": 3.995502628287781e-05} +{"train_loss": 0.0022897114977240562, "global_step": 40515, "epoch": 340, "lr": 3.995285595322574e-05} +{"train_loss": 0.0016730476636439562, "global_step": 40516, "epoch": 340, "lr": 3.995068564330018e-05} +{"train_loss": 0.002824329538270831, "global_step": 40517, "epoch": 340, "lr": 3.9948515353105376e-05} +{"train_loss": 0.0016395116690546274, "global_step": 40518, "epoch": 340, "lr": 3.994634508264557e-05} +{"train_loss": 0.0027599709574133158, "global_step": 40519, "epoch": 340, "lr": 3.994417483192506e-05} +{"train_loss": 0.0030604032799601555, "global_step": 40520, "epoch": 340, "lr": 3.9942004600948066e-05} +{"train_loss": 0.0018514867406338453, "global_step": 40521, "epoch": 340, "lr": 3.9939834389718896e-05} +{"train_loss": 0.0027451245114207268, "global_step": 40522, "epoch": 340, "lr": 3.993766419824177e-05} +{"train_loss": 0.0018688435666263103, "global_step": 40523, "epoch": 340, "lr": 3.993549402652098e-05} +{"train_loss": 0.0006854750099591911, "global_step": 40524, "epoch": 340, "lr": 3.993332387456077e-05} +{"train_loss": 0.001863874145783484, "global_step": 40525, "epoch": 340, "lr": 3.9931153742365384e-05} +{"train_loss": 0.002037348225712776, "global_step": 40526, "epoch": 340, "lr": 3.9928983629939125e-05} +{"train_loss": 0.002110249362885952, "global_step": 40527, "epoch": 340, "lr": 3.992681353728621e-05} +{"train_loss": 0.0013576986966654658, "global_step": 40528, "epoch": 340, "lr": 3.992464346441094e-05} +{"train_loss": 0.001779850572347641, "global_step": 40529, "epoch": 340, "lr": 3.9922473411317534e-05} +{"train_loss": 0.0028287069872021675, "global_step": 40530, "epoch": 340, "lr": 3.9920303378010285e-05} +{"train_loss": 0.0011050880420953035, "global_step": 40531, "epoch": 340, "lr": 3.991813336449346e-05} +{"train_loss": 0.0023205773904919624, "global_step": 40532, "epoch": 340, "lr": 3.991596337077128e-05} +{"train_loss": 0.0009586667292751372, "global_step": 40533, "epoch": 340, "lr": 3.9913793396848046e-05} +{"train_loss": 0.0014411346055567265, "global_step": 40534, "epoch": 340, "lr": 3.991162344272798e-05} +{"train_loss": 0.0027514020912349224, "global_step": 40535, "epoch": 340, "lr": 3.9909453508415385e-05} +{"train_loss": 0.0012701081577688456, "global_step": 40536, "epoch": 340, "lr": 3.99072835939145e-05} +{"train_loss": 0.0013650193577632308, "global_step": 40537, "epoch": 340, "lr": 3.990511369922957e-05} +{"train_loss": 0.0009148063836619258, "global_step": 40538, "epoch": 340, "lr": 3.990294382436488e-05} +{"train_loss": 0.0012248323764652014, "global_step": 40539, "epoch": 340, "lr": 3.9900773969324666e-05} +{"train_loss": 0.0012002734001725912, "global_step": 40540, "epoch": 340, "lr": 3.989860413411323e-05} +{"train_loss": 0.0019140427466481924, "global_step": 40541, "epoch": 340, "lr": 3.989643431873478e-05} +{"train_loss": 0.0018884005257859826, "global_step": 40542, "epoch": 340, "lr": 3.989426452319363e-05} +{"train_loss": 0.001613899483345449, "global_step": 40543, "epoch": 340, "lr": 3.9892094747493986e-05} +{"train_loss": 0.0011524446308612823, "global_step": 40544, "epoch": 340, "lr": 3.9889924991640145e-05} +{"train_loss": 0.0032850210554897785, "global_step": 40545, "epoch": 340, "lr": 3.988775525563635e-05} +{"train_loss": 0.0017670365050435066, "global_step": 40546, "epoch": 340, "lr": 3.9885585539486874e-05} +{"train_loss": 0.001925813383422792, "global_step": 40547, "epoch": 340, "lr": 3.988341584319596e-05} +{"train_loss": 0.0016896837623789907, "global_step": 40548, "epoch": 340, "lr": 3.9881246166767905e-05} +{"train_loss": 0.0017925474094226956, "global_step": 40549, "epoch": 340, "lr": 3.987907651020691e-05} +{"train_loss": 0.0013457377208396792, "global_step": 40550, "epoch": 340, "lr": 3.987690687351729e-05} +{"train_loss": 0.0017809238051995635, "global_step": 40551, "epoch": 340, "lr": 3.987473725670326e-05} +{"train_loss": 0.0016186331631615758, "global_step": 40552, "epoch": 340, "lr": 3.987256765976912e-05} +{"train_loss": 0.0029240900184959173, "global_step": 40553, "epoch": 340, "lr": 3.9870398082719094e-05} +{"train_loss": 0.0017451498424634337, "global_step": 40554, "epoch": 340, "lr": 3.9868228525557485e-05} +{"train_loss": 0.002936104778200388, "global_step": 40555, "epoch": 340, "lr": 3.9866058988288525e-05} +{"train_loss": 0.0008719058241695166, "global_step": 40556, "epoch": 340, "lr": 3.986388947091645e-05} +{"train_loss": 0.0015617527533322573, "global_step": 40557, "epoch": 340, "lr": 3.9861719973445564e-05} +{"train_loss": 0.002073188778012991, "global_step": 40558, "epoch": 340, "lr": 3.9859550495880094e-05} +{"train_loss": 0.0014036979991942644, "global_step": 40559, "epoch": 340, "lr": 3.985738103822433e-05} +{"train_loss": 0.0008763723308220506, "global_step": 40560, "epoch": 340, "lr": 3.985521160048249e-05} +{"train_loss": 0.0020231015514582396, "global_step": 40561, "epoch": 340, "lr": 3.985304218265888e-05} +{"train_loss": 0.001557730371132493, "global_step": 40562, "epoch": 340, "lr": 3.9850872784757735e-05} +{"train_loss": 0.0012706373818218708, "global_step": 40563, "epoch": 340, "lr": 3.9848703406783316e-05} +{"train_loss": 0.002368845045566559, "global_step": 40564, "epoch": 340, "lr": 3.984653404873988e-05} +{"train_loss": 0.0017514751525595784, "global_step": 40565, "epoch": 340, "lr": 3.984436471063168e-05} +{"train_loss": 0.002080765552818775, "global_step": 40566, "epoch": 340, "lr": 3.9842195392463e-05} +{"train_loss": 0.0018312913598492742, "global_step": 40567, "epoch": 340, "lr": 3.984002609423809e-05} +{"train_loss": 0.001784574007615447, "global_step": 40568, "epoch": 340, "lr": 3.983785681596118e-05} +{"train_loss": 0.0015393480425700545, "global_step": 40569, "epoch": 340, "lr": 3.983568755763658e-05} +{"train_loss": 0.0009983940981328487, "global_step": 40570, "epoch": 340, "lr": 3.983351831926849e-05} +{"train_loss": 0.0013017827877774835, "global_step": 40571, "epoch": 340, "lr": 3.9831349100861234e-05} +{"train_loss": 0.0025862776674330235, "global_step": 40572, "epoch": 340, "lr": 3.9829179902419006e-05} +{"train_loss": 0.0027715901378542185, "global_step": 40573, "epoch": 340, "lr": 3.982701072394612e-05} +{"train_loss": 0.001006640144623816, "global_step": 40574, "epoch": 340, "lr": 3.9824841565446816e-05} +{"train_loss": 0.0029018432833254337, "global_step": 40575, "epoch": 340, "lr": 3.982267242692533e-05} +{"train_loss": 0.0019184770062565804, "global_step": 40576, "epoch": 340, "lr": 3.982050330838595e-05} +{"train_loss": 0.0020094928331673145, "global_step": 40577, "epoch": 340, "lr": 3.981833420983291e-05} +{"train_loss": 0.0019031438503038733, "global_step": 40578, "epoch": 340, "lr": 3.981616513127049e-05, "val_loss": 0.009910078719258308, "train_action_mse_error": 2.3530223188572563e-05} +{"train_loss": 0.001111882971599698, "global_step": 40579, "epoch": 341, "lr": 3.981399607270295e-05} +{"train_loss": 0.0016421308973804116, "global_step": 40580, "epoch": 341, "lr": 3.981182703413453e-05} +{"train_loss": 0.0018433082150295377, "global_step": 40581, "epoch": 341, "lr": 3.980965801556952e-05} +{"train_loss": 0.0027951369993388653, "global_step": 40582, "epoch": 341, "lr": 3.9807489017012126e-05} +{"train_loss": 0.0021988172084093094, "global_step": 40583, "epoch": 341, "lr": 3.9805320038466664e-05} +{"train_loss": 0.0017640567384660244, "global_step": 40584, "epoch": 341, "lr": 3.980315107993734e-05} +{"train_loss": 0.0016555587062612176, "global_step": 40585, "epoch": 341, "lr": 3.980098214142847e-05} +{"train_loss": 0.0021194228902459145, "global_step": 40586, "epoch": 341, "lr": 3.979881322294428e-05} +{"train_loss": 0.0015022681327536702, "global_step": 40587, "epoch": 341, "lr": 3.979664432448901e-05} +{"train_loss": 0.0024394497741013765, "global_step": 40588, "epoch": 341, "lr": 3.979447544606696e-05} +{"train_loss": 0.002898923587054014, "global_step": 40589, "epoch": 341, "lr": 3.979230658768234e-05} +{"train_loss": 0.0010271769715473056, "global_step": 40590, "epoch": 341, "lr": 3.9790137749339465e-05} +{"train_loss": 0.0015796995721757412, "global_step": 40591, "epoch": 341, "lr": 3.9787968931042534e-05} +{"train_loss": 0.0013119499199092388, "global_step": 40592, "epoch": 341, "lr": 3.978580013279586e-05} +{"train_loss": 0.001050085760653019, "global_step": 40593, "epoch": 341, "lr": 3.978363135460367e-05} +{"train_loss": 0.002699078293517232, "global_step": 40594, "epoch": 341, "lr": 3.978146259647022e-05} +{"train_loss": 0.0022549955174326897, "global_step": 40595, "epoch": 341, "lr": 3.977929385839978e-05} +{"train_loss": 0.0015370718901976943, "global_step": 40596, "epoch": 341, "lr": 3.977712514039661e-05} +{"train_loss": 0.0015325299464166164, "global_step": 40597, "epoch": 341, "lr": 3.977495644246496e-05} +{"train_loss": 0.0016654563369229436, "global_step": 40598, "epoch": 341, "lr": 3.977278776460909e-05} +{"train_loss": 0.0012311222963035107, "global_step": 40599, "epoch": 341, "lr": 3.977061910683325e-05} +{"train_loss": 0.0015892419032752514, "global_step": 40600, "epoch": 341, "lr": 3.976845046914173e-05} +{"train_loss": 0.0013360099401324987, "global_step": 40601, "epoch": 341, "lr": 3.9766281851538736e-05} +{"train_loss": 0.0018465160392224789, "global_step": 40602, "epoch": 341, "lr": 3.976411325402857e-05} +{"train_loss": 0.001705322996713221, "global_step": 40603, "epoch": 341, "lr": 3.9761944676615465e-05} +{"train_loss": 0.0023827864788472652, "global_step": 40604, "epoch": 341, "lr": 3.97597761193037e-05} +{"train_loss": 0.0018170069670304656, "global_step": 40605, "epoch": 341, "lr": 3.975760758209753e-05} +{"train_loss": 0.0027413121424615383, "global_step": 40606, "epoch": 341, "lr": 3.9755439065001175e-05} +{"train_loss": 0.0017161696450784802, "global_step": 40607, "epoch": 341, "lr": 3.975327056801894e-05} +{"train_loss": 0.001698246574960649, "global_step": 40608, "epoch": 341, "lr": 3.975110209115505e-05} +{"train_loss": 0.0023219187278300524, "global_step": 40609, "epoch": 341, "lr": 3.974893363441379e-05} +{"train_loss": 0.0018582937773317099, "global_step": 40610, "epoch": 341, "lr": 3.974676519779939e-05} +{"train_loss": 0.0011427588760852814, "global_step": 40611, "epoch": 341, "lr": 3.9744596781316135e-05} +{"train_loss": 0.0014282652409747243, "global_step": 40612, "epoch": 341, "lr": 3.9742428384968266e-05} +{"train_loss": 0.0013018192257732153, "global_step": 40613, "epoch": 341, "lr": 3.974026000876002e-05} +{"train_loss": 0.001380715984851122, "global_step": 40614, "epoch": 341, "lr": 3.9738091652695705e-05} +{"train_loss": 0.002146091777831316, "global_step": 40615, "epoch": 341, "lr": 3.973592331677954e-05} +{"train_loss": 0.003401800524443388, "global_step": 40616, "epoch": 341, "lr": 3.97337550010158e-05} +{"train_loss": 0.0015698970528319478, "global_step": 40617, "epoch": 341, "lr": 3.973158670540874e-05} +{"train_loss": 0.002512715058401227, "global_step": 40618, "epoch": 341, "lr": 3.972941842996259e-05} +{"train_loss": 0.0019940081983804703, "global_step": 40619, "epoch": 341, "lr": 3.972725017468166e-05} +{"train_loss": 0.001355634885840118, "global_step": 40620, "epoch": 341, "lr": 3.972508193957014e-05} +{"train_loss": 0.0015335126081481576, "global_step": 40621, "epoch": 341, "lr": 3.972291372463236e-05} +{"train_loss": 0.0015218169428408146, "global_step": 40622, "epoch": 341, "lr": 3.972074552987251e-05} +{"train_loss": 0.0022626046556979418, "global_step": 40623, "epoch": 341, "lr": 3.97185773552949e-05} +{"train_loss": 0.0020009882282465696, "global_step": 40624, "epoch": 341, "lr": 3.971640920090377e-05} +{"train_loss": 0.0026889359578490257, "global_step": 40625, "epoch": 341, "lr": 3.971424106670334e-05} +{"train_loss": 0.001651356345973909, "global_step": 40626, "epoch": 341, "lr": 3.971207295269792e-05} +{"train_loss": 0.002019605366513133, "global_step": 40627, "epoch": 341, "lr": 3.970990485889174e-05} +{"train_loss": 0.0018355417996644974, "global_step": 40628, "epoch": 341, "lr": 3.9707736785289075e-05} +{"train_loss": 0.001688463380560279, "global_step": 40629, "epoch": 341, "lr": 3.970556873189415e-05} +{"train_loss": 0.0017403863603249192, "global_step": 40630, "epoch": 341, "lr": 3.9703400698711254e-05} +{"train_loss": 0.0014341505011543632, "global_step": 40631, "epoch": 341, "lr": 3.970123268574464e-05} +{"train_loss": 0.0021247852127999067, "global_step": 40632, "epoch": 341, "lr": 3.969906469299853e-05} +{"train_loss": 0.0014491749461740255, "global_step": 40633, "epoch": 341, "lr": 3.969689672047723e-05} +{"train_loss": 0.0016421290347352624, "global_step": 40634, "epoch": 341, "lr": 3.9694728768184955e-05} +{"train_loss": 0.0021976386196911335, "global_step": 40635, "epoch": 341, "lr": 3.969256083612599e-05} +{"train_loss": 0.0015526552451774478, "global_step": 40636, "epoch": 341, "lr": 3.9690392924304585e-05} +{"train_loss": 0.0016351972008123994, "global_step": 40637, "epoch": 341, "lr": 3.9688225032724975e-05} +{"train_loss": 0.0014359973138198256, "global_step": 40638, "epoch": 341, "lr": 3.968605716139146e-05} +{"train_loss": 0.001900236587971449, "global_step": 40639, "epoch": 341, "lr": 3.968388931030823e-05} +{"train_loss": 0.0010890583507716656, "global_step": 40640, "epoch": 341, "lr": 3.9681721479479616e-05} +{"train_loss": 0.0014035840285941958, "global_step": 40641, "epoch": 341, "lr": 3.9679553668909816e-05} +{"train_loss": 0.0015974853886291385, "global_step": 40642, "epoch": 341, "lr": 3.967738587860313e-05} +{"train_loss": 0.0014178684214130044, "global_step": 40643, "epoch": 341, "lr": 3.9675218108563784e-05} +{"train_loss": 0.0024775266647338867, "global_step": 40644, "epoch": 341, "lr": 3.967305035879604e-05} +{"train_loss": 0.0016137628117576241, "global_step": 40645, "epoch": 341, "lr": 3.967088262930417e-05} +{"train_loss": 0.001897932030260563, "global_step": 40646, "epoch": 341, "lr": 3.966871492009241e-05} +{"train_loss": 0.0007560559315606952, "global_step": 40647, "epoch": 341, "lr": 3.966654723116502e-05} +{"train_loss": 0.0012815273366868496, "global_step": 40648, "epoch": 341, "lr": 3.966437956252626e-05} +{"train_loss": 0.0017149036284536123, "global_step": 40649, "epoch": 341, "lr": 3.9662211914180405e-05} +{"train_loss": 0.002641365397721529, "global_step": 40650, "epoch": 341, "lr": 3.9660044286131684e-05} +{"train_loss": 0.0016494208248332143, "global_step": 40651, "epoch": 341, "lr": 3.965787667838435e-05} +{"train_loss": 0.0022988885175436735, "global_step": 40652, "epoch": 341, "lr": 3.965570909094269e-05} +{"train_loss": 0.0018077748827636242, "global_step": 40653, "epoch": 341, "lr": 3.965354152381091e-05} +{"train_loss": 0.0022643525153398514, "global_step": 40654, "epoch": 341, "lr": 3.9651373976993325e-05} +{"train_loss": 0.0012492183595895767, "global_step": 40655, "epoch": 341, "lr": 3.9649206450494164e-05} +{"train_loss": 0.0014868669677525759, "global_step": 40656, "epoch": 341, "lr": 3.9647038944317655e-05} +{"train_loss": 0.0014704247005283833, "global_step": 40657, "epoch": 341, "lr": 3.96448714584681e-05} +{"train_loss": 0.0019168913131579757, "global_step": 40658, "epoch": 341, "lr": 3.9642703992949715e-05} +{"train_loss": 0.001263959682546556, "global_step": 40659, "epoch": 341, "lr": 3.9640536547766794e-05} +{"train_loss": 0.0019309315830469131, "global_step": 40660, "epoch": 341, "lr": 3.9638369122923554e-05} +{"train_loss": 0.00280201924033463, "global_step": 40661, "epoch": 341, "lr": 3.9636201718424284e-05} +{"train_loss": 0.0023557960521429777, "global_step": 40662, "epoch": 341, "lr": 3.963403433427322e-05} +{"train_loss": 0.002672910923138261, "global_step": 40663, "epoch": 341, "lr": 3.9631866970474605e-05} +{"train_loss": 0.0017100191907957196, "global_step": 40664, "epoch": 341, "lr": 3.962969962703274e-05} +{"train_loss": 0.0016357444692403078, "global_step": 40665, "epoch": 341, "lr": 3.9627532303951824e-05} +{"train_loss": 0.0010304541792720556, "global_step": 40666, "epoch": 341, "lr": 3.962536500123617e-05} +{"train_loss": 0.0015625511296093464, "global_step": 40667, "epoch": 341, "lr": 3.962319771889e-05} +{"train_loss": 0.0014748448738828301, "global_step": 40668, "epoch": 341, "lr": 3.9621030456917545e-05} +{"train_loss": 0.0009550880640745163, "global_step": 40669, "epoch": 341, "lr": 3.9618863215323114e-05} +{"train_loss": 0.003003175836056471, "global_step": 40670, "epoch": 341, "lr": 3.961669599411092e-05} +{"train_loss": 0.002040695399045944, "global_step": 40671, "epoch": 341, "lr": 3.961452879328525e-05} +{"train_loss": 0.0016967697301879525, "global_step": 40672, "epoch": 341, "lr": 3.961236161285032e-05} +{"train_loss": 0.0011165118776261806, "global_step": 40673, "epoch": 341, "lr": 3.9610194452810436e-05} +{"train_loss": 0.001993433339521289, "global_step": 40674, "epoch": 341, "lr": 3.960802731316982e-05} +{"train_loss": 0.002400971483439207, "global_step": 40675, "epoch": 341, "lr": 3.960586019393271e-05} +{"train_loss": 0.0016292294021695852, "global_step": 40676, "epoch": 341, "lr": 3.960369309510339e-05} +{"train_loss": 0.0009837596444413066, "global_step": 40677, "epoch": 341, "lr": 3.960152601668612e-05} +{"train_loss": 0.002107704523950815, "global_step": 40678, "epoch": 341, "lr": 3.9599358958685135e-05} +{"train_loss": 0.001735775382257998, "global_step": 40679, "epoch": 341, "lr": 3.95971919211047e-05} +{"train_loss": 0.0019255432998761535, "global_step": 40680, "epoch": 341, "lr": 3.9595024903949064e-05} +{"train_loss": 0.0022228537127375603, "global_step": 40681, "epoch": 341, "lr": 3.95928579072225e-05} +{"train_loss": 0.002241601934656501, "global_step": 40682, "epoch": 341, "lr": 3.959069093092922e-05} +{"train_loss": 0.0014901033136993647, "global_step": 40683, "epoch": 341, "lr": 3.9588523975073536e-05} +{"train_loss": 0.0019068510737270117, "global_step": 40684, "epoch": 341, "lr": 3.958635703965964e-05} +{"train_loss": 0.0027252165600657463, "global_step": 40685, "epoch": 341, "lr": 3.9584190124691855e-05} +{"train_loss": 0.0020521976985037327, "global_step": 40686, "epoch": 341, "lr": 3.958202323017439e-05} +{"train_loss": 0.0024036034010350704, "global_step": 40687, "epoch": 341, "lr": 3.9579856356111486e-05} +{"train_loss": 0.0010330715449526906, "global_step": 40688, "epoch": 341, "lr": 3.9577689502507455e-05} +{"train_loss": 0.004070736002177, "global_step": 40689, "epoch": 341, "lr": 3.957552266936648e-05} +{"train_loss": 0.0018334940541535616, "global_step": 40690, "epoch": 341, "lr": 3.9573355856692884e-05} +{"train_loss": 0.0013346007326617837, "global_step": 40691, "epoch": 341, "lr": 3.9571189064490874e-05} +{"train_loss": 0.0021334998309612274, "global_step": 40692, "epoch": 341, "lr": 3.956902229276473e-05} +{"train_loss": 0.002055218443274498, "global_step": 40693, "epoch": 341, "lr": 3.9566855541518686e-05} +{"train_loss": 0.0013571962481364608, "global_step": 40694, "epoch": 341, "lr": 3.956468881075701e-05} +{"train_loss": 0.0018815252697095275, "global_step": 40695, "epoch": 341, "lr": 3.956252210048396e-05} +{"train_loss": 0.0017300407635048032, "global_step": 40696, "epoch": 341, "lr": 3.956035541070377e-05} +{"train_loss": 0.00184844496577759, "global_step": 40697, "epoch": 341, "lr": 3.955818874142071e-05, "val_loss": 0.013583170250058174} +{"train_loss": 0.001759628765285015, "global_step": 40698, "epoch": 342, "lr": 3.955602209263902e-05} +{"train_loss": 0.0018236922333016992, "global_step": 40699, "epoch": 342, "lr": 3.9553855464362995e-05} +{"train_loss": 0.003195543307811022, "global_step": 40700, "epoch": 342, "lr": 3.9551688856596854e-05} +{"train_loss": 0.0023234705440700054, "global_step": 40701, "epoch": 342, "lr": 3.954952226934483e-05} +{"train_loss": 0.002173111541196704, "global_step": 40702, "epoch": 342, "lr": 3.9547355702611225e-05} +{"train_loss": 0.0017447273712605238, "global_step": 40703, "epoch": 342, "lr": 3.9545189156400255e-05} +{"train_loss": 0.0016947687836363912, "global_step": 40704, "epoch": 342, "lr": 3.95430226307162e-05} +{"train_loss": 0.0024414118379354477, "global_step": 40705, "epoch": 342, "lr": 3.9540856125563316e-05} +{"train_loss": 0.0014832145534455776, "global_step": 40706, "epoch": 342, "lr": 3.953868964094581e-05} +{"train_loss": 0.002659769495949149, "global_step": 40707, "epoch": 342, "lr": 3.9536523176868e-05} +{"train_loss": 0.0016239278484135866, "global_step": 40708, "epoch": 342, "lr": 3.953435673333408e-05} +{"train_loss": 0.0015823721187189221, "global_step": 40709, "epoch": 342, "lr": 3.953219031034836e-05} +{"train_loss": 0.002032527467235923, "global_step": 40710, "epoch": 342, "lr": 3.9530023907915045e-05} +{"train_loss": 0.0016894607106223702, "global_step": 40711, "epoch": 342, "lr": 3.9527857526038415e-05} +{"train_loss": 0.002679492812603712, "global_step": 40712, "epoch": 342, "lr": 3.952569116472273e-05} +{"train_loss": 0.001659700064919889, "global_step": 40713, "epoch": 342, "lr": 3.952352482397221e-05} +{"train_loss": 0.0020642452873289585, "global_step": 40714, "epoch": 342, "lr": 3.952135850379115e-05} +{"train_loss": 0.0028370560612529516, "global_step": 40715, "epoch": 342, "lr": 3.951919220418376e-05} +{"train_loss": 0.002144282916560769, "global_step": 40716, "epoch": 342, "lr": 3.951702592515435e-05} +{"train_loss": 0.0013371440581977367, "global_step": 40717, "epoch": 342, "lr": 3.9514859666707105e-05} +{"train_loss": 0.002364425454288721, "global_step": 40718, "epoch": 342, "lr": 3.951269342884634e-05} +{"train_loss": 0.0021288972347974777, "global_step": 40719, "epoch": 342, "lr": 3.951052721157628e-05} +{"train_loss": 0.0020446956623345613, "global_step": 40720, "epoch": 342, "lr": 3.950836101490116e-05} +{"train_loss": 0.002706284401938319, "global_step": 40721, "epoch": 342, "lr": 3.9506194838825274e-05} +{"train_loss": 0.0022464573848992586, "global_step": 40722, "epoch": 342, "lr": 3.9504028683352826e-05} +{"train_loss": 0.0018682160880416632, "global_step": 40723, "epoch": 342, "lr": 3.950186254848812e-05} +{"train_loss": 0.001204083557240665, "global_step": 40724, "epoch": 342, "lr": 3.949969643423538e-05} +{"train_loss": 0.0013810734963044524, "global_step": 40725, "epoch": 342, "lr": 3.949753034059886e-05} +{"train_loss": 0.002331335796043277, "global_step": 40726, "epoch": 342, "lr": 3.9495364267582813e-05} +{"train_loss": 0.0032681140583008528, "global_step": 40727, "epoch": 342, "lr": 3.94931982151915e-05} +{"train_loss": 0.0014341152273118496, "global_step": 40728, "epoch": 342, "lr": 3.949103218342917e-05} +{"train_loss": 0.0019310968928039074, "global_step": 40729, "epoch": 342, "lr": 3.9488866172300075e-05} +{"train_loss": 0.003571735695004463, "global_step": 40730, "epoch": 342, "lr": 3.9486700181808476e-05} +{"train_loss": 0.0021094358526170254, "global_step": 40731, "epoch": 342, "lr": 3.9484534211958615e-05} +{"train_loss": 0.0014812194276601076, "global_step": 40732, "epoch": 342, "lr": 3.9482368262754735e-05} +{"train_loss": 0.002984903287142515, "global_step": 40733, "epoch": 342, "lr": 3.948020233420112e-05} +{"train_loss": 0.0024031726643443108, "global_step": 40734, "epoch": 342, "lr": 3.947803642630198e-05} +{"train_loss": 0.001993961399421096, "global_step": 40735, "epoch": 342, "lr": 3.9475870539061624e-05} +{"train_loss": 0.001868924591690302, "global_step": 40736, "epoch": 342, "lr": 3.947370467248426e-05} +{"train_loss": 0.00279411138035357, "global_step": 40737, "epoch": 342, "lr": 3.9471538826574134e-05} +{"train_loss": 0.004670730791985989, "global_step": 40738, "epoch": 342, "lr": 3.946937300133554e-05} +{"train_loss": 0.0010645862203091383, "global_step": 40739, "epoch": 342, "lr": 3.946720719677268e-05} +{"train_loss": 0.002130964072421193, "global_step": 40740, "epoch": 342, "lr": 3.9465041412889864e-05} +{"train_loss": 0.0020798398181796074, "global_step": 40741, "epoch": 342, "lr": 3.946287564969129e-05} +{"train_loss": 0.0013283329317346215, "global_step": 40742, "epoch": 342, "lr": 3.946070990718125e-05} +{"train_loss": 0.003096691332757473, "global_step": 40743, "epoch": 342, "lr": 3.9458544185363974e-05} +{"train_loss": 0.002076065866276622, "global_step": 40744, "epoch": 342, "lr": 3.945637848424372e-05} +{"train_loss": 0.0027527466882020235, "global_step": 40745, "epoch": 342, "lr": 3.945421280382474e-05} +{"train_loss": 0.0014263895573094487, "global_step": 40746, "epoch": 342, "lr": 3.945204714411127e-05} +{"train_loss": 0.0016969699645414948, "global_step": 40747, "epoch": 342, "lr": 3.9449881505107605e-05} +{"train_loss": 0.002582165878266096, "global_step": 40748, "epoch": 342, "lr": 3.944771588681795e-05} +{"train_loss": 0.0022261571139097214, "global_step": 40749, "epoch": 342, "lr": 3.94455502892466e-05} +{"train_loss": 0.001724272035062313, "global_step": 40750, "epoch": 342, "lr": 3.944338471239778e-05} +{"train_loss": 0.0017637121491134167, "global_step": 40751, "epoch": 342, "lr": 3.9441219156275725e-05} +{"train_loss": 0.002078492194414139, "global_step": 40752, "epoch": 342, "lr": 3.943905362088474e-05} +{"train_loss": 0.001482382882386446, "global_step": 40753, "epoch": 342, "lr": 3.9436888106229006e-05} +{"train_loss": 0.0029546176083385944, "global_step": 40754, "epoch": 342, "lr": 3.9434722612312844e-05} +{"train_loss": 0.0019219446694478393, "global_step": 40755, "epoch": 342, "lr": 3.943255713914048e-05} +{"train_loss": 0.0022328642662614584, "global_step": 40756, "epoch": 342, "lr": 3.9430391686716136e-05} +{"train_loss": 0.0014163743471726775, "global_step": 40757, "epoch": 342, "lr": 3.942822625504411e-05} +{"train_loss": 0.001556634670123458, "global_step": 40758, "epoch": 342, "lr": 3.942606084412861e-05} +{"train_loss": 0.0017263954505324364, "global_step": 40759, "epoch": 342, "lr": 3.942389545397392e-05} +{"train_loss": 0.001525930012576282, "global_step": 40760, "epoch": 342, "lr": 3.942173008458429e-05} +{"train_loss": 0.0008516829111613333, "global_step": 40761, "epoch": 342, "lr": 3.941956473596395e-05} +{"train_loss": 0.0026330703403800726, "global_step": 40762, "epoch": 342, "lr": 3.941739940811718e-05} +{"train_loss": 0.0014586461475118995, "global_step": 40763, "epoch": 342, "lr": 3.941523410104819e-05} +{"train_loss": 0.0017198367277160287, "global_step": 40764, "epoch": 342, "lr": 3.9413068814761286e-05} +{"train_loss": 0.0014401789521798491, "global_step": 40765, "epoch": 342, "lr": 3.941090354926066e-05} +{"train_loss": 0.001609418191947043, "global_step": 40766, "epoch": 342, "lr": 3.940873830455063e-05} +{"train_loss": 0.0021334912162274122, "global_step": 40767, "epoch": 342, "lr": 3.940657308063538e-05} +{"train_loss": 0.0022443910129368305, "global_step": 40768, "epoch": 342, "lr": 3.940440787751921e-05} +{"train_loss": 0.0011440800735726953, "global_step": 40769, "epoch": 342, "lr": 3.940224269520636e-05} +{"train_loss": 0.0020074998028576374, "global_step": 40770, "epoch": 342, "lr": 3.9400077533701046e-05} +{"train_loss": 0.0015101534081622958, "global_step": 40771, "epoch": 342, "lr": 3.939791239300758e-05} +{"train_loss": 0.0011983667500317097, "global_step": 40772, "epoch": 342, "lr": 3.9395747273130146e-05} +{"train_loss": 0.002143074292689562, "global_step": 40773, "epoch": 342, "lr": 3.9393582174073056e-05} +{"train_loss": 0.0017902484396472573, "global_step": 40774, "epoch": 342, "lr": 3.939141709584052e-05} +{"train_loss": 0.0032210825011134148, "global_step": 40775, "epoch": 342, "lr": 3.938925203843681e-05} +{"train_loss": 0.0013832564000040293, "global_step": 40776, "epoch": 342, "lr": 3.938708700186617e-05} +{"train_loss": 0.0009992585983127356, "global_step": 40777, "epoch": 342, "lr": 3.938492198613285e-05} +{"train_loss": 0.002379093086346984, "global_step": 40778, "epoch": 342, "lr": 3.938275699124109e-05} +{"train_loss": 0.0021865994203835726, "global_step": 40779, "epoch": 342, "lr": 3.938059201719517e-05} +{"train_loss": 0.0022533207666128874, "global_step": 40780, "epoch": 342, "lr": 3.937842706399931e-05} +{"train_loss": 0.0012971796095371246, "global_step": 40781, "epoch": 342, "lr": 3.9376262131657794e-05} +{"train_loss": 0.002281871857121587, "global_step": 40782, "epoch": 342, "lr": 3.937409722017482e-05} +{"train_loss": 0.0016380639281123877, "global_step": 40783, "epoch": 342, "lr": 3.93719323295547e-05} +{"train_loss": 0.00235100369900465, "global_step": 40784, "epoch": 342, "lr": 3.936976745980163e-05} +{"train_loss": 0.0022645757999271154, "global_step": 40785, "epoch": 342, "lr": 3.9367602610919916e-05} +{"train_loss": 0.003113649319857359, "global_step": 40786, "epoch": 342, "lr": 3.9365437782913775e-05} +{"train_loss": 0.0024957405403256416, "global_step": 40787, "epoch": 342, "lr": 3.936327297578744e-05} +{"train_loss": 0.0011856753844767809, "global_step": 40788, "epoch": 342, "lr": 3.936110818954519e-05} +{"train_loss": 0.001378423417918384, "global_step": 40789, "epoch": 342, "lr": 3.935894342419126e-05} +{"train_loss": 0.00197784136980772, "global_step": 40790, "epoch": 342, "lr": 3.935677867972992e-05} +{"train_loss": 0.0030368322040885687, "global_step": 40791, "epoch": 342, "lr": 3.93546139561654e-05} +{"train_loss": 0.00174107460770756, "global_step": 40792, "epoch": 342, "lr": 3.9352449253501965e-05} +{"train_loss": 0.002962200902402401, "global_step": 40793, "epoch": 342, "lr": 3.9350284571743856e-05} +{"train_loss": 0.0021478005219250917, "global_step": 40794, "epoch": 342, "lr": 3.934811991089532e-05} +{"train_loss": 0.0015558138256892562, "global_step": 40795, "epoch": 342, "lr": 3.9345955270960625e-05} +{"train_loss": 0.0024170568212866783, "global_step": 40796, "epoch": 342, "lr": 3.934379065194399e-05} +{"train_loss": 0.0022640915121883154, "global_step": 40797, "epoch": 342, "lr": 3.93416260538497e-05} +{"train_loss": 0.0018647173419594765, "global_step": 40798, "epoch": 342, "lr": 3.933946147668197e-05} +{"train_loss": 0.0010211567860096693, "global_step": 40799, "epoch": 342, "lr": 3.933729692044509e-05} +{"train_loss": 0.0026915878988802433, "global_step": 40800, "epoch": 342, "lr": 3.933513238514329e-05} +{"train_loss": 0.0015310293529182673, "global_step": 40801, "epoch": 342, "lr": 3.9332967870780804e-05} +{"train_loss": 0.0022193577606230974, "global_step": 40802, "epoch": 342, "lr": 3.93308033773619e-05} +{"train_loss": 0.0025222834665328264, "global_step": 40803, "epoch": 342, "lr": 3.932863890489082e-05} +{"train_loss": 0.002650088630616665, "global_step": 40804, "epoch": 342, "lr": 3.932647445337183e-05} +{"train_loss": 0.0013715510722249746, "global_step": 40805, "epoch": 342, "lr": 3.932431002280916e-05} +{"train_loss": 0.0018156897276639938, "global_step": 40806, "epoch": 342, "lr": 3.932214561320706e-05} +{"train_loss": 0.001580883632414043, "global_step": 40807, "epoch": 342, "lr": 3.9319981224569804e-05} +{"train_loss": 0.0018238351913169026, "global_step": 40808, "epoch": 342, "lr": 3.9317816856901595e-05} +{"train_loss": 0.001182451844215393, "global_step": 40809, "epoch": 342, "lr": 3.931565251020673e-05} +{"train_loss": 0.002096428070217371, "global_step": 40810, "epoch": 342, "lr": 3.931348818448943e-05} +{"train_loss": 0.003554692491889, "global_step": 40811, "epoch": 342, "lr": 3.9311323879753966e-05} +{"train_loss": 0.0014201292069628835, "global_step": 40812, "epoch": 342, "lr": 3.930915959600458e-05} +{"train_loss": 0.0019420944154262543, "global_step": 40813, "epoch": 342, "lr": 3.93069953332455e-05} +{"train_loss": 0.001388576696626842, "global_step": 40814, "epoch": 342, "lr": 3.930483109148101e-05} +{"train_loss": 0.0011810250580310822, "global_step": 40815, "epoch": 342, "lr": 3.9302666870715324e-05} +{"train_loss": 0.002020925216419826, "global_step": 40816, "epoch": 342, "lr": 3.930050267095272e-05, "val_loss": 0.043150290846824646} +{"train_loss": 0.0027711191214621067, "global_step": 40817, "epoch": 343, "lr": 3.929833849219742e-05} +{"train_loss": 0.001822507125325501, "global_step": 40818, "epoch": 343, "lr": 3.929617433445372e-05} +{"train_loss": 0.0012689657742157578, "global_step": 40819, "epoch": 343, "lr": 3.929401019772583e-05} +{"train_loss": 0.001959517365321517, "global_step": 40820, "epoch": 343, "lr": 3.929184608201798e-05} +{"train_loss": 0.002338889054954052, "global_step": 40821, "epoch": 343, "lr": 3.9289681987334474e-05} +{"train_loss": 0.0016306270845234394, "global_step": 40822, "epoch": 343, "lr": 3.928751791367951e-05} +{"train_loss": 0.0018118952866643667, "global_step": 40823, "epoch": 343, "lr": 3.928535386105739e-05} +{"train_loss": 0.0019517811015248299, "global_step": 40824, "epoch": 343, "lr": 3.928318982947231e-05} +{"train_loss": 0.0030260507483035326, "global_step": 40825, "epoch": 343, "lr": 3.9281025818928544e-05} +{"train_loss": 0.001107561867684126, "global_step": 40826, "epoch": 343, "lr": 3.927886182943035e-05} +{"train_loss": 0.002164437435567379, "global_step": 40827, "epoch": 343, "lr": 3.927669786098195e-05} +{"train_loss": 0.0017239758744835854, "global_step": 40828, "epoch": 343, "lr": 3.9274533913587614e-05} +{"train_loss": 0.0021322311367839575, "global_step": 40829, "epoch": 343, "lr": 3.9272369987251576e-05} +{"train_loss": 0.001985997660085559, "global_step": 40830, "epoch": 343, "lr": 3.927020608197811e-05} +{"train_loss": 0.0017402771627530456, "global_step": 40831, "epoch": 343, "lr": 3.926804219777146e-05} +{"train_loss": 0.0014679769519716501, "global_step": 40832, "epoch": 343, "lr": 3.926587833463583e-05} +{"train_loss": 0.0008398306672461331, "global_step": 40833, "epoch": 343, "lr": 3.9263714492575524e-05} +{"train_loss": 0.0019950037822127342, "global_step": 40834, "epoch": 343, "lr": 3.926155067159475e-05} +{"train_loss": 0.0026590372435748577, "global_step": 40835, "epoch": 343, "lr": 3.925938687169779e-05} +{"train_loss": 0.0018220882629975677, "global_step": 40836, "epoch": 343, "lr": 3.925722309288886e-05} +{"train_loss": 0.00200866162776947, "global_step": 40837, "epoch": 343, "lr": 3.925505933517224e-05} +{"train_loss": 0.00304801925085485, "global_step": 40838, "epoch": 343, "lr": 3.925289559855218e-05} +{"train_loss": 0.001404385780915618, "global_step": 40839, "epoch": 343, "lr": 3.925073188303287e-05} +{"train_loss": 0.0024209762923419476, "global_step": 40840, "epoch": 343, "lr": 3.9248568188618626e-05} +{"train_loss": 0.002725837053731084, "global_step": 40841, "epoch": 343, "lr": 3.924640451531366e-05} +{"train_loss": 0.0020752849522978067, "global_step": 40842, "epoch": 343, "lr": 3.924424086312224e-05} +{"train_loss": 0.0022619643714278936, "global_step": 40843, "epoch": 343, "lr": 3.924207723204859e-05} +{"train_loss": 0.0012389938347041607, "global_step": 40844, "epoch": 343, "lr": 3.923991362209697e-05} +{"train_loss": 0.002076801611110568, "global_step": 40845, "epoch": 343, "lr": 3.9237750033271646e-05} +{"train_loss": 0.001375937950797379, "global_step": 40846, "epoch": 343, "lr": 3.923558646557683e-05} +{"train_loss": 0.0017650084337219596, "global_step": 40847, "epoch": 343, "lr": 3.923342291901682e-05} +{"train_loss": 0.001120836939662695, "global_step": 40848, "epoch": 343, "lr": 3.92312593935958e-05} +{"train_loss": 0.0026475086342543364, "global_step": 40849, "epoch": 343, "lr": 3.922909588931808e-05} +{"train_loss": 0.0019156364724040031, "global_step": 40850, "epoch": 343, "lr": 3.922693240618787e-05} +{"train_loss": 0.0016675267834216356, "global_step": 40851, "epoch": 343, "lr": 3.9224768944209415e-05} +{"train_loss": 0.001251828740350902, "global_step": 40852, "epoch": 343, "lr": 3.922260550338699e-05} +{"train_loss": 0.001328261336311698, "global_step": 40853, "epoch": 343, "lr": 3.922044208372482e-05} +{"train_loss": 0.001946871168911457, "global_step": 40854, "epoch": 343, "lr": 3.9218278685227174e-05} +{"train_loss": 0.0011407030979171395, "global_step": 40855, "epoch": 343, "lr": 3.9216115307898285e-05} +{"train_loss": 0.0016491288552060723, "global_step": 40856, "epoch": 343, "lr": 3.921395195174238e-05} +{"train_loss": 0.002243033843114972, "global_step": 40857, "epoch": 343, "lr": 3.921178861676374e-05} +{"train_loss": 0.0021385822910815477, "global_step": 40858, "epoch": 343, "lr": 3.920962530296659e-05} +{"train_loss": 0.0018950914964079857, "global_step": 40859, "epoch": 343, "lr": 3.92074620103552e-05} +{"train_loss": 0.001617587637156248, "global_step": 40860, "epoch": 343, "lr": 3.9205298738933806e-05} +{"train_loss": 0.00168238312471658, "global_step": 40861, "epoch": 343, "lr": 3.920313548870664e-05} +{"train_loss": 0.0011927015148103237, "global_step": 40862, "epoch": 343, "lr": 3.920097225967799e-05} +{"train_loss": 0.0023316300939768553, "global_step": 40863, "epoch": 343, "lr": 3.9198809051852056e-05} +{"train_loss": 0.002427662257105112, "global_step": 40864, "epoch": 343, "lr": 3.9196645865233124e-05} +{"train_loss": 0.0012085199123248458, "global_step": 40865, "epoch": 343, "lr": 3.9194482699825394e-05} +{"train_loss": 0.001916655688546598, "global_step": 40866, "epoch": 343, "lr": 3.9192319555633176e-05} +{"train_loss": 0.0013415247667580843, "global_step": 40867, "epoch": 343, "lr": 3.919015643266066e-05} +{"train_loss": 0.0013288590125739574, "global_step": 40868, "epoch": 343, "lr": 3.918799333091213e-05} +{"train_loss": 0.0012872547376900911, "global_step": 40869, "epoch": 343, "lr": 3.918583025039183e-05} +{"train_loss": 0.001772465300746262, "global_step": 40870, "epoch": 343, "lr": 3.9183667191103974e-05} +{"train_loss": 0.0012267206329852343, "global_step": 40871, "epoch": 343, "lr": 3.918150415305285e-05} +{"train_loss": 0.002027211245149374, "global_step": 40872, "epoch": 343, "lr": 3.917934113624267e-05} +{"train_loss": 0.0021105732303112745, "global_step": 40873, "epoch": 343, "lr": 3.917717814067772e-05} +{"train_loss": 0.0015419084811583161, "global_step": 40874, "epoch": 343, "lr": 3.917501516636221e-05} +{"train_loss": 0.0017482908442616463, "global_step": 40875, "epoch": 343, "lr": 3.9172852213300393e-05} +{"train_loss": 0.002186342142522335, "global_step": 40876, "epoch": 343, "lr": 3.917068928149654e-05} +{"train_loss": 0.001122219837270677, "global_step": 40877, "epoch": 343, "lr": 3.916852637095487e-05} +{"train_loss": 0.0016726133180782199, "global_step": 40878, "epoch": 343, "lr": 3.916636348167965e-05} +{"train_loss": 0.0017778046894818544, "global_step": 40879, "epoch": 343, "lr": 3.916420061367509e-05} +{"train_loss": 0.0010075325844809413, "global_step": 40880, "epoch": 343, "lr": 3.9162037766945504e-05} +{"train_loss": 0.0010657863458618522, "global_step": 40881, "epoch": 343, "lr": 3.915987494149509e-05} +{"train_loss": 0.001064351643435657, "global_step": 40882, "epoch": 343, "lr": 3.915771213732809e-05} +{"train_loss": 0.0012141978368163109, "global_step": 40883, "epoch": 343, "lr": 3.915554935444878e-05} +{"train_loss": 0.001817092765122652, "global_step": 40884, "epoch": 343, "lr": 3.915338659286137e-05} +{"train_loss": 0.0019227010197937489, "global_step": 40885, "epoch": 343, "lr": 3.9151223852570146e-05} +{"train_loss": 0.0026881457306444645, "global_step": 40886, "epoch": 343, "lr": 3.914906113357931e-05} +{"train_loss": 0.0014394179452210665, "global_step": 40887, "epoch": 343, "lr": 3.914689843589317e-05} +{"train_loss": 0.0014226579805836082, "global_step": 40888, "epoch": 343, "lr": 3.914473575951592e-05} +{"train_loss": 0.002193148247897625, "global_step": 40889, "epoch": 343, "lr": 3.91425731044518e-05} +{"train_loss": 0.0020176952239125967, "global_step": 40890, "epoch": 343, "lr": 3.914041047070511e-05} +{"train_loss": 0.0015730797313153744, "global_step": 40891, "epoch": 343, "lr": 3.913824785828003e-05} +{"train_loss": 0.0016618737718090415, "global_step": 40892, "epoch": 343, "lr": 3.913608526718086e-05} +{"train_loss": 0.0010956980986520648, "global_step": 40893, "epoch": 343, "lr": 3.9133922697411836e-05} +{"train_loss": 0.001381553360261023, "global_step": 40894, "epoch": 343, "lr": 3.913176014897717e-05} +{"train_loss": 0.002131666289642453, "global_step": 40895, "epoch": 343, "lr": 3.912959762188115e-05} +{"train_loss": 0.001863447716459632, "global_step": 40896, "epoch": 343, "lr": 3.912743511612799e-05} +{"train_loss": 0.0020968709141016006, "global_step": 40897, "epoch": 343, "lr": 3.912527263172196e-05} +{"train_loss": 0.002589697949588299, "global_step": 40898, "epoch": 343, "lr": 3.9123110168667284e-05} +{"train_loss": 0.001163658918812871, "global_step": 40899, "epoch": 343, "lr": 3.9120947726968245e-05} +{"train_loss": 0.002030272502452135, "global_step": 40900, "epoch": 343, "lr": 3.911878530662905e-05} +{"train_loss": 0.002099008997902274, "global_step": 40901, "epoch": 343, "lr": 3.911662290765394e-05} +{"train_loss": 0.0014552236534655094, "global_step": 40902, "epoch": 343, "lr": 3.91144605300472e-05} +{"train_loss": 0.00129710475448519, "global_step": 40903, "epoch": 343, "lr": 3.911229817381304e-05} +{"train_loss": 0.0018877112306654453, "global_step": 40904, "epoch": 343, "lr": 3.911013583895573e-05} +{"train_loss": 0.0018262475496158004, "global_step": 40905, "epoch": 343, "lr": 3.91079735254795e-05} +{"train_loss": 0.002282565925270319, "global_step": 40906, "epoch": 343, "lr": 3.91058112333886e-05} +{"train_loss": 0.0020531348418444395, "global_step": 40907, "epoch": 343, "lr": 3.910364896268728e-05} +{"train_loss": 0.001376111526042223, "global_step": 40908, "epoch": 343, "lr": 3.910148671337977e-05} +{"train_loss": 0.0021993592381477356, "global_step": 40909, "epoch": 343, "lr": 3.909932448547033e-05} +{"train_loss": 0.0012570848921313882, "global_step": 40910, "epoch": 343, "lr": 3.9097162278963205e-05} +{"train_loss": 0.001622928073629737, "global_step": 40911, "epoch": 343, "lr": 3.909500009386264e-05} +{"train_loss": 0.0021985897328704596, "global_step": 40912, "epoch": 343, "lr": 3.9092837930172884e-05} +{"train_loss": 0.0014496379299089313, "global_step": 40913, "epoch": 343, "lr": 3.9090675787898155e-05} +{"train_loss": 0.0010477377800270915, "global_step": 40914, "epoch": 343, "lr": 3.9088513667042734e-05} +{"train_loss": 0.002460536314174533, "global_step": 40915, "epoch": 343, "lr": 3.9086351567610844e-05} +{"train_loss": 0.0013453061692416668, "global_step": 40916, "epoch": 343, "lr": 3.9084189489606745e-05} +{"train_loss": 0.0009325618739239872, "global_step": 40917, "epoch": 343, "lr": 3.9082027433034654e-05} +{"train_loss": 0.0018401941051706672, "global_step": 40918, "epoch": 343, "lr": 3.9079865397898866e-05} +{"train_loss": 0.0013455294538289309, "global_step": 40919, "epoch": 343, "lr": 3.907770338420358e-05} +{"train_loss": 0.0021765544079244137, "global_step": 40920, "epoch": 343, "lr": 3.9075541391953045e-05} +{"train_loss": 0.0015958950389176607, "global_step": 40921, "epoch": 343, "lr": 3.907337942115154e-05} +{"train_loss": 0.0008365217945538461, "global_step": 40922, "epoch": 343, "lr": 3.907121747180326e-05} +{"train_loss": 0.001429158728569746, "global_step": 40923, "epoch": 343, "lr": 3.90690555439125e-05} +{"train_loss": 0.0019722580909729004, "global_step": 40924, "epoch": 343, "lr": 3.906689363748348e-05} +{"train_loss": 0.0009643756784498692, "global_step": 40925, "epoch": 343, "lr": 3.906473175252044e-05} +{"train_loss": 0.004087136127054691, "global_step": 40926, "epoch": 343, "lr": 3.906256988902763e-05} +{"train_loss": 0.0013935684692114592, "global_step": 40927, "epoch": 343, "lr": 3.906040804700928e-05} +{"train_loss": 0.0009781959233805537, "global_step": 40928, "epoch": 343, "lr": 3.905824622646968e-05} +{"train_loss": 0.001257150317542255, "global_step": 40929, "epoch": 343, "lr": 3.905608442741302e-05} +{"train_loss": 0.0016534555470570922, "global_step": 40930, "epoch": 343, "lr": 3.905392264984359e-05} +{"train_loss": 0.0018529014196246862, "global_step": 40931, "epoch": 343, "lr": 3.9051760893765607e-05} +{"train_loss": 0.0017798846820369363, "global_step": 40932, "epoch": 343, "lr": 3.904959915918331e-05} +{"train_loss": 0.0028351538348942995, "global_step": 40933, "epoch": 343, "lr": 3.904743744610098e-05} +{"train_loss": 0.0017934482311829925, "global_step": 40934, "epoch": 343, "lr": 3.90452757545228e-05} +{"train_loss": 0.001767136509228936, "global_step": 40935, "epoch": 343, "lr": 3.9043114084453085e-05, "val_loss": 0.010797279886901379} +{"train_loss": 0.0014542784774675965, "global_step": 40936, "epoch": 344, "lr": 3.904095243589602e-05} +{"train_loss": 0.0018435327801853418, "global_step": 40937, "epoch": 344, "lr": 3.9038790808855894e-05} +{"train_loss": 0.0022860714234411716, "global_step": 40938, "epoch": 344, "lr": 3.903662920333693e-05} +{"train_loss": 0.001053342130035162, "global_step": 40939, "epoch": 344, "lr": 3.903446761934336e-05} +{"train_loss": 0.0009564929641783237, "global_step": 40940, "epoch": 344, "lr": 3.903230605687944e-05} +{"train_loss": 0.0018175444565713406, "global_step": 40941, "epoch": 344, "lr": 3.903014451594942e-05} +{"train_loss": 0.002564632100984454, "global_step": 40942, "epoch": 344, "lr": 3.902798299655754e-05} +{"train_loss": 0.0016499952180311084, "global_step": 40943, "epoch": 344, "lr": 3.902582149870806e-05} +{"train_loss": 0.0021041587460786104, "global_step": 40944, "epoch": 344, "lr": 3.902366002240518e-05} +{"train_loss": 0.0015916782431304455, "global_step": 40945, "epoch": 344, "lr": 3.902149856765319e-05} +{"train_loss": 0.0007754134712740779, "global_step": 40946, "epoch": 344, "lr": 3.90193371344563e-05} +{"train_loss": 0.001385571202263236, "global_step": 40947, "epoch": 344, "lr": 3.901717572281878e-05} +{"train_loss": 0.0020575872622430325, "global_step": 40948, "epoch": 344, "lr": 3.901501433274485e-05} +{"train_loss": 0.0018475098768249154, "global_step": 40949, "epoch": 344, "lr": 3.9012852964238776e-05} +{"train_loss": 0.0014385032700374722, "global_step": 40950, "epoch": 344, "lr": 3.901069161730481e-05} +{"train_loss": 0.0019548884592950344, "global_step": 40951, "epoch": 344, "lr": 3.900853029194714e-05} +{"train_loss": 0.0015226370887830853, "global_step": 40952, "epoch": 344, "lr": 3.9006368988170075e-05} +{"train_loss": 0.0017205567564815283, "global_step": 40953, "epoch": 344, "lr": 3.9004207705977805e-05} +{"train_loss": 0.0019118820782750845, "global_step": 40954, "epoch": 344, "lr": 3.9002046445374616e-05} +{"train_loss": 0.001980680273845792, "global_step": 40955, "epoch": 344, "lr": 3.8999885206364715e-05} +{"train_loss": 0.0024080630391836166, "global_step": 40956, "epoch": 344, "lr": 3.8997723988952386e-05} +{"train_loss": 0.0012650404823943973, "global_step": 40957, "epoch": 344, "lr": 3.899556279314185e-05} +{"train_loss": 0.0016444456996396184, "global_step": 40958, "epoch": 344, "lr": 3.899340161893734e-05} +{"train_loss": 0.0025059336330741644, "global_step": 40959, "epoch": 344, "lr": 3.8991240466343106e-05} +{"train_loss": 0.002380205085501075, "global_step": 40960, "epoch": 344, "lr": 3.89890793353634e-05} +{"train_loss": 0.0011045443825423717, "global_step": 40961, "epoch": 344, "lr": 3.8986918226002465e-05} +{"train_loss": 0.0017240047454833984, "global_step": 40962, "epoch": 344, "lr": 3.898475713826455e-05} +{"train_loss": 0.002171867061406374, "global_step": 40963, "epoch": 344, "lr": 3.898259607215386e-05} +{"train_loss": 0.0018708579009398818, "global_step": 40964, "epoch": 344, "lr": 3.8980435027674694e-05} +{"train_loss": 0.0023521126713603735, "global_step": 40965, "epoch": 344, "lr": 3.897827400483124e-05} +{"train_loss": 0.0020918843802064657, "global_step": 40966, "epoch": 344, "lr": 3.897611300362779e-05} +{"train_loss": 0.0015935071278363466, "global_step": 40967, "epoch": 344, "lr": 3.897395202406854e-05} +{"train_loss": 0.0016116329934448004, "global_step": 40968, "epoch": 344, "lr": 3.897179106615779e-05} +{"train_loss": 0.0018976973369717598, "global_step": 40969, "epoch": 344, "lr": 3.8969630129899735e-05} +{"train_loss": 0.0012312558246776462, "global_step": 40970, "epoch": 344, "lr": 3.896746921529862e-05} +{"train_loss": 0.0010235542431473732, "global_step": 40971, "epoch": 344, "lr": 3.896530832235872e-05} +{"train_loss": 0.0018969944212585688, "global_step": 40972, "epoch": 344, "lr": 3.896314745108423e-05} +{"train_loss": 0.001564670237712562, "global_step": 40973, "epoch": 344, "lr": 3.896098660147946e-05} +{"train_loss": 0.0014792403671890497, "global_step": 40974, "epoch": 344, "lr": 3.895882577354859e-05} +{"train_loss": 0.0021239370107650757, "global_step": 40975, "epoch": 344, "lr": 3.895666496729589e-05} +{"train_loss": 0.0015090761007741094, "global_step": 40976, "epoch": 344, "lr": 3.89545041827256e-05} +{"train_loss": 0.0006599353509955108, "global_step": 40977, "epoch": 344, "lr": 3.8952343419841944e-05} +{"train_loss": 0.0019399153534322977, "global_step": 40978, "epoch": 344, "lr": 3.8950182678649204e-05} +{"train_loss": 0.0015451371436938643, "global_step": 40979, "epoch": 344, "lr": 3.894802195915158e-05} +{"train_loss": 0.0016772779636085033, "global_step": 40980, "epoch": 344, "lr": 3.8945861261353353e-05} +{"train_loss": 0.0025676351506263018, "global_step": 40981, "epoch": 344, "lr": 3.8943700585258754e-05} +{"train_loss": 0.0014711384428665042, "global_step": 40982, "epoch": 344, "lr": 3.8941539930872e-05} +{"train_loss": 0.001448642578907311, "global_step": 40983, "epoch": 344, "lr": 3.893937929819735e-05} +{"train_loss": 0.0015283903339877725, "global_step": 40984, "epoch": 344, "lr": 3.893721868723905e-05} +{"train_loss": 0.003208707319572568, "global_step": 40985, "epoch": 344, "lr": 3.893505809800135e-05} +{"train_loss": 0.0009810681222006679, "global_step": 40986, "epoch": 344, "lr": 3.8932897530488454e-05} +{"train_loss": 0.0018359145615249872, "global_step": 40987, "epoch": 344, "lr": 3.893073698470466e-05} +{"train_loss": 0.002245045965537429, "global_step": 40988, "epoch": 344, "lr": 3.892857646065418e-05} +{"train_loss": 0.0012590266996994615, "global_step": 40989, "epoch": 344, "lr": 3.892641595834124e-05} +{"train_loss": 0.001414017635397613, "global_step": 40990, "epoch": 344, "lr": 3.8924255477770106e-05} +{"train_loss": 0.0012040967121720314, "global_step": 40991, "epoch": 344, "lr": 3.892209501894501e-05} +{"train_loss": 0.0024009854532778263, "global_step": 40992, "epoch": 344, "lr": 3.89199345818702e-05} +{"train_loss": 0.0010984729742631316, "global_step": 40993, "epoch": 344, "lr": 3.8917774166549924e-05} +{"train_loss": 0.0026978752575814724, "global_step": 40994, "epoch": 344, "lr": 3.8915613772988396e-05} +{"train_loss": 0.0011879559606313705, "global_step": 40995, "epoch": 344, "lr": 3.8913453401189896e-05} +{"train_loss": 0.002100809942930937, "global_step": 40996, "epoch": 344, "lr": 3.8911293051158624e-05} +{"train_loss": 0.0018285984406247735, "global_step": 40997, "epoch": 344, "lr": 3.8909132722898864e-05} +{"train_loss": 0.002709748689085245, "global_step": 40998, "epoch": 344, "lr": 3.890697241641482e-05} +{"train_loss": 0.0008691592374816537, "global_step": 40999, "epoch": 344, "lr": 3.890481213171077e-05} +{"train_loss": 0.002734305104240775, "global_step": 41000, "epoch": 344, "lr": 3.8902651868790935e-05} +{"train_loss": 0.001387382042594254, "global_step": 41001, "epoch": 344, "lr": 3.890049162765954e-05} +{"train_loss": 0.001927768113091588, "global_step": 41002, "epoch": 344, "lr": 3.8898331408320856e-05} +{"train_loss": 0.0023092771880328655, "global_step": 41003, "epoch": 344, "lr": 3.8896171210779097e-05} +{"train_loss": 0.001648935372941196, "global_step": 41004, "epoch": 344, "lr": 3.889401103503854e-05} +{"train_loss": 0.002540829125791788, "global_step": 41005, "epoch": 344, "lr": 3.8891850881103387e-05} +{"train_loss": 0.0015856230165809393, "global_step": 41006, "epoch": 344, "lr": 3.8889690748977914e-05} +{"train_loss": 0.0016780479345470667, "global_step": 41007, "epoch": 344, "lr": 3.8887530638666344e-05} +{"train_loss": 0.0014572552172467113, "global_step": 41008, "epoch": 344, "lr": 3.8885370550172914e-05} +{"train_loss": 0.0013277152320370078, "global_step": 41009, "epoch": 344, "lr": 3.888321048350187e-05} +{"train_loss": 0.001219205092638731, "global_step": 41010, "epoch": 344, "lr": 3.888105043865746e-05} +{"train_loss": 0.001578881754539907, "global_step": 41011, "epoch": 344, "lr": 3.8878890415643916e-05} +{"train_loss": 0.0022815384436398745, "global_step": 41012, "epoch": 344, "lr": 3.887673041446549e-05} +{"train_loss": 0.0012618402251973748, "global_step": 41013, "epoch": 344, "lr": 3.88745704351264e-05} +{"train_loss": 0.001557322801090777, "global_step": 41014, "epoch": 344, "lr": 3.887241047763092e-05} +{"train_loss": 0.0011660768650472164, "global_step": 41015, "epoch": 344, "lr": 3.8870250541983257e-05} +{"train_loss": 0.0011557203251868486, "global_step": 41016, "epoch": 344, "lr": 3.886809062818769e-05} +{"train_loss": 0.0009540394530631602, "global_step": 41017, "epoch": 344, "lr": 3.886593073624841e-05} +{"train_loss": 0.0018596748122945428, "global_step": 41018, "epoch": 344, "lr": 3.886377086616971e-05} +{"train_loss": 0.0022971108555793762, "global_step": 41019, "epoch": 344, "lr": 3.88616110179558e-05} +{"train_loss": 0.0009682427626103163, "global_step": 41020, "epoch": 344, "lr": 3.885945119161091e-05} +{"train_loss": 0.0013089175336062908, "global_step": 41021, "epoch": 344, "lr": 3.885729138713932e-05} +{"train_loss": 0.0015214703744277358, "global_step": 41022, "epoch": 344, "lr": 3.885513160454523e-05} +{"train_loss": 0.0016529835993424058, "global_step": 41023, "epoch": 344, "lr": 3.885297184383292e-05} +{"train_loss": 0.0017313614953309298, "global_step": 41024, "epoch": 344, "lr": 3.8850812105006576e-05} +{"train_loss": 0.0016820078017190099, "global_step": 41025, "epoch": 344, "lr": 3.88486523880705e-05} +{"train_loss": 0.0026350312400609255, "global_step": 41026, "epoch": 344, "lr": 3.88464926930289e-05} +{"train_loss": 0.000840052729472518, "global_step": 41027, "epoch": 344, "lr": 3.8844333019885996e-05} +{"train_loss": 0.0008914266945794225, "global_step": 41028, "epoch": 344, "lr": 3.8842173368646084e-05} +{"train_loss": 0.002322893124073744, "global_step": 41029, "epoch": 344, "lr": 3.8840013739313345e-05} +{"train_loss": 0.001025882549583912, "global_step": 41030, "epoch": 344, "lr": 3.883785413189207e-05} +{"train_loss": 0.0011422114912420511, "global_step": 41031, "epoch": 344, "lr": 3.883569454638648e-05} +{"train_loss": 0.0015337758231908083, "global_step": 41032, "epoch": 344, "lr": 3.883353498280078e-05} +{"train_loss": 0.0019258238608017564, "global_step": 41033, "epoch": 344, "lr": 3.883137544113927e-05} +{"train_loss": 0.0014875412452965975, "global_step": 41034, "epoch": 344, "lr": 3.8829215921406145e-05} +{"train_loss": 0.0030267538968473673, "global_step": 41035, "epoch": 344, "lr": 3.8827056423605676e-05} +{"train_loss": 0.002332843840122223, "global_step": 41036, "epoch": 344, "lr": 3.8824896947742065e-05} +{"train_loss": 0.0013718917034566402, "global_step": 41037, "epoch": 344, "lr": 3.88227374938196e-05} +{"train_loss": 0.0014131695497781038, "global_step": 41038, "epoch": 344, "lr": 3.8820578061842484e-05} +{"train_loss": 0.00216383533552289, "global_step": 41039, "epoch": 344, "lr": 3.8818418651814963e-05} +{"train_loss": 0.001073430641554296, "global_step": 41040, "epoch": 344, "lr": 3.881625926374129e-05} +{"train_loss": 0.0016473380383104086, "global_step": 41041, "epoch": 344, "lr": 3.881409989762569e-05} +{"train_loss": 0.0018352395854890347, "global_step": 41042, "epoch": 344, "lr": 3.881194055347241e-05} +{"train_loss": 0.0015387528110295534, "global_step": 41043, "epoch": 344, "lr": 3.880978123128571e-05} +{"train_loss": 0.0017756142187863588, "global_step": 41044, "epoch": 344, "lr": 3.8807621931069785e-05} +{"train_loss": 0.002071334747597575, "global_step": 41045, "epoch": 344, "lr": 3.8805462652828915e-05} +{"train_loss": 0.0021401550620794296, "global_step": 41046, "epoch": 344, "lr": 3.8803303396567304e-05} +{"train_loss": 0.001427123905159533, "global_step": 41047, "epoch": 344, "lr": 3.880114416228923e-05} +{"train_loss": 0.0022272069472819567, "global_step": 41048, "epoch": 344, "lr": 3.87989849499989e-05} +{"train_loss": 0.002328414935618639, "global_step": 41049, "epoch": 344, "lr": 3.8796825759700573e-05} +{"train_loss": 0.0025816410779953003, "global_step": 41050, "epoch": 344, "lr": 3.8794666591398495e-05} +{"train_loss": 0.002030250383540988, "global_step": 41051, "epoch": 344, "lr": 3.879250744509686e-05} +{"train_loss": 0.0020797522738575935, "global_step": 41052, "epoch": 344, "lr": 3.879034832079997e-05} +{"train_loss": 0.0014229875523597002, "global_step": 41053, "epoch": 344, "lr": 3.8788189218512e-05} +{"train_loss": 0.0017244838625231774, "global_step": 41054, "epoch": 344, "lr": 3.878603013823726e-05, "val_loss": 0.025388676673173904} +{"train_loss": 0.0013266346650198102, "global_step": 41055, "epoch": 345, "lr": 3.878387107997992e-05} +{"train_loss": 0.001075627631507814, "global_step": 41056, "epoch": 345, "lr": 3.878171204374428e-05} +{"train_loss": 0.0026486990973353386, "global_step": 41057, "epoch": 345, "lr": 3.877955302953453e-05} +{"train_loss": 0.0032131534535437822, "global_step": 41058, "epoch": 345, "lr": 3.877739403735493e-05} +{"train_loss": 0.0012337591033428907, "global_step": 41059, "epoch": 345, "lr": 3.877523506720972e-05} +{"train_loss": 0.0014958579558879137, "global_step": 41060, "epoch": 345, "lr": 3.877307611910313e-05} +{"train_loss": 0.0013231196207925677, "global_step": 41061, "epoch": 345, "lr": 3.8770917193039424e-05} +{"train_loss": 0.0014584698947146535, "global_step": 41062, "epoch": 345, "lr": 3.876875828902282e-05} +{"train_loss": 0.001548068132251501, "global_step": 41063, "epoch": 345, "lr": 3.8766599407057546e-05} +{"train_loss": 0.0015999196330085397, "global_step": 41064, "epoch": 345, "lr": 3.8764440547147865e-05} +{"train_loss": 0.001598156290128827, "global_step": 41065, "epoch": 345, "lr": 3.8762281709297985e-05} +{"train_loss": 0.00251448480412364, "global_step": 41066, "epoch": 345, "lr": 3.8760122893512195e-05} +{"train_loss": 0.00223057740367949, "global_step": 41067, "epoch": 345, "lr": 3.8757964099794676e-05} +{"train_loss": 0.0010331299854442477, "global_step": 41068, "epoch": 345, "lr": 3.875580532814971e-05} +{"train_loss": 0.0019176910864189267, "global_step": 41069, "epoch": 345, "lr": 3.875364657858153e-05} +{"train_loss": 0.0014306805096566677, "global_step": 41070, "epoch": 345, "lr": 3.875148785109433e-05} +{"train_loss": 0.0016698281979188323, "global_step": 41071, "epoch": 345, "lr": 3.874932914569241e-05} +{"train_loss": 0.0016364824259653687, "global_step": 41072, "epoch": 345, "lr": 3.8747170462379957e-05} +{"train_loss": 0.0012742520775645971, "global_step": 41073, "epoch": 345, "lr": 3.874501180116124e-05} +{"train_loss": 0.0031992155127227306, "global_step": 41074, "epoch": 345, "lr": 3.8742853162040496e-05} +{"train_loss": 0.000797546817921102, "global_step": 41075, "epoch": 345, "lr": 3.874069454502195e-05} +{"train_loss": 0.0021506818011403084, "global_step": 41076, "epoch": 345, "lr": 3.873853595010987e-05} +{"train_loss": 0.0028011908289045095, "global_step": 41077, "epoch": 345, "lr": 3.8736377377308435e-05} +{"train_loss": 0.002067358000203967, "global_step": 41078, "epoch": 345, "lr": 3.873421882662195e-05} +{"train_loss": 0.001418360392563045, "global_step": 41079, "epoch": 345, "lr": 3.87320602980546e-05} +{"train_loss": 0.0017946475418284535, "global_step": 41080, "epoch": 345, "lr": 3.8729901791610666e-05} +{"train_loss": 0.0018197683384642005, "global_step": 41081, "epoch": 345, "lr": 3.872774330729437e-05} +{"train_loss": 0.001994275487959385, "global_step": 41082, "epoch": 345, "lr": 3.872558484510992e-05} +{"train_loss": 0.001365231117233634, "global_step": 41083, "epoch": 345, "lr": 3.8723426405061605e-05} +{"train_loss": 0.002937232842668891, "global_step": 41084, "epoch": 345, "lr": 3.872126798715361e-05} +{"train_loss": 0.002224675379693508, "global_step": 41085, "epoch": 345, "lr": 3.871910959139022e-05} +{"train_loss": 0.0014198941644281149, "global_step": 41086, "epoch": 345, "lr": 3.871695121777564e-05} +{"train_loss": 0.0012276245979592204, "global_step": 41087, "epoch": 345, "lr": 3.8714792866314143e-05} +{"train_loss": 0.0019987577106803656, "global_step": 41088, "epoch": 345, "lr": 3.871263453700993e-05} +{"train_loss": 0.002123842481523752, "global_step": 41089, "epoch": 345, "lr": 3.8710476229867255e-05} +{"train_loss": 0.0010740960715338588, "global_step": 41090, "epoch": 345, "lr": 3.870831794489035e-05} +{"train_loss": 0.0015367158921435475, "global_step": 41091, "epoch": 345, "lr": 3.870615968208346e-05} +{"train_loss": 0.001801517209969461, "global_step": 41092, "epoch": 345, "lr": 3.8704001441450814e-05} +{"train_loss": 0.001911316066980362, "global_step": 41093, "epoch": 345, "lr": 3.870184322299667e-05} +{"train_loss": 0.002592637436464429, "global_step": 41094, "epoch": 345, "lr": 3.869968502672523e-05} +{"train_loss": 0.0013988696737214923, "global_step": 41095, "epoch": 345, "lr": 3.869752685264077e-05} +{"train_loss": 0.002235551131889224, "global_step": 41096, "epoch": 345, "lr": 3.8695368700747485e-05} +{"train_loss": 0.002229789737612009, "global_step": 41097, "epoch": 345, "lr": 3.869321057104966e-05} +{"train_loss": 0.0023451587185263634, "global_step": 41098, "epoch": 345, "lr": 3.869105246355149e-05} +{"train_loss": 0.001659233937971294, "global_step": 41099, "epoch": 345, "lr": 3.868889437825724e-05} +{"train_loss": 0.0008227903745137155, "global_step": 41100, "epoch": 345, "lr": 3.868673631517114e-05} +{"train_loss": 0.0021157795563340187, "global_step": 41101, "epoch": 345, "lr": 3.868457827429741e-05} +{"train_loss": 0.0014351257123053074, "global_step": 41102, "epoch": 345, "lr": 3.8682420255640326e-05} +{"train_loss": 0.0013203417183831334, "global_step": 41103, "epoch": 345, "lr": 3.8680262259204075e-05} +{"train_loss": 0.0015870330389589071, "global_step": 41104, "epoch": 345, "lr": 3.867810428499294e-05} +{"train_loss": 0.0017166694160550833, "global_step": 41105, "epoch": 345, "lr": 3.867594633301112e-05} +{"train_loss": 0.0020765531808137894, "global_step": 41106, "epoch": 345, "lr": 3.867378840326288e-05} +{"train_loss": 0.0016750188078731298, "global_step": 41107, "epoch": 345, "lr": 3.8671630495752446e-05} +{"train_loss": 0.0019742257427424192, "global_step": 41108, "epoch": 345, "lr": 3.8669472610484045e-05} +{"train_loss": 0.0019602978136390448, "global_step": 41109, "epoch": 345, "lr": 3.866731474746194e-05} +{"train_loss": 0.002607484580948949, "global_step": 41110, "epoch": 345, "lr": 3.8665156906690335e-05} +{"train_loss": 0.0012489128857851028, "global_step": 41111, "epoch": 345, "lr": 3.8662999088173504e-05} +{"train_loss": 0.0017329526599496603, "global_step": 41112, "epoch": 345, "lr": 3.866084129191566e-05} +{"train_loss": 0.0021045159082859755, "global_step": 41113, "epoch": 345, "lr": 3.865868351792102e-05} +{"train_loss": 0.0018405660521239042, "global_step": 41114, "epoch": 345, "lr": 3.865652576619387e-05} +{"train_loss": 0.00232066516764462, "global_step": 41115, "epoch": 345, "lr": 3.86543680367384e-05} +{"train_loss": 0.0018434118246659636, "global_step": 41116, "epoch": 345, "lr": 3.865221032955888e-05} +{"train_loss": 0.0009055195259861648, "global_step": 41117, "epoch": 345, "lr": 3.865005264465952e-05} +{"train_loss": 0.002791788661852479, "global_step": 41118, "epoch": 345, "lr": 3.864789498204458e-05} +{"train_loss": 0.0014235167764127254, "global_step": 41119, "epoch": 345, "lr": 3.864573734171829e-05} +{"train_loss": 0.0013464317889884114, "global_step": 41120, "epoch": 345, "lr": 3.8643579723684865e-05} +{"train_loss": 0.0010407284134998918, "global_step": 41121, "epoch": 345, "lr": 3.8641422127948575e-05} +{"train_loss": 0.0016436571022495627, "global_step": 41122, "epoch": 345, "lr": 3.863926455451362e-05} +{"train_loss": 0.0018183980137109756, "global_step": 41123, "epoch": 345, "lr": 3.8637107003384265e-05} +{"train_loss": 0.001354310312308371, "global_step": 41124, "epoch": 345, "lr": 3.863494947456473e-05} +{"train_loss": 0.002766999648883939, "global_step": 41125, "epoch": 345, "lr": 3.863279196805927e-05} +{"train_loss": 0.0019348098430782557, "global_step": 41126, "epoch": 345, "lr": 3.8630634483872107e-05} +{"train_loss": 0.001784272026270628, "global_step": 41127, "epoch": 345, "lr": 3.862847702200746e-05} +{"train_loss": 0.003079432062804699, "global_step": 41128, "epoch": 345, "lr": 3.862631958246962e-05} +{"train_loss": 0.0009103591437451541, "global_step": 41129, "epoch": 345, "lr": 3.8624162165262746e-05} +{"train_loss": 0.0017223095055669546, "global_step": 41130, "epoch": 345, "lr": 3.862200477039114e-05} +{"train_loss": 0.0009914723923429847, "global_step": 41131, "epoch": 345, "lr": 3.861984739785901e-05} +{"train_loss": 0.001591820502653718, "global_step": 41132, "epoch": 345, "lr": 3.861769004767059e-05} +{"train_loss": 0.0012438688427209854, "global_step": 41133, "epoch": 345, "lr": 3.8615532719830124e-05} +{"train_loss": 0.001315838540904224, "global_step": 41134, "epoch": 345, "lr": 3.861337541434182e-05} +{"train_loss": 0.0017353020375594497, "global_step": 41135, "epoch": 345, "lr": 3.861121813120997e-05} +{"train_loss": 0.0020961398258805275, "global_step": 41136, "epoch": 345, "lr": 3.8609060870438744e-05} +{"train_loss": 0.0012654109159484506, "global_step": 41137, "epoch": 345, "lr": 3.8606903632032444e-05} +{"train_loss": 0.0008852417231537402, "global_step": 41138, "epoch": 345, "lr": 3.8604746415995254e-05} +{"train_loss": 0.0016398354200646281, "global_step": 41139, "epoch": 345, "lr": 3.860258922233142e-05} +{"train_loss": 0.001088951132260263, "global_step": 41140, "epoch": 345, "lr": 3.860043205104519e-05} +{"train_loss": 0.0017074807547032833, "global_step": 41141, "epoch": 345, "lr": 3.85982749021408e-05} +{"train_loss": 0.0018582639750093222, "global_step": 41142, "epoch": 345, "lr": 3.859611777562247e-05} +{"train_loss": 0.0010077524930238724, "global_step": 41143, "epoch": 345, "lr": 3.8593960671494436e-05} +{"train_loss": 0.001373390550725162, "global_step": 41144, "epoch": 345, "lr": 3.859180358976097e-05} +{"train_loss": 0.001264061313122511, "global_step": 41145, "epoch": 345, "lr": 3.858964653042627e-05} +{"train_loss": 0.002864799927920103, "global_step": 41146, "epoch": 345, "lr": 3.858748949349457e-05} +{"train_loss": 0.0017041151877492666, "global_step": 41147, "epoch": 345, "lr": 3.858533247897012e-05} +{"train_loss": 0.0014690031530335546, "global_step": 41148, "epoch": 345, "lr": 3.8583175486857135e-05} +{"train_loss": 0.0018940476002171636, "global_step": 41149, "epoch": 345, "lr": 3.8581018517159894e-05} +{"train_loss": 0.0012527479557320476, "global_step": 41150, "epoch": 345, "lr": 3.85788615698826e-05} +{"train_loss": 0.00089595204917714, "global_step": 41151, "epoch": 345, "lr": 3.8576704645029464e-05} +{"train_loss": 0.0013746629701927304, "global_step": 41152, "epoch": 345, "lr": 3.857454774260477e-05} +{"train_loss": 0.0021419411059468985, "global_step": 41153, "epoch": 345, "lr": 3.857239086261272e-05} +{"train_loss": 0.001748579670675099, "global_step": 41154, "epoch": 345, "lr": 3.857023400505757e-05} +{"train_loss": 0.002144110156223178, "global_step": 41155, "epoch": 345, "lr": 3.8568077169943525e-05} +{"train_loss": 0.0019226422300562263, "global_step": 41156, "epoch": 345, "lr": 3.856592035727486e-05} +{"train_loss": 0.0015803497517481446, "global_step": 41157, "epoch": 345, "lr": 3.8563763567055785e-05} +{"train_loss": 0.001285012112930417, "global_step": 41158, "epoch": 345, "lr": 3.856160679929053e-05} +{"train_loss": 0.0018288312712684274, "global_step": 41159, "epoch": 345, "lr": 3.855945005398335e-05} +{"train_loss": 0.0013094769092276692, "global_step": 41160, "epoch": 345, "lr": 3.855729333113845e-05} +{"train_loss": 0.001090315985493362, "global_step": 41161, "epoch": 345, "lr": 3.8555136630760104e-05} +{"train_loss": 0.002229902660474181, "global_step": 41162, "epoch": 345, "lr": 3.855297995285252e-05} +{"train_loss": 0.0016344267642125487, "global_step": 41163, "epoch": 345, "lr": 3.855082329741992e-05} +{"train_loss": 0.0012918582651764154, "global_step": 41164, "epoch": 345, "lr": 3.854866666446657e-05} +{"train_loss": 0.0010637817904353142, "global_step": 41165, "epoch": 345, "lr": 3.854651005399668e-05} +{"train_loss": 0.0021464054007083178, "global_step": 41166, "epoch": 345, "lr": 3.85443534660145e-05} +{"train_loss": 0.0014605496544390917, "global_step": 41167, "epoch": 345, "lr": 3.854219690052425e-05} +{"train_loss": 0.001929988618940115, "global_step": 41168, "epoch": 345, "lr": 3.854004035753019e-05} +{"train_loss": 0.0009185054805129766, "global_step": 41169, "epoch": 345, "lr": 3.853788383703654e-05} +{"train_loss": 0.0017395466566085815, "global_step": 41170, "epoch": 345, "lr": 3.85357273390475e-05} +{"train_loss": 0.0016399191226810217, "global_step": 41171, "epoch": 345, "lr": 3.853357086356735e-05} +{"train_loss": 0.001403440604917705, "global_step": 41172, "epoch": 345, "lr": 3.8531414410600305e-05} +{"train_loss": 0.0017112744536775188, "global_step": 41173, "epoch": 345, "lr": 3.852925798015061e-05, "val_loss": 0.01597169041633606, "train_action_mse_error": 2.3060090825310908e-05} +{"train_loss": 0.0017972951754927635, "global_step": 41174, "epoch": 346, "lr": 3.852710157222249e-05} +{"train_loss": 0.0025258027017116547, "global_step": 41175, "epoch": 346, "lr": 3.8524945186820175e-05} +{"train_loss": 0.0011270333779975772, "global_step": 41176, "epoch": 346, "lr": 3.852278882394792e-05} +{"train_loss": 0.0014706725487485528, "global_step": 41177, "epoch": 346, "lr": 3.8520632483609917e-05} +{"train_loss": 0.0017632798990234733, "global_step": 41178, "epoch": 346, "lr": 3.8518476165810455e-05} +{"train_loss": 0.001102352049201727, "global_step": 41179, "epoch": 346, "lr": 3.8516319870553705e-05} +{"train_loss": 0.0016567824641242623, "global_step": 41180, "epoch": 346, "lr": 3.851416359784397e-05} +{"train_loss": 0.0014753754949197173, "global_step": 41181, "epoch": 346, "lr": 3.8512007347685435e-05} +{"train_loss": 0.0015009477501735091, "global_step": 41182, "epoch": 346, "lr": 3.850985112008233e-05} +{"train_loss": 0.0017135866219177842, "global_step": 41183, "epoch": 346, "lr": 3.8507694915038926e-05} +{"train_loss": 0.0018406668677926064, "global_step": 41184, "epoch": 346, "lr": 3.8505538732559416e-05} +{"train_loss": 0.0017200021538883448, "global_step": 41185, "epoch": 346, "lr": 3.8503382572648075e-05} +{"train_loss": 0.002405814826488495, "global_step": 41186, "epoch": 346, "lr": 3.8501226435309084e-05} +{"train_loss": 0.0011630784720182419, "global_step": 41187, "epoch": 346, "lr": 3.849907032054674e-05} +{"train_loss": 0.0020262834150344133, "global_step": 41188, "epoch": 346, "lr": 3.8496914228365225e-05} +{"train_loss": 0.0009556276490911841, "global_step": 41189, "epoch": 346, "lr": 3.8494758158768785e-05} +{"train_loss": 0.0012782705016434193, "global_step": 41190, "epoch": 346, "lr": 3.8492602111761664e-05} +{"train_loss": 0.0011786051327362657, "global_step": 41191, "epoch": 346, "lr": 3.849044608734809e-05} +{"train_loss": 0.0017074896022677422, "global_step": 41192, "epoch": 346, "lr": 3.84882900855323e-05} +{"train_loss": 0.0011915595969185233, "global_step": 41193, "epoch": 346, "lr": 3.84861341063185e-05} +{"train_loss": 0.001853438327088952, "global_step": 41194, "epoch": 346, "lr": 3.848397814971097e-05} +{"train_loss": 0.0018909526988863945, "global_step": 41195, "epoch": 346, "lr": 3.848182221571392e-05} +{"train_loss": 0.002495942637324333, "global_step": 41196, "epoch": 346, "lr": 3.847966630433157e-05} +{"train_loss": 0.0016309486236423254, "global_step": 41197, "epoch": 346, "lr": 3.8477510415568173e-05} +{"train_loss": 0.0010894933948293328, "global_step": 41198, "epoch": 346, "lr": 3.8475354549427937e-05} +{"train_loss": 0.001696971943601966, "global_step": 41199, "epoch": 346, "lr": 3.8473198705915135e-05} +{"train_loss": 0.002060465281829238, "global_step": 41200, "epoch": 346, "lr": 3.8471042885033976e-05} +{"train_loss": 0.003404908813536167, "global_step": 41201, "epoch": 346, "lr": 3.846888708678866e-05} +{"train_loss": 0.0006728778243996203, "global_step": 41202, "epoch": 346, "lr": 3.846673131118349e-05} +{"train_loss": 0.0013880227925255895, "global_step": 41203, "epoch": 346, "lr": 3.846457555822263e-05} +{"train_loss": 0.001607911428436637, "global_step": 41204, "epoch": 346, "lr": 3.846241982791037e-05} +{"train_loss": 0.0013473063008859754, "global_step": 41205, "epoch": 346, "lr": 3.8460264120250886e-05} +{"train_loss": 0.0020075917709618807, "global_step": 41206, "epoch": 346, "lr": 3.8458108435248455e-05} +{"train_loss": 0.0014771458227187395, "global_step": 41207, "epoch": 346, "lr": 3.845595277290731e-05} +{"train_loss": 0.001748251379467547, "global_step": 41208, "epoch": 346, "lr": 3.845379713323165e-05} +{"train_loss": 0.0015586181543767452, "global_step": 41209, "epoch": 346, "lr": 3.8451641516225736e-05} +{"train_loss": 0.0018519399454817176, "global_step": 41210, "epoch": 346, "lr": 3.844948592189378e-05} +{"train_loss": 0.0016403158660978079, "global_step": 41211, "epoch": 346, "lr": 3.8447330350240035e-05} +{"train_loss": 0.0013332689413800836, "global_step": 41212, "epoch": 346, "lr": 3.844517480126873e-05} +{"train_loss": 0.0016135924961417913, "global_step": 41213, "epoch": 346, "lr": 3.8443019274984066e-05} +{"train_loss": 0.0019482241477817297, "global_step": 41214, "epoch": 346, "lr": 3.8440863771390315e-05} +{"train_loss": 0.0016787811182439327, "global_step": 41215, "epoch": 346, "lr": 3.843870829049168e-05} +{"train_loss": 0.0023634349927306175, "global_step": 41216, "epoch": 346, "lr": 3.8436552832292425e-05} +{"train_loss": 0.0019649795722216368, "global_step": 41217, "epoch": 346, "lr": 3.843439739679674e-05} +{"train_loss": 0.0016988026909530163, "global_step": 41218, "epoch": 346, "lr": 3.84322419840089e-05} +{"train_loss": 0.0023872326128184795, "global_step": 41219, "epoch": 346, "lr": 3.843008659393311e-05} +{"train_loss": 0.0010637418599799275, "global_step": 41220, "epoch": 346, "lr": 3.842793122657361e-05} +{"train_loss": 0.002417101990431547, "global_step": 41221, "epoch": 346, "lr": 3.8425775881934634e-05} +{"train_loss": 0.0020050061866641045, "global_step": 41222, "epoch": 346, "lr": 3.8423620560020404e-05} +{"train_loss": 0.0026185279712080956, "global_step": 41223, "epoch": 346, "lr": 3.842146526083515e-05} +{"train_loss": 0.0009665242396295071, "global_step": 41224, "epoch": 346, "lr": 3.8419309984383125e-05} +{"train_loss": 0.001513660536147654, "global_step": 41225, "epoch": 346, "lr": 3.8417154730668546e-05} +{"train_loss": 0.0013299918500706553, "global_step": 41226, "epoch": 346, "lr": 3.841499949969566e-05} +{"train_loss": 0.0019445442594587803, "global_step": 41227, "epoch": 346, "lr": 3.841284429146866e-05} +{"train_loss": 0.0021983019541949034, "global_step": 41228, "epoch": 346, "lr": 3.841068910599182e-05} +{"train_loss": 0.0012196276802569628, "global_step": 41229, "epoch": 346, "lr": 3.8408533943269334e-05} +{"train_loss": 0.0010285633616149426, "global_step": 41230, "epoch": 346, "lr": 3.840637880330547e-05} +{"train_loss": 0.002879314823076129, "global_step": 41231, "epoch": 346, "lr": 3.8404223686104457e-05} +{"train_loss": 0.001923483912833035, "global_step": 41232, "epoch": 346, "lr": 3.840206859167048e-05} +{"train_loss": 0.0015618088655173779, "global_step": 41233, "epoch": 346, "lr": 3.8399913520007825e-05} +{"train_loss": 0.0011853801552206278, "global_step": 41234, "epoch": 346, "lr": 3.839775847112068e-05} +{"train_loss": 0.0014923122944310308, "global_step": 41235, "epoch": 346, "lr": 3.839560344501332e-05} +{"train_loss": 0.0022111430298537016, "global_step": 41236, "epoch": 346, "lr": 3.839344844168993e-05} +{"train_loss": 0.0020452281460165977, "global_step": 41237, "epoch": 346, "lr": 3.8391293461154776e-05} +{"train_loss": 0.0013712826184928417, "global_step": 41238, "epoch": 346, "lr": 3.838913850341208e-05} +{"train_loss": 0.0010999121004715562, "global_step": 41239, "epoch": 346, "lr": 3.838698356846606e-05} +{"train_loss": 0.002969631226733327, "global_step": 41240, "epoch": 346, "lr": 3.838482865632097e-05} +{"train_loss": 0.002567945048213005, "global_step": 41241, "epoch": 346, "lr": 3.8382673766981e-05} +{"train_loss": 0.0008515557856298983, "global_step": 41242, "epoch": 346, "lr": 3.838051890045045e-05} +{"train_loss": 0.0009467067429795861, "global_step": 41243, "epoch": 346, "lr": 3.8378364056733474e-05} +{"train_loss": 0.001393343205563724, "global_step": 41244, "epoch": 346, "lr": 3.837620923583436e-05} +{"train_loss": 0.0014769401168450713, "global_step": 41245, "epoch": 346, "lr": 3.8374054437757323e-05} +{"train_loss": 0.0015303591499105096, "global_step": 41246, "epoch": 346, "lr": 3.8371899662506564e-05} +{"train_loss": 0.0012452169321477413, "global_step": 41247, "epoch": 346, "lr": 3.836974491008636e-05} +{"train_loss": 0.0015730592422187328, "global_step": 41248, "epoch": 346, "lr": 3.83675901805009e-05} +{"train_loss": 0.0016334300162270665, "global_step": 41249, "epoch": 346, "lr": 3.836543547375445e-05} +{"train_loss": 0.002458515577018261, "global_step": 41250, "epoch": 346, "lr": 3.836328078985123e-05} +{"train_loss": 0.0011083370773121715, "global_step": 41251, "epoch": 346, "lr": 3.8361126128795445e-05} +{"train_loss": 0.0019523140508681536, "global_step": 41252, "epoch": 346, "lr": 3.835897149059136e-05} +{"train_loss": 0.0013659134274348617, "global_step": 41253, "epoch": 346, "lr": 3.835681687524317e-05} +{"train_loss": 0.0011319651966914535, "global_step": 41254, "epoch": 346, "lr": 3.8354662282755146e-05} +{"train_loss": 0.0016897973837330937, "global_step": 41255, "epoch": 346, "lr": 3.8352507713131494e-05} +{"train_loss": 0.0011312998831272125, "global_step": 41256, "epoch": 346, "lr": 3.8350353166376444e-05} +{"train_loss": 0.002637493424117565, "global_step": 41257, "epoch": 346, "lr": 3.8348198642494244e-05} +{"train_loss": 0.000860836124047637, "global_step": 41258, "epoch": 346, "lr": 3.834604414148909e-05} +{"train_loss": 0.0031153413001447916, "global_step": 41259, "epoch": 346, "lr": 3.834388966336525e-05} +{"train_loss": 0.0010714551899582148, "global_step": 41260, "epoch": 346, "lr": 3.834173520812693e-05} +{"train_loss": 0.0017348277615383267, "global_step": 41261, "epoch": 346, "lr": 3.8339580775778374e-05} +{"train_loss": 0.0020464935805648565, "global_step": 41262, "epoch": 346, "lr": 3.8337426366323794e-05} +{"train_loss": 0.0008963024010881782, "global_step": 41263, "epoch": 346, "lr": 3.833527197976745e-05} +{"train_loss": 0.0017298852326348424, "global_step": 41264, "epoch": 346, "lr": 3.8333117616113545e-05} +{"train_loss": 0.0012054287362843752, "global_step": 41265, "epoch": 346, "lr": 3.8330963275366306e-05} +{"train_loss": 0.001395795843563974, "global_step": 41266, "epoch": 346, "lr": 3.8328808957529994e-05} +{"train_loss": 0.0012891648802906275, "global_step": 41267, "epoch": 346, "lr": 3.832665466260879e-05} +{"train_loss": 0.0016778046265244484, "global_step": 41268, "epoch": 346, "lr": 3.832450039060698e-05} +{"train_loss": 0.0025325478054583073, "global_step": 41269, "epoch": 346, "lr": 3.832234614152875e-05} +{"train_loss": 0.0016921742353588343, "global_step": 41270, "epoch": 346, "lr": 3.832019191537836e-05} +{"train_loss": 0.0017265265341848135, "global_step": 41271, "epoch": 346, "lr": 3.831803771216001e-05} +{"train_loss": 0.0018424482550472021, "global_step": 41272, "epoch": 346, "lr": 3.831588353187795e-05} +{"train_loss": 0.0006942992913536727, "global_step": 41273, "epoch": 346, "lr": 3.8313729374536405e-05} +{"train_loss": 0.0020772700663655996, "global_step": 41274, "epoch": 346, "lr": 3.8311575240139606e-05} +{"train_loss": 0.001553232199512422, "global_step": 41275, "epoch": 346, "lr": 3.830942112869178e-05} +{"train_loss": 0.0023609993513673544, "global_step": 41276, "epoch": 346, "lr": 3.830726704019716e-05} +{"train_loss": 0.0011507547460496426, "global_step": 41277, "epoch": 346, "lr": 3.830511297465996e-05} +{"train_loss": 0.0009343886049464345, "global_step": 41278, "epoch": 346, "lr": 3.8302958932084434e-05} +{"train_loss": 0.0021588311064988375, "global_step": 41279, "epoch": 346, "lr": 3.830080491247479e-05} +{"train_loss": 0.001955178566277027, "global_step": 41280, "epoch": 346, "lr": 3.8298650915835275e-05} +{"train_loss": 0.0023043472319841385, "global_step": 41281, "epoch": 346, "lr": 3.829649694217011e-05} +{"train_loss": 0.001254483126103878, "global_step": 41282, "epoch": 346, "lr": 3.8294342991483505e-05} +{"train_loss": 0.0024430081248283386, "global_step": 41283, "epoch": 346, "lr": 3.829218906377973e-05} +{"train_loss": 0.0015941024757921696, "global_step": 41284, "epoch": 346, "lr": 3.8290035159062965e-05} +{"train_loss": 0.0017578779952600598, "global_step": 41285, "epoch": 346, "lr": 3.828788127733749e-05} +{"train_loss": 0.001443728688172996, "global_step": 41286, "epoch": 346, "lr": 3.828572741860749e-05} +{"train_loss": 0.0013352158712223172, "global_step": 41287, "epoch": 346, "lr": 3.828357358287723e-05} +{"train_loss": 0.0020745687652379274, "global_step": 41288, "epoch": 346, "lr": 3.8281419770150905e-05} +{"train_loss": 0.0011417869245633483, "global_step": 41289, "epoch": 346, "lr": 3.827926598043276e-05} +{"train_loss": 0.0018757502548396587, "global_step": 41290, "epoch": 346, "lr": 3.827711221372704e-05} +{"train_loss": 0.0029017662163823843, "global_step": 41291, "epoch": 346, "lr": 3.8274958470037936e-05} +{"train_loss": 0.0016880343211306055, "global_step": 41292, "epoch": 346, "lr": 3.8272804749369725e-05, "val_loss": 0.023744022473692894} +{"train_loss": 0.0011229217052459717, "global_step": 41293, "epoch": 347, "lr": 3.827065105172658e-05} +{"train_loss": 0.002339733298867941, "global_step": 41294, "epoch": 347, "lr": 3.826849737711279e-05} +{"train_loss": 0.0023255005944520235, "global_step": 41295, "epoch": 347, "lr": 3.826634372553254e-05} +{"train_loss": 0.0020762563217431307, "global_step": 41296, "epoch": 347, "lr": 3.826419009699006e-05} +{"train_loss": 0.0010256139794364572, "global_step": 41297, "epoch": 347, "lr": 3.8262036491489606e-05} +{"train_loss": 0.0016398174921050668, "global_step": 41298, "epoch": 347, "lr": 3.8259882909035366e-05} +{"train_loss": 0.001344590913504362, "global_step": 41299, "epoch": 347, "lr": 3.825772934963161e-05} +{"train_loss": 0.002118093892931938, "global_step": 41300, "epoch": 347, "lr": 3.825557581328256e-05} +{"train_loss": 0.001626059878617525, "global_step": 41301, "epoch": 347, "lr": 3.82534222999924e-05} +{"train_loss": 0.001424548332579434, "global_step": 41302, "epoch": 347, "lr": 3.825126880976542e-05} +{"train_loss": 0.004105424974113703, "global_step": 41303, "epoch": 347, "lr": 3.8249115342605786e-05} +{"train_loss": 0.0010926874820142984, "global_step": 41304, "epoch": 347, "lr": 3.824696189851777e-05} +{"train_loss": 0.0017493395134806633, "global_step": 41305, "epoch": 347, "lr": 3.82448084775056e-05} +{"train_loss": 0.0023238463327288628, "global_step": 41306, "epoch": 347, "lr": 3.824265507957348e-05} +{"train_loss": 0.001748422859236598, "global_step": 41307, "epoch": 347, "lr": 3.8240501704725676e-05} +{"train_loss": 0.0023648596834391356, "global_step": 41308, "epoch": 347, "lr": 3.8238348352966355e-05} +{"train_loss": 0.0015905367908999324, "global_step": 41309, "epoch": 347, "lr": 3.8236195024299815e-05} +{"train_loss": 0.0013608646113425493, "global_step": 41310, "epoch": 347, "lr": 3.8234041718730216e-05} +{"train_loss": 0.0015976089052855968, "global_step": 41311, "epoch": 347, "lr": 3.823188843626185e-05} +{"train_loss": 0.001003088429570198, "global_step": 41312, "epoch": 347, "lr": 3.822973517689889e-05} +{"train_loss": 0.0018277118215337396, "global_step": 41313, "epoch": 347, "lr": 3.822758194064561e-05} +{"train_loss": 0.0024328541476279497, "global_step": 41314, "epoch": 347, "lr": 3.822542872750621e-05} +{"train_loss": 0.002390442881733179, "global_step": 41315, "epoch": 347, "lr": 3.82232755374849e-05} +{"train_loss": 0.001614582957699895, "global_step": 41316, "epoch": 347, "lr": 3.822112237058595e-05} +{"train_loss": 0.0013598474906757474, "global_step": 41317, "epoch": 347, "lr": 3.821896922681355e-05} +{"train_loss": 0.0012449820060282946, "global_step": 41318, "epoch": 347, "lr": 3.821681610617197e-05} +{"train_loss": 0.0021471974905580282, "global_step": 41319, "epoch": 347, "lr": 3.821466300866541e-05} +{"train_loss": 0.0019529095152392983, "global_step": 41320, "epoch": 347, "lr": 3.821250993429809e-05} +{"train_loss": 0.0037429446820169687, "global_step": 41321, "epoch": 347, "lr": 3.821035688307424e-05} +{"train_loss": 0.001734980964101851, "global_step": 41322, "epoch": 347, "lr": 3.8208203854998106e-05} +{"train_loss": 0.0022074016742408276, "global_step": 41323, "epoch": 347, "lr": 3.82060508500739e-05} +{"train_loss": 0.0017641236772760749, "global_step": 41324, "epoch": 347, "lr": 3.8203897868305855e-05} +{"train_loss": 0.0012238515773788095, "global_step": 41325, "epoch": 347, "lr": 3.82017449096982e-05} +{"train_loss": 0.001561855198815465, "global_step": 41326, "epoch": 347, "lr": 3.8199591974255156e-05} +{"train_loss": 0.0010604929411783814, "global_step": 41327, "epoch": 347, "lr": 3.8197439061980946e-05} +{"train_loss": 0.0033477770630270243, "global_step": 41328, "epoch": 347, "lr": 3.8195286172879816e-05} +{"train_loss": 0.0012608501128852367, "global_step": 41329, "epoch": 347, "lr": 3.819313330695596e-05} +{"train_loss": 0.0021351026371121407, "global_step": 41330, "epoch": 347, "lr": 3.819098046421364e-05} +{"train_loss": 0.00143009377643466, "global_step": 41331, "epoch": 347, "lr": 3.818882764465706e-05} +{"train_loss": 0.0023219804279506207, "global_step": 41332, "epoch": 347, "lr": 3.818667484829047e-05} +{"train_loss": 0.002509906655177474, "global_step": 41333, "epoch": 347, "lr": 3.818452207511809e-05} +{"train_loss": 0.0018260470824316144, "global_step": 41334, "epoch": 347, "lr": 3.8182369325144104e-05} +{"train_loss": 0.002287616953253746, "global_step": 41335, "epoch": 347, "lr": 3.8180216598372807e-05} +{"train_loss": 0.001442191656678915, "global_step": 41336, "epoch": 347, "lr": 3.8178063894808355e-05} +{"train_loss": 0.0021719359792768955, "global_step": 41337, "epoch": 347, "lr": 3.817591121445505e-05} +{"train_loss": 0.0013801836175844073, "global_step": 41338, "epoch": 347, "lr": 3.8173758557317066e-05} +{"train_loss": 0.00431121326982975, "global_step": 41339, "epoch": 347, "lr": 3.8171605923398625e-05} +{"train_loss": 0.002974167698994279, "global_step": 41340, "epoch": 347, "lr": 3.8169453312704e-05} +{"train_loss": 0.003727475181221962, "global_step": 41341, "epoch": 347, "lr": 3.816730072523736e-05} +{"train_loss": 0.0024050292558968067, "global_step": 41342, "epoch": 347, "lr": 3.816514816100299e-05} +{"train_loss": 0.0013131012674421072, "global_step": 41343, "epoch": 347, "lr": 3.816299562000506e-05} +{"train_loss": 0.0012902232119813561, "global_step": 41344, "epoch": 347, "lr": 3.816084310224785e-05} +{"train_loss": 0.001386262127198279, "global_step": 41345, "epoch": 347, "lr": 3.815869060773556e-05} +{"train_loss": 0.0009934433037415147, "global_step": 41346, "epoch": 347, "lr": 3.8156538136472394e-05} +{"train_loss": 0.003715431783348322, "global_step": 41347, "epoch": 347, "lr": 3.815438568846262e-05} +{"train_loss": 0.002117627067491412, "global_step": 41348, "epoch": 347, "lr": 3.815223326371043e-05} +{"train_loss": 0.0018459392013028264, "global_step": 41349, "epoch": 347, "lr": 3.815008086222007e-05} +{"train_loss": 0.0011343330843374133, "global_step": 41350, "epoch": 347, "lr": 3.814792848399577e-05} +{"train_loss": 0.002940648002550006, "global_step": 41351, "epoch": 347, "lr": 3.814577612904172e-05} +{"train_loss": 0.0017168076010420918, "global_step": 41352, "epoch": 347, "lr": 3.814362379736219e-05} +{"train_loss": 0.0018845766317099333, "global_step": 41353, "epoch": 347, "lr": 3.8141471488961385e-05} +{"train_loss": 0.0017907973378896713, "global_step": 41354, "epoch": 347, "lr": 3.8139319203843535e-05} +{"train_loss": 0.003201450686901808, "global_step": 41355, "epoch": 347, "lr": 3.813716694201286e-05} +{"train_loss": 0.003546668915078044, "global_step": 41356, "epoch": 347, "lr": 3.8135014703473594e-05} +{"train_loss": 0.0018845839658752084, "global_step": 41357, "epoch": 347, "lr": 3.813286248822997e-05} +{"train_loss": 0.0019229449098929763, "global_step": 41358, "epoch": 347, "lr": 3.8130710296286173e-05} +{"train_loss": 0.0014433593023568392, "global_step": 41359, "epoch": 347, "lr": 3.8128558127646494e-05} +{"train_loss": 0.0019895739387720823, "global_step": 41360, "epoch": 347, "lr": 3.8126405982315095e-05} +{"train_loss": 0.0020583930891007185, "global_step": 41361, "epoch": 347, "lr": 3.812425386029625e-05} +{"train_loss": 0.001052717911079526, "global_step": 41362, "epoch": 347, "lr": 3.8122101761594145e-05} +{"train_loss": 0.001961668021976948, "global_step": 41363, "epoch": 347, "lr": 3.8119949686213044e-05} +{"train_loss": 0.000902092142496258, "global_step": 41364, "epoch": 347, "lr": 3.811779763415715e-05} +{"train_loss": 0.0025548553094267845, "global_step": 41365, "epoch": 347, "lr": 3.811564560543067e-05} +{"train_loss": 0.0016701689455658197, "global_step": 41366, "epoch": 347, "lr": 3.811349360003788e-05} +{"train_loss": 0.0011583087034523487, "global_step": 41367, "epoch": 347, "lr": 3.811134161798294e-05} +{"train_loss": 0.0016012501437216997, "global_step": 41368, "epoch": 347, "lr": 3.810918965927014e-05} +{"train_loss": 0.002137955278158188, "global_step": 41369, "epoch": 347, "lr": 3.810703772390366e-05} +{"train_loss": 0.0020787192042917013, "global_step": 41370, "epoch": 347, "lr": 3.810488581188775e-05} +{"train_loss": 0.0019486078526824713, "global_step": 41371, "epoch": 347, "lr": 3.810273392322662e-05} +{"train_loss": 0.001611802028492093, "global_step": 41372, "epoch": 347, "lr": 3.81005820579245e-05} +{"train_loss": 0.0011365001555532217, "global_step": 41373, "epoch": 347, "lr": 3.809843021598562e-05} +{"train_loss": 0.0014045624993741512, "global_step": 41374, "epoch": 347, "lr": 3.809627839741419e-05} +{"train_loss": 0.0011611429508775473, "global_step": 41375, "epoch": 347, "lr": 3.809412660221446e-05} +{"train_loss": 0.0016029475955292583, "global_step": 41376, "epoch": 347, "lr": 3.809197483039065e-05} +{"train_loss": 0.002122236881405115, "global_step": 41377, "epoch": 347, "lr": 3.8089823081946947e-05} +{"train_loss": 0.002160510281100869, "global_step": 41378, "epoch": 347, "lr": 3.808767135688763e-05} +{"train_loss": 0.001970724668353796, "global_step": 41379, "epoch": 347, "lr": 3.808551965521687e-05} +{"train_loss": 0.0012171854032203555, "global_step": 41380, "epoch": 347, "lr": 3.8083367976938946e-05} +{"train_loss": 0.0022180976811796427, "global_step": 41381, "epoch": 347, "lr": 3.8081216322058035e-05} +{"train_loss": 0.001014675130136311, "global_step": 41382, "epoch": 347, "lr": 3.80790646905784e-05} +{"train_loss": 0.0028594438917934895, "global_step": 41383, "epoch": 347, "lr": 3.8076913082504245e-05} +{"train_loss": 0.0007846435764804482, "global_step": 41384, "epoch": 347, "lr": 3.807476149783978e-05} +{"train_loss": 0.002355781150981784, "global_step": 41385, "epoch": 347, "lr": 3.807260993658927e-05} +{"train_loss": 0.001717983279377222, "global_step": 41386, "epoch": 347, "lr": 3.8070458398756893e-05} +{"train_loss": 0.0018235392635688186, "global_step": 41387, "epoch": 347, "lr": 3.806830688434691e-05} +{"train_loss": 0.0014118555700406432, "global_step": 41388, "epoch": 347, "lr": 3.806615539336354e-05} +{"train_loss": 0.0019868421368300915, "global_step": 41389, "epoch": 347, "lr": 3.806400392581098e-05} +{"train_loss": 0.002556747756898403, "global_step": 41390, "epoch": 347, "lr": 3.8061852481693486e-05} +{"train_loss": 0.0018626523669809103, "global_step": 41391, "epoch": 347, "lr": 3.805970106101526e-05} +{"train_loss": 0.0021270141005516052, "global_step": 41392, "epoch": 347, "lr": 3.805754966378055e-05} +{"train_loss": 0.0014255184214562178, "global_step": 41393, "epoch": 347, "lr": 3.805539828999354e-05} +{"train_loss": 0.0013624437851831317, "global_step": 41394, "epoch": 347, "lr": 3.80532469396585e-05} +{"train_loss": 0.0025916756130754948, "global_step": 41395, "epoch": 347, "lr": 3.805109561277965e-05} +{"train_loss": 0.0009272382594645023, "global_step": 41396, "epoch": 347, "lr": 3.804894430936116e-05} +{"train_loss": 0.0021071620285511017, "global_step": 41397, "epoch": 347, "lr": 3.804679302940732e-05} +{"train_loss": 0.002953942632302642, "global_step": 41398, "epoch": 347, "lr": 3.80446417729223e-05} +{"train_loss": 0.001167283859103918, "global_step": 41399, "epoch": 347, "lr": 3.804249053991037e-05} +{"train_loss": 0.0024024159647524357, "global_step": 41400, "epoch": 347, "lr": 3.804033933037572e-05} +{"train_loss": 0.0012555471621453762, "global_step": 41401, "epoch": 347, "lr": 3.803818814432259e-05} +{"train_loss": 0.0012299963273108006, "global_step": 41402, "epoch": 347, "lr": 3.8036036981755196e-05} +{"train_loss": 0.0028300287667661905, "global_step": 41403, "epoch": 347, "lr": 3.803388584267777e-05} +{"train_loss": 0.0018825535662472248, "global_step": 41404, "epoch": 347, "lr": 3.803173472709453e-05} +{"train_loss": 0.0018305381527170539, "global_step": 41405, "epoch": 347, "lr": 3.802958363500969e-05} +{"train_loss": 0.001208438421599567, "global_step": 41406, "epoch": 347, "lr": 3.8027432566427495e-05} +{"train_loss": 0.001367430668324232, "global_step": 41407, "epoch": 347, "lr": 3.8025281521352165e-05} +{"train_loss": 0.002008631592616439, "global_step": 41408, "epoch": 347, "lr": 3.8023130499787895e-05} +{"train_loss": 0.001677564810961485, "global_step": 41409, "epoch": 347, "lr": 3.8020979501738946e-05} +{"train_loss": 0.0023374808952212334, "global_step": 41410, "epoch": 347, "lr": 3.801882852720951e-05} +{"train_loss": 0.0019001061778648623, "global_step": 41411, "epoch": 347, "lr": 3.801667757620384e-05, "val_loss": 0.0314689502120018} +{"train_loss": 0.0009850967908278108, "global_step": 41412, "epoch": 348, "lr": 3.801452664872612e-05} +{"train_loss": 0.0021061289589852095, "global_step": 41413, "epoch": 348, "lr": 3.801237574478062e-05} +{"train_loss": 0.0024478412233293056, "global_step": 41414, "epoch": 348, "lr": 3.801022486437154e-05} +{"train_loss": 0.002225514268502593, "global_step": 41415, "epoch": 348, "lr": 3.800807400750308e-05} +{"train_loss": 0.0018797112861648202, "global_step": 41416, "epoch": 348, "lr": 3.8005923174179516e-05} +{"train_loss": 0.001724021858535707, "global_step": 41417, "epoch": 348, "lr": 3.8003772364405006e-05} +{"train_loss": 0.0012411241186782718, "global_step": 41418, "epoch": 348, "lr": 3.800162157818383e-05} +{"train_loss": 0.0013440110487863421, "global_step": 41419, "epoch": 348, "lr": 3.799947081552019e-05} +{"train_loss": 0.0024306587874889374, "global_step": 41420, "epoch": 348, "lr": 3.7997320076418294e-05} +{"train_loss": 0.0014257519505918026, "global_step": 41421, "epoch": 348, "lr": 3.7995169360882385e-05} +{"train_loss": 0.0026331553235650063, "global_step": 41422, "epoch": 348, "lr": 3.7993018668916667e-05} +{"train_loss": 0.001450832700356841, "global_step": 41423, "epoch": 348, "lr": 3.799086800052539e-05} +{"train_loss": 0.00260132341645658, "global_step": 41424, "epoch": 348, "lr": 3.7988717355712744e-05} +{"train_loss": 0.0019579778891056776, "global_step": 41425, "epoch": 348, "lr": 3.7986566734482984e-05} +{"train_loss": 0.0023388818372040987, "global_step": 41426, "epoch": 348, "lr": 3.798441613684032e-05} +{"train_loss": 0.0010831599356606603, "global_step": 41427, "epoch": 348, "lr": 3.798226556278895e-05} +{"train_loss": 0.0021604818757623434, "global_step": 41428, "epoch": 348, "lr": 3.7980115012333145e-05} +{"train_loss": 0.001681781723164022, "global_step": 41429, "epoch": 348, "lr": 3.797796448547707e-05} +{"train_loss": 0.0015178591711446643, "global_step": 41430, "epoch": 348, "lr": 3.797581398222501e-05} +{"train_loss": 0.002091251779347658, "global_step": 41431, "epoch": 348, "lr": 3.797366350258112e-05} +{"train_loss": 0.0013624735875055194, "global_step": 41432, "epoch": 348, "lr": 3.797151304654969e-05} +{"train_loss": 0.0019586095586419106, "global_step": 41433, "epoch": 348, "lr": 3.79693626141349e-05} +{"train_loss": 0.0009956425055861473, "global_step": 41434, "epoch": 348, "lr": 3.7967212205340964e-05} +{"train_loss": 0.0017448340076953173, "global_step": 41435, "epoch": 348, "lr": 3.7965061820172143e-05} +{"train_loss": 0.0016409896779805422, "global_step": 41436, "epoch": 348, "lr": 3.796291145863261e-05} +{"train_loss": 0.0021018157713115215, "global_step": 41437, "epoch": 348, "lr": 3.796076112072663e-05} +{"train_loss": 0.0012008061166852713, "global_step": 41438, "epoch": 348, "lr": 3.795861080645842e-05} +{"train_loss": 0.0018369724275544286, "global_step": 41439, "epoch": 348, "lr": 3.795646051583217e-05} +{"train_loss": 0.0015453858068212867, "global_step": 41440, "epoch": 348, "lr": 3.7954310248852145e-05} +{"train_loss": 0.002087364438921213, "global_step": 41441, "epoch": 348, "lr": 3.795216000552252e-05} +{"train_loss": 0.001274833339266479, "global_step": 41442, "epoch": 348, "lr": 3.795000978584757e-05} +{"train_loss": 0.0016877963207662106, "global_step": 41443, "epoch": 348, "lr": 3.794785958983146e-05} +{"train_loss": 0.0017870650626718998, "global_step": 41444, "epoch": 348, "lr": 3.7945709417478467e-05} +{"train_loss": 0.0019545648247003555, "global_step": 41445, "epoch": 348, "lr": 3.794355926879278e-05} +{"train_loss": 0.0015417670365422964, "global_step": 41446, "epoch": 348, "lr": 3.794140914377861e-05} +{"train_loss": 0.00153070455417037, "global_step": 41447, "epoch": 348, "lr": 3.793925904244021e-05} +{"train_loss": 0.0011371576692909002, "global_step": 41448, "epoch": 348, "lr": 3.793710896478178e-05} +{"train_loss": 0.0010779722360894084, "global_step": 41449, "epoch": 348, "lr": 3.793495891080755e-05} +{"train_loss": 0.002447857754305005, "global_step": 41450, "epoch": 348, "lr": 3.793280888052173e-05} +{"train_loss": 0.001359479851089418, "global_step": 41451, "epoch": 348, "lr": 3.7930658873928565e-05} +{"train_loss": 0.0022466746158897877, "global_step": 41452, "epoch": 348, "lr": 3.792850889103225e-05} +{"train_loss": 0.0020485571585595608, "global_step": 41453, "epoch": 348, "lr": 3.792635893183703e-05} +{"train_loss": 0.002283461857587099, "global_step": 41454, "epoch": 348, "lr": 3.79242089963471e-05} +{"train_loss": 0.0023237308487296104, "global_step": 41455, "epoch": 348, "lr": 3.792205908456671e-05} +{"train_loss": 0.0009872913360595703, "global_step": 41456, "epoch": 348, "lr": 3.791990919650006e-05} +{"train_loss": 0.0019143421668559313, "global_step": 41457, "epoch": 348, "lr": 3.7917759332151386e-05} +{"train_loss": 0.0009207214461639524, "global_step": 41458, "epoch": 348, "lr": 3.7915609491524876e-05} +{"train_loss": 0.001873024390079081, "global_step": 41459, "epoch": 348, "lr": 3.791345967462481e-05} +{"train_loss": 0.0015467171324416995, "global_step": 41460, "epoch": 348, "lr": 3.7911309881455345e-05} +{"train_loss": 0.002055761171504855, "global_step": 41461, "epoch": 348, "lr": 3.790916011202075e-05} +{"train_loss": 0.0012469720095396042, "global_step": 41462, "epoch": 348, "lr": 3.7907010366325204e-05} +{"train_loss": 0.000960599456448108, "global_step": 41463, "epoch": 348, "lr": 3.7904860644372984e-05} +{"train_loss": 0.001263245358131826, "global_step": 41464, "epoch": 348, "lr": 3.7902710946168273e-05} +{"train_loss": 0.0009680005023255944, "global_step": 41465, "epoch": 348, "lr": 3.7900561271715275e-05} +{"train_loss": 0.0015088539803400636, "global_step": 41466, "epoch": 348, "lr": 3.789841162101825e-05} +{"train_loss": 0.0017569484189152718, "global_step": 41467, "epoch": 348, "lr": 3.789626199408138e-05} +{"train_loss": 0.002208767691627145, "global_step": 41468, "epoch": 348, "lr": 3.789411239090893e-05} +{"train_loss": 0.0018345743883401155, "global_step": 41469, "epoch": 348, "lr": 3.789196281150509e-05} +{"train_loss": 0.002025071531534195, "global_step": 41470, "epoch": 348, "lr": 3.7889813255874084e-05} +{"train_loss": 0.0008186421473510563, "global_step": 41471, "epoch": 348, "lr": 3.788766372402013e-05} +{"train_loss": 0.0015194176230579615, "global_step": 41472, "epoch": 348, "lr": 3.788551421594745e-05} +{"train_loss": 0.0025629557203501463, "global_step": 41473, "epoch": 348, "lr": 3.788336473166029e-05} +{"train_loss": 0.0015238195192068815, "global_step": 41474, "epoch": 348, "lr": 3.7881215271162826e-05} +{"train_loss": 0.0021914029493927956, "global_step": 41475, "epoch": 348, "lr": 3.7879065834459325e-05} +{"train_loss": 0.00168685766402632, "global_step": 41476, "epoch": 348, "lr": 3.787691642155399e-05} +{"train_loss": 0.0021264313254505396, "global_step": 41477, "epoch": 348, "lr": 3.7874767032451e-05} +{"train_loss": 0.0015717183705419302, "global_step": 41478, "epoch": 348, "lr": 3.787261766715464e-05} +{"train_loss": 0.000995137495920062, "global_step": 41479, "epoch": 348, "lr": 3.7870468325669066e-05} +{"train_loss": 0.001429308787919581, "global_step": 41480, "epoch": 348, "lr": 3.786831900799856e-05} +{"train_loss": 0.0018540127202868462, "global_step": 41481, "epoch": 348, "lr": 3.78661697141473e-05} +{"train_loss": 0.0014748183311894536, "global_step": 41482, "epoch": 348, "lr": 3.786402044411953e-05} +{"train_loss": 0.0013366017956286669, "global_step": 41483, "epoch": 348, "lr": 3.7861871197919465e-05} +{"train_loss": 0.0015694844769313931, "global_step": 41484, "epoch": 348, "lr": 3.7859721975551295e-05} +{"train_loss": 0.001955186016857624, "global_step": 41485, "epoch": 348, "lr": 3.7857572777019276e-05} +{"train_loss": 0.001447396702133119, "global_step": 41486, "epoch": 348, "lr": 3.7855423602327615e-05} +{"train_loss": 0.001175035024061799, "global_step": 41487, "epoch": 348, "lr": 3.785327445148053e-05} +{"train_loss": 0.0015119562158361077, "global_step": 41488, "epoch": 348, "lr": 3.7851125324482265e-05} +{"train_loss": 0.0013550689909607172, "global_step": 41489, "epoch": 348, "lr": 3.784897622133698e-05} +{"train_loss": 0.0009241324733011425, "global_step": 41490, "epoch": 348, "lr": 3.784682714204896e-05} +{"train_loss": 0.0018301644595339894, "global_step": 41491, "epoch": 348, "lr": 3.7844678086622373e-05} +{"train_loss": 0.0013587538851425052, "global_step": 41492, "epoch": 348, "lr": 3.7842529055061494e-05} +{"train_loss": 0.001266320119611919, "global_step": 41493, "epoch": 348, "lr": 3.7840380047370477e-05} +{"train_loss": 0.0015960695454850793, "global_step": 41494, "epoch": 348, "lr": 3.78382310635536e-05} +{"train_loss": 0.0029957739170640707, "global_step": 41495, "epoch": 348, "lr": 3.783608210361505e-05} +{"train_loss": 0.0008522138232365251, "global_step": 41496, "epoch": 348, "lr": 3.783393316755905e-05} +{"train_loss": 0.0017422859091311693, "global_step": 41497, "epoch": 348, "lr": 3.783178425538983e-05} +{"train_loss": 0.0016316105611622334, "global_step": 41498, "epoch": 348, "lr": 3.7829635367111584e-05} +{"train_loss": 0.0019441210897639394, "global_step": 41499, "epoch": 348, "lr": 3.7827486502728574e-05} +{"train_loss": 0.0017676346469670534, "global_step": 41500, "epoch": 348, "lr": 3.7825337662244964e-05} +{"train_loss": 0.0009340854594483972, "global_step": 41501, "epoch": 348, "lr": 3.7823188845665024e-05} +{"train_loss": 0.0017911792965605855, "global_step": 41502, "epoch": 348, "lr": 3.782104005299295e-05} +{"train_loss": 0.001162899425253272, "global_step": 41503, "epoch": 348, "lr": 3.781889128423296e-05} +{"train_loss": 0.0014811997534707189, "global_step": 41504, "epoch": 348, "lr": 3.7816742539389275e-05} +{"train_loss": 0.0027052750810980797, "global_step": 41505, "epoch": 348, "lr": 3.781459381846611e-05} +{"train_loss": 0.001665207208134234, "global_step": 41506, "epoch": 348, "lr": 3.781244512146769e-05} +{"train_loss": 0.0012859369162470102, "global_step": 41507, "epoch": 348, "lr": 3.7810296448398245e-05} +{"train_loss": 0.0012221818324178457, "global_step": 41508, "epoch": 348, "lr": 3.780814779926195e-05} +{"train_loss": 0.0007406605873256922, "global_step": 41509, "epoch": 348, "lr": 3.780599917406309e-05} +{"train_loss": 0.0015112455002963543, "global_step": 41510, "epoch": 348, "lr": 3.780385057280582e-05} +{"train_loss": 0.0035099941305816174, "global_step": 41511, "epoch": 348, "lr": 3.780170199549441e-05} +{"train_loss": 0.0011199809378013015, "global_step": 41512, "epoch": 348, "lr": 3.7799553442133026e-05} +{"train_loss": 0.0015574019635096192, "global_step": 41513, "epoch": 348, "lr": 3.7797404912725945e-05} +{"train_loss": 0.0019411502871662378, "global_step": 41514, "epoch": 348, "lr": 3.7795256407277355e-05} +{"train_loss": 0.002017656108364463, "global_step": 41515, "epoch": 348, "lr": 3.779310792579145e-05} +{"train_loss": 0.0024759217631071806, "global_step": 41516, "epoch": 348, "lr": 3.7790959468272494e-05} +{"train_loss": 0.002865486079826951, "global_step": 41517, "epoch": 348, "lr": 3.778881103472467e-05} +{"train_loss": 0.0018432801589369774, "global_step": 41518, "epoch": 348, "lr": 3.7786662625152224e-05} +{"train_loss": 0.0011694099521264434, "global_step": 41519, "epoch": 348, "lr": 3.778451423955936e-05} +{"train_loss": 0.0011767704272642732, "global_step": 41520, "epoch": 348, "lr": 3.778236587795028e-05} +{"train_loss": 0.0024820277467370033, "global_step": 41521, "epoch": 348, "lr": 3.7780217540329243e-05} +{"train_loss": 0.002286578994244337, "global_step": 41522, "epoch": 348, "lr": 3.777806922670042e-05} +{"train_loss": 0.0013175115454941988, "global_step": 41523, "epoch": 348, "lr": 3.777592093706808e-05} +{"train_loss": 0.0012920030858367682, "global_step": 41524, "epoch": 348, "lr": 3.777377267143638e-05} +{"train_loss": 0.0015494561521336436, "global_step": 41525, "epoch": 348, "lr": 3.77716244298096e-05} +{"train_loss": 0.001425263937562704, "global_step": 41526, "epoch": 348, "lr": 3.776947621219193e-05} +{"train_loss": 0.0010597649961709976, "global_step": 41527, "epoch": 348, "lr": 3.776732801858756e-05} +{"train_loss": 0.0009263501269742846, "global_step": 41528, "epoch": 348, "lr": 3.7765179849000765e-05} +{"train_loss": 0.002499982248991728, "global_step": 41529, "epoch": 348, "lr": 3.7763031703435705e-05} +{"train_loss": 0.0016831055292350968, "global_step": 41530, "epoch": 348, "lr": 3.7760883581896645e-05, "val_loss": 0.018797749653458595} +{"train_loss": 0.0017675833078101277, "global_step": 41531, "epoch": 349, "lr": 3.775873548438776e-05} +{"train_loss": 0.002003764035180211, "global_step": 41532, "epoch": 349, "lr": 3.7756587410913316e-05} +{"train_loss": 0.0017030747840180993, "global_step": 41533, "epoch": 349, "lr": 3.7754439361477496e-05} +{"train_loss": 0.0013369153020903468, "global_step": 41534, "epoch": 349, "lr": 3.775229133608452e-05} +{"train_loss": 0.0022364361211657524, "global_step": 41535, "epoch": 349, "lr": 3.775014333473861e-05} +{"train_loss": 0.001288209343329072, "global_step": 41536, "epoch": 349, "lr": 3.774799535744399e-05} +{"train_loss": 0.0018433313816785812, "global_step": 41537, "epoch": 349, "lr": 3.774584740420488e-05} +{"train_loss": 0.002232852391898632, "global_step": 41538, "epoch": 349, "lr": 3.774369947502548e-05} +{"train_loss": 0.0018991216784343123, "global_step": 41539, "epoch": 349, "lr": 3.7741551569910015e-05} +{"train_loss": 0.0014524670550599694, "global_step": 41540, "epoch": 349, "lr": 3.773940368886272e-05} +{"train_loss": 0.0014070754405111074, "global_step": 41541, "epoch": 349, "lr": 3.773725583188777e-05} +{"train_loss": 0.0015052052913233638, "global_step": 41542, "epoch": 349, "lr": 3.773510799898943e-05} +{"train_loss": 0.0025667964946478605, "global_step": 41543, "epoch": 349, "lr": 3.7732960190171877e-05} +{"train_loss": 0.0013915190938860178, "global_step": 41544, "epoch": 349, "lr": 3.773081240543936e-05} +{"train_loss": 0.0018316330388188362, "global_step": 41545, "epoch": 349, "lr": 3.7728664644796084e-05} +{"train_loss": 0.0018768359441310167, "global_step": 41546, "epoch": 349, "lr": 3.772651690824625e-05} +{"train_loss": 0.0013449214166030288, "global_step": 41547, "epoch": 349, "lr": 3.772436919579411e-05} +{"train_loss": 0.0015778170200064778, "global_step": 41548, "epoch": 349, "lr": 3.7722221507443825e-05} +{"train_loss": 0.0009717968059703708, "global_step": 41549, "epoch": 349, "lr": 3.772007384319968e-05} +{"train_loss": 0.0010161229874938726, "global_step": 41550, "epoch": 349, "lr": 3.7717926203065834e-05} +{"train_loss": 0.0008831301238387823, "global_step": 41551, "epoch": 349, "lr": 3.7715778587046554e-05} +{"train_loss": 0.0020235104020684958, "global_step": 41552, "epoch": 349, "lr": 3.771363099514601e-05} +{"train_loss": 0.002605419373139739, "global_step": 41553, "epoch": 349, "lr": 3.771148342736844e-05} +{"train_loss": 0.001777163241058588, "global_step": 41554, "epoch": 349, "lr": 3.7709335883718063e-05} +{"train_loss": 0.0012014966923743486, "global_step": 41555, "epoch": 349, "lr": 3.7707188364199086e-05} +{"train_loss": 0.0014538696268573403, "global_step": 41556, "epoch": 349, "lr": 3.770504086881575e-05} +{"train_loss": 0.0013688576873391867, "global_step": 41557, "epoch": 349, "lr": 3.770289339757225e-05} +{"train_loss": 0.0016634525964036584, "global_step": 41558, "epoch": 349, "lr": 3.770074595047278e-05} +{"train_loss": 0.0018763133557513356, "global_step": 41559, "epoch": 349, "lr": 3.769859852752161e-05} +{"train_loss": 0.001121410634368658, "global_step": 41560, "epoch": 349, "lr": 3.7696451128722906e-05} +{"train_loss": 0.001282982062548399, "global_step": 41561, "epoch": 349, "lr": 3.7694303754080925e-05} +{"train_loss": 0.0014118485851213336, "global_step": 41562, "epoch": 349, "lr": 3.769215640359984e-05} +{"train_loss": 0.0015695111360400915, "global_step": 41563, "epoch": 349, "lr": 3.7690009077283914e-05} +{"train_loss": 0.002029668539762497, "global_step": 41564, "epoch": 349, "lr": 3.768786177513734e-05} +{"train_loss": 0.0027746777050197124, "global_step": 41565, "epoch": 349, "lr": 3.768571449716432e-05} +{"train_loss": 0.00208007893525064, "global_step": 41566, "epoch": 349, "lr": 3.768356724336909e-05} +{"train_loss": 0.002176440553739667, "global_step": 41567, "epoch": 349, "lr": 3.7681420013755845e-05} +{"train_loss": 0.001569858635775745, "global_step": 41568, "epoch": 349, "lr": 3.767927280832883e-05} +{"train_loss": 0.0013402767945080996, "global_step": 41569, "epoch": 349, "lr": 3.7677125627092244e-05} +{"train_loss": 0.0013638719683513045, "global_step": 41570, "epoch": 349, "lr": 3.767497847005031e-05} +{"train_loss": 0.0011427572462707758, "global_step": 41571, "epoch": 349, "lr": 3.7672831337207246e-05} +{"train_loss": 0.0019832889083772898, "global_step": 41572, "epoch": 349, "lr": 3.767068422856724e-05} +{"train_loss": 0.001509074936620891, "global_step": 41573, "epoch": 349, "lr": 3.766853714413455e-05} +{"train_loss": 0.0020280450116842985, "global_step": 41574, "epoch": 349, "lr": 3.766639008391335e-05} +{"train_loss": 0.0023339230101555586, "global_step": 41575, "epoch": 349, "lr": 3.766424304790789e-05} +{"train_loss": 0.0015991131076589227, "global_step": 41576, "epoch": 349, "lr": 3.766209603612237e-05} +{"train_loss": 0.0030801782850176096, "global_step": 41577, "epoch": 349, "lr": 3.765994904856099e-05} +{"train_loss": 0.0010231670457869768, "global_step": 41578, "epoch": 349, "lr": 3.7657802085228004e-05} +{"train_loss": 0.0010711060604080558, "global_step": 41579, "epoch": 349, "lr": 3.7655655146127586e-05} +{"train_loss": 0.002722590696066618, "global_step": 41580, "epoch": 349, "lr": 3.765350823126399e-05} +{"train_loss": 0.001712752622552216, "global_step": 41581, "epoch": 349, "lr": 3.765136134064139e-05} +{"train_loss": 0.00236912677064538, "global_step": 41582, "epoch": 349, "lr": 3.764921447426404e-05} +{"train_loss": 0.0010956337209790945, "global_step": 41583, "epoch": 349, "lr": 3.764706763213613e-05} +{"train_loss": 0.002263708971440792, "global_step": 41584, "epoch": 349, "lr": 3.7644920814261884e-05} +{"train_loss": 0.0014959560940042138, "global_step": 41585, "epoch": 349, "lr": 3.7642774020645514e-05} +{"train_loss": 0.003599320538341999, "global_step": 41586, "epoch": 349, "lr": 3.764062725129124e-05} +{"train_loss": 0.0015626098029315472, "global_step": 41587, "epoch": 349, "lr": 3.7638480506203275e-05} +{"train_loss": 0.0018232209840789437, "global_step": 41588, "epoch": 349, "lr": 3.7636333785385836e-05} +{"train_loss": 0.0019037718884646893, "global_step": 41589, "epoch": 349, "lr": 3.763418708884312e-05} +{"train_loss": 0.0017238646978512406, "global_step": 41590, "epoch": 349, "lr": 3.763204041657937e-05} +{"train_loss": 0.0014823885867372155, "global_step": 41591, "epoch": 349, "lr": 3.762989376859878e-05} +{"train_loss": 0.0018675265600904822, "global_step": 41592, "epoch": 349, "lr": 3.7627747144905586e-05} +{"train_loss": 0.0010870842961594462, "global_step": 41593, "epoch": 349, "lr": 3.7625600545503964e-05} +{"train_loss": 0.0027284256648272276, "global_step": 41594, "epoch": 349, "lr": 3.7623453970398174e-05} +{"train_loss": 0.0023084799759089947, "global_step": 41595, "epoch": 349, "lr": 3.762130741959242e-05} +{"train_loss": 0.0021269735880196095, "global_step": 41596, "epoch": 349, "lr": 3.7619160893090877e-05} +{"train_loss": 0.0014950071927160025, "global_step": 41597, "epoch": 349, "lr": 3.761701439089781e-05} +{"train_loss": 0.0015776820946484804, "global_step": 41598, "epoch": 349, "lr": 3.761486791301739e-05} +{"train_loss": 0.001812591915950179, "global_step": 41599, "epoch": 349, "lr": 3.761272145945388e-05} +{"train_loss": 0.0010797677095979452, "global_step": 41600, "epoch": 349, "lr": 3.761057503021144e-05} +{"train_loss": 0.0012264061952009797, "global_step": 41601, "epoch": 349, "lr": 3.7608428625294345e-05} +{"train_loss": 0.0014151943614706397, "global_step": 41602, "epoch": 349, "lr": 3.760628224470676e-05} +{"train_loss": 0.0015783251728862524, "global_step": 41603, "epoch": 349, "lr": 3.76041358884529e-05} +{"train_loss": 0.0029620849527418613, "global_step": 41604, "epoch": 349, "lr": 3.760198955653702e-05} +{"train_loss": 0.0014338765759021044, "global_step": 41605, "epoch": 349, "lr": 3.759984324896329e-05} +{"train_loss": 0.002007467905059457, "global_step": 41606, "epoch": 349, "lr": 3.7597696965735965e-05} +{"train_loss": 0.0026532819028943777, "global_step": 41607, "epoch": 349, "lr": 3.7595550706859226e-05} +{"train_loss": 0.00285866716876626, "global_step": 41608, "epoch": 349, "lr": 3.759340447233729e-05} +{"train_loss": 0.0008440008969046175, "global_step": 41609, "epoch": 349, "lr": 3.7591258262174396e-05} +{"train_loss": 0.0021090409718453884, "global_step": 41610, "epoch": 349, "lr": 3.758911207637471e-05} +{"train_loss": 0.0016816509887576103, "global_step": 41611, "epoch": 349, "lr": 3.7586965914942515e-05} +{"train_loss": 0.0024012101348489523, "global_step": 41612, "epoch": 349, "lr": 3.7584819777881955e-05} +{"train_loss": 0.0033370009623467922, "global_step": 41613, "epoch": 349, "lr": 3.7582673665197296e-05} +{"train_loss": 0.0010783624602481723, "global_step": 41614, "epoch": 349, "lr": 3.758052757689273e-05} +{"train_loss": 0.0016999293584376574, "global_step": 41615, "epoch": 349, "lr": 3.757838151297246e-05} +{"train_loss": 0.001138287247158587, "global_step": 41616, "epoch": 349, "lr": 3.757623547344072e-05} +{"train_loss": 0.0018074336694553494, "global_step": 41617, "epoch": 349, "lr": 3.75740894583017e-05} +{"train_loss": 0.0017053426709026098, "global_step": 41618, "epoch": 349, "lr": 3.7571943467559635e-05} +{"train_loss": 0.000854340847581625, "global_step": 41619, "epoch": 349, "lr": 3.756979750121873e-05} +{"train_loss": 0.0015576374717056751, "global_step": 41620, "epoch": 349, "lr": 3.75676515592832e-05} +{"train_loss": 0.002334403805434704, "global_step": 41621, "epoch": 349, "lr": 3.756550564175727e-05} +{"train_loss": 0.00148937723133713, "global_step": 41622, "epoch": 349, "lr": 3.756335974864512e-05} +{"train_loss": 0.001720185624435544, "global_step": 41623, "epoch": 349, "lr": 3.756121387995101e-05} +{"train_loss": 0.0015237476909533143, "global_step": 41624, "epoch": 349, "lr": 3.7559068035679105e-05} +{"train_loss": 0.0009596389718353748, "global_step": 41625, "epoch": 349, "lr": 3.755692221583366e-05} +{"train_loss": 0.0020229583606123924, "global_step": 41626, "epoch": 349, "lr": 3.755477642041886e-05} +{"train_loss": 0.0013830824755132198, "global_step": 41627, "epoch": 349, "lr": 3.7552630649438916e-05} +{"train_loss": 0.0012949625961482525, "global_step": 41628, "epoch": 349, "lr": 3.755048490289807e-05} +{"train_loss": 0.0037505982909351587, "global_step": 41629, "epoch": 349, "lr": 3.75483391808005e-05} +{"train_loss": 0.0017192823579534888, "global_step": 41630, "epoch": 349, "lr": 3.754619348315045e-05} +{"train_loss": 0.0012706223642453551, "global_step": 41631, "epoch": 349, "lr": 3.75440478099521e-05} +{"train_loss": 0.0009487699717283249, "global_step": 41632, "epoch": 349, "lr": 3.754190216120971e-05} +{"train_loss": 0.002515312284231186, "global_step": 41633, "epoch": 349, "lr": 3.7539756536927445e-05} +{"train_loss": 0.0017812441801652312, "global_step": 41634, "epoch": 349, "lr": 3.753761093710953e-05} +{"train_loss": 0.002342367311939597, "global_step": 41635, "epoch": 349, "lr": 3.75354653617602e-05} +{"train_loss": 0.0011798838386312127, "global_step": 41636, "epoch": 349, "lr": 3.753331981088365e-05} +{"train_loss": 0.0009555027354508638, "global_step": 41637, "epoch": 349, "lr": 3.7531174284484085e-05} +{"train_loss": 0.0016652446938678622, "global_step": 41638, "epoch": 349, "lr": 3.752902878256573e-05} +{"train_loss": 0.001582885393872857, "global_step": 41639, "epoch": 349, "lr": 3.7526883305132806e-05} +{"train_loss": 0.0019372293027117848, "global_step": 41640, "epoch": 349, "lr": 3.752473785218951e-05} +{"train_loss": 0.0014382593799382448, "global_step": 41641, "epoch": 349, "lr": 3.7522592423740047e-05} +{"train_loss": 0.0011039664968848228, "global_step": 41642, "epoch": 349, "lr": 3.752044701978866e-05} +{"train_loss": 0.0028895267751067877, "global_step": 41643, "epoch": 349, "lr": 3.751830164033951e-05} +{"train_loss": 0.0012989954557269812, "global_step": 41644, "epoch": 349, "lr": 3.751615628539688e-05} +{"train_loss": 0.001364517374895513, "global_step": 41645, "epoch": 349, "lr": 3.7514010954964936e-05} +{"train_loss": 0.0014408292481675744, "global_step": 41646, "epoch": 349, "lr": 3.751186564904787e-05} +{"train_loss": 0.0028614436741918325, "global_step": 41647, "epoch": 349, "lr": 3.7509720367649954e-05} +{"train_loss": 0.0015265180263668299, "global_step": 41648, "epoch": 349, "lr": 3.750757511077534e-05} +{"train_loss": 0.0017545080245785541, "global_step": 41649, "epoch": 349, "lr": 3.7505429878428286e-05, "val_loss": 0.022571727633476257} +{"train_loss": 0.0007361689931713045, "global_step": 41650, "epoch": 350, "lr": 3.750328467061297e-05} +{"train_loss": 0.001219309400767088, "global_step": 41651, "epoch": 350, "lr": 3.7501139487333636e-05} +{"train_loss": 0.0016187506262212992, "global_step": 41652, "epoch": 350, "lr": 3.749899432859447e-05} +{"train_loss": 0.000975464005023241, "global_step": 41653, "epoch": 350, "lr": 3.749684919439968e-05} +{"train_loss": 0.001019821036607027, "global_step": 41654, "epoch": 350, "lr": 3.749470408475352e-05} +{"train_loss": 0.00281479861587286, "global_step": 41655, "epoch": 350, "lr": 3.749255899966015e-05} +{"train_loss": 0.0016746146138757467, "global_step": 41656, "epoch": 350, "lr": 3.7490413939123824e-05} +{"train_loss": 0.0019444129429757595, "global_step": 41657, "epoch": 350, "lr": 3.7488268903148735e-05} +{"train_loss": 0.0017840903019532561, "global_step": 41658, "epoch": 350, "lr": 3.7486123891739065e-05} +{"train_loss": 0.002386215142905712, "global_step": 41659, "epoch": 350, "lr": 3.748397890489908e-05} +{"train_loss": 0.001216667122207582, "global_step": 41660, "epoch": 350, "lr": 3.748183394263294e-05} +{"train_loss": 0.0016279950505122542, "global_step": 41661, "epoch": 350, "lr": 3.747968900494491e-05} +{"train_loss": 0.0012922168243676424, "global_step": 41662, "epoch": 350, "lr": 3.747754409183914e-05} +{"train_loss": 0.0013523311354219913, "global_step": 41663, "epoch": 350, "lr": 3.747539920331992e-05} +{"train_loss": 0.001118839136324823, "global_step": 41664, "epoch": 350, "lr": 3.74732543393914e-05} +{"train_loss": 0.0026558106765151024, "global_step": 41665, "epoch": 350, "lr": 3.747110950005778e-05} +{"train_loss": 0.0010852457489818335, "global_step": 41666, "epoch": 350, "lr": 3.746896468532331e-05} +{"train_loss": 0.002602493856102228, "global_step": 41667, "epoch": 350, "lr": 3.7466819895192195e-05} +{"train_loss": 0.0015748159494251013, "global_step": 41668, "epoch": 350, "lr": 3.7464675129668634e-05} +{"train_loss": 0.002578052692115307, "global_step": 41669, "epoch": 350, "lr": 3.746253038875685e-05} +{"train_loss": 0.001610455452464521, "global_step": 41670, "epoch": 350, "lr": 3.7460385672461046e-05} +{"train_loss": 0.0017884951084852219, "global_step": 41671, "epoch": 350, "lr": 3.745824098078545e-05} +{"train_loss": 0.00154320546425879, "global_step": 41672, "epoch": 350, "lr": 3.745609631373423e-05} +{"train_loss": 0.0018119780579581857, "global_step": 41673, "epoch": 350, "lr": 3.745395167131165e-05} +{"train_loss": 0.0024057477712631226, "global_step": 41674, "epoch": 350, "lr": 3.745180705352187e-05} +{"train_loss": 0.0011483666021376848, "global_step": 41675, "epoch": 350, "lr": 3.7449662460369154e-05} +{"train_loss": 0.0023350093979388475, "global_step": 41676, "epoch": 350, "lr": 3.744751789185768e-05} +{"train_loss": 0.0015283538959920406, "global_step": 41677, "epoch": 350, "lr": 3.744537334799164e-05} +{"train_loss": 0.0018795657670125365, "global_step": 41678, "epoch": 350, "lr": 3.74432288287753e-05} +{"train_loss": 0.0008600982837378979, "global_step": 41679, "epoch": 350, "lr": 3.744108433421281e-05} +{"train_loss": 0.001157688326202333, "global_step": 41680, "epoch": 350, "lr": 3.743893986430843e-05} +{"train_loss": 0.0020414823666214943, "global_step": 41681, "epoch": 350, "lr": 3.7436795419066325e-05} +{"train_loss": 0.0020850016735494137, "global_step": 41682, "epoch": 350, "lr": 3.743465099849076e-05} +{"train_loss": 0.002212702063843608, "global_step": 41683, "epoch": 350, "lr": 3.74325066025859e-05} +{"train_loss": 0.0016486762324348092, "global_step": 41684, "epoch": 350, "lr": 3.743036223135597e-05} +{"train_loss": 0.0012386030284687877, "global_step": 41685, "epoch": 350, "lr": 3.7428217884805184e-05} +{"train_loss": 0.0014928891323506832, "global_step": 41686, "epoch": 350, "lr": 3.742607356293775e-05} +{"train_loss": 0.0015500510344281793, "global_step": 41687, "epoch": 350, "lr": 3.7423929265757866e-05} +{"train_loss": 0.001106398762203753, "global_step": 41688, "epoch": 350, "lr": 3.7421784993269754e-05} +{"train_loss": 0.0017419497016817331, "global_step": 41689, "epoch": 350, "lr": 3.741964074547764e-05} +{"train_loss": 0.0014865731354802847, "global_step": 41690, "epoch": 350, "lr": 3.741749652238572e-05} +{"train_loss": 0.0014320147456601262, "global_step": 41691, "epoch": 350, "lr": 3.7415352323998176e-05} +{"train_loss": 0.0013587134890258312, "global_step": 41692, "epoch": 350, "lr": 3.741320815031927e-05} +{"train_loss": 0.002110756002366543, "global_step": 41693, "epoch": 350, "lr": 3.741106400135316e-05} +{"train_loss": 0.002450220286846161, "global_step": 41694, "epoch": 350, "lr": 3.7408919877104107e-05} +{"train_loss": 0.0019472726853564382, "global_step": 41695, "epoch": 350, "lr": 3.740677577757629e-05} +{"train_loss": 0.001259543001651764, "global_step": 41696, "epoch": 350, "lr": 3.740463170277391e-05} +{"train_loss": 0.0013534730533137918, "global_step": 41697, "epoch": 350, "lr": 3.7402487652701205e-05} +{"train_loss": 0.0025985257234424353, "global_step": 41698, "epoch": 350, "lr": 3.7400343627362345e-05} +{"train_loss": 0.0015520448796451092, "global_step": 41699, "epoch": 350, "lr": 3.739819962676159e-05} +{"train_loss": 0.0011453208280727267, "global_step": 41700, "epoch": 350, "lr": 3.7396055650903095e-05} +{"train_loss": 0.0022339681163430214, "global_step": 41701, "epoch": 350, "lr": 3.739391169979112e-05} +{"train_loss": 0.0012412050273269415, "global_step": 41702, "epoch": 350, "lr": 3.7391767773429856e-05} +{"train_loss": 0.0009453122620470822, "global_step": 41703, "epoch": 350, "lr": 3.738962387182349e-05} +{"train_loss": 0.0014647489879280329, "global_step": 41704, "epoch": 350, "lr": 3.7387479994976274e-05} +{"train_loss": 0.0020984304137527943, "global_step": 41705, "epoch": 350, "lr": 3.7385336142892365e-05} +{"train_loss": 0.001618248876184225, "global_step": 41706, "epoch": 350, "lr": 3.7383192315576026e-05} +{"train_loss": 0.0018356089713051915, "global_step": 41707, "epoch": 350, "lr": 3.738104851303144e-05} +{"train_loss": 0.001365799573250115, "global_step": 41708, "epoch": 350, "lr": 3.7378904735262796e-05} +{"train_loss": 0.0021382111590355635, "global_step": 41709, "epoch": 350, "lr": 3.737676098227435e-05} +{"train_loss": 0.002293602330610156, "global_step": 41710, "epoch": 350, "lr": 3.737461725407026e-05} +{"train_loss": 0.0008161754813045263, "global_step": 41711, "epoch": 350, "lr": 3.7372473550654785e-05} +{"train_loss": 0.001164123066700995, "global_step": 41712, "epoch": 350, "lr": 3.7370329872032084e-05} +{"train_loss": 0.002309668343514204, "global_step": 41713, "epoch": 350, "lr": 3.7368186218206415e-05} +{"train_loss": 0.0013640127144753933, "global_step": 41714, "epoch": 350, "lr": 3.736604258918195e-05} +{"train_loss": 0.0010108640417456627, "global_step": 41715, "epoch": 350, "lr": 3.736389898496291e-05} +{"train_loss": 0.001472405856475234, "global_step": 41716, "epoch": 350, "lr": 3.73617554055535e-05} +{"train_loss": 0.0014166147448122501, "global_step": 41717, "epoch": 350, "lr": 3.7359611850957946e-05} +{"train_loss": 0.002057787962257862, "global_step": 41718, "epoch": 350, "lr": 3.7357468321180435e-05} +{"train_loss": 0.0018823272548615932, "global_step": 41719, "epoch": 350, "lr": 3.735532481622519e-05} +{"train_loss": 0.0015345521969720721, "global_step": 41720, "epoch": 350, "lr": 3.735318133609641e-05} +{"train_loss": 0.0020211953669786453, "global_step": 41721, "epoch": 350, "lr": 3.735103788079831e-05} +{"train_loss": 0.0010771340457722545, "global_step": 41722, "epoch": 350, "lr": 3.734889445033509e-05} +{"train_loss": 0.0034231417812407017, "global_step": 41723, "epoch": 350, "lr": 3.734675104471097e-05} +{"train_loss": 0.0021352877374738455, "global_step": 41724, "epoch": 350, "lr": 3.734460766393014e-05} +{"train_loss": 0.0020669300574809313, "global_step": 41725, "epoch": 350, "lr": 3.7342464307996845e-05} +{"train_loss": 0.0009674814064055681, "global_step": 41726, "epoch": 350, "lr": 3.7340320976915265e-05} +{"train_loss": 0.0019067458342760801, "global_step": 41727, "epoch": 350, "lr": 3.733817767068959e-05} +{"train_loss": 0.0014561114367097616, "global_step": 41728, "epoch": 350, "lr": 3.7336034389324074e-05} +{"train_loss": 0.002292859833687544, "global_step": 41729, "epoch": 350, "lr": 3.733389113282287e-05} +{"train_loss": 0.0010536271147429943, "global_step": 41730, "epoch": 350, "lr": 3.733174790119026e-05} +{"train_loss": 0.0010577876819297671, "global_step": 41731, "epoch": 350, "lr": 3.732960469443037e-05} +{"train_loss": 0.0017304911743849516, "global_step": 41732, "epoch": 350, "lr": 3.732746151254748e-05} +{"train_loss": 0.0017883549444377422, "global_step": 41733, "epoch": 350, "lr": 3.732531835554575e-05} +{"train_loss": 0.0016151475720107555, "global_step": 41734, "epoch": 350, "lr": 3.7323175223429396e-05} +{"train_loss": 0.0014637872809544206, "global_step": 41735, "epoch": 350, "lr": 3.732103211620264e-05} +{"train_loss": 0.0014960423577576876, "global_step": 41736, "epoch": 350, "lr": 3.731888903386967e-05} +{"train_loss": 0.0019169705919921398, "global_step": 41737, "epoch": 350, "lr": 3.731674597643474e-05} +{"train_loss": 0.00316832703538239, "global_step": 41738, "epoch": 350, "lr": 3.731460294390199e-05} +{"train_loss": 0.0012008899357169867, "global_step": 41739, "epoch": 350, "lr": 3.731245993627569e-05} +{"train_loss": 0.0010110375005751848, "global_step": 41740, "epoch": 350, "lr": 3.731031695356001e-05} +{"train_loss": 0.0013198318192735314, "global_step": 41741, "epoch": 350, "lr": 3.7308173995759155e-05} +{"train_loss": 0.0021110260859131813, "global_step": 41742, "epoch": 350, "lr": 3.730603106287736e-05} +{"train_loss": 0.001213948125950992, "global_step": 41743, "epoch": 350, "lr": 3.7303888154918797e-05} +{"train_loss": 0.0020825883839279413, "global_step": 41744, "epoch": 350, "lr": 3.7301745271887715e-05} +{"train_loss": 0.0026574290823191404, "global_step": 41745, "epoch": 350, "lr": 3.7299602413788304e-05} +{"train_loss": 0.0012361627304926515, "global_step": 41746, "epoch": 350, "lr": 3.7297459580624735e-05} +{"train_loss": 0.0034955192822963, "global_step": 41747, "epoch": 350, "lr": 3.729531677240128e-05} +{"train_loss": 0.0020481247920542955, "global_step": 41748, "epoch": 350, "lr": 3.729317398912209e-05} +{"train_loss": 0.0011552567593753338, "global_step": 41749, "epoch": 350, "lr": 3.729103123079141e-05} +{"train_loss": 0.002248652745038271, "global_step": 41750, "epoch": 350, "lr": 3.728888849741342e-05} +{"train_loss": 0.0018508456414565444, "global_step": 41751, "epoch": 350, "lr": 3.728674578899234e-05} +{"train_loss": 0.0014665252529084682, "global_step": 41752, "epoch": 350, "lr": 3.728460310553239e-05} +{"train_loss": 0.002128089778125286, "global_step": 41753, "epoch": 350, "lr": 3.728246044703775e-05} +{"train_loss": 0.002200524788349867, "global_step": 41754, "epoch": 350, "lr": 3.728031781351266e-05} +{"train_loss": 0.002541345078498125, "global_step": 41755, "epoch": 350, "lr": 3.7278175204961275e-05} +{"train_loss": 0.0022823845501989126, "global_step": 41756, "epoch": 350, "lr": 3.727603262138786e-05} +{"train_loss": 0.0009440726134926081, "global_step": 41757, "epoch": 350, "lr": 3.727389006279657e-05} +{"train_loss": 0.0016993387835100293, "global_step": 41758, "epoch": 350, "lr": 3.727174752919167e-05} +{"train_loss": 0.0009356560767628253, "global_step": 41759, "epoch": 350, "lr": 3.7269605020577324e-05} +{"train_loss": 0.0016561276279389858, "global_step": 41760, "epoch": 350, "lr": 3.726746253695773e-05} +{"train_loss": 0.0018926610937342048, "global_step": 41761, "epoch": 350, "lr": 3.726532007833714e-05} +{"train_loss": 0.0026040486991405487, "global_step": 41762, "epoch": 350, "lr": 3.726317764471971e-05} +{"train_loss": 0.001583655015565455, "global_step": 41763, "epoch": 350, "lr": 3.7261035236109686e-05} +{"train_loss": 0.001964594703167677, "global_step": 41764, "epoch": 350, "lr": 3.725889285251125e-05} +{"train_loss": 0.0019506567623466253, "global_step": 41765, "epoch": 350, "lr": 3.725675049392862e-05} +{"train_loss": 0.0027099023573100567, "global_step": 41766, "epoch": 350, "lr": 3.7254608160366e-05} +{"train_loss": 0.0019491813145577908, "global_step": 41767, "epoch": 350, "lr": 3.725246585182759e-05} +{"train_loss": 0.0017350311982914993, "global_step": 41768, "epoch": 350, "lr": 3.7250323568317604e-05, "val_loss": 0.023050878196954727, "train_action_mse_error": 2.752350155788008e-05} +{"train_loss": 0.0007306505576707423, "global_step": 41769, "epoch": 351, "lr": 3.724818130984024e-05} +{"train_loss": 0.002356209559366107, "global_step": 41770, "epoch": 351, "lr": 3.724603907639972e-05} +{"train_loss": 0.0035523183178156614, "global_step": 41771, "epoch": 351, "lr": 3.724389686800024e-05} +{"train_loss": 0.002192460000514984, "global_step": 41772, "epoch": 351, "lr": 3.724175468464599e-05} +{"train_loss": 0.0019408036023378372, "global_step": 41773, "epoch": 351, "lr": 3.723961252634122e-05} +{"train_loss": 0.0020322157070040703, "global_step": 41774, "epoch": 351, "lr": 3.723747039309007e-05} +{"train_loss": 0.001434912090189755, "global_step": 41775, "epoch": 351, "lr": 3.723532828489682e-05} +{"train_loss": 0.0009483806788921356, "global_step": 41776, "epoch": 351, "lr": 3.723318620176562e-05} +{"train_loss": 0.0016563511453568935, "global_step": 41777, "epoch": 351, "lr": 3.7231044143700695e-05} +{"train_loss": 0.0036238108295947313, "global_step": 41778, "epoch": 351, "lr": 3.722890211070626e-05} +{"train_loss": 0.0020576445385813713, "global_step": 41779, "epoch": 351, "lr": 3.72267601027865e-05} +{"train_loss": 0.0014327316312119365, "global_step": 41780, "epoch": 351, "lr": 3.7224618119945644e-05} +{"train_loss": 0.002112885005772114, "global_step": 41781, "epoch": 351, "lr": 3.722247616218786e-05} +{"train_loss": 0.0026237843558192253, "global_step": 41782, "epoch": 351, "lr": 3.722033422951741e-05} +{"train_loss": 0.0012459272984415293, "global_step": 41783, "epoch": 351, "lr": 3.7218192321938447e-05} +{"train_loss": 0.001247022533789277, "global_step": 41784, "epoch": 351, "lr": 3.721605043945521e-05} +{"train_loss": 0.0009537978330627084, "global_step": 41785, "epoch": 351, "lr": 3.721390858207189e-05} +{"train_loss": 0.0021390493493527174, "global_step": 41786, "epoch": 351, "lr": 3.721176674979268e-05} +{"train_loss": 0.0018506565829738975, "global_step": 41787, "epoch": 351, "lr": 3.7209624942621824e-05} +{"train_loss": 0.0013000451726838946, "global_step": 41788, "epoch": 351, "lr": 3.7207483160563483e-05} +{"train_loss": 0.003430178388953209, "global_step": 41789, "epoch": 351, "lr": 3.72053414036219e-05} +{"train_loss": 0.0032251006923615932, "global_step": 41790, "epoch": 351, "lr": 3.720319967180126e-05} +{"train_loss": 0.002258074004203081, "global_step": 41791, "epoch": 351, "lr": 3.720105796510575e-05} +{"train_loss": 0.0020089519675821066, "global_step": 41792, "epoch": 351, "lr": 3.719891628353962e-05} +{"train_loss": 0.001588965067639947, "global_step": 41793, "epoch": 351, "lr": 3.719677462710703e-05} +{"train_loss": 0.001285139238461852, "global_step": 41794, "epoch": 351, "lr": 3.7194632995812216e-05} +{"train_loss": 0.003166107926517725, "global_step": 41795, "epoch": 351, "lr": 3.719249138965938e-05} +{"train_loss": 0.0010176245123147964, "global_step": 41796, "epoch": 351, "lr": 3.71903498086527e-05} +{"train_loss": 0.001986956223845482, "global_step": 41797, "epoch": 351, "lr": 3.718820825279642e-05} +{"train_loss": 0.0019444044446572661, "global_step": 41798, "epoch": 351, "lr": 3.7186066722094707e-05} +{"train_loss": 0.0017505645519122481, "global_step": 41799, "epoch": 351, "lr": 3.718392521655178e-05} +{"train_loss": 0.0034632165916264057, "global_step": 41800, "epoch": 351, "lr": 3.718178373617186e-05} +{"train_loss": 0.001817761454731226, "global_step": 41801, "epoch": 351, "lr": 3.717964228095913e-05} +{"train_loss": 0.0007820886676199734, "global_step": 41802, "epoch": 351, "lr": 3.717750085091782e-05} +{"train_loss": 0.0015711347805336118, "global_step": 41803, "epoch": 351, "lr": 3.7175359446052095e-05} +{"train_loss": 0.002155556809157133, "global_step": 41804, "epoch": 351, "lr": 3.717321806636619e-05} +{"train_loss": 0.0016202157130464911, "global_step": 41805, "epoch": 351, "lr": 3.717107671186429e-05} +{"train_loss": 0.001891416497528553, "global_step": 41806, "epoch": 351, "lr": 3.716893538255064e-05} +{"train_loss": 0.002188992453739047, "global_step": 41807, "epoch": 351, "lr": 3.716679407842938e-05} +{"train_loss": 0.002056411001831293, "global_step": 41808, "epoch": 351, "lr": 3.716465279950477e-05} +{"train_loss": 0.0019061346538364887, "global_step": 41809, "epoch": 351, "lr": 3.7162511545781e-05} +{"train_loss": 0.0015446513425558805, "global_step": 41810, "epoch": 351, "lr": 3.716037031726225e-05} +{"train_loss": 0.001586795668117702, "global_step": 41811, "epoch": 351, "lr": 3.715822911395276e-05} +{"train_loss": 0.0016406051581725478, "global_step": 41812, "epoch": 351, "lr": 3.7156087935856684e-05} +{"train_loss": 0.0013532255543395877, "global_step": 41813, "epoch": 351, "lr": 3.7153946782978286e-05} +{"train_loss": 0.001593746361322701, "global_step": 41814, "epoch": 351, "lr": 3.715180565532172e-05} +{"train_loss": 0.0024885700549930334, "global_step": 41815, "epoch": 351, "lr": 3.7149664552891225e-05} +{"train_loss": 0.0014120271662250161, "global_step": 41816, "epoch": 351, "lr": 3.7147523475690985e-05} +{"train_loss": 0.0014314517611637712, "global_step": 41817, "epoch": 351, "lr": 3.714538242372522e-05} +{"train_loss": 0.0020242403261363506, "global_step": 41818, "epoch": 351, "lr": 3.714324139699811e-05} +{"train_loss": 0.0018768988084048033, "global_step": 41819, "epoch": 351, "lr": 3.714110039551387e-05} +{"train_loss": 0.0009808964096009731, "global_step": 41820, "epoch": 351, "lr": 3.7138959419276714e-05} +{"train_loss": 0.001037940732203424, "global_step": 41821, "epoch": 351, "lr": 3.713681846829085e-05} +{"train_loss": 0.0015026129549369216, "global_step": 41822, "epoch": 351, "lr": 3.7134677542560435e-05} +{"train_loss": 0.003155704354867339, "global_step": 41823, "epoch": 351, "lr": 3.713253664208974e-05} +{"train_loss": 0.0026449004653841257, "global_step": 41824, "epoch": 351, "lr": 3.713039576688291e-05} +{"train_loss": 0.0008524981094524264, "global_step": 41825, "epoch": 351, "lr": 3.712825491694419e-05} +{"train_loss": 0.0019453682471066713, "global_step": 41826, "epoch": 351, "lr": 3.712611409227774e-05} +{"train_loss": 0.001351183163933456, "global_step": 41827, "epoch": 351, "lr": 3.7123973292887823e-05} +{"train_loss": 0.0014827516861259937, "global_step": 41828, "epoch": 351, "lr": 3.7121832518778605e-05} +{"train_loss": 0.0015065601328387856, "global_step": 41829, "epoch": 351, "lr": 3.711969176995427e-05} +{"train_loss": 0.0014430538285523653, "global_step": 41830, "epoch": 351, "lr": 3.711755104641907e-05} +{"train_loss": 0.0022789007052779198, "global_step": 41831, "epoch": 351, "lr": 3.7115410348177156e-05} +{"train_loss": 0.0034752367064356804, "global_step": 41832, "epoch": 351, "lr": 3.7113269675232776e-05} +{"train_loss": 0.0014951032353565097, "global_step": 41833, "epoch": 351, "lr": 3.711112902759011e-05} +{"train_loss": 0.0014791941503062844, "global_step": 41834, "epoch": 351, "lr": 3.710898840525335e-05} +{"train_loss": 0.0013457771856337786, "global_step": 41835, "epoch": 351, "lr": 3.710684780822674e-05} +{"train_loss": 0.0011253250995650887, "global_step": 41836, "epoch": 351, "lr": 3.710470723651444e-05} +{"train_loss": 0.001094416482374072, "global_step": 41837, "epoch": 351, "lr": 3.7102566690120676e-05} +{"train_loss": 0.0012057317653670907, "global_step": 41838, "epoch": 351, "lr": 3.710042616904963e-05} +{"train_loss": 0.0014181097503751516, "global_step": 41839, "epoch": 351, "lr": 3.7098285673305544e-05} +{"train_loss": 0.0018369263270869851, "global_step": 41840, "epoch": 351, "lr": 3.7096145202892596e-05} +{"train_loss": 0.0014135357923805714, "global_step": 41841, "epoch": 351, "lr": 3.709400475781496e-05} +{"train_loss": 0.001501508173532784, "global_step": 41842, "epoch": 351, "lr": 3.7091864338076895e-05} +{"train_loss": 0.001794600859284401, "global_step": 41843, "epoch": 351, "lr": 3.708972394368255e-05} +{"train_loss": 0.002074804622679949, "global_step": 41844, "epoch": 351, "lr": 3.708758357463618e-05} +{"train_loss": 0.0014049015007913113, "global_step": 41845, "epoch": 351, "lr": 3.7085443230941954e-05} +{"train_loss": 0.0018591593252494931, "global_step": 41846, "epoch": 351, "lr": 3.7083302912604055e-05} +{"train_loss": 0.001529919565655291, "global_step": 41847, "epoch": 351, "lr": 3.708116261962673e-05} +{"train_loss": 0.0009981696493923664, "global_step": 41848, "epoch": 351, "lr": 3.7079022352014156e-05} +{"train_loss": 0.0016200145473703742, "global_step": 41849, "epoch": 351, "lr": 3.707688210977055e-05} +{"train_loss": 0.0014596672262996435, "global_step": 41850, "epoch": 351, "lr": 3.70747418929001e-05} +{"train_loss": 0.00116593181155622, "global_step": 41851, "epoch": 351, "lr": 3.707260170140701e-05} +{"train_loss": 0.0014005493139848113, "global_step": 41852, "epoch": 351, "lr": 3.7070461535295505e-05} +{"train_loss": 0.00209550722502172, "global_step": 41853, "epoch": 351, "lr": 3.7068321394569735e-05} +{"train_loss": 0.0021242224611341953, "global_step": 41854, "epoch": 351, "lr": 3.706618127923396e-05} +{"train_loss": 0.0006851818761788309, "global_step": 41855, "epoch": 351, "lr": 3.706404118929234e-05} +{"train_loss": 0.0012618398759514093, "global_step": 41856, "epoch": 351, "lr": 3.706190112474911e-05} +{"train_loss": 0.001626051147468388, "global_step": 41857, "epoch": 351, "lr": 3.7059761085608435e-05} +{"train_loss": 0.0011512798955664039, "global_step": 41858, "epoch": 351, "lr": 3.705762107187456e-05} +{"train_loss": 0.0016500671626999974, "global_step": 41859, "epoch": 351, "lr": 3.7055481083551654e-05} +{"train_loss": 0.0019806374330073595, "global_step": 41860, "epoch": 351, "lr": 3.705334112064391e-05} +{"train_loss": 0.0012405592715367675, "global_step": 41861, "epoch": 351, "lr": 3.705120118315558e-05} +{"train_loss": 0.002686758292838931, "global_step": 41862, "epoch": 351, "lr": 3.70490612710908e-05} +{"train_loss": 0.0021872178185731173, "global_step": 41863, "epoch": 351, "lr": 3.704692138445384e-05} +{"train_loss": 0.001872080727480352, "global_step": 41864, "epoch": 351, "lr": 3.704478152324884e-05} +{"train_loss": 0.00231535779312253, "global_step": 41865, "epoch": 351, "lr": 3.704264168748003e-05} +{"train_loss": 0.0020803911611437798, "global_step": 41866, "epoch": 351, "lr": 3.704050187715161e-05} +{"train_loss": 0.002192107727751136, "global_step": 41867, "epoch": 351, "lr": 3.7038362092267784e-05} +{"train_loss": 0.0010931796859949827, "global_step": 41868, "epoch": 351, "lr": 3.703622233283275e-05} +{"train_loss": 0.001716839848086238, "global_step": 41869, "epoch": 351, "lr": 3.70340825988507e-05} +{"train_loss": 0.0027789887972176075, "global_step": 41870, "epoch": 351, "lr": 3.7031942890325853e-05} +{"train_loss": 0.0011812098091468215, "global_step": 41871, "epoch": 351, "lr": 3.702980320726241e-05} +{"train_loss": 0.0016117211198434234, "global_step": 41872, "epoch": 351, "lr": 3.702766354966454e-05} +{"train_loss": 0.001562469988130033, "global_step": 41873, "epoch": 351, "lr": 3.702552391753648e-05} +{"train_loss": 0.0010630860924720764, "global_step": 41874, "epoch": 351, "lr": 3.70233843108824e-05} +{"train_loss": 0.002372747752815485, "global_step": 41875, "epoch": 351, "lr": 3.702124472970655e-05} +{"train_loss": 0.0013280060375109315, "global_step": 41876, "epoch": 351, "lr": 3.7019105174013066e-05} +{"train_loss": 0.0011010856833308935, "global_step": 41877, "epoch": 351, "lr": 3.7016965643806215e-05} +{"train_loss": 0.0016578902723267674, "global_step": 41878, "epoch": 351, "lr": 3.701482613909015e-05} +{"train_loss": 0.002315674675628543, "global_step": 41879, "epoch": 351, "lr": 3.701268665986908e-05} +{"train_loss": 0.002826013835147023, "global_step": 41880, "epoch": 351, "lr": 3.701054720614723e-05} +{"train_loss": 0.0017155345994979143, "global_step": 41881, "epoch": 351, "lr": 3.7008407777928756e-05} +{"train_loss": 0.0013527740957215428, "global_step": 41882, "epoch": 351, "lr": 3.7006268375217894e-05} +{"train_loss": 0.0013860320905223489, "global_step": 41883, "epoch": 351, "lr": 3.700412899801885e-05} +{"train_loss": 0.001139483880251646, "global_step": 41884, "epoch": 351, "lr": 3.7001989646335794e-05} +{"train_loss": 0.0011211931705474854, "global_step": 41885, "epoch": 351, "lr": 3.699985032017296e-05} +{"train_loss": 0.0010871244594454765, "global_step": 41886, "epoch": 351, "lr": 3.699771101953451e-05} +{"train_loss": 0.0017625385080464184, "global_step": 41887, "epoch": 351, "lr": 3.6995571744424687e-05, "val_loss": 0.03475835919380188} +{"train_loss": 0.0017330205300822854, "global_step": 41888, "epoch": 352, "lr": 3.6993432494847644e-05} +{"train_loss": 0.0019912822172045708, "global_step": 41889, "epoch": 352, "lr": 3.6991293270807635e-05} +{"train_loss": 0.0012615129817277193, "global_step": 41890, "epoch": 352, "lr": 3.698915407230883e-05} +{"train_loss": 0.0016780258156359196, "global_step": 41891, "epoch": 352, "lr": 3.698701489935541e-05} +{"train_loss": 0.0022930314298719168, "global_step": 41892, "epoch": 352, "lr": 3.698487575195161e-05} +{"train_loss": 0.0011235239217057824, "global_step": 41893, "epoch": 352, "lr": 3.698273663010161e-05} +{"train_loss": 0.0012668807758018374, "global_step": 41894, "epoch": 352, "lr": 3.6980597533809624e-05} +{"train_loss": 0.0019700645934790373, "global_step": 41895, "epoch": 352, "lr": 3.697845846307985e-05} +{"train_loss": 0.0017839866923168302, "global_step": 41896, "epoch": 352, "lr": 3.697631941791645e-05} +{"train_loss": 0.0015145554207265377, "global_step": 41897, "epoch": 352, "lr": 3.6974180398323675e-05} +{"train_loss": 0.001338533591479063, "global_step": 41898, "epoch": 352, "lr": 3.697204140430571e-05} +{"train_loss": 0.0011420162627473474, "global_step": 41899, "epoch": 352, "lr": 3.696990243586674e-05} +{"train_loss": 0.0015543574700132012, "global_step": 41900, "epoch": 352, "lr": 3.696776349301098e-05} +{"train_loss": 0.0017984549049288034, "global_step": 41901, "epoch": 352, "lr": 3.696562457574262e-05} +{"train_loss": 0.001468517119064927, "global_step": 41902, "epoch": 352, "lr": 3.696348568406588e-05} +{"train_loss": 0.0014232791727408767, "global_step": 41903, "epoch": 352, "lr": 3.696134681798492e-05} +{"train_loss": 0.0008386892732232809, "global_step": 41904, "epoch": 352, "lr": 3.695920797750398e-05} +{"train_loss": 0.0015974149573594332, "global_step": 41905, "epoch": 352, "lr": 3.695706916262722e-05} +{"train_loss": 0.00238701025955379, "global_step": 41906, "epoch": 352, "lr": 3.695493037335889e-05} +{"train_loss": 0.0013587882276624441, "global_step": 41907, "epoch": 352, "lr": 3.6952791609703136e-05} +{"train_loss": 0.0016468169633299112, "global_step": 41908, "epoch": 352, "lr": 3.6950652871664205e-05} +{"train_loss": 0.0033958954736590385, "global_step": 41909, "epoch": 352, "lr": 3.694851415924627e-05} +{"train_loss": 0.0010135776828974485, "global_step": 41910, "epoch": 352, "lr": 3.694637547245351e-05} +{"train_loss": 0.0016305200988426805, "global_step": 41911, "epoch": 352, "lr": 3.6944236811290166e-05} +{"train_loss": 0.0008381957304663956, "global_step": 41912, "epoch": 352, "lr": 3.694209817576041e-05} +{"train_loss": 0.0014936367515474558, "global_step": 41913, "epoch": 352, "lr": 3.693995956586846e-05} +{"train_loss": 0.0017679157899692655, "global_step": 41914, "epoch": 352, "lr": 3.693782098161849e-05} +{"train_loss": 0.0018940760055556893, "global_step": 41915, "epoch": 352, "lr": 3.693568242301472e-05} +{"train_loss": 0.0011387026170268655, "global_step": 41916, "epoch": 352, "lr": 3.693354389006134e-05} +{"train_loss": 0.0012663447996601462, "global_step": 41917, "epoch": 352, "lr": 3.693140538276254e-05} +{"train_loss": 0.001900365692563355, "global_step": 41918, "epoch": 352, "lr": 3.692926690112255e-05} +{"train_loss": 0.0011376660550013185, "global_step": 41919, "epoch": 352, "lr": 3.692712844514553e-05} +{"train_loss": 0.0013185025891289115, "global_step": 41920, "epoch": 352, "lr": 3.692499001483572e-05} +{"train_loss": 0.0014161958824843168, "global_step": 41921, "epoch": 352, "lr": 3.692285161019728e-05} +{"train_loss": 0.001476521254517138, "global_step": 41922, "epoch": 352, "lr": 3.692071323123442e-05} +{"train_loss": 0.002102601807564497, "global_step": 41923, "epoch": 352, "lr": 3.691857487795136e-05} +{"train_loss": 0.0016698373947292566, "global_step": 41924, "epoch": 352, "lr": 3.6916436550352254e-05} +{"train_loss": 0.0012229119893163443, "global_step": 41925, "epoch": 352, "lr": 3.691429824844135e-05} +{"train_loss": 0.0008123426232486963, "global_step": 41926, "epoch": 352, "lr": 3.69121599722228e-05} +{"train_loss": 0.0017297298181802034, "global_step": 41927, "epoch": 352, "lr": 3.691002172170086e-05} +{"train_loss": 0.0016092653386294842, "global_step": 41928, "epoch": 352, "lr": 3.690788349687968e-05} +{"train_loss": 0.0015738903312012553, "global_step": 41929, "epoch": 352, "lr": 3.690574529776345e-05} +{"train_loss": 0.0016849323874339461, "global_step": 41930, "epoch": 352, "lr": 3.690360712435642e-05} +{"train_loss": 0.002441409509629011, "global_step": 41931, "epoch": 352, "lr": 3.690146897666273e-05} +{"train_loss": 0.0015959732700139284, "global_step": 41932, "epoch": 352, "lr": 3.689933085468662e-05} +{"train_loss": 0.0012665127869695425, "global_step": 41933, "epoch": 352, "lr": 3.6897192758432286e-05} +{"train_loss": 0.0014949367614462972, "global_step": 41934, "epoch": 352, "lr": 3.689505468790389e-05} +{"train_loss": 0.002252552192658186, "global_step": 41935, "epoch": 352, "lr": 3.689291664310568e-05} +{"train_loss": 0.0017738405149430037, "global_step": 41936, "epoch": 352, "lr": 3.68907786240418e-05} +{"train_loss": 0.0014340688940137625, "global_step": 41937, "epoch": 352, "lr": 3.6888640630716495e-05} +{"train_loss": 0.0013315443648025393, "global_step": 41938, "epoch": 352, "lr": 3.6886502663133935e-05} +{"train_loss": 0.0016389854717999697, "global_step": 41939, "epoch": 352, "lr": 3.688436472129834e-05} +{"train_loss": 0.0016506918473169208, "global_step": 41940, "epoch": 352, "lr": 3.6882226805213896e-05} +{"train_loss": 0.0014661630848422647, "global_step": 41941, "epoch": 352, "lr": 3.688008891488477e-05} +{"train_loss": 0.0017614770913496614, "global_step": 41942, "epoch": 352, "lr": 3.6877951050315215e-05} +{"train_loss": 0.0012369207106530666, "global_step": 41943, "epoch": 352, "lr": 3.687581321150938e-05} +{"train_loss": 0.0017826827242970467, "global_step": 41944, "epoch": 352, "lr": 3.68736753984715e-05} +{"train_loss": 0.0016405540518462658, "global_step": 41945, "epoch": 352, "lr": 3.687153761120574e-05} +{"train_loss": 0.001149860443547368, "global_step": 41946, "epoch": 352, "lr": 3.6869399849716334e-05} +{"train_loss": 0.0019395139534026384, "global_step": 41947, "epoch": 352, "lr": 3.6867262114007444e-05} +{"train_loss": 0.001350182923488319, "global_step": 41948, "epoch": 352, "lr": 3.686512440408329e-05} +{"train_loss": 0.002583620836958289, "global_step": 41949, "epoch": 352, "lr": 3.686298671994805e-05} +{"train_loss": 0.001624722732231021, "global_step": 41950, "epoch": 352, "lr": 3.686084906160594e-05} +{"train_loss": 0.0012457421980798244, "global_step": 41951, "epoch": 352, "lr": 3.685871142906114e-05} +{"train_loss": 0.0018341728718951344, "global_step": 41952, "epoch": 352, "lr": 3.685657382231788e-05} +{"train_loss": 0.0028934304136782885, "global_step": 41953, "epoch": 352, "lr": 3.685443624138031e-05} +{"train_loss": 0.0016906183445826173, "global_step": 41954, "epoch": 352, "lr": 3.6852298686252664e-05} +{"train_loss": 0.0025759574491530657, "global_step": 41955, "epoch": 352, "lr": 3.68501611569391e-05} +{"train_loss": 0.0018258618656545877, "global_step": 41956, "epoch": 352, "lr": 3.684802365344387e-05} +{"train_loss": 0.0014177196426317096, "global_step": 41957, "epoch": 352, "lr": 3.6845886175771114e-05} +{"train_loss": 0.0008490659529343247, "global_step": 41958, "epoch": 352, "lr": 3.684374872392508e-05} +{"train_loss": 0.00211503473110497, "global_step": 41959, "epoch": 352, "lr": 3.684161129790994e-05} +{"train_loss": 0.0018884697929024696, "global_step": 41960, "epoch": 352, "lr": 3.683947389772987e-05} +{"train_loss": 0.0010327890049666166, "global_step": 41961, "epoch": 352, "lr": 3.683733652338911e-05} +{"train_loss": 0.0025457486044615507, "global_step": 41962, "epoch": 352, "lr": 3.6835199174891805e-05} +{"train_loss": 0.0006344446446746588, "global_step": 41963, "epoch": 352, "lr": 3.68330618522422e-05} +{"train_loss": 0.0021518964786082506, "global_step": 41964, "epoch": 352, "lr": 3.683092455544447e-05} +{"train_loss": 0.001219636993482709, "global_step": 41965, "epoch": 352, "lr": 3.682878728450281e-05} +{"train_loss": 0.001162921660579741, "global_step": 41966, "epoch": 352, "lr": 3.6826650039421416e-05} +{"train_loss": 0.0011834049364551902, "global_step": 41967, "epoch": 352, "lr": 3.682451282020448e-05} +{"train_loss": 0.0018289587460458279, "global_step": 41968, "epoch": 352, "lr": 3.682237562685622e-05} +{"train_loss": 0.0014322760980576277, "global_step": 41969, "epoch": 352, "lr": 3.6820238459380805e-05} +{"train_loss": 0.0008864238043315709, "global_step": 41970, "epoch": 352, "lr": 3.6818101317782464e-05} +{"train_loss": 0.0015721677336841822, "global_step": 41971, "epoch": 352, "lr": 3.681596420206537e-05} +{"train_loss": 0.0023963332641869783, "global_step": 41972, "epoch": 352, "lr": 3.681382711223369e-05} +{"train_loss": 0.0009914750698953867, "global_step": 41973, "epoch": 352, "lr": 3.681169004829169e-05} +{"train_loss": 0.0019493319559842348, "global_step": 41974, "epoch": 352, "lr": 3.68095530102435e-05} +{"train_loss": 0.0024292566813528538, "global_step": 41975, "epoch": 352, "lr": 3.680741599809336e-05} +{"train_loss": 0.0026114131323993206, "global_step": 41976, "epoch": 352, "lr": 3.680527901184544e-05} +{"train_loss": 0.001502700732089579, "global_step": 41977, "epoch": 352, "lr": 3.6803142051503955e-05} +{"train_loss": 0.0021105108316987753, "global_step": 41978, "epoch": 352, "lr": 3.6801005117073095e-05} +{"train_loss": 0.0011532687349244952, "global_step": 41979, "epoch": 352, "lr": 3.6798868208557025e-05} +{"train_loss": 0.002480481518432498, "global_step": 41980, "epoch": 352, "lr": 3.679673132595999e-05} +{"train_loss": 0.0014224512269720435, "global_step": 41981, "epoch": 352, "lr": 3.679459446928615e-05} +{"train_loss": 0.0018943848554044962, "global_step": 41982, "epoch": 352, "lr": 3.679245763853972e-05} +{"train_loss": 0.001103246584534645, "global_step": 41983, "epoch": 352, "lr": 3.6790320833724895e-05} +{"train_loss": 0.002083753701299429, "global_step": 41984, "epoch": 352, "lr": 3.678818405484584e-05} +{"train_loss": 0.0014477643417194486, "global_step": 41985, "epoch": 352, "lr": 3.67860473019068e-05} +{"train_loss": 0.0024715657345950603, "global_step": 41986, "epoch": 352, "lr": 3.678391057491193e-05} +{"train_loss": 0.0017169369384646416, "global_step": 41987, "epoch": 352, "lr": 3.678177387386545e-05} +{"train_loss": 0.00126751814968884, "global_step": 41988, "epoch": 352, "lr": 3.6779637198771525e-05} +{"train_loss": 0.0014389046700671315, "global_step": 41989, "epoch": 352, "lr": 3.677750054963439e-05} +{"train_loss": 0.0016894773580133915, "global_step": 41990, "epoch": 352, "lr": 3.677536392645823e-05} +{"train_loss": 0.001993644516915083, "global_step": 41991, "epoch": 352, "lr": 3.67732273292472e-05} +{"train_loss": 0.0013121535303071141, "global_step": 41992, "epoch": 352, "lr": 3.677109075800555e-05} +{"train_loss": 0.0015935302944853902, "global_step": 41993, "epoch": 352, "lr": 3.676895421273743e-05} +{"train_loss": 0.002419606316834688, "global_step": 41994, "epoch": 352, "lr": 3.676681769344707e-05} +{"train_loss": 0.0015305281849578023, "global_step": 41995, "epoch": 352, "lr": 3.676468120013863e-05} +{"train_loss": 0.002333050360903144, "global_step": 41996, "epoch": 352, "lr": 3.676254473281635e-05} +{"train_loss": 0.0014918872620910406, "global_step": 41997, "epoch": 352, "lr": 3.676040829148438e-05} +{"train_loss": 0.0030652189161628485, "global_step": 41998, "epoch": 352, "lr": 3.6758271876146944e-05} +{"train_loss": 0.0030421025585383177, "global_step": 41999, "epoch": 352, "lr": 3.675613548680823e-05} +{"train_loss": 0.002479612361639738, "global_step": 42000, "epoch": 352, "lr": 3.675399912347242e-05} +{"train_loss": 0.0011319104814901948, "global_step": 42001, "epoch": 352, "lr": 3.675186278614371e-05} +{"train_loss": 0.001683528651483357, "global_step": 42002, "epoch": 352, "lr": 3.674972647482633e-05} +{"train_loss": 0.0013105362886562943, "global_step": 42003, "epoch": 352, "lr": 3.6747590189524414e-05} +{"train_loss": 0.001857538940384984, "global_step": 42004, "epoch": 352, "lr": 3.674545393024221e-05} +{"train_loss": 0.0012778770178556442, "global_step": 42005, "epoch": 352, "lr": 3.6743317696983884e-05} +{"train_loss": 0.0016672919326297501, "global_step": 42006, "epoch": 352, "lr": 3.674118148975364e-05, "val_loss": 0.020510340109467506} +{"train_loss": 0.001476077944971621, "global_step": 42007, "epoch": 353, "lr": 3.6739045308555656e-05} +{"train_loss": 0.002180586103349924, "global_step": 42008, "epoch": 353, "lr": 3.673690915339416e-05} +{"train_loss": 0.0028103382792323828, "global_step": 42009, "epoch": 353, "lr": 3.673477302427333e-05} +{"train_loss": 0.0020563090220093727, "global_step": 42010, "epoch": 353, "lr": 3.6732636921197336e-05} +{"train_loss": 0.003150376258417964, "global_step": 42011, "epoch": 353, "lr": 3.6730500844170406e-05} +{"train_loss": 0.0016751367365941405, "global_step": 42012, "epoch": 353, "lr": 3.67283647931967e-05} +{"train_loss": 0.0018036968540400267, "global_step": 42013, "epoch": 353, "lr": 3.6726228768280456e-05} +{"train_loss": 0.0013476504245772958, "global_step": 42014, "epoch": 353, "lr": 3.672409276942583e-05} +{"train_loss": 0.0015454047825187445, "global_step": 42015, "epoch": 353, "lr": 3.6721956796637026e-05} +{"train_loss": 0.0018286096164956689, "global_step": 42016, "epoch": 353, "lr": 3.6719820849918255e-05} +{"train_loss": 0.0011675773421302438, "global_step": 42017, "epoch": 353, "lr": 3.671768492927368e-05} +{"train_loss": 0.0017799998167902231, "global_step": 42018, "epoch": 353, "lr": 3.671554903470753e-05} +{"train_loss": 0.0017262758919969201, "global_step": 42019, "epoch": 353, "lr": 3.6713413166223964e-05} +{"train_loss": 0.0013279018457978964, "global_step": 42020, "epoch": 353, "lr": 3.671127732382721e-05} +{"train_loss": 0.002014528028666973, "global_step": 42021, "epoch": 353, "lr": 3.6709141507521437e-05} +{"train_loss": 0.0012562707997858524, "global_step": 42022, "epoch": 353, "lr": 3.670700571731083e-05} +{"train_loss": 0.0012049558572471142, "global_step": 42023, "epoch": 353, "lr": 3.670486995319962e-05} +{"train_loss": 0.0019282232969999313, "global_step": 42024, "epoch": 353, "lr": 3.670273421519195e-05} +{"train_loss": 0.0017194163519889116, "global_step": 42025, "epoch": 353, "lr": 3.670059850329207e-05} +{"train_loss": 0.001321908668614924, "global_step": 42026, "epoch": 353, "lr": 3.6698462817504115e-05} +{"train_loss": 0.0009339784737676382, "global_step": 42027, "epoch": 353, "lr": 3.6696327157832335e-05} +{"train_loss": 0.0021114032715559006, "global_step": 42028, "epoch": 353, "lr": 3.669419152428088e-05} +{"train_loss": 0.0018020534189417958, "global_step": 42029, "epoch": 353, "lr": 3.6692055916853965e-05} +{"train_loss": 0.002965525258332491, "global_step": 42030, "epoch": 353, "lr": 3.6689920335555765e-05} +{"train_loss": 0.0035839895717799664, "global_step": 42031, "epoch": 353, "lr": 3.668778478039049e-05} +{"train_loss": 0.00165769353043288, "global_step": 42032, "epoch": 353, "lr": 3.6685649251362334e-05} +{"train_loss": 0.0014111935161054134, "global_step": 42033, "epoch": 353, "lr": 3.6683513748475484e-05} +{"train_loss": 0.0016339088324457407, "global_step": 42034, "epoch": 353, "lr": 3.668137827173411e-05} +{"train_loss": 0.0013199556851759553, "global_step": 42035, "epoch": 353, "lr": 3.667924282114246e-05} +{"train_loss": 0.002451520413160324, "global_step": 42036, "epoch": 353, "lr": 3.667710739670466e-05} +{"train_loss": 0.001550384215079248, "global_step": 42037, "epoch": 353, "lr": 3.6674971998424966e-05} +{"train_loss": 0.0012358836829662323, "global_step": 42038, "epoch": 353, "lr": 3.6672836626307516e-05} +{"train_loss": 0.0010225246660411358, "global_step": 42039, "epoch": 353, "lr": 3.667070128035655e-05} +{"train_loss": 0.0012712078168988228, "global_step": 42040, "epoch": 353, "lr": 3.666856596057624e-05} +{"train_loss": 0.001654753228649497, "global_step": 42041, "epoch": 353, "lr": 3.666643066697075e-05} +{"train_loss": 0.0014181972946971655, "global_step": 42042, "epoch": 353, "lr": 3.6664295399544323e-05} +{"train_loss": 0.002109942026436329, "global_step": 42043, "epoch": 353, "lr": 3.6662160158301107e-05} +{"train_loss": 0.0013274120865389705, "global_step": 42044, "epoch": 353, "lr": 3.666002494324533e-05} +{"train_loss": 0.0017223303439095616, "global_step": 42045, "epoch": 353, "lr": 3.665788975438116e-05} +{"train_loss": 0.001832075766287744, "global_step": 42046, "epoch": 353, "lr": 3.665575459171281e-05} +{"train_loss": 0.0028275626245886087, "global_step": 42047, "epoch": 353, "lr": 3.665361945524445e-05} +{"train_loss": 0.0020692464895546436, "global_step": 42048, "epoch": 353, "lr": 3.665148434498028e-05} +{"train_loss": 0.0011361808283254504, "global_step": 42049, "epoch": 353, "lr": 3.6649349260924504e-05} +{"train_loss": 0.0013933280715718865, "global_step": 42050, "epoch": 353, "lr": 3.664721420308128e-05} +{"train_loss": 0.0013336704578250647, "global_step": 42051, "epoch": 353, "lr": 3.664507917145485e-05} +{"train_loss": 0.001427782466635108, "global_step": 42052, "epoch": 353, "lr": 3.664294416604939e-05} +{"train_loss": 0.0021656944882124662, "global_step": 42053, "epoch": 353, "lr": 3.6640809186869056e-05} +{"train_loss": 0.0011726298835128546, "global_step": 42054, "epoch": 353, "lr": 3.663867423391808e-05} +{"train_loss": 0.0018019304843619466, "global_step": 42055, "epoch": 353, "lr": 3.6636539307200636e-05} +{"train_loss": 0.001435058657079935, "global_step": 42056, "epoch": 353, "lr": 3.663440440672092e-05} +{"train_loss": 0.0016410053940489888, "global_step": 42057, "epoch": 353, "lr": 3.6632269532483115e-05} +{"train_loss": 0.0017225593328475952, "global_step": 42058, "epoch": 353, "lr": 3.663013468449144e-05} +{"train_loss": 0.0010752466041594744, "global_step": 42059, "epoch": 353, "lr": 3.662799986275006e-05} +{"train_loss": 0.0011814082972705364, "global_step": 42060, "epoch": 353, "lr": 3.662586506726316e-05} +{"train_loss": 0.0018949067452922463, "global_step": 42061, "epoch": 353, "lr": 3.662373029803496e-05} +{"train_loss": 0.0013161007082089782, "global_step": 42062, "epoch": 353, "lr": 3.662159555506962e-05} +{"train_loss": 0.0016386086354032159, "global_step": 42063, "epoch": 353, "lr": 3.6619460838371366e-05} +{"train_loss": 0.0009550043032504618, "global_step": 42064, "epoch": 353, "lr": 3.661732614794435e-05} +{"train_loss": 0.001879674382507801, "global_step": 42065, "epoch": 353, "lr": 3.66151914837928e-05} +{"train_loss": 0.0011943913996219635, "global_step": 42066, "epoch": 353, "lr": 3.66130568459209e-05} +{"train_loss": 0.0020700409077107906, "global_step": 42067, "epoch": 353, "lr": 3.661092223433281e-05} +{"train_loss": 0.002038257895037532, "global_step": 42068, "epoch": 353, "lr": 3.660878764903277e-05} +{"train_loss": 0.0010544601827859879, "global_step": 42069, "epoch": 353, "lr": 3.660665309002492e-05} +{"train_loss": 0.00164241180755198, "global_step": 42070, "epoch": 353, "lr": 3.6604518557313494e-05} +{"train_loss": 0.0007434479775838554, "global_step": 42071, "epoch": 353, "lr": 3.6602384050902665e-05} +{"train_loss": 0.001555318827740848, "global_step": 42072, "epoch": 353, "lr": 3.660024957079661e-05} +{"train_loss": 0.0040190438739955425, "global_step": 42073, "epoch": 353, "lr": 3.659811511699954e-05} +{"train_loss": 0.0013777752174064517, "global_step": 42074, "epoch": 353, "lr": 3.659598068951563e-05} +{"train_loss": 0.0020077372901141644, "global_step": 42075, "epoch": 353, "lr": 3.65938462883491e-05} +{"train_loss": 0.0010540493531152606, "global_step": 42076, "epoch": 353, "lr": 3.6591711913504096e-05} +{"train_loss": 0.0008636112324893475, "global_step": 42077, "epoch": 353, "lr": 3.658957756498486e-05} +{"train_loss": 0.0016777580603957176, "global_step": 42078, "epoch": 353, "lr": 3.6587443242795536e-05} +{"train_loss": 0.002728306455537677, "global_step": 42079, "epoch": 353, "lr": 3.658530894694034e-05} +{"train_loss": 0.0014716198202222586, "global_step": 42080, "epoch": 353, "lr": 3.658317467742346e-05} +{"train_loss": 0.001946255681104958, "global_step": 42081, "epoch": 353, "lr": 3.658104043424907e-05} +{"train_loss": 0.0019463980570435524, "global_step": 42082, "epoch": 353, "lr": 3.657890621742138e-05} +{"train_loss": 0.0012982988264411688, "global_step": 42083, "epoch": 353, "lr": 3.6576772026944594e-05} +{"train_loss": 0.0009860738646239042, "global_step": 42084, "epoch": 353, "lr": 3.657463786282285e-05} +{"train_loss": 0.002545613097026944, "global_step": 42085, "epoch": 353, "lr": 3.65725037250604e-05} +{"train_loss": 0.0018268382409587502, "global_step": 42086, "epoch": 353, "lr": 3.657036961366138e-05} +{"train_loss": 0.001551797497086227, "global_step": 42087, "epoch": 353, "lr": 3.6568235528630026e-05} +{"train_loss": 0.0015353512717410922, "global_step": 42088, "epoch": 353, "lr": 3.656610146997048e-05} +{"train_loss": 0.0014092373894527555, "global_step": 42089, "epoch": 353, "lr": 3.656396743768698e-05} +{"train_loss": 0.0011383870150893927, "global_step": 42090, "epoch": 353, "lr": 3.65618334317837e-05} +{"train_loss": 0.0016386337811127305, "global_step": 42091, "epoch": 353, "lr": 3.65596994522648e-05} +{"train_loss": 0.0020413007587194443, "global_step": 42092, "epoch": 353, "lr": 3.6557565499134515e-05} +{"train_loss": 0.0012966671492904425, "global_step": 42093, "epoch": 353, "lr": 3.655543157239699e-05} +{"train_loss": 0.0017879457445815206, "global_step": 42094, "epoch": 353, "lr": 3.655329767205647e-05} +{"train_loss": 0.0012706158449873328, "global_step": 42095, "epoch": 353, "lr": 3.655116379811708e-05} +{"train_loss": 0.001793533330783248, "global_step": 42096, "epoch": 353, "lr": 3.654902995058308e-05} +{"train_loss": 0.001586622791364789, "global_step": 42097, "epoch": 353, "lr": 3.6546896129458594e-05} +{"train_loss": 0.0014782306971028447, "global_step": 42098, "epoch": 353, "lr": 3.654476233474785e-05} +{"train_loss": 0.0014054829953238368, "global_step": 42099, "epoch": 353, "lr": 3.6542628566455026e-05} +{"train_loss": 0.0015215821331366897, "global_step": 42100, "epoch": 353, "lr": 3.654049482458431e-05} +{"train_loss": 0.0016684074653312564, "global_step": 42101, "epoch": 353, "lr": 3.6538361109139906e-05} +{"train_loss": 0.0010851019760593772, "global_step": 42102, "epoch": 353, "lr": 3.6536227420125995e-05} +{"train_loss": 0.0012033771490678191, "global_step": 42103, "epoch": 353, "lr": 3.6534093757546736e-05} +{"train_loss": 0.0013938858173787594, "global_step": 42104, "epoch": 353, "lr": 3.6531960121406383e-05} +{"train_loss": 0.0012382392305880785, "global_step": 42105, "epoch": 353, "lr": 3.652982651170905e-05} +{"train_loss": 0.0016493157017976046, "global_step": 42106, "epoch": 353, "lr": 3.652769292845899e-05} +{"train_loss": 0.002581990323960781, "global_step": 42107, "epoch": 353, "lr": 3.652555937166035e-05} +{"train_loss": 0.001519448822364211, "global_step": 42108, "epoch": 353, "lr": 3.652342584131735e-05} +{"train_loss": 0.0022474885918200016, "global_step": 42109, "epoch": 353, "lr": 3.652129233743416e-05} +{"train_loss": 0.0007884756778366864, "global_step": 42110, "epoch": 353, "lr": 3.651915886001496e-05} +{"train_loss": 0.0013001782353967428, "global_step": 42111, "epoch": 353, "lr": 3.651702540906397e-05} +{"train_loss": 0.0022825845517218113, "global_step": 42112, "epoch": 353, "lr": 3.651489198458533e-05} +{"train_loss": 0.001601562020368874, "global_step": 42113, "epoch": 353, "lr": 3.651275858658327e-05} +{"train_loss": 0.001833811984397471, "global_step": 42114, "epoch": 353, "lr": 3.6510625215061974e-05} +{"train_loss": 0.0018767071887850761, "global_step": 42115, "epoch": 353, "lr": 3.650849187002563e-05} +{"train_loss": 0.0012388440081849694, "global_step": 42116, "epoch": 353, "lr": 3.6506358551478424e-05} +{"train_loss": 0.0010952888987958431, "global_step": 42117, "epoch": 353, "lr": 3.6504225259424525e-05} +{"train_loss": 0.0018592528067529202, "global_step": 42118, "epoch": 353, "lr": 3.6502091993868155e-05} +{"train_loss": 0.0017458319198340178, "global_step": 42119, "epoch": 353, "lr": 3.6499958754813466e-05} +{"train_loss": 0.001450629555620253, "global_step": 42120, "epoch": 353, "lr": 3.649782554226468e-05} +{"train_loss": 0.0019369308138266206, "global_step": 42121, "epoch": 353, "lr": 3.649569235622598e-05} +{"train_loss": 0.0014530990738421679, "global_step": 42122, "epoch": 353, "lr": 3.649355919670152e-05} +{"train_loss": 0.0015004175947979093, "global_step": 42123, "epoch": 353, "lr": 3.649142606369554e-05} +{"train_loss": 0.0017542190616950393, "global_step": 42124, "epoch": 353, "lr": 3.6489292957212175e-05} +{"train_loss": 0.0016612605570361582, "global_step": 42125, "epoch": 353, "lr": 3.648715987725566e-05, "val_loss": 0.011519042775034904} +{"train_loss": 0.001548656146042049, "global_step": 42126, "epoch": 354, "lr": 3.648502682383015e-05} +{"train_loss": 0.00162542297039181, "global_step": 42127, "epoch": 354, "lr": 3.648289379693986e-05} +{"train_loss": 0.0020430576987564564, "global_step": 42128, "epoch": 354, "lr": 3.648076079658895e-05} +{"train_loss": 0.003388033015653491, "global_step": 42129, "epoch": 354, "lr": 3.647862782278163e-05} +{"train_loss": 0.0015083890175446868, "global_step": 42130, "epoch": 354, "lr": 3.647649487552208e-05} +{"train_loss": 0.0011635577538982034, "global_step": 42131, "epoch": 354, "lr": 3.6474361954814486e-05} +{"train_loss": 0.002692226553335786, "global_step": 42132, "epoch": 354, "lr": 3.6472229060663035e-05} +{"train_loss": 0.0019398508593440056, "global_step": 42133, "epoch": 354, "lr": 3.6470096193071915e-05} +{"train_loss": 0.0031362713780254126, "global_step": 42134, "epoch": 354, "lr": 3.6467963352045313e-05} +{"train_loss": 0.0024568215012550354, "global_step": 42135, "epoch": 354, "lr": 3.646583053758744e-05} +{"train_loss": 0.0011229722294956446, "global_step": 42136, "epoch": 354, "lr": 3.646369774970243e-05} +{"train_loss": 0.002120445016771555, "global_step": 42137, "epoch": 354, "lr": 3.646156498839454e-05} +{"train_loss": 0.00145576405338943, "global_step": 42138, "epoch": 354, "lr": 3.645943225366789e-05} +{"train_loss": 0.0012073698453605175, "global_step": 42139, "epoch": 354, "lr": 3.6457299545526716e-05} +{"train_loss": 0.0010160740930587053, "global_step": 42140, "epoch": 354, "lr": 3.645516686397519e-05} +{"train_loss": 0.0012332095066085458, "global_step": 42141, "epoch": 354, "lr": 3.645303420901748e-05} +{"train_loss": 0.0022806753404438496, "global_step": 42142, "epoch": 354, "lr": 3.6450901580657805e-05} +{"train_loss": 0.000949317472986877, "global_step": 42143, "epoch": 354, "lr": 3.644876897890032e-05} +{"train_loss": 0.001893838169053197, "global_step": 42144, "epoch": 354, "lr": 3.644663640374925e-05} +{"train_loss": 0.0011827604612335563, "global_step": 42145, "epoch": 354, "lr": 3.644450385520874e-05} +{"train_loss": 0.001952443621121347, "global_step": 42146, "epoch": 354, "lr": 3.644237133328302e-05} +{"train_loss": 0.0009997396264225245, "global_step": 42147, "epoch": 354, "lr": 3.644023883797625e-05} +{"train_loss": 0.0025819125585258007, "global_step": 42148, "epoch": 354, "lr": 3.6438106369292605e-05} +{"train_loss": 0.0024726376868784428, "global_step": 42149, "epoch": 354, "lr": 3.643597392723631e-05} +{"train_loss": 0.0009621928911656141, "global_step": 42150, "epoch": 354, "lr": 3.643384151181151e-05} +{"train_loss": 0.0011064724531024694, "global_step": 42151, "epoch": 354, "lr": 3.643170912302243e-05} +{"train_loss": 0.001785480068065226, "global_step": 42152, "epoch": 354, "lr": 3.642957676087325e-05} +{"train_loss": 0.0013414992718026042, "global_step": 42153, "epoch": 354, "lr": 3.642744442536812e-05} +{"train_loss": 0.0022475547157227993, "global_step": 42154, "epoch": 354, "lr": 3.642531211651128e-05} +{"train_loss": 0.0026155582163482904, "global_step": 42155, "epoch": 354, "lr": 3.6423179834306856e-05} +{"train_loss": 0.0018567306688055396, "global_step": 42156, "epoch": 354, "lr": 3.64210475787591e-05} +{"train_loss": 0.0006242644740268588, "global_step": 42157, "epoch": 354, "lr": 3.641891534987214e-05} +{"train_loss": 0.0018109381198883057, "global_step": 42158, "epoch": 354, "lr": 3.6416783147650216e-05} +{"train_loss": 0.00159838970284909, "global_step": 42159, "epoch": 354, "lr": 3.6414650972097476e-05} +{"train_loss": 0.0026636412367224693, "global_step": 42160, "epoch": 354, "lr": 3.64125188232181e-05} +{"train_loss": 0.0025833970867097378, "global_step": 42161, "epoch": 354, "lr": 3.6410386701016307e-05} +{"train_loss": 0.002878390019759536, "global_step": 42162, "epoch": 354, "lr": 3.640825460549627e-05} +{"train_loss": 0.0017048807349056005, "global_step": 42163, "epoch": 354, "lr": 3.640612253666217e-05} +{"train_loss": 0.0018502145539969206, "global_step": 42164, "epoch": 354, "lr": 3.640399049451819e-05} +{"train_loss": 0.0018522217869758606, "global_step": 42165, "epoch": 354, "lr": 3.6401858479068526e-05} +{"train_loss": 0.001610312145203352, "global_step": 42166, "epoch": 354, "lr": 3.6399726490317376e-05} +{"train_loss": 0.0017896039644256234, "global_step": 42167, "epoch": 354, "lr": 3.639759452826888e-05} +{"train_loss": 0.0025038805324584246, "global_step": 42168, "epoch": 354, "lr": 3.639546259292728e-05} +{"train_loss": 0.0027733659371733665, "global_step": 42169, "epoch": 354, "lr": 3.639333068429671e-05} +{"train_loss": 0.0018110009841620922, "global_step": 42170, "epoch": 354, "lr": 3.639119880238141e-05} +{"train_loss": 0.0016235675429925323, "global_step": 42171, "epoch": 354, "lr": 3.6389066947185534e-05} +{"train_loss": 0.001453644479624927, "global_step": 42172, "epoch": 354, "lr": 3.638693511871325e-05} +{"train_loss": 0.0027823762502521276, "global_step": 42173, "epoch": 354, "lr": 3.638480331696879e-05} +{"train_loss": 0.0015487041091546416, "global_step": 42174, "epoch": 354, "lr": 3.6382671541956285e-05} +{"train_loss": 0.0032027619890868664, "global_step": 42175, "epoch": 354, "lr": 3.638053979367998e-05} +{"train_loss": 0.002370835980400443, "global_step": 42176, "epoch": 354, "lr": 3.6378408072144e-05} +{"train_loss": 0.001343023614026606, "global_step": 42177, "epoch": 354, "lr": 3.637627637735258e-05} +{"train_loss": 0.001741743995808065, "global_step": 42178, "epoch": 354, "lr": 3.6374144709309884e-05} +{"train_loss": 0.0024462584406137466, "global_step": 42179, "epoch": 354, "lr": 3.637201306802009e-05} +{"train_loss": 0.0020539399702101946, "global_step": 42180, "epoch": 354, "lr": 3.6369881453487407e-05} +{"train_loss": 0.0016308898339048028, "global_step": 42181, "epoch": 354, "lr": 3.6367749865715995e-05} +{"train_loss": 0.002726407954469323, "global_step": 42182, "epoch": 354, "lr": 3.6365618304710046e-05} +{"train_loss": 0.0019588321447372437, "global_step": 42183, "epoch": 354, "lr": 3.6363486770473746e-05} +{"train_loss": 0.001920667476952076, "global_step": 42184, "epoch": 354, "lr": 3.6361355263011297e-05} +{"train_loss": 0.0032443501986563206, "global_step": 42185, "epoch": 354, "lr": 3.635922378232688e-05} +{"train_loss": 0.0029225389007478952, "global_step": 42186, "epoch": 354, "lr": 3.635709232842465e-05} +{"train_loss": 0.0024889297783374786, "global_step": 42187, "epoch": 354, "lr": 3.6354960901308824e-05} +{"train_loss": 0.001178742153570056, "global_step": 42188, "epoch": 354, "lr": 3.635282950098355e-05} +{"train_loss": 0.001318771974183619, "global_step": 42189, "epoch": 354, "lr": 3.6350698127453067e-05} +{"train_loss": 0.0020582336001098156, "global_step": 42190, "epoch": 354, "lr": 3.634856678072153e-05} +{"train_loss": 0.0027829341124743223, "global_step": 42191, "epoch": 354, "lr": 3.6346435460793097e-05} +{"train_loss": 0.0021281130611896515, "global_step": 42192, "epoch": 354, "lr": 3.6344304167671996e-05} +{"train_loss": 0.0018094510305672884, "global_step": 42193, "epoch": 354, "lr": 3.634217290136238e-05} +{"train_loss": 0.0021443041041493416, "global_step": 42194, "epoch": 354, "lr": 3.6340041661868475e-05} +{"train_loss": 0.002071546157822013, "global_step": 42195, "epoch": 354, "lr": 3.633791044919441e-05} +{"train_loss": 0.0013471313286572695, "global_step": 42196, "epoch": 354, "lr": 3.633577926334441e-05} +{"train_loss": 0.0024095450062304735, "global_step": 42197, "epoch": 354, "lr": 3.6333648104322657e-05} +{"train_loss": 0.0013798876898363233, "global_step": 42198, "epoch": 354, "lr": 3.633151697213331e-05} +{"train_loss": 0.0009629235719330609, "global_step": 42199, "epoch": 354, "lr": 3.632938586678058e-05} +{"train_loss": 0.0016710117924958467, "global_step": 42200, "epoch": 354, "lr": 3.632725478826864e-05} +{"train_loss": 0.0018113363767042756, "global_step": 42201, "epoch": 354, "lr": 3.632512373660168e-05} +{"train_loss": 0.002106479834765196, "global_step": 42202, "epoch": 354, "lr": 3.632299271178388e-05} +{"train_loss": 0.0018562907353043556, "global_step": 42203, "epoch": 354, "lr": 3.63208617138194e-05} +{"train_loss": 0.0015130635583773255, "global_step": 42204, "epoch": 354, "lr": 3.631873074271247e-05} +{"train_loss": 0.0011914498172700405, "global_step": 42205, "epoch": 354, "lr": 3.631659979846723e-05} +{"train_loss": 0.0026256756391376257, "global_step": 42206, "epoch": 354, "lr": 3.6314468881087905e-05} +{"train_loss": 0.0027170847170054913, "global_step": 42207, "epoch": 354, "lr": 3.631233799057864e-05} +{"train_loss": 0.0022321895230561495, "global_step": 42208, "epoch": 354, "lr": 3.631020712694366e-05} +{"train_loss": 0.001296170987188816, "global_step": 42209, "epoch": 354, "lr": 3.630807629018712e-05} +{"train_loss": 0.0022437414154410362, "global_step": 42210, "epoch": 354, "lr": 3.630594548031319e-05} +{"train_loss": 0.0017971934285014868, "global_step": 42211, "epoch": 354, "lr": 3.6303814697326075e-05} +{"train_loss": 0.0018230119021609426, "global_step": 42212, "epoch": 354, "lr": 3.630168394122997e-05} +{"train_loss": 0.0025498890317976475, "global_step": 42213, "epoch": 354, "lr": 3.629955321202904e-05} +{"train_loss": 0.001583461300469935, "global_step": 42214, "epoch": 354, "lr": 3.6297422509727476e-05} +{"train_loss": 0.0018586922669783235, "global_step": 42215, "epoch": 354, "lr": 3.629529183432946e-05} +{"train_loss": 0.0026246842462569475, "global_step": 42216, "epoch": 354, "lr": 3.629316118583918e-05} +{"train_loss": 0.002213460858911276, "global_step": 42217, "epoch": 354, "lr": 3.6291030564260794e-05} +{"train_loss": 0.0013139389920979738, "global_step": 42218, "epoch": 354, "lr": 3.628889996959852e-05} +{"train_loss": 0.0021974623668938875, "global_step": 42219, "epoch": 354, "lr": 3.6286769401856515e-05} +{"train_loss": 0.002519118133932352, "global_step": 42220, "epoch": 354, "lr": 3.628463886103899e-05} +{"train_loss": 0.002284551504999399, "global_step": 42221, "epoch": 354, "lr": 3.628250834715011e-05} +{"train_loss": 0.0013902455102652311, "global_step": 42222, "epoch": 354, "lr": 3.628037786019404e-05} +{"train_loss": 0.001865845755673945, "global_step": 42223, "epoch": 354, "lr": 3.6278247400175e-05} +{"train_loss": 0.0015307193389162421, "global_step": 42224, "epoch": 354, "lr": 3.627611696709714e-05} +{"train_loss": 0.001608049962669611, "global_step": 42225, "epoch": 354, "lr": 3.627398656096468e-05} +{"train_loss": 0.0018739908700808883, "global_step": 42226, "epoch": 354, "lr": 3.627185618178176e-05} +{"train_loss": 0.0009585272637195885, "global_step": 42227, "epoch": 354, "lr": 3.62697258295526e-05} +{"train_loss": 0.0020010557491332293, "global_step": 42228, "epoch": 354, "lr": 3.626759550428136e-05} +{"train_loss": 0.0008639926090836525, "global_step": 42229, "epoch": 354, "lr": 3.626546520597223e-05} +{"train_loss": 0.0014175965916365385, "global_step": 42230, "epoch": 354, "lr": 3.6263334934629376e-05} +{"train_loss": 0.0011877984507009387, "global_step": 42231, "epoch": 354, "lr": 3.6261204690257003e-05} +{"train_loss": 0.0016490344423800707, "global_step": 42232, "epoch": 354, "lr": 3.62590744728593e-05} +{"train_loss": 0.0015922215534374118, "global_step": 42233, "epoch": 354, "lr": 3.625694428244042e-05} +{"train_loss": 0.0016147944843396544, "global_step": 42234, "epoch": 354, "lr": 3.625481411900459e-05} +{"train_loss": 0.00124673533719033, "global_step": 42235, "epoch": 354, "lr": 3.625268398255595e-05} +{"train_loss": 0.0013132808962836862, "global_step": 42236, "epoch": 354, "lr": 3.625055387309868e-05} +{"train_loss": 0.0015028921188786626, "global_step": 42237, "epoch": 354, "lr": 3.6248423790637e-05} +{"train_loss": 0.0014945653965696692, "global_step": 42238, "epoch": 354, "lr": 3.624629373517505e-05} +{"train_loss": 0.0022231778129935265, "global_step": 42239, "epoch": 354, "lr": 3.624416370671705e-05} +{"train_loss": 0.0013724282616749406, "global_step": 42240, "epoch": 354, "lr": 3.624203370526718e-05} +{"train_loss": 0.0012670205906033516, "global_step": 42241, "epoch": 354, "lr": 3.623990373082957e-05} +{"train_loss": 0.0007941237417981029, "global_step": 42242, "epoch": 354, "lr": 3.623777378340846e-05} +{"train_loss": 0.0013472159625962377, "global_step": 42243, "epoch": 354, "lr": 3.6235643863007996e-05} +{"train_loss": 0.0018523217006703886, "global_step": 42244, "epoch": 354, "lr": 3.6233513969632395e-05, "val_loss": 0.017532985657453537} +{"train_loss": 0.0014219713630154729, "global_step": 42245, "epoch": 355, "lr": 3.623138410328579e-05} +{"train_loss": 0.001617801608517766, "global_step": 42246, "epoch": 355, "lr": 3.6229254263972414e-05} +{"train_loss": 0.0016763968160375953, "global_step": 42247, "epoch": 355, "lr": 3.622712445169643e-05} +{"train_loss": 0.001258876989595592, "global_step": 42248, "epoch": 355, "lr": 3.6224994666462e-05} +{"train_loss": 0.0007831244147382677, "global_step": 42249, "epoch": 355, "lr": 3.622286490827334e-05} +{"train_loss": 0.0011795575264841318, "global_step": 42250, "epoch": 355, "lr": 3.6220735177134585e-05} +{"train_loss": 0.0015912005910649896, "global_step": 42251, "epoch": 355, "lr": 3.621860547304997e-05} +{"train_loss": 0.0016937488690018654, "global_step": 42252, "epoch": 355, "lr": 3.621647579602363e-05} +{"train_loss": 0.0011298817116767168, "global_step": 42253, "epoch": 355, "lr": 3.621434614605979e-05} +{"train_loss": 0.0020085866563022137, "global_step": 42254, "epoch": 355, "lr": 3.6212216523162604e-05} +{"train_loss": 0.0017342405626550317, "global_step": 42255, "epoch": 355, "lr": 3.621008692733624e-05} +{"train_loss": 0.0011394373141229153, "global_step": 42256, "epoch": 355, "lr": 3.620795735858492e-05} +{"train_loss": 0.0011197167914360762, "global_step": 42257, "epoch": 355, "lr": 3.620582781691278e-05} +{"train_loss": 0.0008590592769905925, "global_step": 42258, "epoch": 355, "lr": 3.620369830232404e-05} +{"train_loss": 0.0015842677094042301, "global_step": 42259, "epoch": 355, "lr": 3.620156881482286e-05} +{"train_loss": 0.00322833308018744, "global_step": 42260, "epoch": 355, "lr": 3.619943935441342e-05} +{"train_loss": 0.0015007908223196864, "global_step": 42261, "epoch": 355, "lr": 3.619730992109991e-05} +{"train_loss": 0.002383202314376831, "global_step": 42262, "epoch": 355, "lr": 3.6195180514886515e-05} +{"train_loss": 0.0019705365411937237, "global_step": 42263, "epoch": 355, "lr": 3.61930511357774e-05} +{"train_loss": 0.0013753154780715704, "global_step": 42264, "epoch": 355, "lr": 3.6190921783776754e-05} +{"train_loss": 0.0012147434754297137, "global_step": 42265, "epoch": 355, "lr": 3.618879245888875e-05} +{"train_loss": 0.0011975993402302265, "global_step": 42266, "epoch": 355, "lr": 3.61866631611176e-05} +{"train_loss": 0.00260328920558095, "global_step": 42267, "epoch": 355, "lr": 3.618453389046744e-05} +{"train_loss": 0.0015895417891442776, "global_step": 42268, "epoch": 355, "lr": 3.618240464694248e-05} +{"train_loss": 0.0014086022274568677, "global_step": 42269, "epoch": 355, "lr": 3.618027543054688e-05} +{"train_loss": 0.0018681309884414077, "global_step": 42270, "epoch": 355, "lr": 3.617814624128486e-05} +{"train_loss": 0.0014971167547628284, "global_step": 42271, "epoch": 355, "lr": 3.617601707916056e-05} +{"train_loss": 0.00113271689042449, "global_step": 42272, "epoch": 355, "lr": 3.617388794417817e-05} +{"train_loss": 0.0018576167058199644, "global_step": 42273, "epoch": 355, "lr": 3.617175883634188e-05} +{"train_loss": 0.0012376818340271711, "global_step": 42274, "epoch": 355, "lr": 3.6169629755655845e-05} +{"train_loss": 0.001405071932822466, "global_step": 42275, "epoch": 355, "lr": 3.616750070212429e-05} +{"train_loss": 0.0010683287400752306, "global_step": 42276, "epoch": 355, "lr": 3.6165371675751344e-05} +{"train_loss": 0.0014244354097172618, "global_step": 42277, "epoch": 355, "lr": 3.616324267654123e-05} +{"train_loss": 0.0016193685587495565, "global_step": 42278, "epoch": 355, "lr": 3.616111370449811e-05} +{"train_loss": 0.0007760997395962477, "global_step": 42279, "epoch": 355, "lr": 3.615898475962616e-05} +{"train_loss": 0.001564792008139193, "global_step": 42280, "epoch": 355, "lr": 3.615685584192956e-05} +{"train_loss": 0.001478617312386632, "global_step": 42281, "epoch": 355, "lr": 3.615472695141249e-05} +{"train_loss": 0.0010941295186057687, "global_step": 42282, "epoch": 355, "lr": 3.615259808807916e-05} +{"train_loss": 0.001175352605059743, "global_step": 42283, "epoch": 355, "lr": 3.6150469251933695e-05} +{"train_loss": 0.0018307364080101252, "global_step": 42284, "epoch": 355, "lr": 3.614834044298033e-05} +{"train_loss": 0.0010804872727021575, "global_step": 42285, "epoch": 355, "lr": 3.614621166122322e-05} +{"train_loss": 0.001519974903203547, "global_step": 42286, "epoch": 355, "lr": 3.6144082906666516e-05} +{"train_loss": 0.0007104860851541162, "global_step": 42287, "epoch": 355, "lr": 3.614195417931445e-05} +{"train_loss": 0.0013770946534350514, "global_step": 42288, "epoch": 355, "lr": 3.613982547917115e-05} +{"train_loss": 0.0013425800716504455, "global_step": 42289, "epoch": 355, "lr": 3.613769680624085e-05} +{"train_loss": 0.0013925255043432117, "global_step": 42290, "epoch": 355, "lr": 3.61355681605277e-05} +{"train_loss": 0.003997722174972296, "global_step": 42291, "epoch": 355, "lr": 3.613343954203586e-05} +{"train_loss": 0.0007881583878770471, "global_step": 42292, "epoch": 355, "lr": 3.6131310950769545e-05} +{"train_loss": 0.0027209771797060966, "global_step": 42293, "epoch": 355, "lr": 3.6129182386732906e-05} +{"train_loss": 0.0019422961631789804, "global_step": 42294, "epoch": 355, "lr": 3.6127053849930145e-05} +{"train_loss": 0.0025884490460157394, "global_step": 42295, "epoch": 355, "lr": 3.612492534036544e-05} +{"train_loss": 0.001437787082977593, "global_step": 42296, "epoch": 355, "lr": 3.612279685804294e-05} +{"train_loss": 0.002587200840935111, "global_step": 42297, "epoch": 355, "lr": 3.612066840296687e-05} +{"train_loss": 0.0008664820925332606, "global_step": 42298, "epoch": 355, "lr": 3.6118539975141364e-05} +{"train_loss": 0.0018264406826347113, "global_step": 42299, "epoch": 355, "lr": 3.611641157457064e-05} +{"train_loss": 0.0012009612983092666, "global_step": 42300, "epoch": 355, "lr": 3.611428320125884e-05} +{"train_loss": 0.001995016820728779, "global_step": 42301, "epoch": 355, "lr": 3.611215485521018e-05} +{"train_loss": 0.001650535617955029, "global_step": 42302, "epoch": 355, "lr": 3.61100265364288e-05} +{"train_loss": 0.0010919634951278567, "global_step": 42303, "epoch": 355, "lr": 3.6107898244918914e-05} +{"train_loss": 0.0012327329022809863, "global_step": 42304, "epoch": 355, "lr": 3.610576998068469e-05} +{"train_loss": 0.001308203092776239, "global_step": 42305, "epoch": 355, "lr": 3.610364174373029e-05} +{"train_loss": 0.0008527723839506507, "global_step": 42306, "epoch": 355, "lr": 3.610151353405991e-05} +{"train_loss": 0.0013340241275727749, "global_step": 42307, "epoch": 355, "lr": 3.609938535167772e-05} +{"train_loss": 0.003809961723163724, "global_step": 42308, "epoch": 355, "lr": 3.609725719658791e-05} +{"train_loss": 0.0009684932883828878, "global_step": 42309, "epoch": 355, "lr": 3.609512906879464e-05} +{"train_loss": 0.0017104718135669827, "global_step": 42310, "epoch": 355, "lr": 3.609300096830211e-05} +{"train_loss": 0.0017938331002369523, "global_step": 42311, "epoch": 355, "lr": 3.609087289511447e-05} +{"train_loss": 0.0013698502443730831, "global_step": 42312, "epoch": 355, "lr": 3.608874484923592e-05} +{"train_loss": 0.0013897675089538097, "global_step": 42313, "epoch": 355, "lr": 3.608661683067065e-05} +{"train_loss": 0.0015462725423276424, "global_step": 42314, "epoch": 355, "lr": 3.60844888394228e-05} +{"train_loss": 0.0014148567570373416, "global_step": 42315, "epoch": 355, "lr": 3.608236087549658e-05} +{"train_loss": 0.0023357593454420567, "global_step": 42316, "epoch": 355, "lr": 3.6080232938896166e-05} +{"train_loss": 0.0009525833884254098, "global_step": 42317, "epoch": 355, "lr": 3.6078105029625705e-05} +{"train_loss": 0.0015230714343488216, "global_step": 42318, "epoch": 355, "lr": 3.607597714768942e-05} +{"train_loss": 0.001102758222259581, "global_step": 42319, "epoch": 355, "lr": 3.6073849293091446e-05} +{"train_loss": 0.0017462853575125337, "global_step": 42320, "epoch": 355, "lr": 3.607172146583601e-05} +{"train_loss": 0.0016374388942494988, "global_step": 42321, "epoch": 355, "lr": 3.6069593665927246e-05} +{"train_loss": 0.001152952783741057, "global_step": 42322, "epoch": 355, "lr": 3.606746589336933e-05} +{"train_loss": 0.0015565984649583697, "global_step": 42323, "epoch": 355, "lr": 3.6065338148166485e-05} +{"train_loss": 0.0013525558169931173, "global_step": 42324, "epoch": 355, "lr": 3.606321043032282e-05} +{"train_loss": 0.0014937289524823427, "global_step": 42325, "epoch": 355, "lr": 3.606108273984259e-05} +{"train_loss": 0.0012482155580073595, "global_step": 42326, "epoch": 355, "lr": 3.6058955076729914e-05} +{"train_loss": 0.002882108325138688, "global_step": 42327, "epoch": 355, "lr": 3.6056827440989006e-05} +{"train_loss": 0.0017365965759381652, "global_step": 42328, "epoch": 355, "lr": 3.605469983262402e-05} +{"train_loss": 0.0012639061314985156, "global_step": 42329, "epoch": 355, "lr": 3.605257225163913e-05} +{"train_loss": 0.0016893005231395364, "global_step": 42330, "epoch": 355, "lr": 3.605044469803854e-05} +{"train_loss": 0.0025176997296512127, "global_step": 42331, "epoch": 355, "lr": 3.60483171718264e-05} +{"train_loss": 0.0015590718248859048, "global_step": 42332, "epoch": 355, "lr": 3.6046189673006915e-05} +{"train_loss": 0.001494065742008388, "global_step": 42333, "epoch": 355, "lr": 3.6044062201584225e-05} +{"train_loss": 0.0018002208089455962, "global_step": 42334, "epoch": 355, "lr": 3.604193475756255e-05} +{"train_loss": 0.0013799801236018538, "global_step": 42335, "epoch": 355, "lr": 3.603980734094604e-05} +{"train_loss": 0.0021401543635874987, "global_step": 42336, "epoch": 355, "lr": 3.603767995173886e-05} +{"train_loss": 0.001989637967199087, "global_step": 42337, "epoch": 355, "lr": 3.603555258994523e-05} +{"train_loss": 0.0019368387293070555, "global_step": 42338, "epoch": 355, "lr": 3.603342525556927e-05} +{"train_loss": 0.002275883685797453, "global_step": 42339, "epoch": 355, "lr": 3.603129794861521e-05} +{"train_loss": 0.00192360975779593, "global_step": 42340, "epoch": 355, "lr": 3.602917066908721e-05} +{"train_loss": 0.0020824018865823746, "global_step": 42341, "epoch": 355, "lr": 3.602704341698942e-05} +{"train_loss": 0.001774730859324336, "global_step": 42342, "epoch": 355, "lr": 3.602491619232604e-05} +{"train_loss": 0.0022126114927232265, "global_step": 42343, "epoch": 355, "lr": 3.602278899510125e-05} +{"train_loss": 0.0012284459080547094, "global_step": 42344, "epoch": 355, "lr": 3.6020661825319216e-05} +{"train_loss": 0.0018132049590349197, "global_step": 42345, "epoch": 355, "lr": 3.601853468298412e-05} +{"train_loss": 0.002459337003529072, "global_step": 42346, "epoch": 355, "lr": 3.601640756810014e-05} +{"train_loss": 0.0013193123741075397, "global_step": 42347, "epoch": 355, "lr": 3.6014280480671455e-05} +{"train_loss": 0.0014859066577628255, "global_step": 42348, "epoch": 355, "lr": 3.601215342070222e-05} +{"train_loss": 0.001581894000992179, "global_step": 42349, "epoch": 355, "lr": 3.601002638819665e-05} +{"train_loss": 0.002263471018522978, "global_step": 42350, "epoch": 355, "lr": 3.600789938315888e-05} +{"train_loss": 0.0022768699564039707, "global_step": 42351, "epoch": 355, "lr": 3.600577240559312e-05} +{"train_loss": 0.0007229180773720145, "global_step": 42352, "epoch": 355, "lr": 3.600364545550351e-05} +{"train_loss": 0.0013221015688031912, "global_step": 42353, "epoch": 355, "lr": 3.6001518532894265e-05} +{"train_loss": 0.0013849860988557339, "global_step": 42354, "epoch": 355, "lr": 3.5999391637769556e-05} +{"train_loss": 0.0013524204259738326, "global_step": 42355, "epoch": 355, "lr": 3.599726477013351e-05} +{"train_loss": 0.0017247687792405486, "global_step": 42356, "epoch": 355, "lr": 3.599513792999036e-05} +{"train_loss": 0.0017949934117496014, "global_step": 42357, "epoch": 355, "lr": 3.5993011117344254e-05} +{"train_loss": 0.001378655550070107, "global_step": 42358, "epoch": 355, "lr": 3.599088433219938e-05} +{"train_loss": 0.00255403365008533, "global_step": 42359, "epoch": 355, "lr": 3.59887575745599e-05} +{"train_loss": 0.0014291736297309399, "global_step": 42360, "epoch": 355, "lr": 3.598663084443001e-05} +{"train_loss": 0.001113657490350306, "global_step": 42361, "epoch": 355, "lr": 3.5984504141813866e-05} +{"train_loss": 0.0009472179226577282, "global_step": 42362, "epoch": 355, "lr": 3.598237746671564e-05} +{"train_loss": 0.001609484526180044, "global_step": 42363, "epoch": 355, "lr": 3.598025081913953e-05, "val_loss": 0.016217228025197983, "train_action_mse_error": 2.533828592277132e-05} +{"train_loss": 0.002792556071653962, "global_step": 42364, "epoch": 356, "lr": 3.597812419908969e-05} +{"train_loss": 0.0013470479752868414, "global_step": 42365, "epoch": 356, "lr": 3.597599760657032e-05} +{"train_loss": 0.0011772074503824115, "global_step": 42366, "epoch": 356, "lr": 3.597387104158558e-05} +{"train_loss": 0.0012183253420516849, "global_step": 42367, "epoch": 356, "lr": 3.597174450413964e-05} +{"train_loss": 0.0013358244905248284, "global_step": 42368, "epoch": 356, "lr": 3.5969617994236684e-05} +{"train_loss": 0.0016637466615065932, "global_step": 42369, "epoch": 356, "lr": 3.596749151188087e-05} +{"train_loss": 0.001223238417878747, "global_step": 42370, "epoch": 356, "lr": 3.5965365057076404e-05} +{"train_loss": 0.0016947697149589658, "global_step": 42371, "epoch": 356, "lr": 3.596323862982743e-05} +{"train_loss": 0.001287474180571735, "global_step": 42372, "epoch": 356, "lr": 3.596111223013815e-05} +{"train_loss": 0.0018178640166297555, "global_step": 42373, "epoch": 356, "lr": 3.5958985858012735e-05} +{"train_loss": 0.0012863300507888198, "global_step": 42374, "epoch": 356, "lr": 3.595685951345533e-05} +{"train_loss": 0.0010669982293620706, "global_step": 42375, "epoch": 356, "lr": 3.5954733196470146e-05} +{"train_loss": 0.0014352903235703707, "global_step": 42376, "epoch": 356, "lr": 3.595260690706133e-05} +{"train_loss": 0.0015451500657945871, "global_step": 42377, "epoch": 356, "lr": 3.5950480645233066e-05} +{"train_loss": 0.0015599833568558097, "global_step": 42378, "epoch": 356, "lr": 3.594835441098955e-05} +{"train_loss": 0.0016098929336294532, "global_step": 42379, "epoch": 356, "lr": 3.594622820433492e-05} +{"train_loss": 0.0016554961912333965, "global_step": 42380, "epoch": 356, "lr": 3.594410202527339e-05} +{"train_loss": 0.0012569997925311327, "global_step": 42381, "epoch": 356, "lr": 3.5941975873809096e-05} +{"train_loss": 0.0013489327393472195, "global_step": 42382, "epoch": 356, "lr": 3.5939849749946246e-05} +{"train_loss": 0.0018612557323649526, "global_step": 42383, "epoch": 356, "lr": 3.593772365368898e-05} +{"train_loss": 0.0011774692684412003, "global_step": 42384, "epoch": 356, "lr": 3.593559758504152e-05} +{"train_loss": 0.0009174904553219676, "global_step": 42385, "epoch": 356, "lr": 3.5933471544008e-05} +{"train_loss": 0.0009698002249933779, "global_step": 42386, "epoch": 356, "lr": 3.593134553059259e-05} +{"train_loss": 0.002212175168097019, "global_step": 42387, "epoch": 356, "lr": 3.5929219544799496e-05} +{"train_loss": 0.0015425925375893712, "global_step": 42388, "epoch": 356, "lr": 3.592709358663286e-05} +{"train_loss": 0.0014841241063550115, "global_step": 42389, "epoch": 356, "lr": 3.592496765609689e-05} +{"train_loss": 0.0018621811177581549, "global_step": 42390, "epoch": 356, "lr": 3.5922841753195744e-05} +{"train_loss": 0.0010740476427599788, "global_step": 42391, "epoch": 356, "lr": 3.5920715877933574e-05} +{"train_loss": 0.001536769443191588, "global_step": 42392, "epoch": 356, "lr": 3.591859003031459e-05} +{"train_loss": 0.0010668919421732426, "global_step": 42393, "epoch": 356, "lr": 3.5916464210342935e-05} +{"train_loss": 0.0009011545917019248, "global_step": 42394, "epoch": 356, "lr": 3.5914338418022814e-05} +{"train_loss": 0.0019853326957672834, "global_step": 42395, "epoch": 356, "lr": 3.591221265335838e-05} +{"train_loss": 0.0012391529744490981, "global_step": 42396, "epoch": 356, "lr": 3.591008691635381e-05} +{"train_loss": 0.0015200425405055285, "global_step": 42397, "epoch": 356, "lr": 3.590796120701328e-05} +{"train_loss": 0.0017399482894688845, "global_step": 42398, "epoch": 356, "lr": 3.590583552534096e-05} +{"train_loss": 0.0009436489781364799, "global_step": 42399, "epoch": 356, "lr": 3.5903709871341036e-05} +{"train_loss": 0.0015762306284159422, "global_step": 42400, "epoch": 356, "lr": 3.590158424501765e-05} +{"train_loss": 0.0007562559330835938, "global_step": 42401, "epoch": 356, "lr": 3.5899458646375026e-05} +{"train_loss": 0.002645130269229412, "global_step": 42402, "epoch": 356, "lr": 3.589733307541728e-05} +{"train_loss": 0.0008624718175269663, "global_step": 42403, "epoch": 356, "lr": 3.589520753214863e-05} +{"train_loss": 0.0016380979213863611, "global_step": 42404, "epoch": 356, "lr": 3.589308201657325e-05} +{"train_loss": 0.0010857261950150132, "global_step": 42405, "epoch": 356, "lr": 3.5890956528695264e-05} +{"train_loss": 0.0013309784699231386, "global_step": 42406, "epoch": 356, "lr": 3.58888310685189e-05} +{"train_loss": 0.00087530049495399, "global_step": 42407, "epoch": 356, "lr": 3.588670563604829e-05} +{"train_loss": 0.001042481162585318, "global_step": 42408, "epoch": 356, "lr": 3.588458023128764e-05} +{"train_loss": 0.0026987905148416758, "global_step": 42409, "epoch": 356, "lr": 3.588245485424111e-05} +{"train_loss": 0.0015500241424888372, "global_step": 42410, "epoch": 356, "lr": 3.588032950491286e-05} +{"train_loss": 0.0006005392642691731, "global_step": 42411, "epoch": 356, "lr": 3.587820418330708e-05} +{"train_loss": 0.0013099578209221363, "global_step": 42412, "epoch": 356, "lr": 3.5876078889427936e-05} +{"train_loss": 0.0012616406893357635, "global_step": 42413, "epoch": 356, "lr": 3.58739536232796e-05} +{"train_loss": 0.00198083883151412, "global_step": 42414, "epoch": 356, "lr": 3.587182838486624e-05} +{"train_loss": 0.0018332621548324823, "global_step": 42415, "epoch": 356, "lr": 3.586970317419206e-05} +{"train_loss": 0.001088976627215743, "global_step": 42416, "epoch": 356, "lr": 3.5867577991261204e-05} +{"train_loss": 0.0014115961967036128, "global_step": 42417, "epoch": 356, "lr": 3.586545283607783e-05} +{"train_loss": 0.0008220928139053285, "global_step": 42418, "epoch": 356, "lr": 3.586332770864614e-05} +{"train_loss": 0.0011512503260746598, "global_step": 42419, "epoch": 356, "lr": 3.586120260897029e-05} +{"train_loss": 0.0013782345922663808, "global_step": 42420, "epoch": 356, "lr": 3.585907753705447e-05} +{"train_loss": 0.0013391029788181186, "global_step": 42421, "epoch": 356, "lr": 3.585695249290282e-05} +{"train_loss": 0.0006262617534957826, "global_step": 42422, "epoch": 356, "lr": 3.585482747651956e-05} +{"train_loss": 0.001868980354629457, "global_step": 42423, "epoch": 356, "lr": 3.585270248790883e-05} +{"train_loss": 0.0012971509713679552, "global_step": 42424, "epoch": 356, "lr": 3.585057752707478e-05} +{"train_loss": 0.0018287072889506817, "global_step": 42425, "epoch": 356, "lr": 3.584845259402164e-05} +{"train_loss": 0.0014393239980563521, "global_step": 42426, "epoch": 356, "lr": 3.584632768875352e-05} +{"train_loss": 0.0018405390437692404, "global_step": 42427, "epoch": 356, "lr": 3.584420281127465e-05} +{"train_loss": 0.0020559034310281277, "global_step": 42428, "epoch": 356, "lr": 3.584207796158918e-05} +{"train_loss": 0.0012330583995208144, "global_step": 42429, "epoch": 356, "lr": 3.5839953139701246e-05} +{"train_loss": 0.0013391458196565509, "global_step": 42430, "epoch": 356, "lr": 3.5837828345615085e-05} +{"train_loss": 0.0015685786493122578, "global_step": 42431, "epoch": 356, "lr": 3.5835703579334806e-05} +{"train_loss": 0.0012499490985646844, "global_step": 42432, "epoch": 356, "lr": 3.583357884086463e-05} +{"train_loss": 0.0010242715943604708, "global_step": 42433, "epoch": 356, "lr": 3.5831454130208695e-05} +{"train_loss": 0.0017909180605784059, "global_step": 42434, "epoch": 356, "lr": 3.582932944737121e-05} +{"train_loss": 0.0015551516553387046, "global_step": 42435, "epoch": 356, "lr": 3.582720479235631e-05} +{"train_loss": 0.0025166375562548637, "global_step": 42436, "epoch": 356, "lr": 3.582508016516817e-05} +{"train_loss": 0.001328695798292756, "global_step": 42437, "epoch": 356, "lr": 3.582295556581098e-05} +{"train_loss": 0.001667782198637724, "global_step": 42438, "epoch": 356, "lr": 3.582083099428889e-05} +{"train_loss": 0.0010822642361745238, "global_step": 42439, "epoch": 356, "lr": 3.58187064506061e-05} +{"train_loss": 0.0016685727750882506, "global_step": 42440, "epoch": 356, "lr": 3.581658193476675e-05} +{"train_loss": 0.001101861009374261, "global_step": 42441, "epoch": 356, "lr": 3.581445744677504e-05} +{"train_loss": 0.0013927818508818746, "global_step": 42442, "epoch": 356, "lr": 3.581233298663512e-05} +{"train_loss": 0.0016544874524697661, "global_step": 42443, "epoch": 356, "lr": 3.581020855435117e-05} +{"train_loss": 0.00271526793949306, "global_step": 42444, "epoch": 356, "lr": 3.5808084149927356e-05} +{"train_loss": 0.001711807562969625, "global_step": 42445, "epoch": 356, "lr": 3.580595977336785e-05} +{"train_loss": 0.0019692268688231707, "global_step": 42446, "epoch": 356, "lr": 3.5803835424676834e-05} +{"train_loss": 0.0008934269426390529, "global_step": 42447, "epoch": 356, "lr": 3.5801711103858474e-05} +{"train_loss": 0.0011986930621787906, "global_step": 42448, "epoch": 356, "lr": 3.5799586810916916e-05} +{"train_loss": 0.0007813585107214749, "global_step": 42449, "epoch": 356, "lr": 3.579746254585638e-05} +{"train_loss": 0.001374647836200893, "global_step": 42450, "epoch": 356, "lr": 3.579533830868098e-05} +{"train_loss": 0.0020147655159235, "global_step": 42451, "epoch": 356, "lr": 3.5793214099394945e-05} +{"train_loss": 0.0007884229999035597, "global_step": 42452, "epoch": 356, "lr": 3.579108991800239e-05} +{"train_loss": 0.0028516610618680716, "global_step": 42453, "epoch": 356, "lr": 3.578896576450754e-05} +{"train_loss": 0.0017104684375226498, "global_step": 42454, "epoch": 356, "lr": 3.5786841638914526e-05} +{"train_loss": 0.002044887049123645, "global_step": 42455, "epoch": 356, "lr": 3.578471754122752e-05} +{"train_loss": 0.0021138659212738276, "global_step": 42456, "epoch": 356, "lr": 3.578259347145072e-05} +{"train_loss": 0.0020618177950382233, "global_step": 42457, "epoch": 356, "lr": 3.5780469429588246e-05} +{"train_loss": 0.001726039918139577, "global_step": 42458, "epoch": 356, "lr": 3.577834541564434e-05} +{"train_loss": 0.0009722865652292967, "global_step": 42459, "epoch": 356, "lr": 3.5776221429623116e-05} +{"train_loss": 0.0007317608688026667, "global_step": 42460, "epoch": 356, "lr": 3.577409747152875e-05} +{"train_loss": 0.000852391414809972, "global_step": 42461, "epoch": 356, "lr": 3.5771973541365443e-05} +{"train_loss": 0.0017259857850149274, "global_step": 42462, "epoch": 356, "lr": 3.576984963913733e-05} +{"train_loss": 0.001349744969047606, "global_step": 42463, "epoch": 356, "lr": 3.5767725764848615e-05} +{"train_loss": 0.0014880808303132653, "global_step": 42464, "epoch": 356, "lr": 3.5765601918503424e-05} +{"train_loss": 0.0018280927324667573, "global_step": 42465, "epoch": 356, "lr": 3.5763478100105976e-05} +{"train_loss": 0.0025749378837645054, "global_step": 42466, "epoch": 356, "lr": 3.576135430966042e-05} +{"train_loss": 0.001171683776192367, "global_step": 42467, "epoch": 356, "lr": 3.575923054717091e-05} +{"train_loss": 0.0026725733187049627, "global_step": 42468, "epoch": 356, "lr": 3.575710681264164e-05} +{"train_loss": 0.002081233775243163, "global_step": 42469, "epoch": 356, "lr": 3.5754983106076754e-05} +{"train_loss": 0.0010506822727620602, "global_step": 42470, "epoch": 356, "lr": 3.5752859427480455e-05} +{"train_loss": 0.001748659648001194, "global_step": 42471, "epoch": 356, "lr": 3.575073577685687e-05} +{"train_loss": 0.0008685947395861149, "global_step": 42472, "epoch": 356, "lr": 3.574861215421022e-05} +{"train_loss": 0.0009832738433033228, "global_step": 42473, "epoch": 356, "lr": 3.574648855954465e-05} +{"train_loss": 0.0012289003934711218, "global_step": 42474, "epoch": 356, "lr": 3.57443649928643e-05} +{"train_loss": 0.0007139293593354523, "global_step": 42475, "epoch": 356, "lr": 3.574224145417338e-05} +{"train_loss": 0.00222073495388031, "global_step": 42476, "epoch": 356, "lr": 3.574011794347604e-05} +{"train_loss": 0.002796304179355502, "global_step": 42477, "epoch": 356, "lr": 3.5737994460776456e-05} +{"train_loss": 0.001266602659597993, "global_step": 42478, "epoch": 356, "lr": 3.5735871006078815e-05} +{"train_loss": 0.0017160344868898392, "global_step": 42479, "epoch": 356, "lr": 3.573374757938724e-05} +{"train_loss": 0.0016387247014790773, "global_step": 42480, "epoch": 356, "lr": 3.573162418070595e-05} +{"train_loss": 0.001174823148176074, "global_step": 42481, "epoch": 356, "lr": 3.5729500810039065e-05} +{"train_loss": 0.0014976836342810646, "global_step": 42482, "epoch": 356, "lr": 3.572737746739081e-05, "val_loss": 0.015813004225492477} +{"train_loss": 0.002288058865815401, "global_step": 42483, "epoch": 357, "lr": 3.5725254152765295e-05} +{"train_loss": 0.003079221351072192, "global_step": 42484, "epoch": 357, "lr": 3.572313086616675e-05} +{"train_loss": 0.0016613086918368936, "global_step": 42485, "epoch": 357, "lr": 3.572100760759931e-05} +{"train_loss": 0.0019247980089858174, "global_step": 42486, "epoch": 357, "lr": 3.571888437706712e-05} +{"train_loss": 0.0013270684285089374, "global_step": 42487, "epoch": 357, "lr": 3.5716761174574395e-05} +{"train_loss": 0.001590839005075395, "global_step": 42488, "epoch": 357, "lr": 3.571463800012527e-05} +{"train_loss": 0.003396541578695178, "global_step": 42489, "epoch": 357, "lr": 3.5712514853723944e-05} +{"train_loss": 0.001361351227387786, "global_step": 42490, "epoch": 357, "lr": 3.571039173537454e-05} +{"train_loss": 0.0016570748994126916, "global_step": 42491, "epoch": 357, "lr": 3.570826864508129e-05} +{"train_loss": 0.00207975460216403, "global_step": 42492, "epoch": 357, "lr": 3.570614558284831e-05} +{"train_loss": 0.0015733547043055296, "global_step": 42493, "epoch": 357, "lr": 3.5704022548679784e-05} +{"train_loss": 0.0017454181797802448, "global_step": 42494, "epoch": 357, "lr": 3.5701899542579885e-05} +{"train_loss": 0.0017663614125922322, "global_step": 42495, "epoch": 357, "lr": 3.569977656455278e-05} +{"train_loss": 0.0025035967119038105, "global_step": 42496, "epoch": 357, "lr": 3.5697653614602634e-05} +{"train_loss": 0.002071384573355317, "global_step": 42497, "epoch": 357, "lr": 3.5695530692733624e-05} +{"train_loss": 0.0016677273670211434, "global_step": 42498, "epoch": 357, "lr": 3.5693407798949894e-05} +{"train_loss": 0.0018372021149843931, "global_step": 42499, "epoch": 357, "lr": 3.5691284933255654e-05} +{"train_loss": 0.0014817493502050638, "global_step": 42500, "epoch": 357, "lr": 3.5689162095655024e-05} +{"train_loss": 0.0014498509699478745, "global_step": 42501, "epoch": 357, "lr": 3.568703928615221e-05} +{"train_loss": 0.0020299032330513, "global_step": 42502, "epoch": 357, "lr": 3.5684916504751356e-05} +{"train_loss": 0.0013888474786654115, "global_step": 42503, "epoch": 357, "lr": 3.5682793751456654e-05} +{"train_loss": 0.0019489368423819542, "global_step": 42504, "epoch": 357, "lr": 3.568067102627226e-05} +{"train_loss": 0.0008190312655642629, "global_step": 42505, "epoch": 357, "lr": 3.567854832920231e-05} +{"train_loss": 0.0018648295663297176, "global_step": 42506, "epoch": 357, "lr": 3.5676425660251026e-05} +{"train_loss": 0.002200944582000375, "global_step": 42507, "epoch": 357, "lr": 3.5674303019422526e-05} +{"train_loss": 0.00161206244956702, "global_step": 42508, "epoch": 357, "lr": 3.5672180406721036e-05} +{"train_loss": 0.0016216897638514638, "global_step": 42509, "epoch": 357, "lr": 3.567005782215066e-05} +{"train_loss": 0.002251881640404463, "global_step": 42510, "epoch": 357, "lr": 3.566793526571559e-05} +{"train_loss": 0.0013049913104623556, "global_step": 42511, "epoch": 357, "lr": 3.5665812737420026e-05} +{"train_loss": 0.0010703688021749258, "global_step": 42512, "epoch": 357, "lr": 3.566369023726808e-05} +{"train_loss": 0.0017089775064960122, "global_step": 42513, "epoch": 357, "lr": 3.566156776526397e-05} +{"train_loss": 0.0024846959859132767, "global_step": 42514, "epoch": 357, "lr": 3.565944532141182e-05} +{"train_loss": 0.0019695996306836605, "global_step": 42515, "epoch": 357, "lr": 3.565732290571583e-05} +{"train_loss": 0.0012500165030360222, "global_step": 42516, "epoch": 357, "lr": 3.565520051818017e-05} +{"train_loss": 0.0008933263598009944, "global_step": 42517, "epoch": 357, "lr": 3.565307815880895e-05} +{"train_loss": 0.0016947501571848989, "global_step": 42518, "epoch": 357, "lr": 3.5650955827606414e-05} +{"train_loss": 0.0012229388812556863, "global_step": 42519, "epoch": 357, "lr": 3.5648833524576666e-05} +{"train_loss": 0.0012840916169807315, "global_step": 42520, "epoch": 357, "lr": 3.564671124972392e-05} +{"train_loss": 0.0015155301662161946, "global_step": 42521, "epoch": 357, "lr": 3.564458900305231e-05} +{"train_loss": 0.0014115680241957307, "global_step": 42522, "epoch": 357, "lr": 3.564246678456603e-05} +{"train_loss": 0.00317192985676229, "global_step": 42523, "epoch": 357, "lr": 3.5640344594269234e-05} +{"train_loss": 0.0016966210678219795, "global_step": 42524, "epoch": 357, "lr": 3.563822243216607e-05} +{"train_loss": 0.002474233042448759, "global_step": 42525, "epoch": 357, "lr": 3.563610029826073e-05} +{"train_loss": 0.000738356844522059, "global_step": 42526, "epoch": 357, "lr": 3.563397819255737e-05} +{"train_loss": 0.0018881200812757015, "global_step": 42527, "epoch": 357, "lr": 3.5631856115060156e-05} +{"train_loss": 0.0013039789628237486, "global_step": 42528, "epoch": 357, "lr": 3.562973406577328e-05} +{"train_loss": 0.0017852602759376168, "global_step": 42529, "epoch": 357, "lr": 3.562761204470085e-05} +{"train_loss": 0.0015019631246104836, "global_step": 42530, "epoch": 357, "lr": 3.5625490051847096e-05} +{"train_loss": 0.0007117177592590451, "global_step": 42531, "epoch": 357, "lr": 3.5623368087216144e-05} +{"train_loss": 0.001255684532225132, "global_step": 42532, "epoch": 357, "lr": 3.562124615081218e-05} +{"train_loss": 0.0015216979663819075, "global_step": 42533, "epoch": 357, "lr": 3.561912424263935e-05} +{"train_loss": 0.0011396281188353896, "global_step": 42534, "epoch": 357, "lr": 3.561700236270186e-05} +{"train_loss": 0.0016705370508134365, "global_step": 42535, "epoch": 357, "lr": 3.561488051100383e-05} +{"train_loss": 0.0014183897292241454, "global_step": 42536, "epoch": 357, "lr": 3.561275868754944e-05} +{"train_loss": 0.001836644485592842, "global_step": 42537, "epoch": 357, "lr": 3.561063689234288e-05} +{"train_loss": 0.0017404996324330568, "global_step": 42538, "epoch": 357, "lr": 3.560851512538828e-05} +{"train_loss": 0.0012146938825026155, "global_step": 42539, "epoch": 357, "lr": 3.560639338668983e-05} +{"train_loss": 0.0008028758456930518, "global_step": 42540, "epoch": 357, "lr": 3.560427167625168e-05} +{"train_loss": 0.0008852691389620304, "global_step": 42541, "epoch": 357, "lr": 3.5602149994078026e-05} +{"train_loss": 0.001530709327198565, "global_step": 42542, "epoch": 357, "lr": 3.5600028340173e-05} +{"train_loss": 0.0024314885959029198, "global_step": 42543, "epoch": 357, "lr": 3.5597906714540775e-05} +{"train_loss": 0.0013478907058015466, "global_step": 42544, "epoch": 357, "lr": 3.559578511718552e-05} +{"train_loss": 0.0017545284936204553, "global_step": 42545, "epoch": 357, "lr": 3.55936635481114e-05} +{"train_loss": 0.001347381272353232, "global_step": 42546, "epoch": 357, "lr": 3.55915420073226e-05} +{"train_loss": 0.0012417938560247421, "global_step": 42547, "epoch": 357, "lr": 3.558942049482327e-05} +{"train_loss": 0.0023932841140776873, "global_step": 42548, "epoch": 357, "lr": 3.5587299010617546e-05} +{"train_loss": 0.0009368198225274682, "global_step": 42549, "epoch": 357, "lr": 3.558517755470965e-05} +{"train_loss": 0.0014307056553661823, "global_step": 42550, "epoch": 357, "lr": 3.5583056127103685e-05} +{"train_loss": 0.0017374152084812522, "global_step": 42551, "epoch": 357, "lr": 3.558093472780388e-05} +{"train_loss": 0.0017723515629768372, "global_step": 42552, "epoch": 357, "lr": 3.5578813356814345e-05} +{"train_loss": 0.0011898255906999111, "global_step": 42553, "epoch": 357, "lr": 3.557669201413929e-05} +{"train_loss": 0.0013479198096320033, "global_step": 42554, "epoch": 357, "lr": 3.5574570699782864e-05} +{"train_loss": 0.0011833009775727987, "global_step": 42555, "epoch": 357, "lr": 3.55724494137492e-05} +{"train_loss": 0.0009220996871590614, "global_step": 42556, "epoch": 357, "lr": 3.557032815604251e-05} +{"train_loss": 0.0009907437488436699, "global_step": 42557, "epoch": 357, "lr": 3.5568206926666925e-05} +{"train_loss": 0.0020662895403802395, "global_step": 42558, "epoch": 357, "lr": 3.556608572562664e-05} +{"train_loss": 0.0025403881445527077, "global_step": 42559, "epoch": 357, "lr": 3.556396455292579e-05} +{"train_loss": 0.0015717322239652276, "global_step": 42560, "epoch": 357, "lr": 3.556184340856855e-05} +{"train_loss": 0.0019655609503388405, "global_step": 42561, "epoch": 357, "lr": 3.555972229255911e-05} +{"train_loss": 0.0012265372788533568, "global_step": 42562, "epoch": 357, "lr": 3.555760120490159e-05} +{"train_loss": 0.0008304579532705247, "global_step": 42563, "epoch": 357, "lr": 3.5555480145600194e-05} +{"train_loss": 0.0014425177359953523, "global_step": 42564, "epoch": 357, "lr": 3.5553359114659054e-05} +{"train_loss": 0.0009094411507248878, "global_step": 42565, "epoch": 357, "lr": 3.5551238112082364e-05} +{"train_loss": 0.0016494406154379249, "global_step": 42566, "epoch": 357, "lr": 3.554911713787428e-05} +{"train_loss": 0.0014670111704617739, "global_step": 42567, "epoch": 357, "lr": 3.5546996192038936e-05} +{"train_loss": 0.001408070675097406, "global_step": 42568, "epoch": 357, "lr": 3.554487527458055e-05} +{"train_loss": 0.0018241895595565438, "global_step": 42569, "epoch": 357, "lr": 3.554275438550322e-05} +{"train_loss": 0.0007340278243646026, "global_step": 42570, "epoch": 357, "lr": 3.5540633524811186e-05} +{"train_loss": 0.001559795462526381, "global_step": 42571, "epoch": 357, "lr": 3.553851269250854e-05} +{"train_loss": 0.001015662681311369, "global_step": 42572, "epoch": 357, "lr": 3.5536391888599506e-05} +{"train_loss": 0.0018273154273629189, "global_step": 42573, "epoch": 357, "lr": 3.553427111308821e-05} +{"train_loss": 0.0010141055099666119, "global_step": 42574, "epoch": 357, "lr": 3.553215036597882e-05} +{"train_loss": 0.0008080474799498916, "global_step": 42575, "epoch": 357, "lr": 3.553002964727552e-05} +{"train_loss": 0.0013394012348726392, "global_step": 42576, "epoch": 357, "lr": 3.5527908956982456e-05} +{"train_loss": 0.0013069513952359557, "global_step": 42577, "epoch": 357, "lr": 3.552578829510379e-05} +{"train_loss": 0.0025345622561872005, "global_step": 42578, "epoch": 357, "lr": 3.552366766164371e-05} +{"train_loss": 0.0020237432327121496, "global_step": 42579, "epoch": 357, "lr": 3.552154705660634e-05} +{"train_loss": 0.0011235261335968971, "global_step": 42580, "epoch": 357, "lr": 3.551942647999589e-05} +{"train_loss": 0.0020105119328945875, "global_step": 42581, "epoch": 357, "lr": 3.5517305931816466e-05} +{"train_loss": 0.0015713005559518933, "global_step": 42582, "epoch": 357, "lr": 3.55151854120723e-05} +{"train_loss": 0.0019326788606122136, "global_step": 42583, "epoch": 357, "lr": 3.551306492076749e-05} +{"train_loss": 0.0013677281094715, "global_step": 42584, "epoch": 357, "lr": 3.5510944457906255e-05} +{"train_loss": 0.0012185800587758422, "global_step": 42585, "epoch": 357, "lr": 3.550882402349272e-05} +{"train_loss": 0.001486326102167368, "global_step": 42586, "epoch": 357, "lr": 3.5506703617531056e-05} +{"train_loss": 0.0010993073228746653, "global_step": 42587, "epoch": 357, "lr": 3.5504583240025446e-05} +{"train_loss": 0.0011826471891254187, "global_step": 42588, "epoch": 357, "lr": 3.550246289098002e-05} +{"train_loss": 0.0016488664550706744, "global_step": 42589, "epoch": 357, "lr": 3.5500342570398984e-05} +{"train_loss": 0.0013043849030509591, "global_step": 42590, "epoch": 357, "lr": 3.549822227828644e-05} +{"train_loss": 0.000953255279455334, "global_step": 42591, "epoch": 357, "lr": 3.549610201464662e-05} +{"train_loss": 0.0009541325271129608, "global_step": 42592, "epoch": 357, "lr": 3.5493981779483646e-05} +{"train_loss": 0.0008184032049030066, "global_step": 42593, "epoch": 357, "lr": 3.549186157280168e-05} +{"train_loss": 0.0013839640887454152, "global_step": 42594, "epoch": 357, "lr": 3.54897413946049e-05} +{"train_loss": 0.0015726586570963264, "global_step": 42595, "epoch": 357, "lr": 3.548762124489745e-05} +{"train_loss": 0.0007472708239220083, "global_step": 42596, "epoch": 357, "lr": 3.548550112368352e-05} +{"train_loss": 0.0015722881071269512, "global_step": 42597, "epoch": 357, "lr": 3.548338103096727e-05} +{"train_loss": 0.0023097614757716656, "global_step": 42598, "epoch": 357, "lr": 3.548126096675282e-05} +{"train_loss": 0.0008972107898443937, "global_step": 42599, "epoch": 357, "lr": 3.547914093104439e-05} +{"train_loss": 0.0011600533034652472, "global_step": 42600, "epoch": 357, "lr": 3.54770209238461e-05} +{"train_loss": 0.0015582295898700273, "global_step": 42601, "epoch": 357, "lr": 3.547490094516213e-05, "val_loss": 0.01901710219681263} +{"train_loss": 0.0008074236684478819, "global_step": 42602, "epoch": 358, "lr": 3.5472780994996636e-05} +{"train_loss": 0.0008729794644750655, "global_step": 42603, "epoch": 358, "lr": 3.54706610733538e-05} +{"train_loss": 0.0014419227372854948, "global_step": 42604, "epoch": 358, "lr": 3.546854118023777e-05} +{"train_loss": 0.002540087327361107, "global_step": 42605, "epoch": 358, "lr": 3.5466421315652676e-05} +{"train_loss": 0.0011653552064672112, "global_step": 42606, "epoch": 358, "lr": 3.546430147960275e-05} +{"train_loss": 0.0008512617205269635, "global_step": 42607, "epoch": 358, "lr": 3.546218167209208e-05} +{"train_loss": 0.0020066990982741117, "global_step": 42608, "epoch": 358, "lr": 3.546006189312487e-05} +{"train_loss": 0.0021503493189811707, "global_step": 42609, "epoch": 358, "lr": 3.545794214270529e-05} +{"train_loss": 0.001020158058963716, "global_step": 42610, "epoch": 358, "lr": 3.545582242083748e-05} +{"train_loss": 0.0016887830570340157, "global_step": 42611, "epoch": 358, "lr": 3.545370272752562e-05} +{"train_loss": 0.000989595428109169, "global_step": 42612, "epoch": 358, "lr": 3.545158306277384e-05} +{"train_loss": 0.0022296893876045942, "global_step": 42613, "epoch": 358, "lr": 3.544946342658634e-05} +{"train_loss": 0.0012906125048175454, "global_step": 42614, "epoch": 358, "lr": 3.544734381896725e-05} +{"train_loss": 0.002530689351260662, "global_step": 42615, "epoch": 358, "lr": 3.544522423992076e-05} +{"train_loss": 0.001298979390412569, "global_step": 42616, "epoch": 358, "lr": 3.544310468945102e-05} +{"train_loss": 0.0016154887853190303, "global_step": 42617, "epoch": 358, "lr": 3.5440985167562166e-05} +{"train_loss": 0.002610970987007022, "global_step": 42618, "epoch": 358, "lr": 3.54388656742584e-05} +{"train_loss": 0.0007928262930363417, "global_step": 42619, "epoch": 358, "lr": 3.543674620954386e-05} +{"train_loss": 0.0009462079033255577, "global_step": 42620, "epoch": 358, "lr": 3.543462677342272e-05} +{"train_loss": 0.0016920104390010238, "global_step": 42621, "epoch": 358, "lr": 3.543250736589911e-05} +{"train_loss": 0.0007996362983249128, "global_step": 42622, "epoch": 358, "lr": 3.543038798697725e-05} +{"train_loss": 0.0012865298194810748, "global_step": 42623, "epoch": 358, "lr": 3.542826863666124e-05} +{"train_loss": 0.0015851021744310856, "global_step": 42624, "epoch": 358, "lr": 3.542614931495528e-05} +{"train_loss": 0.001249984372407198, "global_step": 42625, "epoch": 358, "lr": 3.542403002186352e-05} +{"train_loss": 0.0012514402624219656, "global_step": 42626, "epoch": 358, "lr": 3.542191075739012e-05} +{"train_loss": 0.0025369718205183744, "global_step": 42627, "epoch": 358, "lr": 3.541979152153923e-05} +{"train_loss": 0.0009993771091103554, "global_step": 42628, "epoch": 358, "lr": 3.541767231431504e-05} +{"train_loss": 0.0008358414052054286, "global_step": 42629, "epoch": 358, "lr": 3.5415553135721666e-05} +{"train_loss": 0.001126465736888349, "global_step": 42630, "epoch": 358, "lr": 3.541343398576332e-05} +{"train_loss": 0.0020620962604880333, "global_step": 42631, "epoch": 358, "lr": 3.5411314864444125e-05} +{"train_loss": 0.001853373134508729, "global_step": 42632, "epoch": 358, "lr": 3.540919577176827e-05} +{"train_loss": 0.0020401268266141415, "global_step": 42633, "epoch": 358, "lr": 3.540707670773987e-05} +{"train_loss": 0.0015388060128316283, "global_step": 42634, "epoch": 358, "lr": 3.5404957672363145e-05} +{"train_loss": 0.0015042356681078672, "global_step": 42635, "epoch": 358, "lr": 3.540283866564223e-05} +{"train_loss": 0.0008582450682297349, "global_step": 42636, "epoch": 358, "lr": 3.540071968758125e-05} +{"train_loss": 0.001353320898488164, "global_step": 42637, "epoch": 358, "lr": 3.5398600738184426e-05} +{"train_loss": 0.0014997386606410146, "global_step": 42638, "epoch": 358, "lr": 3.539648181745587e-05} +{"train_loss": 0.0009009135537780821, "global_step": 42639, "epoch": 358, "lr": 3.539436292539978e-05} +{"train_loss": 0.0017019339138641953, "global_step": 42640, "epoch": 358, "lr": 3.539224406202028e-05} +{"train_loss": 0.0017137133982032537, "global_step": 42641, "epoch": 358, "lr": 3.5390125227321566e-05} +{"train_loss": 0.0013991754967719316, "global_step": 42642, "epoch": 358, "lr": 3.538800642130777e-05} +{"train_loss": 0.002099580131471157, "global_step": 42643, "epoch": 358, "lr": 3.538588764398305e-05} +{"train_loss": 0.0009806629968807101, "global_step": 42644, "epoch": 358, "lr": 3.53837688953516e-05} +{"train_loss": 0.0013938224874436855, "global_step": 42645, "epoch": 358, "lr": 3.538165017541754e-05} +{"train_loss": 0.0021832173224538565, "global_step": 42646, "epoch": 358, "lr": 3.537953148418507e-05} +{"train_loss": 0.0010255135130137205, "global_step": 42647, "epoch": 358, "lr": 3.537741282165832e-05} +{"train_loss": 0.0018625055672600865, "global_step": 42648, "epoch": 358, "lr": 3.5375294187841445e-05} +{"train_loss": 0.001731425174511969, "global_step": 42649, "epoch": 358, "lr": 3.537317558273864e-05} +{"train_loss": 0.0009574164287187159, "global_step": 42650, "epoch": 358, "lr": 3.5371057006354014e-05} +{"train_loss": 0.0023866326082497835, "global_step": 42651, "epoch": 358, "lr": 3.536893845869178e-05} +{"train_loss": 0.0012978781014680862, "global_step": 42652, "epoch": 358, "lr": 3.5366819939756045e-05} +{"train_loss": 0.0011504426365718246, "global_step": 42653, "epoch": 358, "lr": 3.536470144955102e-05} +{"train_loss": 0.0013494460145011544, "global_step": 42654, "epoch": 358, "lr": 3.5362582988080836e-05} +{"train_loss": 0.0013968042330816388, "global_step": 42655, "epoch": 358, "lr": 3.536046455534965e-05} +{"train_loss": 0.001239212229847908, "global_step": 42656, "epoch": 358, "lr": 3.5358346151361626e-05} +{"train_loss": 0.001610698876902461, "global_step": 42657, "epoch": 358, "lr": 3.5356227776120934e-05} +{"train_loss": 0.0009228172712028027, "global_step": 42658, "epoch": 358, "lr": 3.535410942963172e-05} +{"train_loss": 0.0018727221759036183, "global_step": 42659, "epoch": 358, "lr": 3.535199111189814e-05} +{"train_loss": 0.0017115639057010412, "global_step": 42660, "epoch": 358, "lr": 3.5349872822924365e-05} +{"train_loss": 0.0020163157023489475, "global_step": 42661, "epoch": 358, "lr": 3.534775456271456e-05} +{"train_loss": 0.0015153901185840368, "global_step": 42662, "epoch": 358, "lr": 3.534563633127286e-05} +{"train_loss": 0.00244007701985538, "global_step": 42663, "epoch": 358, "lr": 3.534351812860345e-05} +{"train_loss": 0.0021359657403081656, "global_step": 42664, "epoch": 358, "lr": 3.534139995471046e-05} +{"train_loss": 0.0010654156794771552, "global_step": 42665, "epoch": 358, "lr": 3.5339281809598086e-05} +{"train_loss": 0.0011372987646609545, "global_step": 42666, "epoch": 358, "lr": 3.5337163693270456e-05} +{"train_loss": 0.0018320793751627207, "global_step": 42667, "epoch": 358, "lr": 3.533504560573173e-05} +{"train_loss": 0.0017972422065213323, "global_step": 42668, "epoch": 358, "lr": 3.53329275469861e-05} +{"train_loss": 0.0019246479496359825, "global_step": 42669, "epoch": 358, "lr": 3.533080951703767e-05} +{"train_loss": 0.0008397256024181843, "global_step": 42670, "epoch": 358, "lr": 3.532869151589064e-05} +{"train_loss": 0.001218501478433609, "global_step": 42671, "epoch": 358, "lr": 3.5326573543549154e-05} +{"train_loss": 0.0014551810454577208, "global_step": 42672, "epoch": 358, "lr": 3.532445560001738e-05} +{"train_loss": 0.0017277724109590054, "global_step": 42673, "epoch": 358, "lr": 3.532233768529947e-05} +{"train_loss": 0.0021932432428002357, "global_step": 42674, "epoch": 358, "lr": 3.532021979939958e-05} +{"train_loss": 0.0014165672473609447, "global_step": 42675, "epoch": 358, "lr": 3.531810194232186e-05} +{"train_loss": 0.0011978220427408814, "global_step": 42676, "epoch": 358, "lr": 3.531598411407049e-05} +{"train_loss": 0.00150571099948138, "global_step": 42677, "epoch": 358, "lr": 3.5313866314649614e-05} +{"train_loss": 0.0028036017902195454, "global_step": 42678, "epoch": 358, "lr": 3.531174854406338e-05} +{"train_loss": 0.0010434659197926521, "global_step": 42679, "epoch": 358, "lr": 3.530963080231597e-05} +{"train_loss": 0.0019564898684620857, "global_step": 42680, "epoch": 358, "lr": 3.530751308941155e-05} +{"train_loss": 0.0011237176368013024, "global_step": 42681, "epoch": 358, "lr": 3.5305395405354226e-05} +{"train_loss": 0.002090824767947197, "global_step": 42682, "epoch": 358, "lr": 3.530327775014821e-05} +{"train_loss": 0.0023507471196353436, "global_step": 42683, "epoch": 358, "lr": 3.5301160123797617e-05} +{"train_loss": 0.0015642771031707525, "global_step": 42684, "epoch": 358, "lr": 3.529904252630665e-05} +{"train_loss": 0.0012238890631124377, "global_step": 42685, "epoch": 358, "lr": 3.529692495767944e-05} +{"train_loss": 0.0015380694530904293, "global_step": 42686, "epoch": 358, "lr": 3.5294807417920126e-05} +{"train_loss": 0.0016973235178738832, "global_step": 42687, "epoch": 358, "lr": 3.5292689907032904e-05} +{"train_loss": 0.0018358587985858321, "global_step": 42688, "epoch": 358, "lr": 3.5290572425021896e-05} +{"train_loss": 0.0011388068087399006, "global_step": 42689, "epoch": 358, "lr": 3.52884549718913e-05} +{"train_loss": 0.0019299720879644156, "global_step": 42690, "epoch": 358, "lr": 3.528633754764523e-05} +{"train_loss": 0.001888237427920103, "global_step": 42691, "epoch": 358, "lr": 3.5284220152287875e-05} +{"train_loss": 0.0019394841510802507, "global_step": 42692, "epoch": 358, "lr": 3.528210278582339e-05} +{"train_loss": 0.001913626678287983, "global_step": 42693, "epoch": 358, "lr": 3.52799854482559e-05} +{"train_loss": 0.0012606768868863583, "global_step": 42694, "epoch": 358, "lr": 3.527786813958962e-05} +{"train_loss": 0.0015211055288091302, "global_step": 42695, "epoch": 358, "lr": 3.5275750859828635e-05} +{"train_loss": 0.0014566252939403057, "global_step": 42696, "epoch": 358, "lr": 3.5273633608977174e-05} +{"train_loss": 0.0027348001021891832, "global_step": 42697, "epoch": 358, "lr": 3.527151638703935e-05} +{"train_loss": 0.001855766517110169, "global_step": 42698, "epoch": 358, "lr": 3.526939919401932e-05} +{"train_loss": 0.0018803555285558105, "global_step": 42699, "epoch": 358, "lr": 3.526728202992127e-05} +{"train_loss": 0.0021616320591419935, "global_step": 42700, "epoch": 358, "lr": 3.5265164894749306e-05} +{"train_loss": 0.0007809795206412673, "global_step": 42701, "epoch": 358, "lr": 3.5263047788507646e-05} +{"train_loss": 0.0008951498894020915, "global_step": 42702, "epoch": 358, "lr": 3.5260930711200394e-05} +{"train_loss": 0.0017718055751174688, "global_step": 42703, "epoch": 358, "lr": 3.525881366283176e-05} +{"train_loss": 0.0008404138498008251, "global_step": 42704, "epoch": 358, "lr": 3.5256696643405854e-05} +{"train_loss": 0.0012448380002751946, "global_step": 42705, "epoch": 358, "lr": 3.525457965292684e-05} +{"train_loss": 0.0017890395829454064, "global_step": 42706, "epoch": 358, "lr": 3.525246269139889e-05} +{"train_loss": 0.0015439619310200214, "global_step": 42707, "epoch": 358, "lr": 3.5250345758826155e-05} +{"train_loss": 0.0011173373786732554, "global_step": 42708, "epoch": 358, "lr": 3.524822885521279e-05} +{"train_loss": 0.0018863935256376863, "global_step": 42709, "epoch": 358, "lr": 3.5246111980562946e-05} +{"train_loss": 0.0024887770414352417, "global_step": 42710, "epoch": 358, "lr": 3.524399513488079e-05} +{"train_loss": 0.0015028991037979722, "global_step": 42711, "epoch": 358, "lr": 3.524187831817048e-05} +{"train_loss": 0.0014722885098308325, "global_step": 42712, "epoch": 358, "lr": 3.5239761530436156e-05} +{"train_loss": 0.002173139015212655, "global_step": 42713, "epoch": 358, "lr": 3.5237644771682e-05} +{"train_loss": 0.0015270757721737027, "global_step": 42714, "epoch": 358, "lr": 3.523552804191213e-05} +{"train_loss": 0.001908529899083078, "global_step": 42715, "epoch": 358, "lr": 3.523341134113073e-05} +{"train_loss": 0.0016569900326430798, "global_step": 42716, "epoch": 358, "lr": 3.523129466934196e-05} +{"train_loss": 0.0027647295501083136, "global_step": 42717, "epoch": 358, "lr": 3.522917802654995e-05} +{"train_loss": 0.001986646093428135, "global_step": 42718, "epoch": 358, "lr": 3.522706141275889e-05} +{"train_loss": 0.0010976922931149602, "global_step": 42719, "epoch": 358, "lr": 3.5224944827972886e-05} +{"train_loss": 0.0015819254957389931, "global_step": 42720, "epoch": 358, "lr": 3.522282827219615e-05, "val_loss": 0.02346619963645935} +{"train_loss": 0.0006815484375692904, "global_step": 42721, "epoch": 359, "lr": 3.52207117454328e-05} +{"train_loss": 0.0014463983243331313, "global_step": 42722, "epoch": 359, "lr": 3.521859524768701e-05} +{"train_loss": 0.0017098599346354604, "global_step": 42723, "epoch": 359, "lr": 3.5216478778962924e-05} +{"train_loss": 0.0020816593896597624, "global_step": 42724, "epoch": 359, "lr": 3.5214362339264704e-05} +{"train_loss": 0.0007658967515453696, "global_step": 42725, "epoch": 359, "lr": 3.521224592859651e-05} +{"train_loss": 0.001545338542200625, "global_step": 42726, "epoch": 359, "lr": 3.521012954696248e-05} +{"train_loss": 0.002330245217308402, "global_step": 42727, "epoch": 359, "lr": 3.520801319436679e-05} +{"train_loss": 0.0020575313828885555, "global_step": 42728, "epoch": 359, "lr": 3.520589687081357e-05} +{"train_loss": 0.0016219214303418994, "global_step": 42729, "epoch": 359, "lr": 3.520378057630701e-05} +{"train_loss": 0.0013261031126603484, "global_step": 42730, "epoch": 359, "lr": 3.520166431085126e-05} +{"train_loss": 0.00144309236202389, "global_step": 42731, "epoch": 359, "lr": 3.519954807445042e-05} +{"train_loss": 0.0012088781222701073, "global_step": 42732, "epoch": 359, "lr": 3.519743186710872e-05} +{"train_loss": 0.0013406849466264248, "global_step": 42733, "epoch": 359, "lr": 3.519531568883025e-05} +{"train_loss": 0.0017047850415110588, "global_step": 42734, "epoch": 359, "lr": 3.519319953961922e-05} +{"train_loss": 0.0008298613829538226, "global_step": 42735, "epoch": 359, "lr": 3.5191083419479775e-05} +{"train_loss": 0.0007929228595457971, "global_step": 42736, "epoch": 359, "lr": 3.518896732841602e-05} +{"train_loss": 0.0016284496523439884, "global_step": 42737, "epoch": 359, "lr": 3.518685126643217e-05} +{"train_loss": 0.002896828344091773, "global_step": 42738, "epoch": 359, "lr": 3.518473523353234e-05} +{"train_loss": 0.0016691400669515133, "global_step": 42739, "epoch": 359, "lr": 3.518261922972071e-05} +{"train_loss": 0.0008789294515736401, "global_step": 42740, "epoch": 359, "lr": 3.5180503255001405e-05} +{"train_loss": 0.0021468892227858305, "global_step": 42741, "epoch": 359, "lr": 3.517838730937862e-05} +{"train_loss": 0.0018834462389349937, "global_step": 42742, "epoch": 359, "lr": 3.517627139285649e-05} +{"train_loss": 0.0011292857816442847, "global_step": 42743, "epoch": 359, "lr": 3.5174155505439145e-05} +{"train_loss": 0.001735761179588735, "global_step": 42744, "epoch": 359, "lr": 3.517203964713078e-05} +{"train_loss": 0.002101713325828314, "global_step": 42745, "epoch": 359, "lr": 3.516992381793552e-05} +{"train_loss": 0.0021121802274137735, "global_step": 42746, "epoch": 359, "lr": 3.516780801785755e-05} +{"train_loss": 0.0014662131434306502, "global_step": 42747, "epoch": 359, "lr": 3.5165692246900976e-05} +{"train_loss": 0.0015021833823993802, "global_step": 42748, "epoch": 359, "lr": 3.516357650507e-05} +{"train_loss": 0.0009372971835546196, "global_step": 42749, "epoch": 359, "lr": 3.5161460792368764e-05} +{"train_loss": 0.0019775673281401396, "global_step": 42750, "epoch": 359, "lr": 3.515934510880139e-05} +{"train_loss": 0.0012483648024499416, "global_step": 42751, "epoch": 359, "lr": 3.515722945437209e-05} +{"train_loss": 0.0014417845522984862, "global_step": 42752, "epoch": 359, "lr": 3.515511382908494e-05} +{"train_loss": 0.0010168426670134068, "global_step": 42753, "epoch": 359, "lr": 3.515299823294418e-05} +{"train_loss": 0.0017726882360875607, "global_step": 42754, "epoch": 359, "lr": 3.51508826659539e-05} +{"train_loss": 0.0012786391889676452, "global_step": 42755, "epoch": 359, "lr": 3.5148767128118274e-05} +{"train_loss": 0.0020624157041311264, "global_step": 42756, "epoch": 359, "lr": 3.514665161944146e-05} +{"train_loss": 0.0025936563033610582, "global_step": 42757, "epoch": 359, "lr": 3.514453613992761e-05} +{"train_loss": 0.0014249228406697512, "global_step": 42758, "epoch": 359, "lr": 3.514242068958088e-05} +{"train_loss": 0.001669611083343625, "global_step": 42759, "epoch": 359, "lr": 3.5140305268405415e-05} +{"train_loss": 0.001793410861864686, "global_step": 42760, "epoch": 359, "lr": 3.513818987640537e-05} +{"train_loss": 0.0007158295484259725, "global_step": 42761, "epoch": 359, "lr": 3.5136074513584915e-05} +{"train_loss": 0.0011591619113460183, "global_step": 42762, "epoch": 359, "lr": 3.513395917994817e-05} +{"train_loss": 0.0010453989962115884, "global_step": 42763, "epoch": 359, "lr": 3.5131843875499325e-05} +{"train_loss": 0.004540346562862396, "global_step": 42764, "epoch": 359, "lr": 3.51297286002425e-05} +{"train_loss": 0.0014546260936185718, "global_step": 42765, "epoch": 359, "lr": 3.512761335418189e-05} +{"train_loss": 0.0012446033069863915, "global_step": 42766, "epoch": 359, "lr": 3.5125498137321614e-05} +{"train_loss": 0.0015028977068141103, "global_step": 42767, "epoch": 359, "lr": 3.512338294966581e-05} +{"train_loss": 0.002806855831295252, "global_step": 42768, "epoch": 359, "lr": 3.512126779121868e-05} +{"train_loss": 0.0016920394264161587, "global_step": 42769, "epoch": 359, "lr": 3.5119152661984325e-05} +{"train_loss": 0.0017294707940891385, "global_step": 42770, "epoch": 359, "lr": 3.5117037561966954e-05} +{"train_loss": 0.0026235056575387716, "global_step": 42771, "epoch": 359, "lr": 3.511492249117067e-05} +{"train_loss": 0.0013063607038930058, "global_step": 42772, "epoch": 359, "lr": 3.5112807449599647e-05} +{"train_loss": 0.0025262529961764812, "global_step": 42773, "epoch": 359, "lr": 3.511069243725804e-05} +{"train_loss": 0.001690608449280262, "global_step": 42774, "epoch": 359, "lr": 3.5108577454150005e-05} +{"train_loss": 0.0015763536794111133, "global_step": 42775, "epoch": 359, "lr": 3.510646250027968e-05} +{"train_loss": 0.0017881218809634447, "global_step": 42776, "epoch": 359, "lr": 3.510434757565121e-05} +{"train_loss": 0.0023210428189486265, "global_step": 42777, "epoch": 359, "lr": 3.510223268026879e-05} +{"train_loss": 0.001109099481254816, "global_step": 42778, "epoch": 359, "lr": 3.510011781413651e-05} +{"train_loss": 0.0017555055674165487, "global_step": 42779, "epoch": 359, "lr": 3.509800297725859e-05} +{"train_loss": 0.0023232572712004185, "global_step": 42780, "epoch": 359, "lr": 3.509588816963915e-05} +{"train_loss": 0.0017900855746120214, "global_step": 42781, "epoch": 359, "lr": 3.5093773391282315e-05} +{"train_loss": 0.001755512785166502, "global_step": 42782, "epoch": 359, "lr": 3.5091658642192286e-05} +{"train_loss": 0.0012889911886304617, "global_step": 42783, "epoch": 359, "lr": 3.5089543922373175e-05} +{"train_loss": 0.0020224093459546566, "global_step": 42784, "epoch": 359, "lr": 3.5087429231829175e-05} +{"train_loss": 0.001518906676210463, "global_step": 42785, "epoch": 359, "lr": 3.50853145705644e-05} +{"train_loss": 0.0011897593503817916, "global_step": 42786, "epoch": 359, "lr": 3.508319993858301e-05} +{"train_loss": 0.001933046616613865, "global_step": 42787, "epoch": 359, "lr": 3.508108533588917e-05} +{"train_loss": 0.0009384425939060748, "global_step": 42788, "epoch": 359, "lr": 3.5078970762487016e-05} +{"train_loss": 0.0016365536721423268, "global_step": 42789, "epoch": 359, "lr": 3.507685621838072e-05} +{"train_loss": 0.0019583560060709715, "global_step": 42790, "epoch": 359, "lr": 3.507474170357442e-05} +{"train_loss": 0.0014425126137211919, "global_step": 42791, "epoch": 359, "lr": 3.5072627218072265e-05} +{"train_loss": 0.0021821779664605856, "global_step": 42792, "epoch": 359, "lr": 3.507051276187843e-05} +{"train_loss": 0.0014408425195142627, "global_step": 42793, "epoch": 359, "lr": 3.5068398334997023e-05} +{"train_loss": 0.0016868934035301208, "global_step": 42794, "epoch": 359, "lr": 3.506628393743224e-05} +{"train_loss": 0.0010335637489333749, "global_step": 42795, "epoch": 359, "lr": 3.50641695691882e-05} +{"train_loss": 0.002180964220315218, "global_step": 42796, "epoch": 359, "lr": 3.506205523026908e-05} +{"train_loss": 0.001322999713011086, "global_step": 42797, "epoch": 359, "lr": 3.5059940920679e-05} +{"train_loss": 0.0022066954988986254, "global_step": 42798, "epoch": 359, "lr": 3.5057826640422156e-05} +{"train_loss": 0.0018616766901686788, "global_step": 42799, "epoch": 359, "lr": 3.505571238950266e-05} +{"train_loss": 0.0020269311498850584, "global_step": 42800, "epoch": 359, "lr": 3.505359816792467e-05} +{"train_loss": 0.0009910992812365294, "global_step": 42801, "epoch": 359, "lr": 3.5051483975692354e-05} +{"train_loss": 0.0022226886358112097, "global_step": 42802, "epoch": 359, "lr": 3.504936981280983e-05} +{"train_loss": 0.0022554644383490086, "global_step": 42803, "epoch": 359, "lr": 3.50472556792813e-05} +{"train_loss": 0.0013500034110620618, "global_step": 42804, "epoch": 359, "lr": 3.5045141575110875e-05} +{"train_loss": 0.001265261904336512, "global_step": 42805, "epoch": 359, "lr": 3.504302750030272e-05} +{"train_loss": 0.0011773748556151986, "global_step": 42806, "epoch": 359, "lr": 3.504091345486097e-05} +{"train_loss": 0.002145555568858981, "global_step": 42807, "epoch": 359, "lr": 3.503879943878979e-05} +{"train_loss": 0.0010832732077687979, "global_step": 42808, "epoch": 359, "lr": 3.503668545209334e-05} +{"train_loss": 0.0012411486823111773, "global_step": 42809, "epoch": 359, "lr": 3.5034571494775755e-05} +{"train_loss": 0.002497273962944746, "global_step": 42810, "epoch": 359, "lr": 3.503245756684119e-05} +{"train_loss": 0.0030427768360823393, "global_step": 42811, "epoch": 359, "lr": 3.50303436682938e-05} +{"train_loss": 0.001215522876009345, "global_step": 42812, "epoch": 359, "lr": 3.502822979913772e-05} +{"train_loss": 0.0022498024627566338, "global_step": 42813, "epoch": 359, "lr": 3.5026115959377124e-05} +{"train_loss": 0.0019798059947788715, "global_step": 42814, "epoch": 359, "lr": 3.5024002149016136e-05} +{"train_loss": 0.0011988896876573563, "global_step": 42815, "epoch": 359, "lr": 3.502188836805893e-05} +{"train_loss": 0.0015931843081489205, "global_step": 42816, "epoch": 359, "lr": 3.501977461650965e-05} +{"train_loss": 0.0015751656610518694, "global_step": 42817, "epoch": 359, "lr": 3.5017660894372425e-05} +{"train_loss": 0.0017682636389508843, "global_step": 42818, "epoch": 359, "lr": 3.5015547201651445e-05} +{"train_loss": 0.0011422120733186603, "global_step": 42819, "epoch": 359, "lr": 3.5013433538350813e-05} +{"train_loss": 0.0036096074618399143, "global_step": 42820, "epoch": 359, "lr": 3.5011319904474724e-05} +{"train_loss": 0.0019440141040831804, "global_step": 42821, "epoch": 359, "lr": 3.500920630002729e-05} +{"train_loss": 0.0015426601748913527, "global_step": 42822, "epoch": 359, "lr": 3.500709272501269e-05} +{"train_loss": 0.0019778681453317404, "global_step": 42823, "epoch": 359, "lr": 3.5004979179435063e-05} +{"train_loss": 0.002193830441683531, "global_step": 42824, "epoch": 359, "lr": 3.500286566329853e-05} +{"train_loss": 0.0013868841342628002, "global_step": 42825, "epoch": 359, "lr": 3.5000752176607305e-05} +{"train_loss": 0.002166944555938244, "global_step": 42826, "epoch": 359, "lr": 3.4998638719365476e-05} +{"train_loss": 0.002387461019679904, "global_step": 42827, "epoch": 359, "lr": 3.499652529157723e-05} +{"train_loss": 0.0015540940221399069, "global_step": 42828, "epoch": 359, "lr": 3.4994411893246694e-05} +{"train_loss": 0.001639405032619834, "global_step": 42829, "epoch": 359, "lr": 3.499229852437804e-05} +{"train_loss": 0.0026030384469777346, "global_step": 42830, "epoch": 359, "lr": 3.499018518497541e-05} +{"train_loss": 0.0011095611844211817, "global_step": 42831, "epoch": 359, "lr": 3.498807187504292e-05} +{"train_loss": 0.002719807904213667, "global_step": 42832, "epoch": 359, "lr": 3.498595859458478e-05} +{"train_loss": 0.001726491842418909, "global_step": 42833, "epoch": 359, "lr": 3.498384534360507e-05} +{"train_loss": 0.0012602917850017548, "global_step": 42834, "epoch": 359, "lr": 3.4981732122108004e-05} +{"train_loss": 0.0011403851676732302, "global_step": 42835, "epoch": 359, "lr": 3.49796189300977e-05} +{"train_loss": 0.0013554544420912862, "global_step": 42836, "epoch": 359, "lr": 3.49775057675783e-05} +{"train_loss": 0.001874455832876265, "global_step": 42837, "epoch": 359, "lr": 3.497539263455397e-05} +{"train_loss": 0.0015006928006187081, "global_step": 42838, "epoch": 359, "lr": 3.4973279531028836e-05} +{"train_loss": 0.0017038312884431112, "global_step": 42839, "epoch": 359, "lr": 3.4971166457007074e-05, "val_loss": 0.016052791848778725} +{"train_loss": 0.0020913619082421064, "global_step": 42840, "epoch": 360, "lr": 3.4969053412492816e-05} +{"train_loss": 0.0015849594492465258, "global_step": 42841, "epoch": 360, "lr": 3.496694039749022e-05} +{"train_loss": 0.001519805402494967, "global_step": 42842, "epoch": 360, "lr": 3.4964827412003434e-05} +{"train_loss": 0.001916117500513792, "global_step": 42843, "epoch": 360, "lr": 3.496271445603659e-05} +{"train_loss": 0.0015013631200417876, "global_step": 42844, "epoch": 360, "lr": 3.4960601529593874e-05} +{"train_loss": 0.0008880587411113083, "global_step": 42845, "epoch": 360, "lr": 3.4958488632679376e-05} +{"train_loss": 0.0009420682326890528, "global_step": 42846, "epoch": 360, "lr": 3.495637576529731e-05} +{"train_loss": 0.0008982888539321721, "global_step": 42847, "epoch": 360, "lr": 3.495426292745177e-05} +{"train_loss": 0.001592270564287901, "global_step": 42848, "epoch": 360, "lr": 3.4952150119146945e-05} +{"train_loss": 0.00159274332690984, "global_step": 42849, "epoch": 360, "lr": 3.495003734038697e-05} +{"train_loss": 0.0011055913055315614, "global_step": 42850, "epoch": 360, "lr": 3.494792459117597e-05} +{"train_loss": 0.0017945775762200356, "global_step": 42851, "epoch": 360, "lr": 3.4945811871518125e-05} +{"train_loss": 0.0009831422939896584, "global_step": 42852, "epoch": 360, "lr": 3.494369918141756e-05} +{"train_loss": 0.0011835100594908, "global_step": 42853, "epoch": 360, "lr": 3.4941586520878445e-05} +{"train_loss": 0.0014647232601419091, "global_step": 42854, "epoch": 360, "lr": 3.49394738899049e-05} +{"train_loss": 0.0013414629502221942, "global_step": 42855, "epoch": 360, "lr": 3.4937361288501104e-05} +{"train_loss": 0.0014247933868318796, "global_step": 42856, "epoch": 360, "lr": 3.493524871667118e-05} +{"train_loss": 0.0009636958711780608, "global_step": 42857, "epoch": 360, "lr": 3.493313617441929e-05} +{"train_loss": 0.001180339022539556, "global_step": 42858, "epoch": 360, "lr": 3.493102366174958e-05} +{"train_loss": 0.0011440254747867584, "global_step": 42859, "epoch": 360, "lr": 3.492891117866617e-05} +{"train_loss": 0.0021682879887521267, "global_step": 42860, "epoch": 360, "lr": 3.492679872517327e-05} +{"train_loss": 0.001150723546743393, "global_step": 42861, "epoch": 360, "lr": 3.4924686301274986e-05} +{"train_loss": 0.001162949251011014, "global_step": 42862, "epoch": 360, "lr": 3.492257390697544e-05} +{"train_loss": 0.0015397608513012528, "global_step": 42863, "epoch": 360, "lr": 3.492046154227884e-05} +{"train_loss": 0.0009643082157708704, "global_step": 42864, "epoch": 360, "lr": 3.491834920718928e-05} +{"train_loss": 0.0012041572481393814, "global_step": 42865, "epoch": 360, "lr": 3.491623690171095e-05} +{"train_loss": 0.0018085084157064557, "global_step": 42866, "epoch": 360, "lr": 3.491412462584796e-05} +{"train_loss": 0.0010475824819877744, "global_step": 42867, "epoch": 360, "lr": 3.49120123796045e-05} +{"train_loss": 0.0016467523528262973, "global_step": 42868, "epoch": 360, "lr": 3.490990016298468e-05} +{"train_loss": 0.0016311737708747387, "global_step": 42869, "epoch": 360, "lr": 3.4907787975992645e-05} +{"train_loss": 0.0008644053596071899, "global_step": 42870, "epoch": 360, "lr": 3.4905675818632575e-05} +{"train_loss": 0.0008681845501996577, "global_step": 42871, "epoch": 360, "lr": 3.490356369090857e-05} +{"train_loss": 0.0019132746383547783, "global_step": 42872, "epoch": 360, "lr": 3.490145159282484e-05} +{"train_loss": 0.001499101286754012, "global_step": 42873, "epoch": 360, "lr": 3.489933952438548e-05} +{"train_loss": 0.0016142574604600668, "global_step": 42874, "epoch": 360, "lr": 3.489722748559463e-05} +{"train_loss": 0.0016080130590125918, "global_step": 42875, "epoch": 360, "lr": 3.48951154764565e-05} +{"train_loss": 0.0005854163318872452, "global_step": 42876, "epoch": 360, "lr": 3.489300349697516e-05} +{"train_loss": 0.0016303437296301126, "global_step": 42877, "epoch": 360, "lr": 3.489089154715483e-05} +{"train_loss": 0.0012450277572497725, "global_step": 42878, "epoch": 360, "lr": 3.488877962699959e-05} +{"train_loss": 0.0020333153661340475, "global_step": 42879, "epoch": 360, "lr": 3.488666773651364e-05} +{"train_loss": 0.000884206616319716, "global_step": 42880, "epoch": 360, "lr": 3.488455587570111e-05} +{"train_loss": 0.0013754424871876836, "global_step": 42881, "epoch": 360, "lr": 3.488244404456611e-05} +{"train_loss": 0.0010407494846731424, "global_step": 42882, "epoch": 360, "lr": 3.488033224311284e-05} +{"train_loss": 0.0008401080849580467, "global_step": 42883, "epoch": 360, "lr": 3.4878220471345404e-05} +{"train_loss": 0.0009672394953668118, "global_step": 42884, "epoch": 360, "lr": 3.487610872926798e-05} +{"train_loss": 0.002091675531119108, "global_step": 42885, "epoch": 360, "lr": 3.4873997016884704e-05} +{"train_loss": 0.0011644390178844333, "global_step": 42886, "epoch": 360, "lr": 3.487188533419971e-05} +{"train_loss": 0.0015288402792066336, "global_step": 42887, "epoch": 360, "lr": 3.486977368121714e-05} +{"train_loss": 0.002032156102359295, "global_step": 42888, "epoch": 360, "lr": 3.4867662057941175e-05} +{"train_loss": 0.0020535055082291365, "global_step": 42889, "epoch": 360, "lr": 3.486555046437593e-05} +{"train_loss": 0.0016853805864229798, "global_step": 42890, "epoch": 360, "lr": 3.486343890052556e-05} +{"train_loss": 0.0017031981842592359, "global_step": 42891, "epoch": 360, "lr": 3.48613273663942e-05} +{"train_loss": 0.0010928428964689374, "global_step": 42892, "epoch": 360, "lr": 3.4859215861986034e-05} +{"train_loss": 0.0013429062673822045, "global_step": 42893, "epoch": 360, "lr": 3.485710438730515e-05} +{"train_loss": 0.0015089798253029585, "global_step": 42894, "epoch": 360, "lr": 3.485499294235575e-05} +{"train_loss": 0.0012733351904898882, "global_step": 42895, "epoch": 360, "lr": 3.485288152714192e-05} +{"train_loss": 0.0013913973234593868, "global_step": 42896, "epoch": 360, "lr": 3.485077014166788e-05} +{"train_loss": 0.0021924253087490797, "global_step": 42897, "epoch": 360, "lr": 3.4848658785937696e-05} +{"train_loss": 0.0010331100784242153, "global_step": 42898, "epoch": 360, "lr": 3.484654745995558e-05} +{"train_loss": 0.0009025937179103494, "global_step": 42899, "epoch": 360, "lr": 3.484443616372565e-05} +{"train_loss": 0.0017689693486317992, "global_step": 42900, "epoch": 360, "lr": 3.484232489725203e-05} +{"train_loss": 0.0016453108983114362, "global_step": 42901, "epoch": 360, "lr": 3.48402136605389e-05} +{"train_loss": 0.0012280632508918643, "global_step": 42902, "epoch": 360, "lr": 3.483810245359038e-05} +{"train_loss": 0.0009642125805839896, "global_step": 42903, "epoch": 360, "lr": 3.483599127641064e-05} +{"train_loss": 0.0006300173699855804, "global_step": 42904, "epoch": 360, "lr": 3.48338801290038e-05} +{"train_loss": 0.001329123741015792, "global_step": 42905, "epoch": 360, "lr": 3.4831769011374015e-05} +{"train_loss": 0.0006928843213245273, "global_step": 42906, "epoch": 360, "lr": 3.4829657923525435e-05} +{"train_loss": 0.002288938732817769, "global_step": 42907, "epoch": 360, "lr": 3.48275468654622e-05} +{"train_loss": 0.0018025749595835805, "global_step": 42908, "epoch": 360, "lr": 3.4825435837188455e-05} +{"train_loss": 0.0011933360947296023, "global_step": 42909, "epoch": 360, "lr": 3.4823324838708336e-05} +{"train_loss": 0.0013579445658251643, "global_step": 42910, "epoch": 360, "lr": 3.482121387002602e-05} +{"train_loss": 0.0011963562574237585, "global_step": 42911, "epoch": 360, "lr": 3.481910293114563e-05} +{"train_loss": 0.0014574626693502069, "global_step": 42912, "epoch": 360, "lr": 3.481699202207128e-05} +{"train_loss": 0.0023389316629618406, "global_step": 42913, "epoch": 360, "lr": 3.481488114280718e-05} +{"train_loss": 0.0010771396337077022, "global_step": 42914, "epoch": 360, "lr": 3.48127702933574e-05} +{"train_loss": 0.0009727398864924908, "global_step": 42915, "epoch": 360, "lr": 3.481065947372616e-05} +{"train_loss": 0.002261091023683548, "global_step": 42916, "epoch": 360, "lr": 3.480854868391754e-05} +{"train_loss": 0.0012323545524850488, "global_step": 42917, "epoch": 360, "lr": 3.4806437923935726e-05} +{"train_loss": 0.0018448098562657833, "global_step": 42918, "epoch": 360, "lr": 3.480432719378485e-05} +{"train_loss": 0.0014878906076774001, "global_step": 42919, "epoch": 360, "lr": 3.480221649346904e-05} +{"train_loss": 0.0013537504710257053, "global_step": 42920, "epoch": 360, "lr": 3.480010582299247e-05} +{"train_loss": 0.0008347074617631733, "global_step": 42921, "epoch": 360, "lr": 3.4797995182359256e-05} +{"train_loss": 0.0007983598043210804, "global_step": 42922, "epoch": 360, "lr": 3.4795884571573557e-05} +{"train_loss": 0.0011697834124788642, "global_step": 42923, "epoch": 360, "lr": 3.479377399063952e-05} +{"train_loss": 0.0012812380446121097, "global_step": 42924, "epoch": 360, "lr": 3.479166343956127e-05} +{"train_loss": 0.0011071375338360667, "global_step": 42925, "epoch": 360, "lr": 3.478955291834298e-05} +{"train_loss": 0.001939426176249981, "global_step": 42926, "epoch": 360, "lr": 3.4787442426988767e-05} +{"train_loss": 0.0016192675102502108, "global_step": 42927, "epoch": 360, "lr": 3.4785331965502796e-05} +{"train_loss": 0.001674460363574326, "global_step": 42928, "epoch": 360, "lr": 3.478322153388918e-05} +{"train_loss": 0.0021730668377131224, "global_step": 42929, "epoch": 360, "lr": 3.478111113215211e-05} +{"train_loss": 0.0018239091150462627, "global_step": 42930, "epoch": 360, "lr": 3.4779000760295696e-05} +{"train_loss": 0.0015332202892750502, "global_step": 42931, "epoch": 360, "lr": 3.477689041832407e-05} +{"train_loss": 0.0016026742523536086, "global_step": 42932, "epoch": 360, "lr": 3.4774780106241415e-05} +{"train_loss": 0.0006729988963343203, "global_step": 42933, "epoch": 360, "lr": 3.4772669824051834e-05} +{"train_loss": 0.0014341410715132952, "global_step": 42934, "epoch": 360, "lr": 3.477055957175951e-05} +{"train_loss": 0.0019458109745755792, "global_step": 42935, "epoch": 360, "lr": 3.476844934936855e-05} +{"train_loss": 0.002371538896113634, "global_step": 42936, "epoch": 360, "lr": 3.476633915688311e-05} +{"train_loss": 0.0014639889122918248, "global_step": 42937, "epoch": 360, "lr": 3.476422899430734e-05} +{"train_loss": 0.0018340727547183633, "global_step": 42938, "epoch": 360, "lr": 3.476211886164538e-05} +{"train_loss": 0.0008739755139686167, "global_step": 42939, "epoch": 360, "lr": 3.476000875890137e-05} +{"train_loss": 0.0016614862252026796, "global_step": 42940, "epoch": 360, "lr": 3.475789868607946e-05} +{"train_loss": 0.0010734627721831203, "global_step": 42941, "epoch": 360, "lr": 3.475578864318378e-05} +{"train_loss": 0.0015102199977263808, "global_step": 42942, "epoch": 360, "lr": 3.475367863021849e-05} +{"train_loss": 0.0020661428570747375, "global_step": 42943, "epoch": 360, "lr": 3.475156864718771e-05} +{"train_loss": 0.0006897923303768039, "global_step": 42944, "epoch": 360, "lr": 3.474945869409561e-05} +{"train_loss": 0.0011101813288405538, "global_step": 42945, "epoch": 360, "lr": 3.47473487709463e-05} +{"train_loss": 0.0012998118763789535, "global_step": 42946, "epoch": 360, "lr": 3.4745238877743954e-05} +{"train_loss": 0.002060964470729232, "global_step": 42947, "epoch": 360, "lr": 3.4743129014492695e-05} +{"train_loss": 0.0015957177383825183, "global_step": 42948, "epoch": 360, "lr": 3.474101918119669e-05} +{"train_loss": 0.001329470076598227, "global_step": 42949, "epoch": 360, "lr": 3.473890937786006e-05} +{"train_loss": 0.0014252658002078533, "global_step": 42950, "epoch": 360, "lr": 3.473679960448693e-05} +{"train_loss": 0.0018763266270980239, "global_step": 42951, "epoch": 360, "lr": 3.4734689861081485e-05} +{"train_loss": 0.001734064077027142, "global_step": 42952, "epoch": 360, "lr": 3.473258014764782e-05} +{"train_loss": 0.001411818782798946, "global_step": 42953, "epoch": 360, "lr": 3.4730470464190135e-05} +{"train_loss": 0.0012574855936691165, "global_step": 42954, "epoch": 360, "lr": 3.472836081071252e-05} +{"train_loss": 0.0016182909021154046, "global_step": 42955, "epoch": 360, "lr": 3.4726251187219136e-05} +{"train_loss": 0.0014706222573295236, "global_step": 42956, "epoch": 360, "lr": 3.472414159371413e-05} +{"train_loss": 0.0012958680745214224, "global_step": 42957, "epoch": 360, "lr": 3.4722032030201635e-05} +{"train_loss": 0.0014233667160846106, "global_step": 42958, "epoch": 360, "lr": 3.471992249668581e-05, "val_loss": 0.054457735270261765, "train_action_mse_error": 2.885351568693295e-05} +{"train_loss": 0.002318865619599819, "global_step": 42959, "epoch": 361, "lr": 3.471781299317077e-05} +{"train_loss": 0.001475064200349152, "global_step": 42960, "epoch": 361, "lr": 3.471570351966069e-05} +{"train_loss": 0.0012320360401645303, "global_step": 42961, "epoch": 361, "lr": 3.4713594076159696e-05} +{"train_loss": 0.0014632457168772817, "global_step": 42962, "epoch": 361, "lr": 3.47114846626719e-05} +{"train_loss": 0.0021914923563599586, "global_step": 42963, "epoch": 361, "lr": 3.4709375279201495e-05} +{"train_loss": 0.0020407799165695906, "global_step": 42964, "epoch": 361, "lr": 3.4707265925752574e-05} +{"train_loss": 0.001335651846602559, "global_step": 42965, "epoch": 361, "lr": 3.4705156602329324e-05} +{"train_loss": 0.0009682929958216846, "global_step": 42966, "epoch": 361, "lr": 3.470304730893585e-05} +{"train_loss": 0.0009282529936172068, "global_step": 42967, "epoch": 361, "lr": 3.4700938045576325e-05} +{"train_loss": 0.001622142386622727, "global_step": 42968, "epoch": 361, "lr": 3.469882881225487e-05} +{"train_loss": 0.0017786859534680843, "global_step": 42969, "epoch": 361, "lr": 3.469671960897561e-05} +{"train_loss": 0.0011275751749053597, "global_step": 42970, "epoch": 361, "lr": 3.469461043574272e-05} +{"train_loss": 0.0018413536017760634, "global_step": 42971, "epoch": 361, "lr": 3.469250129256033e-05} +{"train_loss": 0.0017058271914720535, "global_step": 42972, "epoch": 361, "lr": 3.4690392179432573e-05} +{"train_loss": 0.0018724249675869942, "global_step": 42973, "epoch": 361, "lr": 3.4688283096363616e-05} +{"train_loss": 0.0023652310483157635, "global_step": 42974, "epoch": 361, "lr": 3.4686174043357545e-05} +{"train_loss": 0.0015204868977889419, "global_step": 42975, "epoch": 361, "lr": 3.468406502041856e-05} +{"train_loss": 0.0008103797445073724, "global_step": 42976, "epoch": 361, "lr": 3.468195602755076e-05} +{"train_loss": 0.0012168281245976686, "global_step": 42977, "epoch": 361, "lr": 3.467984706475832e-05} +{"train_loss": 0.0017138762632384896, "global_step": 42978, "epoch": 361, "lr": 3.467773813204535e-05} +{"train_loss": 0.0014257215661928058, "global_step": 42979, "epoch": 361, "lr": 3.467562922941602e-05} +{"train_loss": 0.0024714067112654448, "global_step": 42980, "epoch": 361, "lr": 3.467352035687445e-05} +{"train_loss": 0.002105515217408538, "global_step": 42981, "epoch": 361, "lr": 3.467141151442477e-05} +{"train_loss": 0.0018575484864413738, "global_step": 42982, "epoch": 361, "lr": 3.4669302702071155e-05} +{"train_loss": 0.0009088909137062728, "global_step": 42983, "epoch": 361, "lr": 3.466719391981771e-05} +{"train_loss": 0.001419040490873158, "global_step": 42984, "epoch": 361, "lr": 3.466508516766861e-05} +{"train_loss": 0.001462716143578291, "global_step": 42985, "epoch": 361, "lr": 3.466297644562795e-05} +{"train_loss": 0.0020422504749149084, "global_step": 42986, "epoch": 361, "lr": 3.466086775369992e-05} +{"train_loss": 0.0011397553607821465, "global_step": 42987, "epoch": 361, "lr": 3.465875909188862e-05} +{"train_loss": 0.0015745512209832668, "global_step": 42988, "epoch": 361, "lr": 3.4656650460198224e-05} +{"train_loss": 0.002542323200032115, "global_step": 42989, "epoch": 361, "lr": 3.465454185863285e-05} +{"train_loss": 0.0008110936614684761, "global_step": 42990, "epoch": 361, "lr": 3.465243328719664e-05} +{"train_loss": 0.00220947596244514, "global_step": 42991, "epoch": 361, "lr": 3.4650324745893746e-05} +{"train_loss": 0.0019421355100348592, "global_step": 42992, "epoch": 361, "lr": 3.46482162347283e-05} +{"train_loss": 0.0025220029056072235, "global_step": 42993, "epoch": 361, "lr": 3.4646107753704424e-05} +{"train_loss": 0.0017495190259069204, "global_step": 42994, "epoch": 361, "lr": 3.46439993028263e-05} +{"train_loss": 0.0010366777423769236, "global_step": 42995, "epoch": 361, "lr": 3.4641890882098014e-05} +{"train_loss": 0.0018543285550549626, "global_step": 42996, "epoch": 361, "lr": 3.4639782491523764e-05} +{"train_loss": 0.0011665482306852937, "global_step": 42997, "epoch": 361, "lr": 3.463767413110763e-05} +{"train_loss": 0.0019448775565251708, "global_step": 42998, "epoch": 361, "lr": 3.463556580085381e-05} +{"train_loss": 0.0032033692114055157, "global_step": 42999, "epoch": 361, "lr": 3.4633457500766416e-05} +{"train_loss": 0.0013992422027513385, "global_step": 43000, "epoch": 361, "lr": 3.4631349230849555e-05} +{"train_loss": 0.001378555316478014, "global_step": 43001, "epoch": 361, "lr": 3.4629240991107424e-05} +{"train_loss": 0.0009104614146053791, "global_step": 43002, "epoch": 361, "lr": 3.462713278154413e-05} +{"train_loss": 0.0026364275254309177, "global_step": 43003, "epoch": 361, "lr": 3.462502460216382e-05} +{"train_loss": 0.0013004057109355927, "global_step": 43004, "epoch": 361, "lr": 3.462291645297063e-05} +{"train_loss": 0.0021842343267053366, "global_step": 43005, "epoch": 361, "lr": 3.462080833396869e-05} +{"train_loss": 0.0027699361089617014, "global_step": 43006, "epoch": 361, "lr": 3.461870024516216e-05} +{"train_loss": 0.0011365623213350773, "global_step": 43007, "epoch": 361, "lr": 3.4616592186555166e-05} +{"train_loss": 0.0010727413464337587, "global_step": 43008, "epoch": 361, "lr": 3.4614484158151854e-05} +{"train_loss": 0.0015686068218201399, "global_step": 43009, "epoch": 361, "lr": 3.461237615995635e-05} +{"train_loss": 0.002450445434078574, "global_step": 43010, "epoch": 361, "lr": 3.4610268191972816e-05} +{"train_loss": 0.0015184067888185382, "global_step": 43011, "epoch": 361, "lr": 3.460816025420537e-05} +{"train_loss": 0.0025808156933635473, "global_step": 43012, "epoch": 361, "lr": 3.460605234665814e-05} +{"train_loss": 0.001005603582598269, "global_step": 43013, "epoch": 361, "lr": 3.4603944469335314e-05} +{"train_loss": 0.0015369084430858493, "global_step": 43014, "epoch": 361, "lr": 3.460183662224097e-05} +{"train_loss": 0.0019781985320150852, "global_step": 43015, "epoch": 361, "lr": 3.459972880537929e-05} +{"train_loss": 0.0019333121599629521, "global_step": 43016, "epoch": 361, "lr": 3.4597621018754387e-05} +{"train_loss": 0.0011891688918694854, "global_step": 43017, "epoch": 361, "lr": 3.459551326237043e-05} +{"train_loss": 0.0007790692034177482, "global_step": 43018, "epoch": 361, "lr": 3.459340553623153e-05} +{"train_loss": 0.0015294007025659084, "global_step": 43019, "epoch": 361, "lr": 3.459129784034181e-05} +{"train_loss": 0.0017444477416574955, "global_step": 43020, "epoch": 361, "lr": 3.458919017470544e-05} +{"train_loss": 0.0019646708387881517, "global_step": 43021, "epoch": 361, "lr": 3.4587082539326556e-05} +{"train_loss": 0.0012311807367950678, "global_step": 43022, "epoch": 361, "lr": 3.458497493420929e-05} +{"train_loss": 0.003819575533270836, "global_step": 43023, "epoch": 361, "lr": 3.458286735935779e-05} +{"train_loss": 0.0020301721524447203, "global_step": 43024, "epoch": 361, "lr": 3.458075981477615e-05} +{"train_loss": 0.001528903259895742, "global_step": 43025, "epoch": 361, "lr": 3.457865230046857e-05} +{"train_loss": 0.0008771527791395783, "global_step": 43026, "epoch": 361, "lr": 3.457654481643914e-05} +{"train_loss": 0.00173256266862154, "global_step": 43027, "epoch": 361, "lr": 3.457443736269203e-05} +{"train_loss": 0.0015715858899056911, "global_step": 43028, "epoch": 361, "lr": 3.4572329939231345e-05} +{"train_loss": 0.0008264172356575727, "global_step": 43029, "epoch": 361, "lr": 3.4570222546061274e-05} +{"train_loss": 0.002337902784347534, "global_step": 43030, "epoch": 361, "lr": 3.4568115183185904e-05} +{"train_loss": 0.002173431683331728, "global_step": 43031, "epoch": 361, "lr": 3.4566007850609385e-05} +{"train_loss": 0.0016059190966188908, "global_step": 43032, "epoch": 361, "lr": 3.456390054833587e-05} +{"train_loss": 0.0011183209717273712, "global_step": 43033, "epoch": 361, "lr": 3.456179327636948e-05} +{"train_loss": 0.0019992971792817116, "global_step": 43034, "epoch": 361, "lr": 3.455968603471437e-05} +{"train_loss": 0.001668518059886992, "global_step": 43035, "epoch": 361, "lr": 3.455757882337465e-05} +{"train_loss": 0.001928597455844283, "global_step": 43036, "epoch": 361, "lr": 3.4555471642354495e-05} +{"train_loss": 0.00196485104970634, "global_step": 43037, "epoch": 361, "lr": 3.455336449165801e-05} +{"train_loss": 0.002023550448939204, "global_step": 43038, "epoch": 361, "lr": 3.455125737128935e-05} +{"train_loss": 0.0008485394646413624, "global_step": 43039, "epoch": 361, "lr": 3.4549150281252636e-05} +{"train_loss": 0.0016571166925132275, "global_step": 43040, "epoch": 361, "lr": 3.4547043221552015e-05} +{"train_loss": 0.0011728852987289429, "global_step": 43041, "epoch": 361, "lr": 3.454493619219163e-05} +{"train_loss": 0.0018194132717326283, "global_step": 43042, "epoch": 361, "lr": 3.454282919317562e-05} +{"train_loss": 0.0019211280159652233, "global_step": 43043, "epoch": 361, "lr": 3.4540722224508095e-05} +{"train_loss": 0.0012157863238826394, "global_step": 43044, "epoch": 361, "lr": 3.453861528619322e-05} +{"train_loss": 0.0010778276482596993, "global_step": 43045, "epoch": 361, "lr": 3.453650837823511e-05} +{"train_loss": 0.0011715417494997382, "global_step": 43046, "epoch": 361, "lr": 3.453440150063794e-05} +{"train_loss": 0.0015751527389511466, "global_step": 43047, "epoch": 361, "lr": 3.4532294653405795e-05} +{"train_loss": 0.0020605584140866995, "global_step": 43048, "epoch": 361, "lr": 3.453018783654285e-05} +{"train_loss": 0.0016112708253785968, "global_step": 43049, "epoch": 361, "lr": 3.452808105005324e-05} +{"train_loss": 0.0017759843030944467, "global_step": 43050, "epoch": 361, "lr": 3.452597429394106e-05} +{"train_loss": 0.0011760697234421968, "global_step": 43051, "epoch": 361, "lr": 3.45238675682105e-05} +{"train_loss": 0.001375724095851183, "global_step": 43052, "epoch": 361, "lr": 3.452176087286565e-05} +{"train_loss": 0.0014283743221312761, "global_step": 43053, "epoch": 361, "lr": 3.45196542079107e-05} +{"train_loss": 0.0011310153640806675, "global_step": 43054, "epoch": 361, "lr": 3.451754757334972e-05} +{"train_loss": 0.0026423996314406395, "global_step": 43055, "epoch": 361, "lr": 3.4515440969186904e-05} +{"train_loss": 0.0015222609508782625, "global_step": 43056, "epoch": 361, "lr": 3.451333439542637e-05} +{"train_loss": 0.0016205873107537627, "global_step": 43057, "epoch": 361, "lr": 3.451122785207223e-05} +{"train_loss": 0.0013201350811868906, "global_step": 43058, "epoch": 361, "lr": 3.450912133912866e-05} +{"train_loss": 0.0014045683201402426, "global_step": 43059, "epoch": 361, "lr": 3.450701485659975e-05} +{"train_loss": 0.0018072293605655432, "global_step": 43060, "epoch": 361, "lr": 3.450490840448969e-05} +{"train_loss": 0.0011086781742051244, "global_step": 43061, "epoch": 361, "lr": 3.450280198280258e-05} +{"train_loss": 0.0011752822902053595, "global_step": 43062, "epoch": 361, "lr": 3.450069559154254e-05} +{"train_loss": 0.00356723228469491, "global_step": 43063, "epoch": 361, "lr": 3.449858923071376e-05} +{"train_loss": 0.0008819015347398818, "global_step": 43064, "epoch": 361, "lr": 3.449648290032031e-05} +{"train_loss": 0.0013863277854397893, "global_step": 43065, "epoch": 361, "lr": 3.4494376600366396e-05} +{"train_loss": 0.0013088942505419254, "global_step": 43066, "epoch": 361, "lr": 3.449227033085608e-05} +{"train_loss": 0.002725568599998951, "global_step": 43067, "epoch": 361, "lr": 3.449016409179356e-05} +{"train_loss": 0.0017216384876519442, "global_step": 43068, "epoch": 361, "lr": 3.4488057883182946e-05} +{"train_loss": 0.0012919842265546322, "global_step": 43069, "epoch": 361, "lr": 3.448595170502836e-05} +{"train_loss": 0.0015811598859727383, "global_step": 43070, "epoch": 361, "lr": 3.448384555733396e-05} +{"train_loss": 0.0013217400992289186, "global_step": 43071, "epoch": 361, "lr": 3.4481739440103865e-05} +{"train_loss": 0.0009187692776322365, "global_step": 43072, "epoch": 361, "lr": 3.4479633353342225e-05} +{"train_loss": 0.0011476855725049973, "global_step": 43073, "epoch": 361, "lr": 3.447752729705317e-05} +{"train_loss": 0.0015752377221360803, "global_step": 43074, "epoch": 361, "lr": 3.447542127124081e-05} +{"train_loss": 0.0012639485066756606, "global_step": 43075, "epoch": 361, "lr": 3.447331527590932e-05} +{"train_loss": 0.002187249716371298, "global_step": 43076, "epoch": 361, "lr": 3.44712093110628e-05} +{"train_loss": 0.0016549940523300163, "global_step": 43077, "epoch": 361, "lr": 3.446910337670543e-05, "val_loss": 0.02848898619413376} +{"train_loss": 0.0022024326026439667, "global_step": 43078, "epoch": 362, "lr": 3.446699747284128e-05} +{"train_loss": 0.0017394054448232055, "global_step": 43079, "epoch": 362, "lr": 3.4464891599474556e-05} +{"train_loss": 0.002136882394552231, "global_step": 43080, "epoch": 362, "lr": 3.446278575660935e-05} +{"train_loss": 0.0009550157119520009, "global_step": 43081, "epoch": 362, "lr": 3.446067994424979e-05} +{"train_loss": 0.001752429292537272, "global_step": 43082, "epoch": 362, "lr": 3.445857416240004e-05} +{"train_loss": 0.001465036068111658, "global_step": 43083, "epoch": 362, "lr": 3.44564684110642e-05} +{"train_loss": 0.0011141536524519324, "global_step": 43084, "epoch": 362, "lr": 3.445436269024645e-05} +{"train_loss": 0.0013391063548624516, "global_step": 43085, "epoch": 362, "lr": 3.445225699995086e-05} +{"train_loss": 0.0018934110412374139, "global_step": 43086, "epoch": 362, "lr": 3.4450151340181635e-05} +{"train_loss": 0.0012860683491453528, "global_step": 43087, "epoch": 362, "lr": 3.444804571094287e-05} +{"train_loss": 0.0016635750653222203, "global_step": 43088, "epoch": 362, "lr": 3.4445940112238694e-05} +{"train_loss": 0.0017275757854804397, "global_step": 43089, "epoch": 362, "lr": 3.444383454407326e-05} +{"train_loss": 0.0021555577404797077, "global_step": 43090, "epoch": 362, "lr": 3.444172900645068e-05} +{"train_loss": 0.0010173233458772302, "global_step": 43091, "epoch": 362, "lr": 3.443962349937514e-05} +{"train_loss": 0.0006869424250908196, "global_step": 43092, "epoch": 362, "lr": 3.4437518022850726e-05} +{"train_loss": 0.001474043121561408, "global_step": 43093, "epoch": 362, "lr": 3.443541257688155e-05} +{"train_loss": 0.001911746570840478, "global_step": 43094, "epoch": 362, "lr": 3.4433307161471815e-05} +{"train_loss": 0.0013319813879206777, "global_step": 43095, "epoch": 362, "lr": 3.4431201776625596e-05} +{"train_loss": 0.0005880246171727777, "global_step": 43096, "epoch": 362, "lr": 3.442909642234707e-05} +{"train_loss": 0.002143827034160495, "global_step": 43097, "epoch": 362, "lr": 3.4426991098640324e-05} +{"train_loss": 0.002087310189381242, "global_step": 43098, "epoch": 362, "lr": 3.442488580550954e-05} +{"train_loss": 0.001176335383206606, "global_step": 43099, "epoch": 362, "lr": 3.442278054295883e-05} +{"train_loss": 0.0013922661310061812, "global_step": 43100, "epoch": 362, "lr": 3.44206753109923e-05} +{"train_loss": 0.0009525520727038383, "global_step": 43101, "epoch": 362, "lr": 3.4418570109614135e-05} +{"train_loss": 0.0016499205958098173, "global_step": 43102, "epoch": 362, "lr": 3.441646493882842e-05} +{"train_loss": 0.0009362739510834217, "global_step": 43103, "epoch": 362, "lr": 3.441435979863933e-05} +{"train_loss": 0.0024322201497852802, "global_step": 43104, "epoch": 362, "lr": 3.441225468905097e-05} +{"train_loss": 0.0010388686787337065, "global_step": 43105, "epoch": 362, "lr": 3.441014961006748e-05} +{"train_loss": 0.0011536729289218783, "global_step": 43106, "epoch": 362, "lr": 3.440804456169301e-05} +{"train_loss": 0.0013167251599952579, "global_step": 43107, "epoch": 362, "lr": 3.440593954393166e-05} +{"train_loss": 0.001447665854357183, "global_step": 43108, "epoch": 362, "lr": 3.4403834556787605e-05} +{"train_loss": 0.00184326630551368, "global_step": 43109, "epoch": 362, "lr": 3.4401729600264934e-05} +{"train_loss": 0.0015836219536140561, "global_step": 43110, "epoch": 362, "lr": 3.4399624674367816e-05} +{"train_loss": 0.0020994720980525017, "global_step": 43111, "epoch": 362, "lr": 3.439751977910037e-05} +{"train_loss": 0.0019242801936343312, "global_step": 43112, "epoch": 362, "lr": 3.439541491446671e-05} +{"train_loss": 0.0009084272896870971, "global_step": 43113, "epoch": 362, "lr": 3.4393310080471e-05} +{"train_loss": 0.0013756135012954473, "global_step": 43114, "epoch": 362, "lr": 3.439120527711734e-05} +{"train_loss": 0.0008285021176561713, "global_step": 43115, "epoch": 362, "lr": 3.43891005044099e-05} +{"train_loss": 0.0010274782544001937, "global_step": 43116, "epoch": 362, "lr": 3.438699576235278e-05} +{"train_loss": 0.0030540029983967543, "global_step": 43117, "epoch": 362, "lr": 3.438489105095014e-05} +{"train_loss": 0.001678315456956625, "global_step": 43118, "epoch": 362, "lr": 3.438278637020609e-05} +{"train_loss": 0.002320607891306281, "global_step": 43119, "epoch": 362, "lr": 3.438068172012477e-05} +{"train_loss": 0.0016280945856124163, "global_step": 43120, "epoch": 362, "lr": 3.4378577100710314e-05} +{"train_loss": 0.0018766866996884346, "global_step": 43121, "epoch": 362, "lr": 3.437647251196685e-05} +{"train_loss": 0.001452375901862979, "global_step": 43122, "epoch": 362, "lr": 3.437436795389851e-05} +{"train_loss": 0.0011102736461907625, "global_step": 43123, "epoch": 362, "lr": 3.437226342650945e-05} +{"train_loss": 0.0017308314563706517, "global_step": 43124, "epoch": 362, "lr": 3.437015892980375e-05} +{"train_loss": 0.0013838474405929446, "global_step": 43125, "epoch": 362, "lr": 3.436805446378561e-05} +{"train_loss": 0.0017282027984037995, "global_step": 43126, "epoch": 362, "lr": 3.436595002845908e-05} +{"train_loss": 0.0014353886945173144, "global_step": 43127, "epoch": 362, "lr": 3.4363845623828376e-05} +{"train_loss": 0.002037485595792532, "global_step": 43128, "epoch": 362, "lr": 3.436174124989756e-05} +{"train_loss": 0.0014090747572481632, "global_step": 43129, "epoch": 362, "lr": 3.435963690667082e-05} +{"train_loss": 0.0012315757339820266, "global_step": 43130, "epoch": 362, "lr": 3.435753259415226e-05} +{"train_loss": 0.001029876759275794, "global_step": 43131, "epoch": 362, "lr": 3.435542831234599e-05} +{"train_loss": 0.0025260685943067074, "global_step": 43132, "epoch": 362, "lr": 3.43533240612562e-05} +{"train_loss": 0.0017296309815719724, "global_step": 43133, "epoch": 362, "lr": 3.4351219840886953e-05} +{"train_loss": 0.0012761639663949609, "global_step": 43134, "epoch": 362, "lr": 3.4349115651242434e-05} +{"train_loss": 0.002011528005823493, "global_step": 43135, "epoch": 362, "lr": 3.434701149232674e-05} +{"train_loss": 0.001822163350880146, "global_step": 43136, "epoch": 362, "lr": 3.434490736414404e-05} +{"train_loss": 0.0012857052497565746, "global_step": 43137, "epoch": 362, "lr": 3.434280326669842e-05} +{"train_loss": 0.0026720294263213873, "global_step": 43138, "epoch": 362, "lr": 3.434069919999403e-05} +{"train_loss": 0.0018215704476460814, "global_step": 43139, "epoch": 362, "lr": 3.433859516403503e-05} +{"train_loss": 0.0014684123452752829, "global_step": 43140, "epoch": 362, "lr": 3.4336491158825496e-05} +{"train_loss": 0.0017945434665307403, "global_step": 43141, "epoch": 362, "lr": 3.433438718436961e-05} +{"train_loss": 0.0015789850149303675, "global_step": 43142, "epoch": 362, "lr": 3.433228324067148e-05} +{"train_loss": 0.0009051910601556301, "global_step": 43143, "epoch": 362, "lr": 3.433017932773522e-05} +{"train_loss": 0.0023776188027113676, "global_step": 43144, "epoch": 362, "lr": 3.4328075445565e-05} +{"train_loss": 0.0015058281132951379, "global_step": 43145, "epoch": 362, "lr": 3.4325971594164905e-05} +{"train_loss": 0.0010617556981742382, "global_step": 43146, "epoch": 362, "lr": 3.432386777353912e-05} +{"train_loss": 0.0016645690193399787, "global_step": 43147, "epoch": 362, "lr": 3.432176398369172e-05} +{"train_loss": 0.0011529899202287197, "global_step": 43148, "epoch": 362, "lr": 3.431966022462688e-05} +{"train_loss": 0.0014165190514177084, "global_step": 43149, "epoch": 362, "lr": 3.4317556496348715e-05} +{"train_loss": 0.0017335513839498162, "global_step": 43150, "epoch": 362, "lr": 3.4315452798861325e-05} +{"train_loss": 0.001670112949796021, "global_step": 43151, "epoch": 362, "lr": 3.431334913216889e-05} +{"train_loss": 0.00167525140568614, "global_step": 43152, "epoch": 362, "lr": 3.431124549627551e-05} +{"train_loss": 0.001329899183474481, "global_step": 43153, "epoch": 362, "lr": 3.4309141891185324e-05} +{"train_loss": 0.001264826045371592, "global_step": 43154, "epoch": 362, "lr": 3.430703831690246e-05} +{"train_loss": 0.0009100465103983879, "global_step": 43155, "epoch": 362, "lr": 3.430493477343105e-05} +{"train_loss": 0.0016389958327636123, "global_step": 43156, "epoch": 362, "lr": 3.430283126077524e-05} +{"train_loss": 0.001441849977709353, "global_step": 43157, "epoch": 362, "lr": 3.430072777893912e-05} +{"train_loss": 0.001957846339792013, "global_step": 43158, "epoch": 362, "lr": 3.4298624327926864e-05} +{"train_loss": 0.0011127814650535583, "global_step": 43159, "epoch": 362, "lr": 3.429652090774256e-05} +{"train_loss": 0.002786788623780012, "global_step": 43160, "epoch": 362, "lr": 3.429441751839038e-05} +{"train_loss": 0.0016511366702616215, "global_step": 43161, "epoch": 362, "lr": 3.4292314159874435e-05} +{"train_loss": 0.0015880295541137457, "global_step": 43162, "epoch": 362, "lr": 3.429021083219883e-05} +{"train_loss": 0.0023405328392982483, "global_step": 43163, "epoch": 362, "lr": 3.4288107535367744e-05} +{"train_loss": 0.0010205227881669998, "global_step": 43164, "epoch": 362, "lr": 3.428600426938525e-05} +{"train_loss": 0.0006652678130194545, "global_step": 43165, "epoch": 362, "lr": 3.428390103425554e-05} +{"train_loss": 0.0015116386348381639, "global_step": 43166, "epoch": 362, "lr": 3.428179782998268e-05} +{"train_loss": 0.0018419784028083086, "global_step": 43167, "epoch": 362, "lr": 3.427969465657086e-05} +{"train_loss": 0.0013723934534937143, "global_step": 43168, "epoch": 362, "lr": 3.427759151402417e-05} +{"train_loss": 0.0010662298882380128, "global_step": 43169, "epoch": 362, "lr": 3.4275488402346736e-05} +{"train_loss": 0.0007236066157929599, "global_step": 43170, "epoch": 362, "lr": 3.4273385321542714e-05} +{"train_loss": 0.0015770228346809745, "global_step": 43171, "epoch": 362, "lr": 3.4271282271616215e-05} +{"train_loss": 0.0018119161250069737, "global_step": 43172, "epoch": 362, "lr": 3.426917925257137e-05} +{"train_loss": 0.00266571925021708, "global_step": 43173, "epoch": 362, "lr": 3.426707626441231e-05} +{"train_loss": 0.0011782124638557434, "global_step": 43174, "epoch": 362, "lr": 3.426497330714318e-05} +{"train_loss": 0.0014218696160241961, "global_step": 43175, "epoch": 362, "lr": 3.426287038076809e-05} +{"train_loss": 0.001115312334150076, "global_step": 43176, "epoch": 362, "lr": 3.4260767485291154e-05} +{"train_loss": 0.001777746481820941, "global_step": 43177, "epoch": 362, "lr": 3.425866462071654e-05} +{"train_loss": 0.0018988401861861348, "global_step": 43178, "epoch": 362, "lr": 3.4256561787048344e-05} +{"train_loss": 0.0012725982815027237, "global_step": 43179, "epoch": 362, "lr": 3.4254458984290713e-05} +{"train_loss": 0.0023916231002658606, "global_step": 43180, "epoch": 362, "lr": 3.4252356212447787e-05} +{"train_loss": 0.001271581626497209, "global_step": 43181, "epoch": 362, "lr": 3.425025347152364e-05} +{"train_loss": 0.0014779723715037107, "global_step": 43182, "epoch": 362, "lr": 3.424815076152247e-05} +{"train_loss": 0.0015585458604618907, "global_step": 43183, "epoch": 362, "lr": 3.4246048082448346e-05} +{"train_loss": 0.0017653111135587096, "global_step": 43184, "epoch": 362, "lr": 3.4243945434305446e-05} +{"train_loss": 0.0013679565163329244, "global_step": 43185, "epoch": 362, "lr": 3.424184281709786e-05} +{"train_loss": 0.001654887106269598, "global_step": 43186, "epoch": 362, "lr": 3.423974023082974e-05} +{"train_loss": 0.0011275984579697251, "global_step": 43187, "epoch": 362, "lr": 3.4237637675505205e-05} +{"train_loss": 0.0012132776901125908, "global_step": 43188, "epoch": 362, "lr": 3.423553515112838e-05} +{"train_loss": 0.00214928830973804, "global_step": 43189, "epoch": 362, "lr": 3.4233432657703415e-05} +{"train_loss": 0.0017330285627394915, "global_step": 43190, "epoch": 362, "lr": 3.4231330195234393e-05} +{"train_loss": 0.001799358637072146, "global_step": 43191, "epoch": 362, "lr": 3.422922776372549e-05} +{"train_loss": 0.0007401558104902506, "global_step": 43192, "epoch": 362, "lr": 3.422712536318082e-05} +{"train_loss": 0.001492562354542315, "global_step": 43193, "epoch": 362, "lr": 3.422502299360448e-05} +{"train_loss": 0.0024066143669188023, "global_step": 43194, "epoch": 362, "lr": 3.4222920655000646e-05} +{"train_loss": 0.0016902813222259283, "global_step": 43195, "epoch": 362, "lr": 3.4220818347373394e-05} +{"train_loss": 0.0015666981226717662, "global_step": 43196, "epoch": 362, "lr": 3.421871607072691e-05, "val_loss": 0.012564148753881454} +{"train_loss": 0.001388888107612729, "global_step": 43197, "epoch": 363, "lr": 3.421661382506526e-05} +{"train_loss": 0.0009636138565838337, "global_step": 43198, "epoch": 363, "lr": 3.421451161039263e-05} +{"train_loss": 0.0020942892879247665, "global_step": 43199, "epoch": 363, "lr": 3.4212409426713124e-05} +{"train_loss": 0.0016024510841816664, "global_step": 43200, "epoch": 363, "lr": 3.421030727403083e-05} +{"train_loss": 0.0017055862117558718, "global_step": 43201, "epoch": 363, "lr": 3.420820515234993e-05} +{"train_loss": 0.0013588700676336884, "global_step": 43202, "epoch": 363, "lr": 3.4206103061674535e-05} +{"train_loss": 0.0012055396800860763, "global_step": 43203, "epoch": 363, "lr": 3.4204001002008765e-05} +{"train_loss": 0.001266259467229247, "global_step": 43204, "epoch": 363, "lr": 3.4201898973356754e-05} +{"train_loss": 0.001414805417880416, "global_step": 43205, "epoch": 363, "lr": 3.419979697572263e-05} +{"train_loss": 0.002147719031199813, "global_step": 43206, "epoch": 363, "lr": 3.419769500911052e-05} +{"train_loss": 0.0014278660528361797, "global_step": 43207, "epoch": 363, "lr": 3.419559307352453e-05} +{"train_loss": 0.001541810343042016, "global_step": 43208, "epoch": 363, "lr": 3.419349116896882e-05} +{"train_loss": 0.0013948415871709585, "global_step": 43209, "epoch": 363, "lr": 3.4191389295447487e-05} +{"train_loss": 0.001280629774555564, "global_step": 43210, "epoch": 363, "lr": 3.418928745296469e-05} +{"train_loss": 0.0017471995670348406, "global_step": 43211, "epoch": 363, "lr": 3.418718564152454e-05} +{"train_loss": 0.0014474850613623857, "global_step": 43212, "epoch": 363, "lr": 3.418508386113114e-05} +{"train_loss": 0.0016959208296611905, "global_step": 43213, "epoch": 363, "lr": 3.418298211178866e-05} +{"train_loss": 0.0015697578201070428, "global_step": 43214, "epoch": 363, "lr": 3.4180880393501185e-05} +{"train_loss": 0.0017122706631198525, "global_step": 43215, "epoch": 363, "lr": 3.417877870627288e-05} +{"train_loss": 0.0013506889808923006, "global_step": 43216, "epoch": 363, "lr": 3.417667705010783e-05} +{"train_loss": 0.002321616979315877, "global_step": 43217, "epoch": 363, "lr": 3.4174575425010214e-05} +{"train_loss": 0.0013804853660985827, "global_step": 43218, "epoch": 363, "lr": 3.417247383098411e-05} +{"train_loss": 0.0017749047838151455, "global_step": 43219, "epoch": 363, "lr": 3.417037226803366e-05} +{"train_loss": 0.0010656346566975117, "global_step": 43220, "epoch": 363, "lr": 3.4168270736162996e-05} +{"train_loss": 0.0015176389133557677, "global_step": 43221, "epoch": 363, "lr": 3.4166169235376246e-05} +{"train_loss": 0.001128257135860622, "global_step": 43222, "epoch": 363, "lr": 3.416406776567752e-05} +{"train_loss": 0.0009444279130548239, "global_step": 43223, "epoch": 363, "lr": 3.416196632707096e-05} +{"train_loss": 0.0015161854680627584, "global_step": 43224, "epoch": 363, "lr": 3.41598649195607e-05} +{"train_loss": 0.002034571021795273, "global_step": 43225, "epoch": 363, "lr": 3.415776354315085e-05} +{"train_loss": 0.0011327620595693588, "global_step": 43226, "epoch": 363, "lr": 3.4155662197845516e-05} +{"train_loss": 0.0008421892416663468, "global_step": 43227, "epoch": 363, "lr": 3.4153560883648875e-05} +{"train_loss": 0.0019377529388293624, "global_step": 43228, "epoch": 363, "lr": 3.415145960056501e-05} +{"train_loss": 0.0022371055092662573, "global_step": 43229, "epoch": 363, "lr": 3.414935834859806e-05} +{"train_loss": 0.0018367284210398793, "global_step": 43230, "epoch": 363, "lr": 3.414725712775217e-05} +{"train_loss": 0.0014725810615345836, "global_step": 43231, "epoch": 363, "lr": 3.4145155938031414e-05} +{"train_loss": 0.0012604796793311834, "global_step": 43232, "epoch": 363, "lr": 3.414305477943998e-05} +{"train_loss": 0.0014476404758170247, "global_step": 43233, "epoch": 363, "lr": 3.414095365198194e-05} +{"train_loss": 0.0023379926569759846, "global_step": 43234, "epoch": 363, "lr": 3.413885255566147e-05} +{"train_loss": 0.0022826099302619696, "global_step": 43235, "epoch": 363, "lr": 3.4136751490482635e-05} +{"train_loss": 0.0021207190584391356, "global_step": 43236, "epoch": 363, "lr": 3.413465045644961e-05} +{"train_loss": 0.0016763913445174694, "global_step": 43237, "epoch": 363, "lr": 3.413254945356652e-05} +{"train_loss": 0.0007881440105848014, "global_step": 43238, "epoch": 363, "lr": 3.413044848183745e-05} +{"train_loss": 0.0008003218681551516, "global_step": 43239, "epoch": 363, "lr": 3.412834754126657e-05} +{"train_loss": 0.0011402253294363618, "global_step": 43240, "epoch": 363, "lr": 3.412624663185796e-05} +{"train_loss": 0.0017303427448496222, "global_step": 43241, "epoch": 363, "lr": 3.412414575361579e-05} +{"train_loss": 0.001380701782181859, "global_step": 43242, "epoch": 363, "lr": 3.4122044906544144e-05} +{"train_loss": 0.0011393119348213077, "global_step": 43243, "epoch": 363, "lr": 3.411994409064718e-05} +{"train_loss": 0.002914387034252286, "global_step": 43244, "epoch": 363, "lr": 3.411784330592902e-05} +{"train_loss": 0.002128831809386611, "global_step": 43245, "epoch": 363, "lr": 3.411574255239376e-05} +{"train_loss": 0.0008724525105208158, "global_step": 43246, "epoch": 363, "lr": 3.411364183004555e-05} +{"train_loss": 0.0018723409157246351, "global_step": 43247, "epoch": 363, "lr": 3.41115411388885e-05} +{"train_loss": 0.001516913645900786, "global_step": 43248, "epoch": 363, "lr": 3.410944047892675e-05} +{"train_loss": 0.001091041136533022, "global_step": 43249, "epoch": 363, "lr": 3.410733985016441e-05} +{"train_loss": 0.001128649921156466, "global_step": 43250, "epoch": 363, "lr": 3.4105239252605615e-05} +{"train_loss": 0.0019524727249518037, "global_step": 43251, "epoch": 363, "lr": 3.4103138686254486e-05} +{"train_loss": 0.002201083581894636, "global_step": 43252, "epoch": 363, "lr": 3.410103815111514e-05} +{"train_loss": 0.0012439091224223375, "global_step": 43253, "epoch": 363, "lr": 3.4098937647191706e-05} +{"train_loss": 0.001069672405719757, "global_step": 43254, "epoch": 363, "lr": 3.409683717448831e-05} +{"train_loss": 0.001593774533830583, "global_step": 43255, "epoch": 363, "lr": 3.409473673300908e-05} +{"train_loss": 0.0008765485254116356, "global_step": 43256, "epoch": 363, "lr": 3.409263632275814e-05} +{"train_loss": 0.0014542607823386788, "global_step": 43257, "epoch": 363, "lr": 3.409053594373959e-05} +{"train_loss": 0.0015415821690112352, "global_step": 43258, "epoch": 363, "lr": 3.408843559595759e-05} +{"train_loss": 0.0014338374603539705, "global_step": 43259, "epoch": 363, "lr": 3.4086335279416235e-05} +{"train_loss": 0.002846542978659272, "global_step": 43260, "epoch": 363, "lr": 3.408423499411967e-05} +{"train_loss": 0.0015292636817321181, "global_step": 43261, "epoch": 363, "lr": 3.408213474007202e-05} +{"train_loss": 0.0009432596270926297, "global_step": 43262, "epoch": 363, "lr": 3.408003451727737e-05} +{"train_loss": 0.0008729788241907954, "global_step": 43263, "epoch": 363, "lr": 3.4077934325739904e-05} +{"train_loss": 0.0015937646385282278, "global_step": 43264, "epoch": 363, "lr": 3.4075834165463674e-05} +{"train_loss": 0.0024955039843916893, "global_step": 43265, "epoch": 363, "lr": 3.4073734036452874e-05} +{"train_loss": 0.0015422856668010354, "global_step": 43266, "epoch": 363, "lr": 3.4071633938711576e-05} +{"train_loss": 0.0011477724183350801, "global_step": 43267, "epoch": 363, "lr": 3.406953387224394e-05} +{"train_loss": 0.0011107311584055424, "global_step": 43268, "epoch": 363, "lr": 3.406743383705406e-05} +{"train_loss": 0.001307302387431264, "global_step": 43269, "epoch": 363, "lr": 3.406533383314608e-05} +{"train_loss": 0.0019285811576992273, "global_step": 43270, "epoch": 363, "lr": 3.406323386052411e-05} +{"train_loss": 0.001151511212810874, "global_step": 43271, "epoch": 363, "lr": 3.406113391919227e-05} +{"train_loss": 0.0025873573031276464, "global_step": 43272, "epoch": 363, "lr": 3.40590340091547e-05} +{"train_loss": 0.0009938398143276572, "global_step": 43273, "epoch": 363, "lr": 3.4056934130415503e-05} +{"train_loss": 0.00127430132124573, "global_step": 43274, "epoch": 363, "lr": 3.405483428297883e-05} +{"train_loss": 0.001156703452579677, "global_step": 43275, "epoch": 363, "lr": 3.405273446684879e-05} +{"train_loss": 0.0014854272594675422, "global_step": 43276, "epoch": 363, "lr": 3.405063468202948e-05} +{"train_loss": 0.0015251855365931988, "global_step": 43277, "epoch": 363, "lr": 3.404853492852507e-05} +{"train_loss": 0.0013188471784815192, "global_step": 43278, "epoch": 363, "lr": 3.404643520633962e-05} +{"train_loss": 0.002215844113379717, "global_step": 43279, "epoch": 363, "lr": 3.404433551547733e-05} +{"train_loss": 0.0007962439558468759, "global_step": 43280, "epoch": 363, "lr": 3.404223585594227e-05} +{"train_loss": 0.0008958872640505433, "global_step": 43281, "epoch": 363, "lr": 3.404013622773856e-05} +{"train_loss": 0.001403737347573042, "global_step": 43282, "epoch": 363, "lr": 3.403803663087036e-05} +{"train_loss": 0.0018259979551658034, "global_step": 43283, "epoch": 363, "lr": 3.403593706534175e-05} +{"train_loss": 0.0018180841580033302, "global_step": 43284, "epoch": 363, "lr": 3.403383753115688e-05} +{"train_loss": 0.0011250959942117333, "global_step": 43285, "epoch": 363, "lr": 3.403173802831986e-05} +{"train_loss": 0.0007733296952210367, "global_step": 43286, "epoch": 363, "lr": 3.402963855683482e-05} +{"train_loss": 0.0013359134318307042, "global_step": 43287, "epoch": 363, "lr": 3.4027539116705886e-05} +{"train_loss": 0.002394281327724457, "global_step": 43288, "epoch": 363, "lr": 3.4025439707937155e-05} +{"train_loss": 0.0023837012704461813, "global_step": 43289, "epoch": 363, "lr": 3.402334033053278e-05} +{"train_loss": 0.00123852607794106, "global_step": 43290, "epoch": 363, "lr": 3.402124098449686e-05} +{"train_loss": 0.001118876738473773, "global_step": 43291, "epoch": 363, "lr": 3.4019141669833546e-05} +{"train_loss": 0.000896283017937094, "global_step": 43292, "epoch": 363, "lr": 3.401704238654692e-05} +{"train_loss": 0.0019497225293889642, "global_step": 43293, "epoch": 363, "lr": 3.401494313464113e-05} +{"train_loss": 0.001459860010072589, "global_step": 43294, "epoch": 363, "lr": 3.4012843914120306e-05} +{"train_loss": 0.001186318346299231, "global_step": 43295, "epoch": 363, "lr": 3.4010744724988534e-05} +{"train_loss": 0.0010631061159074306, "global_step": 43296, "epoch": 363, "lr": 3.4008645567249963e-05} +{"train_loss": 0.0010004895739257336, "global_step": 43297, "epoch": 363, "lr": 3.40065464409087e-05} +{"train_loss": 0.0013215371873229742, "global_step": 43298, "epoch": 363, "lr": 3.400444734596889e-05} +{"train_loss": 0.0010647049639374018, "global_step": 43299, "epoch": 363, "lr": 3.4002348282434635e-05} +{"train_loss": 0.0011923536658287048, "global_step": 43300, "epoch": 363, "lr": 3.4000249250310055e-05} +{"train_loss": 0.0006982955383136868, "global_step": 43301, "epoch": 363, "lr": 3.3998150249599284e-05} +{"train_loss": 0.0010155880590900779, "global_step": 43302, "epoch": 363, "lr": 3.3996051280306415e-05} +{"train_loss": 0.001132066361606121, "global_step": 43303, "epoch": 363, "lr": 3.399395234243561e-05} +{"train_loss": 0.0012719797668978572, "global_step": 43304, "epoch": 363, "lr": 3.399185343599096e-05} +{"train_loss": 0.0012191475834697485, "global_step": 43305, "epoch": 363, "lr": 3.39897545609766e-05} +{"train_loss": 0.0006098307203501463, "global_step": 43306, "epoch": 363, "lr": 3.398765571739665e-05} +{"train_loss": 0.0008179839933291078, "global_step": 43307, "epoch": 363, "lr": 3.3985556905255215e-05} +{"train_loss": 0.0016015798319131136, "global_step": 43308, "epoch": 363, "lr": 3.398345812455644e-05} +{"train_loss": 0.001226487453095615, "global_step": 43309, "epoch": 363, "lr": 3.398135937530442e-05} +{"train_loss": 0.0010760246077552438, "global_step": 43310, "epoch": 363, "lr": 3.3979260657503314e-05} +{"train_loss": 0.0017807518597692251, "global_step": 43311, "epoch": 363, "lr": 3.3977161971157213e-05} +{"train_loss": 0.0012258425122126937, "global_step": 43312, "epoch": 363, "lr": 3.397506331627022e-05} +{"train_loss": 0.001374397543258965, "global_step": 43313, "epoch": 363, "lr": 3.3972964692846506e-05} +{"train_loss": 0.0012241110671311617, "global_step": 43314, "epoch": 363, "lr": 3.397086610089014e-05} +{"train_loss": 0.001450893037244208, "global_step": 43315, "epoch": 363, "lr": 3.3968767540405274e-05, "val_loss": 0.022158702835440636} +{"train_loss": 0.0009415860986337066, "global_step": 43316, "epoch": 364, "lr": 3.396666901139601e-05} +{"train_loss": 0.0014706187648698688, "global_step": 43317, "epoch": 364, "lr": 3.3964570513866505e-05} +{"train_loss": 0.0008782266522757709, "global_step": 43318, "epoch": 364, "lr": 3.396247204782084e-05} +{"train_loss": 0.0022486269008368254, "global_step": 43319, "epoch": 364, "lr": 3.396037361326313e-05} +{"train_loss": 0.0010916932951658964, "global_step": 43320, "epoch": 364, "lr": 3.3958275210197536e-05} +{"train_loss": 0.0015688483836129308, "global_step": 43321, "epoch": 364, "lr": 3.395617683862814e-05} +{"train_loss": 0.001768138026818633, "global_step": 43322, "epoch": 364, "lr": 3.3954078498559094e-05} +{"train_loss": 0.0009930450469255447, "global_step": 43323, "epoch": 364, "lr": 3.395198018999448e-05} +{"train_loss": 0.002330963034182787, "global_step": 43324, "epoch": 364, "lr": 3.394988191293845e-05} +{"train_loss": 0.0021603491622954607, "global_step": 43325, "epoch": 364, "lr": 3.394778366739513e-05} +{"train_loss": 0.0009361927513964474, "global_step": 43326, "epoch": 364, "lr": 3.394568545336858e-05} +{"train_loss": 0.001481233979575336, "global_step": 43327, "epoch": 364, "lr": 3.3943587270863e-05} +{"train_loss": 0.002074695657938719, "global_step": 43328, "epoch": 364, "lr": 3.394148911988244e-05} +{"train_loss": 0.0012063607573509216, "global_step": 43329, "epoch": 364, "lr": 3.3939391000431076e-05} +{"train_loss": 0.0016526023391634226, "global_step": 43330, "epoch": 364, "lr": 3.3937292912513e-05} +{"train_loss": 0.001470466610044241, "global_step": 43331, "epoch": 364, "lr": 3.3935194856132314e-05} +{"train_loss": 0.0022318901028484106, "global_step": 43332, "epoch": 364, "lr": 3.3933096831293176e-05} +{"train_loss": 0.001599084702320397, "global_step": 43333, "epoch": 364, "lr": 3.393099883799967e-05} +{"train_loss": 0.0018142347689718008, "global_step": 43334, "epoch": 364, "lr": 3.3928900876255936e-05} +{"train_loss": 0.002457637106999755, "global_step": 43335, "epoch": 364, "lr": 3.392680294606609e-05} +{"train_loss": 0.0018632711144164205, "global_step": 43336, "epoch": 364, "lr": 3.392470504743425e-05} +{"train_loss": 0.0010303778108209372, "global_step": 43337, "epoch": 364, "lr": 3.392260718036454e-05} +{"train_loss": 0.0013905822997912765, "global_step": 43338, "epoch": 364, "lr": 3.392050934486106e-05} +{"train_loss": 0.0018676681211218238, "global_step": 43339, "epoch": 364, "lr": 3.391841154092796e-05} +{"train_loss": 0.0007310618530027568, "global_step": 43340, "epoch": 364, "lr": 3.391631376856932e-05} +{"train_loss": 0.0014723974745720625, "global_step": 43341, "epoch": 364, "lr": 3.391421602778929e-05} +{"train_loss": 0.0012724727857857943, "global_step": 43342, "epoch": 364, "lr": 3.3912118318591974e-05} +{"train_loss": 0.001514611067250371, "global_step": 43343, "epoch": 364, "lr": 3.391002064098151e-05} +{"train_loss": 0.0019366987980902195, "global_step": 43344, "epoch": 364, "lr": 3.3907922994961994e-05} +{"train_loss": 0.0008285495568998158, "global_step": 43345, "epoch": 364, "lr": 3.390582538053754e-05} +{"train_loss": 0.0017420817166566849, "global_step": 43346, "epoch": 364, "lr": 3.390372779771229e-05} +{"train_loss": 0.0025543791707605124, "global_step": 43347, "epoch": 364, "lr": 3.3901630246490345e-05} +{"train_loss": 0.0008912456687539816, "global_step": 43348, "epoch": 364, "lr": 3.389953272687584e-05} +{"train_loss": 0.0011465501738712192, "global_step": 43349, "epoch": 364, "lr": 3.3897435238872874e-05} +{"train_loss": 0.001963482704013586, "global_step": 43350, "epoch": 364, "lr": 3.389533778248557e-05} +{"train_loss": 0.0007798442966304719, "global_step": 43351, "epoch": 364, "lr": 3.389324035771806e-05} +{"train_loss": 0.0020821650978177786, "global_step": 43352, "epoch": 364, "lr": 3.389114296457444e-05} +{"train_loss": 0.00150937563739717, "global_step": 43353, "epoch": 364, "lr": 3.3889045603058846e-05} +{"train_loss": 0.0014948337338864803, "global_step": 43354, "epoch": 364, "lr": 3.388694827317539e-05} +{"train_loss": 0.0014885737327858806, "global_step": 43355, "epoch": 364, "lr": 3.388485097492818e-05} +{"train_loss": 0.001707606134004891, "global_step": 43356, "epoch": 364, "lr": 3.3882753708321366e-05} +{"train_loss": 0.0005952701321803033, "global_step": 43357, "epoch": 364, "lr": 3.388065647335902e-05} +{"train_loss": 0.0020329102408140898, "global_step": 43358, "epoch": 364, "lr": 3.3878559270045304e-05} +{"train_loss": 0.0020198023412376642, "global_step": 43359, "epoch": 364, "lr": 3.387646209838429e-05} +{"train_loss": 0.0014008061261847615, "global_step": 43360, "epoch": 364, "lr": 3.387436495838014e-05} +{"train_loss": 0.0017907883739098907, "global_step": 43361, "epoch": 364, "lr": 3.387226785003693e-05} +{"train_loss": 0.0018042637966573238, "global_step": 43362, "epoch": 364, "lr": 3.3870170773358825e-05} +{"train_loss": 0.0015259883366525173, "global_step": 43363, "epoch": 364, "lr": 3.386807372834991e-05} +{"train_loss": 0.0018313064938411117, "global_step": 43364, "epoch": 364, "lr": 3.38659767150143e-05} +{"train_loss": 0.002274514874443412, "global_step": 43365, "epoch": 364, "lr": 3.3863879733356134e-05} +{"train_loss": 0.0016223897691816092, "global_step": 43366, "epoch": 364, "lr": 3.38617827833795e-05} +{"train_loss": 0.0017203358002007008, "global_step": 43367, "epoch": 364, "lr": 3.385968586508854e-05} +{"train_loss": 0.0014521046541631222, "global_step": 43368, "epoch": 364, "lr": 3.3857588978487365e-05} +{"train_loss": 0.0007737834821455181, "global_step": 43369, "epoch": 364, "lr": 3.3855492123580074e-05} +{"train_loss": 0.0011677069123834372, "global_step": 43370, "epoch": 364, "lr": 3.385339530037082e-05} +{"train_loss": 0.001523340935818851, "global_step": 43371, "epoch": 364, "lr": 3.385129850886368e-05} +{"train_loss": 0.002255608094856143, "global_step": 43372, "epoch": 364, "lr": 3.384920174906281e-05} +{"train_loss": 0.0018519592704251409, "global_step": 43373, "epoch": 364, "lr": 3.384710502097229e-05} +{"train_loss": 0.0012108944356441498, "global_step": 43374, "epoch": 364, "lr": 3.384500832459627e-05} +{"train_loss": 0.0015063678147271276, "global_step": 43375, "epoch": 364, "lr": 3.384291165993885e-05} +{"train_loss": 0.0014267556834965944, "global_step": 43376, "epoch": 364, "lr": 3.3840815027004126e-05} +{"train_loss": 0.0016800943994894624, "global_step": 43377, "epoch": 364, "lr": 3.3838718425796254e-05} +{"train_loss": 0.0010270284255966544, "global_step": 43378, "epoch": 364, "lr": 3.383662185631932e-05} +{"train_loss": 0.0016116999322548509, "global_step": 43379, "epoch": 364, "lr": 3.383452531857746e-05} +{"train_loss": 0.0009727709111757576, "global_step": 43380, "epoch": 364, "lr": 3.383242881257479e-05} +{"train_loss": 0.0018496873090043664, "global_step": 43381, "epoch": 364, "lr": 3.3830332338315396e-05} +{"train_loss": 0.000854724261444062, "global_step": 43382, "epoch": 364, "lr": 3.382823589580343e-05} +{"train_loss": 0.0012939820298925042, "global_step": 43383, "epoch": 364, "lr": 3.382613948504299e-05} +{"train_loss": 0.0017315918812528253, "global_step": 43384, "epoch": 364, "lr": 3.38240431060382e-05} +{"train_loss": 0.0011197602143511176, "global_step": 43385, "epoch": 364, "lr": 3.382194675879318e-05} +{"train_loss": 0.0009450704092159867, "global_step": 43386, "epoch": 364, "lr": 3.3819850443312035e-05} +{"train_loss": 0.0013460780028253794, "global_step": 43387, "epoch": 364, "lr": 3.381775415959889e-05} +{"train_loss": 0.002666290383785963, "global_step": 43388, "epoch": 364, "lr": 3.3815657907657844e-05} +{"train_loss": 0.0007776409620419145, "global_step": 43389, "epoch": 364, "lr": 3.381356168749304e-05} +{"train_loss": 0.0013687171740457416, "global_step": 43390, "epoch": 364, "lr": 3.381146549910856e-05} +{"train_loss": 0.0009906868217512965, "global_step": 43391, "epoch": 364, "lr": 3.380936934250856e-05} +{"train_loss": 0.0011126657482236624, "global_step": 43392, "epoch": 364, "lr": 3.380727321769711e-05} +{"train_loss": 0.0012813083594664931, "global_step": 43393, "epoch": 364, "lr": 3.380517712467837e-05} +{"train_loss": 0.0014239917509257793, "global_step": 43394, "epoch": 364, "lr": 3.380308106345643e-05} +{"train_loss": 0.0018099177395924926, "global_step": 43395, "epoch": 364, "lr": 3.380098503403539e-05} +{"train_loss": 0.0016530439024791121, "global_step": 43396, "epoch": 364, "lr": 3.379888903641941e-05} +{"train_loss": 0.001175804645754397, "global_step": 43397, "epoch": 364, "lr": 3.379679307061256e-05} +{"train_loss": 0.0010048424592241645, "global_step": 43398, "epoch": 364, "lr": 3.3794697136618996e-05} +{"train_loss": 0.0008317328174598515, "global_step": 43399, "epoch": 364, "lr": 3.37926012344428e-05} +{"train_loss": 0.0010936716571450233, "global_step": 43400, "epoch": 364, "lr": 3.37905053640881e-05} +{"train_loss": 0.0012111651012673974, "global_step": 43401, "epoch": 364, "lr": 3.3788409525559015e-05} +{"train_loss": 0.0015234535094350576, "global_step": 43402, "epoch": 364, "lr": 3.378631371885965e-05} +{"train_loss": 0.0007488547125831246, "global_step": 43403, "epoch": 364, "lr": 3.378421794399413e-05} +{"train_loss": 0.0013111161533743143, "global_step": 43404, "epoch": 364, "lr": 3.378212220096656e-05} +{"train_loss": 0.0017725576180964708, "global_step": 43405, "epoch": 364, "lr": 3.378002648978108e-05} +{"train_loss": 0.0018927438650280237, "global_step": 43406, "epoch": 364, "lr": 3.3777930810441784e-05} +{"train_loss": 0.0011558275436982512, "global_step": 43407, "epoch": 364, "lr": 3.377583516295276e-05} +{"train_loss": 0.0013415260473266244, "global_step": 43408, "epoch": 364, "lr": 3.377373954731817e-05} +{"train_loss": 0.0018199190963059664, "global_step": 43409, "epoch": 364, "lr": 3.37716439635421e-05} +{"train_loss": 0.0014737988822162151, "global_step": 43410, "epoch": 364, "lr": 3.3769548411628685e-05} +{"train_loss": 0.000829494500067085, "global_step": 43411, "epoch": 364, "lr": 3.376745289158201e-05} +{"train_loss": 0.0011125265154987574, "global_step": 43412, "epoch": 364, "lr": 3.376535740340623e-05} +{"train_loss": 0.0011094561778008938, "global_step": 43413, "epoch": 364, "lr": 3.3763261947105434e-05} +{"train_loss": 0.0010925763053819537, "global_step": 43414, "epoch": 364, "lr": 3.376116652268372e-05} +{"train_loss": 0.0012284938711673021, "global_step": 43415, "epoch": 364, "lr": 3.375907113014524e-05} +{"train_loss": 0.0008341121138073504, "global_step": 43416, "epoch": 364, "lr": 3.375697576949407e-05} +{"train_loss": 0.0018275260226801038, "global_step": 43417, "epoch": 364, "lr": 3.3754880440734346e-05} +{"train_loss": 0.0009152533020824194, "global_step": 43418, "epoch": 364, "lr": 3.375278514387019e-05} +{"train_loss": 0.0020760195329785347, "global_step": 43419, "epoch": 364, "lr": 3.375068987890569e-05} +{"train_loss": 0.0010478675831109285, "global_step": 43420, "epoch": 364, "lr": 3.374859464584499e-05} +{"train_loss": 0.0007842888589948416, "global_step": 43421, "epoch": 364, "lr": 3.374649944469217e-05} +{"train_loss": 0.002425673883408308, "global_step": 43422, "epoch": 364, "lr": 3.374440427545138e-05} +{"train_loss": 0.002302010077983141, "global_step": 43423, "epoch": 364, "lr": 3.37423091381267e-05} +{"train_loss": 0.003131577977910638, "global_step": 43424, "epoch": 364, "lr": 3.3740214032722276e-05} +{"train_loss": 0.0007552501047030091, "global_step": 43425, "epoch": 364, "lr": 3.3738118959242204e-05} +{"train_loss": 0.0022440117318183184, "global_step": 43426, "epoch": 364, "lr": 3.3736023917690586e-05} +{"train_loss": 0.002376014133915305, "global_step": 43427, "epoch": 364, "lr": 3.373392890807155e-05} +{"train_loss": 0.0008961051353253424, "global_step": 43428, "epoch": 364, "lr": 3.373183393038921e-05} +{"train_loss": 0.00139419618062675, "global_step": 43429, "epoch": 364, "lr": 3.372973898464768e-05} +{"train_loss": 0.0016509885899722576, "global_step": 43430, "epoch": 364, "lr": 3.372764407085106e-05} +{"train_loss": 0.0021262364462018013, "global_step": 43431, "epoch": 364, "lr": 3.372554918900348e-05} +{"train_loss": 0.0014552070060744882, "global_step": 43432, "epoch": 364, "lr": 3.372345433910904e-05} +{"train_loss": 0.0021302562672644854, "global_step": 43433, "epoch": 364, "lr": 3.372135952117186e-05} +{"train_loss": 0.001501756565187502, "global_step": 43434, "epoch": 364, "lr": 3.371926473519605e-05, "val_loss": 0.018634190782904625} +{"train_loss": 0.0015482140006497502, "global_step": 43435, "epoch": 365, "lr": 3.3717169981185725e-05} +{"train_loss": 0.0013954690657556057, "global_step": 43436, "epoch": 365, "lr": 3.3715075259145004e-05} +{"train_loss": 0.0011944532161578536, "global_step": 43437, "epoch": 365, "lr": 3.371298056907799e-05} +{"train_loss": 0.001481720944866538, "global_step": 43438, "epoch": 365, "lr": 3.371088591098879e-05} +{"train_loss": 0.0008826799457892776, "global_step": 43439, "epoch": 365, "lr": 3.3708791284881534e-05} +{"train_loss": 0.0020437443163245916, "global_step": 43440, "epoch": 365, "lr": 3.370669669076032e-05} +{"train_loss": 0.0013773159589618444, "global_step": 43441, "epoch": 365, "lr": 3.370460212862927e-05} +{"train_loss": 0.0015746760182082653, "global_step": 43442, "epoch": 365, "lr": 3.3702507598492485e-05} +{"train_loss": 0.001545942504890263, "global_step": 43443, "epoch": 365, "lr": 3.37004131003541e-05} +{"train_loss": 0.0010371481766924262, "global_step": 43444, "epoch": 365, "lr": 3.3698318634218215e-05} +{"train_loss": 0.0018265366088598967, "global_step": 43445, "epoch": 365, "lr": 3.3696224200088925e-05} +{"train_loss": 0.0021836678497493267, "global_step": 43446, "epoch": 365, "lr": 3.369412979797037e-05} +{"train_loss": 0.0011248609516769648, "global_step": 43447, "epoch": 365, "lr": 3.369203542786663e-05} +{"train_loss": 0.0020973056089133024, "global_step": 43448, "epoch": 365, "lr": 3.3689941089781857e-05} +{"train_loss": 0.0011815138859674335, "global_step": 43449, "epoch": 365, "lr": 3.3687846783720133e-05} +{"train_loss": 0.001722949557006359, "global_step": 43450, "epoch": 365, "lr": 3.368575250968557e-05} +{"train_loss": 0.0012724206317216158, "global_step": 43451, "epoch": 365, "lr": 3.36836582676823e-05} +{"train_loss": 0.0014671931276097894, "global_step": 43452, "epoch": 365, "lr": 3.368156405771441e-05} +{"train_loss": 0.001015999703668058, "global_step": 43453, "epoch": 365, "lr": 3.3679469879786055e-05} +{"train_loss": 0.002376193180680275, "global_step": 43454, "epoch": 365, "lr": 3.3677375733901284e-05} +{"train_loss": 0.0013740924187004566, "global_step": 43455, "epoch": 365, "lr": 3.367528162006426e-05} +{"train_loss": 0.0006912873941473663, "global_step": 43456, "epoch": 365, "lr": 3.367318753827909e-05} +{"train_loss": 0.0032557835802435875, "global_step": 43457, "epoch": 365, "lr": 3.3671093488549845e-05} +{"train_loss": 0.0024556382559239864, "global_step": 43458, "epoch": 365, "lr": 3.366899947088068e-05} +{"train_loss": 0.0020469208247959614, "global_step": 43459, "epoch": 365, "lr": 3.3666905485275673e-05} +{"train_loss": 0.0011693257838487625, "global_step": 43460, "epoch": 365, "lr": 3.366481153173897e-05} +{"train_loss": 0.001463560969568789, "global_step": 43461, "epoch": 365, "lr": 3.3662717610274654e-05} +{"train_loss": 0.0014740831684321165, "global_step": 43462, "epoch": 365, "lr": 3.3660623720886855e-05} +{"train_loss": 0.001958801643922925, "global_step": 43463, "epoch": 365, "lr": 3.365852986357968e-05} +{"train_loss": 0.000839959888253361, "global_step": 43464, "epoch": 365, "lr": 3.365643603835722e-05} +{"train_loss": 0.0014387016417458653, "global_step": 43465, "epoch": 365, "lr": 3.3654342245223616e-05} +{"train_loss": 0.0011802217923104763, "global_step": 43466, "epoch": 365, "lr": 3.3652248484182946e-05} +{"train_loss": 0.0012730289017781615, "global_step": 43467, "epoch": 365, "lr": 3.365015475523935e-05} +{"train_loss": 0.001554962364025414, "global_step": 43468, "epoch": 365, "lr": 3.364806105839694e-05} +{"train_loss": 0.002023938577622175, "global_step": 43469, "epoch": 365, "lr": 3.3645967393659795e-05} +{"train_loss": 0.0011125874007120728, "global_step": 43470, "epoch": 365, "lr": 3.3643873761032063e-05} +{"train_loss": 0.0006818841793574393, "global_step": 43471, "epoch": 365, "lr": 3.364178016051782e-05} +{"train_loss": 0.0013115109177306294, "global_step": 43472, "epoch": 365, "lr": 3.363968659212121e-05} +{"train_loss": 0.0016445355722680688, "global_step": 43473, "epoch": 365, "lr": 3.3637593055846304e-05} +{"train_loss": 0.0010575641645118594, "global_step": 43474, "epoch": 365, "lr": 3.363549955169727e-05} +{"train_loss": 0.0012804213911294937, "global_step": 43475, "epoch": 365, "lr": 3.363340607967818e-05} +{"train_loss": 0.002303287386894226, "global_step": 43476, "epoch": 365, "lr": 3.363131263979312e-05} +{"train_loss": 0.0015806311275810003, "global_step": 43477, "epoch": 365, "lr": 3.362921923204625e-05} +{"train_loss": 0.0010033496655523777, "global_step": 43478, "epoch": 365, "lr": 3.3627125856441644e-05} +{"train_loss": 0.0008722214261069894, "global_step": 43479, "epoch": 365, "lr": 3.362503251298345e-05} +{"train_loss": 0.0017466029385104775, "global_step": 43480, "epoch": 365, "lr": 3.362293920167573e-05} +{"train_loss": 0.0013983823591843247, "global_step": 43481, "epoch": 365, "lr": 3.362084592252264e-05} +{"train_loss": 0.001430520904250443, "global_step": 43482, "epoch": 365, "lr": 3.361875267552826e-05} +{"train_loss": 0.0016665155999362469, "global_step": 43483, "epoch": 365, "lr": 3.361665946069671e-05} +{"train_loss": 0.0009222620283253491, "global_step": 43484, "epoch": 365, "lr": 3.36145662780321e-05} +{"train_loss": 0.0010713927913457155, "global_step": 43485, "epoch": 365, "lr": 3.3612473127538533e-05} +{"train_loss": 0.0012667845003306866, "global_step": 43486, "epoch": 365, "lr": 3.3610380009220134e-05} +{"train_loss": 0.003202820895239711, "global_step": 43487, "epoch": 365, "lr": 3.3608286923081005e-05} +{"train_loss": 0.0014319171896204352, "global_step": 43488, "epoch": 365, "lr": 3.360619386912524e-05} +{"train_loss": 0.001600908930413425, "global_step": 43489, "epoch": 365, "lr": 3.3604100847356974e-05} +{"train_loss": 0.0019945513922721148, "global_step": 43490, "epoch": 365, "lr": 3.3602007857780285e-05} +{"train_loss": 0.0024128113873302937, "global_step": 43491, "epoch": 365, "lr": 3.3599914900399325e-05} +{"train_loss": 0.0008488465682603419, "global_step": 43492, "epoch": 365, "lr": 3.359782197521816e-05} +{"train_loss": 0.002472855616360903, "global_step": 43493, "epoch": 365, "lr": 3.359572908224094e-05} +{"train_loss": 0.001879075076431036, "global_step": 43494, "epoch": 365, "lr": 3.3593636221471755e-05} +{"train_loss": 0.0018358936067670584, "global_step": 43495, "epoch": 365, "lr": 3.359154339291468e-05} +{"train_loss": 0.0013341823359951377, "global_step": 43496, "epoch": 365, "lr": 3.358945059657389e-05} +{"train_loss": 0.0011353055015206337, "global_step": 43497, "epoch": 365, "lr": 3.3587357832453435e-05} +{"train_loss": 0.0011127771576866508, "global_step": 43498, "epoch": 365, "lr": 3.358526510055747e-05} +{"train_loss": 0.0020180544815957546, "global_step": 43499, "epoch": 365, "lr": 3.358317240089008e-05} +{"train_loss": 0.0015241679502651095, "global_step": 43500, "epoch": 365, "lr": 3.358107973345537e-05} +{"train_loss": 0.002004709793254733, "global_step": 43501, "epoch": 365, "lr": 3.357898709825746e-05} +{"train_loss": 0.0014024745905771852, "global_step": 43502, "epoch": 365, "lr": 3.357689449530044e-05} +{"train_loss": 0.001026091747917235, "global_step": 43503, "epoch": 365, "lr": 3.357480192458845e-05} +{"train_loss": 0.0012661907821893692, "global_step": 43504, "epoch": 365, "lr": 3.357270938612557e-05} +{"train_loss": 0.000898872094694525, "global_step": 43505, "epoch": 365, "lr": 3.357061687991594e-05} +{"train_loss": 0.0013968374114483595, "global_step": 43506, "epoch": 365, "lr": 3.356852440596364e-05} +{"train_loss": 0.0017813903978094459, "global_step": 43507, "epoch": 365, "lr": 3.356643196427277e-05} +{"train_loss": 0.0008541653514839709, "global_step": 43508, "epoch": 365, "lr": 3.356433955484748e-05} +{"train_loss": 0.0015275763580575585, "global_step": 43509, "epoch": 365, "lr": 3.356224717769183e-05} +{"train_loss": 0.0025515658780932426, "global_step": 43510, "epoch": 365, "lr": 3.3560154832809975e-05} +{"train_loss": 0.0019186956342309713, "global_step": 43511, "epoch": 365, "lr": 3.355806252020598e-05} +{"train_loss": 0.0014289036625996232, "global_step": 43512, "epoch": 365, "lr": 3.355597023988398e-05} +{"train_loss": 0.0015795205254107714, "global_step": 43513, "epoch": 365, "lr": 3.355387799184809e-05} +{"train_loss": 0.0010711068753153086, "global_step": 43514, "epoch": 365, "lr": 3.355178577610238e-05} +{"train_loss": 0.0016262648859992623, "global_step": 43515, "epoch": 365, "lr": 3.3549693592650985e-05} +{"train_loss": 0.0010239852126687765, "global_step": 43516, "epoch": 365, "lr": 3.354760144149802e-05} +{"train_loss": 0.0013057258911430836, "global_step": 43517, "epoch": 365, "lr": 3.354550932264757e-05} +{"train_loss": 0.0018161964835599065, "global_step": 43518, "epoch": 365, "lr": 3.354341723610378e-05} +{"train_loss": 0.002491090213879943, "global_step": 43519, "epoch": 365, "lr": 3.35413251818707e-05} +{"train_loss": 0.0013910775305703282, "global_step": 43520, "epoch": 365, "lr": 3.3539233159952485e-05} +{"train_loss": 0.0010232829954475164, "global_step": 43521, "epoch": 365, "lr": 3.353714117035322e-05} +{"train_loss": 0.0016668441239744425, "global_step": 43522, "epoch": 365, "lr": 3.353504921307704e-05} +{"train_loss": 0.0025156529154628515, "global_step": 43523, "epoch": 365, "lr": 3.3532957288127996e-05} +{"train_loss": 0.002499196445569396, "global_step": 43524, "epoch": 365, "lr": 3.353086539551027e-05} +{"train_loss": 0.0008048022864386439, "global_step": 43525, "epoch": 365, "lr": 3.352877353522792e-05} +{"train_loss": 0.001235518604516983, "global_step": 43526, "epoch": 365, "lr": 3.352668170728505e-05} +{"train_loss": 0.0024688902776688337, "global_step": 43527, "epoch": 365, "lr": 3.352458991168579e-05} +{"train_loss": 0.001035613240674138, "global_step": 43528, "epoch": 365, "lr": 3.352249814843422e-05} +{"train_loss": 0.0008086239104159176, "global_step": 43529, "epoch": 365, "lr": 3.352040641753449e-05} +{"train_loss": 0.0023107314482331276, "global_step": 43530, "epoch": 365, "lr": 3.3518314718990655e-05} +{"train_loss": 0.0007299022981896996, "global_step": 43531, "epoch": 365, "lr": 3.351622305280687e-05} +{"train_loss": 0.0009510329691693187, "global_step": 43532, "epoch": 365, "lr": 3.3514131418987215e-05} +{"train_loss": 0.0021713366732001305, "global_step": 43533, "epoch": 365, "lr": 3.35120398175358e-05} +{"train_loss": 0.0010849176906049252, "global_step": 43534, "epoch": 365, "lr": 3.350994824845673e-05} +{"train_loss": 0.000713232671841979, "global_step": 43535, "epoch": 365, "lr": 3.350785671175412e-05} +{"train_loss": 0.0011652667308226228, "global_step": 43536, "epoch": 365, "lr": 3.350576520743207e-05} +{"train_loss": 0.0012066502822563052, "global_step": 43537, "epoch": 365, "lr": 3.35036737354947e-05} +{"train_loss": 0.001956089399755001, "global_step": 43538, "epoch": 365, "lr": 3.350158229594608e-05} +{"train_loss": 0.0025183474645018578, "global_step": 43539, "epoch": 365, "lr": 3.3499490888790356e-05} +{"train_loss": 0.0011540264822542667, "global_step": 43540, "epoch": 365, "lr": 3.34973995140316e-05} +{"train_loss": 0.0013888721587136388, "global_step": 43541, "epoch": 365, "lr": 3.349530817167397e-05} +{"train_loss": 0.0008468057494610548, "global_step": 43542, "epoch": 365, "lr": 3.349321686172151e-05} +{"train_loss": 0.0014691990800201893, "global_step": 43543, "epoch": 365, "lr": 3.349112558417837e-05} +{"train_loss": 0.0010632728226482868, "global_step": 43544, "epoch": 365, "lr": 3.348903433904865e-05} +{"train_loss": 0.001996782375499606, "global_step": 43545, "epoch": 365, "lr": 3.3486943126336425e-05} +{"train_loss": 0.0012117390288040042, "global_step": 43546, "epoch": 365, "lr": 3.348485194604584e-05} +{"train_loss": 0.00121632544323802, "global_step": 43547, "epoch": 365, "lr": 3.348276079818097e-05} +{"train_loss": 0.0014721073675900698, "global_step": 43548, "epoch": 365, "lr": 3.348066968274595e-05} +{"train_loss": 0.001177979982458055, "global_step": 43549, "epoch": 365, "lr": 3.3478578599744844e-05} +{"train_loss": 0.00175119424238801, "global_step": 43550, "epoch": 365, "lr": 3.34764875491818e-05} +{"train_loss": 0.0013684838777408004, "global_step": 43551, "epoch": 365, "lr": 3.347439653106092e-05} +{"train_loss": 0.0013399046147242188, "global_step": 43552, "epoch": 365, "lr": 3.3472305545386275e-05} +{"train_loss": 0.0015120862722944688, "global_step": 43553, "epoch": 365, "lr": 3.3470214592162016e-05, "val_loss": 0.02478908561170101, "train_action_mse_error": 1.8579279640107416e-05} +{"train_loss": 0.0009890594519674778, "global_step": 43554, "epoch": 366, "lr": 3.346812367139219e-05} +{"train_loss": 0.0018143545603379607, "global_step": 43555, "epoch": 366, "lr": 3.346603278308097e-05} +{"train_loss": 0.0017788687255233526, "global_step": 43556, "epoch": 366, "lr": 3.3463941927232434e-05} +{"train_loss": 0.0014008936705067754, "global_step": 43557, "epoch": 366, "lr": 3.346185110385065e-05} +{"train_loss": 0.002208651974797249, "global_step": 43558, "epoch": 366, "lr": 3.345976031293978e-05} +{"train_loss": 0.0010286957258358598, "global_step": 43559, "epoch": 366, "lr": 3.3457669554503876e-05} +{"train_loss": 0.000936900032684207, "global_step": 43560, "epoch": 366, "lr": 3.3455578828547095e-05} +{"train_loss": 0.0012971317628398538, "global_step": 43561, "epoch": 366, "lr": 3.34534881350735e-05} +{"train_loss": 0.0015899497084319592, "global_step": 43562, "epoch": 366, "lr": 3.345139747408723e-05} +{"train_loss": 0.0016282614087685943, "global_step": 43563, "epoch": 366, "lr": 3.344930684559236e-05} +{"train_loss": 0.001306335092522204, "global_step": 43564, "epoch": 366, "lr": 3.344721624959302e-05} +{"train_loss": 0.0008370261057280004, "global_step": 43565, "epoch": 366, "lr": 3.34451256860933e-05} +{"train_loss": 0.0012112711556255817, "global_step": 43566, "epoch": 366, "lr": 3.34430351550973e-05} +{"train_loss": 0.0008357262122444808, "global_step": 43567, "epoch": 366, "lr": 3.344094465660913e-05} +{"train_loss": 0.001303863013163209, "global_step": 43568, "epoch": 366, "lr": 3.343885419063291e-05} +{"train_loss": 0.001496202778071165, "global_step": 43569, "epoch": 366, "lr": 3.343676375717271e-05} +{"train_loss": 0.0013756257249042392, "global_step": 43570, "epoch": 366, "lr": 3.343467335623268e-05} +{"train_loss": 0.001683920039795339, "global_step": 43571, "epoch": 366, "lr": 3.343258298781688e-05} +{"train_loss": 0.0015985878417268395, "global_step": 43572, "epoch": 366, "lr": 3.343049265192944e-05} +{"train_loss": 0.0006776911905035377, "global_step": 43573, "epoch": 366, "lr": 3.3428402348574446e-05} +{"train_loss": 0.0016698010731488466, "global_step": 43574, "epoch": 366, "lr": 3.3426312077756034e-05} +{"train_loss": 0.0014977671671658754, "global_step": 43575, "epoch": 366, "lr": 3.342422183947829e-05} +{"train_loss": 0.0016365317860618234, "global_step": 43576, "epoch": 366, "lr": 3.342213163374529e-05} +{"train_loss": 0.0006747839506715536, "global_step": 43577, "epoch": 366, "lr": 3.342004146056118e-05} +{"train_loss": 0.0011432914761826396, "global_step": 43578, "epoch": 366, "lr": 3.341795131993003e-05} +{"train_loss": 0.0021452733781188726, "global_step": 43579, "epoch": 366, "lr": 3.341586121185599e-05} +{"train_loss": 0.0016500174533575773, "global_step": 43580, "epoch": 366, "lr": 3.341377113634311e-05} +{"train_loss": 0.001798695302568376, "global_step": 43581, "epoch": 366, "lr": 3.341168109339554e-05} +{"train_loss": 0.0010444056242704391, "global_step": 43582, "epoch": 366, "lr": 3.340959108301734e-05} +{"train_loss": 0.0009693081956356764, "global_step": 43583, "epoch": 366, "lr": 3.340750110521264e-05} +{"train_loss": 0.0024306976702064276, "global_step": 43584, "epoch": 366, "lr": 3.340541115998555e-05} +{"train_loss": 0.0018203118816018105, "global_step": 43585, "epoch": 366, "lr": 3.340332124734015e-05} +{"train_loss": 0.0016991740558296442, "global_step": 43586, "epoch": 366, "lr": 3.3401231367280567e-05} +{"train_loss": 0.0012870976934209466, "global_step": 43587, "epoch": 366, "lr": 3.3399141519810895e-05} +{"train_loss": 0.0006878769490867853, "global_step": 43588, "epoch": 366, "lr": 3.339705170493522e-05} +{"train_loss": 0.0013252057833597064, "global_step": 43589, "epoch": 366, "lr": 3.3394961922657676e-05} +{"train_loss": 0.0018414672231301665, "global_step": 43590, "epoch": 366, "lr": 3.3392872172982336e-05} +{"train_loss": 0.0013146622804924846, "global_step": 43591, "epoch": 366, "lr": 3.3390782455913325e-05} +{"train_loss": 0.0008172732195816934, "global_step": 43592, "epoch": 366, "lr": 3.338869277145473e-05} +{"train_loss": 0.0006593209109269083, "global_step": 43593, "epoch": 366, "lr": 3.338660311961068e-05} +{"train_loss": 0.0013179992092773318, "global_step": 43594, "epoch": 366, "lr": 3.338451350038526e-05} +{"train_loss": 0.0012406541500240564, "global_step": 43595, "epoch": 366, "lr": 3.338242391378255e-05} +{"train_loss": 0.0014172247610986233, "global_step": 43596, "epoch": 366, "lr": 3.3380334359806697e-05} +{"train_loss": 0.0006509084487333894, "global_step": 43597, "epoch": 366, "lr": 3.337824483846176e-05} +{"train_loss": 0.002663093851879239, "global_step": 43598, "epoch": 366, "lr": 3.337615534975187e-05} +{"train_loss": 0.0010435061994940042, "global_step": 43599, "epoch": 366, "lr": 3.3374065893681126e-05} +{"train_loss": 0.0023534162901341915, "global_step": 43600, "epoch": 366, "lr": 3.337197647025364e-05} +{"train_loss": 0.002104409970343113, "global_step": 43601, "epoch": 366, "lr": 3.3369887079473495e-05} +{"train_loss": 0.0016775047406554222, "global_step": 43602, "epoch": 366, "lr": 3.3367797721344785e-05} +{"train_loss": 0.0017422527307644486, "global_step": 43603, "epoch": 366, "lr": 3.336570839587165e-05} +{"train_loss": 0.0007448214455507696, "global_step": 43604, "epoch": 366, "lr": 3.3363619103058145e-05} +{"train_loss": 0.0012814573710784316, "global_step": 43605, "epoch": 366, "lr": 3.336152984290842e-05} +{"train_loss": 0.00202784757129848, "global_step": 43606, "epoch": 366, "lr": 3.3359440615426554e-05} +{"train_loss": 0.0014835753245279193, "global_step": 43607, "epoch": 366, "lr": 3.3357351420616625e-05} +{"train_loss": 0.0013909093104302883, "global_step": 43608, "epoch": 366, "lr": 3.335526225848278e-05} +{"train_loss": 0.0012509631924331188, "global_step": 43609, "epoch": 366, "lr": 3.335317312902908e-05} +{"train_loss": 0.002580284606665373, "global_step": 43610, "epoch": 366, "lr": 3.335108403225967e-05} +{"train_loss": 0.0017228997312486172, "global_step": 43611, "epoch": 366, "lr": 3.334899496817861e-05} +{"train_loss": 0.001329520484432578, "global_step": 43612, "epoch": 366, "lr": 3.334690593679003e-05} +{"train_loss": 0.0010887287789955735, "global_step": 43613, "epoch": 366, "lr": 3.334481693809801e-05} +{"train_loss": 0.001885632169432938, "global_step": 43614, "epoch": 366, "lr": 3.334272797210667e-05} +{"train_loss": 0.0018572499975562096, "global_step": 43615, "epoch": 366, "lr": 3.33406390388201e-05} +{"train_loss": 0.0013656433438882232, "global_step": 43616, "epoch": 366, "lr": 3.333855013824241e-05} +{"train_loss": 0.001526320120319724, "global_step": 43617, "epoch": 366, "lr": 3.333646127037769e-05} +{"train_loss": 0.0027926794718950987, "global_step": 43618, "epoch": 366, "lr": 3.333437243523006e-05} +{"train_loss": 0.001521468861028552, "global_step": 43619, "epoch": 366, "lr": 3.333228363280359e-05} +{"train_loss": 0.0010527314152568579, "global_step": 43620, "epoch": 366, "lr": 3.333019486310242e-05} +{"train_loss": 0.0010638273088261485, "global_step": 43621, "epoch": 366, "lr": 3.332810612613061e-05} +{"train_loss": 0.0013399978633970022, "global_step": 43622, "epoch": 366, "lr": 3.332601742189231e-05} +{"train_loss": 0.0013912274735048413, "global_step": 43623, "epoch": 366, "lr": 3.332392875039156e-05} +{"train_loss": 0.0020867399871349335, "global_step": 43624, "epoch": 366, "lr": 3.332184011163253e-05} +{"train_loss": 0.001110666198655963, "global_step": 43625, "epoch": 366, "lr": 3.331975150561928e-05} +{"train_loss": 0.0012961230240762234, "global_step": 43626, "epoch": 366, "lr": 3.3317662932355895e-05} +{"train_loss": 0.000811113859526813, "global_step": 43627, "epoch": 366, "lr": 3.3315574391846514e-05} +{"train_loss": 0.001461754902265966, "global_step": 43628, "epoch": 366, "lr": 3.33134858840952e-05} +{"train_loss": 0.0008650930831208825, "global_step": 43629, "epoch": 366, "lr": 3.331139740910609e-05} +{"train_loss": 0.0020927470177412033, "global_step": 43630, "epoch": 366, "lr": 3.3309308966883256e-05} +{"train_loss": 0.0013972135493531823, "global_step": 43631, "epoch": 366, "lr": 3.330722055743083e-05} +{"train_loss": 0.0019158789655193686, "global_step": 43632, "epoch": 366, "lr": 3.330513218075288e-05} +{"train_loss": 0.0015917153796181083, "global_step": 43633, "epoch": 366, "lr": 3.3303043836853516e-05} +{"train_loss": 0.0015660843346267939, "global_step": 43634, "epoch": 366, "lr": 3.330095552573685e-05} +{"train_loss": 0.0007763964822515845, "global_step": 43635, "epoch": 366, "lr": 3.3298867247406964e-05} +{"train_loss": 0.001933201914653182, "global_step": 43636, "epoch": 366, "lr": 3.3296779001867984e-05} +{"train_loss": 0.0008895021164789796, "global_step": 43637, "epoch": 366, "lr": 3.329469078912399e-05} +{"train_loss": 0.0012516239657998085, "global_step": 43638, "epoch": 366, "lr": 3.329260260917908e-05} +{"train_loss": 0.0004412749840412289, "global_step": 43639, "epoch": 366, "lr": 3.329051446203737e-05} +{"train_loss": 0.0018230078276246786, "global_step": 43640, "epoch": 366, "lr": 3.328842634770293e-05} +{"train_loss": 0.0025127434637397528, "global_step": 43641, "epoch": 366, "lr": 3.32863382661799e-05} +{"train_loss": 0.002645649714395404, "global_step": 43642, "epoch": 366, "lr": 3.3284250217472334e-05} +{"train_loss": 0.0016547527629882097, "global_step": 43643, "epoch": 366, "lr": 3.3282162201584376e-05} +{"train_loss": 0.0017473381012678146, "global_step": 43644, "epoch": 366, "lr": 3.328007421852012e-05} +{"train_loss": 0.0008496836526319385, "global_step": 43645, "epoch": 366, "lr": 3.327798626828362e-05} +{"train_loss": 0.0015100912423804402, "global_step": 43646, "epoch": 366, "lr": 3.327589835087903e-05} +{"train_loss": 0.0007857767050154507, "global_step": 43647, "epoch": 366, "lr": 3.327381046631041e-05} +{"train_loss": 0.0011822076048702002, "global_step": 43648, "epoch": 366, "lr": 3.327172261458189e-05} +{"train_loss": 0.0009654127643443644, "global_step": 43649, "epoch": 366, "lr": 3.3269634795697544e-05} +{"train_loss": 0.00257316417992115, "global_step": 43650, "epoch": 366, "lr": 3.326754700966149e-05} +{"train_loss": 0.0012996327131986618, "global_step": 43651, "epoch": 366, "lr": 3.3265459256477826e-05} +{"train_loss": 0.0009720245143398643, "global_step": 43652, "epoch": 366, "lr": 3.326337153615063e-05} +{"train_loss": 0.0015591400442644954, "global_step": 43653, "epoch": 366, "lr": 3.326128384868403e-05} +{"train_loss": 0.0011921832337975502, "global_step": 43654, "epoch": 366, "lr": 3.32591961940821e-05} +{"train_loss": 0.0010161716490983963, "global_step": 43655, "epoch": 366, "lr": 3.3257108572348964e-05} +{"train_loss": 0.0016842384357005358, "global_step": 43656, "epoch": 366, "lr": 3.32550209834887e-05} +{"train_loss": 0.0012930461671203375, "global_step": 43657, "epoch": 366, "lr": 3.325293342750541e-05} +{"train_loss": 0.002097326796501875, "global_step": 43658, "epoch": 366, "lr": 3.32508459044032e-05} +{"train_loss": 0.0015214562881737947, "global_step": 43659, "epoch": 366, "lr": 3.3248758414186146e-05} +{"train_loss": 0.003163582645356655, "global_step": 43660, "epoch": 366, "lr": 3.324667095685839e-05} +{"train_loss": 0.001387717784382403, "global_step": 43661, "epoch": 366, "lr": 3.324458353242399e-05} +{"train_loss": 0.0018843567231670022, "global_step": 43662, "epoch": 366, "lr": 3.324249614088707e-05} +{"train_loss": 0.0017486193682998419, "global_step": 43663, "epoch": 366, "lr": 3.324040878225172e-05} +{"train_loss": 0.0019374499097466469, "global_step": 43664, "epoch": 366, "lr": 3.3238321456522035e-05} +{"train_loss": 0.0016613821499049664, "global_step": 43665, "epoch": 366, "lr": 3.3236234163702105e-05} +{"train_loss": 0.0010727386688813567, "global_step": 43666, "epoch": 366, "lr": 3.323414690379605e-05} +{"train_loss": 0.0025184459518641233, "global_step": 43667, "epoch": 366, "lr": 3.3232059676807945e-05} +{"train_loss": 0.0022789982613176107, "global_step": 43668, "epoch": 366, "lr": 3.3229972482741914e-05} +{"train_loss": 0.0013445441145449877, "global_step": 43669, "epoch": 366, "lr": 3.3227885321602025e-05} +{"train_loss": 0.0016819012816995382, "global_step": 43670, "epoch": 366, "lr": 3.322579819339241e-05} +{"train_loss": 0.0008305651717819273, "global_step": 43671, "epoch": 366, "lr": 3.322371109811713e-05} +{"train_loss": 0.001494054843235307, "global_step": 43672, "epoch": 366, "lr": 3.322162403578031e-05, "val_loss": 0.034402769058942795} +{"train_loss": 0.0015365715371444821, "global_step": 43673, "epoch": 367, "lr": 3.321953700638602e-05} +{"train_loss": 0.0023262351751327515, "global_step": 43674, "epoch": 367, "lr": 3.321745000993841e-05} +{"train_loss": 0.0009663683013059199, "global_step": 43675, "epoch": 367, "lr": 3.321536304644154e-05} +{"train_loss": 0.0013395290588960052, "global_step": 43676, "epoch": 367, "lr": 3.321327611589948e-05} +{"train_loss": 0.0009985656943172216, "global_step": 43677, "epoch": 367, "lr": 3.3211189218316394e-05} +{"train_loss": 0.0015599575126543641, "global_step": 43678, "epoch": 367, "lr": 3.320910235369631e-05} +{"train_loss": 0.0016576297348365188, "global_step": 43679, "epoch": 367, "lr": 3.32070155220434e-05} +{"train_loss": 0.001857352559454739, "global_step": 43680, "epoch": 367, "lr": 3.320492872336168e-05} +{"train_loss": 0.0018654465675354004, "global_step": 43681, "epoch": 367, "lr": 3.320284195765532e-05} +{"train_loss": 0.001401954097673297, "global_step": 43682, "epoch": 367, "lr": 3.320075522492837e-05} +{"train_loss": 0.0018957552965730429, "global_step": 43683, "epoch": 367, "lr": 3.319866852518493e-05} +{"train_loss": 0.002088929293677211, "global_step": 43684, "epoch": 367, "lr": 3.319658185842913e-05} +{"train_loss": 0.0017368282424286008, "global_step": 43685, "epoch": 367, "lr": 3.3194495224665035e-05} +{"train_loss": 0.0015895479591563344, "global_step": 43686, "epoch": 367, "lr": 3.319240862389677e-05} +{"train_loss": 0.0015688531566411257, "global_step": 43687, "epoch": 367, "lr": 3.319032205612841e-05} +{"train_loss": 0.0012069515651091933, "global_step": 43688, "epoch": 367, "lr": 3.318823552136404e-05} +{"train_loss": 0.002033816184848547, "global_step": 43689, "epoch": 367, "lr": 3.3186149019607794e-05} +{"train_loss": 0.0013061597710475326, "global_step": 43690, "epoch": 367, "lr": 3.3184062550863726e-05} +{"train_loss": 0.002225377829745412, "global_step": 43691, "epoch": 367, "lr": 3.318197611513597e-05} +{"train_loss": 0.00195971573702991, "global_step": 43692, "epoch": 367, "lr": 3.31798897124286e-05} +{"train_loss": 0.0012954920530319214, "global_step": 43693, "epoch": 367, "lr": 3.317780334274573e-05} +{"train_loss": 0.0006603990332223475, "global_step": 43694, "epoch": 367, "lr": 3.317571700609144e-05} +{"train_loss": 0.0018608293030411005, "global_step": 43695, "epoch": 367, "lr": 3.3173630702469826e-05} +{"train_loss": 0.0013037018943578005, "global_step": 43696, "epoch": 367, "lr": 3.3171544431884996e-05} +{"train_loss": 0.0013816476566717029, "global_step": 43697, "epoch": 367, "lr": 3.3169458194341044e-05} +{"train_loss": 0.0014083505375310779, "global_step": 43698, "epoch": 367, "lr": 3.3167371989842056e-05} +{"train_loss": 0.0014167081099003553, "global_step": 43699, "epoch": 367, "lr": 3.316528581839213e-05} +{"train_loss": 0.0012102064210921526, "global_step": 43700, "epoch": 367, "lr": 3.3163199679995385e-05} +{"train_loss": 0.0014451075112447143, "global_step": 43701, "epoch": 367, "lr": 3.3161113574655895e-05} +{"train_loss": 0.0006746432627551258, "global_step": 43702, "epoch": 367, "lr": 3.315902750237774e-05} +{"train_loss": 0.0014434584882110357, "global_step": 43703, "epoch": 367, "lr": 3.3156941463165056e-05} +{"train_loss": 0.0017456987407058477, "global_step": 43704, "epoch": 367, "lr": 3.3154855457021906e-05} +{"train_loss": 0.001843546750023961, "global_step": 43705, "epoch": 367, "lr": 3.3152769483952404e-05} +{"train_loss": 0.0021497057750821114, "global_step": 43706, "epoch": 367, "lr": 3.315068354396065e-05} +{"train_loss": 0.002399877645075321, "global_step": 43707, "epoch": 367, "lr": 3.31485976370507e-05} +{"train_loss": 0.0013501897919923067, "global_step": 43708, "epoch": 367, "lr": 3.31465117632267e-05} +{"train_loss": 0.0024178598541766405, "global_step": 43709, "epoch": 367, "lr": 3.3144425922492716e-05} +{"train_loss": 0.0010128214489668608, "global_step": 43710, "epoch": 367, "lr": 3.314234011485287e-05} +{"train_loss": 0.00137313490267843, "global_step": 43711, "epoch": 367, "lr": 3.314025434031121e-05} +{"train_loss": 0.0016500756610184908, "global_step": 43712, "epoch": 367, "lr": 3.313816859887187e-05} +{"train_loss": 0.0021108908113092184, "global_step": 43713, "epoch": 367, "lr": 3.313608289053893e-05} +{"train_loss": 0.000850148790050298, "global_step": 43714, "epoch": 367, "lr": 3.3133997215316504e-05} +{"train_loss": 0.0010980636579915881, "global_step": 43715, "epoch": 367, "lr": 3.313191157320866e-05} +{"train_loss": 0.0014496525982394814, "global_step": 43716, "epoch": 367, "lr": 3.3129825964219506e-05} +{"train_loss": 0.0023244176991283894, "global_step": 43717, "epoch": 367, "lr": 3.3127740388353135e-05} +{"train_loss": 0.0009937024442479014, "global_step": 43718, "epoch": 367, "lr": 3.312565484561364e-05} +{"train_loss": 0.0015159707982093096, "global_step": 43719, "epoch": 367, "lr": 3.3123569336005134e-05} +{"train_loss": 0.0015091397799551487, "global_step": 43720, "epoch": 367, "lr": 3.3121483859531696e-05} +{"train_loss": 0.0025602399837225676, "global_step": 43721, "epoch": 367, "lr": 3.3119398416197406e-05} +{"train_loss": 0.0012443240266293287, "global_step": 43722, "epoch": 367, "lr": 3.311731300600639e-05} +{"train_loss": 0.0007704480667598546, "global_step": 43723, "epoch": 367, "lr": 3.311522762896271e-05} +{"train_loss": 0.0009435861138626933, "global_step": 43724, "epoch": 367, "lr": 3.31131422850705e-05} +{"train_loss": 0.0023466998245567083, "global_step": 43725, "epoch": 367, "lr": 3.311105697433382e-05} +{"train_loss": 0.002463448094204068, "global_step": 43726, "epoch": 367, "lr": 3.3108971696756765e-05} +{"train_loss": 0.000916000222787261, "global_step": 43727, "epoch": 367, "lr": 3.310688645234345e-05} +{"train_loss": 0.0010162235703319311, "global_step": 43728, "epoch": 367, "lr": 3.3104801241097945e-05} +{"train_loss": 0.0015758444787934422, "global_step": 43729, "epoch": 367, "lr": 3.3102716063024375e-05} +{"train_loss": 0.002208227990195155, "global_step": 43730, "epoch": 367, "lr": 3.3100630918126796e-05} +{"train_loss": 0.0007505019311793149, "global_step": 43731, "epoch": 367, "lr": 3.309854580640934e-05} +{"train_loss": 0.0021398195531219244, "global_step": 43732, "epoch": 367, "lr": 3.309646072787609e-05} +{"train_loss": 0.0010719636920839548, "global_step": 43733, "epoch": 367, "lr": 3.309437568253111e-05} +{"train_loss": 0.0018269580323249102, "global_step": 43734, "epoch": 367, "lr": 3.3092290670378535e-05} +{"train_loss": 0.0019565557595342398, "global_step": 43735, "epoch": 367, "lr": 3.309020569142243e-05} +{"train_loss": 0.0009516344871371984, "global_step": 43736, "epoch": 367, "lr": 3.3088120745666916e-05} +{"train_loss": 0.0016238264506682754, "global_step": 43737, "epoch": 367, "lr": 3.308603583311607e-05} +{"train_loss": 0.0033925704192370176, "global_step": 43738, "epoch": 367, "lr": 3.308395095377396e-05} +{"train_loss": 0.0014234822010621428, "global_step": 43739, "epoch": 367, "lr": 3.3081866107644734e-05} +{"train_loss": 0.001504356856457889, "global_step": 43740, "epoch": 367, "lr": 3.307978129473243e-05} +{"train_loss": 0.002627432579174638, "global_step": 43741, "epoch": 367, "lr": 3.307769651504119e-05} +{"train_loss": 0.001545366714708507, "global_step": 43742, "epoch": 367, "lr": 3.3075611768575066e-05} +{"train_loss": 0.0015751913888379931, "global_step": 43743, "epoch": 367, "lr": 3.307352705533819e-05} +{"train_loss": 0.001396941370330751, "global_step": 43744, "epoch": 367, "lr": 3.307144237533462e-05} +{"train_loss": 0.0012159566394984722, "global_step": 43745, "epoch": 367, "lr": 3.306935772856847e-05} +{"train_loss": 0.00128081813454628, "global_step": 43746, "epoch": 367, "lr": 3.3067273115043826e-05} +{"train_loss": 0.0018630814738571644, "global_step": 43747, "epoch": 367, "lr": 3.306518853476478e-05} +{"train_loss": 0.0008988064364530146, "global_step": 43748, "epoch": 367, "lr": 3.3063103987735433e-05} +{"train_loss": 0.002298134146258235, "global_step": 43749, "epoch": 367, "lr": 3.306101947395987e-05} +{"train_loss": 0.0017835975158959627, "global_step": 43750, "epoch": 367, "lr": 3.305893499344218e-05} +{"train_loss": 0.00133515743073076, "global_step": 43751, "epoch": 367, "lr": 3.305685054618648e-05} +{"train_loss": 0.0016250343760475516, "global_step": 43752, "epoch": 367, "lr": 3.305476613219682e-05} +{"train_loss": 0.002017296152189374, "global_step": 43753, "epoch": 367, "lr": 3.3052681751477335e-05} +{"train_loss": 0.0013571848394349217, "global_step": 43754, "epoch": 367, "lr": 3.3050597404032077e-05} +{"train_loss": 0.0018242055084556341, "global_step": 43755, "epoch": 367, "lr": 3.3048513089865184e-05} +{"train_loss": 0.00115114264190197, "global_step": 43756, "epoch": 367, "lr": 3.304642880898072e-05} +{"train_loss": 0.002328521804884076, "global_step": 43757, "epoch": 367, "lr": 3.3044344561382766e-05} +{"train_loss": 0.0006996740703471005, "global_step": 43758, "epoch": 367, "lr": 3.304226034707545e-05} +{"train_loss": 0.0021587421651929617, "global_step": 43759, "epoch": 367, "lr": 3.3040176166062825e-05} +{"train_loss": 0.0016075341263785958, "global_step": 43760, "epoch": 367, "lr": 3.303809201834902e-05} +{"train_loss": 0.001243110978975892, "global_step": 43761, "epoch": 367, "lr": 3.303600790393809e-05} +{"train_loss": 0.001895736437290907, "global_step": 43762, "epoch": 367, "lr": 3.303392382283417e-05} +{"train_loss": 0.0011100460542365909, "global_step": 43763, "epoch": 367, "lr": 3.3031839775041304e-05} +{"train_loss": 0.002002303721383214, "global_step": 43764, "epoch": 367, "lr": 3.302975576056362e-05} +{"train_loss": 0.0012795100919902325, "global_step": 43765, "epoch": 367, "lr": 3.30276717794052e-05} +{"train_loss": 0.0017257496947422624, "global_step": 43766, "epoch": 367, "lr": 3.302558783157011e-05} +{"train_loss": 0.0016734772361814976, "global_step": 43767, "epoch": 367, "lr": 3.3023503917062495e-05} +{"train_loss": 0.0011049103923141956, "global_step": 43768, "epoch": 367, "lr": 3.30214200358864e-05} +{"train_loss": 0.001963704591616988, "global_step": 43769, "epoch": 367, "lr": 3.3019336188045945e-05} +{"train_loss": 0.0013023152714595199, "global_step": 43770, "epoch": 367, "lr": 3.301725237354522e-05} +{"train_loss": 0.0016217035008594394, "global_step": 43771, "epoch": 367, "lr": 3.301516859238827e-05} +{"train_loss": 0.0010216040536761284, "global_step": 43772, "epoch": 367, "lr": 3.301308484457924e-05} +{"train_loss": 0.0011653748806566, "global_step": 43773, "epoch": 367, "lr": 3.30110011301222e-05} +{"train_loss": 0.003008688800036907, "global_step": 43774, "epoch": 367, "lr": 3.300891744902126e-05} +{"train_loss": 0.001233094371855259, "global_step": 43775, "epoch": 367, "lr": 3.300683380128049e-05} +{"train_loss": 0.0015098036965355277, "global_step": 43776, "epoch": 367, "lr": 3.300475018690397e-05} +{"train_loss": 0.0013412859989330173, "global_step": 43777, "epoch": 367, "lr": 3.300266660589583e-05} +{"train_loss": 0.0011421102099120617, "global_step": 43778, "epoch": 367, "lr": 3.30005830582601e-05} +{"train_loss": 0.0014418276259675622, "global_step": 43779, "epoch": 367, "lr": 3.299849954400094e-05} +{"train_loss": 0.0016983463428914547, "global_step": 43780, "epoch": 367, "lr": 3.2996416063122405e-05} +{"train_loss": 0.0011588353663682938, "global_step": 43781, "epoch": 367, "lr": 3.2994332615628585e-05} +{"train_loss": 0.002104391111060977, "global_step": 43782, "epoch": 367, "lr": 3.299224920152359e-05} +{"train_loss": 0.0007841769838705659, "global_step": 43783, "epoch": 367, "lr": 3.2990165820811476e-05} +{"train_loss": 0.000665620609652251, "global_step": 43784, "epoch": 367, "lr": 3.298808247349637e-05} +{"train_loss": 0.0015483011957257986, "global_step": 43785, "epoch": 367, "lr": 3.298599915958234e-05} +{"train_loss": 0.001281404634937644, "global_step": 43786, "epoch": 367, "lr": 3.298391587907349e-05} +{"train_loss": 0.001395538216456771, "global_step": 43787, "epoch": 367, "lr": 3.298183263197389e-05} +{"train_loss": 0.0008771111024543643, "global_step": 43788, "epoch": 367, "lr": 3.297974941828765e-05} +{"train_loss": 0.0012500997399911284, "global_step": 43789, "epoch": 367, "lr": 3.2977666238018875e-05} +{"train_loss": 0.0013214765349403024, "global_step": 43790, "epoch": 367, "lr": 3.29755830911716e-05} +{"train_loss": 0.0015479693978735316, "global_step": 43791, "epoch": 367, "lr": 3.2973499977749975e-05, "val_loss": 0.01697542332112789} +{"train_loss": 0.0010318608256056905, "global_step": 43792, "epoch": 368, "lr": 3.2971416897758035e-05} +{"train_loss": 0.001617379137314856, "global_step": 43793, "epoch": 368, "lr": 3.296933385119992e-05} +{"train_loss": 0.001768031856045127, "global_step": 43794, "epoch": 368, "lr": 3.29672508380797e-05} +{"train_loss": 0.0016697789542376995, "global_step": 43795, "epoch": 368, "lr": 3.2965167858401455e-05} +{"train_loss": 0.0008912133635021746, "global_step": 43796, "epoch": 368, "lr": 3.2963084912169285e-05} +{"train_loss": 0.0009194241720251739, "global_step": 43797, "epoch": 368, "lr": 3.2961001999387274e-05} +{"train_loss": 0.0014743170468136668, "global_step": 43798, "epoch": 368, "lr": 3.295891912005952e-05} +{"train_loss": 0.0008858296205289662, "global_step": 43799, "epoch": 368, "lr": 3.295683627419011e-05} +{"train_loss": 0.0016510699642822146, "global_step": 43800, "epoch": 368, "lr": 3.295475346178312e-05} +{"train_loss": 0.0008617833955213428, "global_step": 43801, "epoch": 368, "lr": 3.295267068284267e-05} +{"train_loss": 0.0012842359719797969, "global_step": 43802, "epoch": 368, "lr": 3.2950587937372806e-05} +{"train_loss": 0.0018288142746314406, "global_step": 43803, "epoch": 368, "lr": 3.294850522537767e-05} +{"train_loss": 0.0011899664532393217, "global_step": 43804, "epoch": 368, "lr": 3.294642254686129e-05} +{"train_loss": 0.0009779604151844978, "global_step": 43805, "epoch": 368, "lr": 3.2944339901827816e-05} +{"train_loss": 0.0011812294833362103, "global_step": 43806, "epoch": 368, "lr": 3.2942257290281295e-05} +{"train_loss": 0.0008251020917668939, "global_step": 43807, "epoch": 368, "lr": 3.2940174712225827e-05} +{"train_loss": 0.0016808930085971951, "global_step": 43808, "epoch": 368, "lr": 3.293809216766551e-05} +{"train_loss": 0.0014533840585500002, "global_step": 43809, "epoch": 368, "lr": 3.293600965660442e-05} +{"train_loss": 0.0018033974338322878, "global_step": 43810, "epoch": 368, "lr": 3.293392717904666e-05} +{"train_loss": 0.0008482637931592762, "global_step": 43811, "epoch": 368, "lr": 3.2931844734996295e-05} +{"train_loss": 0.0015065839979797602, "global_step": 43812, "epoch": 368, "lr": 3.292976232445745e-05} +{"train_loss": 0.0009398022666573524, "global_step": 43813, "epoch": 368, "lr": 3.292767994743418e-05} +{"train_loss": 0.002447043778374791, "global_step": 43814, "epoch": 368, "lr": 3.292559760393059e-05} +{"train_loss": 0.0015819366089999676, "global_step": 43815, "epoch": 368, "lr": 3.2923515293950755e-05} +{"train_loss": 0.0009852721123024821, "global_step": 43816, "epoch": 368, "lr": 3.2921433017498776e-05} +{"train_loss": 0.0012980959145352244, "global_step": 43817, "epoch": 368, "lr": 3.291935077457876e-05} +{"train_loss": 0.0009903600439429283, "global_step": 43818, "epoch": 368, "lr": 3.2917268565194745e-05} +{"train_loss": 0.0018241752404719591, "global_step": 43819, "epoch": 368, "lr": 3.291518638935087e-05} +{"train_loss": 0.0006616165046580136, "global_step": 43820, "epoch": 368, "lr": 3.2913104247051206e-05} +{"train_loss": 0.001548389671370387, "global_step": 43821, "epoch": 368, "lr": 3.291102213829981e-05} +{"train_loss": 0.001711222343146801, "global_step": 43822, "epoch": 368, "lr": 3.2908940063100826e-05} +{"train_loss": 0.0008572826045565307, "global_step": 43823, "epoch": 368, "lr": 3.290685802145828e-05} +{"train_loss": 0.0022489866241812706, "global_step": 43824, "epoch": 368, "lr": 3.2904776013376315e-05} +{"train_loss": 0.0019103516824543476, "global_step": 43825, "epoch": 368, "lr": 3.290269403885901e-05} +{"train_loss": 0.0012879952555522323, "global_step": 43826, "epoch": 368, "lr": 3.2900612097910396e-05} +{"train_loss": 0.002120014512911439, "global_step": 43827, "epoch": 368, "lr": 3.289853019053464e-05} +{"train_loss": 0.001820100238546729, "global_step": 43828, "epoch": 368, "lr": 3.2896448316735763e-05} +{"train_loss": 0.0007165258284658194, "global_step": 43829, "epoch": 368, "lr": 3.28943664765179e-05} +{"train_loss": 0.0015104004414752126, "global_step": 43830, "epoch": 368, "lr": 3.289228466988512e-05} +{"train_loss": 0.0017132855718955398, "global_step": 43831, "epoch": 368, "lr": 3.2890202896841504e-05} +{"train_loss": 0.0007789390510879457, "global_step": 43832, "epoch": 368, "lr": 3.288812115739117e-05} +{"train_loss": 0.0009487405186519027, "global_step": 43833, "epoch": 368, "lr": 3.2886039451538156e-05} +{"train_loss": 0.0016367568168789148, "global_step": 43834, "epoch": 368, "lr": 3.288395777928659e-05} +{"train_loss": 0.00107968645170331, "global_step": 43835, "epoch": 368, "lr": 3.288187614064052e-05} +{"train_loss": 0.0015536068240180612, "global_step": 43836, "epoch": 368, "lr": 3.287979453560409e-05} +{"train_loss": 0.0011130195343866944, "global_step": 43837, "epoch": 368, "lr": 3.287771296418133e-05} +{"train_loss": 0.0015451995423063636, "global_step": 43838, "epoch": 368, "lr": 3.2875631426376374e-05} +{"train_loss": 0.0013780486769974232, "global_step": 43839, "epoch": 368, "lr": 3.287354992219328e-05} +{"train_loss": 0.0016916418680921197, "global_step": 43840, "epoch": 368, "lr": 3.287146845163612e-05} +{"train_loss": 0.0010174151975661516, "global_step": 43841, "epoch": 368, "lr": 3.286938701470903e-05} +{"train_loss": 0.000999060575850308, "global_step": 43842, "epoch": 368, "lr": 3.2867305611416045e-05} +{"train_loss": 0.0014481195248663425, "global_step": 43843, "epoch": 368, "lr": 3.286522424176129e-05} +{"train_loss": 0.0012713136384263635, "global_step": 43844, "epoch": 368, "lr": 3.286314290574883e-05} +{"train_loss": 0.0018732819007709622, "global_step": 43845, "epoch": 368, "lr": 3.286106160338277e-05} +{"train_loss": 0.0019159847870469093, "global_step": 43846, "epoch": 368, "lr": 3.2858980334667166e-05} +{"train_loss": 0.000796667707618326, "global_step": 43847, "epoch": 368, "lr": 3.285689909960613e-05} +{"train_loss": 0.001354419975541532, "global_step": 43848, "epoch": 368, "lr": 3.285481789820375e-05} +{"train_loss": 0.0017203579191118479, "global_step": 43849, "epoch": 368, "lr": 3.285273673046409e-05} +{"train_loss": 0.0009886508341878653, "global_step": 43850, "epoch": 368, "lr": 3.2850655596391254e-05} +{"train_loss": 0.0014502384001389146, "global_step": 43851, "epoch": 368, "lr": 3.2848574495989336e-05} +{"train_loss": 0.0007339465664699674, "global_step": 43852, "epoch": 368, "lr": 3.2846493429262385e-05} +{"train_loss": 0.001480201492086053, "global_step": 43853, "epoch": 368, "lr": 3.284441239621454e-05} +{"train_loss": 0.0016246114391833544, "global_step": 43854, "epoch": 368, "lr": 3.284233139684984e-05} +{"train_loss": 0.0012122669722884893, "global_step": 43855, "epoch": 368, "lr": 3.284025043117239e-05} +{"train_loss": 0.0008894761558622122, "global_step": 43856, "epoch": 368, "lr": 3.2838169499186266e-05} +{"train_loss": 0.0008845881093293428, "global_step": 43857, "epoch": 368, "lr": 3.2836088600895584e-05} +{"train_loss": 0.0014934337232261896, "global_step": 43858, "epoch": 368, "lr": 3.283400773630441e-05} +{"train_loss": 0.0013232870260253549, "global_step": 43859, "epoch": 368, "lr": 3.283192690541681e-05} +{"train_loss": 0.001061521703377366, "global_step": 43860, "epoch": 368, "lr": 3.282984610823691e-05} +{"train_loss": 0.0013865460641682148, "global_step": 43861, "epoch": 368, "lr": 3.282776534476874e-05} +{"train_loss": 0.0017527485033497214, "global_step": 43862, "epoch": 368, "lr": 3.282568461501644e-05} +{"train_loss": 0.0021188976243138313, "global_step": 43863, "epoch": 368, "lr": 3.282360391898407e-05} +{"train_loss": 0.001316550886258483, "global_step": 43864, "epoch": 368, "lr": 3.282152325667571e-05} +{"train_loss": 0.000699688564054668, "global_step": 43865, "epoch": 368, "lr": 3.2819442628095464e-05} +{"train_loss": 0.0014511089539155364, "global_step": 43866, "epoch": 368, "lr": 3.28173620332474e-05} +{"train_loss": 0.0019646899309009314, "global_step": 43867, "epoch": 368, "lr": 3.2815281472135615e-05} +{"train_loss": 0.0019322959706187248, "global_step": 43868, "epoch": 368, "lr": 3.2813200944764184e-05} +{"train_loss": 0.001053660293109715, "global_step": 43869, "epoch": 368, "lr": 3.281112045113721e-05} +{"train_loss": 0.0008883553091436625, "global_step": 43870, "epoch": 368, "lr": 3.280903999125876e-05} +{"train_loss": 0.0010356346610933542, "global_step": 43871, "epoch": 368, "lr": 3.280695956513291e-05} +{"train_loss": 0.0009530789684504271, "global_step": 43872, "epoch": 368, "lr": 3.280487917276378e-05} +{"train_loss": 0.0006683902465738356, "global_step": 43873, "epoch": 368, "lr": 3.280279881415541e-05} +{"train_loss": 0.0012721158564090729, "global_step": 43874, "epoch": 368, "lr": 3.280071848931192e-05} +{"train_loss": 0.0018753765616565943, "global_step": 43875, "epoch": 368, "lr": 3.2798638198237394e-05} +{"train_loss": 0.0008087683818303049, "global_step": 43876, "epoch": 368, "lr": 3.279655794093588e-05} +{"train_loss": 0.0009091735119000077, "global_step": 43877, "epoch": 368, "lr": 3.2794477717411485e-05} +{"train_loss": 0.0016315075336024165, "global_step": 43878, "epoch": 368, "lr": 3.279239752766831e-05} +{"train_loss": 0.0012797260424122214, "global_step": 43879, "epoch": 368, "lr": 3.2790317371710424e-05} +{"train_loss": 0.0011346355313435197, "global_step": 43880, "epoch": 368, "lr": 3.2788237249541897e-05} +{"train_loss": 0.0016950143035501242, "global_step": 43881, "epoch": 368, "lr": 3.278615716116684e-05} +{"train_loss": 0.0017357725882902741, "global_step": 43882, "epoch": 368, "lr": 3.2784077106589326e-05} +{"train_loss": 0.0014618615387007594, "global_step": 43883, "epoch": 368, "lr": 3.278199708581343e-05} +{"train_loss": 0.0010754331015050411, "global_step": 43884, "epoch": 368, "lr": 3.277991709884325e-05} +{"train_loss": 0.0015473574167117476, "global_step": 43885, "epoch": 368, "lr": 3.277783714568285e-05} +{"train_loss": 0.0009158047032542527, "global_step": 43886, "epoch": 368, "lr": 3.2775757226336346e-05} +{"train_loss": 0.0014564007287845016, "global_step": 43887, "epoch": 368, "lr": 3.2773677340807784e-05} +{"train_loss": 0.0013687427854165435, "global_step": 43888, "epoch": 368, "lr": 3.277159748910128e-05} +{"train_loss": 0.0006192598957568407, "global_step": 43889, "epoch": 368, "lr": 3.27695176712209e-05} +{"train_loss": 0.0010637934319674969, "global_step": 43890, "epoch": 368, "lr": 3.2767437887170724e-05} +{"train_loss": 0.00158657634165138, "global_step": 43891, "epoch": 368, "lr": 3.276535813695486e-05} +{"train_loss": 0.0010184596758335829, "global_step": 43892, "epoch": 368, "lr": 3.2763278420577356e-05} +{"train_loss": 0.0009214122546836734, "global_step": 43893, "epoch": 368, "lr": 3.2761198738042326e-05} +{"train_loss": 0.0012778200907632709, "global_step": 43894, "epoch": 368, "lr": 3.275911908935383e-05} +{"train_loss": 0.0013021965278312564, "global_step": 43895, "epoch": 368, "lr": 3.275703947451597e-05} +{"train_loss": 0.0008371526491828263, "global_step": 43896, "epoch": 368, "lr": 3.2754959893532815e-05} +{"train_loss": 0.0009775691432878375, "global_step": 43897, "epoch": 368, "lr": 3.275288034640846e-05} +{"train_loss": 0.0006690919981338084, "global_step": 43898, "epoch": 368, "lr": 3.275080083314697e-05} +{"train_loss": 0.0015355495270341635, "global_step": 43899, "epoch": 368, "lr": 3.2748721353752446e-05} +{"train_loss": 0.001264450023882091, "global_step": 43900, "epoch": 368, "lr": 3.274664190822897e-05} +{"train_loss": 0.0018995286663994193, "global_step": 43901, "epoch": 368, "lr": 3.274456249658062e-05} +{"train_loss": 0.0010544615797698498, "global_step": 43902, "epoch": 368, "lr": 3.274248311881147e-05} +{"train_loss": 0.0012147299712523818, "global_step": 43903, "epoch": 368, "lr": 3.274040377492562e-05} +{"train_loss": 0.0014997617108747363, "global_step": 43904, "epoch": 368, "lr": 3.2738324464927125e-05} +{"train_loss": 0.001112641184590757, "global_step": 43905, "epoch": 368, "lr": 3.273624518882011e-05} +{"train_loss": 0.0007947038975544274, "global_step": 43906, "epoch": 368, "lr": 3.273416594660861e-05} +{"train_loss": 0.0006472737295553088, "global_step": 43907, "epoch": 368, "lr": 3.273208673829675e-05} +{"train_loss": 0.001116372412070632, "global_step": 43908, "epoch": 368, "lr": 3.2730007563888596e-05} +{"train_loss": 0.001281826407648623, "global_step": 43909, "epoch": 368, "lr": 3.2727928423388204e-05} +{"train_loss": 0.0013020831031114364, "global_step": 43910, "epoch": 368, "lr": 3.27258493167997e-05, "val_loss": 0.02421807497739792} +{"train_loss": 0.0006138801691122353, "global_step": 43911, "epoch": 369, "lr": 3.2723770244127124e-05} +{"train_loss": 0.0007657637470401824, "global_step": 43912, "epoch": 369, "lr": 3.2721691205374594e-05} +{"train_loss": 0.0025699492543935776, "global_step": 43913, "epoch": 369, "lr": 3.271961220054619e-05} +{"train_loss": 0.0005756000173278153, "global_step": 43914, "epoch": 369, "lr": 3.271753322964595e-05} +{"train_loss": 0.0022753658704459667, "global_step": 43915, "epoch": 369, "lr": 3.2715454292678015e-05} +{"train_loss": 0.0012453568633645773, "global_step": 43916, "epoch": 369, "lr": 3.2713375389646414e-05} +{"train_loss": 0.0009891712106764317, "global_step": 43917, "epoch": 369, "lr": 3.271129652055528e-05} +{"train_loss": 0.001461532199755311, "global_step": 43918, "epoch": 369, "lr": 3.270921768540864e-05} +{"train_loss": 0.0011302781058475375, "global_step": 43919, "epoch": 369, "lr": 3.2707138884210634e-05} +{"train_loss": 0.0014867777936160564, "global_step": 43920, "epoch": 369, "lr": 3.2705060116965306e-05} +{"train_loss": 0.0015965198399499059, "global_step": 43921, "epoch": 369, "lr": 3.270298138367673e-05} +{"train_loss": 0.0021066840272396803, "global_step": 43922, "epoch": 369, "lr": 3.2700902684349024e-05} +{"train_loss": 0.0014744311338290572, "global_step": 43923, "epoch": 369, "lr": 3.269882401898622e-05} +{"train_loss": 0.0014699151506647468, "global_step": 43924, "epoch": 369, "lr": 3.269674538759244e-05} +{"train_loss": 0.0011239763116464019, "global_step": 43925, "epoch": 369, "lr": 3.2694666790171765e-05} +{"train_loss": 0.0011087863240391016, "global_step": 43926, "epoch": 369, "lr": 3.2692588226728236e-05} +{"train_loss": 0.0009980738395825028, "global_step": 43927, "epoch": 369, "lr": 3.269050969726598e-05} +{"train_loss": 0.0011910226894542575, "global_step": 43928, "epoch": 369, "lr": 3.268843120178905e-05} +{"train_loss": 0.0009051391971297562, "global_step": 43929, "epoch": 369, "lr": 3.268635274030154e-05} +{"train_loss": 0.0010599966626614332, "global_step": 43930, "epoch": 369, "lr": 3.268427431280753e-05} +{"train_loss": 0.0007148832664825022, "global_step": 43931, "epoch": 369, "lr": 3.2682195919311085e-05} +{"train_loss": 0.000814654107671231, "global_step": 43932, "epoch": 369, "lr": 3.268011755981632e-05} +{"train_loss": 0.0013806080678477883, "global_step": 43933, "epoch": 369, "lr": 3.2678039234327275e-05} +{"train_loss": 0.0007039451156742871, "global_step": 43934, "epoch": 369, "lr": 3.267596094284806e-05} +{"train_loss": 0.001583675155416131, "global_step": 43935, "epoch": 369, "lr": 3.267388268538273e-05} +{"train_loss": 0.0012814918300136924, "global_step": 43936, "epoch": 369, "lr": 3.267180446193539e-05} +{"train_loss": 0.001222724560648203, "global_step": 43937, "epoch": 369, "lr": 3.266972627251011e-05} +{"train_loss": 0.0013779157306998968, "global_step": 43938, "epoch": 369, "lr": 3.266764811711098e-05} +{"train_loss": 0.0010034453589469194, "global_step": 43939, "epoch": 369, "lr": 3.266556999574207e-05} +{"train_loss": 0.0009645271929912269, "global_step": 43940, "epoch": 369, "lr": 3.266349190840745e-05} +{"train_loss": 0.0008550534839741886, "global_step": 43941, "epoch": 369, "lr": 3.2661413855111223e-05} +{"train_loss": 0.0008057983359321952, "global_step": 43942, "epoch": 369, "lr": 3.265933583585744e-05} +{"train_loss": 0.0008723438368178904, "global_step": 43943, "epoch": 369, "lr": 3.265725785065022e-05} +{"train_loss": 0.001525874831713736, "global_step": 43944, "epoch": 369, "lr": 3.265517989949361e-05} +{"train_loss": 0.0011081538395956159, "global_step": 43945, "epoch": 369, "lr": 3.2653101982391696e-05} +{"train_loss": 0.0011579830897971988, "global_step": 43946, "epoch": 369, "lr": 3.265102409934857e-05} +{"train_loss": 0.0007885816157795489, "global_step": 43947, "epoch": 369, "lr": 3.264894625036829e-05} +{"train_loss": 0.0021927976049482822, "global_step": 43948, "epoch": 369, "lr": 3.264686843545498e-05} +{"train_loss": 0.0012028380297124386, "global_step": 43949, "epoch": 369, "lr": 3.2644790654612665e-05} +{"train_loss": 0.0009992949198931456, "global_step": 43950, "epoch": 369, "lr": 3.2642712907845465e-05} +{"train_loss": 0.0008582548471167684, "global_step": 43951, "epoch": 369, "lr": 3.2640635195157444e-05} +{"train_loss": 0.001605180324986577, "global_step": 43952, "epoch": 369, "lr": 3.263855751655267e-05} +{"train_loss": 0.0014159709680825472, "global_step": 43953, "epoch": 369, "lr": 3.263647987203524e-05} +{"train_loss": 0.0017486470751464367, "global_step": 43954, "epoch": 369, "lr": 3.2634402261609215e-05} +{"train_loss": 0.0015345525462180376, "global_step": 43955, "epoch": 369, "lr": 3.2632324685278706e-05} +{"train_loss": 0.0010242349235340953, "global_step": 43956, "epoch": 369, "lr": 3.263024714304775e-05} +{"train_loss": 0.0019333113450556993, "global_step": 43957, "epoch": 369, "lr": 3.262816963492047e-05} +{"train_loss": 0.0009703590767458081, "global_step": 43958, "epoch": 369, "lr": 3.262609216090092e-05} +{"train_loss": 0.0023657483980059624, "global_step": 43959, "epoch": 369, "lr": 3.262401472099317e-05} +{"train_loss": 0.001401147455908358, "global_step": 43960, "epoch": 369, "lr": 3.2621937315201324e-05} +{"train_loss": 0.0010616191430017352, "global_step": 43961, "epoch": 369, "lr": 3.2619859943529424e-05} +{"train_loss": 0.001794776413589716, "global_step": 43962, "epoch": 369, "lr": 3.261778260598158e-05} +{"train_loss": 0.0006763900746591389, "global_step": 43963, "epoch": 369, "lr": 3.2615705302561884e-05} +{"train_loss": 0.0010895597515627742, "global_step": 43964, "epoch": 369, "lr": 3.261362803327437e-05} +{"train_loss": 0.001624293508939445, "global_step": 43965, "epoch": 369, "lr": 3.261155079812316e-05} +{"train_loss": 0.001765080145560205, "global_step": 43966, "epoch": 369, "lr": 3.260947359711229e-05} +{"train_loss": 0.001284429570659995, "global_step": 43967, "epoch": 369, "lr": 3.2607396430245884e-05} +{"train_loss": 0.00160465098451823, "global_step": 43968, "epoch": 369, "lr": 3.260531929752797e-05} +{"train_loss": 0.001101743197068572, "global_step": 43969, "epoch": 369, "lr": 3.260324219896268e-05} +{"train_loss": 0.000859986525028944, "global_step": 43970, "epoch": 369, "lr": 3.260116513455406e-05} +{"train_loss": 0.001579150091856718, "global_step": 43971, "epoch": 369, "lr": 3.2599088104306176e-05} +{"train_loss": 0.0008730737608857453, "global_step": 43972, "epoch": 369, "lr": 3.2597011108223146e-05} +{"train_loss": 0.002233740407973528, "global_step": 43973, "epoch": 369, "lr": 3.2594934146309005e-05} +{"train_loss": 0.0014588224003091455, "global_step": 43974, "epoch": 369, "lr": 3.259285721856787e-05} +{"train_loss": 0.0016337395645678043, "global_step": 43975, "epoch": 369, "lr": 3.2590780325003775e-05} +{"train_loss": 0.001006788806989789, "global_step": 43976, "epoch": 369, "lr": 3.258870346562085e-05} +{"train_loss": 0.001141875283792615, "global_step": 43977, "epoch": 369, "lr": 3.2586626640423134e-05} +{"train_loss": 0.0007897616596892476, "global_step": 43978, "epoch": 369, "lr": 3.2584549849414716e-05} +{"train_loss": 0.002010409953072667, "global_step": 43979, "epoch": 369, "lr": 3.2582473092599676e-05} +{"train_loss": 0.0014948912430554628, "global_step": 43980, "epoch": 369, "lr": 3.258039636998209e-05} +{"train_loss": 0.0011897314107045531, "global_step": 43981, "epoch": 369, "lr": 3.257831968156603e-05} +{"train_loss": 0.0024240424390882254, "global_step": 43982, "epoch": 369, "lr": 3.257624302735559e-05} +{"train_loss": 0.0014154117088764906, "global_step": 43983, "epoch": 369, "lr": 3.257416640735481e-05} +{"train_loss": 0.002127181040123105, "global_step": 43984, "epoch": 369, "lr": 3.257208982156782e-05} +{"train_loss": 0.0017625647597014904, "global_step": 43985, "epoch": 369, "lr": 3.257001326999865e-05} +{"train_loss": 0.0010273730149492621, "global_step": 43986, "epoch": 369, "lr": 3.256793675265141e-05} +{"train_loss": 0.001212976174429059, "global_step": 43987, "epoch": 369, "lr": 3.256586026953015e-05} +{"train_loss": 0.0022392317187041044, "global_step": 43988, "epoch": 369, "lr": 3.2563783820638975e-05} +{"train_loss": 0.0014071447076275945, "global_step": 43989, "epoch": 369, "lr": 3.256170740598196e-05} +{"train_loss": 0.0012266194680705667, "global_step": 43990, "epoch": 369, "lr": 3.255963102556313e-05} +{"train_loss": 0.0012644458329305053, "global_step": 43991, "epoch": 369, "lr": 3.255755467938664e-05} +{"train_loss": 0.0014239574084058404, "global_step": 43992, "epoch": 369, "lr": 3.2555478367456496e-05} +{"train_loss": 0.0020434067118912935, "global_step": 43993, "epoch": 369, "lr": 3.255340208977683e-05} +{"train_loss": 0.0005923059652559459, "global_step": 43994, "epoch": 369, "lr": 3.2551325846351685e-05} +{"train_loss": 0.00216264883056283, "global_step": 43995, "epoch": 369, "lr": 3.254924963718515e-05} +{"train_loss": 0.0009589400724507868, "global_step": 43996, "epoch": 369, "lr": 3.25471734622813e-05} +{"train_loss": 0.0017302490305155516, "global_step": 43997, "epoch": 369, "lr": 3.25450973216442e-05} +{"train_loss": 0.0013511939905583858, "global_step": 43998, "epoch": 369, "lr": 3.254302121527795e-05} +{"train_loss": 0.002259399276226759, "global_step": 43999, "epoch": 369, "lr": 3.25409451431866e-05} +{"train_loss": 0.0009869292844086885, "global_step": 44000, "epoch": 369, "lr": 3.2538869105374256e-05} +{"train_loss": 0.0012759468518197536, "global_step": 44001, "epoch": 369, "lr": 3.2536793101844976e-05} +{"train_loss": 0.0010923340450972319, "global_step": 44002, "epoch": 369, "lr": 3.2534717132602823e-05} +{"train_loss": 0.0010602246038615704, "global_step": 44003, "epoch": 369, "lr": 3.25326411976519e-05} +{"train_loss": 0.001153259538114071, "global_step": 44004, "epoch": 369, "lr": 3.2530565296996254e-05} +{"train_loss": 0.0016547845443710685, "global_step": 44005, "epoch": 369, "lr": 3.252848943063999e-05} +{"train_loss": 0.0007671529310755432, "global_step": 44006, "epoch": 369, "lr": 3.2526413598587155e-05} +{"train_loss": 0.0010708927875384688, "global_step": 44007, "epoch": 369, "lr": 3.2524337800841866e-05} +{"train_loss": 0.0007722036098130047, "global_step": 44008, "epoch": 369, "lr": 3.252226203740816e-05} +{"train_loss": 0.001388290198519826, "global_step": 44009, "epoch": 369, "lr": 3.252018630829011e-05} +{"train_loss": 0.0015897860284894705, "global_step": 44010, "epoch": 369, "lr": 3.2518110613491825e-05} +{"train_loss": 0.002789540449157357, "global_step": 44011, "epoch": 369, "lr": 3.251603495301735e-05} +{"train_loss": 0.001992299221456051, "global_step": 44012, "epoch": 369, "lr": 3.251395932687078e-05} +{"train_loss": 0.0008396320044994354, "global_step": 44013, "epoch": 369, "lr": 3.25118837350562e-05} +{"train_loss": 0.0018454554956406355, "global_step": 44014, "epoch": 369, "lr": 3.250980817757764e-05} +{"train_loss": 0.0017164853634312749, "global_step": 44015, "epoch": 369, "lr": 3.250773265443922e-05} +{"train_loss": 0.003623448545113206, "global_step": 44016, "epoch": 369, "lr": 3.2505657165644976e-05} +{"train_loss": 0.0018457041587680578, "global_step": 44017, "epoch": 369, "lr": 3.250358171119904e-05} +{"train_loss": 0.0007400449248962104, "global_step": 44018, "epoch": 369, "lr": 3.2501506291105414e-05} +{"train_loss": 0.0008506369777023792, "global_step": 44019, "epoch": 369, "lr": 3.2499430905368247e-05} +{"train_loss": 0.001409613760188222, "global_step": 44020, "epoch": 369, "lr": 3.249735555399157e-05} +{"train_loss": 0.0009701464441604912, "global_step": 44021, "epoch": 369, "lr": 3.249528023697944e-05} +{"train_loss": 0.002078463789075613, "global_step": 44022, "epoch": 369, "lr": 3.249320495433598e-05} +{"train_loss": 0.0009321013931185007, "global_step": 44023, "epoch": 369, "lr": 3.249112970606523e-05} +{"train_loss": 0.0023336708545684814, "global_step": 44024, "epoch": 369, "lr": 3.248905449217129e-05} +{"train_loss": 0.0019093469018116593, "global_step": 44025, "epoch": 369, "lr": 3.2486979312658196e-05} +{"train_loss": 0.0009479933069087565, "global_step": 44026, "epoch": 369, "lr": 3.2484904167530075e-05} +{"train_loss": 0.0012822173302993178, "global_step": 44027, "epoch": 369, "lr": 3.2482829056790956e-05} +{"train_loss": 0.001058837864547968, "global_step": 44028, "epoch": 369, "lr": 3.248075398044494e-05} +{"train_loss": 0.0013750967708564981, "global_step": 44029, "epoch": 369, "lr": 3.2478678938496084e-05, "val_loss": 0.01576257310807705} +{"train_loss": 0.0014899434754624963, "global_step": 44030, "epoch": 370, "lr": 3.247660393094848e-05} +{"train_loss": 0.003007465275004506, "global_step": 44031, "epoch": 370, "lr": 3.247452895780618e-05} +{"train_loss": 0.003080675145611167, "global_step": 44032, "epoch": 370, "lr": 3.247245401907328e-05} +{"train_loss": 0.0014946820447221398, "global_step": 44033, "epoch": 370, "lr": 3.247037911475384e-05} +{"train_loss": 0.001957216765731573, "global_step": 44034, "epoch": 370, "lr": 3.246830424485194e-05} +{"train_loss": 0.00206577405333519, "global_step": 44035, "epoch": 370, "lr": 3.246622940937164e-05} +{"train_loss": 0.0022870793472975492, "global_step": 44036, "epoch": 370, "lr": 3.246415460831705e-05} +{"train_loss": 0.002655086573213339, "global_step": 44037, "epoch": 370, "lr": 3.246207984169219e-05} +{"train_loss": 0.0024320774246007204, "global_step": 44038, "epoch": 370, "lr": 3.246000510950119e-05} +{"train_loss": 0.001857832190580666, "global_step": 44039, "epoch": 370, "lr": 3.245793041174809e-05} +{"train_loss": 0.0013018022291362286, "global_step": 44040, "epoch": 370, "lr": 3.245585574843695e-05} +{"train_loss": 0.003790623042732477, "global_step": 44041, "epoch": 370, "lr": 3.2453781119571886e-05} +{"train_loss": 0.002087692730128765, "global_step": 44042, "epoch": 370, "lr": 3.245170652515693e-05} +{"train_loss": 0.0018885352183133364, "global_step": 44043, "epoch": 370, "lr": 3.2449631965196185e-05} +{"train_loss": 0.0018732132157310843, "global_step": 44044, "epoch": 370, "lr": 3.244755743969371e-05} +{"train_loss": 0.0015733331674709916, "global_step": 44045, "epoch": 370, "lr": 3.2445482948653574e-05} +{"train_loss": 0.001242640893906355, "global_step": 44046, "epoch": 370, "lr": 3.2443408492079864e-05} +{"train_loss": 0.0012188286054879427, "global_step": 44047, "epoch": 370, "lr": 3.2441334069976634e-05} +{"train_loss": 0.0017690727254375815, "global_step": 44048, "epoch": 370, "lr": 3.243925968234799e-05} +{"train_loss": 0.0018580830655992031, "global_step": 44049, "epoch": 370, "lr": 3.243718532919796e-05} +{"train_loss": 0.0028255165088921785, "global_step": 44050, "epoch": 370, "lr": 3.243511101053066e-05} +{"train_loss": 0.0009288069559261203, "global_step": 44051, "epoch": 370, "lr": 3.2433036726350144e-05} +{"train_loss": 0.0010814281413331628, "global_step": 44052, "epoch": 370, "lr": 3.2430962476660464e-05} +{"train_loss": 0.0013621929101645947, "global_step": 44053, "epoch": 370, "lr": 3.242888826146574e-05} +{"train_loss": 0.0020470041781663895, "global_step": 44054, "epoch": 370, "lr": 3.242681408076998e-05} +{"train_loss": 0.0015221633948385715, "global_step": 44055, "epoch": 370, "lr": 3.242473993457733e-05} +{"train_loss": 0.002387572778388858, "global_step": 44056, "epoch": 370, "lr": 3.24226658228918e-05} +{"train_loss": 0.0022298048716038465, "global_step": 44057, "epoch": 370, "lr": 3.24205917457175e-05} +{"train_loss": 0.0014740538317710161, "global_step": 44058, "epoch": 370, "lr": 3.241851770305849e-05} +{"train_loss": 0.0014393118908628821, "global_step": 44059, "epoch": 370, "lr": 3.2416443694918835e-05} +{"train_loss": 0.001138170249760151, "global_step": 44060, "epoch": 370, "lr": 3.241436972130262e-05} +{"train_loss": 0.0015148421516641974, "global_step": 44061, "epoch": 370, "lr": 3.241229578221391e-05} +{"train_loss": 0.00126325199380517, "global_step": 44062, "epoch": 370, "lr": 3.2410221877656774e-05} +{"train_loss": 0.0008843101095408201, "global_step": 44063, "epoch": 370, "lr": 3.2408148007635294e-05} +{"train_loss": 0.0023871096782386303, "global_step": 44064, "epoch": 370, "lr": 3.240607417215353e-05} +{"train_loss": 0.0008029785822145641, "global_step": 44065, "epoch": 370, "lr": 3.240400037121557e-05} +{"train_loss": 0.0013529898133128881, "global_step": 44066, "epoch": 370, "lr": 3.240192660482546e-05} +{"train_loss": 0.0011267297668382525, "global_step": 44067, "epoch": 370, "lr": 3.23998528729873e-05} +{"train_loss": 0.0012245223624631763, "global_step": 44068, "epoch": 370, "lr": 3.239777917570514e-05} +{"train_loss": 0.0021739820949733257, "global_step": 44069, "epoch": 370, "lr": 3.2395705512983074e-05} +{"train_loss": 0.0010261305142194033, "global_step": 44070, "epoch": 370, "lr": 3.239363188482516e-05} +{"train_loss": 0.0010968068381771445, "global_step": 44071, "epoch": 370, "lr": 3.239155829123545e-05} +{"train_loss": 0.001438712002709508, "global_step": 44072, "epoch": 370, "lr": 3.2389484732218046e-05} +{"train_loss": 0.002123681828379631, "global_step": 44073, "epoch": 370, "lr": 3.2387411207777e-05} +{"train_loss": 0.0020075333304703236, "global_step": 44074, "epoch": 370, "lr": 3.23853377179164e-05} +{"train_loss": 0.0012735225027427077, "global_step": 44075, "epoch": 370, "lr": 3.238326426264029e-05} +{"train_loss": 0.0012305440613999963, "global_step": 44076, "epoch": 370, "lr": 3.238119084195278e-05} +{"train_loss": 0.002028963528573513, "global_step": 44077, "epoch": 370, "lr": 3.237911745585791e-05} +{"train_loss": 0.0011070219334214926, "global_step": 44078, "epoch": 370, "lr": 3.2377044104359764e-05} +{"train_loss": 0.0012726543936878443, "global_step": 44079, "epoch": 370, "lr": 3.23749707874624e-05} +{"train_loss": 0.0011844000546261668, "global_step": 44080, "epoch": 370, "lr": 3.2372897505169896e-05} +{"train_loss": 0.0008383316453546286, "global_step": 44081, "epoch": 370, "lr": 3.2370824257486345e-05} +{"train_loss": 0.0009911810047924519, "global_step": 44082, "epoch": 370, "lr": 3.236875104441579e-05} +{"train_loss": 0.0017193612875416875, "global_step": 44083, "epoch": 370, "lr": 3.236667786596229e-05} +{"train_loss": 0.0018772728508338332, "global_step": 44084, "epoch": 370, "lr": 3.236460472212996e-05} +{"train_loss": 0.0010784234618768096, "global_step": 44085, "epoch": 370, "lr": 3.236253161292282e-05} +{"train_loss": 0.0016619886737316847, "global_step": 44086, "epoch": 370, "lr": 3.2360458538344984e-05} +{"train_loss": 0.002527236472815275, "global_step": 44087, "epoch": 370, "lr": 3.235838549840049e-05} +{"train_loss": 0.0014653304824605584, "global_step": 44088, "epoch": 370, "lr": 3.2356312493093434e-05} +{"train_loss": 0.0011837042402476072, "global_step": 44089, "epoch": 370, "lr": 3.2354239522427875e-05} +{"train_loss": 0.0018131249817088246, "global_step": 44090, "epoch": 370, "lr": 3.235216658640786e-05} +{"train_loss": 0.0017484084237366915, "global_step": 44091, "epoch": 370, "lr": 3.235009368503751e-05} +{"train_loss": 0.0005787972477264702, "global_step": 44092, "epoch": 370, "lr": 3.234802081832083e-05} +{"train_loss": 0.0013536002952605486, "global_step": 44093, "epoch": 370, "lr": 3.234594798626195e-05} +{"train_loss": 0.0017772074788808823, "global_step": 44094, "epoch": 370, "lr": 3.23438751888649e-05} +{"train_loss": 0.001256628311239183, "global_step": 44095, "epoch": 370, "lr": 3.234180242613378e-05} +{"train_loss": 0.0010807504877448082, "global_step": 44096, "epoch": 370, "lr": 3.233972969807265e-05} +{"train_loss": 0.001337528578005731, "global_step": 44097, "epoch": 370, "lr": 3.233765700468555e-05} +{"train_loss": 0.0008211847161874175, "global_step": 44098, "epoch": 370, "lr": 3.2335584345976596e-05} +{"train_loss": 0.0014515483053401113, "global_step": 44099, "epoch": 370, "lr": 3.233351172194982e-05} +{"train_loss": 0.001549845328554511, "global_step": 44100, "epoch": 370, "lr": 3.233143913260932e-05} +{"train_loss": 0.0006582782953046262, "global_step": 44101, "epoch": 370, "lr": 3.232936657795915e-05} +{"train_loss": 0.0013236188096925616, "global_step": 44102, "epoch": 370, "lr": 3.232729405800337e-05} +{"train_loss": 0.0012705849949270487, "global_step": 44103, "epoch": 370, "lr": 3.2325221572746065e-05} +{"train_loss": 0.0013183840783312917, "global_step": 44104, "epoch": 370, "lr": 3.232314912219129e-05} +{"train_loss": 0.001488270005211234, "global_step": 44105, "epoch": 370, "lr": 3.232107670634314e-05} +{"train_loss": 0.0015910420333966613, "global_step": 44106, "epoch": 370, "lr": 3.2319004325205646e-05} +{"train_loss": 0.0009829074842855334, "global_step": 44107, "epoch": 370, "lr": 3.231693197878292e-05} +{"train_loss": 0.0021130037494003773, "global_step": 44108, "epoch": 370, "lr": 3.2314859667079e-05} +{"train_loss": 0.0006930723320692778, "global_step": 44109, "epoch": 370, "lr": 3.2312787390097966e-05} +{"train_loss": 0.0012485272018238902, "global_step": 44110, "epoch": 370, "lr": 3.231071514784388e-05} +{"train_loss": 0.0009872560622170568, "global_step": 44111, "epoch": 370, "lr": 3.230864294032082e-05} +{"train_loss": 0.001451427466236055, "global_step": 44112, "epoch": 370, "lr": 3.230657076753284e-05} +{"train_loss": 0.0013147066347301006, "global_step": 44113, "epoch": 370, "lr": 3.230449862948404e-05} +{"train_loss": 0.0015937549760565162, "global_step": 44114, "epoch": 370, "lr": 3.2302426526178434e-05} +{"train_loss": 0.0011599916033446789, "global_step": 44115, "epoch": 370, "lr": 3.2300354457620155e-05} +{"train_loss": 0.0017944211140275002, "global_step": 44116, "epoch": 370, "lr": 3.2298282423813206e-05} +{"train_loss": 0.00198741746135056, "global_step": 44117, "epoch": 370, "lr": 3.229621042476172e-05} +{"train_loss": 0.0013057306641712785, "global_step": 44118, "epoch": 370, "lr": 3.2294138460469706e-05} +{"train_loss": 0.0008157435222528875, "global_step": 44119, "epoch": 370, "lr": 3.229206653094128e-05} +{"train_loss": 0.0014894583728164434, "global_step": 44120, "epoch": 370, "lr": 3.2289994636180495e-05} +{"train_loss": 0.0022531840950250626, "global_step": 44121, "epoch": 370, "lr": 3.2287922776191394e-05} +{"train_loss": 0.0014406773261725903, "global_step": 44122, "epoch": 370, "lr": 3.228585095097808e-05} +{"train_loss": 0.001204062718898058, "global_step": 44123, "epoch": 370, "lr": 3.228377916054458e-05} +{"train_loss": 0.001099117798730731, "global_step": 44124, "epoch": 370, "lr": 3.228170740489501e-05} +{"train_loss": 0.0013738059205934405, "global_step": 44125, "epoch": 370, "lr": 3.227963568403341e-05} +{"train_loss": 0.002227901481091976, "global_step": 44126, "epoch": 370, "lr": 3.2277563997963854e-05} +{"train_loss": 0.0014426975976675749, "global_step": 44127, "epoch": 370, "lr": 3.22754923466904e-05} +{"train_loss": 0.0013798330910503864, "global_step": 44128, "epoch": 370, "lr": 3.227342073021713e-05} +{"train_loss": 0.0008915647631511092, "global_step": 44129, "epoch": 370, "lr": 3.22713491485481e-05} +{"train_loss": 0.0008921000408008695, "global_step": 44130, "epoch": 370, "lr": 3.226927760168738e-05} +{"train_loss": 0.0018785200081765652, "global_step": 44131, "epoch": 370, "lr": 3.226720608963905e-05} +{"train_loss": 0.001837570802308619, "global_step": 44132, "epoch": 370, "lr": 3.226513461240717e-05} +{"train_loss": 0.002275902545079589, "global_step": 44133, "epoch": 370, "lr": 3.226306316999578e-05} +{"train_loss": 0.0012516401475295424, "global_step": 44134, "epoch": 370, "lr": 3.2260991762408986e-05} +{"train_loss": 0.0016218473901972175, "global_step": 44135, "epoch": 370, "lr": 3.225892038965083e-05} +{"train_loss": 0.0021599482279270887, "global_step": 44136, "epoch": 370, "lr": 3.22568490517254e-05} +{"train_loss": 0.0011700326576828957, "global_step": 44137, "epoch": 370, "lr": 3.225477774863674e-05} +{"train_loss": 0.0015464468160644174, "global_step": 44138, "epoch": 370, "lr": 3.2252706480388936e-05} +{"train_loss": 0.0014603023882955313, "global_step": 44139, "epoch": 370, "lr": 3.225063524698606e-05} +{"train_loss": 0.0017792275175452232, "global_step": 44140, "epoch": 370, "lr": 3.224856404843214e-05} +{"train_loss": 0.001993263140320778, "global_step": 44141, "epoch": 370, "lr": 3.2246492884731296e-05} +{"train_loss": 0.0010065531823784113, "global_step": 44142, "epoch": 370, "lr": 3.224442175588753e-05} +{"train_loss": 0.0017874639015644789, "global_step": 44143, "epoch": 370, "lr": 3.2242350661904964e-05} +{"train_loss": 0.0011016897624358535, "global_step": 44144, "epoch": 370, "lr": 3.224027960278765e-05} +{"train_loss": 0.0010411589173600078, "global_step": 44145, "epoch": 370, "lr": 3.223820857853964e-05} +{"train_loss": 0.001574100460857153, "global_step": 44146, "epoch": 370, "lr": 3.2236137589165024e-05} +{"train_loss": 0.001394568127579987, "global_step": 44147, "epoch": 370, "lr": 3.223406663466784e-05} +{"train_loss": 0.001555359924306013, "global_step": 44148, "epoch": 370, "lr": 3.223199571505218e-05, "val_loss": 0.011639106087386608, "train_action_mse_error": 2.3618944396730512e-05} +{"train_loss": 0.0017827374394983053, "global_step": 44149, "epoch": 371, "lr": 3.2229924830322085e-05} +{"train_loss": 0.0018895918037742376, "global_step": 44150, "epoch": 371, "lr": 3.222785398048165e-05} +{"train_loss": 0.0017850458389148116, "global_step": 44151, "epoch": 371, "lr": 3.222578316553492e-05} +{"train_loss": 0.001516722491942346, "global_step": 44152, "epoch": 371, "lr": 3.2223712385485955e-05} +{"train_loss": 0.0014479488600045443, "global_step": 44153, "epoch": 371, "lr": 3.222164164033885e-05} +{"train_loss": 0.0034611797891557217, "global_step": 44154, "epoch": 371, "lr": 3.221957093009763e-05} +{"train_loss": 0.00090323033509776, "global_step": 44155, "epoch": 371, "lr": 3.22175002547664e-05} +{"train_loss": 0.0008109780610539019, "global_step": 44156, "epoch": 371, "lr": 3.221542961434919e-05} +{"train_loss": 0.0015895499382168055, "global_step": 44157, "epoch": 371, "lr": 3.2213359008850105e-05} +{"train_loss": 0.0008852028986439109, "global_step": 44158, "epoch": 371, "lr": 3.221128843827318e-05} +{"train_loss": 0.0023619167041033506, "global_step": 44159, "epoch": 371, "lr": 3.220921790262249e-05} +{"train_loss": 0.0017437983769923449, "global_step": 44160, "epoch": 371, "lr": 3.2207147401902104e-05} +{"train_loss": 0.0015135776484385133, "global_step": 44161, "epoch": 371, "lr": 3.2205076936116075e-05} +{"train_loss": 0.0010590421734377742, "global_step": 44162, "epoch": 371, "lr": 3.220300650526848e-05} +{"train_loss": 0.001928356708958745, "global_step": 44163, "epoch": 371, "lr": 3.2200936109363375e-05} +{"train_loss": 0.0007270485511980951, "global_step": 44164, "epoch": 371, "lr": 3.2198865748404836e-05} +{"train_loss": 0.002697139047086239, "global_step": 44165, "epoch": 371, "lr": 3.219679542239694e-05} +{"train_loss": 0.0028029170352965593, "global_step": 44166, "epoch": 371, "lr": 3.219472513134371e-05} +{"train_loss": 0.0017125057056546211, "global_step": 44167, "epoch": 371, "lr": 3.219265487524924e-05} +{"train_loss": 0.0008230999810621142, "global_step": 44168, "epoch": 371, "lr": 3.219058465411758e-05} +{"train_loss": 0.0021490822546184063, "global_step": 44169, "epoch": 371, "lr": 3.2188514467952835e-05} +{"train_loss": 0.001050095190294087, "global_step": 44170, "epoch": 371, "lr": 3.2186444316759024e-05} +{"train_loss": 0.001455462770536542, "global_step": 44171, "epoch": 371, "lr": 3.218437420054021e-05} +{"train_loss": 0.0014524117577821016, "global_step": 44172, "epoch": 371, "lr": 3.21823041193005e-05} +{"train_loss": 0.001251403009518981, "global_step": 44173, "epoch": 371, "lr": 3.218023407304391e-05} +{"train_loss": 0.0010531708830967546, "global_step": 44174, "epoch": 371, "lr": 3.217816406177454e-05} +{"train_loss": 0.001527768443338573, "global_step": 44175, "epoch": 371, "lr": 3.217609408549643e-05} +{"train_loss": 0.0029495221097022295, "global_step": 44176, "epoch": 371, "lr": 3.2174024144213674e-05} +{"train_loss": 0.0015250809956341982, "global_step": 44177, "epoch": 371, "lr": 3.2171954237930305e-05} +{"train_loss": 0.0016602397663518786, "global_step": 44178, "epoch": 371, "lr": 3.216988436665038e-05} +{"train_loss": 0.001934595755301416, "global_step": 44179, "epoch": 371, "lr": 3.2167814530378014e-05} +{"train_loss": 0.0014848561258986592, "global_step": 44180, "epoch": 371, "lr": 3.2165744729117216e-05} +{"train_loss": 0.0015679592033848166, "global_step": 44181, "epoch": 371, "lr": 3.216367496287209e-05} +{"train_loss": 0.0019899189937859774, "global_step": 44182, "epoch": 371, "lr": 3.2161605231646686e-05} +{"train_loss": 0.0013982878299430013, "global_step": 44183, "epoch": 371, "lr": 3.215953553544504e-05} +{"train_loss": 0.00194447860121727, "global_step": 44184, "epoch": 371, "lr": 3.2157465874271266e-05} +{"train_loss": 0.0014408937422558665, "global_step": 44185, "epoch": 371, "lr": 3.2155396248129374e-05} +{"train_loss": 0.0016082669608294964, "global_step": 44186, "epoch": 371, "lr": 3.215332665702349e-05} +{"train_loss": 0.0022991164587438107, "global_step": 44187, "epoch": 371, "lr": 3.215125710095761e-05} +{"train_loss": 0.0012352158082649112, "global_step": 44188, "epoch": 371, "lr": 3.2149187579935844e-05} +{"train_loss": 0.0016731532523408532, "global_step": 44189, "epoch": 371, "lr": 3.214711809396226e-05} +{"train_loss": 0.0009110200335271657, "global_step": 44190, "epoch": 371, "lr": 3.214504864304087e-05} +{"train_loss": 0.0018047813791781664, "global_step": 44191, "epoch": 371, "lr": 3.214297922717578e-05} +{"train_loss": 0.002126770094037056, "global_step": 44192, "epoch": 371, "lr": 3.214090984637104e-05} +{"train_loss": 0.0020249863155186176, "global_step": 44193, "epoch": 371, "lr": 3.213884050063072e-05} +{"train_loss": 0.001763237756676972, "global_step": 44194, "epoch": 371, "lr": 3.213677118995888e-05} +{"train_loss": 0.0017411545850336552, "global_step": 44195, "epoch": 371, "lr": 3.2134701914359576e-05} +{"train_loss": 0.0010030935518443584, "global_step": 44196, "epoch": 371, "lr": 3.2132632673836894e-05} +{"train_loss": 0.0008923244313336909, "global_step": 44197, "epoch": 371, "lr": 3.2130563468394846e-05} +{"train_loss": 0.002325828652828932, "global_step": 44198, "epoch": 371, "lr": 3.212849429803756e-05} +{"train_loss": 0.0017407251289114356, "global_step": 44199, "epoch": 371, "lr": 3.212642516276905e-05} +{"train_loss": 0.0014584844466298819, "global_step": 44200, "epoch": 371, "lr": 3.21243560625934e-05} +{"train_loss": 0.0012955990387126803, "global_step": 44201, "epoch": 371, "lr": 3.212228699751467e-05} +{"train_loss": 0.0013506191316992044, "global_step": 44202, "epoch": 371, "lr": 3.21202179675369e-05} +{"train_loss": 0.0006871374207548797, "global_step": 44203, "epoch": 371, "lr": 3.21181489726642e-05} +{"train_loss": 0.0013712316285818815, "global_step": 44204, "epoch": 371, "lr": 3.2116080012900584e-05} +{"train_loss": 0.00211140513420105, "global_step": 44205, "epoch": 371, "lr": 3.211401108825015e-05} +{"train_loss": 0.0008548882906325161, "global_step": 44206, "epoch": 371, "lr": 3.211194219871692e-05} +{"train_loss": 0.0014701298205181956, "global_step": 44207, "epoch": 371, "lr": 3.210987334430501e-05} +{"train_loss": 0.001633283100090921, "global_step": 44208, "epoch": 371, "lr": 3.210780452501843e-05} +{"train_loss": 0.0015766327269375324, "global_step": 44209, "epoch": 371, "lr": 3.210573574086127e-05} +{"train_loss": 0.0023124385625123978, "global_step": 44210, "epoch": 371, "lr": 3.210366699183759e-05} +{"train_loss": 0.0018497644923627377, "global_step": 44211, "epoch": 371, "lr": 3.210159827795144e-05} +{"train_loss": 0.0008049127063713968, "global_step": 44212, "epoch": 371, "lr": 3.20995295992069e-05} +{"train_loss": 0.0009400862036272883, "global_step": 44213, "epoch": 371, "lr": 3.209746095560801e-05} +{"train_loss": 0.002307600574567914, "global_step": 44214, "epoch": 371, "lr": 3.2095392347158855e-05} +{"train_loss": 0.0010866746306419373, "global_step": 44215, "epoch": 371, "lr": 3.2093323773863486e-05} +{"train_loss": 0.001555156079120934, "global_step": 44216, "epoch": 371, "lr": 3.209125523572595e-05} +{"train_loss": 0.0010649266187101603, "global_step": 44217, "epoch": 371, "lr": 3.208918673275033e-05} +{"train_loss": 0.0012129148235544562, "global_step": 44218, "epoch": 371, "lr": 3.2087118264940666e-05} +{"train_loss": 0.0017039966769516468, "global_step": 44219, "epoch": 371, "lr": 3.208504983230105e-05} +{"train_loss": 0.0018278571078553796, "global_step": 44220, "epoch": 371, "lr": 3.208298143483552e-05} +{"train_loss": 0.0013804627815261483, "global_step": 44221, "epoch": 371, "lr": 3.208091307254813e-05} +{"train_loss": 0.0010312253143638372, "global_step": 44222, "epoch": 371, "lr": 3.207884474544297e-05} +{"train_loss": 0.0018545995699241757, "global_step": 44223, "epoch": 371, "lr": 3.207677645352406e-05} +{"train_loss": 0.0012589616235345602, "global_step": 44224, "epoch": 371, "lr": 3.207470819679551e-05} +{"train_loss": 0.0011108008911833167, "global_step": 44225, "epoch": 371, "lr": 3.207263997526133e-05} +{"train_loss": 0.001028088852763176, "global_step": 44226, "epoch": 371, "lr": 3.207057178892562e-05} +{"train_loss": 0.0012688357383012772, "global_step": 44227, "epoch": 371, "lr": 3.206850363779243e-05} +{"train_loss": 0.0009167034877464175, "global_step": 44228, "epoch": 371, "lr": 3.206643552186581e-05} +{"train_loss": 0.000960535544436425, "global_step": 44229, "epoch": 371, "lr": 3.2064367441149843e-05} +{"train_loss": 0.0013445743825286627, "global_step": 44230, "epoch": 371, "lr": 3.206229939564855e-05} +{"train_loss": 0.0009668726706877351, "global_step": 44231, "epoch": 371, "lr": 3.206023138536604e-05} +{"train_loss": 0.002785310847684741, "global_step": 44232, "epoch": 371, "lr": 3.2058163410306354e-05} +{"train_loss": 0.0017036257777363062, "global_step": 44233, "epoch": 371, "lr": 3.205609547047351e-05} +{"train_loss": 0.0020513413473963737, "global_step": 44234, "epoch": 371, "lr": 3.205402756587164e-05} +{"train_loss": 0.0017842173110693693, "global_step": 44235, "epoch": 371, "lr": 3.205195969650475e-05} +{"train_loss": 0.0019921185448765755, "global_step": 44236, "epoch": 371, "lr": 3.204989186237694e-05} +{"train_loss": 0.001264929655008018, "global_step": 44237, "epoch": 371, "lr": 3.2047824063492215e-05} +{"train_loss": 0.0012468226486817002, "global_step": 44238, "epoch": 371, "lr": 3.20457562998547e-05} +{"train_loss": 0.0007730850484222174, "global_step": 44239, "epoch": 371, "lr": 3.204368857146843e-05} +{"train_loss": 0.0008860907983034849, "global_step": 44240, "epoch": 371, "lr": 3.204162087833743e-05} +{"train_loss": 0.0018335753120481968, "global_step": 44241, "epoch": 371, "lr": 3.20395532204658e-05} +{"train_loss": 0.0017010224983096123, "global_step": 44242, "epoch": 371, "lr": 3.20374855978576e-05} +{"train_loss": 0.001025981968268752, "global_step": 44243, "epoch": 371, "lr": 3.203541801051686e-05} +{"train_loss": 0.0013019903562963009, "global_step": 44244, "epoch": 371, "lr": 3.203335045844767e-05} +{"train_loss": 0.001455815858207643, "global_step": 44245, "epoch": 371, "lr": 3.203128294165407e-05} +{"train_loss": 0.0013474833685904741, "global_step": 44246, "epoch": 371, "lr": 3.202921546014014e-05} +{"train_loss": 0.0013699806295335293, "global_step": 44247, "epoch": 371, "lr": 3.20271480139099e-05} +{"train_loss": 0.001486313296481967, "global_step": 44248, "epoch": 371, "lr": 3.202508060296747e-05} +{"train_loss": 0.0008376503828912973, "global_step": 44249, "epoch": 371, "lr": 3.202301322731684e-05} +{"train_loss": 0.0017385773826390505, "global_step": 44250, "epoch": 371, "lr": 3.202094588696213e-05} +{"train_loss": 0.0013579276856034994, "global_step": 44251, "epoch": 371, "lr": 3.2018878581907365e-05} +{"train_loss": 0.0021080034784972668, "global_step": 44252, "epoch": 371, "lr": 3.201681131215659e-05} +{"train_loss": 0.0022503037471324205, "global_step": 44253, "epoch": 371, "lr": 3.201474407771391e-05} +{"train_loss": 0.0013194334460422397, "global_step": 44254, "epoch": 371, "lr": 3.201267687858334e-05} +{"train_loss": 0.0017587800975888968, "global_step": 44255, "epoch": 371, "lr": 3.201060971476898e-05} +{"train_loss": 0.0009106675861403346, "global_step": 44256, "epoch": 371, "lr": 3.2008542586274835e-05} +{"train_loss": 0.00149144500028342, "global_step": 44257, "epoch": 371, "lr": 3.2006475493105025e-05} +{"train_loss": 0.0007490582065656781, "global_step": 44258, "epoch": 371, "lr": 3.2004408435263564e-05} +{"train_loss": 0.0008946257294155657, "global_step": 44259, "epoch": 371, "lr": 3.200234141275452e-05} +{"train_loss": 0.0013011766131967306, "global_step": 44260, "epoch": 371, "lr": 3.200027442558196e-05} +{"train_loss": 0.0016699250554665923, "global_step": 44261, "epoch": 371, "lr": 3.199820747374993e-05} +{"train_loss": 0.0014981779968366027, "global_step": 44262, "epoch": 371, "lr": 3.199614055726251e-05} +{"train_loss": 0.0019867231603711843, "global_step": 44263, "epoch": 371, "lr": 3.1994073676123734e-05} +{"train_loss": 0.0008068705210462213, "global_step": 44264, "epoch": 371, "lr": 3.199200683033768e-05} +{"train_loss": 0.0017428587889298797, "global_step": 44265, "epoch": 371, "lr": 3.1989940019908404e-05} +{"train_loss": 0.001781294122338295, "global_step": 44266, "epoch": 371, "lr": 3.198787324483994e-05} +{"train_loss": 0.001524224629852639, "global_step": 44267, "epoch": 371, "lr": 3.1985806505136376e-05, "val_loss": 0.036724913865327835} +{"train_loss": 0.0008756337338127196, "global_step": 44268, "epoch": 372, "lr": 3.198373980080174e-05} +{"train_loss": 0.0011125578312203288, "global_step": 44269, "epoch": 372, "lr": 3.198167313184012e-05} +{"train_loss": 0.0015607172390446067, "global_step": 44270, "epoch": 372, "lr": 3.197960649825557e-05} +{"train_loss": 0.0014862543903291225, "global_step": 44271, "epoch": 372, "lr": 3.197753990005211e-05} +{"train_loss": 0.0014065414434298873, "global_step": 44272, "epoch": 372, "lr": 3.197547333723384e-05} +{"train_loss": 0.0018935272237285972, "global_step": 44273, "epoch": 372, "lr": 3.1973406809804796e-05} +{"train_loss": 0.0012080277083441615, "global_step": 44274, "epoch": 372, "lr": 3.197134031776905e-05} +{"train_loss": 0.0015120304888114333, "global_step": 44275, "epoch": 372, "lr": 3.196927386113064e-05} +{"train_loss": 0.0006870840443298221, "global_step": 44276, "epoch": 372, "lr": 3.1967207439893646e-05} +{"train_loss": 0.0008944009896367788, "global_step": 44277, "epoch": 372, "lr": 3.196514105406211e-05} +{"train_loss": 0.0013857816811650991, "global_step": 44278, "epoch": 372, "lr": 3.196307470364008e-05} +{"train_loss": 0.001103218412026763, "global_step": 44279, "epoch": 372, "lr": 3.1961008388631655e-05} +{"train_loss": 0.001878799987025559, "global_step": 44280, "epoch": 372, "lr": 3.1958942109040826e-05} +{"train_loss": 0.0014521352713927627, "global_step": 44281, "epoch": 372, "lr": 3.1956875864871716e-05} +{"train_loss": 0.0007549955043941736, "global_step": 44282, "epoch": 372, "lr": 3.1954809656128335e-05} +{"train_loss": 0.0012681077932938933, "global_step": 44283, "epoch": 372, "lr": 3.195274348281477e-05} +{"train_loss": 0.000906835775822401, "global_step": 44284, "epoch": 372, "lr": 3.1950677344935075e-05} +{"train_loss": 0.0017492154147475958, "global_step": 44285, "epoch": 372, "lr": 3.194861124249327e-05} +{"train_loss": 0.0013831343967467546, "global_step": 44286, "epoch": 372, "lr": 3.1946545175493456e-05} +{"train_loss": 0.0015444824239239097, "global_step": 44287, "epoch": 372, "lr": 3.194447914393966e-05} +{"train_loss": 0.0013678872492164373, "global_step": 44288, "epoch": 372, "lr": 3.1942413147835964e-05} +{"train_loss": 0.000575553101953119, "global_step": 44289, "epoch": 372, "lr": 3.1940347187186406e-05} +{"train_loss": 0.0014150901697576046, "global_step": 44290, "epoch": 372, "lr": 3.193828126199504e-05} +{"train_loss": 0.0013527526753023267, "global_step": 44291, "epoch": 372, "lr": 3.1936215372265934e-05} +{"train_loss": 0.0016355108236894011, "global_step": 44292, "epoch": 372, "lr": 3.193414951800314e-05} +{"train_loss": 0.0016997265629470348, "global_step": 44293, "epoch": 372, "lr": 3.193208369921071e-05} +{"train_loss": 0.001558842952363193, "global_step": 44294, "epoch": 372, "lr": 3.193001791589271e-05} +{"train_loss": 0.0010133621981367469, "global_step": 44295, "epoch": 372, "lr": 3.192795216805318e-05} +{"train_loss": 0.0015410674968734384, "global_step": 44296, "epoch": 372, "lr": 3.19258864556962e-05} +{"train_loss": 0.001789278700016439, "global_step": 44297, "epoch": 372, "lr": 3.1923820778825784e-05} +{"train_loss": 0.002357407007366419, "global_step": 44298, "epoch": 372, "lr": 3.1921755137446044e-05} +{"train_loss": 0.0010401353938505054, "global_step": 44299, "epoch": 372, "lr": 3.191968953156098e-05} +{"train_loss": 0.0016964462120085955, "global_step": 44300, "epoch": 372, "lr": 3.19176239611747e-05} +{"train_loss": 0.00141930824611336, "global_step": 44301, "epoch": 372, "lr": 3.191555842629123e-05} +{"train_loss": 0.0011277017183601856, "global_step": 44302, "epoch": 372, "lr": 3.1913492926914615e-05} +{"train_loss": 0.0018267693230882287, "global_step": 44303, "epoch": 372, "lr": 3.191142746304894e-05} +{"train_loss": 0.0012074921978637576, "global_step": 44304, "epoch": 372, "lr": 3.190936203469822e-05} +{"train_loss": 0.0009138167952187359, "global_step": 44305, "epoch": 372, "lr": 3.190729664186656e-05} +{"train_loss": 0.00192549591884017, "global_step": 44306, "epoch": 372, "lr": 3.1905231284557966e-05} +{"train_loss": 0.002378626726567745, "global_step": 44307, "epoch": 372, "lr": 3.190316596277654e-05} +{"train_loss": 0.002881248714402318, "global_step": 44308, "epoch": 372, "lr": 3.1901100676526304e-05} +{"train_loss": 0.0011451778700575233, "global_step": 44309, "epoch": 372, "lr": 3.189903542581132e-05} +{"train_loss": 0.0015268780989572406, "global_step": 44310, "epoch": 372, "lr": 3.1896970210635655e-05} +{"train_loss": 0.0021274180617183447, "global_step": 44311, "epoch": 372, "lr": 3.1894905031003336e-05} +{"train_loss": 0.002163561061024666, "global_step": 44312, "epoch": 372, "lr": 3.189283988691846e-05} +{"train_loss": 0.0015580535400658846, "global_step": 44313, "epoch": 372, "lr": 3.189077477838504e-05} +{"train_loss": 0.0019760753493756056, "global_step": 44314, "epoch": 372, "lr": 3.188870970540717e-05} +{"train_loss": 0.0013082674704492092, "global_step": 44315, "epoch": 372, "lr": 3.188664466798888e-05} +{"train_loss": 0.0012059223372489214, "global_step": 44316, "epoch": 372, "lr": 3.188457966613421e-05} +{"train_loss": 0.0010602992260828614, "global_step": 44317, "epoch": 372, "lr": 3.1882514699847254e-05} +{"train_loss": 0.0018981590401381254, "global_step": 44318, "epoch": 372, "lr": 3.188044976913202e-05} +{"train_loss": 0.0008016756037250161, "global_step": 44319, "epoch": 372, "lr": 3.187838487399261e-05} +{"train_loss": 0.0006342646083794534, "global_step": 44320, "epoch": 372, "lr": 3.187632001443306e-05} +{"train_loss": 0.001556960167363286, "global_step": 44321, "epoch": 372, "lr": 3.187425519045739e-05} +{"train_loss": 0.0009308930020779371, "global_step": 44322, "epoch": 372, "lr": 3.187219040206971e-05} +{"train_loss": 0.0031528365798294544, "global_step": 44323, "epoch": 372, "lr": 3.1870125649274024e-05} +{"train_loss": 0.0006739863893017173, "global_step": 44324, "epoch": 372, "lr": 3.1868060932074416e-05} +{"train_loss": 0.002591540105640888, "global_step": 44325, "epoch": 372, "lr": 3.1865996250474946e-05} +{"train_loss": 0.001032021245919168, "global_step": 44326, "epoch": 372, "lr": 3.1863931604479645e-05} +{"train_loss": 0.0026624074671417475, "global_step": 44327, "epoch": 372, "lr": 3.1861866994092586e-05} +{"train_loss": 0.0012471061199903488, "global_step": 44328, "epoch": 372, "lr": 3.1859802419317794e-05} +{"train_loss": 0.0012486582854762673, "global_step": 44329, "epoch": 372, "lr": 3.185773788015937e-05} +{"train_loss": 0.0009305971907451749, "global_step": 44330, "epoch": 372, "lr": 3.185567337662131e-05} +{"train_loss": 0.0014283221680670977, "global_step": 44331, "epoch": 372, "lr": 3.1853608908707725e-05} +{"train_loss": 0.0014651493402197957, "global_step": 44332, "epoch": 372, "lr": 3.185154447642261e-05} +{"train_loss": 0.001013236935250461, "global_step": 44333, "epoch": 372, "lr": 3.184948007977008e-05} +{"train_loss": 0.001799470977857709, "global_step": 44334, "epoch": 372, "lr": 3.184741571875415e-05} +{"train_loss": 0.0014561018906533718, "global_step": 44335, "epoch": 372, "lr": 3.184535139337886e-05} +{"train_loss": 0.0011621240992099047, "global_step": 44336, "epoch": 372, "lr": 3.18432871036483e-05} +{"train_loss": 0.0014608671190217137, "global_step": 44337, "epoch": 372, "lr": 3.18412228495665e-05} +{"train_loss": 0.0012266732519492507, "global_step": 44338, "epoch": 372, "lr": 3.183915863113752e-05} +{"train_loss": 0.0008275035652332008, "global_step": 44339, "epoch": 372, "lr": 3.183709444836541e-05} +{"train_loss": 0.0018198220059275627, "global_step": 44340, "epoch": 372, "lr": 3.183503030125423e-05} +{"train_loss": 0.001052768318913877, "global_step": 44341, "epoch": 372, "lr": 3.183296618980802e-05} +{"train_loss": 0.0017227224307134748, "global_step": 44342, "epoch": 372, "lr": 3.183090211403085e-05} +{"train_loss": 0.002517192391678691, "global_step": 44343, "epoch": 372, "lr": 3.182883807392675e-05} +{"train_loss": 0.0007807756192050874, "global_step": 44344, "epoch": 372, "lr": 3.182677406949979e-05} +{"train_loss": 0.0013039532350376248, "global_step": 44345, "epoch": 372, "lr": 3.182471010075402e-05} +{"train_loss": 0.0016936952015385032, "global_step": 44346, "epoch": 372, "lr": 3.1822646167693504e-05} +{"train_loss": 0.0009653975139372051, "global_step": 44347, "epoch": 372, "lr": 3.182058227032225e-05} +{"train_loss": 0.003165364498272538, "global_step": 44348, "epoch": 372, "lr": 3.181851840864437e-05} +{"train_loss": 0.0013427947415038943, "global_step": 44349, "epoch": 372, "lr": 3.181645458266386e-05} +{"train_loss": 0.0013817832805216312, "global_step": 44350, "epoch": 372, "lr": 3.181439079238482e-05} +{"train_loss": 0.001270756358280778, "global_step": 44351, "epoch": 372, "lr": 3.181232703781128e-05} +{"train_loss": 0.0013996186899021268, "global_step": 44352, "epoch": 372, "lr": 3.1810263318947276e-05} +{"train_loss": 0.001004555611871183, "global_step": 44353, "epoch": 372, "lr": 3.180819963579689e-05} +{"train_loss": 0.0012842228170484304, "global_step": 44354, "epoch": 372, "lr": 3.180613598836415e-05} +{"train_loss": 0.0020610084757208824, "global_step": 44355, "epoch": 372, "lr": 3.1804072376653135e-05} +{"train_loss": 0.0010918311309069395, "global_step": 44356, "epoch": 372, "lr": 3.180200880066786e-05} +{"train_loss": 0.001357126166112721, "global_step": 44357, "epoch": 372, "lr": 3.179994526041241e-05} +{"train_loss": 0.0013082224177196622, "global_step": 44358, "epoch": 372, "lr": 3.179788175589082e-05} +{"train_loss": 0.0007850308320485055, "global_step": 44359, "epoch": 372, "lr": 3.179581828710713e-05} +{"train_loss": 0.0017342576757073402, "global_step": 44360, "epoch": 372, "lr": 3.179375485406543e-05} +{"train_loss": 0.00096844881772995, "global_step": 44361, "epoch": 372, "lr": 3.1791691456769725e-05} +{"train_loss": 0.0018805483123287559, "global_step": 44362, "epoch": 372, "lr": 3.178962809522411e-05} +{"train_loss": 0.0007366422796621919, "global_step": 44363, "epoch": 372, "lr": 3.17875647694326e-05} +{"train_loss": 0.0018351252656430006, "global_step": 44364, "epoch": 372, "lr": 3.1785501479399274e-05} +{"train_loss": 0.0015690705040469766, "global_step": 44365, "epoch": 372, "lr": 3.178343822512817e-05} +{"train_loss": 0.0014532754430547357, "global_step": 44366, "epoch": 372, "lr": 3.1781375006623315e-05} +{"train_loss": 0.0009092268301174045, "global_step": 44367, "epoch": 372, "lr": 3.1779311823888815e-05} +{"train_loss": 0.002045476110652089, "global_step": 44368, "epoch": 372, "lr": 3.177724867692866e-05} +{"train_loss": 0.0009501295862719417, "global_step": 44369, "epoch": 372, "lr": 3.177518556574696e-05} +{"train_loss": 0.0012677469057962298, "global_step": 44370, "epoch": 372, "lr": 3.177312249034773e-05} +{"train_loss": 0.0014082627603784204, "global_step": 44371, "epoch": 372, "lr": 3.1771059450735e-05} +{"train_loss": 0.0012586084194481373, "global_step": 44372, "epoch": 372, "lr": 3.176899644691287e-05} +{"train_loss": 0.0011820048093795776, "global_step": 44373, "epoch": 372, "lr": 3.1766933478885357e-05} +{"train_loss": 0.0014569108607247472, "global_step": 44374, "epoch": 372, "lr": 3.176487054665653e-05} +{"train_loss": 0.0011764665832743049, "global_step": 44375, "epoch": 372, "lr": 3.1762807650230425e-05} +{"train_loss": 0.001743443077430129, "global_step": 44376, "epoch": 372, "lr": 3.176074478961111e-05} +{"train_loss": 0.001107722520828247, "global_step": 44377, "epoch": 372, "lr": 3.175868196480262e-05} +{"train_loss": 0.0013159408699721098, "global_step": 44378, "epoch": 372, "lr": 3.1756619175809e-05} +{"train_loss": 0.0011771195568144321, "global_step": 44379, "epoch": 372, "lr": 3.175455642263432e-05} +{"train_loss": 0.0010179674718528986, "global_step": 44380, "epoch": 372, "lr": 3.1752493705282606e-05} +{"train_loss": 0.000928506487980485, "global_step": 44381, "epoch": 372, "lr": 3.175043102375794e-05} +{"train_loss": 0.0007093276362866163, "global_step": 44382, "epoch": 372, "lr": 3.174836837806433e-05} +{"train_loss": 0.0015370446490123868, "global_step": 44383, "epoch": 372, "lr": 3.174630576820588e-05} +{"train_loss": 0.0018350938335061073, "global_step": 44384, "epoch": 372, "lr": 3.174424319418659e-05} +{"train_loss": 0.0018115193815901875, "global_step": 44385, "epoch": 372, "lr": 3.174218065601052e-05} +{"train_loss": 0.0014224740536687818, "global_step": 44386, "epoch": 372, "lr": 3.174011815368174e-05, "val_loss": 0.016988612711429596} +{"train_loss": 0.001005988335236907, "global_step": 44387, "epoch": 373, "lr": 3.173805568720428e-05} +{"train_loss": 0.0016473495634272695, "global_step": 44388, "epoch": 373, "lr": 3.173599325658221e-05} +{"train_loss": 0.0009749173768796027, "global_step": 44389, "epoch": 373, "lr": 3.173393086181955e-05} +{"train_loss": 0.0015037108678370714, "global_step": 44390, "epoch": 373, "lr": 3.173186850292037e-05} +{"train_loss": 0.001438469858840108, "global_step": 44391, "epoch": 373, "lr": 3.1729806179888716e-05} +{"train_loss": 0.0005170191288925707, "global_step": 44392, "epoch": 373, "lr": 3.1727743892728635e-05} +{"train_loss": 0.0008218661532737315, "global_step": 44393, "epoch": 373, "lr": 3.1725681641444175e-05} +{"train_loss": 0.0017561311833560467, "global_step": 44394, "epoch": 373, "lr": 3.172361942603938e-05} +{"train_loss": 0.0009540350292809308, "global_step": 44395, "epoch": 373, "lr": 3.172155724651832e-05} +{"train_loss": 0.0020210586953908205, "global_step": 44396, "epoch": 373, "lr": 3.171949510288504e-05} +{"train_loss": 0.0010441241320222616, "global_step": 44397, "epoch": 373, "lr": 3.1717432995143546e-05} +{"train_loss": 0.0012345168506726623, "global_step": 44398, "epoch": 373, "lr": 3.1715370923297947e-05} +{"train_loss": 0.0008392127347178757, "global_step": 44399, "epoch": 373, "lr": 3.1713308887352246e-05} +{"train_loss": 0.0011510642943903804, "global_step": 44400, "epoch": 373, "lr": 3.171124688731052e-05} +{"train_loss": 0.0015180337941274047, "global_step": 44401, "epoch": 373, "lr": 3.170918492317679e-05} +{"train_loss": 0.001470846589654684, "global_step": 44402, "epoch": 373, "lr": 3.170712299495515e-05} +{"train_loss": 0.001231662929058075, "global_step": 44403, "epoch": 373, "lr": 3.1705061102649615e-05} +{"train_loss": 0.0013767699711024761, "global_step": 44404, "epoch": 373, "lr": 3.1702999246264206e-05} +{"train_loss": 0.0008960080449469388, "global_step": 44405, "epoch": 373, "lr": 3.170093742580304e-05} +{"train_loss": 0.0012034740066155791, "global_step": 44406, "epoch": 373, "lr": 3.16988756412701e-05} +{"train_loss": 0.0020604028832167387, "global_step": 44407, "epoch": 373, "lr": 3.1696813892669477e-05} +{"train_loss": 0.0019540460780262947, "global_step": 44408, "epoch": 373, "lr": 3.169475218000521e-05} +{"train_loss": 0.0009320082026533782, "global_step": 44409, "epoch": 373, "lr": 3.1692690503281324e-05} +{"train_loss": 0.0008717330056242645, "global_step": 44410, "epoch": 373, "lr": 3.1690628862501904e-05} +{"train_loss": 0.0004904216038994491, "global_step": 44411, "epoch": 373, "lr": 3.1688567257670956e-05} +{"train_loss": 0.0009123205090872943, "global_step": 44412, "epoch": 373, "lr": 3.168650568879257e-05} +{"train_loss": 0.003024626988917589, "global_step": 44413, "epoch": 373, "lr": 3.168444415587076e-05} +{"train_loss": 0.002061233390122652, "global_step": 44414, "epoch": 373, "lr": 3.1682382658909604e-05} +{"train_loss": 0.0007695708191022277, "global_step": 44415, "epoch": 373, "lr": 3.168032119791313e-05} +{"train_loss": 0.0009612991125322878, "global_step": 44416, "epoch": 373, "lr": 3.167825977288536e-05} +{"train_loss": 0.001120544970035553, "global_step": 44417, "epoch": 373, "lr": 3.16761983838304e-05} +{"train_loss": 0.0006672650342807174, "global_step": 44418, "epoch": 373, "lr": 3.1674137030752246e-05} +{"train_loss": 0.0014822562225162983, "global_step": 44419, "epoch": 373, "lr": 3.167207571365499e-05} +{"train_loss": 0.0014055926585569978, "global_step": 44420, "epoch": 373, "lr": 3.167001443254265e-05} +{"train_loss": 0.0018222827930003405, "global_step": 44421, "epoch": 373, "lr": 3.166795318741926e-05} +{"train_loss": 0.000884596782270819, "global_step": 44422, "epoch": 373, "lr": 3.1665891978288895e-05} +{"train_loss": 0.0010731903603300452, "global_step": 44423, "epoch": 373, "lr": 3.166383080515559e-05} +{"train_loss": 0.0012804795987904072, "global_step": 44424, "epoch": 373, "lr": 3.16617696680234e-05} +{"train_loss": 0.0016204941784963012, "global_step": 44425, "epoch": 373, "lr": 3.165970856689636e-05} +{"train_loss": 0.0021574534475803375, "global_step": 44426, "epoch": 373, "lr": 3.165764750177853e-05} +{"train_loss": 0.0007044996018521488, "global_step": 44427, "epoch": 373, "lr": 3.1655586472673953e-05} +{"train_loss": 0.0014181735459715128, "global_step": 44428, "epoch": 373, "lr": 3.165352547958665e-05} +{"train_loss": 0.002213607309386134, "global_step": 44429, "epoch": 373, "lr": 3.1651464522520715e-05} +{"train_loss": 0.0016722498694434762, "global_step": 44430, "epoch": 373, "lr": 3.164940360148015e-05} +{"train_loss": 0.0014633233658969402, "global_step": 44431, "epoch": 373, "lr": 3.1647342716469045e-05} +{"train_loss": 0.0008997699478641152, "global_step": 44432, "epoch": 373, "lr": 3.1645281867491396e-05} +{"train_loss": 0.0011833911994472146, "global_step": 44433, "epoch": 373, "lr": 3.1643221054551286e-05} +{"train_loss": 0.0015469082864001393, "global_step": 44434, "epoch": 373, "lr": 3.164116027765276e-05} +{"train_loss": 0.0008684048661962152, "global_step": 44435, "epoch": 373, "lr": 3.163909953679983e-05} +{"train_loss": 0.0015166621888056397, "global_step": 44436, "epoch": 373, "lr": 3.1637038831996594e-05} +{"train_loss": 0.002170354127883911, "global_step": 44437, "epoch": 373, "lr": 3.1634978163247045e-05} +{"train_loss": 0.0007754361140541732, "global_step": 44438, "epoch": 373, "lr": 3.163291753055528e-05} +{"train_loss": 0.0015280368970707059, "global_step": 44439, "epoch": 373, "lr": 3.16308569339253e-05} +{"train_loss": 0.0010871058329939842, "global_step": 44440, "epoch": 373, "lr": 3.162879637336118e-05} +{"train_loss": 0.0018917650450021029, "global_step": 44441, "epoch": 373, "lr": 3.162673584886695e-05} +{"train_loss": 0.0011151317739859223, "global_step": 44442, "epoch": 373, "lr": 3.162467536044666e-05} +{"train_loss": 0.000973715097643435, "global_step": 44443, "epoch": 373, "lr": 3.162261490810436e-05} +{"train_loss": 0.001412666286341846, "global_step": 44444, "epoch": 373, "lr": 3.162055449184408e-05} +{"train_loss": 0.0010058186016976833, "global_step": 44445, "epoch": 373, "lr": 3.1618494111669896e-05} +{"train_loss": 0.0024821029510349035, "global_step": 44446, "epoch": 373, "lr": 3.161643376758584e-05} +{"train_loss": 0.0011948979226872325, "global_step": 44447, "epoch": 373, "lr": 3.161437345959593e-05} +{"train_loss": 0.0010634181089699268, "global_step": 44448, "epoch": 373, "lr": 3.1612313187704254e-05} +{"train_loss": 0.001833306741900742, "global_step": 44449, "epoch": 373, "lr": 3.1610252951914816e-05} +{"train_loss": 0.001561902230605483, "global_step": 44450, "epoch": 373, "lr": 3.16081927522317e-05} +{"train_loss": 0.000611231429502368, "global_step": 44451, "epoch": 373, "lr": 3.160613258865891e-05} +{"train_loss": 0.0014149616472423077, "global_step": 44452, "epoch": 373, "lr": 3.160407246120054e-05} +{"train_loss": 0.0008098774123936892, "global_step": 44453, "epoch": 373, "lr": 3.160201236986061e-05} +{"train_loss": 0.0009350060718134046, "global_step": 44454, "epoch": 373, "lr": 3.159995231464314e-05} +{"train_loss": 0.001633487525396049, "global_step": 44455, "epoch": 373, "lr": 3.1597892295552214e-05} +{"train_loss": 0.00128225889056921, "global_step": 44456, "epoch": 373, "lr": 3.1595832312591845e-05} +{"train_loss": 0.0014657791471108794, "global_step": 44457, "epoch": 373, "lr": 3.1593772365766105e-05} +{"train_loss": 0.0018198778852820396, "global_step": 44458, "epoch": 373, "lr": 3.159171245507903e-05} +{"train_loss": 0.0012593988794833422, "global_step": 44459, "epoch": 373, "lr": 3.1589652580534646e-05} +{"train_loss": 0.0010216108057647943, "global_step": 44460, "epoch": 373, "lr": 3.158759274213703e-05} +{"train_loss": 0.0018386259907856584, "global_step": 44461, "epoch": 373, "lr": 3.1585532939890186e-05} +{"train_loss": 0.0019932612776756287, "global_step": 44462, "epoch": 373, "lr": 3.1583473173798204e-05} +{"train_loss": 0.0009956422727555037, "global_step": 44463, "epoch": 373, "lr": 3.158141344386509e-05} +{"train_loss": 0.0011125982273370028, "global_step": 44464, "epoch": 373, "lr": 3.157935375009492e-05} +{"train_loss": 0.000807088625151664, "global_step": 44465, "epoch": 373, "lr": 3.157729409249172e-05} +{"train_loss": 0.0018772832117974758, "global_step": 44466, "epoch": 373, "lr": 3.157523447105951e-05} +{"train_loss": 0.0008201083401218057, "global_step": 44467, "epoch": 373, "lr": 3.1573174885802384e-05} +{"train_loss": 0.0011381108779460192, "global_step": 44468, "epoch": 373, "lr": 3.1571115336724336e-05} +{"train_loss": 0.0008776678005233407, "global_step": 44469, "epoch": 373, "lr": 3.1569055823829455e-05} +{"train_loss": 0.0008638795698061585, "global_step": 44470, "epoch": 373, "lr": 3.1566996347121746e-05} +{"train_loss": 0.0008557021501474082, "global_step": 44471, "epoch": 373, "lr": 3.1564936906605295e-05} +{"train_loss": 0.0012255689362064004, "global_step": 44472, "epoch": 373, "lr": 3.1562877502284106e-05} +{"train_loss": 0.0009908282663673162, "global_step": 44473, "epoch": 373, "lr": 3.156081813416224e-05} +{"train_loss": 0.0009783857967704535, "global_step": 44474, "epoch": 373, "lr": 3.1558758802243734e-05} +{"train_loss": 0.0008349950076080859, "global_step": 44475, "epoch": 373, "lr": 3.1556699506532634e-05} +{"train_loss": 0.0019164136610925198, "global_step": 44476, "epoch": 373, "lr": 3.1554640247032985e-05} +{"train_loss": 0.0005814881296828389, "global_step": 44477, "epoch": 373, "lr": 3.155258102374884e-05} +{"train_loss": 0.0009542767656967044, "global_step": 44478, "epoch": 373, "lr": 3.155052183668421e-05} +{"train_loss": 0.0008020116365514696, "global_step": 44479, "epoch": 373, "lr": 3.154846268584318e-05} +{"train_loss": 0.0010304595343768597, "global_step": 44480, "epoch": 373, "lr": 3.154640357122976e-05} +{"train_loss": 0.0010599838569760323, "global_step": 44481, "epoch": 373, "lr": 3.154434449284802e-05} +{"train_loss": 0.0006484597688540816, "global_step": 44482, "epoch": 373, "lr": 3.1542285450701966e-05} +{"train_loss": 0.000754973734728992, "global_step": 44483, "epoch": 373, "lr": 3.154022644479569e-05} +{"train_loss": 0.0006571777048520744, "global_step": 44484, "epoch": 373, "lr": 3.1538167475133196e-05} +{"train_loss": 0.0008244480122812092, "global_step": 44485, "epoch": 373, "lr": 3.153610854171852e-05} +{"train_loss": 0.0007957599591463804, "global_step": 44486, "epoch": 373, "lr": 3.153404964455574e-05} +{"train_loss": 0.0011174079263582826, "global_step": 44487, "epoch": 373, "lr": 3.153199078364887e-05} +{"train_loss": 0.0007836099248379469, "global_step": 44488, "epoch": 373, "lr": 3.152993195900198e-05} +{"train_loss": 0.00178682676050812, "global_step": 44489, "epoch": 373, "lr": 3.152787317061908e-05} +{"train_loss": 0.0007745538605377078, "global_step": 44490, "epoch": 373, "lr": 3.152581441850423e-05} +{"train_loss": 0.0007549238507635891, "global_step": 44491, "epoch": 373, "lr": 3.1523755702661475e-05} +{"train_loss": 0.001921660965308547, "global_step": 44492, "epoch": 373, "lr": 3.152169702309483e-05} +{"train_loss": 0.0007592755719088018, "global_step": 44493, "epoch": 373, "lr": 3.1519638379808394e-05} +{"train_loss": 0.0012529243249446154, "global_step": 44494, "epoch": 373, "lr": 3.151757977280614e-05} +{"train_loss": 0.0008795643807388842, "global_step": 44495, "epoch": 373, "lr": 3.151552120209217e-05} +{"train_loss": 0.0014227719511836767, "global_step": 44496, "epoch": 373, "lr": 3.15134626676705e-05} +{"train_loss": 0.0015323641709983349, "global_step": 44497, "epoch": 373, "lr": 3.151140416954515e-05} +{"train_loss": 0.0006998447934165597, "global_step": 44498, "epoch": 373, "lr": 3.150934570772021e-05} +{"train_loss": 0.0010789006482809782, "global_step": 44499, "epoch": 373, "lr": 3.150728728219966e-05} +{"train_loss": 0.001496824319474399, "global_step": 44500, "epoch": 373, "lr": 3.15052288929876e-05} +{"train_loss": 0.0013369288062676787, "global_step": 44501, "epoch": 373, "lr": 3.150317054008803e-05} +{"train_loss": 0.0011064247228205204, "global_step": 44502, "epoch": 373, "lr": 3.1501112223505034e-05} +{"train_loss": 0.002037524711340666, "global_step": 44503, "epoch": 373, "lr": 3.1499053943242625e-05} +{"train_loss": 0.0009015424875542521, "global_step": 44504, "epoch": 373, "lr": 3.1496995699304824e-05} +{"train_loss": 0.0012393501130355318, "global_step": 44505, "epoch": 373, "lr": 3.149493749169571e-05, "val_loss": 0.009604210034012794} +{"train_loss": 0.0015267753042280674, "global_step": 44506, "epoch": 374, "lr": 3.1492879320419297e-05} +{"train_loss": 0.0013060994679108262, "global_step": 44507, "epoch": 374, "lr": 3.149082118547965e-05} +{"train_loss": 0.0009474172256886959, "global_step": 44508, "epoch": 374, "lr": 3.14887630868808e-05} +{"train_loss": 0.0014686781214550138, "global_step": 44509, "epoch": 374, "lr": 3.148670502462677e-05} +{"train_loss": 0.002473172964528203, "global_step": 44510, "epoch": 374, "lr": 3.1484646998721646e-05} +{"train_loss": 0.0012355775106698275, "global_step": 44511, "epoch": 374, "lr": 3.148258900916941e-05} +{"train_loss": 0.0009866701439023018, "global_step": 44512, "epoch": 374, "lr": 3.148053105597415e-05} +{"train_loss": 0.0022996054030954838, "global_step": 44513, "epoch": 374, "lr": 3.147847313913987e-05} +{"train_loss": 0.0019119910430163145, "global_step": 44514, "epoch": 374, "lr": 3.147641525867065e-05} +{"train_loss": 0.0007072215084917843, "global_step": 44515, "epoch": 374, "lr": 3.147435741457051e-05} +{"train_loss": 0.001028378028422594, "global_step": 44516, "epoch": 374, "lr": 3.147229960684348e-05} +{"train_loss": 0.002303440123796463, "global_step": 44517, "epoch": 374, "lr": 3.147024183549362e-05} +{"train_loss": 0.0006717964424751699, "global_step": 44518, "epoch": 374, "lr": 3.1468184100524936e-05} +{"train_loss": 0.0008833942702040076, "global_step": 44519, "epoch": 374, "lr": 3.146612640194152e-05} +{"train_loss": 0.0008709657122381032, "global_step": 44520, "epoch": 374, "lr": 3.146406873974736e-05} +{"train_loss": 0.0014607870252802968, "global_step": 44521, "epoch": 374, "lr": 3.1462011113946546e-05} +{"train_loss": 0.0023842109367251396, "global_step": 44522, "epoch": 374, "lr": 3.145995352454308e-05} +{"train_loss": 0.0022420533932745457, "global_step": 44523, "epoch": 374, "lr": 3.145789597154102e-05} +{"train_loss": 0.0013360925950109959, "global_step": 44524, "epoch": 374, "lr": 3.145583845494439e-05} +{"train_loss": 0.0017208491917699575, "global_step": 44525, "epoch": 374, "lr": 3.145378097475725e-05} +{"train_loss": 0.0011528395116329193, "global_step": 44526, "epoch": 374, "lr": 3.145172353098362e-05} +{"train_loss": 0.0016496592434123158, "global_step": 44527, "epoch": 374, "lr": 3.144966612362756e-05} +{"train_loss": 0.0010839867172762752, "global_step": 44528, "epoch": 374, "lr": 3.144760875269309e-05} +{"train_loss": 0.0007837485172785819, "global_step": 44529, "epoch": 374, "lr": 3.1445551418184274e-05} +{"train_loss": 0.000786261516623199, "global_step": 44530, "epoch": 374, "lr": 3.144349412010511e-05} +{"train_loss": 0.0018437067046761513, "global_step": 44531, "epoch": 374, "lr": 3.1441436858459685e-05} +{"train_loss": 0.0013511943398043513, "global_step": 44532, "epoch": 374, "lr": 3.1439379633251994e-05} +{"train_loss": 0.0017881669336929917, "global_step": 44533, "epoch": 374, "lr": 3.143732244448613e-05} +{"train_loss": 0.001176576828584075, "global_step": 44534, "epoch": 374, "lr": 3.143526529216608e-05} +{"train_loss": 0.0017840059008449316, "global_step": 44535, "epoch": 374, "lr": 3.1433208176295906e-05} +{"train_loss": 0.001397778745740652, "global_step": 44536, "epoch": 374, "lr": 3.1431151096879655e-05} +{"train_loss": 0.0028933589346706867, "global_step": 44537, "epoch": 374, "lr": 3.142909405392133e-05} +{"train_loss": 0.0009516407735645771, "global_step": 44538, "epoch": 374, "lr": 3.142703704742501e-05} +{"train_loss": 0.001769357011653483, "global_step": 44539, "epoch": 374, "lr": 3.142498007739472e-05} +{"train_loss": 0.0012004505842924118, "global_step": 44540, "epoch": 374, "lr": 3.1422923143834485e-05} +{"train_loss": 0.0007261184509843588, "global_step": 44541, "epoch": 374, "lr": 3.142086624674837e-05} +{"train_loss": 0.0013692846987396479, "global_step": 44542, "epoch": 374, "lr": 3.141880938614038e-05} +{"train_loss": 0.0014223236357793212, "global_step": 44543, "epoch": 374, "lr": 3.14167525620146e-05} +{"train_loss": 0.0012007239274680614, "global_step": 44544, "epoch": 374, "lr": 3.141469577437501e-05} +{"train_loss": 0.0028805893380194902, "global_step": 44545, "epoch": 374, "lr": 3.141263902322571e-05} +{"train_loss": 0.0008404406835325062, "global_step": 44546, "epoch": 374, "lr": 3.1410582308570706e-05} +{"train_loss": 0.0009493595571257174, "global_step": 44547, "epoch": 374, "lr": 3.140852563041401e-05} +{"train_loss": 0.0013197804801166058, "global_step": 44548, "epoch": 374, "lr": 3.140646898875972e-05} +{"train_loss": 0.0019198826048523188, "global_step": 44549, "epoch": 374, "lr": 3.1404412383611816e-05} +{"train_loss": 0.0015207756077870727, "global_step": 44550, "epoch": 374, "lr": 3.1402355814974376e-05} +{"train_loss": 0.001749553019180894, "global_step": 44551, "epoch": 374, "lr": 3.140029928285141e-05} +{"train_loss": 0.0011518680257722735, "global_step": 44552, "epoch": 374, "lr": 3.139824278724699e-05} +{"train_loss": 0.0011694720014929771, "global_step": 44553, "epoch": 374, "lr": 3.1396186328165125e-05} +{"train_loss": 0.0027243553195148706, "global_step": 44554, "epoch": 374, "lr": 3.139412990560985e-05} +{"train_loss": 0.001331121544353664, "global_step": 44555, "epoch": 374, "lr": 3.1392073519585216e-05} +{"train_loss": 0.0008444517734460533, "global_step": 44556, "epoch": 374, "lr": 3.1390017170095264e-05} +{"train_loss": 0.0010406224755570292, "global_step": 44557, "epoch": 374, "lr": 3.1387960857144016e-05} +{"train_loss": 0.001979229273274541, "global_step": 44558, "epoch": 374, "lr": 3.138590458073554e-05} +{"train_loss": 0.0011518531246110797, "global_step": 44559, "epoch": 374, "lr": 3.138384834087382e-05} +{"train_loss": 0.0027424024883657694, "global_step": 44560, "epoch": 374, "lr": 3.138179213756295e-05} +{"train_loss": 0.0017782686045393348, "global_step": 44561, "epoch": 374, "lr": 3.137973597080692e-05} +{"train_loss": 0.0013504985254257917, "global_step": 44562, "epoch": 374, "lr": 3.137767984060982e-05} +{"train_loss": 0.0013728641206398606, "global_step": 44563, "epoch": 374, "lr": 3.137562374697562e-05} +{"train_loss": 0.0012965797213837504, "global_step": 44564, "epoch": 374, "lr": 3.137356768990843e-05} +{"train_loss": 0.0014259506715461612, "global_step": 44565, "epoch": 374, "lr": 3.137151166941224e-05} +{"train_loss": 0.0034580063074827194, "global_step": 44566, "epoch": 374, "lr": 3.136945568549108e-05} +{"train_loss": 0.0019006648799404502, "global_step": 44567, "epoch": 374, "lr": 3.1367399738149015e-05} +{"train_loss": 0.0010472550056874752, "global_step": 44568, "epoch": 374, "lr": 3.136534382739006e-05} +{"train_loss": 0.0017421126831322908, "global_step": 44569, "epoch": 374, "lr": 3.136328795321828e-05} +{"train_loss": 0.001017212402075529, "global_step": 44570, "epoch": 374, "lr": 3.1361232115637664e-05} +{"train_loss": 0.0016507778782397509, "global_step": 44571, "epoch": 374, "lr": 3.135917631465231e-05} +{"train_loss": 0.0008074540528468788, "global_step": 44572, "epoch": 374, "lr": 3.1357120550266206e-05} +{"train_loss": 0.001258092699572444, "global_step": 44573, "epoch": 374, "lr": 3.135506482248341e-05} +{"train_loss": 0.0010779864387586713, "global_step": 44574, "epoch": 374, "lr": 3.135300913130794e-05} +{"train_loss": 0.0021923452150076628, "global_step": 44575, "epoch": 374, "lr": 3.135095347674384e-05} +{"train_loss": 0.0024096157867461443, "global_step": 44576, "epoch": 374, "lr": 3.134889785879517e-05} +{"train_loss": 0.0014648836804553866, "global_step": 44577, "epoch": 374, "lr": 3.134684227746595e-05} +{"train_loss": 0.0014975297963246703, "global_step": 44578, "epoch": 374, "lr": 3.1344786732760187e-05} +{"train_loss": 0.0026627362240105867, "global_step": 44579, "epoch": 374, "lr": 3.1342731224681966e-05} +{"train_loss": 0.0013515993487089872, "global_step": 44580, "epoch": 374, "lr": 3.1340675753235285e-05} +{"train_loss": 0.0018471041694283485, "global_step": 44581, "epoch": 374, "lr": 3.133862031842421e-05} +{"train_loss": 0.0012241998920217156, "global_step": 44582, "epoch": 374, "lr": 3.1336564920252734e-05} +{"train_loss": 0.0008353165467269719, "global_step": 44583, "epoch": 374, "lr": 3.133450955872494e-05} +{"train_loss": 0.0010672106873244047, "global_step": 44584, "epoch": 374, "lr": 3.1332454233844844e-05} +{"train_loss": 0.0009133382700383663, "global_step": 44585, "epoch": 374, "lr": 3.1330398945616464e-05} +{"train_loss": 0.002004151465371251, "global_step": 44586, "epoch": 374, "lr": 3.132834369404386e-05} +{"train_loss": 0.001331029343418777, "global_step": 44587, "epoch": 374, "lr": 3.132628847913105e-05} +{"train_loss": 0.001115526887588203, "global_step": 44588, "epoch": 374, "lr": 3.132423330088209e-05} +{"train_loss": 0.0013712478103116155, "global_step": 44589, "epoch": 374, "lr": 3.132217815930099e-05} +{"train_loss": 0.0009144318755716085, "global_step": 44590, "epoch": 374, "lr": 3.13201230543918e-05} +{"train_loss": 0.002072458853945136, "global_step": 44591, "epoch": 374, "lr": 3.1318067986158574e-05} +{"train_loss": 0.0013734062667936087, "global_step": 44592, "epoch": 374, "lr": 3.13160129546053e-05} +{"train_loss": 0.0019164426485076547, "global_step": 44593, "epoch": 374, "lr": 3.131395795973605e-05} +{"train_loss": 0.0017701716860756278, "global_step": 44594, "epoch": 374, "lr": 3.1311903001554836e-05} +{"train_loss": 0.0014579680282622576, "global_step": 44595, "epoch": 374, "lr": 3.130984808006572e-05} +{"train_loss": 0.001659371773712337, "global_step": 44596, "epoch": 374, "lr": 3.1307793195272725e-05} +{"train_loss": 0.0009478570427745581, "global_step": 44597, "epoch": 374, "lr": 3.130573834717986e-05} +{"train_loss": 0.002013532444834709, "global_step": 44598, "epoch": 374, "lr": 3.13036835357912e-05} +{"train_loss": 0.0011661816388368607, "global_step": 44599, "epoch": 374, "lr": 3.130162876111074e-05} +{"train_loss": 0.001917318906635046, "global_step": 44600, "epoch": 374, "lr": 3.129957402314255e-05} +{"train_loss": 0.0014135526726022363, "global_step": 44601, "epoch": 374, "lr": 3.1297519321890635e-05} +{"train_loss": 0.0020801140926778316, "global_step": 44602, "epoch": 374, "lr": 3.129546465735906e-05} +{"train_loss": 0.00277587678283453, "global_step": 44603, "epoch": 374, "lr": 3.1293410029551836e-05} +{"train_loss": 0.0017530169570818543, "global_step": 44604, "epoch": 374, "lr": 3.1291355438472995e-05} +{"train_loss": 0.0010724521707743406, "global_step": 44605, "epoch": 374, "lr": 3.1289300884126586e-05} +{"train_loss": 0.0012516924180090427, "global_step": 44606, "epoch": 374, "lr": 3.128724636651663e-05} +{"train_loss": 0.0019338312558829784, "global_step": 44607, "epoch": 374, "lr": 3.128519188564717e-05} +{"train_loss": 0.001191256451420486, "global_step": 44608, "epoch": 374, "lr": 3.1283137441522246e-05} +{"train_loss": 0.0016139104263857007, "global_step": 44609, "epoch": 374, "lr": 3.128108303414586e-05} +{"train_loss": 0.0011826039990410209, "global_step": 44610, "epoch": 374, "lr": 3.1279028663522094e-05} +{"train_loss": 0.0008159686112776399, "global_step": 44611, "epoch": 374, "lr": 3.1276974329654924e-05} +{"train_loss": 0.0015199653571471572, "global_step": 44612, "epoch": 374, "lr": 3.1274920032548436e-05} +{"train_loss": 0.0017198144923895597, "global_step": 44613, "epoch": 374, "lr": 3.127286577220663e-05} +{"train_loss": 0.0009784927824512124, "global_step": 44614, "epoch": 374, "lr": 3.127081154863357e-05} +{"train_loss": 0.001409923075698316, "global_step": 44615, "epoch": 374, "lr": 3.126875736183327e-05} +{"train_loss": 0.0013460967456921935, "global_step": 44616, "epoch": 374, "lr": 3.126670321180974e-05} +{"train_loss": 0.000903266598470509, "global_step": 44617, "epoch": 374, "lr": 3.126464909856706e-05} +{"train_loss": 0.0008886577561497688, "global_step": 44618, "epoch": 374, "lr": 3.126259502210922e-05} +{"train_loss": 0.0016438012244179845, "global_step": 44619, "epoch": 374, "lr": 3.126054098244029e-05} +{"train_loss": 0.0012440462596714497, "global_step": 44620, "epoch": 374, "lr": 3.125848697956427e-05} +{"train_loss": 0.001037604990415275, "global_step": 44621, "epoch": 374, "lr": 3.125643301348523e-05} +{"train_loss": 0.0013120529474690557, "global_step": 44622, "epoch": 374, "lr": 3.125437908420716e-05} +{"train_loss": 0.0015047856140881777, "global_step": 44623, "epoch": 374, "lr": 3.125232519173413e-05} +{"train_loss": 0.0014894209942044768, "global_step": 44624, "epoch": 374, "lr": 3.125027133607015e-05, "val_loss": 0.017466042190790176} +{"train_loss": 0.0018039029091596603, "global_step": 44625, "epoch": 375, "lr": 3.1248217517219246e-05} +{"train_loss": 0.0012036103289574385, "global_step": 44626, "epoch": 375, "lr": 3.1246163735185483e-05} +{"train_loss": 0.001943646464496851, "global_step": 44627, "epoch": 375, "lr": 3.124410998997287e-05} +{"train_loss": 0.0030267825350165367, "global_step": 44628, "epoch": 375, "lr": 3.1242056281585434e-05} +{"train_loss": 0.0013419747119769454, "global_step": 44629, "epoch": 375, "lr": 3.124000261002723e-05} +{"train_loss": 0.0025305459275841713, "global_step": 44630, "epoch": 375, "lr": 3.123794897530226e-05} +{"train_loss": 0.0009167699608951807, "global_step": 44631, "epoch": 375, "lr": 3.1235895377414595e-05} +{"train_loss": 0.001395222614519298, "global_step": 44632, "epoch": 375, "lr": 3.123384181636822e-05} +{"train_loss": 0.000895263918209821, "global_step": 44633, "epoch": 375, "lr": 3.123178829216721e-05} +{"train_loss": 0.00204674294218421, "global_step": 44634, "epoch": 375, "lr": 3.122973480481558e-05} +{"train_loss": 0.0017944559222087264, "global_step": 44635, "epoch": 375, "lr": 3.1227681354317345e-05} +{"train_loss": 0.001798582379706204, "global_step": 44636, "epoch": 375, "lr": 3.1225627940676575e-05} +{"train_loss": 0.0011031953617930412, "global_step": 44637, "epoch": 375, "lr": 3.122357456389725e-05} +{"train_loss": 0.001785955624654889, "global_step": 44638, "epoch": 375, "lr": 3.122152122398344e-05} +{"train_loss": 0.0018118995940312743, "global_step": 44639, "epoch": 375, "lr": 3.121946792093917e-05} +{"train_loss": 0.0014822103548794985, "global_step": 44640, "epoch": 375, "lr": 3.121741465476847e-05} +{"train_loss": 0.003253915114328265, "global_step": 44641, "epoch": 375, "lr": 3.1215361425475376e-05} +{"train_loss": 0.0011353619629517198, "global_step": 44642, "epoch": 375, "lr": 3.12133082330639e-05} +{"train_loss": 0.0012396356323733926, "global_step": 44643, "epoch": 375, "lr": 3.12112550775381e-05} +{"train_loss": 0.0016115977196022868, "global_step": 44644, "epoch": 375, "lr": 3.120920195890197e-05} +{"train_loss": 0.001744499197229743, "global_step": 44645, "epoch": 375, "lr": 3.120714887715959e-05} +{"train_loss": 0.0016487903194501996, "global_step": 44646, "epoch": 375, "lr": 3.120509583231497e-05} +{"train_loss": 0.0009840719867497683, "global_step": 44647, "epoch": 375, "lr": 3.1203042824372106e-05} +{"train_loss": 0.0011305876541882753, "global_step": 44648, "epoch": 375, "lr": 3.120098985333508e-05} +{"train_loss": 0.0009456230909563601, "global_step": 44649, "epoch": 375, "lr": 3.119893691920789e-05} +{"train_loss": 0.0016979547217488289, "global_step": 44650, "epoch": 375, "lr": 3.11968840219946e-05} +{"train_loss": 0.0009181735804304481, "global_step": 44651, "epoch": 375, "lr": 3.119483116169919e-05} +{"train_loss": 0.0006346468580886722, "global_step": 44652, "epoch": 375, "lr": 3.1192778338325746e-05} +{"train_loss": 0.001567928702570498, "global_step": 44653, "epoch": 375, "lr": 3.119072555187827e-05} +{"train_loss": 0.0015483121387660503, "global_step": 44654, "epoch": 375, "lr": 3.1188672802360774e-05} +{"train_loss": 0.0016288267215713859, "global_step": 44655, "epoch": 375, "lr": 3.1186620089777326e-05} +{"train_loss": 0.0008513145730830729, "global_step": 44656, "epoch": 375, "lr": 3.1184567414131934e-05} +{"train_loss": 0.0026517182122915983, "global_step": 44657, "epoch": 375, "lr": 3.118251477542863e-05} +{"train_loss": 0.001671117846854031, "global_step": 44658, "epoch": 375, "lr": 3.118046217367147e-05} +{"train_loss": 0.0020135657396167517, "global_step": 44659, "epoch": 375, "lr": 3.117840960886443e-05} +{"train_loss": 0.0017762379720807076, "global_step": 44660, "epoch": 375, "lr": 3.11763570810116e-05} +{"train_loss": 0.0010595417115837336, "global_step": 44661, "epoch": 375, "lr": 3.117430459011695e-05} +{"train_loss": 0.0012556248111650348, "global_step": 44662, "epoch": 375, "lr": 3.117225213618458e-05} +{"train_loss": 0.001863087061792612, "global_step": 44663, "epoch": 375, "lr": 3.117019971921844e-05} +{"train_loss": 0.0010055265156552196, "global_step": 44664, "epoch": 375, "lr": 3.1168147339222634e-05} +{"train_loss": 0.0017359007615596056, "global_step": 44665, "epoch": 375, "lr": 3.116609499620116e-05} +{"train_loss": 0.0016191808972507715, "global_step": 44666, "epoch": 375, "lr": 3.1164042690158024e-05} +{"train_loss": 0.0025681243278086185, "global_step": 44667, "epoch": 375, "lr": 3.11619904210973e-05} +{"train_loss": 0.0012585797812789679, "global_step": 44668, "epoch": 375, "lr": 3.115993818902297e-05} +{"train_loss": 0.0013131869491189718, "global_step": 44669, "epoch": 375, "lr": 3.115788599393911e-05} +{"train_loss": 0.0018043755553662777, "global_step": 44670, "epoch": 375, "lr": 3.1155833835849715e-05} +{"train_loss": 0.0011267659720033407, "global_step": 44671, "epoch": 375, "lr": 3.115378171475883e-05} +{"train_loss": 0.001489297836087644, "global_step": 44672, "epoch": 375, "lr": 3.115172963067049e-05} +{"train_loss": 0.0012570463586598635, "global_step": 44673, "epoch": 375, "lr": 3.11496775835887e-05} +{"train_loss": 0.0012119939783588052, "global_step": 44674, "epoch": 375, "lr": 3.114762557351752e-05} +{"train_loss": 0.0016756390687078238, "global_step": 44675, "epoch": 375, "lr": 3.114557360046094e-05} +{"train_loss": 0.001554225804284215, "global_step": 44676, "epoch": 375, "lr": 3.1143521664423034e-05} +{"train_loss": 0.0017033994663506746, "global_step": 44677, "epoch": 375, "lr": 3.114146976540781e-05} +{"train_loss": 0.001718202605843544, "global_step": 44678, "epoch": 375, "lr": 3.113941790341929e-05} +{"train_loss": 0.001190782175399363, "global_step": 44679, "epoch": 375, "lr": 3.1137366078461514e-05} +{"train_loss": 0.0006737469811923802, "global_step": 44680, "epoch": 375, "lr": 3.113531429053848e-05} +{"train_loss": 0.0019783552270382643, "global_step": 44681, "epoch": 375, "lr": 3.113326253965427e-05} +{"train_loss": 0.00131005619186908, "global_step": 44682, "epoch": 375, "lr": 3.113121082581286e-05} +{"train_loss": 0.0011218440486118197, "global_step": 44683, "epoch": 375, "lr": 3.112915914901832e-05} +{"train_loss": 0.00131601607427001, "global_step": 44684, "epoch": 375, "lr": 3.112710750927466e-05} +{"train_loss": 0.0011880414094775915, "global_step": 44685, "epoch": 375, "lr": 3.112505590658589e-05} +{"train_loss": 0.0012806705199182034, "global_step": 44686, "epoch": 375, "lr": 3.112300434095606e-05} +{"train_loss": 0.0014227547217160463, "global_step": 44687, "epoch": 375, "lr": 3.11209528123892e-05} +{"train_loss": 0.0020865038968622684, "global_step": 44688, "epoch": 375, "lr": 3.111890132088934e-05} +{"train_loss": 0.0008624413167126477, "global_step": 44689, "epoch": 375, "lr": 3.111684986646049e-05} +{"train_loss": 0.0018246081890538335, "global_step": 44690, "epoch": 375, "lr": 3.111479844910669e-05} +{"train_loss": 0.0017361281206831336, "global_step": 44691, "epoch": 375, "lr": 3.111274706883198e-05} +{"train_loss": 0.0006128230597823858, "global_step": 44692, "epoch": 375, "lr": 3.1110695725640346e-05} +{"train_loss": 0.001347412820905447, "global_step": 44693, "epoch": 375, "lr": 3.110864441953587e-05} +{"train_loss": 0.0011858789948746562, "global_step": 44694, "epoch": 375, "lr": 3.1106593150522524e-05} +{"train_loss": 0.0013660023687407374, "global_step": 44695, "epoch": 375, "lr": 3.110454191860439e-05} +{"train_loss": 0.0006231525912880898, "global_step": 44696, "epoch": 375, "lr": 3.1102490723785474e-05} +{"train_loss": 0.0010200133547186852, "global_step": 44697, "epoch": 375, "lr": 3.1100439566069765e-05} +{"train_loss": 0.0011683707125484943, "global_step": 44698, "epoch": 375, "lr": 3.1098388445461357e-05} +{"train_loss": 0.0015403189463540912, "global_step": 44699, "epoch": 375, "lr": 3.109633736196421e-05} +{"train_loss": 0.0017615449614822865, "global_step": 44700, "epoch": 375, "lr": 3.109428631558242e-05} +{"train_loss": 0.0015440327115356922, "global_step": 44701, "epoch": 375, "lr": 3.109223530631995e-05} +{"train_loss": 0.0011230529053136706, "global_step": 44702, "epoch": 375, "lr": 3.1090184334180876e-05} +{"train_loss": 0.0009085809579119086, "global_step": 44703, "epoch": 375, "lr": 3.10881333991692e-05} +{"train_loss": 0.00140882667619735, "global_step": 44704, "epoch": 375, "lr": 3.108608250128895e-05} +{"train_loss": 0.001246603555046022, "global_step": 44705, "epoch": 375, "lr": 3.108403164054415e-05} +{"train_loss": 0.00212192814797163, "global_step": 44706, "epoch": 375, "lr": 3.1081980816938846e-05} +{"train_loss": 0.0014565723249688745, "global_step": 44707, "epoch": 375, "lr": 3.107993003047705e-05} +{"train_loss": 0.0012186078820377588, "global_step": 44708, "epoch": 375, "lr": 3.1077879281162767e-05} +{"train_loss": 0.001699286513030529, "global_step": 44709, "epoch": 375, "lr": 3.107582856900008e-05} +{"train_loss": 0.0009066913044080138, "global_step": 44710, "epoch": 375, "lr": 3.107377789399298e-05} +{"train_loss": 0.0010733003728091717, "global_step": 44711, "epoch": 375, "lr": 3.1071727256145463e-05} +{"train_loss": 0.0007640178082510829, "global_step": 44712, "epoch": 375, "lr": 3.106967665546162e-05} +{"train_loss": 0.0015167280798777938, "global_step": 44713, "epoch": 375, "lr": 3.1067626091945425e-05} +{"train_loss": 0.002131262794137001, "global_step": 44714, "epoch": 375, "lr": 3.106557556560093e-05} +{"train_loss": 0.002400807337835431, "global_step": 44715, "epoch": 375, "lr": 3.1063525076432174e-05} +{"train_loss": 0.0033673353027552366, "global_step": 44716, "epoch": 375, "lr": 3.1061474624443134e-05} +{"train_loss": 0.0012628106633201241, "global_step": 44717, "epoch": 375, "lr": 3.1059424209637885e-05} +{"train_loss": 0.0018426352180540562, "global_step": 44718, "epoch": 375, "lr": 3.105737383202041e-05} +{"train_loss": 0.0017306080553680658, "global_step": 44719, "epoch": 375, "lr": 3.105532349159478e-05} +{"train_loss": 0.0008333594305440784, "global_step": 44720, "epoch": 375, "lr": 3.1053273188364985e-05} +{"train_loss": 0.0010739532299339771, "global_step": 44721, "epoch": 375, "lr": 3.105122292233506e-05} +{"train_loss": 0.0010541550582274795, "global_step": 44722, "epoch": 375, "lr": 3.1049172693509057e-05} +{"train_loss": 0.001878775772638619, "global_step": 44723, "epoch": 375, "lr": 3.104712250189096e-05} +{"train_loss": 0.0017840327927842736, "global_step": 44724, "epoch": 375, "lr": 3.104507234748482e-05} +{"train_loss": 0.0008408117573708296, "global_step": 44725, "epoch": 375, "lr": 3.1043022230294646e-05} +{"train_loss": 0.0015676089096814394, "global_step": 44726, "epoch": 375, "lr": 3.104097215032449e-05} +{"train_loss": 0.0020873823668807745, "global_step": 44727, "epoch": 375, "lr": 3.103892210757836e-05} +{"train_loss": 0.002056677360087633, "global_step": 44728, "epoch": 375, "lr": 3.103687210206026e-05} +{"train_loss": 0.0017889189766719937, "global_step": 44729, "epoch": 375, "lr": 3.1034822133774254e-05} +{"train_loss": 0.0011840537190437317, "global_step": 44730, "epoch": 375, "lr": 3.103277220272433e-05} +{"train_loss": 0.0020934001076966524, "global_step": 44731, "epoch": 375, "lr": 3.103072230891455e-05} +{"train_loss": 0.001558441435918212, "global_step": 44732, "epoch": 375, "lr": 3.10286724523489e-05} +{"train_loss": 0.000884183042217046, "global_step": 44733, "epoch": 375, "lr": 3.102662263303145e-05} +{"train_loss": 0.001765678753145039, "global_step": 44734, "epoch": 375, "lr": 3.102457285096619e-05} +{"train_loss": 0.0008971659699454904, "global_step": 44735, "epoch": 375, "lr": 3.102252310615714e-05} +{"train_loss": 0.001681955298408866, "global_step": 44736, "epoch": 375, "lr": 3.102047339860835e-05} +{"train_loss": 0.0033735311590135098, "global_step": 44737, "epoch": 375, "lr": 3.101842372832383e-05} +{"train_loss": 0.00230091018602252, "global_step": 44738, "epoch": 375, "lr": 3.101637409530761e-05} +{"train_loss": 0.0007525749388150871, "global_step": 44739, "epoch": 375, "lr": 3.101432449956371e-05} +{"train_loss": 0.001209684880450368, "global_step": 44740, "epoch": 375, "lr": 3.1012274941096156e-05} +{"train_loss": 0.002208155579864979, "global_step": 44741, "epoch": 375, "lr": 3.1010225419908986e-05} +{"train_loss": 0.001963239163160324, "global_step": 44742, "epoch": 375, "lr": 3.100817593600618e-05} +{"train_loss": 0.001527865181047031, "global_step": 44743, "epoch": 375, "lr": 3.100612648939182e-05, "val_loss": 0.028678162023425102, "train_action_mse_error": 1.9113987946184352e-05} +{"train_loss": 0.0009849362540990114, "global_step": 44744, "epoch": 376, "lr": 3.100407708006987e-05} +{"train_loss": 0.0007466754177585244, "global_step": 44745, "epoch": 376, "lr": 3.1002027708044415e-05} +{"train_loss": 0.0009129648096859455, "global_step": 44746, "epoch": 376, "lr": 3.099997837331945e-05} +{"train_loss": 0.0019075045129284263, "global_step": 44747, "epoch": 376, "lr": 3.099792907589897e-05} +{"train_loss": 0.0009128146921284497, "global_step": 44748, "epoch": 376, "lr": 3.0995879815787056e-05} +{"train_loss": 0.0012978145387023687, "global_step": 44749, "epoch": 376, "lr": 3.099383059298767e-05} +{"train_loss": 0.0024115885607898235, "global_step": 44750, "epoch": 376, "lr": 3.09917814075049e-05} +{"train_loss": 0.0008944535511545837, "global_step": 44751, "epoch": 376, "lr": 3.0989732259342705e-05} +{"train_loss": 0.002298024483025074, "global_step": 44752, "epoch": 376, "lr": 3.0987683148505165e-05} +{"train_loss": 0.002489992883056402, "global_step": 44753, "epoch": 376, "lr": 3.098563407499627e-05} +{"train_loss": 0.0008484529098495841, "global_step": 44754, "epoch": 376, "lr": 3.0983585038820054e-05} +{"train_loss": 0.001176990568637848, "global_step": 44755, "epoch": 376, "lr": 3.098153603998053e-05} +{"train_loss": 0.0007970889564603567, "global_step": 44756, "epoch": 376, "lr": 3.097948707848173e-05} +{"train_loss": 0.002144694561138749, "global_step": 44757, "epoch": 376, "lr": 3.097743815432768e-05} +{"train_loss": 0.0013796844286844134, "global_step": 44758, "epoch": 376, "lr": 3.097538926752238e-05} +{"train_loss": 0.0013044282095506787, "global_step": 44759, "epoch": 376, "lr": 3.097334041806988e-05} +{"train_loss": 0.0012184794759377837, "global_step": 44760, "epoch": 376, "lr": 3.0971291605974216e-05} +{"train_loss": 0.0013708478072658181, "global_step": 44761, "epoch": 376, "lr": 3.096924283123936e-05} +{"train_loss": 0.001977312844246626, "global_step": 44762, "epoch": 376, "lr": 3.096719409386938e-05} +{"train_loss": 0.000947916298173368, "global_step": 44763, "epoch": 376, "lr": 3.096514539386827e-05} +{"train_loss": 0.001506154891103506, "global_step": 44764, "epoch": 376, "lr": 3.096309673124007e-05} +{"train_loss": 0.001216432312503457, "global_step": 44765, "epoch": 376, "lr": 3.09610481059888e-05} +{"train_loss": 0.000707455154042691, "global_step": 44766, "epoch": 376, "lr": 3.0958999518118456e-05} +{"train_loss": 0.0014527273597195745, "global_step": 44767, "epoch": 376, "lr": 3.095695096763311e-05} +{"train_loss": 0.0010922880610451102, "global_step": 44768, "epoch": 376, "lr": 3.095490245453674e-05} +{"train_loss": 0.0011313945287838578, "global_step": 44769, "epoch": 376, "lr": 3.09528539788334e-05} +{"train_loss": 0.0022154459729790688, "global_step": 44770, "epoch": 376, "lr": 3.0950805540527064e-05} +{"train_loss": 0.0015891598304733634, "global_step": 44771, "epoch": 376, "lr": 3.094875713962181e-05} +{"train_loss": 0.0021571628749370575, "global_step": 44772, "epoch": 376, "lr": 3.0946708776121634e-05} +{"train_loss": 0.0012487858766689897, "global_step": 44773, "epoch": 376, "lr": 3.094466045003055e-05} +{"train_loss": 0.0024624192155897617, "global_step": 44774, "epoch": 376, "lr": 3.094261216135261e-05} +{"train_loss": 0.0009240600047633052, "global_step": 44775, "epoch": 376, "lr": 3.094056391009179e-05} +{"train_loss": 0.0009169323602691293, "global_step": 44776, "epoch": 376, "lr": 3.0938515696252155e-05} +{"train_loss": 0.0012130190152674913, "global_step": 44777, "epoch": 376, "lr": 3.09364675198377e-05} +{"train_loss": 0.0016963585512712598, "global_step": 44778, "epoch": 376, "lr": 3.0934419380852466e-05} +{"train_loss": 0.0011922137346118689, "global_step": 44779, "epoch": 376, "lr": 3.093237127930046e-05} +{"train_loss": 0.001733474782668054, "global_step": 44780, "epoch": 376, "lr": 3.0930323215185685e-05} +{"train_loss": 0.0025168457068502903, "global_step": 44781, "epoch": 376, "lr": 3.092827518851221e-05} +{"train_loss": 0.0010139292571693659, "global_step": 44782, "epoch": 376, "lr": 3.0926227199284006e-05} +{"train_loss": 0.0008509960025548935, "global_step": 44783, "epoch": 376, "lr": 3.0924179247505135e-05} +{"train_loss": 0.0009039317956194282, "global_step": 44784, "epoch": 376, "lr": 3.092213133317959e-05} +{"train_loss": 0.0011085809674113989, "global_step": 44785, "epoch": 376, "lr": 3.0920083456311396e-05} +{"train_loss": 0.0020232698880136013, "global_step": 44786, "epoch": 376, "lr": 3.091803561690459e-05} +{"train_loss": 0.001143995439633727, "global_step": 44787, "epoch": 376, "lr": 3.091598781496319e-05} +{"train_loss": 0.0017616936238482594, "global_step": 44788, "epoch": 376, "lr": 3.09139400504912e-05} +{"train_loss": 0.0021514748223125935, "global_step": 44789, "epoch": 376, "lr": 3.091189232349264e-05} +{"train_loss": 0.0015974303241819143, "global_step": 44790, "epoch": 376, "lr": 3.0909844633971554e-05} +{"train_loss": 0.0014067994197830558, "global_step": 44791, "epoch": 376, "lr": 3.090779698193195e-05} +{"train_loss": 0.002021683845669031, "global_step": 44792, "epoch": 376, "lr": 3.090574936737783e-05} +{"train_loss": 0.0011238574516028166, "global_step": 44793, "epoch": 376, "lr": 3.090370179031325e-05} +{"train_loss": 0.0016442298656329513, "global_step": 44794, "epoch": 376, "lr": 3.090165425074219e-05} +{"train_loss": 0.0019793794490396976, "global_step": 44795, "epoch": 376, "lr": 3.089960674866872e-05} +{"train_loss": 0.0013603445840999484, "global_step": 44796, "epoch": 376, "lr": 3.0897559284096824e-05} +{"train_loss": 0.0008665219065733254, "global_step": 44797, "epoch": 376, "lr": 3.089551185703051e-05} +{"train_loss": 0.0020370734855532646, "global_step": 44798, "epoch": 376, "lr": 3.0893464467473845e-05} +{"train_loss": 0.0022418759763240814, "global_step": 44799, "epoch": 376, "lr": 3.089141711543079e-05} +{"train_loss": 0.0016612823819741607, "global_step": 44800, "epoch": 376, "lr": 3.088936980090542e-05} +{"train_loss": 0.0019574908073991537, "global_step": 44801, "epoch": 376, "lr": 3.088732252390172e-05} +{"train_loss": 0.0009392176289111376, "global_step": 44802, "epoch": 376, "lr": 3.088527528442373e-05} +{"train_loss": 0.00175405852496624, "global_step": 44803, "epoch": 376, "lr": 3.088322808247545e-05} +{"train_loss": 0.0014919814420863986, "global_step": 44804, "epoch": 376, "lr": 3.088118091806091e-05} +{"train_loss": 0.0017294586868956685, "global_step": 44805, "epoch": 376, "lr": 3.087913379118413e-05} +{"train_loss": 0.0017843793611973524, "global_step": 44806, "epoch": 376, "lr": 3.087708670184912e-05} +{"train_loss": 0.0011007495922967792, "global_step": 44807, "epoch": 376, "lr": 3.0875039650059926e-05} +{"train_loss": 0.002114079659804702, "global_step": 44808, "epoch": 376, "lr": 3.087299263582053e-05} +{"train_loss": 0.000692204455845058, "global_step": 44809, "epoch": 376, "lr": 3.0870945659134984e-05} +{"train_loss": 0.0015596753219142556, "global_step": 44810, "epoch": 376, "lr": 3.08688987200073e-05} +{"train_loss": 0.0017077417578548193, "global_step": 44811, "epoch": 376, "lr": 3.0866851818441465e-05} +{"train_loss": 0.0013731915969401598, "global_step": 44812, "epoch": 376, "lr": 3.086480495444154e-05} +{"train_loss": 0.0007851387490518391, "global_step": 44813, "epoch": 376, "lr": 3.086275812801152e-05} +{"train_loss": 0.0016832025721669197, "global_step": 44814, "epoch": 376, "lr": 3.086071133915543e-05} +{"train_loss": 0.0024675701279193163, "global_step": 44815, "epoch": 376, "lr": 3.08586645878773e-05} +{"train_loss": 0.001769458525814116, "global_step": 44816, "epoch": 376, "lr": 3.085661787418112e-05} +{"train_loss": 0.0011214230908080935, "global_step": 44817, "epoch": 376, "lr": 3.085457119807094e-05} +{"train_loss": 0.0012800160329788923, "global_step": 44818, "epoch": 376, "lr": 3.085252455955074e-05} +{"train_loss": 0.0006745346472598612, "global_step": 44819, "epoch": 376, "lr": 3.085047795862458e-05} +{"train_loss": 0.0015225679380819201, "global_step": 44820, "epoch": 376, "lr": 3.084843139529645e-05} +{"train_loss": 0.002047874964773655, "global_step": 44821, "epoch": 376, "lr": 3.0846384869570386e-05} +{"train_loss": 0.0013510551070794463, "global_step": 44822, "epoch": 376, "lr": 3.084433838145041e-05} +{"train_loss": 0.0009596326854079962, "global_step": 44823, "epoch": 376, "lr": 3.0842291930940515e-05} +{"train_loss": 0.0007098920177668333, "global_step": 44824, "epoch": 376, "lr": 3.084024551804474e-05} +{"train_loss": 0.0009508969960734248, "global_step": 44825, "epoch": 376, "lr": 3.083819914276709e-05} +{"train_loss": 0.0008486966253258288, "global_step": 44826, "epoch": 376, "lr": 3.08361528051116e-05} +{"train_loss": 0.001418963773176074, "global_step": 44827, "epoch": 376, "lr": 3.083410650508226e-05} +{"train_loss": 0.001328058773651719, "global_step": 44828, "epoch": 376, "lr": 3.083206024268312e-05} +{"train_loss": 0.002336694858968258, "global_step": 44829, "epoch": 376, "lr": 3.083001401791818e-05} +{"train_loss": 0.0014657302526757121, "global_step": 44830, "epoch": 376, "lr": 3.082796783079145e-05} +{"train_loss": 0.0015685734106227756, "global_step": 44831, "epoch": 376, "lr": 3.082592168130697e-05} +{"train_loss": 0.0022493628785014153, "global_step": 44832, "epoch": 376, "lr": 3.082387556946873e-05} +{"train_loss": 0.0018924155738204718, "global_step": 44833, "epoch": 376, "lr": 3.0821829495280774e-05} +{"train_loss": 0.0008433866896666586, "global_step": 44834, "epoch": 376, "lr": 3.08197834587471e-05} +{"train_loss": 0.0015802003908902407, "global_step": 44835, "epoch": 376, "lr": 3.0817737459871733e-05} +{"train_loss": 0.001096865744329989, "global_step": 44836, "epoch": 376, "lr": 3.081569149865868e-05} +{"train_loss": 0.0018723339308053255, "global_step": 44837, "epoch": 376, "lr": 3.081364557511198e-05} +{"train_loss": 0.0008226374629884958, "global_step": 44838, "epoch": 376, "lr": 3.0811599689235634e-05} +{"train_loss": 0.0007624090067110956, "global_step": 44839, "epoch": 376, "lr": 3.080955384103366e-05} +{"train_loss": 0.0012986098881810904, "global_step": 44840, "epoch": 376, "lr": 3.080750803051008e-05} +{"train_loss": 0.0016347491182386875, "global_step": 44841, "epoch": 376, "lr": 3.080546225766892e-05} +{"train_loss": 0.0017248662188649178, "global_step": 44842, "epoch": 376, "lr": 3.080341652251415e-05} +{"train_loss": 0.000579100742470473, "global_step": 44843, "epoch": 376, "lr": 3.080137082504985e-05} +{"train_loss": 0.001469491282477975, "global_step": 44844, "epoch": 376, "lr": 3.079932516527999e-05} +{"train_loss": 0.0009330493048764765, "global_step": 44845, "epoch": 376, "lr": 3.079727954320862e-05} +{"train_loss": 0.0006147793028503656, "global_step": 44846, "epoch": 376, "lr": 3.079523395883974e-05} +{"train_loss": 0.0015929978108033538, "global_step": 44847, "epoch": 376, "lr": 3.079318841217735e-05} +{"train_loss": 0.0009669575374573469, "global_step": 44848, "epoch": 376, "lr": 3.07911429032255e-05} +{"train_loss": 0.002141025848686695, "global_step": 44849, "epoch": 376, "lr": 3.078909743198817e-05} +{"train_loss": 0.0011627585627138615, "global_step": 44850, "epoch": 376, "lr": 3.078705199846941e-05} +{"train_loss": 0.002650107257068157, "global_step": 44851, "epoch": 376, "lr": 3.0785006602673206e-05} +{"train_loss": 0.0017717186128720641, "global_step": 44852, "epoch": 376, "lr": 3.0782961244603606e-05} +{"train_loss": 0.003054747823625803, "global_step": 44853, "epoch": 376, "lr": 3.0780915924264595e-05} +{"train_loss": 0.0007310457294806838, "global_step": 44854, "epoch": 376, "lr": 3.07788706416602e-05} +{"train_loss": 0.0010073072044178843, "global_step": 44855, "epoch": 376, "lr": 3.0776825396794456e-05} +{"train_loss": 0.0013607960427179933, "global_step": 44856, "epoch": 376, "lr": 3.0774780189671345e-05} +{"train_loss": 0.0009012632654048502, "global_step": 44857, "epoch": 376, "lr": 3.0772735020294916e-05} +{"train_loss": 0.0005512884235940874, "global_step": 44858, "epoch": 376, "lr": 3.0770689888669146e-05} +{"train_loss": 0.0011363099329173565, "global_step": 44859, "epoch": 376, "lr": 3.0768644794798095e-05} +{"train_loss": 0.0013969918945804238, "global_step": 44860, "epoch": 376, "lr": 3.076659973868575e-05} +{"train_loss": 0.0005580681608989835, "global_step": 44861, "epoch": 376, "lr": 3.076455472033611e-05} +{"train_loss": 0.0014335463325367817, "global_step": 44862, "epoch": 376, "lr": 3.076250973975324e-05, "val_loss": 0.01992938108742237} +{"train_loss": 0.0011929951142519712, "global_step": 44863, "epoch": 377, "lr": 3.076046479694111e-05} +{"train_loss": 0.001829640124924481, "global_step": 44864, "epoch": 377, "lr": 3.0758419891903764e-05} +{"train_loss": 0.0009480197913944721, "global_step": 44865, "epoch": 377, "lr": 3.075637502464521e-05} +{"train_loss": 0.0011584997409954667, "global_step": 44866, "epoch": 377, "lr": 3.0754330195169435e-05} +{"train_loss": 0.0015638737240806222, "global_step": 44867, "epoch": 377, "lr": 3.0752285403480485e-05} +{"train_loss": 0.0020908606238663197, "global_step": 44868, "epoch": 377, "lr": 3.075024064958237e-05} +{"train_loss": 0.0011001850944012403, "global_step": 44869, "epoch": 377, "lr": 3.0748195933479095e-05} +{"train_loss": 0.0018305334961041808, "global_step": 44870, "epoch": 377, "lr": 3.074615125517468e-05} +{"train_loss": 0.0011430156882852316, "global_step": 44871, "epoch": 377, "lr": 3.0744106614673154e-05} +{"train_loss": 0.0014605831820517778, "global_step": 44872, "epoch": 377, "lr": 3.074206201197851e-05} +{"train_loss": 0.0019972992595285177, "global_step": 44873, "epoch": 377, "lr": 3.074001744709476e-05} +{"train_loss": 0.0010627126321196556, "global_step": 44874, "epoch": 377, "lr": 3.073797292002595e-05} +{"train_loss": 0.0005482487031258643, "global_step": 44875, "epoch": 377, "lr": 3.073592843077604e-05} +{"train_loss": 0.0019357951823621988, "global_step": 44876, "epoch": 377, "lr": 3.073388397934911e-05} +{"train_loss": 0.001295943045988679, "global_step": 44877, "epoch": 377, "lr": 3.073183956574912e-05} +{"train_loss": 0.0008783444063737988, "global_step": 44878, "epoch": 377, "lr": 3.0729795189980117e-05} +{"train_loss": 0.0011701080948114395, "global_step": 44879, "epoch": 377, "lr": 3.07277508520461e-05} +{"train_loss": 0.0012383933644741774, "global_step": 44880, "epoch": 377, "lr": 3.072570655195107e-05} +{"train_loss": 0.0012212380534037948, "global_step": 44881, "epoch": 377, "lr": 3.072366228969908e-05} +{"train_loss": 0.0005964361480437219, "global_step": 44882, "epoch": 377, "lr": 3.0721618065294094e-05} +{"train_loss": 0.001223828410729766, "global_step": 44883, "epoch": 377, "lr": 3.071957387874017e-05} +{"train_loss": 0.0015786447329446673, "global_step": 44884, "epoch": 377, "lr": 3.07175297300413e-05} +{"train_loss": 0.0008555433014407754, "global_step": 44885, "epoch": 377, "lr": 3.07154856192015e-05} +{"train_loss": 0.0008381898514926434, "global_step": 44886, "epoch": 377, "lr": 3.0713441546224777e-05} +{"train_loss": 0.0015935191186144948, "global_step": 44887, "epoch": 377, "lr": 3.0711397511115155e-05} +{"train_loss": 0.001066142925992608, "global_step": 44888, "epoch": 377, "lr": 3.070935351387664e-05} +{"train_loss": 0.0017856515478342772, "global_step": 44889, "epoch": 377, "lr": 3.0707309554513244e-05} +{"train_loss": 0.0007474416051991284, "global_step": 44890, "epoch": 377, "lr": 3.0705265633029e-05} +{"train_loss": 0.000775362248532474, "global_step": 44891, "epoch": 377, "lr": 3.070322174942791e-05} +{"train_loss": 0.0012487837811931968, "global_step": 44892, "epoch": 377, "lr": 3.070117790371396e-05} +{"train_loss": 0.0008080137195065618, "global_step": 44893, "epoch": 377, "lr": 3.06991340958912e-05} +{"train_loss": 0.0010433592833578587, "global_step": 44894, "epoch": 377, "lr": 3.0697090325963615e-05} +{"train_loss": 0.0017100409604609013, "global_step": 44895, "epoch": 377, "lr": 3.069504659393525e-05} +{"train_loss": 0.0011518826941028237, "global_step": 44896, "epoch": 377, "lr": 3.069300289981008e-05} +{"train_loss": 0.0010507561964914203, "global_step": 44897, "epoch": 377, "lr": 3.069095924359216e-05} +{"train_loss": 0.001236314419656992, "global_step": 44898, "epoch": 377, "lr": 3.0688915625285466e-05} +{"train_loss": 0.0014678084990009665, "global_step": 44899, "epoch": 377, "lr": 3.068687204489401e-05} +{"train_loss": 0.001035318709909916, "global_step": 44900, "epoch": 377, "lr": 3.068482850242184e-05} +{"train_loss": 0.0009773807832971215, "global_step": 44901, "epoch": 377, "lr": 3.068278499787291e-05} +{"train_loss": 0.001527991029433906, "global_step": 44902, "epoch": 377, "lr": 3.068074153125131e-05} +{"train_loss": 0.0007411369006149471, "global_step": 44903, "epoch": 377, "lr": 3.067869810256099e-05} +{"train_loss": 0.0016953055746853352, "global_step": 44904, "epoch": 377, "lr": 3.067665471180597e-05} +{"train_loss": 0.0011398997157812119, "global_step": 44905, "epoch": 377, "lr": 3.06746113589903e-05} +{"train_loss": 0.001912413747049868, "global_step": 44906, "epoch": 377, "lr": 3.067256804411794e-05} +{"train_loss": 0.0011495850048959255, "global_step": 44907, "epoch": 377, "lr": 3.067052476719295e-05} +{"train_loss": 0.0006171654677018523, "global_step": 44908, "epoch": 377, "lr": 3.066848152821931e-05} +{"train_loss": 0.0006753565976396203, "global_step": 44909, "epoch": 377, "lr": 3.066643832720105e-05} +{"train_loss": 0.0009596317540854216, "global_step": 44910, "epoch": 377, "lr": 3.0664395164142175e-05} +{"train_loss": 0.0010991445742547512, "global_step": 44911, "epoch": 377, "lr": 3.066235203904667e-05} +{"train_loss": 0.000882708583958447, "global_step": 44912, "epoch": 377, "lr": 3.0660308951918595e-05} +{"train_loss": 0.0010508995037525892, "global_step": 44913, "epoch": 377, "lr": 3.0658265902761917e-05} +{"train_loss": 0.0012565258657559752, "global_step": 44914, "epoch": 377, "lr": 3.065622289158069e-05} +{"train_loss": 0.0010744594037532806, "global_step": 44915, "epoch": 377, "lr": 3.06541799183789e-05} +{"train_loss": 0.0014810474822297692, "global_step": 44916, "epoch": 377, "lr": 3.0652136983160536e-05} +{"train_loss": 0.001765530207194388, "global_step": 44917, "epoch": 377, "lr": 3.065009408592965e-05} +{"train_loss": 0.0013312759110704064, "global_step": 44918, "epoch": 377, "lr": 3.064805122669024e-05} +{"train_loss": 0.0012326425639912486, "global_step": 44919, "epoch": 377, "lr": 3.064600840544631e-05} +{"train_loss": 0.0019406634382903576, "global_step": 44920, "epoch": 377, "lr": 3.064396562220187e-05} +{"train_loss": 0.0015929479850456119, "global_step": 44921, "epoch": 377, "lr": 3.064192287696095e-05} +{"train_loss": 0.001508913584984839, "global_step": 44922, "epoch": 377, "lr": 3.0639880169727544e-05} +{"train_loss": 0.0005532372160814703, "global_step": 44923, "epoch": 377, "lr": 3.063783750050565e-05} +{"train_loss": 0.0009547610534355044, "global_step": 44924, "epoch": 377, "lr": 3.063579486929931e-05} +{"train_loss": 0.0016496158204972744, "global_step": 44925, "epoch": 377, "lr": 3.06337522761125e-05} +{"train_loss": 0.0010967608541250229, "global_step": 44926, "epoch": 377, "lr": 3.0631709720949265e-05} +{"train_loss": 0.0019425328355282545, "global_step": 44927, "epoch": 377, "lr": 3.062966720381358e-05} +{"train_loss": 0.0012796529335901141, "global_step": 44928, "epoch": 377, "lr": 3.06276247247095e-05} +{"train_loss": 0.001831401139497757, "global_step": 44929, "epoch": 377, "lr": 3.062558228364101e-05} +{"train_loss": 0.0011174860410392284, "global_step": 44930, "epoch": 377, "lr": 3.062353988061209e-05} +{"train_loss": 0.001740904524922371, "global_step": 44931, "epoch": 377, "lr": 3.0621497515626804e-05} +{"train_loss": 0.0021488512866199017, "global_step": 44932, "epoch": 377, "lr": 3.0619455188689116e-05} +{"train_loss": 0.0009961124742403626, "global_step": 44933, "epoch": 377, "lr": 3.0617412899803075e-05} +{"train_loss": 0.0009794625220820308, "global_step": 44934, "epoch": 377, "lr": 3.0615370648972666e-05} +{"train_loss": 0.0017207564087584615, "global_step": 44935, "epoch": 377, "lr": 3.061332843620191e-05} +{"train_loss": 0.002658685902133584, "global_step": 44936, "epoch": 377, "lr": 3.061128626149481e-05} +{"train_loss": 0.0009058151626959443, "global_step": 44937, "epoch": 377, "lr": 3.060924412485537e-05} +{"train_loss": 0.0014168996131047606, "global_step": 44938, "epoch": 377, "lr": 3.060720202628762e-05} +{"train_loss": 0.0014483958948403597, "global_step": 44939, "epoch": 377, "lr": 3.0605159965795536e-05} +{"train_loss": 0.0022075215820223093, "global_step": 44940, "epoch": 377, "lr": 3.0603117943383174e-05} +{"train_loss": 0.0012312968028709292, "global_step": 44941, "epoch": 377, "lr": 3.060107595905452e-05} +{"train_loss": 0.0009885728359222412, "global_step": 44942, "epoch": 377, "lr": 3.059903401281356e-05} +{"train_loss": 0.001608035760000348, "global_step": 44943, "epoch": 377, "lr": 3.059699210466434e-05} +{"train_loss": 0.0011811181902885437, "global_step": 44944, "epoch": 377, "lr": 3.059495023461084e-05} +{"train_loss": 0.0015878973063081503, "global_step": 44945, "epoch": 377, "lr": 3.059290840265709e-05} +{"train_loss": 0.0007212428608909249, "global_step": 44946, "epoch": 377, "lr": 3.059086660880708e-05} +{"train_loss": 0.0023679682053625584, "global_step": 44947, "epoch": 377, "lr": 3.058882485306485e-05} +{"train_loss": 0.0013496088795363903, "global_step": 44948, "epoch": 377, "lr": 3.0586783135434385e-05} +{"train_loss": 0.0008105254382826388, "global_step": 44949, "epoch": 377, "lr": 3.058474145591968e-05} +{"train_loss": 0.0013969041174277663, "global_step": 44950, "epoch": 377, "lr": 3.058269981452478e-05} +{"train_loss": 0.001652355887927115, "global_step": 44951, "epoch": 377, "lr": 3.058065821125365e-05} +{"train_loss": 0.0010196202201768756, "global_step": 44952, "epoch": 377, "lr": 3.0578616646110345e-05} +{"train_loss": 0.0016938730841502547, "global_step": 44953, "epoch": 377, "lr": 3.057657511909885e-05} +{"train_loss": 0.0017644937615841627, "global_step": 44954, "epoch": 377, "lr": 3.057453363022316e-05} +{"train_loss": 0.0008771141874603927, "global_step": 44955, "epoch": 377, "lr": 3.0572492179487315e-05} +{"train_loss": 0.0005937570822425187, "global_step": 44956, "epoch": 377, "lr": 3.057045076689529e-05} +{"train_loss": 0.0015043788589537144, "global_step": 44957, "epoch": 377, "lr": 3.056840939245112e-05} +{"train_loss": 0.002382695209234953, "global_step": 44958, "epoch": 377, "lr": 3.05663680561588e-05} +{"train_loss": 0.0013408513041213155, "global_step": 44959, "epoch": 377, "lr": 3.056432675802235e-05} +{"train_loss": 0.001183733926154673, "global_step": 44960, "epoch": 377, "lr": 3.056228549804576e-05} +{"train_loss": 0.0015650748973712325, "global_step": 44961, "epoch": 377, "lr": 3.0560244276233036e-05} +{"train_loss": 0.0006259996443986893, "global_step": 44962, "epoch": 377, "lr": 3.055820309258821e-05} +{"train_loss": 0.0015712255844846368, "global_step": 44963, "epoch": 377, "lr": 3.055616194711526e-05} +{"train_loss": 0.0010015744483098388, "global_step": 44964, "epoch": 377, "lr": 3.0554120839818226e-05} +{"train_loss": 0.0026735339779406786, "global_step": 44965, "epoch": 377, "lr": 3.055207977070108e-05} +{"train_loss": 0.0016226564766839147, "global_step": 44966, "epoch": 377, "lr": 3.055003873976786e-05} +{"train_loss": 0.001709643518552184, "global_step": 44967, "epoch": 377, "lr": 3.054799774702256e-05} +{"train_loss": 0.0013994250912219286, "global_step": 44968, "epoch": 377, "lr": 3.054595679246919e-05} +{"train_loss": 0.0011331165442243218, "global_step": 44969, "epoch": 377, "lr": 3.054391587611175e-05} +{"train_loss": 0.001153238583356142, "global_step": 44970, "epoch": 377, "lr": 3.054187499795425e-05} +{"train_loss": 0.0009914709953591228, "global_step": 44971, "epoch": 377, "lr": 3.05398341580007e-05} +{"train_loss": 0.0019047545501962304, "global_step": 44972, "epoch": 377, "lr": 3.053779335625513e-05} +{"train_loss": 0.0014586907345801592, "global_step": 44973, "epoch": 377, "lr": 3.053575259272149e-05} +{"train_loss": 0.0008785015670582652, "global_step": 44974, "epoch": 377, "lr": 3.0533711867403844e-05} +{"train_loss": 0.001110327197238803, "global_step": 44975, "epoch": 377, "lr": 3.0531671180306154e-05} +{"train_loss": 0.0013370726956054568, "global_step": 44976, "epoch": 377, "lr": 3.052963053143247e-05} +{"train_loss": 0.0006725016864947975, "global_step": 44977, "epoch": 377, "lr": 3.0527589920786754e-05} +{"train_loss": 0.0016550446162000299, "global_step": 44978, "epoch": 377, "lr": 3.052554934837305e-05} +{"train_loss": 0.002395781222730875, "global_step": 44979, "epoch": 377, "lr": 3.052350881419536e-05} +{"train_loss": 0.0016411395044997334, "global_step": 44980, "epoch": 377, "lr": 3.052146831825765e-05} +{"train_loss": 0.0013316958998877775, "global_step": 44981, "epoch": 377, "lr": 3.0519427860563985e-05, "val_loss": 0.013017441146075726} +{"train_loss": 0.001015131245367229, "global_step": 44982, "epoch": 378, "lr": 3.0517387441118318e-05} +{"train_loss": 0.0021129848901182413, "global_step": 44983, "epoch": 378, "lr": 3.05153470599247e-05} +{"train_loss": 0.000756019086111337, "global_step": 44984, "epoch": 378, "lr": 3.0513306716987106e-05} +{"train_loss": 0.001706999377347529, "global_step": 44985, "epoch": 378, "lr": 3.0511266412309547e-05} +{"train_loss": 0.000627858389634639, "global_step": 44986, "epoch": 378, "lr": 3.0509226145896042e-05} +{"train_loss": 0.001369849662296474, "global_step": 44987, "epoch": 378, "lr": 3.050718591775058e-05} +{"train_loss": 0.002376762218773365, "global_step": 44988, "epoch": 378, "lr": 3.0505145727877194e-05} +{"train_loss": 0.0018619311740621924, "global_step": 44989, "epoch": 378, "lr": 3.0503105576279845e-05} +{"train_loss": 0.001210158341564238, "global_step": 44990, "epoch": 378, "lr": 3.050106546296259e-05} +{"train_loss": 0.0015652404399588704, "global_step": 44991, "epoch": 378, "lr": 3.0499025387929413e-05} +{"train_loss": 0.001468330854550004, "global_step": 44992, "epoch": 378, "lr": 3.0496985351184294e-05} +{"train_loss": 0.001424150774255395, "global_step": 44993, "epoch": 378, "lr": 3.049494535273128e-05} +{"train_loss": 0.0007956157205626369, "global_step": 44994, "epoch": 378, "lr": 3.0492905392574334e-05} +{"train_loss": 0.0006746716680936515, "global_step": 44995, "epoch": 378, "lr": 3.049086547071751e-05} +{"train_loss": 0.0010629919124767184, "global_step": 44996, "epoch": 378, "lr": 3.0488825587164764e-05} +{"train_loss": 0.0016126659465953708, "global_step": 44997, "epoch": 378, "lr": 3.0486785741920143e-05} +{"train_loss": 0.0009178958716802299, "global_step": 44998, "epoch": 378, "lr": 3.0484745934987642e-05} +{"train_loss": 0.0011866880813613534, "global_step": 44999, "epoch": 378, "lr": 3.0482706166371232e-05} +{"train_loss": 0.0013483839575201273, "global_step": 45000, "epoch": 378, "lr": 3.048066643607495e-05} +{"train_loss": 0.0005959215923212469, "global_step": 45001, "epoch": 378, "lr": 3.0478626744102802e-05} +{"train_loss": 0.0016835881397128105, "global_step": 45002, "epoch": 378, "lr": 3.0476587090458775e-05} +{"train_loss": 0.0009475525585003197, "global_step": 45003, "epoch": 378, "lr": 3.04745474751469e-05} +{"train_loss": 0.0015296556521207094, "global_step": 45004, "epoch": 378, "lr": 3.0472507898171144e-05} +{"train_loss": 0.001420221058651805, "global_step": 45005, "epoch": 378, "lr": 3.0470468359535547e-05} +{"train_loss": 0.001737429411150515, "global_step": 45006, "epoch": 378, "lr": 3.0468428859244087e-05} +{"train_loss": 0.000930141017306596, "global_step": 45007, "epoch": 378, "lr": 3.0466389397300797e-05} +{"train_loss": 0.0007141670794226229, "global_step": 45008, "epoch": 378, "lr": 3.0464349973709645e-05} +{"train_loss": 0.0010130623122677207, "global_step": 45009, "epoch": 378, "lr": 3.0462310588474675e-05} +{"train_loss": 0.0014691565884277225, "global_step": 45010, "epoch": 378, "lr": 3.046027124159987e-05} +{"train_loss": 0.0013327867491170764, "global_step": 45011, "epoch": 378, "lr": 3.045823193308921e-05} +{"train_loss": 0.00081471330486238, "global_step": 45012, "epoch": 378, "lr": 3.0456192662946755e-05} +{"train_loss": 0.0009344399441033602, "global_step": 45013, "epoch": 378, "lr": 3.0454153431176445e-05} +{"train_loss": 0.0010870799887925386, "global_step": 45014, "epoch": 378, "lr": 3.0452114237782346e-05} +{"train_loss": 0.0023215864785015583, "global_step": 45015, "epoch": 378, "lr": 3.045007508276841e-05} +{"train_loss": 0.0009636931354179978, "global_step": 45016, "epoch": 378, "lr": 3.044803596613868e-05} +{"train_loss": 0.0013947237748652697, "global_step": 45017, "epoch": 378, "lr": 3.044599688789714e-05} +{"train_loss": 0.0018471601651981473, "global_step": 45018, "epoch": 378, "lr": 3.044395784804779e-05} +{"train_loss": 0.0016054183943197131, "global_step": 45019, "epoch": 378, "lr": 3.044191884659464e-05} +{"train_loss": 0.0009123117779381573, "global_step": 45020, "epoch": 378, "lr": 3.0439879883541696e-05} +{"train_loss": 0.001530662295408547, "global_step": 45021, "epoch": 378, "lr": 3.043784095889295e-05} +{"train_loss": 0.001198102138005197, "global_step": 45022, "epoch": 378, "lr": 3.043580207265243e-05} +{"train_loss": 0.0021724244579672813, "global_step": 45023, "epoch": 378, "lr": 3.043376322482411e-05} +{"train_loss": 0.0014500186080113053, "global_step": 45024, "epoch": 378, "lr": 3.043172441541201e-05} +{"train_loss": 0.0014894333435222507, "global_step": 45025, "epoch": 378, "lr": 3.0429685644420115e-05} +{"train_loss": 0.0009282251703552902, "global_step": 45026, "epoch": 378, "lr": 3.0427646911852464e-05} +{"train_loss": 0.0015449405182152987, "global_step": 45027, "epoch": 378, "lr": 3.0425608217713015e-05} +{"train_loss": 0.0011834383476525545, "global_step": 45028, "epoch": 378, "lr": 3.0423569562005815e-05} +{"train_loss": 0.002176265697926283, "global_step": 45029, "epoch": 378, "lr": 3.0421530944734846e-05} +{"train_loss": 0.0014419894432649016, "global_step": 45030, "epoch": 378, "lr": 3.0419492365904078e-05} +{"train_loss": 0.0007942313677631319, "global_step": 45031, "epoch": 378, "lr": 3.0417453825517578e-05} +{"train_loss": 0.0011121185962110758, "global_step": 45032, "epoch": 378, "lr": 3.041541532357929e-05} +{"train_loss": 0.0008436303469352424, "global_step": 45033, "epoch": 378, "lr": 3.0413376860093264e-05} +{"train_loss": 0.0011956678936257958, "global_step": 45034, "epoch": 378, "lr": 3.041133843506347e-05} +{"train_loss": 0.0006548851961269975, "global_step": 45035, "epoch": 378, "lr": 3.0409300048493904e-05} +{"train_loss": 0.0015926121268421412, "global_step": 45036, "epoch": 378, "lr": 3.0407261700388613e-05} +{"train_loss": 0.0009261599043384194, "global_step": 45037, "epoch": 378, "lr": 3.0405223390751546e-05} +{"train_loss": 0.0008865143172442913, "global_step": 45038, "epoch": 378, "lr": 3.0403185119586754e-05} +{"train_loss": 0.0017458552028983831, "global_step": 45039, "epoch": 378, "lr": 3.0401146886898185e-05} +{"train_loss": 0.0013496052706614137, "global_step": 45040, "epoch": 378, "lr": 3.0399108692689894e-05} +{"train_loss": 0.001226679072715342, "global_step": 45041, "epoch": 378, "lr": 3.0397070536965866e-05} +{"train_loss": 0.0013790285447612405, "global_step": 45042, "epoch": 378, "lr": 3.0395032419730067e-05} +{"train_loss": 0.0013503188965842128, "global_step": 45043, "epoch": 378, "lr": 3.0392994340986552e-05} +{"train_loss": 0.0010758021380752325, "global_step": 45044, "epoch": 378, "lr": 3.0390956300739275e-05} +{"train_loss": 0.0006250965525396168, "global_step": 45045, "epoch": 378, "lr": 3.0388918298992285e-05} +{"train_loss": 0.0009415527456440032, "global_step": 45046, "epoch": 378, "lr": 3.0386880335749536e-05} +{"train_loss": 0.0009443185408599675, "global_step": 45047, "epoch": 378, "lr": 3.038484241101507e-05} +{"train_loss": 0.0009663766832090914, "global_step": 45048, "epoch": 378, "lr": 3.0382804524792873e-05} +{"train_loss": 0.001192131545394659, "global_step": 45049, "epoch": 378, "lr": 3.0380766677086926e-05} +{"train_loss": 0.0012385159498080611, "global_step": 45050, "epoch": 378, "lr": 3.037872886790125e-05} +{"train_loss": 0.0013961534714326262, "global_step": 45051, "epoch": 378, "lr": 3.0376691097239852e-05} +{"train_loss": 0.00161290867254138, "global_step": 45052, "epoch": 378, "lr": 3.037465336510672e-05} +{"train_loss": 0.0009591868729330599, "global_step": 45053, "epoch": 378, "lr": 3.0372615671505866e-05} +{"train_loss": 0.00101335474755615, "global_step": 45054, "epoch": 378, "lr": 3.0370578016441275e-05} +{"train_loss": 0.0010557258501648903, "global_step": 45055, "epoch": 378, "lr": 3.036854039991697e-05} +{"train_loss": 0.0010387785732746124, "global_step": 45056, "epoch": 378, "lr": 3.0366502821936916e-05} +{"train_loss": 0.0010124924592673779, "global_step": 45057, "epoch": 378, "lr": 3.036446528250516e-05} +{"train_loss": 0.0005572353256866336, "global_step": 45058, "epoch": 378, "lr": 3.036242778162566e-05} +{"train_loss": 0.0013270300114527345, "global_step": 45059, "epoch": 378, "lr": 3.036039031930245e-05} +{"train_loss": 0.0010894725564867258, "global_step": 45060, "epoch": 378, "lr": 3.035835289553952e-05} +{"train_loss": 0.0007002927595749497, "global_step": 45061, "epoch": 378, "lr": 3.0356315510340844e-05} +{"train_loss": 0.0017368877306580544, "global_step": 45062, "epoch": 378, "lr": 3.0354278163710464e-05} +{"train_loss": 0.0011808003764599562, "global_step": 45063, "epoch": 378, "lr": 3.0352240855652338e-05} +{"train_loss": 0.0012772250920534134, "global_step": 45064, "epoch": 378, "lr": 3.035020358617051e-05} +{"train_loss": 0.0009300496312789619, "global_step": 45065, "epoch": 378, "lr": 3.0348166355268937e-05} +{"train_loss": 0.0015279968501999974, "global_step": 45066, "epoch": 378, "lr": 3.0346129162951663e-05} +{"train_loss": 0.0012628540862351656, "global_step": 45067, "epoch": 378, "lr": 3.0344092009222652e-05} +{"train_loss": 0.0013898225734010339, "global_step": 45068, "epoch": 378, "lr": 3.034205489408592e-05} +{"train_loss": 0.001137451734393835, "global_step": 45069, "epoch": 378, "lr": 3.0340017817545458e-05} +{"train_loss": 0.0016000361647456884, "global_step": 45070, "epoch": 378, "lr": 3.0337980779605264e-05} +{"train_loss": 0.0008799748029559851, "global_step": 45071, "epoch": 378, "lr": 3.033594378026936e-05} +{"train_loss": 0.000758407055400312, "global_step": 45072, "epoch": 378, "lr": 3.0333906819541735e-05} +{"train_loss": 0.0009641415090300143, "global_step": 45073, "epoch": 378, "lr": 3.0331869897426358e-05} +{"train_loss": 0.0006011583609506488, "global_step": 45074, "epoch": 378, "lr": 3.0329833013927277e-05} +{"train_loss": 0.000946248706895858, "global_step": 45075, "epoch": 378, "lr": 3.032779616904845e-05} +{"train_loss": 0.0009253179305233061, "global_step": 45076, "epoch": 378, "lr": 3.0325759362793903e-05} +{"train_loss": 0.0008574879611842334, "global_step": 45077, "epoch": 378, "lr": 3.0323722595167615e-05} +{"train_loss": 0.0011398334754630923, "global_step": 45078, "epoch": 378, "lr": 3.032168586617361e-05} +{"train_loss": 0.0007728731725364923, "global_step": 45079, "epoch": 378, "lr": 3.031964917581588e-05} +{"train_loss": 0.0005002805846743286, "global_step": 45080, "epoch": 378, "lr": 3.0317612524098392e-05} +{"train_loss": 0.0010489767882972956, "global_step": 45081, "epoch": 378, "lr": 3.0315575911025185e-05} +{"train_loss": 0.0013433138374239206, "global_step": 45082, "epoch": 378, "lr": 3.0313539336600228e-05} +{"train_loss": 0.000463056901935488, "global_step": 45083, "epoch": 378, "lr": 3.0311502800827552e-05} +{"train_loss": 0.0010545785771682858, "global_step": 45084, "epoch": 378, "lr": 3.0309466303711116e-05} +{"train_loss": 0.0009970165556296706, "global_step": 45085, "epoch": 378, "lr": 3.0307429845254947e-05} +{"train_loss": 0.0005609157378785312, "global_step": 45086, "epoch": 378, "lr": 3.0305393425463047e-05} +{"train_loss": 0.0022274404764175415, "global_step": 45087, "epoch": 378, "lr": 3.0303357044339387e-05} +{"train_loss": 0.000700271048117429, "global_step": 45088, "epoch": 378, "lr": 3.0301320701887992e-05} +{"train_loss": 0.0017438901122659445, "global_step": 45089, "epoch": 378, "lr": 3.0299284398112837e-05} +{"train_loss": 0.0007977522327564657, "global_step": 45090, "epoch": 378, "lr": 3.0297248133017952e-05} +{"train_loss": 0.0009290436864830554, "global_step": 45091, "epoch": 378, "lr": 3.0295211906607313e-05} +{"train_loss": 0.0009483877802267671, "global_step": 45092, "epoch": 378, "lr": 3.0293175718884904e-05} +{"train_loss": 0.001366425771266222, "global_step": 45093, "epoch": 378, "lr": 3.0291139569854753e-05} +{"train_loss": 0.000887471076566726, "global_step": 45094, "epoch": 378, "lr": 3.0289103459520828e-05} +{"train_loss": 0.0022834008559584618, "global_step": 45095, "epoch": 378, "lr": 3.0287067387887157e-05} +{"train_loss": 0.001488094450905919, "global_step": 45096, "epoch": 378, "lr": 3.0285031354957712e-05} +{"train_loss": 0.0013129512080922723, "global_step": 45097, "epoch": 378, "lr": 3.0282995360736517e-05} +{"train_loss": 0.0012434342643246055, "global_step": 45098, "epoch": 378, "lr": 3.0280959405227543e-05} +{"train_loss": 0.001936174463480711, "global_step": 45099, "epoch": 378, "lr": 3.0278923488434802e-05} +{"train_loss": 0.0012113242620453552, "global_step": 45100, "epoch": 378, "lr": 3.027688761036228e-05, "val_loss": 0.042726561427116394} +{"train_loss": 0.0007094803149811924, "global_step": 45101, "epoch": 379, "lr": 3.027485177101399e-05} +{"train_loss": 0.0008435656782239676, "global_step": 45102, "epoch": 379, "lr": 3.0272815970393918e-05} +{"train_loss": 0.0019215152133256197, "global_step": 45103, "epoch": 379, "lr": 3.0270780208506078e-05} +{"train_loss": 0.0019174778135493398, "global_step": 45104, "epoch": 379, "lr": 3.0268744485354433e-05} +{"train_loss": 0.0016947939293459058, "global_step": 45105, "epoch": 379, "lr": 3.0266708800943016e-05} +{"train_loss": 0.001669395947828889, "global_step": 45106, "epoch": 379, "lr": 3.026467315527579e-05} +{"train_loss": 0.0006359919207170606, "global_step": 45107, "epoch": 379, "lr": 3.0262637548356792e-05} +{"train_loss": 0.0016584686236456037, "global_step": 45108, "epoch": 379, "lr": 3.0260601980189975e-05} +{"train_loss": 0.0006445006583817303, "global_step": 45109, "epoch": 379, "lr": 3.0258566450779373e-05} +{"train_loss": 0.0012064538896083832, "global_step": 45110, "epoch": 379, "lr": 3.025653096012897e-05} +{"train_loss": 0.0016526434337720275, "global_step": 45111, "epoch": 379, "lr": 3.0254495508242743e-05} +{"train_loss": 0.0010930029675364494, "global_step": 45112, "epoch": 379, "lr": 3.0252460095124723e-05} +{"train_loss": 0.000901015242561698, "global_step": 45113, "epoch": 379, "lr": 3.0250424720778865e-05} +{"train_loss": 0.0013552774908021092, "global_step": 45114, "epoch": 379, "lr": 3.024838938520921e-05} +{"train_loss": 0.001033935695886612, "global_step": 45115, "epoch": 379, "lr": 3.024635408841971e-05} +{"train_loss": 0.0007556671625934541, "global_step": 45116, "epoch": 379, "lr": 3.0244318830414402e-05} +{"train_loss": 0.0009124898933805525, "global_step": 45117, "epoch": 379, "lr": 3.0242283611197257e-05} +{"train_loss": 0.0016101860674098134, "global_step": 45118, "epoch": 379, "lr": 3.0240248430772277e-05} +{"train_loss": 0.000927781336940825, "global_step": 45119, "epoch": 379, "lr": 3.023821328914346e-05} +{"train_loss": 0.0011793883750215173, "global_step": 45120, "epoch": 379, "lr": 3.023617818631479e-05} +{"train_loss": 0.0006524549098685384, "global_step": 45121, "epoch": 379, "lr": 3.0234143122290287e-05} +{"train_loss": 0.0011381026124581695, "global_step": 45122, "epoch": 379, "lr": 3.0232108097073936e-05} +{"train_loss": 0.0013583071995526552, "global_step": 45123, "epoch": 379, "lr": 3.023007311066971e-05} +{"train_loss": 0.0016029642429202795, "global_step": 45124, "epoch": 379, "lr": 3.022803816308164e-05} +{"train_loss": 0.0012242259690538049, "global_step": 45125, "epoch": 379, "lr": 3.0226003254313684e-05} +{"train_loss": 0.001989062875509262, "global_step": 45126, "epoch": 379, "lr": 3.0223968384369884e-05} +{"train_loss": 0.0013780546141788363, "global_step": 45127, "epoch": 379, "lr": 3.022193355325419e-05} +{"train_loss": 0.001391956233419478, "global_step": 45128, "epoch": 379, "lr": 3.021989876097063e-05} +{"train_loss": 0.0017630333313718438, "global_step": 45129, "epoch": 379, "lr": 3.021786400752319e-05} +{"train_loss": 0.0011781752109527588, "global_step": 45130, "epoch": 379, "lr": 3.021582929291583e-05} +{"train_loss": 0.001241783844307065, "global_step": 45131, "epoch": 379, "lr": 3.0213794617152612e-05} +{"train_loss": 0.000937310338485986, "global_step": 45132, "epoch": 379, "lr": 3.0211759980237463e-05} +{"train_loss": 0.0011571282520890236, "global_step": 45133, "epoch": 379, "lr": 3.0209725382174427e-05} +{"train_loss": 0.0023797713220119476, "global_step": 45134, "epoch": 379, "lr": 3.0207690822967472e-05} +{"train_loss": 0.0012103780172765255, "global_step": 45135, "epoch": 379, "lr": 3.020565630262061e-05} +{"train_loss": 0.002739467890933156, "global_step": 45136, "epoch": 379, "lr": 3.020362182113783e-05} +{"train_loss": 0.001540996483527124, "global_step": 45137, "epoch": 379, "lr": 3.020158737852311e-05} +{"train_loss": 0.0012140261242166162, "global_step": 45138, "epoch": 379, "lr": 3.0199552974780478e-05} +{"train_loss": 0.0022119858767837286, "global_step": 45139, "epoch": 379, "lr": 3.0197518609913883e-05} +{"train_loss": 0.0016891197301447392, "global_step": 45140, "epoch": 379, "lr": 3.0195484283927367e-05} +{"train_loss": 0.0008941213600337505, "global_step": 45141, "epoch": 379, "lr": 3.0193449996824902e-05} +{"train_loss": 0.0015863854205235839, "global_step": 45142, "epoch": 379, "lr": 3.0191415748610465e-05} +{"train_loss": 0.001418300555087626, "global_step": 45143, "epoch": 379, "lr": 3.018938153928808e-05} +{"train_loss": 0.001877117669209838, "global_step": 45144, "epoch": 379, "lr": 3.0187347368861713e-05} +{"train_loss": 0.0010452677961438894, "global_step": 45145, "epoch": 379, "lr": 3.018531323733539e-05} +{"train_loss": 0.0015125778736546636, "global_step": 45146, "epoch": 379, "lr": 3.0183279144713074e-05} +{"train_loss": 0.0010720078134909272, "global_step": 45147, "epoch": 379, "lr": 3.0181245090998784e-05} +{"train_loss": 0.0016788808861747384, "global_step": 45148, "epoch": 379, "lr": 3.0179211076196496e-05} +{"train_loss": 0.0010972085874527693, "global_step": 45149, "epoch": 379, "lr": 3.0177177100310206e-05} +{"train_loss": 0.001760789891704917, "global_step": 45150, "epoch": 379, "lr": 3.0175143163343917e-05} +{"train_loss": 0.0011227852664887905, "global_step": 45151, "epoch": 379, "lr": 3.0173109265301614e-05} +{"train_loss": 0.0020145243033766747, "global_step": 45152, "epoch": 379, "lr": 3.017107540618729e-05} +{"train_loss": 0.0009754793718457222, "global_step": 45153, "epoch": 379, "lr": 3.0169041586004953e-05} +{"train_loss": 0.0009440614958293736, "global_step": 45154, "epoch": 379, "lr": 3.0167007804758563e-05} +{"train_loss": 0.0008327679242938757, "global_step": 45155, "epoch": 379, "lr": 3.0164974062452155e-05} +{"train_loss": 0.0017589960480108857, "global_step": 45156, "epoch": 379, "lr": 3.0162940359089686e-05} +{"train_loss": 0.0015344646526500583, "global_step": 45157, "epoch": 379, "lr": 3.0160906694675177e-05} +{"train_loss": 0.0013207776937633753, "global_step": 45158, "epoch": 379, "lr": 3.015887306921259e-05} +{"train_loss": 0.0007308487547561526, "global_step": 45159, "epoch": 379, "lr": 3.0156839482705963e-05} +{"train_loss": 0.0012578897876664996, "global_step": 45160, "epoch": 379, "lr": 3.015480593515926e-05} +{"train_loss": 0.0008836147026158869, "global_step": 45161, "epoch": 379, "lr": 3.015277242657645e-05} +{"train_loss": 0.0007014400907792151, "global_step": 45162, "epoch": 379, "lr": 3.0150738956961567e-05} +{"train_loss": 0.00141565827652812, "global_step": 45163, "epoch": 379, "lr": 3.0148705526318577e-05} +{"train_loss": 0.0019229007884860039, "global_step": 45164, "epoch": 379, "lr": 3.01466721346515e-05} +{"train_loss": 0.0015154413413256407, "global_step": 45165, "epoch": 379, "lr": 3.0144638781964286e-05} +{"train_loss": 0.001030811108648777, "global_step": 45166, "epoch": 379, "lr": 3.0142605468260978e-05} +{"train_loss": 0.0011669822270050645, "global_step": 45167, "epoch": 379, "lr": 3.0140572193545535e-05} +{"train_loss": 0.0017835573526099324, "global_step": 45168, "epoch": 379, "lr": 3.0138538957821936e-05} +{"train_loss": 0.0014088352909311652, "global_step": 45169, "epoch": 379, "lr": 3.0136505761094223e-05} +{"train_loss": 0.001061214366927743, "global_step": 45170, "epoch": 379, "lr": 3.0134472603366337e-05} +{"train_loss": 0.0013183025876060128, "global_step": 45171, "epoch": 379, "lr": 3.0132439484642318e-05} +{"train_loss": 0.0009477029670961201, "global_step": 45172, "epoch": 379, "lr": 3.0130406404926125e-05} +{"train_loss": 0.002145589329302311, "global_step": 45173, "epoch": 379, "lr": 3.0128373364221735e-05} +{"train_loss": 0.0015579505125060678, "global_step": 45174, "epoch": 379, "lr": 3.0126340362533177e-05} +{"train_loss": 0.0019600812811404467, "global_step": 45175, "epoch": 379, "lr": 3.0124307399864415e-05} +{"train_loss": 0.0009315370116382837, "global_step": 45176, "epoch": 379, "lr": 3.012227447621947e-05} +{"train_loss": 0.0015644447412341833, "global_step": 45177, "epoch": 379, "lr": 3.0120241591602294e-05} +{"train_loss": 0.0008075199439190328, "global_step": 45178, "epoch": 379, "lr": 3.0118208746016917e-05} +{"train_loss": 0.0014864180702716112, "global_step": 45179, "epoch": 379, "lr": 3.0116175939467318e-05} +{"train_loss": 0.0008705806685611606, "global_step": 45180, "epoch": 379, "lr": 3.0114143171957464e-05} +{"train_loss": 0.0012047112686559558, "global_step": 45181, "epoch": 379, "lr": 3.011211044349137e-05} +{"train_loss": 0.0013940687058493495, "global_step": 45182, "epoch": 379, "lr": 3.0110077754073028e-05} +{"train_loss": 0.0019686773885041475, "global_step": 45183, "epoch": 379, "lr": 3.010804510370642e-05} +{"train_loss": 0.0009067946230061352, "global_step": 45184, "epoch": 379, "lr": 3.0106012492395542e-05} +{"train_loss": 0.0010742106242105365, "global_step": 45185, "epoch": 379, "lr": 3.0103979920144387e-05} +{"train_loss": 0.0019085975363850594, "global_step": 45186, "epoch": 379, "lr": 3.0101947386956942e-05} +{"train_loss": 0.001813385752029717, "global_step": 45187, "epoch": 379, "lr": 3.0099914892837183e-05} +{"train_loss": 0.0011858834186568856, "global_step": 45188, "epoch": 379, "lr": 3.0097882437789137e-05} +{"train_loss": 0.0015786542790010571, "global_step": 45189, "epoch": 379, "lr": 3.009585002181675e-05} +{"train_loss": 0.001093983300961554, "global_step": 45190, "epoch": 379, "lr": 3.0093817644924055e-05} +{"train_loss": 0.0009780849795788527, "global_step": 45191, "epoch": 379, "lr": 3.0091785307115022e-05} +{"train_loss": 0.0012593455612659454, "global_step": 45192, "epoch": 379, "lr": 3.008975300839362e-05} +{"train_loss": 0.002692060312256217, "global_step": 45193, "epoch": 379, "lr": 3.0087720748763886e-05} +{"train_loss": 0.001498691039159894, "global_step": 45194, "epoch": 379, "lr": 3.008568852822976e-05} +{"train_loss": 0.0017513735219836235, "global_step": 45195, "epoch": 379, "lr": 3.0083656346795286e-05} +{"train_loss": 0.0005430607707239687, "global_step": 45196, "epoch": 379, "lr": 3.0081624204464398e-05} +{"train_loss": 0.001429870375432074, "global_step": 45197, "epoch": 379, "lr": 3.007959210124113e-05} +{"train_loss": 0.0013212099438533187, "global_step": 45198, "epoch": 379, "lr": 3.0077560037129447e-05} +{"train_loss": 0.0013957904884591699, "global_step": 45199, "epoch": 379, "lr": 3.0075528012133347e-05} +{"train_loss": 0.001602423028089106, "global_step": 45200, "epoch": 379, "lr": 3.007349602625682e-05} +{"train_loss": 0.0016480666818097234, "global_step": 45201, "epoch": 379, "lr": 3.0071464079503854e-05} +{"train_loss": 0.0015119124436751008, "global_step": 45202, "epoch": 379, "lr": 3.0069432171878443e-05} +{"train_loss": 0.0011078630341216922, "global_step": 45203, "epoch": 379, "lr": 3.0067400303384558e-05} +{"train_loss": 0.0013345152838155627, "global_step": 45204, "epoch": 379, "lr": 3.006536847402622e-05} +{"train_loss": 0.0012513094116002321, "global_step": 45205, "epoch": 379, "lr": 3.0063336683807407e-05} +{"train_loss": 0.0013522186782211065, "global_step": 45206, "epoch": 379, "lr": 3.0061304932732082e-05} +{"train_loss": 0.0015205050585791469, "global_step": 45207, "epoch": 379, "lr": 3.0059273220804272e-05} +{"train_loss": 0.0010402282932773232, "global_step": 45208, "epoch": 379, "lr": 3.0057241548027938e-05} +{"train_loss": 0.0014587893383577466, "global_step": 45209, "epoch": 379, "lr": 3.005520991440709e-05} +{"train_loss": 0.0007961011142469943, "global_step": 45210, "epoch": 379, "lr": 3.005317831994571e-05} +{"train_loss": 0.0012695956975221634, "global_step": 45211, "epoch": 379, "lr": 3.0051146764647758e-05} +{"train_loss": 0.0008267158991657197, "global_step": 45212, "epoch": 379, "lr": 3.0049115248517272e-05} +{"train_loss": 0.0012017544358968735, "global_step": 45213, "epoch": 379, "lr": 3.0047083771558194e-05} +{"train_loss": 0.0020579679403454065, "global_step": 45214, "epoch": 379, "lr": 3.004505233377456e-05} +{"train_loss": 0.001906527322717011, "global_step": 45215, "epoch": 379, "lr": 3.004302093517031e-05} +{"train_loss": 0.0009046374470926821, "global_step": 45216, "epoch": 379, "lr": 3.004098957574948e-05} +{"train_loss": 0.0007908392581157386, "global_step": 45217, "epoch": 379, "lr": 3.0038958255516027e-05} +{"train_loss": 0.0013396969297900796, "global_step": 45218, "epoch": 379, "lr": 3.0036926974473935e-05} +{"train_loss": 0.0013489462533073516, "global_step": 45219, "epoch": 379, "lr": 3.003489573262722e-05, "val_loss": 0.01750582829117775} +{"train_loss": 0.002266484312713146, "global_step": 45220, "epoch": 380, "lr": 3.003286452997983e-05} +{"train_loss": 0.0014360143104568124, "global_step": 45221, "epoch": 380, "lr": 3.0030833366535806e-05} +{"train_loss": 0.0009023488382808864, "global_step": 45222, "epoch": 380, "lr": 3.0028802242299102e-05} +{"train_loss": 0.0009632532019168139, "global_step": 45223, "epoch": 380, "lr": 3.0026771157273702e-05} +{"train_loss": 0.0015587796224281192, "global_step": 45224, "epoch": 380, "lr": 3.002474011146361e-05} +{"train_loss": 0.0017109425971284509, "global_step": 45225, "epoch": 380, "lr": 3.0022709104872793e-05} +{"train_loss": 0.0012138162273913622, "global_step": 45226, "epoch": 380, "lr": 3.0020678137505277e-05} +{"train_loss": 0.0008309968980029225, "global_step": 45227, "epoch": 380, "lr": 3.0018647209364992e-05} +{"train_loss": 0.0011030822061002254, "global_step": 45228, "epoch": 380, "lr": 3.0016616320455993e-05} +{"train_loss": 0.0008179061696864665, "global_step": 45229, "epoch": 380, "lr": 3.0014585470782218e-05} +{"train_loss": 0.0015956313582137227, "global_step": 45230, "epoch": 380, "lr": 3.0012554660347657e-05} +{"train_loss": 0.0011758266482502222, "global_step": 45231, "epoch": 380, "lr": 3.001052388915633e-05} +{"train_loss": 0.0017944620922207832, "global_step": 45232, "epoch": 380, "lr": 3.0008493157212185e-05} +{"train_loss": 0.0009329807944595814, "global_step": 45233, "epoch": 380, "lr": 3.0006462464519235e-05} +{"train_loss": 0.0005885688588023186, "global_step": 45234, "epoch": 380, "lr": 3.000443181108147e-05} +{"train_loss": 0.0017998488619923592, "global_step": 45235, "epoch": 380, "lr": 3.0002401196902853e-05} +{"train_loss": 0.001021235715597868, "global_step": 45236, "epoch": 380, "lr": 3.00003706219874e-05} +{"train_loss": 0.0011534587247297168, "global_step": 45237, "epoch": 380, "lr": 2.999834008633906e-05} +{"train_loss": 0.0008402618695981801, "global_step": 45238, "epoch": 380, "lr": 2.9996309589961867e-05} +{"train_loss": 0.0015623221406713128, "global_step": 45239, "epoch": 380, "lr": 2.9994279132859758e-05} +{"train_loss": 0.0009102095500566065, "global_step": 45240, "epoch": 380, "lr": 2.9992248715036776e-05} +{"train_loss": 0.0011866686400026083, "global_step": 45241, "epoch": 380, "lr": 2.9990218336496868e-05} +{"train_loss": 0.0010975348995998502, "global_step": 45242, "epoch": 380, "lr": 2.9988187997244005e-05} +{"train_loss": 0.001085752504877746, "global_step": 45243, "epoch": 380, "lr": 2.9986157697282218e-05} +{"train_loss": 0.0011130382772535086, "global_step": 45244, "epoch": 380, "lr": 2.9984127436615456e-05} +{"train_loss": 0.002055044285953045, "global_step": 45245, "epoch": 380, "lr": 2.998209721524774e-05} +{"train_loss": 0.0006432172376662493, "global_step": 45246, "epoch": 380, "lr": 2.9980067033183018e-05} +{"train_loss": 0.0017148563638329506, "global_step": 45247, "epoch": 380, "lr": 2.9978036890425315e-05} +{"train_loss": 0.0015542652690783143, "global_step": 45248, "epoch": 380, "lr": 2.9976006786978588e-05} +{"train_loss": 0.0011245819041505456, "global_step": 45249, "epoch": 380, "lr": 2.997397672284683e-05} +{"train_loss": 0.0010502533987164497, "global_step": 45250, "epoch": 380, "lr": 2.9971946698034037e-05} +{"train_loss": 0.0016148013528436422, "global_step": 45251, "epoch": 380, "lr": 2.9969916712544176e-05} +{"train_loss": 0.0016691661439836025, "global_step": 45252, "epoch": 380, "lr": 2.9967886766381248e-05} +{"train_loss": 0.0012943431502208114, "global_step": 45253, "epoch": 380, "lr": 2.9965856859549225e-05} +{"train_loss": 0.0011325990781188011, "global_step": 45254, "epoch": 380, "lr": 2.9963826992052124e-05} +{"train_loss": 0.001547604100778699, "global_step": 45255, "epoch": 380, "lr": 2.9961797163893906e-05} +{"train_loss": 0.0013059041230008006, "global_step": 45256, "epoch": 380, "lr": 2.995976737507854e-05} +{"train_loss": 0.0010906783863902092, "global_step": 45257, "epoch": 380, "lr": 2.9957737625610048e-05} +{"train_loss": 0.0010400714818388224, "global_step": 45258, "epoch": 380, "lr": 2.9955707915492377e-05} +{"train_loss": 0.0019912782590836287, "global_step": 45259, "epoch": 380, "lr": 2.9953678244729554e-05} +{"train_loss": 0.0009478066931478679, "global_step": 45260, "epoch": 380, "lr": 2.995164861332554e-05} +{"train_loss": 0.0007686294848099351, "global_step": 45261, "epoch": 380, "lr": 2.9949619021284302e-05} +{"train_loss": 0.0008917165105231106, "global_step": 45262, "epoch": 380, "lr": 2.994758946860986e-05} +{"train_loss": 0.002008599229156971, "global_step": 45263, "epoch": 380, "lr": 2.9945559955306175e-05} +{"train_loss": 0.0014005961129441857, "global_step": 45264, "epoch": 380, "lr": 2.994353048137725e-05} +{"train_loss": 0.0012579396134242415, "global_step": 45265, "epoch": 380, "lr": 2.9941501046827048e-05} +{"train_loss": 0.0008199361618608236, "global_step": 45266, "epoch": 380, "lr": 2.9939471651659574e-05} +{"train_loss": 0.0010017529129981995, "global_step": 45267, "epoch": 380, "lr": 2.9937442295878814e-05} +{"train_loss": 0.0032010863069444895, "global_step": 45268, "epoch": 380, "lr": 2.9935412979488718e-05} +{"train_loss": 0.0015488150529563427, "global_step": 45269, "epoch": 380, "lr": 2.993338370249332e-05} +{"train_loss": 0.0007674978696741164, "global_step": 45270, "epoch": 380, "lr": 2.9931354464896554e-05} +{"train_loss": 0.0015364703722298145, "global_step": 45271, "epoch": 380, "lr": 2.992932526670246e-05} +{"train_loss": 0.0016723505686968565, "global_step": 45272, "epoch": 380, "lr": 2.992729610791496e-05} +{"train_loss": 0.0006859788554720581, "global_step": 45273, "epoch": 380, "lr": 2.99252669885381e-05} +{"train_loss": 0.001556834322400391, "global_step": 45274, "epoch": 380, "lr": 2.992323790857583e-05} +{"train_loss": 0.0014651099918410182, "global_step": 45275, "epoch": 380, "lr": 2.9921208868032113e-05} +{"train_loss": 0.001087483367882669, "global_step": 45276, "epoch": 380, "lr": 2.991917986691098e-05} +{"train_loss": 0.0011944447178393602, "global_step": 45277, "epoch": 380, "lr": 2.9917150905216374e-05} +{"train_loss": 0.001429853611625731, "global_step": 45278, "epoch": 380, "lr": 2.991512198295231e-05} +{"train_loss": 0.0010876061860471964, "global_step": 45279, "epoch": 380, "lr": 2.9913093100122758e-05} +{"train_loss": 0.0016434671124443412, "global_step": 45280, "epoch": 380, "lr": 2.9911064256731692e-05} +{"train_loss": 0.001721854554489255, "global_step": 45281, "epoch": 380, "lr": 2.9909035452783112e-05} +{"train_loss": 0.0017065282445400953, "global_step": 45282, "epoch": 380, "lr": 2.9907006688280992e-05} +{"train_loss": 0.001700107124634087, "global_step": 45283, "epoch": 380, "lr": 2.990497796322932e-05} +{"train_loss": 0.0010047839023172855, "global_step": 45284, "epoch": 380, "lr": 2.9902949277632076e-05} +{"train_loss": 0.0018503009341657162, "global_step": 45285, "epoch": 380, "lr": 2.9900920631493245e-05} +{"train_loss": 0.0016657375963404775, "global_step": 45286, "epoch": 380, "lr": 2.9898892024816816e-05} +{"train_loss": 0.0011257993755862117, "global_step": 45287, "epoch": 380, "lr": 2.9896863457606745e-05} +{"train_loss": 0.0016347841592505574, "global_step": 45288, "epoch": 380, "lr": 2.9894834929867054e-05} +{"train_loss": 0.0008592021185904741, "global_step": 45289, "epoch": 380, "lr": 2.989280644160169e-05} +{"train_loss": 0.0013488356489688158, "global_step": 45290, "epoch": 380, "lr": 2.9890777992814672e-05} +{"train_loss": 0.0006021212320774794, "global_step": 45291, "epoch": 380, "lr": 2.988874958350996e-05} +{"train_loss": 0.001231235801242292, "global_step": 45292, "epoch": 380, "lr": 2.9886721213691526e-05} +{"train_loss": 0.0006898290594108403, "global_step": 45293, "epoch": 380, "lr": 2.988469288336338e-05} +{"train_loss": 0.0015849870396777987, "global_step": 45294, "epoch": 380, "lr": 2.9882664592529473e-05} +{"train_loss": 0.0017399681964889169, "global_step": 45295, "epoch": 380, "lr": 2.9880636341193824e-05} +{"train_loss": 0.0008242636104114354, "global_step": 45296, "epoch": 380, "lr": 2.9878608129360373e-05} +{"train_loss": 0.001074594329111278, "global_step": 45297, "epoch": 380, "lr": 2.9876579957033152e-05} +{"train_loss": 0.0009556301520206034, "global_step": 45298, "epoch": 380, "lr": 2.9874551824216102e-05} +{"train_loss": 0.0011267781956121325, "global_step": 45299, "epoch": 380, "lr": 2.987252373091322e-05} +{"train_loss": 0.0008545751334168017, "global_step": 45300, "epoch": 380, "lr": 2.987049567712849e-05} +{"train_loss": 0.0016709433402866125, "global_step": 45301, "epoch": 380, "lr": 2.986846766286588e-05} +{"train_loss": 0.001708799391053617, "global_step": 45302, "epoch": 380, "lr": 2.98664396881294e-05} +{"train_loss": 0.0008559893467463553, "global_step": 45303, "epoch": 380, "lr": 2.9864411752922994e-05} +{"train_loss": 0.0006788612809032202, "global_step": 45304, "epoch": 380, "lr": 2.9862383857250693e-05} +{"train_loss": 0.000927187385968864, "global_step": 45305, "epoch": 380, "lr": 2.986035600111644e-05} +{"train_loss": 0.0012839314294978976, "global_step": 45306, "epoch": 380, "lr": 2.9858328184524208e-05} +{"train_loss": 0.0015759178204461932, "global_step": 45307, "epoch": 380, "lr": 2.985630040747802e-05} +{"train_loss": 0.0014912696788087487, "global_step": 45308, "epoch": 380, "lr": 2.985427266998182e-05} +{"train_loss": 0.0009348210878670216, "global_step": 45309, "epoch": 380, "lr": 2.985224497203961e-05} +{"train_loss": 0.0007773541728965938, "global_step": 45310, "epoch": 380, "lr": 2.9850217313655376e-05} +{"train_loss": 0.0008703739149495959, "global_step": 45311, "epoch": 380, "lr": 2.9848189694833063e-05} +{"train_loss": 0.002344506559893489, "global_step": 45312, "epoch": 380, "lr": 2.9846162115576692e-05} +{"train_loss": 0.0008905829745344818, "global_step": 45313, "epoch": 380, "lr": 2.9844134575890214e-05} +{"train_loss": 0.0009007933549582958, "global_step": 45314, "epoch": 380, "lr": 2.9842107075777637e-05} +{"train_loss": 0.0014602981973439455, "global_step": 45315, "epoch": 380, "lr": 2.984007961524292e-05} +{"train_loss": 0.0012048435164615512, "global_step": 45316, "epoch": 380, "lr": 2.9838052194290066e-05} +{"train_loss": 0.0010049142874777317, "global_step": 45317, "epoch": 380, "lr": 2.983602481292305e-05} +{"train_loss": 0.0015541543252766132, "global_step": 45318, "epoch": 380, "lr": 2.9833997471145815e-05} +{"train_loss": 0.001986902207136154, "global_step": 45319, "epoch": 380, "lr": 2.9831970168962398e-05} +{"train_loss": 0.0021152060944586992, "global_step": 45320, "epoch": 380, "lr": 2.9829942906376728e-05} +{"train_loss": 0.001382096903398633, "global_step": 45321, "epoch": 380, "lr": 2.9827915683392837e-05} +{"train_loss": 0.0008392709423787892, "global_step": 45322, "epoch": 380, "lr": 2.9825888500014654e-05} +{"train_loss": 0.0007393829873763025, "global_step": 45323, "epoch": 380, "lr": 2.982386135624621e-05} +{"train_loss": 0.0011907167499884963, "global_step": 45324, "epoch": 380, "lr": 2.982183425209145e-05} +{"train_loss": 0.0011389469727873802, "global_step": 45325, "epoch": 380, "lr": 2.981980718755435e-05} +{"train_loss": 0.0007070344290696084, "global_step": 45326, "epoch": 380, "lr": 2.9817780162638914e-05} +{"train_loss": 0.0016306963516399264, "global_step": 45327, "epoch": 380, "lr": 2.9815753177349094e-05} +{"train_loss": 0.0014523189747706056, "global_step": 45328, "epoch": 380, "lr": 2.981372623168891e-05} +{"train_loss": 0.0007889171247370541, "global_step": 45329, "epoch": 380, "lr": 2.9811699325662306e-05} +{"train_loss": 0.0014901644317433238, "global_step": 45330, "epoch": 380, "lr": 2.9809672459273275e-05} +{"train_loss": 0.0019225667929276824, "global_step": 45331, "epoch": 380, "lr": 2.9807645632525793e-05} +{"train_loss": 0.001555882510729134, "global_step": 45332, "epoch": 380, "lr": 2.9805618845423843e-05} +{"train_loss": 0.0013754874235019088, "global_step": 45333, "epoch": 380, "lr": 2.98035920979714e-05} +{"train_loss": 0.001060162903741002, "global_step": 45334, "epoch": 380, "lr": 2.980156539017245e-05} +{"train_loss": 0.0020392155274748802, "global_step": 45335, "epoch": 380, "lr": 2.9799538722030968e-05} +{"train_loss": 0.0007550425361841917, "global_step": 45336, "epoch": 380, "lr": 2.979751209355094e-05} +{"train_loss": 0.0006777067319490016, "global_step": 45337, "epoch": 380, "lr": 2.979548550473632e-05} +{"train_loss": 0.0012828588075818447, "global_step": 45338, "epoch": 380, "lr": 2.979345895559113e-05, "val_loss": 0.012439101934432983, "train_action_mse_error": 1.7049205780494958e-05} +{"train_loss": 0.000806868018116802, "global_step": 45339, "epoch": 381, "lr": 2.97914324461193e-05} +{"train_loss": 0.0012760355602949858, "global_step": 45340, "epoch": 381, "lr": 2.978940597632486e-05} +{"train_loss": 0.001292491564527154, "global_step": 45341, "epoch": 381, "lr": 2.9787379546211752e-05} +{"train_loss": 0.0009851106442511082, "global_step": 45342, "epoch": 381, "lr": 2.9785353155783948e-05} +{"train_loss": 0.0013211286859586835, "global_step": 45343, "epoch": 381, "lr": 2.9783326805045464e-05} +{"train_loss": 0.0010136077180504799, "global_step": 45344, "epoch": 381, "lr": 2.9781300494000242e-05} +{"train_loss": 0.0008438862860202789, "global_step": 45345, "epoch": 381, "lr": 2.9779274222652297e-05} +{"train_loss": 0.0006677760393358767, "global_step": 45346, "epoch": 381, "lr": 2.9777247991005562e-05} +{"train_loss": 0.001251355279237032, "global_step": 45347, "epoch": 381, "lr": 2.977522179906406e-05} +{"train_loss": 0.002124092075973749, "global_step": 45348, "epoch": 381, "lr": 2.977319564683174e-05} +{"train_loss": 0.0005503961001522839, "global_step": 45349, "epoch": 381, "lr": 2.9771169534312583e-05} +{"train_loss": 0.001868935883976519, "global_step": 45350, "epoch": 381, "lr": 2.976914346151059e-05} +{"train_loss": 0.0006880423170514405, "global_step": 45351, "epoch": 381, "lr": 2.9767117428429703e-05} +{"train_loss": 0.000948412052821368, "global_step": 45352, "epoch": 381, "lr": 2.9765091435073943e-05} +{"train_loss": 0.0007721180445514619, "global_step": 45353, "epoch": 381, "lr": 2.976306548144724e-05} +{"train_loss": 0.0010633410420268774, "global_step": 45354, "epoch": 381, "lr": 2.976103956755362e-05} +{"train_loss": 0.0017933292547240853, "global_step": 45355, "epoch": 381, "lr": 2.975901369339703e-05} +{"train_loss": 0.0013186975847929716, "global_step": 45356, "epoch": 381, "lr": 2.9756987858981432e-05} +{"train_loss": 0.0011693374253809452, "global_step": 45357, "epoch": 381, "lr": 2.9754962064310853e-05} +{"train_loss": 0.0008030556491576135, "global_step": 45358, "epoch": 381, "lr": 2.9752936309389222e-05} +{"train_loss": 0.001251200563274324, "global_step": 45359, "epoch": 381, "lr": 2.975091059422056e-05} +{"train_loss": 0.0008853881736285985, "global_step": 45360, "epoch": 381, "lr": 2.9748884918808817e-05} +{"train_loss": 0.0028259907849133015, "global_step": 45361, "epoch": 381, "lr": 2.9746859283157957e-05} +{"train_loss": 0.0013221862027421594, "global_step": 45362, "epoch": 381, "lr": 2.9744833687271993e-05} +{"train_loss": 0.001009867643006146, "global_step": 45363, "epoch": 381, "lr": 2.9742808131154864e-05} +{"train_loss": 0.0012072615791112185, "global_step": 45364, "epoch": 381, "lr": 2.974078261481058e-05} +{"train_loss": 0.0010355315171182156, "global_step": 45365, "epoch": 381, "lr": 2.9738757138243105e-05} +{"train_loss": 0.0016396201681345701, "global_step": 45366, "epoch": 381, "lr": 2.9736731701456418e-05} +{"train_loss": 0.0016890187980607152, "global_step": 45367, "epoch": 381, "lr": 2.9734706304454495e-05} +{"train_loss": 0.001078809262253344, "global_step": 45368, "epoch": 381, "lr": 2.9732680947241298e-05} +{"train_loss": 0.0007048160186968744, "global_step": 45369, "epoch": 381, "lr": 2.9730655629820835e-05} +{"train_loss": 0.0014828199055045843, "global_step": 45370, "epoch": 381, "lr": 2.9728630352197046e-05} +{"train_loss": 0.0007675511296838522, "global_step": 45371, "epoch": 381, "lr": 2.972660511437394e-05} +{"train_loss": 0.0007025389350019395, "global_step": 45372, "epoch": 381, "lr": 2.9724579916355465e-05} +{"train_loss": 0.0014319493202492595, "global_step": 45373, "epoch": 381, "lr": 2.9722554758145628e-05} +{"train_loss": 0.0011910900939255953, "global_step": 45374, "epoch": 381, "lr": 2.972052963974839e-05} +{"train_loss": 0.0013360767625272274, "global_step": 45375, "epoch": 381, "lr": 2.9718504561167704e-05} +{"train_loss": 0.000991769484244287, "global_step": 45376, "epoch": 381, "lr": 2.9716479522407592e-05} +{"train_loss": 0.0006895281258039176, "global_step": 45377, "epoch": 381, "lr": 2.9714454523471978e-05} +{"train_loss": 0.0009334303322248161, "global_step": 45378, "epoch": 381, "lr": 2.971242956436489e-05} +{"train_loss": 0.001195959048345685, "global_step": 45379, "epoch": 381, "lr": 2.9710404645090274e-05} +{"train_loss": 0.0014208421343937516, "global_step": 45380, "epoch": 381, "lr": 2.97083797656521e-05} +{"train_loss": 0.0007533362368121743, "global_step": 45381, "epoch": 381, "lr": 2.9706354926054357e-05} +{"train_loss": 0.0014919524546712637, "global_step": 45382, "epoch": 381, "lr": 2.9704330126301027e-05} +{"train_loss": 0.0011486038565635681, "global_step": 45383, "epoch": 381, "lr": 2.9702305366396067e-05} +{"train_loss": 0.0021610611584037542, "global_step": 45384, "epoch": 381, "lr": 2.970028064634346e-05} +{"train_loss": 0.0015448385383933783, "global_step": 45385, "epoch": 381, "lr": 2.9698255966147193e-05} +{"train_loss": 0.0010318176355212927, "global_step": 45386, "epoch": 381, "lr": 2.969623132581124e-05} +{"train_loss": 0.0010411706753075123, "global_step": 45387, "epoch": 381, "lr": 2.9694206725339545e-05} +{"train_loss": 0.001460105529986322, "global_step": 45388, "epoch": 381, "lr": 2.9692182164736125e-05} +{"train_loss": 0.000897781690582633, "global_step": 45389, "epoch": 381, "lr": 2.969015764400491e-05} +{"train_loss": 0.0013366795610636473, "global_step": 45390, "epoch": 381, "lr": 2.9688133163149935e-05} +{"train_loss": 0.00210754107683897, "global_step": 45391, "epoch": 381, "lr": 2.968610872217511e-05} +{"train_loss": 0.0011476501822471619, "global_step": 45392, "epoch": 381, "lr": 2.968408432108446e-05} +{"train_loss": 0.0008906296570785344, "global_step": 45393, "epoch": 381, "lr": 2.9682059959881947e-05} +{"train_loss": 0.0009474040125496686, "global_step": 45394, "epoch": 381, "lr": 2.968003563857151e-05} +{"train_loss": 0.0013687512837350368, "global_step": 45395, "epoch": 381, "lr": 2.9678011357157174e-05} +{"train_loss": 0.0015556763391941786, "global_step": 45396, "epoch": 381, "lr": 2.9675987115642877e-05} +{"train_loss": 0.0006923506734892726, "global_step": 45397, "epoch": 381, "lr": 2.9673962914032627e-05} +{"train_loss": 0.0010039809858426452, "global_step": 45398, "epoch": 381, "lr": 2.9671938752330364e-05} +{"train_loss": 0.0014915014617145061, "global_step": 45399, "epoch": 381, "lr": 2.9669914630540074e-05} +{"train_loss": 0.0009194681188091636, "global_step": 45400, "epoch": 381, "lr": 2.966789054866575e-05} +{"train_loss": 0.0009336127550341189, "global_step": 45401, "epoch": 381, "lr": 2.9665866506711332e-05} +{"train_loss": 0.002022214001044631, "global_step": 45402, "epoch": 381, "lr": 2.9663842504680835e-05} +{"train_loss": 0.001464154338464141, "global_step": 45403, "epoch": 381, "lr": 2.966181854257819e-05} +{"train_loss": 0.0007527204579673707, "global_step": 45404, "epoch": 381, "lr": 2.965979462040741e-05} +{"train_loss": 0.0007836284348741174, "global_step": 45405, "epoch": 381, "lr": 2.9657770738172446e-05} +{"train_loss": 0.001348907477222383, "global_step": 45406, "epoch": 381, "lr": 2.9655746895877262e-05} +{"train_loss": 0.001184102613478899, "global_step": 45407, "epoch": 381, "lr": 2.9653723093525864e-05} +{"train_loss": 0.0006733023328706622, "global_step": 45408, "epoch": 381, "lr": 2.9651699331122184e-05} +{"train_loss": 0.0009027197957038879, "global_step": 45409, "epoch": 381, "lr": 2.9649675608670246e-05} +{"train_loss": 0.0010142455575987697, "global_step": 45410, "epoch": 381, "lr": 2.964765192617399e-05} +{"train_loss": 0.0012670280411839485, "global_step": 45411, "epoch": 381, "lr": 2.964562828363737e-05} +{"train_loss": 0.0007276453543454409, "global_step": 45412, "epoch": 381, "lr": 2.9643604681064406e-05} +{"train_loss": 0.0006830046186223626, "global_step": 45413, "epoch": 381, "lr": 2.9641581118459044e-05} +{"train_loss": 0.0012329822639003396, "global_step": 45414, "epoch": 381, "lr": 2.963955759582526e-05} +{"train_loss": 0.001780731719918549, "global_step": 45415, "epoch": 381, "lr": 2.9637534113167032e-05} +{"train_loss": 0.0011483710259199142, "global_step": 45416, "epoch": 381, "lr": 2.963551067048833e-05} +{"train_loss": 0.0008725320803932846, "global_step": 45417, "epoch": 381, "lr": 2.9633487267793137e-05} +{"train_loss": 0.0018065697513520718, "global_step": 45418, "epoch": 381, "lr": 2.96314639050854e-05} +{"train_loss": 0.0013385118218138814, "global_step": 45419, "epoch": 381, "lr": 2.962944058236912e-05} +{"train_loss": 0.0010751321678981185, "global_step": 45420, "epoch": 381, "lr": 2.9627417299648242e-05} +{"train_loss": 0.0010799719020724297, "global_step": 45421, "epoch": 381, "lr": 2.9625394056926777e-05} +{"train_loss": 0.002547019859775901, "global_step": 45422, "epoch": 381, "lr": 2.9623370854208644e-05} +{"train_loss": 0.0017577260732650757, "global_step": 45423, "epoch": 381, "lr": 2.9621347691497877e-05} +{"train_loss": 0.0010525190737098455, "global_step": 45424, "epoch": 381, "lr": 2.961932456879841e-05} +{"train_loss": 0.0007233683718368411, "global_step": 45425, "epoch": 381, "lr": 2.9617301486114202e-05} +{"train_loss": 0.0012599739711731672, "global_step": 45426, "epoch": 381, "lr": 2.9615278443449267e-05} +{"train_loss": 0.0006786496960557997, "global_step": 45427, "epoch": 381, "lr": 2.961325544080753e-05} +{"train_loss": 0.0013399266172200441, "global_step": 45428, "epoch": 381, "lr": 2.9611232478193012e-05} +{"train_loss": 0.0014195862459018826, "global_step": 45429, "epoch": 381, "lr": 2.960920955560965e-05} +{"train_loss": 0.0021994183771312237, "global_step": 45430, "epoch": 381, "lr": 2.9607186673061428e-05} +{"train_loss": 0.0008045315044000745, "global_step": 45431, "epoch": 381, "lr": 2.960516383055232e-05} +{"train_loss": 0.0009697726927697659, "global_step": 45432, "epoch": 381, "lr": 2.9603141028086284e-05} +{"train_loss": 0.0009524696506559849, "global_step": 45433, "epoch": 381, "lr": 2.9601118265667306e-05} +{"train_loss": 0.0015288444701582193, "global_step": 45434, "epoch": 381, "lr": 2.959909554329935e-05} +{"train_loss": 0.0017845325637608767, "global_step": 45435, "epoch": 381, "lr": 2.9597072860986397e-05} +{"train_loss": 0.0016576419584453106, "global_step": 45436, "epoch": 381, "lr": 2.9595050218732422e-05} +{"train_loss": 0.0015498929424211383, "global_step": 45437, "epoch": 381, "lr": 2.9593027616541357e-05} +{"train_loss": 0.0017078218515962362, "global_step": 45438, "epoch": 381, "lr": 2.959100505441723e-05} +{"train_loss": 0.0009128700476139784, "global_step": 45439, "epoch": 381, "lr": 2.9588982532363963e-05} +{"train_loss": 0.0014834433095529675, "global_step": 45440, "epoch": 381, "lr": 2.958696005038557e-05} +{"train_loss": 0.0013072382425889373, "global_step": 45441, "epoch": 381, "lr": 2.9584937608485975e-05} +{"train_loss": 0.0015599720645695925, "global_step": 45442, "epoch": 381, "lr": 2.9582915206669197e-05} +{"train_loss": 0.0008348944247700274, "global_step": 45443, "epoch": 381, "lr": 2.9580892844939185e-05} +{"train_loss": 0.0019753011874854565, "global_step": 45444, "epoch": 381, "lr": 2.9578870523299886e-05} +{"train_loss": 0.0013802179601043463, "global_step": 45445, "epoch": 381, "lr": 2.9576848241755318e-05} +{"train_loss": 0.0010963339591398835, "global_step": 45446, "epoch": 381, "lr": 2.9574826000309395e-05} +{"train_loss": 0.0016178014921024442, "global_step": 45447, "epoch": 381, "lr": 2.9572803798966142e-05} +{"train_loss": 0.0031354683451354504, "global_step": 45448, "epoch": 381, "lr": 2.9570781637729506e-05} +{"train_loss": 0.0014808500418439507, "global_step": 45449, "epoch": 381, "lr": 2.9568759516603445e-05} +{"train_loss": 0.0006535275606438518, "global_step": 45450, "epoch": 381, "lr": 2.9566737435591962e-05} +{"train_loss": 0.0010280698770657182, "global_step": 45451, "epoch": 381, "lr": 2.9564715394698982e-05} +{"train_loss": 0.0020757601596415043, "global_step": 45452, "epoch": 381, "lr": 2.956269339392852e-05} +{"train_loss": 0.0018849349580705166, "global_step": 45453, "epoch": 381, "lr": 2.956067143328451e-05} +{"train_loss": 0.0009479372529312968, "global_step": 45454, "epoch": 381, "lr": 2.9558649512770954e-05} +{"train_loss": 0.001948955119587481, "global_step": 45455, "epoch": 381, "lr": 2.9556627632391808e-05} +{"train_loss": 0.0016804394545033574, "global_step": 45456, "epoch": 381, "lr": 2.9554605792151023e-05} +{"train_loss": 0.001268121270568525, "global_step": 45457, "epoch": 381, "lr": 2.9552583992052607e-05, "val_loss": 0.011561241932213306} +{"train_loss": 0.0013320251600816846, "global_step": 45458, "epoch": 382, "lr": 2.9550562232100476e-05} +{"train_loss": 0.0007487811963073909, "global_step": 45459, "epoch": 382, "lr": 2.9548540512298662e-05} +{"train_loss": 0.0009981825714930892, "global_step": 45460, "epoch": 382, "lr": 2.9546518832651092e-05} +{"train_loss": 0.0016642750706523657, "global_step": 45461, "epoch": 382, "lr": 2.9544497193161747e-05} +{"train_loss": 0.0014035258209332824, "global_step": 45462, "epoch": 382, "lr": 2.9542475593834595e-05} +{"train_loss": 0.0009077715803869069, "global_step": 45463, "epoch": 382, "lr": 2.9540454034673602e-05} +{"train_loss": 0.002505362732335925, "global_step": 45464, "epoch": 382, "lr": 2.9538432515682744e-05} +{"train_loss": 0.002295502694323659, "global_step": 45465, "epoch": 382, "lr": 2.9536411036865995e-05} +{"train_loss": 0.0016957215266302228, "global_step": 45466, "epoch": 382, "lr": 2.953438959822731e-05} +{"train_loss": 0.000652884307783097, "global_step": 45467, "epoch": 382, "lr": 2.9532368199770675e-05} +{"train_loss": 0.0006050340016372502, "global_step": 45468, "epoch": 382, "lr": 2.9530346841500033e-05} +{"train_loss": 0.0013224506983533502, "global_step": 45469, "epoch": 382, "lr": 2.9528325523419387e-05} +{"train_loss": 0.0014911193866282701, "global_step": 45470, "epoch": 382, "lr": 2.952630424553266e-05} +{"train_loss": 0.0006812900537624955, "global_step": 45471, "epoch": 382, "lr": 2.9524283007843872e-05} +{"train_loss": 0.0016256258822977543, "global_step": 45472, "epoch": 382, "lr": 2.9522261810356943e-05} +{"train_loss": 0.0011839339276775718, "global_step": 45473, "epoch": 382, "lr": 2.9520240653075892e-05} +{"train_loss": 0.0013515970204025507, "global_step": 45474, "epoch": 382, "lr": 2.951821953600466e-05} +{"train_loss": 0.0015151604311540723, "global_step": 45475, "epoch": 382, "lr": 2.9516198459147194e-05} +{"train_loss": 0.0013740877620875835, "global_step": 45476, "epoch": 382, "lr": 2.9514177422507505e-05} +{"train_loss": 0.0008089117472991347, "global_step": 45477, "epoch": 382, "lr": 2.9512156426089517e-05} +{"train_loss": 0.0014776450116187334, "global_step": 45478, "epoch": 382, "lr": 2.9510135469897236e-05} +{"train_loss": 0.002506946213543415, "global_step": 45479, "epoch": 382, "lr": 2.950811455393462e-05} +{"train_loss": 0.0012179852928966284, "global_step": 45480, "epoch": 382, "lr": 2.9506093678205616e-05} +{"train_loss": 0.0012587358942255378, "global_step": 45481, "epoch": 382, "lr": 2.9504072842714215e-05} +{"train_loss": 0.001295843510888517, "global_step": 45482, "epoch": 382, "lr": 2.9502052047464367e-05} +{"train_loss": 0.0015515891136601567, "global_step": 45483, "epoch": 382, "lr": 2.9500031292460074e-05} +{"train_loss": 0.000903064850717783, "global_step": 45484, "epoch": 382, "lr": 2.9498010577705254e-05} +{"train_loss": 0.0017480544047430158, "global_step": 45485, "epoch": 382, "lr": 2.9495989903203924e-05} +{"train_loss": 0.001992548815906048, "global_step": 45486, "epoch": 382, "lr": 2.949396926896002e-05} +{"train_loss": 0.0010123407701030374, "global_step": 45487, "epoch": 382, "lr": 2.94919486749775e-05} +{"train_loss": 0.0013538411585614085, "global_step": 45488, "epoch": 382, "lr": 2.948992812126037e-05} +{"train_loss": 0.0010125081753358245, "global_step": 45489, "epoch": 382, "lr": 2.948790760781256e-05} +{"train_loss": 0.0016442934283986688, "global_step": 45490, "epoch": 382, "lr": 2.948588713463806e-05} +{"train_loss": 0.0012373876525089145, "global_step": 45491, "epoch": 382, "lr": 2.9483866701740814e-05} +{"train_loss": 0.0013584387488663197, "global_step": 45492, "epoch": 382, "lr": 2.948184630912483e-05} +{"train_loss": 0.0013661672128364444, "global_step": 45493, "epoch": 382, "lr": 2.9479825956794038e-05} +{"train_loss": 0.0018892931984737515, "global_step": 45494, "epoch": 382, "lr": 2.9477805644752404e-05} +{"train_loss": 0.0013072520960122347, "global_step": 45495, "epoch": 382, "lr": 2.9475785373003917e-05} +{"train_loss": 0.0012249031569808722, "global_step": 45496, "epoch": 382, "lr": 2.9473765141552524e-05} +{"train_loss": 0.001535179209895432, "global_step": 45497, "epoch": 382, "lr": 2.9471744950402207e-05} +{"train_loss": 0.0016780898440629244, "global_step": 45498, "epoch": 382, "lr": 2.946972479955693e-05} +{"train_loss": 0.0007128462311811745, "global_step": 45499, "epoch": 382, "lr": 2.946770468902064e-05} +{"train_loss": 0.0017466903664171696, "global_step": 45500, "epoch": 382, "lr": 2.946568461879734e-05} +{"train_loss": 0.0010270006023347378, "global_step": 45501, "epoch": 382, "lr": 2.9463664588890948e-05} +{"train_loss": 0.0011002430692315102, "global_step": 45502, "epoch": 382, "lr": 2.9461644599305483e-05} +{"train_loss": 0.0012674141908064485, "global_step": 45503, "epoch": 382, "lr": 2.9459624650044858e-05} +{"train_loss": 0.0007808569353073835, "global_step": 45504, "epoch": 382, "lr": 2.94576047411131e-05} +{"train_loss": 0.0010514495661482215, "global_step": 45505, "epoch": 382, "lr": 2.9455584872514123e-05} +{"train_loss": 0.0007142230751924217, "global_step": 45506, "epoch": 382, "lr": 2.9453565044251898e-05} +{"train_loss": 0.0011455179192125797, "global_step": 45507, "epoch": 382, "lr": 2.9451545256330426e-05} +{"train_loss": 0.0006537465960718691, "global_step": 45508, "epoch": 382, "lr": 2.944952550875362e-05} +{"train_loss": 0.000795742787886411, "global_step": 45509, "epoch": 382, "lr": 2.9447505801525505e-05} +{"train_loss": 0.0010431812843307853, "global_step": 45510, "epoch": 382, "lr": 2.944548613464999e-05} +{"train_loss": 0.0006670482689514756, "global_step": 45511, "epoch": 382, "lr": 2.944346650813109e-05} +{"train_loss": 0.0011803176021203399, "global_step": 45512, "epoch": 382, "lr": 2.944144692197274e-05} +{"train_loss": 0.000945329840760678, "global_step": 45513, "epoch": 382, "lr": 2.9439427376178908e-05} +{"train_loss": 0.0014881431125104427, "global_step": 45514, "epoch": 382, "lr": 2.9437407870753562e-05} +{"train_loss": 0.0015302926767617464, "global_step": 45515, "epoch": 382, "lr": 2.9435388405700677e-05} +{"train_loss": 0.0008937863749451935, "global_step": 45516, "epoch": 382, "lr": 2.9433368981024202e-05} +{"train_loss": 0.0013821603497490287, "global_step": 45517, "epoch": 382, "lr": 2.9431349596728126e-05} +{"train_loss": 0.0017530176555737853, "global_step": 45518, "epoch": 382, "lr": 2.9429330252816372e-05} +{"train_loss": 0.0012379426043480635, "global_step": 45519, "epoch": 382, "lr": 2.942731094929295e-05} +{"train_loss": 0.0008560439455322921, "global_step": 45520, "epoch": 382, "lr": 2.9425291686161793e-05} +{"train_loss": 0.0011464980198070407, "global_step": 45521, "epoch": 382, "lr": 2.9423272463426894e-05} +{"train_loss": 0.0019314984092488885, "global_step": 45522, "epoch": 382, "lr": 2.9421253281092177e-05} +{"train_loss": 0.0016276297392323613, "global_step": 45523, "epoch": 382, "lr": 2.9419234139161656e-05} +{"train_loss": 0.00148283620364964, "global_step": 45524, "epoch": 382, "lr": 2.941721503763927e-05} +{"train_loss": 0.0012827202444896102, "global_step": 45525, "epoch": 382, "lr": 2.941519597652896e-05} +{"train_loss": 0.001226654858328402, "global_step": 45526, "epoch": 382, "lr": 2.9413176955834732e-05} +{"train_loss": 0.001425569411367178, "global_step": 45527, "epoch": 382, "lr": 2.941115797556051e-05} +{"train_loss": 0.0017470100428909063, "global_step": 45528, "epoch": 382, "lr": 2.940913903571031e-05} +{"train_loss": 0.0027889965567737818, "global_step": 45529, "epoch": 382, "lr": 2.9407120136288048e-05} +{"train_loss": 0.0009590423433110118, "global_step": 45530, "epoch": 382, "lr": 2.940510127729771e-05} +{"train_loss": 0.001378705259412527, "global_step": 45531, "epoch": 382, "lr": 2.9403082458743246e-05} +{"train_loss": 0.001045172568410635, "global_step": 45532, "epoch": 382, "lr": 2.9401063680628626e-05} +{"train_loss": 0.0012753005139529705, "global_step": 45533, "epoch": 382, "lr": 2.9399044942957844e-05} +{"train_loss": 0.0008508973405696452, "global_step": 45534, "epoch": 382, "lr": 2.9397026245734803e-05} +{"train_loss": 0.000685107777826488, "global_step": 45535, "epoch": 382, "lr": 2.939500758896353e-05} +{"train_loss": 0.0008422260289080441, "global_step": 45536, "epoch": 382, "lr": 2.939298897264795e-05} +{"train_loss": 0.0012937921565026045, "global_step": 45537, "epoch": 382, "lr": 2.9390970396792017e-05} +{"train_loss": 0.0009651014697737992, "global_step": 45538, "epoch": 382, "lr": 2.938895186139974e-05} +{"train_loss": 0.0020326923113316298, "global_step": 45539, "epoch": 382, "lr": 2.9386933366475024e-05} +{"train_loss": 0.001397289102897048, "global_step": 45540, "epoch": 382, "lr": 2.9384914912021888e-05} +{"train_loss": 0.001116719446144998, "global_step": 45541, "epoch": 382, "lr": 2.9382896498044245e-05} +{"train_loss": 0.0010387792717665434, "global_step": 45542, "epoch": 382, "lr": 2.9380878124546107e-05} +{"train_loss": 0.0008809274877421558, "global_step": 45543, "epoch": 382, "lr": 2.9378859791531403e-05} +{"train_loss": 0.0015723903197795153, "global_step": 45544, "epoch": 382, "lr": 2.9376841499004092e-05} +{"train_loss": 0.0009392501087859273, "global_step": 45545, "epoch": 382, "lr": 2.9374823246968165e-05} +{"train_loss": 0.0016244673170149326, "global_step": 45546, "epoch": 382, "lr": 2.9372805035427554e-05} +{"train_loss": 0.0009555916185490787, "global_step": 45547, "epoch": 382, "lr": 2.9370786864386245e-05} +{"train_loss": 0.0032339629251509905, "global_step": 45548, "epoch": 382, "lr": 2.9368768733848205e-05} +{"train_loss": 0.0014846152625977993, "global_step": 45549, "epoch": 382, "lr": 2.9366750643817364e-05} +{"train_loss": 0.0015023763990029693, "global_step": 45550, "epoch": 382, "lr": 2.9364732594297717e-05} +{"train_loss": 0.002807924058288336, "global_step": 45551, "epoch": 382, "lr": 2.9362714585293194e-05} +{"train_loss": 0.0013785434421151876, "global_step": 45552, "epoch": 382, "lr": 2.9360696616807804e-05} +{"train_loss": 0.0010964712128043175, "global_step": 45553, "epoch": 382, "lr": 2.9358678688845452e-05} +{"train_loss": 0.0015649126144126058, "global_step": 45554, "epoch": 382, "lr": 2.935666080141015e-05} +{"train_loss": 0.0007484181551262736, "global_step": 45555, "epoch": 382, "lr": 2.9354642954505846e-05} +{"train_loss": 0.0011524405563250184, "global_step": 45556, "epoch": 382, "lr": 2.935262514813647e-05} +{"train_loss": 0.001049463520757854, "global_step": 45557, "epoch": 382, "lr": 2.935060738230603e-05} +{"train_loss": 0.0021934385877102613, "global_step": 45558, "epoch": 382, "lr": 2.9348589657018445e-05} +{"train_loss": 0.0016299353446811438, "global_step": 45559, "epoch": 382, "lr": 2.9346571972277714e-05} +{"train_loss": 0.0010244211880490184, "global_step": 45560, "epoch": 382, "lr": 2.934455432808777e-05} +{"train_loss": 0.0010992652969434857, "global_step": 45561, "epoch": 382, "lr": 2.9342536724452607e-05} +{"train_loss": 0.0013381809694692492, "global_step": 45562, "epoch": 382, "lr": 2.934051916137615e-05} +{"train_loss": 0.002116599353030324, "global_step": 45563, "epoch": 382, "lr": 2.9338501638862383e-05} +{"train_loss": 0.0012184937950223684, "global_step": 45564, "epoch": 382, "lr": 2.9336484156915255e-05} +{"train_loss": 0.0009955228306353092, "global_step": 45565, "epoch": 382, "lr": 2.9334466715538735e-05} +{"train_loss": 0.0021389632020145655, "global_step": 45566, "epoch": 382, "lr": 2.9332449314736787e-05} +{"train_loss": 0.0011248881928622723, "global_step": 45567, "epoch": 382, "lr": 2.9330431954513372e-05} +{"train_loss": 0.0010433162096887827, "global_step": 45568, "epoch": 382, "lr": 2.9328414634872424e-05} +{"train_loss": 0.0013076099567115307, "global_step": 45569, "epoch": 382, "lr": 2.9326397355817947e-05} +{"train_loss": 0.0018643561052158475, "global_step": 45570, "epoch": 382, "lr": 2.9324380117353855e-05} +{"train_loss": 0.0013829340459778905, "global_step": 45571, "epoch": 382, "lr": 2.932236291948416e-05} +{"train_loss": 0.0011560246348381042, "global_step": 45572, "epoch": 382, "lr": 2.9320345762212776e-05} +{"train_loss": 0.0010592490434646606, "global_step": 45573, "epoch": 382, "lr": 2.93183286455437e-05} +{"train_loss": 0.0010548214195296168, "global_step": 45574, "epoch": 382, "lr": 2.931631156948088e-05} +{"train_loss": 0.0013932980364188552, "global_step": 45575, "epoch": 382, "lr": 2.9314294534028254e-05} +{"train_loss": 0.0013290264735687054, "global_step": 45576, "epoch": 382, "lr": 2.9312277539189818e-05, "val_loss": 0.03717904910445213} +{"train_loss": 0.0011061718687415123, "global_step": 45577, "epoch": 383, "lr": 2.9310260584969495e-05} +{"train_loss": 0.001472029252909124, "global_step": 45578, "epoch": 383, "lr": 2.9308243671371283e-05} +{"train_loss": 0.0010570967569947243, "global_step": 45579, "epoch": 383, "lr": 2.9306226798399106e-05} +{"train_loss": 0.0013951050350442529, "global_step": 45580, "epoch": 383, "lr": 2.9304209966056954e-05} +{"train_loss": 0.001930991536937654, "global_step": 45581, "epoch": 383, "lr": 2.9302193174348786e-05} +{"train_loss": 0.0009899601573124528, "global_step": 45582, "epoch": 383, "lr": 2.9300176423278524e-05} +{"train_loss": 0.000705212471075356, "global_step": 45583, "epoch": 383, "lr": 2.929815971285018e-05} +{"train_loss": 0.0012302164686843753, "global_step": 45584, "epoch": 383, "lr": 2.9296143043067665e-05} +{"train_loss": 0.0012771807378157973, "global_step": 45585, "epoch": 383, "lr": 2.929412641393498e-05} +{"train_loss": 0.0010366691276431084, "global_step": 45586, "epoch": 383, "lr": 2.9292109825456072e-05} +{"train_loss": 0.0007119915098883212, "global_step": 45587, "epoch": 383, "lr": 2.9290093277634866e-05} +{"train_loss": 0.0013694402296096087, "global_step": 45588, "epoch": 383, "lr": 2.928807677047537e-05} +{"train_loss": 0.0011878848308697343, "global_step": 45589, "epoch": 383, "lr": 2.9286060303981505e-05} +{"train_loss": 0.001123230904340744, "global_step": 45590, "epoch": 383, "lr": 2.9284043878157268e-05} +{"train_loss": 0.000838909181766212, "global_step": 45591, "epoch": 383, "lr": 2.928202749300658e-05} +{"train_loss": 0.0012565989745780826, "global_step": 45592, "epoch": 383, "lr": 2.9280011148533432e-05} +{"train_loss": 0.0005951251368969679, "global_step": 45593, "epoch": 383, "lr": 2.9277994844741764e-05} +{"train_loss": 0.0022017364390194416, "global_step": 45594, "epoch": 383, "lr": 2.927597858163553e-05} +{"train_loss": 0.001049791811965406, "global_step": 45595, "epoch": 383, "lr": 2.9273962359218708e-05} +{"train_loss": 0.0017372826114296913, "global_step": 45596, "epoch": 383, "lr": 2.9271946177495245e-05} +{"train_loss": 0.0012105242349207401, "global_step": 45597, "epoch": 383, "lr": 2.9269930036469096e-05} +{"train_loss": 0.0010994356125593185, "global_step": 45598, "epoch": 383, "lr": 2.9267913936144242e-05} +{"train_loss": 0.0011638881405815482, "global_step": 45599, "epoch": 383, "lr": 2.92658978765246e-05} +{"train_loss": 0.0009701087255962193, "global_step": 45600, "epoch": 383, "lr": 2.9263881857614172e-05} +{"train_loss": 0.0012777755036950111, "global_step": 45601, "epoch": 383, "lr": 2.9261865879416876e-05} +{"train_loss": 0.0007385602802969515, "global_step": 45602, "epoch": 383, "lr": 2.9259849941936712e-05} +{"train_loss": 0.001183719257824123, "global_step": 45603, "epoch": 383, "lr": 2.9257834045177603e-05} +{"train_loss": 0.0016050181584432721, "global_step": 45604, "epoch": 383, "lr": 2.9255818189143536e-05} +{"train_loss": 0.0011066754814237356, "global_step": 45605, "epoch": 383, "lr": 2.9253802373838445e-05} +{"train_loss": 0.0008668733644299209, "global_step": 45606, "epoch": 383, "lr": 2.9251786599266285e-05} +{"train_loss": 0.0011260004248470068, "global_step": 45607, "epoch": 383, "lr": 2.924977086543105e-05} +{"train_loss": 0.0006512143299914896, "global_step": 45608, "epoch": 383, "lr": 2.9247755172336644e-05} +{"train_loss": 0.0007244909647852182, "global_step": 45609, "epoch": 383, "lr": 2.9245739519987082e-05} +{"train_loss": 0.0022637525107711554, "global_step": 45610, "epoch": 383, "lr": 2.9243723908386266e-05} +{"train_loss": 0.0013648229651153088, "global_step": 45611, "epoch": 383, "lr": 2.9241708337538205e-05} +{"train_loss": 0.0015305883716791868, "global_step": 45612, "epoch": 383, "lr": 2.9239692807446817e-05} +{"train_loss": 0.0008325165254063904, "global_step": 45613, "epoch": 383, "lr": 2.923767731811608e-05} +{"train_loss": 0.0017036780482158065, "global_step": 45614, "epoch": 383, "lr": 2.9235661869549945e-05} +{"train_loss": 0.0014806060353294015, "global_step": 45615, "epoch": 383, "lr": 2.923364646175235e-05} +{"train_loss": 0.0014607098419219255, "global_step": 45616, "epoch": 383, "lr": 2.9231631094727308e-05} +{"train_loss": 0.0013267785543575883, "global_step": 45617, "epoch": 383, "lr": 2.9229615768478725e-05} +{"train_loss": 0.001939781941473484, "global_step": 45618, "epoch": 383, "lr": 2.9227600483010558e-05} +{"train_loss": 0.0007644777651876211, "global_step": 45619, "epoch": 383, "lr": 2.9225585238326803e-05} +{"train_loss": 0.0011704381322488189, "global_step": 45620, "epoch": 383, "lr": 2.9223570034431368e-05} +{"train_loss": 0.0006682885577902198, "global_step": 45621, "epoch": 383, "lr": 2.922155487132825e-05} +{"train_loss": 0.0011616171104833484, "global_step": 45622, "epoch": 383, "lr": 2.9219539749021373e-05} +{"train_loss": 0.0010720849968492985, "global_step": 45623, "epoch": 383, "lr": 2.9217524667514728e-05} +{"train_loss": 0.0021889961790293455, "global_step": 45624, "epoch": 383, "lr": 2.9215509626812255e-05} +{"train_loss": 0.0011065138969570398, "global_step": 45625, "epoch": 383, "lr": 2.9213494626917888e-05} +{"train_loss": 0.0016733427764847875, "global_step": 45626, "epoch": 383, "lr": 2.921147966783562e-05} +{"train_loss": 0.0011972178472205997, "global_step": 45627, "epoch": 383, "lr": 2.9209464749569376e-05} +{"train_loss": 0.001465403358452022, "global_step": 45628, "epoch": 383, "lr": 2.9207449872123132e-05} +{"train_loss": 0.0007340105366893113, "global_step": 45629, "epoch": 383, "lr": 2.920543503550084e-05} +{"train_loss": 0.0011463360860943794, "global_step": 45630, "epoch": 383, "lr": 2.920342023970646e-05} +{"train_loss": 0.0008204529876820743, "global_step": 45631, "epoch": 383, "lr": 2.920140548474395e-05} +{"train_loss": 0.001657299231737852, "global_step": 45632, "epoch": 383, "lr": 2.9199390770617236e-05} +{"train_loss": 0.0009342811536043882, "global_step": 45633, "epoch": 383, "lr": 2.9197376097330313e-05} +{"train_loss": 0.000821401656139642, "global_step": 45634, "epoch": 383, "lr": 2.9195361464887106e-05} +{"train_loss": 0.0012625360395759344, "global_step": 45635, "epoch": 383, "lr": 2.9193346873291605e-05} +{"train_loss": 0.0015687168342992663, "global_step": 45636, "epoch": 383, "lr": 2.9191332322547728e-05} +{"train_loss": 0.0007285749888978899, "global_step": 45637, "epoch": 383, "lr": 2.9189317812659454e-05} +{"train_loss": 0.0009608793188817799, "global_step": 45638, "epoch": 383, "lr": 2.9187303343630722e-05} +{"train_loss": 0.0016122519737109542, "global_step": 45639, "epoch": 383, "lr": 2.918528891546549e-05} +{"train_loss": 0.0023108923342078924, "global_step": 45640, "epoch": 383, "lr": 2.918327452816774e-05} +{"train_loss": 0.0012644656235352159, "global_step": 45641, "epoch": 383, "lr": 2.9181260181741387e-05} +{"train_loss": 0.00109454698394984, "global_step": 45642, "epoch": 383, "lr": 2.917924587619043e-05} +{"train_loss": 0.0011045682476833463, "global_step": 45643, "epoch": 383, "lr": 2.9177231611518794e-05} +{"train_loss": 0.0013869496760889888, "global_step": 45644, "epoch": 383, "lr": 2.9175217387730424e-05} +{"train_loss": 0.002261468907818198, "global_step": 45645, "epoch": 383, "lr": 2.9173203204829303e-05} +{"train_loss": 0.0009524922934360802, "global_step": 45646, "epoch": 383, "lr": 2.917118906281936e-05} +{"train_loss": 0.0014468200970441103, "global_step": 45647, "epoch": 383, "lr": 2.9169174961704577e-05} +{"train_loss": 0.0011463192058727145, "global_step": 45648, "epoch": 383, "lr": 2.9167160901488893e-05} +{"train_loss": 0.0008640460437163711, "global_step": 45649, "epoch": 383, "lr": 2.916514688217624e-05} +{"train_loss": 0.0010324071627110243, "global_step": 45650, "epoch": 383, "lr": 2.9163132903770622e-05} +{"train_loss": 0.0009668035199865699, "global_step": 45651, "epoch": 383, "lr": 2.9161118966275945e-05} +{"train_loss": 0.0011570638744160533, "global_step": 45652, "epoch": 383, "lr": 2.9159105069696202e-05} +{"train_loss": 0.0013166350545361638, "global_step": 45653, "epoch": 383, "lr": 2.9157091214035313e-05} +{"train_loss": 0.0006242466624826193, "global_step": 45654, "epoch": 383, "lr": 2.915507739929727e-05} +{"train_loss": 0.001288960105739534, "global_step": 45655, "epoch": 383, "lr": 2.9153063625486e-05} +{"train_loss": 0.001542864483781159, "global_step": 45656, "epoch": 383, "lr": 2.915104989260544e-05} +{"train_loss": 0.0008038808009587228, "global_step": 45657, "epoch": 383, "lr": 2.9149036200659595e-05} +{"train_loss": 0.0015675510512664914, "global_step": 45658, "epoch": 383, "lr": 2.914702254965237e-05} +{"train_loss": 0.0016002116026356816, "global_step": 45659, "epoch": 383, "lr": 2.9145008939587754e-05} +{"train_loss": 0.0011779048945754766, "global_step": 45660, "epoch": 383, "lr": 2.914299537046966e-05} +{"train_loss": 0.0013416369911283255, "global_step": 45661, "epoch": 383, "lr": 2.9140981842302094e-05} +{"train_loss": 0.0016820463351905346, "global_step": 45662, "epoch": 383, "lr": 2.913896835508898e-05} +{"train_loss": 0.001046429155394435, "global_step": 45663, "epoch": 383, "lr": 2.9136954908834257e-05} +{"train_loss": 0.001485136803239584, "global_step": 45664, "epoch": 383, "lr": 2.9134941503541907e-05} +{"train_loss": 0.001230746041983366, "global_step": 45665, "epoch": 383, "lr": 2.9132928139215855e-05} +{"train_loss": 0.0008076818194240332, "global_step": 45666, "epoch": 383, "lr": 2.9130914815860082e-05} +{"train_loss": 0.0008890443132258952, "global_step": 45667, "epoch": 383, "lr": 2.9128901533478515e-05} +{"train_loss": 0.0013364111073315144, "global_step": 45668, "epoch": 383, "lr": 2.912688829207514e-05} +{"train_loss": 0.0015334312338382006, "global_step": 45669, "epoch": 383, "lr": 2.912487509165387e-05} +{"train_loss": 0.0010110692819580436, "global_step": 45670, "epoch": 383, "lr": 2.9122861932218694e-05} +{"train_loss": 0.0007265214226208627, "global_step": 45671, "epoch": 383, "lr": 2.9120848813773526e-05} +{"train_loss": 0.001934374333359301, "global_step": 45672, "epoch": 383, "lr": 2.911883573632237e-05} +{"train_loss": 0.0012749505694955587, "global_step": 45673, "epoch": 383, "lr": 2.9116822699869117e-05} +{"train_loss": 0.001281635370105505, "global_step": 45674, "epoch": 383, "lr": 2.9114809704417782e-05} +{"train_loss": 0.0013039209879934788, "global_step": 45675, "epoch": 383, "lr": 2.9112796749972264e-05} +{"train_loss": 0.001704343594610691, "global_step": 45676, "epoch": 383, "lr": 2.911078383653656e-05} +{"train_loss": 0.0016427998198196292, "global_step": 45677, "epoch": 383, "lr": 2.9108770964114574e-05} +{"train_loss": 0.001697394298389554, "global_step": 45678, "epoch": 383, "lr": 2.910675813271031e-05} +{"train_loss": 0.0009124582284130156, "global_step": 45679, "epoch": 383, "lr": 2.910474534232767e-05} +{"train_loss": 0.0012342238333076239, "global_step": 45680, "epoch": 383, "lr": 2.9102732592970655e-05} +{"train_loss": 0.0008477161172777414, "global_step": 45681, "epoch": 383, "lr": 2.910071988464319e-05} +{"train_loss": 0.0008632119279354811, "global_step": 45682, "epoch": 383, "lr": 2.909870721734921e-05} +{"train_loss": 0.0011963238939642906, "global_step": 45683, "epoch": 383, "lr": 2.90966945910927e-05} +{"train_loss": 0.0012124743079766631, "global_step": 45684, "epoch": 383, "lr": 2.9094682005877584e-05} +{"train_loss": 0.0013296559918671846, "global_step": 45685, "epoch": 383, "lr": 2.9092669461707843e-05} +{"train_loss": 0.0013549712020903826, "global_step": 45686, "epoch": 383, "lr": 2.9090656958587416e-05} +{"train_loss": 0.001913984538987279, "global_step": 45687, "epoch": 383, "lr": 2.9088644496520222e-05} +{"train_loss": 0.001389615354128182, "global_step": 45688, "epoch": 383, "lr": 2.9086632075510268e-05} +{"train_loss": 0.0011141349095851183, "global_step": 45689, "epoch": 383, "lr": 2.908461969556145e-05} +{"train_loss": 0.0008009641896933317, "global_step": 45690, "epoch": 383, "lr": 2.9082607356677772e-05} +{"train_loss": 0.0010225920705124736, "global_step": 45691, "epoch": 383, "lr": 2.9080595058863135e-05} +{"train_loss": 0.0017306992085650563, "global_step": 45692, "epoch": 383, "lr": 2.9078582802121546e-05} +{"train_loss": 0.0011795603204518557, "global_step": 45693, "epoch": 383, "lr": 2.9076570586456915e-05} +{"train_loss": 0.001037666923366487, "global_step": 45694, "epoch": 383, "lr": 2.9074558411873182e-05} +{"train_loss": 0.0012401776885253791, "global_step": 45695, "epoch": 383, "lr": 2.907254627837434e-05, "val_loss": 0.021749749779701233} +{"train_loss": 0.001207001507282257, "global_step": 45696, "epoch": 384, "lr": 2.90705341859643e-05} +{"train_loss": 0.001705317059531808, "global_step": 45697, "epoch": 384, "lr": 2.9068522134647046e-05} +{"train_loss": 0.0008636596612632275, "global_step": 45698, "epoch": 384, "lr": 2.9066510124426495e-05} +{"train_loss": 0.0017934603383764625, "global_step": 45699, "epoch": 384, "lr": 2.9064498155306636e-05} +{"train_loss": 0.001333103864453733, "global_step": 45700, "epoch": 384, "lr": 2.9062486227291398e-05} +{"train_loss": 0.0017807381227612495, "global_step": 45701, "epoch": 384, "lr": 2.9060474340384713e-05} +{"train_loss": 0.001315110013820231, "global_step": 45702, "epoch": 384, "lr": 2.9058462494590543e-05} +{"train_loss": 0.001187894376926124, "global_step": 45703, "epoch": 384, "lr": 2.9056450689912874e-05} +{"train_loss": 0.0009712175233289599, "global_step": 45704, "epoch": 384, "lr": 2.90544389263556e-05} +{"train_loss": 0.0011818943312391639, "global_step": 45705, "epoch": 384, "lr": 2.9052427203922715e-05} +{"train_loss": 0.000756163033656776, "global_step": 45706, "epoch": 384, "lr": 2.9050415522618136e-05} +{"train_loss": 0.0014230910455808043, "global_step": 45707, "epoch": 384, "lr": 2.9048403882445846e-05} +{"train_loss": 0.002543595153838396, "global_step": 45708, "epoch": 384, "lr": 2.9046392283409762e-05} +{"train_loss": 0.001313531887717545, "global_step": 45709, "epoch": 384, "lr": 2.9044380725513858e-05} +{"train_loss": 0.0014086108421906829, "global_step": 45710, "epoch": 384, "lr": 2.9042369208762065e-05} +{"train_loss": 0.0007983227842487395, "global_step": 45711, "epoch": 384, "lr": 2.9040357733158353e-05} +{"train_loss": 0.0014140777057036757, "global_step": 45712, "epoch": 384, "lr": 2.9038346298706666e-05} +{"train_loss": 0.001174830598756671, "global_step": 45713, "epoch": 384, "lr": 2.9036334905410917e-05} +{"train_loss": 0.0008246408542618155, "global_step": 45714, "epoch": 384, "lr": 2.903432355327511e-05} +{"train_loss": 0.0012247080449014902, "global_step": 45715, "epoch": 384, "lr": 2.903231224230315e-05} +{"train_loss": 0.0007990350131876767, "global_step": 45716, "epoch": 384, "lr": 2.9030300972499024e-05} +{"train_loss": 0.001442868378944695, "global_step": 45717, "epoch": 384, "lr": 2.9028289743866666e-05} +{"train_loss": 0.0015082418685778975, "global_step": 45718, "epoch": 384, "lr": 2.902627855640999e-05} +{"train_loss": 0.0016414704732596874, "global_step": 45719, "epoch": 384, "lr": 2.9024267410133006e-05} +{"train_loss": 0.001398697728291154, "global_step": 45720, "epoch": 384, "lr": 2.9022256305039608e-05} +{"train_loss": 0.0008889977470971644, "global_step": 45721, "epoch": 384, "lr": 2.9020245241133787e-05} +{"train_loss": 0.002718882169574499, "global_step": 45722, "epoch": 384, "lr": 2.9018234218419455e-05} +{"train_loss": 0.0015947100473567843, "global_step": 45723, "epoch": 384, "lr": 2.90162232369006e-05} +{"train_loss": 0.00038888389826752245, "global_step": 45724, "epoch": 384, "lr": 2.9014212296581143e-05} +{"train_loss": 0.001525707426480949, "global_step": 45725, "epoch": 384, "lr": 2.9012201397465022e-05} +{"train_loss": 0.0015180263435468078, "global_step": 45726, "epoch": 384, "lr": 2.9010190539556225e-05} +{"train_loss": 0.001065877266228199, "global_step": 45727, "epoch": 384, "lr": 2.9008179722858653e-05} +{"train_loss": 0.0009758552187122405, "global_step": 45728, "epoch": 384, "lr": 2.9006168947376295e-05} +{"train_loss": 0.0007927209953777492, "global_step": 45729, "epoch": 384, "lr": 2.9004158213113064e-05} +{"train_loss": 0.0013163841795176268, "global_step": 45730, "epoch": 384, "lr": 2.900214752007294e-05} +{"train_loss": 0.0009231423027813435, "global_step": 45731, "epoch": 384, "lr": 2.9000136868259863e-05} +{"train_loss": 0.0023221815936267376, "global_step": 45732, "epoch": 384, "lr": 2.8998126257677754e-05} +{"train_loss": 0.001265668193809688, "global_step": 45733, "epoch": 384, "lr": 2.89961156883306e-05} +{"train_loss": 0.0010495861060917377, "global_step": 45734, "epoch": 384, "lr": 2.8994105160222307e-05} +{"train_loss": 0.0010937921470031142, "global_step": 45735, "epoch": 384, "lr": 2.899209467335686e-05} +{"train_loss": 0.0011359343770891428, "global_step": 45736, "epoch": 384, "lr": 2.899008422773818e-05} +{"train_loss": 0.0010701969731599092, "global_step": 45737, "epoch": 384, "lr": 2.8988073823370222e-05} +{"train_loss": 0.0017981166020035744, "global_step": 45738, "epoch": 384, "lr": 2.898606346025695e-05} +{"train_loss": 0.0011822902597486973, "global_step": 45739, "epoch": 384, "lr": 2.8984053138402277e-05} +{"train_loss": 0.001582463039085269, "global_step": 45740, "epoch": 384, "lr": 2.8982042857810198e-05} +{"train_loss": 0.0018512682290747762, "global_step": 45741, "epoch": 384, "lr": 2.8980032618484608e-05} +{"train_loss": 0.0014318866888061166, "global_step": 45742, "epoch": 384, "lr": 2.8978022420429506e-05} +{"train_loss": 0.0015824746806174517, "global_step": 45743, "epoch": 384, "lr": 2.8976012263648805e-05} +{"train_loss": 0.0011715113651007414, "global_step": 45744, "epoch": 384, "lr": 2.8974002148146438e-05} +{"train_loss": 0.0008391142473556101, "global_step": 45745, "epoch": 384, "lr": 2.897199207392639e-05} +{"train_loss": 0.0011844938853755593, "global_step": 45746, "epoch": 384, "lr": 2.8969982040992572e-05} +{"train_loss": 0.0007571281166747212, "global_step": 45747, "epoch": 384, "lr": 2.8967972049348967e-05} +{"train_loss": 0.0009675088804215193, "global_step": 45748, "epoch": 384, "lr": 2.8965962098999476e-05} +{"train_loss": 0.0034356596879661083, "global_step": 45749, "epoch": 384, "lr": 2.8963952189948095e-05} +{"train_loss": 0.0009233999880962074, "global_step": 45750, "epoch": 384, "lr": 2.8961942322198753e-05} +{"train_loss": 0.0013058644253760576, "global_step": 45751, "epoch": 384, "lr": 2.895993249575536e-05} +{"train_loss": 0.001329856808297336, "global_step": 45752, "epoch": 384, "lr": 2.895792271062192e-05} +{"train_loss": 0.0009565411601215601, "global_step": 45753, "epoch": 384, "lr": 2.8955912966802323e-05} +{"train_loss": 0.0015319088706746697, "global_step": 45754, "epoch": 384, "lr": 2.895390326430057e-05} +{"train_loss": 0.0013547042617574334, "global_step": 45755, "epoch": 384, "lr": 2.895189360312057e-05} +{"train_loss": 0.0013541907537728548, "global_step": 45756, "epoch": 384, "lr": 2.894988398326627e-05} +{"train_loss": 0.0011564946034923196, "global_step": 45757, "epoch": 384, "lr": 2.8947874404741636e-05} +{"train_loss": 0.0012551749823614955, "global_step": 45758, "epoch": 384, "lr": 2.8945864867550587e-05} +{"train_loss": 0.0012165121734142303, "global_step": 45759, "epoch": 384, "lr": 2.8943855371697098e-05} +{"train_loss": 0.0019447763916105032, "global_step": 45760, "epoch": 384, "lr": 2.8941845917185084e-05} +{"train_loss": 0.0018506519263610244, "global_step": 45761, "epoch": 384, "lr": 2.8939836504018524e-05} +{"train_loss": 0.0014208327047526836, "global_step": 45762, "epoch": 384, "lr": 2.8937827132201345e-05} +{"train_loss": 0.0012575925793498755, "global_step": 45763, "epoch": 384, "lr": 2.893581780173747e-05} +{"train_loss": 0.0011011025635525584, "global_step": 45764, "epoch": 384, "lr": 2.8933808512630888e-05} +{"train_loss": 0.002416041446849704, "global_step": 45765, "epoch": 384, "lr": 2.8931799264885502e-05} +{"train_loss": 0.0019445819780230522, "global_step": 45766, "epoch": 384, "lr": 2.8929790058505296e-05} +{"train_loss": 0.0008449901943095028, "global_step": 45767, "epoch": 384, "lr": 2.8927780893494178e-05} +{"train_loss": 0.0020117133390158415, "global_step": 45768, "epoch": 384, "lr": 2.892577176985613e-05} +{"train_loss": 0.0007647101301699877, "global_step": 45769, "epoch": 384, "lr": 2.8923762687595057e-05} +{"train_loss": 0.0008565702592022717, "global_step": 45770, "epoch": 384, "lr": 2.8921753646714944e-05} +{"train_loss": 0.0009885045001283288, "global_step": 45771, "epoch": 384, "lr": 2.8919744647219705e-05} +{"train_loss": 0.0009732170728966594, "global_step": 45772, "epoch": 384, "lr": 2.8917735689113278e-05} +{"train_loss": 0.0020722956396639347, "global_step": 45773, "epoch": 384, "lr": 2.891572677239966e-05} +{"train_loss": 0.0014922558329999447, "global_step": 45774, "epoch": 384, "lr": 2.8913717897082752e-05} +{"train_loss": 0.0013832947006449103, "global_step": 45775, "epoch": 384, "lr": 2.8911709063166494e-05} +{"train_loss": 0.0009658864582888782, "global_step": 45776, "epoch": 384, "lr": 2.8909700270654855e-05} +{"train_loss": 0.001770846894942224, "global_step": 45777, "epoch": 384, "lr": 2.890769151955175e-05} +{"train_loss": 0.0015846636379137635, "global_step": 45778, "epoch": 384, "lr": 2.8905682809861158e-05} +{"train_loss": 0.001651595812290907, "global_step": 45779, "epoch": 384, "lr": 2.890367414158698e-05} +{"train_loss": 0.0011742445640265942, "global_step": 45780, "epoch": 384, "lr": 2.890166551473321e-05} +{"train_loss": 0.001704822527244687, "global_step": 45781, "epoch": 384, "lr": 2.8899656929303763e-05} +{"train_loss": 0.001793454634025693, "global_step": 45782, "epoch": 384, "lr": 2.8897648385302566e-05} +{"train_loss": 0.0008731198613531888, "global_step": 45783, "epoch": 384, "lr": 2.88956398827336e-05} +{"train_loss": 0.0011227208888158202, "global_step": 45784, "epoch": 384, "lr": 2.8893631421600775e-05} +{"train_loss": 0.0011756446911022067, "global_step": 45785, "epoch": 384, "lr": 2.8891623001908063e-05} +{"train_loss": 0.0010309879435226321, "global_step": 45786, "epoch": 384, "lr": 2.88896146236594e-05} +{"train_loss": 0.0009413764346390963, "global_step": 45787, "epoch": 384, "lr": 2.8887606286858703e-05} +{"train_loss": 0.0009802061831578612, "global_step": 45788, "epoch": 384, "lr": 2.888559799150995e-05} +{"train_loss": 0.0016638635424897075, "global_step": 45789, "epoch": 384, "lr": 2.8883589737617055e-05} +{"train_loss": 0.0007677296525798738, "global_step": 45790, "epoch": 384, "lr": 2.8881581525183998e-05} +{"train_loss": 0.0008640193846076727, "global_step": 45791, "epoch": 384, "lr": 2.8879573354214674e-05} +{"train_loss": 0.0011133610969409347, "global_step": 45792, "epoch": 384, "lr": 2.887756522471307e-05} +{"train_loss": 0.001301993033848703, "global_step": 45793, "epoch": 384, "lr": 2.887555713668312e-05} +{"train_loss": 0.0013310187496244907, "global_step": 45794, "epoch": 384, "lr": 2.8873549090128725e-05} +{"train_loss": 0.0013306194450706244, "global_step": 45795, "epoch": 384, "lr": 2.8871541085053887e-05} +{"train_loss": 0.0019362537423148751, "global_step": 45796, "epoch": 384, "lr": 2.88695331214625e-05} +{"train_loss": 0.0015190460253506899, "global_step": 45797, "epoch": 384, "lr": 2.886752519935854e-05} +{"train_loss": 0.001031120540574193, "global_step": 45798, "epoch": 384, "lr": 2.8865517318745928e-05} +{"train_loss": 0.0018755971686914563, "global_step": 45799, "epoch": 384, "lr": 2.8863509479628626e-05} +{"train_loss": 0.0021142789628356695, "global_step": 45800, "epoch": 384, "lr": 2.886150168201055e-05} +{"train_loss": 0.0011198886204510927, "global_step": 45801, "epoch": 384, "lr": 2.8859493925895677e-05} +{"train_loss": 0.0007438117754645646, "global_step": 45802, "epoch": 384, "lr": 2.8857486211287898e-05} +{"train_loss": 0.002793539548292756, "global_step": 45803, "epoch": 384, "lr": 2.8855478538191218e-05} +{"train_loss": 0.000848481897264719, "global_step": 45804, "epoch": 384, "lr": 2.8853470906609527e-05} +{"train_loss": 0.0011149848578497767, "global_step": 45805, "epoch": 384, "lr": 2.8851463316546802e-05} +{"train_loss": 0.0014227342326194048, "global_step": 45806, "epoch": 384, "lr": 2.884945576800695e-05} +{"train_loss": 0.0012194121954962611, "global_step": 45807, "epoch": 384, "lr": 2.8847448260993954e-05} +{"train_loss": 0.0011793524026870728, "global_step": 45808, "epoch": 384, "lr": 2.8845440795511714e-05} +{"train_loss": 0.0014801829820498824, "global_step": 45809, "epoch": 384, "lr": 2.8843433371564212e-05} +{"train_loss": 0.0019593797624111176, "global_step": 45810, "epoch": 384, "lr": 2.8841425989155345e-05} +{"train_loss": 0.002355860313400626, "global_step": 45811, "epoch": 384, "lr": 2.8839418648289097e-05} +{"train_loss": 0.0010229895124211907, "global_step": 45812, "epoch": 384, "lr": 2.883741134896939e-05} +{"train_loss": 0.0017245403723791242, "global_step": 45813, "epoch": 384, "lr": 2.8835404091200145e-05} +{"train_loss": 0.0013710149676840315, "global_step": 45814, "epoch": 384, "lr": 2.8833396874985346e-05, "val_loss": 0.027184057980775833} +{"train_loss": 0.001294861314818263, "global_step": 45815, "epoch": 385, "lr": 2.8831389700328894e-05} +{"train_loss": 0.0014230606611818075, "global_step": 45816, "epoch": 385, "lr": 2.882938256723476e-05} +{"train_loss": 0.000987432198598981, "global_step": 45817, "epoch": 385, "lr": 2.8827375475706852e-05} +{"train_loss": 0.0014740527840331197, "global_step": 45818, "epoch": 385, "lr": 2.8825368425749154e-05} +{"train_loss": 0.0010772272944450378, "global_step": 45819, "epoch": 385, "lr": 2.882336141736558e-05} +{"train_loss": 0.001434958423487842, "global_step": 45820, "epoch": 385, "lr": 2.8821354450560056e-05} +{"train_loss": 0.0015251052100211382, "global_step": 45821, "epoch": 385, "lr": 2.8819347525336558e-05} +{"train_loss": 0.0009023130987770855, "global_step": 45822, "epoch": 385, "lr": 2.8817340641698987e-05} +{"train_loss": 0.000913699041120708, "global_step": 45823, "epoch": 385, "lr": 2.8815333799651322e-05} +{"train_loss": 0.0019815589766949415, "global_step": 45824, "epoch": 385, "lr": 2.8813326999197492e-05} +{"train_loss": 0.0015796676743775606, "global_step": 45825, "epoch": 385, "lr": 2.8811320240341412e-05} +{"train_loss": 0.001046077231876552, "global_step": 45826, "epoch": 385, "lr": 2.8809313523087054e-05} +{"train_loss": 0.0011794496094807982, "global_step": 45827, "epoch": 385, "lr": 2.880730684743833e-05} +{"train_loss": 0.0011964929290115833, "global_step": 45828, "epoch": 385, "lr": 2.8805300213399218e-05} +{"train_loss": 0.0008620015578344464, "global_step": 45829, "epoch": 385, "lr": 2.880329362097361e-05} +{"train_loss": 0.0016015195287764072, "global_step": 45830, "epoch": 385, "lr": 2.8801287070165488e-05} +{"train_loss": 0.0011095290537923574, "global_step": 45831, "epoch": 385, "lr": 2.879928056097878e-05} +{"train_loss": 0.0017568100010976195, "global_step": 45832, "epoch": 385, "lr": 2.8797274093417392e-05} +{"train_loss": 0.0015290615847334266, "global_step": 45833, "epoch": 385, "lr": 2.8795267667485322e-05} +{"train_loss": 0.0006785673322156072, "global_step": 45834, "epoch": 385, "lr": 2.8793261283186453e-05} +{"train_loss": 0.0014026409480720758, "global_step": 45835, "epoch": 385, "lr": 2.879125494052475e-05} +{"train_loss": 0.000839437183458358, "global_step": 45836, "epoch": 385, "lr": 2.878924863950417e-05} +{"train_loss": 0.0013120074290782213, "global_step": 45837, "epoch": 385, "lr": 2.8787242380128616e-05} +{"train_loss": 0.0018896071705967188, "global_step": 45838, "epoch": 385, "lr": 2.8785236162402063e-05} +{"train_loss": 0.0005271697300486267, "global_step": 45839, "epoch": 385, "lr": 2.8783229986328415e-05} +{"train_loss": 0.0007117291097529233, "global_step": 45840, "epoch": 385, "lr": 2.8781223851911648e-05} +{"train_loss": 0.0021051019430160522, "global_step": 45841, "epoch": 385, "lr": 2.8779217759155665e-05} +{"train_loss": 0.0018891129875555634, "global_step": 45842, "epoch": 385, "lr": 2.8777211708064432e-05} +{"train_loss": 0.0009927855571731925, "global_step": 45843, "epoch": 385, "lr": 2.877520569864188e-05} +{"train_loss": 0.0007910907734185457, "global_step": 45844, "epoch": 385, "lr": 2.8773199730891925e-05} +{"train_loss": 0.00112605607137084, "global_step": 45845, "epoch": 385, "lr": 2.8771193804818547e-05} +{"train_loss": 0.0012611448764801025, "global_step": 45846, "epoch": 385, "lr": 2.8769187920425638e-05} +{"train_loss": 0.0010478897020220757, "global_step": 45847, "epoch": 385, "lr": 2.876718207771718e-05} +{"train_loss": 0.0018156261648982763, "global_step": 45848, "epoch": 385, "lr": 2.8765176276697076e-05} +{"train_loss": 0.0018505395855754614, "global_step": 45849, "epoch": 385, "lr": 2.8763170517369297e-05} +{"train_loss": 0.001268541207537055, "global_step": 45850, "epoch": 385, "lr": 2.8761164799737765e-05} +{"train_loss": 0.0006011365330778062, "global_step": 45851, "epoch": 385, "lr": 2.87591591238064e-05} +{"train_loss": 0.0011007071007043123, "global_step": 45852, "epoch": 385, "lr": 2.875715348957917e-05} +{"train_loss": 0.0015819290420040488, "global_step": 45853, "epoch": 385, "lr": 2.8755147897059987e-05} +{"train_loss": 0.0014691584510728717, "global_step": 45854, "epoch": 385, "lr": 2.8753142346252814e-05} +{"train_loss": 0.0009384349687024951, "global_step": 45855, "epoch": 385, "lr": 2.8751136837161573e-05} +{"train_loss": 0.0012962515465915203, "global_step": 45856, "epoch": 385, "lr": 2.8749131369790194e-05} +{"train_loss": 0.0008491835324093699, "global_step": 45857, "epoch": 385, "lr": 2.8747125944142645e-05} +{"train_loss": 0.0012369310716167092, "global_step": 45858, "epoch": 385, "lr": 2.8745120560222816e-05} +{"train_loss": 0.0011076226364821196, "global_step": 45859, "epoch": 385, "lr": 2.87431152180347e-05} +{"train_loss": 0.0011324102524667978, "global_step": 45860, "epoch": 385, "lr": 2.874110991758219e-05} +{"train_loss": 0.001458074082620442, "global_step": 45861, "epoch": 385, "lr": 2.8739104658869242e-05} +{"train_loss": 0.001142747700214386, "global_step": 45862, "epoch": 385, "lr": 2.8737099441899806e-05} +{"train_loss": 0.0017939142417162657, "global_step": 45863, "epoch": 385, "lr": 2.8735094266677775e-05} +{"train_loss": 0.0008428923320025206, "global_step": 45864, "epoch": 385, "lr": 2.8733089133207143e-05} +{"train_loss": 0.0011257906444370747, "global_step": 45865, "epoch": 385, "lr": 2.8731084041491797e-05} +{"train_loss": 0.00116686150431633, "global_step": 45866, "epoch": 385, "lr": 2.8729078991535706e-05} +{"train_loss": 0.000812687270808965, "global_step": 45867, "epoch": 385, "lr": 2.8727073983342782e-05} +{"train_loss": 0.001397434389218688, "global_step": 45868, "epoch": 385, "lr": 2.8725069016916995e-05} +{"train_loss": 0.0017232458340004086, "global_step": 45869, "epoch": 385, "lr": 2.8723064092262248e-05} +{"train_loss": 0.0014295057626441121, "global_step": 45870, "epoch": 385, "lr": 2.8721059209382485e-05} +{"train_loss": 0.0012170439586043358, "global_step": 45871, "epoch": 385, "lr": 2.8719054368281674e-05} +{"train_loss": 0.0015957505675032735, "global_step": 45872, "epoch": 385, "lr": 2.8717049568963693e-05} +{"train_loss": 0.002114900154992938, "global_step": 45873, "epoch": 385, "lr": 2.8715044811432545e-05} +{"train_loss": 0.0010808188235387206, "global_step": 45874, "epoch": 385, "lr": 2.8713040095692128e-05} +{"train_loss": 0.0014247640501707792, "global_step": 45875, "epoch": 385, "lr": 2.8711035421746367e-05} +{"train_loss": 0.001042541698552668, "global_step": 45876, "epoch": 385, "lr": 2.870903078959923e-05} +{"train_loss": 0.001459805411286652, "global_step": 45877, "epoch": 385, "lr": 2.8707026199254617e-05} +{"train_loss": 0.0011405409313738346, "global_step": 45878, "epoch": 385, "lr": 2.8705021650716502e-05} +{"train_loss": 0.0013318684650585055, "global_step": 45879, "epoch": 385, "lr": 2.8703017143988777e-05} +{"train_loss": 0.0011284102220088243, "global_step": 45880, "epoch": 385, "lr": 2.870101267907543e-05} +{"train_loss": 0.0012218211777508259, "global_step": 45881, "epoch": 385, "lr": 2.8699008255980363e-05} +{"train_loss": 0.0015473305247724056, "global_step": 45882, "epoch": 385, "lr": 2.8697003874707507e-05} +{"train_loss": 0.001499547273851931, "global_step": 45883, "epoch": 385, "lr": 2.8694999535260824e-05} +{"train_loss": 0.0005519564147107303, "global_step": 45884, "epoch": 385, "lr": 2.8692995237644205e-05} +{"train_loss": 0.0010779330041259527, "global_step": 45885, "epoch": 385, "lr": 2.8690990981861642e-05} +{"train_loss": 0.0019249129109084606, "global_step": 45886, "epoch": 385, "lr": 2.8688986767917025e-05} +{"train_loss": 0.0005961653077974916, "global_step": 45887, "epoch": 385, "lr": 2.8686982595814314e-05} +{"train_loss": 0.001130752032622695, "global_step": 45888, "epoch": 385, "lr": 2.8684978465557443e-05} +{"train_loss": 0.000615597702562809, "global_step": 45889, "epoch": 385, "lr": 2.8682974377150322e-05} +{"train_loss": 0.00184115138836205, "global_step": 45890, "epoch": 385, "lr": 2.8680970330596922e-05} +{"train_loss": 0.0012061927700415254, "global_step": 45891, "epoch": 385, "lr": 2.8678966325901135e-05} +{"train_loss": 0.0010167285799980164, "global_step": 45892, "epoch": 385, "lr": 2.8676962363066944e-05} +{"train_loss": 0.0013612140901386738, "global_step": 45893, "epoch": 385, "lr": 2.867495844209826e-05} +{"train_loss": 0.0011394548928365111, "global_step": 45894, "epoch": 385, "lr": 2.8672954562998994e-05} +{"train_loss": 0.0008118454716168344, "global_step": 45895, "epoch": 385, "lr": 2.8670950725773127e-05} +{"train_loss": 0.0009433922823518515, "global_step": 45896, "epoch": 385, "lr": 2.8668946930424545e-05} +{"train_loss": 0.0015665290411561728, "global_step": 45897, "epoch": 385, "lr": 2.8666943176957227e-05} +{"train_loss": 0.001329432358033955, "global_step": 45898, "epoch": 385, "lr": 2.8664939465375067e-05} +{"train_loss": 0.0015287442365661263, "global_step": 45899, "epoch": 385, "lr": 2.8662935795682044e-05} +{"train_loss": 0.0013915441231802106, "global_step": 45900, "epoch": 385, "lr": 2.8660932167882038e-05} +{"train_loss": 0.0018806513398885727, "global_step": 45901, "epoch": 385, "lr": 2.865892858197904e-05} +{"train_loss": 0.0016575866611674428, "global_step": 45902, "epoch": 385, "lr": 2.8656925037976934e-05} +{"train_loss": 0.0015104219783097506, "global_step": 45903, "epoch": 385, "lr": 2.8654921535879697e-05} +{"train_loss": 0.0015766515862196684, "global_step": 45904, "epoch": 385, "lr": 2.8652918075691214e-05} +{"train_loss": 0.002392888069152832, "global_step": 45905, "epoch": 385, "lr": 2.8650914657415473e-05} +{"train_loss": 0.0017849853029474616, "global_step": 45906, "epoch": 385, "lr": 2.8648911281056356e-05} +{"train_loss": 0.0009569915710017085, "global_step": 45907, "epoch": 385, "lr": 2.864690794661784e-05} +{"train_loss": 0.001050164457410574, "global_step": 45908, "epoch": 385, "lr": 2.864490465410382e-05} +{"train_loss": 0.0011366058606654406, "global_step": 45909, "epoch": 385, "lr": 2.8642901403518276e-05} +{"train_loss": 0.002955225994810462, "global_step": 45910, "epoch": 385, "lr": 2.8640898194865083e-05} +{"train_loss": 0.0012765158899128437, "global_step": 45911, "epoch": 385, "lr": 2.8638895028148234e-05} +{"train_loss": 0.0012893900275230408, "global_step": 45912, "epoch": 385, "lr": 2.8636891903371625e-05} +{"train_loss": 0.0017560985870659351, "global_step": 45913, "epoch": 385, "lr": 2.863488882053918e-05} +{"train_loss": 0.001073315623216331, "global_step": 45914, "epoch": 385, "lr": 2.8632885779654865e-05} +{"train_loss": 0.0012581527698785067, "global_step": 45915, "epoch": 385, "lr": 2.8630882780722578e-05} +{"train_loss": 0.001205637352541089, "global_step": 45916, "epoch": 385, "lr": 2.862887982374629e-05} +{"train_loss": 0.0008797836489975452, "global_step": 45917, "epoch": 385, "lr": 2.8626876908729895e-05} +{"train_loss": 0.0016590974992141128, "global_step": 45918, "epoch": 385, "lr": 2.8624874035677363e-05} +{"train_loss": 0.001124568865634501, "global_step": 45919, "epoch": 385, "lr": 2.8622871204592606e-05} +{"train_loss": 0.0017402502708137035, "global_step": 45920, "epoch": 385, "lr": 2.8620868415479535e-05} +{"train_loss": 0.0010667335009202361, "global_step": 45921, "epoch": 385, "lr": 2.8618865668342127e-05} +{"train_loss": 0.0016944410745054483, "global_step": 45922, "epoch": 385, "lr": 2.8616862963184278e-05} +{"train_loss": 0.001383433467708528, "global_step": 45923, "epoch": 385, "lr": 2.8614860300009942e-05} +{"train_loss": 0.001022490905597806, "global_step": 45924, "epoch": 385, "lr": 2.861285767882305e-05} +{"train_loss": 0.001711392542347312, "global_step": 45925, "epoch": 385, "lr": 2.8610855099627508e-05} +{"train_loss": 0.0015486942138522863, "global_step": 45926, "epoch": 385, "lr": 2.8608852562427284e-05} +{"train_loss": 0.001519393757916987, "global_step": 45927, "epoch": 385, "lr": 2.8606850067226276e-05} +{"train_loss": 0.0010867605451494455, "global_step": 45928, "epoch": 385, "lr": 2.860484761402845e-05} +{"train_loss": 0.000960384146310389, "global_step": 45929, "epoch": 385, "lr": 2.8602845202837702e-05} +{"train_loss": 0.001293217414058745, "global_step": 45930, "epoch": 385, "lr": 2.8600842833658003e-05} +{"train_loss": 0.0016618738882243633, "global_step": 45931, "epoch": 385, "lr": 2.859884050649324e-05} +{"train_loss": 0.001237866934388876, "global_step": 45932, "epoch": 385, "lr": 2.859683822134739e-05} +{"train_loss": 0.001309378059901798, "global_step": 45933, "epoch": 385, "lr": 2.8594835978224333e-05, "val_loss": 0.016287054866552353, "train_action_mse_error": 2.0000297809019685e-05} +{"train_loss": 0.0016495933523401618, "global_step": 45934, "epoch": 386, "lr": 2.859283377712806e-05} +{"train_loss": 0.0019290521740913391, "global_step": 45935, "epoch": 386, "lr": 2.859083161806244e-05} +{"train_loss": 0.000961112673394382, "global_step": 45936, "epoch": 386, "lr": 2.858882950103146e-05} +{"train_loss": 0.0021265174727886915, "global_step": 45937, "epoch": 386, "lr": 2.8586827426039008e-05} +{"train_loss": 0.002136983908712864, "global_step": 45938, "epoch": 386, "lr": 2.8584825393089054e-05} +{"train_loss": 0.0013797438004985452, "global_step": 45939, "epoch": 386, "lr": 2.8582823402185483e-05} +{"train_loss": 0.0008550668717361987, "global_step": 45940, "epoch": 386, "lr": 2.8580821453332274e-05} +{"train_loss": 0.001120269880630076, "global_step": 45941, "epoch": 386, "lr": 2.8578819546533308e-05} +{"train_loss": 0.0022215251810848713, "global_step": 45942, "epoch": 386, "lr": 2.8576817681792568e-05} +{"train_loss": 0.0016860481118783355, "global_step": 45943, "epoch": 386, "lr": 2.8574815859113952e-05} +{"train_loss": 0.0031021027825772762, "global_step": 45944, "epoch": 386, "lr": 2.8572814078501374e-05} +{"train_loss": 0.0009057606221176684, "global_step": 45945, "epoch": 386, "lr": 2.857081233995882e-05} +{"train_loss": 0.001788100809790194, "global_step": 45946, "epoch": 386, "lr": 2.856881064349015e-05} +{"train_loss": 0.0012437065597623587, "global_step": 45947, "epoch": 386, "lr": 2.8566808989099357e-05} +{"train_loss": 0.001624818192794919, "global_step": 45948, "epoch": 386, "lr": 2.8564807376790332e-05} +{"train_loss": 0.0018395853694528341, "global_step": 45949, "epoch": 386, "lr": 2.8562805806567026e-05} +{"train_loss": 0.0006131198606453836, "global_step": 45950, "epoch": 386, "lr": 2.8560804278433374e-05} +{"train_loss": 0.0018768219742923975, "global_step": 45951, "epoch": 386, "lr": 2.8558802792393258e-05} +{"train_loss": 0.0010023978538811207, "global_step": 45952, "epoch": 386, "lr": 2.855680134845067e-05} +{"train_loss": 0.00129900558385998, "global_step": 45953, "epoch": 386, "lr": 2.855479994660949e-05} +{"train_loss": 0.0017108864849433303, "global_step": 45954, "epoch": 386, "lr": 2.8552798586873693e-05} +{"train_loss": 0.0018924078904092312, "global_step": 45955, "epoch": 386, "lr": 2.8550797269247182e-05} +{"train_loss": 0.001484968583099544, "global_step": 45956, "epoch": 386, "lr": 2.8548795993733866e-05} +{"train_loss": 0.0008488172898069024, "global_step": 45957, "epoch": 386, "lr": 2.8546794760337725e-05} +{"train_loss": 0.0012449274072423577, "global_step": 45958, "epoch": 386, "lr": 2.8544793569062632e-05} +{"train_loss": 0.0017597494879737496, "global_step": 45959, "epoch": 386, "lr": 2.8542792419912567e-05} +{"train_loss": 0.0014772628201171756, "global_step": 45960, "epoch": 386, "lr": 2.8540791312891418e-05} +{"train_loss": 0.0013970129657536745, "global_step": 45961, "epoch": 386, "lr": 2.8538790248003154e-05} +{"train_loss": 0.0010599329834803939, "global_step": 45962, "epoch": 386, "lr": 2.8536789225251683e-05} +{"train_loss": 0.000882655440364033, "global_step": 45963, "epoch": 386, "lr": 2.853478824464091e-05} +{"train_loss": 0.0016118512721732259, "global_step": 45964, "epoch": 386, "lr": 2.8532787306174807e-05} +{"train_loss": 0.0009736783686093986, "global_step": 45965, "epoch": 386, "lr": 2.8530786409857264e-05} +{"train_loss": 0.0006823341827839613, "global_step": 45966, "epoch": 386, "lr": 2.8528785555692227e-05} +{"train_loss": 0.0010933666490018368, "global_step": 45967, "epoch": 386, "lr": 2.8526784743683648e-05} +{"train_loss": 0.0031628853175789118, "global_step": 45968, "epoch": 386, "lr": 2.852478397383541e-05} +{"train_loss": 0.0013931043213233352, "global_step": 45969, "epoch": 386, "lr": 2.8522783246151485e-05} +{"train_loss": 0.0013047036482021213, "global_step": 45970, "epoch": 386, "lr": 2.852078256063576e-05} +{"train_loss": 0.0009472492383792996, "global_step": 45971, "epoch": 386, "lr": 2.8518781917292213e-05} +{"train_loss": 0.0013927207328379154, "global_step": 45972, "epoch": 386, "lr": 2.8516781316124713e-05} +{"train_loss": 0.0017267965013161302, "global_step": 45973, "epoch": 386, "lr": 2.8514780757137238e-05} +{"train_loss": 0.0011405822588130832, "global_step": 45974, "epoch": 386, "lr": 2.8512780240333704e-05} +{"train_loss": 0.0014394602039828897, "global_step": 45975, "epoch": 386, "lr": 2.8510779765718e-05} +{"train_loss": 0.000897090882062912, "global_step": 45976, "epoch": 386, "lr": 2.8508779333294112e-05} +{"train_loss": 0.0019206827273592353, "global_step": 45977, "epoch": 386, "lr": 2.8506778943065913e-05} +{"train_loss": 0.002405781066045165, "global_step": 45978, "epoch": 386, "lr": 2.8504778595037384e-05} +{"train_loss": 0.0012818463146686554, "global_step": 45979, "epoch": 386, "lr": 2.85027782892124e-05} +{"train_loss": 0.0010903438087552786, "global_step": 45980, "epoch": 386, "lr": 2.8500778025594937e-05} +{"train_loss": 0.0009975011926144361, "global_step": 45981, "epoch": 386, "lr": 2.84987778041889e-05} +{"train_loss": 0.001623075921088457, "global_step": 45982, "epoch": 386, "lr": 2.8496777624998193e-05} +{"train_loss": 0.0009690250735729933, "global_step": 45983, "epoch": 386, "lr": 2.849477748802679e-05} +{"train_loss": 0.0009956809226423502, "global_step": 45984, "epoch": 386, "lr": 2.849277739327857e-05} +{"train_loss": 0.0033716512843966484, "global_step": 45985, "epoch": 386, "lr": 2.84907773407575e-05} +{"train_loss": 0.0007679651607759297, "global_step": 45986, "epoch": 386, "lr": 2.848877733046748e-05} +{"train_loss": 0.0015648171538487077, "global_step": 45987, "epoch": 386, "lr": 2.8486777362412466e-05} +{"train_loss": 0.00128992332611233, "global_step": 45988, "epoch": 386, "lr": 2.8484777436596366e-05} +{"train_loss": 0.001206464134156704, "global_step": 45989, "epoch": 386, "lr": 2.8482777553023083e-05} +{"train_loss": 0.0014294651336967945, "global_step": 45990, "epoch": 386, "lr": 2.848077771169659e-05} +{"train_loss": 0.0015605029184371233, "global_step": 45991, "epoch": 386, "lr": 2.8478777912620768e-05} +{"train_loss": 0.0015082239406183362, "global_step": 45992, "epoch": 386, "lr": 2.847677815579959e-05} +{"train_loss": 0.0014752245042473078, "global_step": 45993, "epoch": 386, "lr": 2.847477844123696e-05} +{"train_loss": 0.0021154480054974556, "global_step": 45994, "epoch": 386, "lr": 2.847277876893678e-05} +{"train_loss": 0.001367168384604156, "global_step": 45995, "epoch": 386, "lr": 2.8470779138903013e-05} +{"train_loss": 0.001320241834037006, "global_step": 45996, "epoch": 386, "lr": 2.846877955113956e-05} +{"train_loss": 0.0017750449478626251, "global_step": 45997, "epoch": 386, "lr": 2.846678000565038e-05} +{"train_loss": 0.0011749172117561102, "global_step": 45998, "epoch": 386, "lr": 2.846478050243935e-05} +{"train_loss": 0.001357631990686059, "global_step": 45999, "epoch": 386, "lr": 2.8462781041510445e-05} +{"train_loss": 0.0006360210245475173, "global_step": 46000, "epoch": 386, "lr": 2.846078162286755e-05} +{"train_loss": 0.000985791441053152, "global_step": 46001, "epoch": 386, "lr": 2.8458782246514625e-05} +{"train_loss": 0.0011195105034857988, "global_step": 46002, "epoch": 386, "lr": 2.8456782912455566e-05} +{"train_loss": 0.0011708432575687766, "global_step": 46003, "epoch": 386, "lr": 2.845478362069431e-05} +{"train_loss": 0.0010339337168261409, "global_step": 46004, "epoch": 386, "lr": 2.8452784371234804e-05} +{"train_loss": 0.0021628569811582565, "global_step": 46005, "epoch": 386, "lr": 2.845078516408093e-05} +{"train_loss": 0.0013010975671932101, "global_step": 46006, "epoch": 386, "lr": 2.844878599923666e-05} +{"train_loss": 0.0014022474642843008, "global_step": 46007, "epoch": 386, "lr": 2.84467868767059e-05} +{"train_loss": 0.0019560533110052347, "global_step": 46008, "epoch": 386, "lr": 2.8444787796492545e-05} +{"train_loss": 0.001307453727349639, "global_step": 46009, "epoch": 386, "lr": 2.8442788758600568e-05} +{"train_loss": 0.0010762920137494802, "global_step": 46010, "epoch": 386, "lr": 2.844078976303386e-05} +{"train_loss": 0.001773548312485218, "global_step": 46011, "epoch": 386, "lr": 2.8438790809796368e-05} +{"train_loss": 0.0012535880086943507, "global_step": 46012, "epoch": 386, "lr": 2.843679189889201e-05} +{"train_loss": 0.0011927428422495723, "global_step": 46013, "epoch": 386, "lr": 2.8434793030324693e-05} +{"train_loss": 0.0010037076426669955, "global_step": 46014, "epoch": 386, "lr": 2.843279420409837e-05} +{"train_loss": 0.0005605891346931458, "global_step": 46015, "epoch": 386, "lr": 2.8430795420216933e-05} +{"train_loss": 0.0006903865141794086, "global_step": 46016, "epoch": 386, "lr": 2.8428796678684343e-05} +{"train_loss": 0.0018417087849229574, "global_step": 46017, "epoch": 386, "lr": 2.8426797979504488e-05} +{"train_loss": 0.00128649128600955, "global_step": 46018, "epoch": 386, "lr": 2.8424799322681328e-05} +{"train_loss": 0.0010152984177693725, "global_step": 46019, "epoch": 386, "lr": 2.842280070821877e-05} +{"train_loss": 0.0009814093355089426, "global_step": 46020, "epoch": 386, "lr": 2.842080213612072e-05} +{"train_loss": 0.0022518502082675695, "global_step": 46021, "epoch": 386, "lr": 2.8418803606391142e-05} +{"train_loss": 0.0007903790683485568, "global_step": 46022, "epoch": 386, "lr": 2.8416805119033912e-05} +{"train_loss": 0.0008860750240273774, "global_step": 46023, "epoch": 386, "lr": 2.8414806674053e-05} +{"train_loss": 0.0014240016462281346, "global_step": 46024, "epoch": 386, "lr": 2.8412808271452313e-05} +{"train_loss": 0.001052418607287109, "global_step": 46025, "epoch": 386, "lr": 2.8410809911235748e-05} +{"train_loss": 0.0011139468988403678, "global_step": 46026, "epoch": 386, "lr": 2.840881159340727e-05} +{"train_loss": 0.001335912849754095, "global_step": 46027, "epoch": 386, "lr": 2.840681331797077e-05} +{"train_loss": 0.0009404767188243568, "global_step": 46028, "epoch": 386, "lr": 2.84048150849302e-05} +{"train_loss": 0.0009993668645620346, "global_step": 46029, "epoch": 386, "lr": 2.8402816894289446e-05} +{"train_loss": 0.0009129618410952389, "global_step": 46030, "epoch": 386, "lr": 2.8400818746052478e-05} +{"train_loss": 0.001376160653308034, "global_step": 46031, "epoch": 386, "lr": 2.8398820640223173e-05} +{"train_loss": 0.0022468818351626396, "global_step": 46032, "epoch": 386, "lr": 2.8396822576805492e-05} +{"train_loss": 0.0008226142381317914, "global_step": 46033, "epoch": 386, "lr": 2.8394824555803335e-05} +{"train_loss": 0.0014174685347825289, "global_step": 46034, "epoch": 386, "lr": 2.839282657722064e-05} +{"train_loss": 0.0008921984117478132, "global_step": 46035, "epoch": 386, "lr": 2.8390828641061307e-05} +{"train_loss": 0.000786457268986851, "global_step": 46036, "epoch": 386, "lr": 2.8388830747329286e-05} +{"train_loss": 0.0021941454615443945, "global_step": 46037, "epoch": 386, "lr": 2.8386832896028475e-05} +{"train_loss": 0.0006086633657105267, "global_step": 46038, "epoch": 386, "lr": 2.8384835087162826e-05} +{"train_loss": 0.0009998730383813381, "global_step": 46039, "epoch": 386, "lr": 2.8382837320736222e-05} +{"train_loss": 0.0007185994763858616, "global_step": 46040, "epoch": 386, "lr": 2.838083959675263e-05} +{"train_loss": 0.0016376689309254289, "global_step": 46041, "epoch": 386, "lr": 2.8378841915215927e-05} +{"train_loss": 0.0009468722273595631, "global_step": 46042, "epoch": 386, "lr": 2.8376844276130084e-05} +{"train_loss": 0.0012490748194977641, "global_step": 46043, "epoch": 386, "lr": 2.837484667949899e-05} +{"train_loss": 0.0020216903649270535, "global_step": 46044, "epoch": 386, "lr": 2.8372849125326562e-05} +{"train_loss": 0.0012830693740397692, "global_step": 46045, "epoch": 386, "lr": 2.8370851613616744e-05} +{"train_loss": 0.000914713426027447, "global_step": 46046, "epoch": 386, "lr": 2.8368854144373435e-05} +{"train_loss": 0.0012225988321006298, "global_step": 46047, "epoch": 386, "lr": 2.8366856717600588e-05} +{"train_loss": 0.0014325230149552226, "global_step": 46048, "epoch": 386, "lr": 2.836485933330209e-05} +{"train_loss": 0.001649100100621581, "global_step": 46049, "epoch": 386, "lr": 2.83628619914819e-05} +{"train_loss": 0.0028926944360136986, "global_step": 46050, "epoch": 386, "lr": 2.8360864692143913e-05} +{"train_loss": 0.0010904459049925208, "global_step": 46051, "epoch": 386, "lr": 2.8358867435292034e-05} +{"train_loss": 0.0013847408548169652, "global_step": 46052, "epoch": 386, "lr": 2.8356870220930236e-05, "val_loss": 0.03481242433190346} +{"train_loss": 0.0007954550092108548, "global_step": 46053, "epoch": 387, "lr": 2.8354873049062393e-05} +{"train_loss": 0.0013428775127977133, "global_step": 46054, "epoch": 387, "lr": 2.8352875919692456e-05} +{"train_loss": 0.00153507967479527, "global_step": 46055, "epoch": 387, "lr": 2.835087883282431e-05} +{"train_loss": 0.002044150372967124, "global_step": 46056, "epoch": 387, "lr": 2.8348881788461934e-05} +{"train_loss": 0.0020695629063993692, "global_step": 46057, "epoch": 387, "lr": 2.8346884786609206e-05} +{"train_loss": 0.0017879989463835955, "global_step": 46058, "epoch": 387, "lr": 2.834488782727004e-05} +{"train_loss": 0.0012958361767232418, "global_step": 46059, "epoch": 387, "lr": 2.8342890910448395e-05} +{"train_loss": 0.0018640650669112802, "global_step": 46060, "epoch": 387, "lr": 2.8340894036148146e-05} +{"train_loss": 0.0009494445403106511, "global_step": 46061, "epoch": 387, "lr": 2.833889720437326e-05} +{"train_loss": 0.0011603025486692786, "global_step": 46062, "epoch": 387, "lr": 2.8336900415127632e-05} +{"train_loss": 0.0011879336088895798, "global_step": 46063, "epoch": 387, "lr": 2.833490366841517e-05} +{"train_loss": 0.0005764664965681732, "global_step": 46064, "epoch": 387, "lr": 2.8332906964239804e-05} +{"train_loss": 0.0013900522608309984, "global_step": 46065, "epoch": 387, "lr": 2.8330910302605486e-05} +{"train_loss": 0.0021201421041041613, "global_step": 46066, "epoch": 387, "lr": 2.832891368351609e-05} +{"train_loss": 0.0018752174219116569, "global_step": 46067, "epoch": 387, "lr": 2.8326917106975577e-05} +{"train_loss": 0.0007744812173768878, "global_step": 46068, "epoch": 387, "lr": 2.8324920572987823e-05} +{"train_loss": 0.0019148916471749544, "global_step": 46069, "epoch": 387, "lr": 2.8322924081556796e-05} +{"train_loss": 0.001111163990572095, "global_step": 46070, "epoch": 387, "lr": 2.8320927632686367e-05} +{"train_loss": 0.0015444394666701555, "global_step": 46071, "epoch": 387, "lr": 2.8318931226380508e-05} +{"train_loss": 0.0017032874748110771, "global_step": 46072, "epoch": 387, "lr": 2.8316934862643086e-05} +{"train_loss": 0.0025247458834201097, "global_step": 46073, "epoch": 387, "lr": 2.8314938541478066e-05} +{"train_loss": 0.001799894031137228, "global_step": 46074, "epoch": 387, "lr": 2.8312942262889353e-05} +{"train_loss": 0.0008797029731795192, "global_step": 46075, "epoch": 387, "lr": 2.8310946026880837e-05} +{"train_loss": 0.0016484434017911553, "global_step": 46076, "epoch": 387, "lr": 2.8308949833456476e-05} +{"train_loss": 0.0025131478905677795, "global_step": 46077, "epoch": 387, "lr": 2.8306953682620162e-05} +{"train_loss": 0.0009016942931339145, "global_step": 46078, "epoch": 387, "lr": 2.830495757437584e-05} +{"train_loss": 0.0010109870927408338, "global_step": 46079, "epoch": 387, "lr": 2.83029615087274e-05} +{"train_loss": 0.0010989378206431866, "global_step": 46080, "epoch": 387, "lr": 2.83009654856788e-05} +{"train_loss": 0.001313411514274776, "global_step": 46081, "epoch": 387, "lr": 2.829896950523393e-05} +{"train_loss": 0.0012014632811769843, "global_step": 46082, "epoch": 387, "lr": 2.8296973567396702e-05} +{"train_loss": 0.0012599499896168709, "global_step": 46083, "epoch": 387, "lr": 2.8294977672171062e-05} +{"train_loss": 0.0013483582297340035, "global_step": 46084, "epoch": 387, "lr": 2.8292981819560894e-05} +{"train_loss": 0.0016443321947008371, "global_step": 46085, "epoch": 387, "lr": 2.8290986009570164e-05} +{"train_loss": 0.0013433725107461214, "global_step": 46086, "epoch": 387, "lr": 2.828899024220274e-05} +{"train_loss": 0.0012716627679765224, "global_step": 46087, "epoch": 387, "lr": 2.8286994517462584e-05} +{"train_loss": 0.0007119688671082258, "global_step": 46088, "epoch": 387, "lr": 2.8284998835353592e-05} +{"train_loss": 0.0013369062216952443, "global_step": 46089, "epoch": 387, "lr": 2.8283003195879664e-05} +{"train_loss": 0.001956098945811391, "global_step": 46090, "epoch": 387, "lr": 2.828100759904476e-05} +{"train_loss": 0.0010494025191292167, "global_step": 46091, "epoch": 387, "lr": 2.8279012044852764e-05} +{"train_loss": 0.0009298520744778216, "global_step": 46092, "epoch": 387, "lr": 2.827701653330762e-05} +{"train_loss": 0.0022509191185235977, "global_step": 46093, "epoch": 387, "lr": 2.8275021064413244e-05} +{"train_loss": 0.0009914581896737218, "global_step": 46094, "epoch": 387, "lr": 2.827302563817351e-05} +{"train_loss": 0.0017354560550302267, "global_step": 46095, "epoch": 387, "lr": 2.8271030254592394e-05} +{"train_loss": 0.0007578733493573964, "global_step": 46096, "epoch": 387, "lr": 2.826903491367377e-05} +{"train_loss": 0.0018124185735359788, "global_step": 46097, "epoch": 387, "lr": 2.8267039615421592e-05} +{"train_loss": 0.0014171188231557608, "global_step": 46098, "epoch": 387, "lr": 2.8265044359839743e-05} +{"train_loss": 0.0013208857271820307, "global_step": 46099, "epoch": 387, "lr": 2.8263049146932153e-05} +{"train_loss": 0.000978442607447505, "global_step": 46100, "epoch": 387, "lr": 2.8261053976702766e-05} +{"train_loss": 0.0013851984404027462, "global_step": 46101, "epoch": 387, "lr": 2.8259058849155463e-05} +{"train_loss": 0.0012463736347854137, "global_step": 46102, "epoch": 387, "lr": 2.825706376429419e-05} +{"train_loss": 0.000888662994839251, "global_step": 46103, "epoch": 387, "lr": 2.8255068722122824e-05} +{"train_loss": 0.0006123721832409501, "global_step": 46104, "epoch": 387, "lr": 2.825307372264533e-05} +{"train_loss": 0.0010573607869446278, "global_step": 46105, "epoch": 387, "lr": 2.825107876586559e-05} +{"train_loss": 0.0011128471232950687, "global_step": 46106, "epoch": 387, "lr": 2.8249083851787544e-05} +{"train_loss": 0.0014677444705739617, "global_step": 46107, "epoch": 387, "lr": 2.8247088980415103e-05} +{"train_loss": 0.0010113579919561744, "global_step": 46108, "epoch": 387, "lr": 2.824509415175216e-05} +{"train_loss": 0.0007349043735302985, "global_step": 46109, "epoch": 387, "lr": 2.8243099365802665e-05} +{"train_loss": 0.0011239952873438597, "global_step": 46110, "epoch": 387, "lr": 2.82411046225705e-05} +{"train_loss": 0.0015017802361398935, "global_step": 46111, "epoch": 387, "lr": 2.8239109922059633e-05} +{"train_loss": 0.0009652451262809336, "global_step": 46112, "epoch": 387, "lr": 2.823711526427394e-05} +{"train_loss": 0.0011822462547570467, "global_step": 46113, "epoch": 387, "lr": 2.8235120649217328e-05} +{"train_loss": 0.0007045036763884127, "global_step": 46114, "epoch": 387, "lr": 2.8233126076893746e-05} +{"train_loss": 0.0012217821786180139, "global_step": 46115, "epoch": 387, "lr": 2.8231131547307082e-05} +{"train_loss": 0.0011649446096271276, "global_step": 46116, "epoch": 387, "lr": 2.8229137060461285e-05} +{"train_loss": 0.0009540213504806161, "global_step": 46117, "epoch": 387, "lr": 2.8227142616360225e-05} +{"train_loss": 0.001399839879013598, "global_step": 46118, "epoch": 387, "lr": 2.8225148215007875e-05} +{"train_loss": 0.000927840534131974, "global_step": 46119, "epoch": 387, "lr": 2.8223153856408114e-05} +{"train_loss": 0.00094851094763726, "global_step": 46120, "epoch": 387, "lr": 2.8221159540564844e-05} +{"train_loss": 0.0009033691021613777, "global_step": 46121, "epoch": 387, "lr": 2.8219165267482017e-05} +{"train_loss": 0.001123170368373394, "global_step": 46122, "epoch": 387, "lr": 2.821717103716352e-05} +{"train_loss": 0.0009020509896799922, "global_step": 46123, "epoch": 387, "lr": 2.8215176849613296e-05} +{"train_loss": 0.0008463466074317694, "global_step": 46124, "epoch": 387, "lr": 2.8213182704835228e-05} +{"train_loss": 0.001085661700926721, "global_step": 46125, "epoch": 387, "lr": 2.821118860283326e-05} +{"train_loss": 0.0011802901281043887, "global_step": 46126, "epoch": 387, "lr": 2.8209194543611306e-05} +{"train_loss": 0.0014699694002047181, "global_step": 46127, "epoch": 387, "lr": 2.8207200527173245e-05} +{"train_loss": 0.0009027309715747833, "global_step": 46128, "epoch": 387, "lr": 2.8205206553523033e-05} +{"train_loss": 0.0016711389180272818, "global_step": 46129, "epoch": 387, "lr": 2.8203212622664556e-05} +{"train_loss": 0.0011931932531297207, "global_step": 46130, "epoch": 387, "lr": 2.8201218734601764e-05} +{"train_loss": 0.0010179899400100112, "global_step": 46131, "epoch": 387, "lr": 2.8199224889338528e-05} +{"train_loss": 0.0005028542364016175, "global_step": 46132, "epoch": 387, "lr": 2.81972310868788e-05} +{"train_loss": 0.0007624648860655725, "global_step": 46133, "epoch": 387, "lr": 2.8195237327226465e-05} +{"train_loss": 0.0013955616159364581, "global_step": 46134, "epoch": 387, "lr": 2.819324361038545e-05} +{"train_loss": 0.0011589108034968376, "global_step": 46135, "epoch": 387, "lr": 2.8191249936359693e-05} +{"train_loss": 0.001517936703749001, "global_step": 46136, "epoch": 387, "lr": 2.8189256305153066e-05} +{"train_loss": 0.0012813422363251448, "global_step": 46137, "epoch": 387, "lr": 2.8187262716769525e-05} +{"train_loss": 0.0007780054002068937, "global_step": 46138, "epoch": 387, "lr": 2.818526917121296e-05} +{"train_loss": 0.0020971116609871387, "global_step": 46139, "epoch": 387, "lr": 2.818327566848727e-05} +{"train_loss": 0.0005714696599170566, "global_step": 46140, "epoch": 387, "lr": 2.8181282208596403e-05} +{"train_loss": 0.000883526518009603, "global_step": 46141, "epoch": 387, "lr": 2.8179288791544246e-05} +{"train_loss": 0.0014912837650626898, "global_step": 46142, "epoch": 387, "lr": 2.8177295417334744e-05} +{"train_loss": 0.001957186032086611, "global_step": 46143, "epoch": 387, "lr": 2.8175302085971787e-05} +{"train_loss": 0.0005815745680592954, "global_step": 46144, "epoch": 387, "lr": 2.8173308797459275e-05} +{"train_loss": 0.0009199349442496896, "global_step": 46145, "epoch": 387, "lr": 2.817131555180116e-05} +{"train_loss": 0.0012482814490795135, "global_step": 46146, "epoch": 387, "lr": 2.8169322349001303e-05} +{"train_loss": 0.0007330222288146615, "global_step": 46147, "epoch": 387, "lr": 2.8167329189063686e-05} +{"train_loss": 0.0016585191478952765, "global_step": 46148, "epoch": 387, "lr": 2.8165336071992154e-05} +{"train_loss": 0.0013113400200381875, "global_step": 46149, "epoch": 387, "lr": 2.8163342997790677e-05} +{"train_loss": 0.0008552903309464455, "global_step": 46150, "epoch": 387, "lr": 2.8161349966463148e-05} +{"train_loss": 0.0016040061600506306, "global_step": 46151, "epoch": 387, "lr": 2.8159356978013446e-05} +{"train_loss": 0.0008072873461060226, "global_step": 46152, "epoch": 387, "lr": 2.8157364032445537e-05} +{"train_loss": 0.0008280647452920675, "global_step": 46153, "epoch": 387, "lr": 2.815537112976329e-05} +{"train_loss": 0.0016416755970567465, "global_step": 46154, "epoch": 387, "lr": 2.8153378269970658e-05} +{"train_loss": 0.0011804833775386214, "global_step": 46155, "epoch": 387, "lr": 2.8151385453071515e-05} +{"train_loss": 0.0013933652080595493, "global_step": 46156, "epoch": 387, "lr": 2.8149392679069807e-05} +{"train_loss": 0.0013607216533273458, "global_step": 46157, "epoch": 387, "lr": 2.8147399947969444e-05} +{"train_loss": 0.000915205106139183, "global_step": 46158, "epoch": 387, "lr": 2.814540725977429e-05} +{"train_loss": 0.001263309270143509, "global_step": 46159, "epoch": 387, "lr": 2.814341461448833e-05} +{"train_loss": 0.0005912237102165818, "global_step": 46160, "epoch": 387, "lr": 2.8141422012115415e-05} +{"train_loss": 0.0013279885752126575, "global_step": 46161, "epoch": 387, "lr": 2.81394294526595e-05} +{"train_loss": 0.0011651529930531979, "global_step": 46162, "epoch": 387, "lr": 2.813743693612446e-05} +{"train_loss": 0.0014829945284873247, "global_step": 46163, "epoch": 387, "lr": 2.813544446251425e-05} +{"train_loss": 0.001038457965478301, "global_step": 46164, "epoch": 387, "lr": 2.8133452031832734e-05} +{"train_loss": 0.0013596474891528487, "global_step": 46165, "epoch": 387, "lr": 2.8131459644083875e-05} +{"train_loss": 0.0008544460870325565, "global_step": 46166, "epoch": 387, "lr": 2.8129467299271535e-05} +{"train_loss": 0.0011040946701541543, "global_step": 46167, "epoch": 387, "lr": 2.8127474997399673e-05} +{"train_loss": 0.0014792436268180609, "global_step": 46168, "epoch": 387, "lr": 2.8125482738472154e-05} +{"train_loss": 0.001369285280816257, "global_step": 46169, "epoch": 387, "lr": 2.812349052249293e-05} +{"train_loss": 0.000692686764523387, "global_step": 46170, "epoch": 387, "lr": 2.812149834946588e-05} +{"train_loss": 0.001248086563961095, "global_step": 46171, "epoch": 387, "lr": 2.811950621939494e-05, "val_loss": 0.023310013115406036} +{"train_loss": 0.0008716767770238221, "global_step": 46172, "epoch": 388, "lr": 2.8117514132284007e-05} +{"train_loss": 0.0011335861636325717, "global_step": 46173, "epoch": 388, "lr": 2.811552208813701e-05} +{"train_loss": 0.0008650186937302351, "global_step": 46174, "epoch": 388, "lr": 2.811353008695783e-05} +{"train_loss": 0.0013640220277011395, "global_step": 46175, "epoch": 388, "lr": 2.8111538128750415e-05} +{"train_loss": 0.0007953752065077424, "global_step": 46176, "epoch": 388, "lr": 2.810954621351865e-05} +{"train_loss": 0.0007945982506498694, "global_step": 46177, "epoch": 388, "lr": 2.810755434126644e-05} +{"train_loss": 0.0009745999705046415, "global_step": 46178, "epoch": 388, "lr": 2.8105562511997725e-05} +{"train_loss": 0.0009718486107885838, "global_step": 46179, "epoch": 388, "lr": 2.8103570725716377e-05} +{"train_loss": 0.0007879135082475841, "global_step": 46180, "epoch": 388, "lr": 2.810157898242635e-05} +{"train_loss": 0.0013314846437424421, "global_step": 46181, "epoch": 388, "lr": 2.8099587282131535e-05} +{"train_loss": 0.001116987899877131, "global_step": 46182, "epoch": 388, "lr": 2.8097595624835822e-05} +{"train_loss": 0.0011352605652064085, "global_step": 46183, "epoch": 388, "lr": 2.809560401054315e-05} +{"train_loss": 0.0014779106713831425, "global_step": 46184, "epoch": 388, "lr": 2.809361243925741e-05} +{"train_loss": 0.0013905703090131283, "global_step": 46185, "epoch": 388, "lr": 2.809162091098254e-05} +{"train_loss": 0.0015388935571536422, "global_step": 46186, "epoch": 388, "lr": 2.8089629425722414e-05} +{"train_loss": 0.0017083442071452737, "global_step": 46187, "epoch": 388, "lr": 2.8087637983480973e-05} +{"train_loss": 0.0014064384158700705, "global_step": 46188, "epoch": 388, "lr": 2.808564658426212e-05} +{"train_loss": 0.0007596194627694786, "global_step": 46189, "epoch": 388, "lr": 2.8083655228069737e-05} +{"train_loss": 0.0007811000104993582, "global_step": 46190, "epoch": 388, "lr": 2.8081663914907776e-05} +{"train_loss": 0.0012405496090650558, "global_step": 46191, "epoch": 388, "lr": 2.8079672644780102e-05} +{"train_loss": 0.0010912547586485744, "global_step": 46192, "epoch": 388, "lr": 2.807768141769067e-05} +{"train_loss": 0.0009676741319708526, "global_step": 46193, "epoch": 388, "lr": 2.8075690233643355e-05} +{"train_loss": 0.0008255193242803216, "global_step": 46194, "epoch": 388, "lr": 2.8073699092642093e-05} +{"train_loss": 0.001507693319581449, "global_step": 46195, "epoch": 388, "lr": 2.8071707994690783e-05} +{"train_loss": 0.0004616779333446175, "global_step": 46196, "epoch": 388, "lr": 2.806971693979331e-05} +{"train_loss": 0.0011875929776579142, "global_step": 46197, "epoch": 388, "lr": 2.8067725927953604e-05} +{"train_loss": 0.0006205538520589471, "global_step": 46198, "epoch": 388, "lr": 2.8065734959175597e-05} +{"train_loss": 0.0012825559824705124, "global_step": 46199, "epoch": 388, "lr": 2.806374403346316e-05} +{"train_loss": 0.0012701157247647643, "global_step": 46200, "epoch": 388, "lr": 2.8061753150820235e-05} +{"train_loss": 0.0012326629366725683, "global_step": 46201, "epoch": 388, "lr": 2.805976231125069e-05} +{"train_loss": 0.001498393015936017, "global_step": 46202, "epoch": 388, "lr": 2.8057771514758478e-05} +{"train_loss": 0.0005776480538770556, "global_step": 46203, "epoch": 388, "lr": 2.8055780761347472e-05} +{"train_loss": 0.0009146721567958593, "global_step": 46204, "epoch": 388, "lr": 2.8053790051021617e-05} +{"train_loss": 0.0007383549818769097, "global_step": 46205, "epoch": 388, "lr": 2.8051799383784782e-05} +{"train_loss": 0.0011753980070352554, "global_step": 46206, "epoch": 388, "lr": 2.8049808759640905e-05} +{"train_loss": 0.0008295673178508878, "global_step": 46207, "epoch": 388, "lr": 2.8047818178593887e-05} +{"train_loss": 0.0008329841075465083, "global_step": 46208, "epoch": 388, "lr": 2.8045827640647616e-05} +{"train_loss": 0.000833844009321183, "global_step": 46209, "epoch": 388, "lr": 2.804383714580604e-05} +{"train_loss": 0.0006830845377407968, "global_step": 46210, "epoch": 388, "lr": 2.8041846694073016e-05} +{"train_loss": 0.0012712436728179455, "global_step": 46211, "epoch": 388, "lr": 2.8039856285452504e-05} +{"train_loss": 0.0015709473518654704, "global_step": 46212, "epoch": 388, "lr": 2.803786591994839e-05} +{"train_loss": 0.0010270599741488695, "global_step": 46213, "epoch": 388, "lr": 2.8035875597564555e-05} +{"train_loss": 0.0006595480372197926, "global_step": 46214, "epoch": 388, "lr": 2.8033885318304954e-05} +{"train_loss": 0.0014762565260753036, "global_step": 46215, "epoch": 388, "lr": 2.8031895082173453e-05} +{"train_loss": 0.0007875363808125257, "global_step": 46216, "epoch": 388, "lr": 2.8029904889173997e-05} +{"train_loss": 0.0010361610911786556, "global_step": 46217, "epoch": 388, "lr": 2.8027914739310456e-05} +{"train_loss": 0.001171630690805614, "global_step": 46218, "epoch": 388, "lr": 2.8025924632586788e-05} +{"train_loss": 0.001120124477893114, "global_step": 46219, "epoch": 388, "lr": 2.8023934569006855e-05} +{"train_loss": 0.0011680450988933444, "global_step": 46220, "epoch": 388, "lr": 2.8021944548574563e-05} +{"train_loss": 0.0011505134170874953, "global_step": 46221, "epoch": 388, "lr": 2.8019954571293853e-05} +{"train_loss": 0.0012320404639467597, "global_step": 46222, "epoch": 388, "lr": 2.8017964637168605e-05} +{"train_loss": 0.0021511127706617117, "global_step": 46223, "epoch": 388, "lr": 2.8015974746202745e-05} +{"train_loss": 0.0015051134396344423, "global_step": 46224, "epoch": 388, "lr": 2.801398489840015e-05} +{"train_loss": 0.001189664239063859, "global_step": 46225, "epoch": 388, "lr": 2.8011995093764764e-05} +{"train_loss": 0.001328450976870954, "global_step": 46226, "epoch": 388, "lr": 2.8010005332300483e-05} +{"train_loss": 0.0013028635876253247, "global_step": 46227, "epoch": 388, "lr": 2.8008015614011186e-05} +{"train_loss": 0.002310653915628791, "global_step": 46228, "epoch": 388, "lr": 2.8006025938900813e-05} +{"train_loss": 0.0009240367216989398, "global_step": 46229, "epoch": 388, "lr": 2.8004036306973248e-05} +{"train_loss": 0.0006967333029024303, "global_step": 46230, "epoch": 388, "lr": 2.8002046718232426e-05} +{"train_loss": 0.0008494382491335273, "global_step": 46231, "epoch": 388, "lr": 2.8000057172682214e-05} +{"train_loss": 0.0007520161452703178, "global_step": 46232, "epoch": 388, "lr": 2.7998067670326545e-05} +{"train_loss": 0.0010295948013663292, "global_step": 46233, "epoch": 388, "lr": 2.799607821116933e-05} +{"train_loss": 0.0008879996603354812, "global_step": 46234, "epoch": 388, "lr": 2.7994088795214447e-05} +{"train_loss": 0.0010060458444058895, "global_step": 46235, "epoch": 388, "lr": 2.7992099422465844e-05} +{"train_loss": 0.0018166981171816587, "global_step": 46236, "epoch": 388, "lr": 2.799011009292738e-05} +{"train_loss": 0.0015725106932222843, "global_step": 46237, "epoch": 388, "lr": 2.7988120806603003e-05} +{"train_loss": 0.0014529747422784567, "global_step": 46238, "epoch": 388, "lr": 2.7986131563496597e-05} +{"train_loss": 0.0009729210869409144, "global_step": 46239, "epoch": 388, "lr": 2.7984142363612054e-05} +{"train_loss": 0.0014148843474686146, "global_step": 46240, "epoch": 388, "lr": 2.7982153206953316e-05} +{"train_loss": 0.0011101977434009314, "global_step": 46241, "epoch": 388, "lr": 2.798016409352424e-05} +{"train_loss": 0.0015701391967013478, "global_step": 46242, "epoch": 388, "lr": 2.797817502332879e-05} +{"train_loss": 0.0012947979848831892, "global_step": 46243, "epoch": 388, "lr": 2.797618599637082e-05} +{"train_loss": 0.0007795608835294843, "global_step": 46244, "epoch": 388, "lr": 2.7974197012654268e-05} +{"train_loss": 0.000897117133717984, "global_step": 46245, "epoch": 388, "lr": 2.7972208072183024e-05} +{"train_loss": 0.0013393920380622149, "global_step": 46246, "epoch": 388, "lr": 2.7970219174960988e-05} +{"train_loss": 0.0018678326159715652, "global_step": 46247, "epoch": 388, "lr": 2.796823032099209e-05} +{"train_loss": 0.0009843638399615884, "global_step": 46248, "epoch": 388, "lr": 2.7966241510280195e-05} +{"train_loss": 0.000928058463614434, "global_step": 46249, "epoch": 388, "lr": 2.796425274282925e-05} +{"train_loss": 0.0008230559760704637, "global_step": 46250, "epoch": 388, "lr": 2.7962264018643148e-05} +{"train_loss": 0.0009047306375578046, "global_step": 46251, "epoch": 388, "lr": 2.7960275337725757e-05} +{"train_loss": 0.0007781271706335247, "global_step": 46252, "epoch": 388, "lr": 2.7958286700081033e-05} +{"train_loss": 0.002000529319047928, "global_step": 46253, "epoch": 388, "lr": 2.7956298105712842e-05} +{"train_loss": 0.001258639502339065, "global_step": 46254, "epoch": 388, "lr": 2.7954309554625118e-05} +{"train_loss": 0.0013432663399726152, "global_step": 46255, "epoch": 388, "lr": 2.795232104682174e-05} +{"train_loss": 0.0014274839777499437, "global_step": 46256, "epoch": 388, "lr": 2.7950332582306637e-05} +{"train_loss": 0.0014756562886759639, "global_step": 46257, "epoch": 388, "lr": 2.7948344161083706e-05} +{"train_loss": 0.001410653698258102, "global_step": 46258, "epoch": 388, "lr": 2.7946355783156818e-05} +{"train_loss": 0.0007739348220638931, "global_step": 46259, "epoch": 388, "lr": 2.7944367448529935e-05} +{"train_loss": 0.0006269158329814672, "global_step": 46260, "epoch": 388, "lr": 2.7942379157206904e-05} +{"train_loss": 0.0010875051375478506, "global_step": 46261, "epoch": 388, "lr": 2.794039090919167e-05} +{"train_loss": 0.0011640503071248531, "global_step": 46262, "epoch": 388, "lr": 2.793840270448811e-05} +{"train_loss": 0.0018853596411645412, "global_step": 46263, "epoch": 388, "lr": 2.793641454310016e-05} +{"train_loss": 0.0011426870478317142, "global_step": 46264, "epoch": 388, "lr": 2.793442642503168e-05} +{"train_loss": 0.0015295707853510976, "global_step": 46265, "epoch": 388, "lr": 2.7932438350286617e-05} +{"train_loss": 0.0023396287579089403, "global_step": 46266, "epoch": 388, "lr": 2.793045031886883e-05} +{"train_loss": 0.0009870915673673153, "global_step": 46267, "epoch": 388, "lr": 2.7928462330782244e-05} +{"train_loss": 0.0010894926963374019, "global_step": 46268, "epoch": 388, "lr": 2.7926474386030793e-05} +{"train_loss": 0.0008502344717271626, "global_step": 46269, "epoch": 388, "lr": 2.792448648461835e-05} +{"train_loss": 0.0013646536972373724, "global_step": 46270, "epoch": 388, "lr": 2.7922498626548798e-05} +{"train_loss": 0.0014948087045922875, "global_step": 46271, "epoch": 388, "lr": 2.792051081182608e-05} +{"train_loss": 0.0012937154388055205, "global_step": 46272, "epoch": 388, "lr": 2.791852304045406e-05} +{"train_loss": 0.000763525313232094, "global_step": 46273, "epoch": 388, "lr": 2.7916535312436676e-05} +{"train_loss": 0.0013043226208537817, "global_step": 46274, "epoch": 388, "lr": 2.7914547627777805e-05} +{"train_loss": 0.0013941010693088174, "global_step": 46275, "epoch": 388, "lr": 2.7912559986481373e-05} +{"train_loss": 0.0011551891220733523, "global_step": 46276, "epoch": 388, "lr": 2.791057238855127e-05} +{"train_loss": 0.0022184248082339764, "global_step": 46277, "epoch": 388, "lr": 2.7908584833991386e-05} +{"train_loss": 0.002085847547277808, "global_step": 46278, "epoch": 388, "lr": 2.790659732280565e-05} +{"train_loss": 0.0012726180721074343, "global_step": 46279, "epoch": 388, "lr": 2.7904609854997932e-05} +{"train_loss": 0.0013295330572873354, "global_step": 46280, "epoch": 388, "lr": 2.7902622430572166e-05} +{"train_loss": 0.001247878884896636, "global_step": 46281, "epoch": 388, "lr": 2.7900635049532248e-05} +{"train_loss": 0.0012288059806451201, "global_step": 46282, "epoch": 388, "lr": 2.7898647711882047e-05} +{"train_loss": 0.002040224615484476, "global_step": 46283, "epoch": 388, "lr": 2.789666041762551e-05} +{"train_loss": 0.001652185688726604, "global_step": 46284, "epoch": 388, "lr": 2.7894673166766505e-05} +{"train_loss": 0.0009321995312348008, "global_step": 46285, "epoch": 388, "lr": 2.789268595930896e-05} +{"train_loss": 0.000615234486758709, "global_step": 46286, "epoch": 388, "lr": 2.789069879525675e-05} +{"train_loss": 0.0011242475593462586, "global_step": 46287, "epoch": 388, "lr": 2.7888711674613803e-05} +{"train_loss": 0.0008626979542896152, "global_step": 46288, "epoch": 388, "lr": 2.7886724597384017e-05} +{"train_loss": 0.001317181740887463, "global_step": 46289, "epoch": 388, "lr": 2.7884737563571263e-05} +{"train_loss": 0.0011870861163523299, "global_step": 46290, "epoch": 388, "lr": 2.7882750573179484e-05, "val_loss": 0.019463885575532913} +{"train_loss": 0.0010984580731019378, "global_step": 46291, "epoch": 389, "lr": 2.7880763626212537e-05} +{"train_loss": 0.0010637708473950624, "global_step": 46292, "epoch": 389, "lr": 2.787877672267437e-05} +{"train_loss": 0.0016543730162084103, "global_step": 46293, "epoch": 389, "lr": 2.7876789862568843e-05} +{"train_loss": 0.0008468043524771929, "global_step": 46294, "epoch": 389, "lr": 2.7874803045899893e-05} +{"train_loss": 0.0012961028842255473, "global_step": 46295, "epoch": 389, "lr": 2.7872816272671387e-05} +{"train_loss": 0.0008638571016490459, "global_step": 46296, "epoch": 389, "lr": 2.7870829542887255e-05} +{"train_loss": 0.0008863555267453194, "global_step": 46297, "epoch": 389, "lr": 2.7868842856551376e-05} +{"train_loss": 0.0014767195098102093, "global_step": 46298, "epoch": 389, "lr": 2.7866856213667668e-05} +{"train_loss": 0.0005525401211343706, "global_step": 46299, "epoch": 389, "lr": 2.7864869614240013e-05} +{"train_loss": 0.0006671876180917025, "global_step": 46300, "epoch": 389, "lr": 2.7862883058272337e-05} +{"train_loss": 0.0010310725774616003, "global_step": 46301, "epoch": 389, "lr": 2.786089654576851e-05} +{"train_loss": 0.0018020129064098, "global_step": 46302, "epoch": 389, "lr": 2.7858910076732463e-05} +{"train_loss": 0.0009826753521338105, "global_step": 46303, "epoch": 389, "lr": 2.785692365116806e-05} +{"train_loss": 0.0009132905979640782, "global_step": 46304, "epoch": 389, "lr": 2.7854937269079244e-05} +{"train_loss": 0.001132688019424677, "global_step": 46305, "epoch": 389, "lr": 2.7852950930469873e-05} +{"train_loss": 0.0011435956694185734, "global_step": 46306, "epoch": 389, "lr": 2.7850964635343886e-05} +{"train_loss": 0.0013518438208848238, "global_step": 46307, "epoch": 389, "lr": 2.784897838370516e-05} +{"train_loss": 0.0005370479193516076, "global_step": 46308, "epoch": 389, "lr": 2.7846992175557584e-05} +{"train_loss": 0.0009545503999106586, "global_step": 46309, "epoch": 389, "lr": 2.784500601090509e-05} +{"train_loss": 0.0013519017957150936, "global_step": 46310, "epoch": 389, "lr": 2.7843019889751542e-05} +{"train_loss": 0.0012889509089291096, "global_step": 46311, "epoch": 389, "lr": 2.7841033812100868e-05} +{"train_loss": 0.0009474370162934065, "global_step": 46312, "epoch": 389, "lr": 2.783904777795695e-05} +{"train_loss": 0.0015338336816057563, "global_step": 46313, "epoch": 389, "lr": 2.7837061787323702e-05} +{"train_loss": 0.0010823847260326147, "global_step": 46314, "epoch": 389, "lr": 2.7835075840205027e-05} +{"train_loss": 0.0009893382666632533, "global_step": 46315, "epoch": 389, "lr": 2.7833089936604784e-05} +{"train_loss": 0.0006295618368312716, "global_step": 46316, "epoch": 389, "lr": 2.7831104076526926e-05} +{"train_loss": 0.0011275855358690023, "global_step": 46317, "epoch": 389, "lr": 2.7829118259975306e-05} +{"train_loss": 0.0006665447144769132, "global_step": 46318, "epoch": 389, "lr": 2.7827132486953862e-05} +{"train_loss": 0.0013405074132606387, "global_step": 46319, "epoch": 389, "lr": 2.782514675746647e-05} +{"train_loss": 0.0014671721728518605, "global_step": 46320, "epoch": 389, "lr": 2.7823161071517023e-05} +{"train_loss": 0.0015824487200006843, "global_step": 46321, "epoch": 389, "lr": 2.7821175429109448e-05} +{"train_loss": 0.0005072359926998615, "global_step": 46322, "epoch": 389, "lr": 2.78191898302476e-05} +{"train_loss": 0.00162211072165519, "global_step": 46323, "epoch": 389, "lr": 2.7817204274935425e-05} +{"train_loss": 0.0031432779505848885, "global_step": 46324, "epoch": 389, "lr": 2.7815218763176777e-05} +{"train_loss": 0.0019455034052953124, "global_step": 46325, "epoch": 389, "lr": 2.7813233294975606e-05} +{"train_loss": 0.0007198707317002118, "global_step": 46326, "epoch": 389, "lr": 2.7811247870335773e-05} +{"train_loss": 0.0007436801097355783, "global_step": 46327, "epoch": 389, "lr": 2.7809262489261166e-05} +{"train_loss": 0.0007466312381438911, "global_step": 46328, "epoch": 389, "lr": 2.7807277151755718e-05} +{"train_loss": 0.0009386251331306994, "global_step": 46329, "epoch": 389, "lr": 2.78052918578233e-05} +{"train_loss": 0.0009631359716877341, "global_step": 46330, "epoch": 389, "lr": 2.780330660746781e-05} +{"train_loss": 0.0020538971293717623, "global_step": 46331, "epoch": 389, "lr": 2.780132140069318e-05} +{"train_loss": 0.000822020519990474, "global_step": 46332, "epoch": 389, "lr": 2.779933623750327e-05} +{"train_loss": 0.0020397892221808434, "global_step": 46333, "epoch": 389, "lr": 2.7797351117902004e-05} +{"train_loss": 0.0014172479277476668, "global_step": 46334, "epoch": 389, "lr": 2.7795366041893245e-05} +{"train_loss": 0.0010236849775537848, "global_step": 46335, "epoch": 389, "lr": 2.779338100948094e-05} +{"train_loss": 0.0006425943574868143, "global_step": 46336, "epoch": 389, "lr": 2.7791396020668937e-05} +{"train_loss": 0.001294797519221902, "global_step": 46337, "epoch": 389, "lr": 2.7789411075461168e-05} +{"train_loss": 0.0015602053608745337, "global_step": 46338, "epoch": 389, "lr": 2.778742617386153e-05} +{"train_loss": 0.0009279205114580691, "global_step": 46339, "epoch": 389, "lr": 2.778544131587388e-05} +{"train_loss": 0.0017757320310920477, "global_step": 46340, "epoch": 389, "lr": 2.778345650150216e-05} +{"train_loss": 0.0013245466398075223, "global_step": 46341, "epoch": 389, "lr": 2.7781471730750237e-05} +{"train_loss": 0.001037207548506558, "global_step": 46342, "epoch": 389, "lr": 2.7779487003622033e-05} +{"train_loss": 0.0016895232256501913, "global_step": 46343, "epoch": 389, "lr": 2.7777502320121417e-05} +{"train_loss": 0.002725091762840748, "global_step": 46344, "epoch": 389, "lr": 2.777551768025232e-05} +{"train_loss": 0.0009315281640738249, "global_step": 46345, "epoch": 389, "lr": 2.7773533084018622e-05} +{"train_loss": 0.001775467535480857, "global_step": 46346, "epoch": 389, "lr": 2.7771548531424197e-05} +{"train_loss": 0.0021183257922530174, "global_step": 46347, "epoch": 389, "lr": 2.776956402247298e-05} +{"train_loss": 0.0016623802948743105, "global_step": 46348, "epoch": 389, "lr": 2.7767579557168827e-05} +{"train_loss": 0.0014066514559090137, "global_step": 46349, "epoch": 389, "lr": 2.7765595135515677e-05} +{"train_loss": 0.0012323748087510467, "global_step": 46350, "epoch": 389, "lr": 2.776361075751741e-05} +{"train_loss": 0.001285430509597063, "global_step": 46351, "epoch": 389, "lr": 2.7761626423177894e-05} +{"train_loss": 0.0015477092238143086, "global_step": 46352, "epoch": 389, "lr": 2.775964213250107e-05} +{"train_loss": 0.001599057693965733, "global_step": 46353, "epoch": 389, "lr": 2.7757657885490797e-05} +{"train_loss": 0.0009166924864985049, "global_step": 46354, "epoch": 389, "lr": 2.7755673682150996e-05} +{"train_loss": 0.0009346964070573449, "global_step": 46355, "epoch": 389, "lr": 2.7753689522485536e-05} +{"train_loss": 0.0018665592651814222, "global_step": 46356, "epoch": 389, "lr": 2.7751705406498353e-05} +{"train_loss": 0.0015689361607655883, "global_step": 46357, "epoch": 389, "lr": 2.7749721334193323e-05} +{"train_loss": 0.0008104313747026026, "global_step": 46358, "epoch": 389, "lr": 2.774773730557431e-05} +{"train_loss": 0.0017931073671206832, "global_step": 46359, "epoch": 389, "lr": 2.7745753320645263e-05} +{"train_loss": 0.0012228686828166246, "global_step": 46360, "epoch": 389, "lr": 2.7743769379410034e-05} +{"train_loss": 0.003445773385465145, "global_step": 46361, "epoch": 389, "lr": 2.774178548187255e-05} +{"train_loss": 0.000953131471760571, "global_step": 46362, "epoch": 389, "lr": 2.7739801628036676e-05} +{"train_loss": 0.001541233854368329, "global_step": 46363, "epoch": 389, "lr": 2.773781781790634e-05} +{"train_loss": 0.000919516256544739, "global_step": 46364, "epoch": 389, "lr": 2.7735834051485403e-05} +{"train_loss": 0.0012824631994590163, "global_step": 46365, "epoch": 389, "lr": 2.773385032877778e-05} +{"train_loss": 0.0010517806513234973, "global_step": 46366, "epoch": 389, "lr": 2.773186664978738e-05} +{"train_loss": 0.0017340837512165308, "global_step": 46367, "epoch": 389, "lr": 2.772988301451806e-05} +{"train_loss": 0.0021237144246697426, "global_step": 46368, "epoch": 389, "lr": 2.772789942297376e-05} +{"train_loss": 0.00108509068377316, "global_step": 46369, "epoch": 389, "lr": 2.7725915875158344e-05} +{"train_loss": 0.0009344291756860912, "global_step": 46370, "epoch": 389, "lr": 2.7723932371075696e-05} +{"train_loss": 0.0012530034873634577, "global_step": 46371, "epoch": 389, "lr": 2.7721948910729745e-05} +{"train_loss": 0.0012046112678945065, "global_step": 46372, "epoch": 389, "lr": 2.7719965494124344e-05} +{"train_loss": 0.002614513738080859, "global_step": 46373, "epoch": 389, "lr": 2.771798212126344e-05} +{"train_loss": 0.0019967600237578154, "global_step": 46374, "epoch": 389, "lr": 2.7715998792150872e-05} +{"train_loss": 0.000980457291007042, "global_step": 46375, "epoch": 389, "lr": 2.771401550679058e-05} +{"train_loss": 0.0008823331445455551, "global_step": 46376, "epoch": 389, "lr": 2.771203226518644e-05} +{"train_loss": 0.0010699074482545257, "global_step": 46377, "epoch": 389, "lr": 2.7710049067342316e-05} +{"train_loss": 0.0011854689801111817, "global_step": 46378, "epoch": 389, "lr": 2.770806591326216e-05} +{"train_loss": 0.0013279288541525602, "global_step": 46379, "epoch": 389, "lr": 2.7706082802949805e-05} +{"train_loss": 0.001078886678442359, "global_step": 46380, "epoch": 389, "lr": 2.77040997364092e-05} +{"train_loss": 0.001766656176187098, "global_step": 46381, "epoch": 389, "lr": 2.7702116713644212e-05} +{"train_loss": 0.0009632958681322634, "global_step": 46382, "epoch": 389, "lr": 2.770013373465872e-05} +{"train_loss": 0.0013421495677903295, "global_step": 46383, "epoch": 389, "lr": 2.7698150799456647e-05} +{"train_loss": 0.001746219233609736, "global_step": 46384, "epoch": 389, "lr": 2.7696167908041855e-05} +{"train_loss": 0.0009601764613762498, "global_step": 46385, "epoch": 389, "lr": 2.769418506041827e-05} +{"train_loss": 0.0010920766508206725, "global_step": 46386, "epoch": 389, "lr": 2.7692202256589754e-05} +{"train_loss": 0.0013367709470912814, "global_step": 46387, "epoch": 389, "lr": 2.769021949656023e-05} +{"train_loss": 0.00175478623714298, "global_step": 46388, "epoch": 389, "lr": 2.7688236780333587e-05} +{"train_loss": 0.0014884237898513675, "global_step": 46389, "epoch": 389, "lr": 2.7686254107913685e-05} +{"train_loss": 0.00111395213752985, "global_step": 46390, "epoch": 389, "lr": 2.7684271479304458e-05} +{"train_loss": 0.0011498157400637865, "global_step": 46391, "epoch": 389, "lr": 2.7682288894509755e-05} +{"train_loss": 0.0008359065977856517, "global_step": 46392, "epoch": 389, "lr": 2.7680306353533513e-05} +{"train_loss": 0.0014343251241371036, "global_step": 46393, "epoch": 389, "lr": 2.7678323856379595e-05} +{"train_loss": 0.00121870799921453, "global_step": 46394, "epoch": 389, "lr": 2.7676341403051914e-05} +{"train_loss": 0.001053670304827392, "global_step": 46395, "epoch": 389, "lr": 2.7674358993554335e-05} +{"train_loss": 0.001619271351955831, "global_step": 46396, "epoch": 389, "lr": 2.7672376627890783e-05} +{"train_loss": 0.0010360110318288207, "global_step": 46397, "epoch": 389, "lr": 2.767039430606512e-05} +{"train_loss": 0.0012792584020644426, "global_step": 46398, "epoch": 389, "lr": 2.766841202808127e-05} +{"train_loss": 0.0013665021397173405, "global_step": 46399, "epoch": 389, "lr": 2.766642979394309e-05} +{"train_loss": 0.0013633208582177758, "global_step": 46400, "epoch": 389, "lr": 2.7664447603654507e-05} +{"train_loss": 0.001186296925880015, "global_step": 46401, "epoch": 389, "lr": 2.766246545721937e-05} +{"train_loss": 0.0009714096668176353, "global_step": 46402, "epoch": 389, "lr": 2.766048335464162e-05} +{"train_loss": 0.0008019196102395654, "global_step": 46403, "epoch": 389, "lr": 2.765850129592511e-05} +{"train_loss": 0.0010850864928215742, "global_step": 46404, "epoch": 389, "lr": 2.7656519281073756e-05} +{"train_loss": 0.0016918095061555505, "global_step": 46405, "epoch": 389, "lr": 2.7654537310091422e-05} +{"train_loss": 0.0009722418617457151, "global_step": 46406, "epoch": 389, "lr": 2.7652555382982038e-05} +{"train_loss": 0.0009511734824627638, "global_step": 46407, "epoch": 389, "lr": 2.7650573499749478e-05} +{"train_loss": 0.0015693005407229066, "global_step": 46408, "epoch": 389, "lr": 2.7648591660397606e-05} +{"train_loss": 0.0012920470546320582, "global_step": 46409, "epoch": 389, "lr": 2.7646609864930352e-05, "val_loss": 0.011102374643087387} +{"train_loss": 0.001013044617138803, "global_step": 46410, "epoch": 390, "lr": 2.7644628113351578e-05} +{"train_loss": 0.0005033215857110918, "global_step": 46411, "epoch": 390, "lr": 2.7642646405665208e-05} +{"train_loss": 0.0009278950747102499, "global_step": 46412, "epoch": 390, "lr": 2.7640664741875087e-05} +{"train_loss": 0.0012145255459472537, "global_step": 46413, "epoch": 390, "lr": 2.7638683121985155e-05} +{"train_loss": 0.0013960747746750712, "global_step": 46414, "epoch": 390, "lr": 2.7636701545999283e-05} +{"train_loss": 0.0007240494596771896, "global_step": 46415, "epoch": 390, "lr": 2.7634720013921335e-05} +{"train_loss": 0.0009535984136164188, "global_step": 46416, "epoch": 390, "lr": 2.7632738525755242e-05} +{"train_loss": 0.0012720570666715503, "global_step": 46417, "epoch": 390, "lr": 2.7630757081504867e-05} +{"train_loss": 0.0011869784211739898, "global_step": 46418, "epoch": 390, "lr": 2.7628775681174125e-05} +{"train_loss": 0.000983772217296064, "global_step": 46419, "epoch": 390, "lr": 2.762679432476689e-05} +{"train_loss": 0.0009151826379820704, "global_step": 46420, "epoch": 390, "lr": 2.7624813012287032e-05} +{"train_loss": 0.0008955789962783456, "global_step": 46421, "epoch": 390, "lr": 2.7622831743738493e-05} +{"train_loss": 0.001481168088503182, "global_step": 46422, "epoch": 390, "lr": 2.762085051912511e-05} +{"train_loss": 0.0011811417061835527, "global_step": 46423, "epoch": 390, "lr": 2.7618869338450807e-05} +{"train_loss": 0.0009341700933873653, "global_step": 46424, "epoch": 390, "lr": 2.761688820171945e-05} +{"train_loss": 0.0012738569639623165, "global_step": 46425, "epoch": 390, "lr": 2.761490710893496e-05} +{"train_loss": 0.0008341424399986863, "global_step": 46426, "epoch": 390, "lr": 2.761292606010119e-05} +{"train_loss": 0.0008332172292284667, "global_step": 46427, "epoch": 390, "lr": 2.761094505522207e-05} +{"train_loss": 0.0009410957572981715, "global_step": 46428, "epoch": 390, "lr": 2.760896409430145e-05} +{"train_loss": 0.0016780565492808819, "global_step": 46429, "epoch": 390, "lr": 2.760698317734325e-05} +{"train_loss": 0.0012170409318059683, "global_step": 46430, "epoch": 390, "lr": 2.7605002304351325e-05} +{"train_loss": 0.0015178871108219028, "global_step": 46431, "epoch": 390, "lr": 2.7603021475329605e-05} +{"train_loss": 0.0011428919387981296, "global_step": 46432, "epoch": 390, "lr": 2.7601040690281943e-05} +{"train_loss": 0.0009175427840091288, "global_step": 46433, "epoch": 390, "lr": 2.759905994921227e-05} +{"train_loss": 0.0013878613244742155, "global_step": 46434, "epoch": 390, "lr": 2.7597079252124425e-05} +{"train_loss": 0.0010507367551326752, "global_step": 46435, "epoch": 390, "lr": 2.759509859902234e-05} +{"train_loss": 0.0024135082494467497, "global_step": 46436, "epoch": 390, "lr": 2.7593117989909867e-05} +{"train_loss": 0.0008587036281824112, "global_step": 46437, "epoch": 390, "lr": 2.759113742479093e-05} +{"train_loss": 0.001552912057377398, "global_step": 46438, "epoch": 390, "lr": 2.75891569036694e-05} +{"train_loss": 0.00131698336917907, "global_step": 46439, "epoch": 390, "lr": 2.7587176426549157e-05} +{"train_loss": 0.0013208244927227497, "global_step": 46440, "epoch": 390, "lr": 2.7585195993434103e-05} +{"train_loss": 0.0010511489817872643, "global_step": 46441, "epoch": 390, "lr": 2.7583215604328112e-05} +{"train_loss": 0.001128323026932776, "global_step": 46442, "epoch": 390, "lr": 2.75812352592351e-05} +{"train_loss": 0.001325215445831418, "global_step": 46443, "epoch": 390, "lr": 2.757925495815892e-05} +{"train_loss": 0.0011880120728164911, "global_step": 46444, "epoch": 390, "lr": 2.7577274701103495e-05} +{"train_loss": 0.0015773957129567862, "global_step": 46445, "epoch": 390, "lr": 2.757529448807269e-05} +{"train_loss": 0.0016956183826550841, "global_step": 46446, "epoch": 390, "lr": 2.7573314319070387e-05} +{"train_loss": 0.0012283511459827423, "global_step": 46447, "epoch": 390, "lr": 2.75713341941005e-05} +{"train_loss": 0.0011671767570078373, "global_step": 46448, "epoch": 390, "lr": 2.756935411316689e-05} +{"train_loss": 0.001918796100653708, "global_step": 46449, "epoch": 390, "lr": 2.7567374076273466e-05} +{"train_loss": 0.0010249686893075705, "global_step": 46450, "epoch": 390, "lr": 2.756539408342411e-05} +{"train_loss": 0.0012697919737547636, "global_step": 46451, "epoch": 390, "lr": 2.756341413462269e-05} +{"train_loss": 0.0014678178122267127, "global_step": 46452, "epoch": 390, "lr": 2.7561434229873127e-05} +{"train_loss": 0.0010422362247481942, "global_step": 46453, "epoch": 390, "lr": 2.7559454369179273e-05} +{"train_loss": 0.0009331844048574567, "global_step": 46454, "epoch": 390, "lr": 2.7557474552545047e-05} +{"train_loss": 0.000837859814055264, "global_step": 46455, "epoch": 390, "lr": 2.7555494779974312e-05} +{"train_loss": 0.001233489252626896, "global_step": 46456, "epoch": 390, "lr": 2.755351505147098e-05} +{"train_loss": 0.0018395234365016222, "global_step": 46457, "epoch": 390, "lr": 2.7551535367038917e-05} +{"train_loss": 0.001278152223676443, "global_step": 46458, "epoch": 390, "lr": 2.7549555726682e-05} +{"train_loss": 0.0014521065168082714, "global_step": 46459, "epoch": 390, "lr": 2.7547576130404152e-05} +{"train_loss": 0.0009045378537848592, "global_step": 46460, "epoch": 390, "lr": 2.754559657820922e-05} +{"train_loss": 0.0012838034890592098, "global_step": 46461, "epoch": 390, "lr": 2.7543617070101136e-05} +{"train_loss": 0.0016401833854615688, "global_step": 46462, "epoch": 390, "lr": 2.7541637606083738e-05} +{"train_loss": 0.0018514258554205298, "global_step": 46463, "epoch": 390, "lr": 2.7539658186160933e-05} +{"train_loss": 0.000798034539911896, "global_step": 46464, "epoch": 390, "lr": 2.7537678810336626e-05} +{"train_loss": 0.0014675242127850652, "global_step": 46465, "epoch": 390, "lr": 2.7535699478614675e-05} +{"train_loss": 0.001365494797937572, "global_step": 46466, "epoch": 390, "lr": 2.753372019099899e-05} +{"train_loss": 0.0009790905751287937, "global_step": 46467, "epoch": 390, "lr": 2.753174094749343e-05} +{"train_loss": 0.0007970247534103692, "global_step": 46468, "epoch": 390, "lr": 2.7529761748101913e-05} +{"train_loss": 0.0008238937007263303, "global_step": 46469, "epoch": 390, "lr": 2.7527782592828312e-05} +{"train_loss": 0.001275577349588275, "global_step": 46470, "epoch": 390, "lr": 2.752580348167648e-05} +{"train_loss": 0.0011971526546403766, "global_step": 46471, "epoch": 390, "lr": 2.7523824414650368e-05} +{"train_loss": 0.0007174763013608754, "global_step": 46472, "epoch": 390, "lr": 2.7521845391753793e-05} +{"train_loss": 0.0011744373477995396, "global_step": 46473, "epoch": 390, "lr": 2.7519866412990698e-05} +{"train_loss": 0.0010044397786259651, "global_step": 46474, "epoch": 390, "lr": 2.7517887478364924e-05} +{"train_loss": 0.001312566688284278, "global_step": 46475, "epoch": 390, "lr": 2.7515908587880392e-05} +{"train_loss": 0.0016762807499617338, "global_step": 46476, "epoch": 390, "lr": 2.7513929741540974e-05} +{"train_loss": 0.0010338322026655078, "global_step": 46477, "epoch": 390, "lr": 2.7511950939350533e-05} +{"train_loss": 0.0009205095702782273, "global_step": 46478, "epoch": 390, "lr": 2.7509972181312992e-05} +{"train_loss": 0.0011659155134111643, "global_step": 46479, "epoch": 390, "lr": 2.7507993467432204e-05} +{"train_loss": 0.0020316680893301964, "global_step": 46480, "epoch": 390, "lr": 2.7506014797712078e-05} +{"train_loss": 0.0009517743019387126, "global_step": 46481, "epoch": 390, "lr": 2.7504036172156477e-05} +{"train_loss": 0.000732982181943953, "global_step": 46482, "epoch": 390, "lr": 2.7502057590769314e-05} +{"train_loss": 0.0013638435630127788, "global_step": 46483, "epoch": 390, "lr": 2.750007905355446e-05} +{"train_loss": 0.0013710990315303206, "global_step": 46484, "epoch": 390, "lr": 2.7498100560515772e-05} +{"train_loss": 0.0020336408633738756, "global_step": 46485, "epoch": 390, "lr": 2.7496122111657187e-05} +{"train_loss": 0.002096785232424736, "global_step": 46486, "epoch": 390, "lr": 2.7494143706982533e-05} +{"train_loss": 0.0010367707582190633, "global_step": 46487, "epoch": 390, "lr": 2.7492165346495746e-05} +{"train_loss": 0.0008255150751210749, "global_step": 46488, "epoch": 390, "lr": 2.7490187030200693e-05} +{"train_loss": 0.001344699994660914, "global_step": 46489, "epoch": 390, "lr": 2.748820875810123e-05} +{"train_loss": 0.0022972854785621166, "global_step": 46490, "epoch": 390, "lr": 2.7486230530201283e-05} +{"train_loss": 0.0012717198114842176, "global_step": 46491, "epoch": 390, "lr": 2.74842523465047e-05} +{"train_loss": 0.0013225332368165255, "global_step": 46492, "epoch": 390, "lr": 2.7482274207015403e-05} +{"train_loss": 0.0006335750222206116, "global_step": 46493, "epoch": 390, "lr": 2.7480296111737226e-05} +{"train_loss": 0.00123019446618855, "global_step": 46494, "epoch": 390, "lr": 2.7478318060674112e-05} +{"train_loss": 0.0023596519604325294, "global_step": 46495, "epoch": 390, "lr": 2.7476340053829885e-05} +{"train_loss": 0.0011122743599116802, "global_step": 46496, "epoch": 390, "lr": 2.7474362091208482e-05} +{"train_loss": 0.0018488230416551232, "global_step": 46497, "epoch": 390, "lr": 2.7472384172813747e-05} +{"train_loss": 0.0013968244893476367, "global_step": 46498, "epoch": 390, "lr": 2.7470406298649577e-05} +{"train_loss": 0.0008602314628660679, "global_step": 46499, "epoch": 390, "lr": 2.7468428468719877e-05} +{"train_loss": 0.0011656609131023288, "global_step": 46500, "epoch": 390, "lr": 2.746645068302849e-05} +{"train_loss": 0.0010085570393130183, "global_step": 46501, "epoch": 390, "lr": 2.746447294157934e-05} +{"train_loss": 0.000927348795812577, "global_step": 46502, "epoch": 390, "lr": 2.7462495244376286e-05} +{"train_loss": 0.0015050646616145968, "global_step": 46503, "epoch": 390, "lr": 2.7460517591423197e-05} +{"train_loss": 0.0014911799225956202, "global_step": 46504, "epoch": 390, "lr": 2.7458539982723995e-05} +{"train_loss": 0.0011347942054271698, "global_step": 46505, "epoch": 390, "lr": 2.745656241828252e-05} +{"train_loss": 0.0009220088832080364, "global_step": 46506, "epoch": 390, "lr": 2.7454584898102697e-05} +{"train_loss": 0.0016743817832320929, "global_step": 46507, "epoch": 390, "lr": 2.745260742218839e-05} +{"train_loss": 0.0016524092061445117, "global_step": 46508, "epoch": 390, "lr": 2.745062999054346e-05} +{"train_loss": 0.0011627173516899347, "global_step": 46509, "epoch": 390, "lr": 2.7448652603171825e-05} +{"train_loss": 0.0009581900085322559, "global_step": 46510, "epoch": 390, "lr": 2.7446675260077337e-05} +{"train_loss": 0.0008210481610149145, "global_step": 46511, "epoch": 390, "lr": 2.744469796126391e-05} +{"train_loss": 0.001246312982402742, "global_step": 46512, "epoch": 390, "lr": 2.7442720706735382e-05} +{"train_loss": 0.0018024110468104482, "global_step": 46513, "epoch": 390, "lr": 2.744074349649569e-05} +{"train_loss": 0.0017425764817744493, "global_step": 46514, "epoch": 390, "lr": 2.743876633054868e-05} +{"train_loss": 0.0016009893734008074, "global_step": 46515, "epoch": 390, "lr": 2.7436789208898235e-05} +{"train_loss": 0.0012393243378028274, "global_step": 46516, "epoch": 390, "lr": 2.7434812131548255e-05} +{"train_loss": 0.0017849506111815572, "global_step": 46517, "epoch": 390, "lr": 2.743283509850259e-05} +{"train_loss": 0.0009475862607359886, "global_step": 46518, "epoch": 390, "lr": 2.7430858109765167e-05} +{"train_loss": 0.001106383977457881, "global_step": 46519, "epoch": 390, "lr": 2.7428881165339838e-05} +{"train_loss": 0.0015024211024865508, "global_step": 46520, "epoch": 390, "lr": 2.7426904265230476e-05} +{"train_loss": 0.0015064848121255636, "global_step": 46521, "epoch": 390, "lr": 2.742492740944099e-05} +{"train_loss": 0.0017401233781129122, "global_step": 46522, "epoch": 390, "lr": 2.7422950597975226e-05} +{"train_loss": 0.0015530235832557082, "global_step": 46523, "epoch": 390, "lr": 2.7420973830837115e-05} +{"train_loss": 0.0028553633019328117, "global_step": 46524, "epoch": 390, "lr": 2.7418997108030482e-05} +{"train_loss": 0.0017304338980466127, "global_step": 46525, "epoch": 390, "lr": 2.741702042955926e-05} +{"train_loss": 0.0014789985725656152, "global_step": 46526, "epoch": 390, "lr": 2.741504379542728e-05} +{"train_loss": 0.0020248815417289734, "global_step": 46527, "epoch": 390, "lr": 2.7413067205638478e-05} +{"train_loss": 0.0012908454988339619, "global_step": 46528, "epoch": 390, "lr": 2.7411090660196675e-05, "val_loss": 0.024407697841525078, "train_action_mse_error": 1.6661164409015328e-05} +{"train_loss": 0.0010156574426218867, "global_step": 46529, "epoch": 391, "lr": 2.7409114159105808e-05} +{"train_loss": 0.0012338694650679827, "global_step": 46530, "epoch": 391, "lr": 2.7407137702369713e-05} +{"train_loss": 0.0015972064575180411, "global_step": 46531, "epoch": 391, "lr": 2.740516128999231e-05} +{"train_loss": 0.0021523188333958387, "global_step": 46532, "epoch": 391, "lr": 2.740318492197743e-05} +{"train_loss": 0.0011803567176684737, "global_step": 46533, "epoch": 391, "lr": 2.740120859832901e-05} +{"train_loss": 0.002113556256517768, "global_step": 46534, "epoch": 391, "lr": 2.739923231905088e-05} +{"train_loss": 0.00046428473433479667, "global_step": 46535, "epoch": 391, "lr": 2.7397256084146966e-05} +{"train_loss": 0.0020534321665763855, "global_step": 46536, "epoch": 391, "lr": 2.7395279893621105e-05} +{"train_loss": 0.001848282990977168, "global_step": 46537, "epoch": 391, "lr": 2.7393303747477217e-05} +{"train_loss": 0.0007463148212991655, "global_step": 46538, "epoch": 391, "lr": 2.7391327645719156e-05} +{"train_loss": 0.0018550344975665212, "global_step": 46539, "epoch": 391, "lr": 2.738935158835079e-05} +{"train_loss": 0.000795237603597343, "global_step": 46540, "epoch": 391, "lr": 2.738737557537604e-05} +{"train_loss": 0.0008763070800341666, "global_step": 46541, "epoch": 391, "lr": 2.738539960679874e-05} +{"train_loss": 0.0017207675846293569, "global_step": 46542, "epoch": 391, "lr": 2.738342368262281e-05} +{"train_loss": 0.000326995097566396, "global_step": 46543, "epoch": 391, "lr": 2.7381447802852102e-05} +{"train_loss": 0.0020012231543660164, "global_step": 46544, "epoch": 391, "lr": 2.737947196749051e-05} +{"train_loss": 0.0007309385691769421, "global_step": 46545, "epoch": 391, "lr": 2.7377496176541916e-05} +{"train_loss": 0.0012221348006278276, "global_step": 46546, "epoch": 391, "lr": 2.737552043001017e-05} +{"train_loss": 0.0010659558465704322, "global_step": 46547, "epoch": 391, "lr": 2.737354472789919e-05} +{"train_loss": 0.0008813261520117521, "global_step": 46548, "epoch": 391, "lr": 2.737156907021282e-05} +{"train_loss": 0.001506286789663136, "global_step": 46549, "epoch": 391, "lr": 2.7369593456954977e-05} +{"train_loss": 0.0018741117091849446, "global_step": 46550, "epoch": 391, "lr": 2.7367617888129504e-05} +{"train_loss": 0.0007431705598719418, "global_step": 46551, "epoch": 391, "lr": 2.7365642363740307e-05} +{"train_loss": 0.0016862908378243446, "global_step": 46552, "epoch": 391, "lr": 2.736366688379126e-05} +{"train_loss": 0.0021618553437292576, "global_step": 46553, "epoch": 391, "lr": 2.736169144828621e-05} +{"train_loss": 0.0015688425628468394, "global_step": 46554, "epoch": 391, "lr": 2.735971605722908e-05} +{"train_loss": 0.000659128709230572, "global_step": 46555, "epoch": 391, "lr": 2.7357740710623712e-05} +{"train_loss": 0.0010156019125133753, "global_step": 46556, "epoch": 391, "lr": 2.735576540847402e-05} +{"train_loss": 0.0021452722139656544, "global_step": 46557, "epoch": 391, "lr": 2.7353790150783864e-05} +{"train_loss": 0.0007865522638894618, "global_step": 46558, "epoch": 391, "lr": 2.7351814937557103e-05} +{"train_loss": 0.0016635018400847912, "global_step": 46559, "epoch": 391, "lr": 2.734983976879763e-05} +{"train_loss": 0.001235108356922865, "global_step": 46560, "epoch": 391, "lr": 2.7347864644509346e-05} +{"train_loss": 0.0012141799088567495, "global_step": 46561, "epoch": 391, "lr": 2.7345889564696092e-05} +{"train_loss": 0.0008947982569225132, "global_step": 46562, "epoch": 391, "lr": 2.7343914529361784e-05} +{"train_loss": 0.0011897127842530608, "global_step": 46563, "epoch": 391, "lr": 2.7341939538510263e-05} +{"train_loss": 0.002221818547695875, "global_step": 46564, "epoch": 391, "lr": 2.733996459214544e-05} +{"train_loss": 0.0011889387387782335, "global_step": 46565, "epoch": 391, "lr": 2.7337989690271155e-05} +{"train_loss": 0.0011635635746642947, "global_step": 46566, "epoch": 391, "lr": 2.733601483289132e-05} +{"train_loss": 0.0011971675558015704, "global_step": 46567, "epoch": 391, "lr": 2.7334040020009787e-05} +{"train_loss": 0.0012036468833684921, "global_step": 46568, "epoch": 391, "lr": 2.7332065251630466e-05} +{"train_loss": 0.002067709341645241, "global_step": 46569, "epoch": 391, "lr": 2.7330090527757207e-05} +{"train_loss": 0.0014420339139178395, "global_step": 46570, "epoch": 391, "lr": 2.7328115848393876e-05} +{"train_loss": 0.0014070445904508233, "global_step": 46571, "epoch": 391, "lr": 2.7326141213544387e-05} +{"train_loss": 0.0014989344635978341, "global_step": 46572, "epoch": 391, "lr": 2.7324166623212577e-05} +{"train_loss": 0.0007181604742072523, "global_step": 46573, "epoch": 391, "lr": 2.7322192077402364e-05} +{"train_loss": 0.0012935642153024673, "global_step": 46574, "epoch": 391, "lr": 2.732021757611759e-05} +{"train_loss": 0.0026210793294012547, "global_step": 46575, "epoch": 391, "lr": 2.7318243119362158e-05} +{"train_loss": 0.0010954717872664332, "global_step": 46576, "epoch": 391, "lr": 2.7316268707139937e-05} +{"train_loss": 0.0015524841146543622, "global_step": 46577, "epoch": 391, "lr": 2.731429433945477e-05} +{"train_loss": 0.001756216399371624, "global_step": 46578, "epoch": 391, "lr": 2.731232001631059e-05} +{"train_loss": 0.0007255733362399042, "global_step": 46579, "epoch": 391, "lr": 2.731034573771123e-05} +{"train_loss": 0.0012000532587990165, "global_step": 46580, "epoch": 391, "lr": 2.730837150366059e-05} +{"train_loss": 0.0012163419742137194, "global_step": 46581, "epoch": 391, "lr": 2.730639731416253e-05} +{"train_loss": 0.001003354205749929, "global_step": 46582, "epoch": 391, "lr": 2.730442316922095e-05} +{"train_loss": 0.001002045231871307, "global_step": 46583, "epoch": 391, "lr": 2.7302449068839708e-05} +{"train_loss": 0.0013887709937989712, "global_step": 46584, "epoch": 391, "lr": 2.7300475013022663e-05} +{"train_loss": 0.0012144013307988644, "global_step": 46585, "epoch": 391, "lr": 2.7298501001773737e-05} +{"train_loss": 0.0015189849073067307, "global_step": 46586, "epoch": 391, "lr": 2.7296527035096752e-05} +{"train_loss": 0.00164414057508111, "global_step": 46587, "epoch": 391, "lr": 2.729455311299563e-05} +{"train_loss": 0.0016415179707109928, "global_step": 46588, "epoch": 391, "lr": 2.729257923547423e-05} +{"train_loss": 0.0010959969367831945, "global_step": 46589, "epoch": 391, "lr": 2.7290605402536406e-05} +{"train_loss": 0.0016445430228486657, "global_step": 46590, "epoch": 391, "lr": 2.7288631614186066e-05} +{"train_loss": 0.001633586478419602, "global_step": 46591, "epoch": 391, "lr": 2.728665787042706e-05} +{"train_loss": 0.0012190459528937936, "global_step": 46592, "epoch": 391, "lr": 2.7284684171263285e-05} +{"train_loss": 0.0013309759087860584, "global_step": 46593, "epoch": 391, "lr": 2.7282710516698595e-05} +{"train_loss": 0.0016956215258687735, "global_step": 46594, "epoch": 391, "lr": 2.728073690673687e-05} +{"train_loss": 0.0013841841137036681, "global_step": 46595, "epoch": 391, "lr": 2.727876334138202e-05} +{"train_loss": 0.0016891185659915209, "global_step": 46596, "epoch": 391, "lr": 2.7276789820637862e-05} +{"train_loss": 0.0011005682172253728, "global_step": 46597, "epoch": 391, "lr": 2.7274816344508326e-05} +{"train_loss": 0.0007092190789990127, "global_step": 46598, "epoch": 391, "lr": 2.7272842912997233e-05} +{"train_loss": 0.0010103755630552769, "global_step": 46599, "epoch": 391, "lr": 2.7270869526108506e-05} +{"train_loss": 0.0011264653876423836, "global_step": 46600, "epoch": 391, "lr": 2.7268896183845982e-05} +{"train_loss": 0.0019347434863448143, "global_step": 46601, "epoch": 391, "lr": 2.7266922886213562e-05} +{"train_loss": 0.001123934518545866, "global_step": 46602, "epoch": 391, "lr": 2.7264949633215124e-05} +{"train_loss": 0.0013463855721056461, "global_step": 46603, "epoch": 391, "lr": 2.7262976424854502e-05} +{"train_loss": 0.001394780701957643, "global_step": 46604, "epoch": 391, "lr": 2.726100326113562e-05} +{"train_loss": 0.0015510141383856535, "global_step": 46605, "epoch": 391, "lr": 2.7259030142062302e-05} +{"train_loss": 0.0013308768393471837, "global_step": 46606, "epoch": 391, "lr": 2.7257057067638474e-05} +{"train_loss": 0.0009141095215454698, "global_step": 46607, "epoch": 391, "lr": 2.7255084037867982e-05} +{"train_loss": 0.0016768209170550108, "global_step": 46608, "epoch": 391, "lr": 2.7253111052754688e-05} +{"train_loss": 0.001524635124951601, "global_step": 46609, "epoch": 391, "lr": 2.72511381123025e-05} +{"train_loss": 0.0006123468047007918, "global_step": 46610, "epoch": 391, "lr": 2.724916521651525e-05} +{"train_loss": 0.0012279762886464596, "global_step": 46611, "epoch": 391, "lr": 2.7247192365396844e-05} +{"train_loss": 0.001005441532470286, "global_step": 46612, "epoch": 391, "lr": 2.724521955895114e-05} +{"train_loss": 0.0013040215708315372, "global_step": 46613, "epoch": 391, "lr": 2.7243246797182032e-05} +{"train_loss": 0.0008002109243534505, "global_step": 46614, "epoch": 391, "lr": 2.724127408009337e-05} +{"train_loss": 0.002256590873003006, "global_step": 46615, "epoch": 391, "lr": 2.723930140768902e-05} +{"train_loss": 0.001023224089294672, "global_step": 46616, "epoch": 391, "lr": 2.7237328779972892e-05} +{"train_loss": 0.0015487041091546416, "global_step": 46617, "epoch": 391, "lr": 2.7235356196948814e-05} +{"train_loss": 0.0012404263252392411, "global_step": 46618, "epoch": 391, "lr": 2.7233383658620703e-05} +{"train_loss": 0.0009103136835619807, "global_step": 46619, "epoch": 391, "lr": 2.7231411164992394e-05} +{"train_loss": 0.0010155565105378628, "global_step": 46620, "epoch": 391, "lr": 2.722943871606779e-05} +{"train_loss": 0.0016006227815523744, "global_step": 46621, "epoch": 391, "lr": 2.7227466311850758e-05} +{"train_loss": 0.0015104188350960612, "global_step": 46622, "epoch": 391, "lr": 2.722549395234514e-05} +{"train_loss": 0.0006424457533285022, "global_step": 46623, "epoch": 391, "lr": 2.722352163755485e-05} +{"train_loss": 0.0016626989236101508, "global_step": 46624, "epoch": 391, "lr": 2.7221549367483724e-05} +{"train_loss": 0.0013872550334781408, "global_step": 46625, "epoch": 391, "lr": 2.7219577142135672e-05} +{"train_loss": 0.0019820232409983873, "global_step": 46626, "epoch": 391, "lr": 2.7217604961514525e-05} +{"train_loss": 0.001151700271293521, "global_step": 46627, "epoch": 391, "lr": 2.7215632825624198e-05} +{"train_loss": 0.0008258860325440764, "global_step": 46628, "epoch": 391, "lr": 2.721366073446852e-05} +{"train_loss": 0.0012284438125789165, "global_step": 46629, "epoch": 391, "lr": 2.7211688688051385e-05} +{"train_loss": 0.0009129762183874846, "global_step": 46630, "epoch": 391, "lr": 2.7209716686376684e-05} +{"train_loss": 0.0018218090990558267, "global_step": 46631, "epoch": 391, "lr": 2.7207744729448258e-05} +{"train_loss": 0.001263142446987331, "global_step": 46632, "epoch": 391, "lr": 2.7205772817270005e-05} +{"train_loss": 0.0016792027745395899, "global_step": 46633, "epoch": 391, "lr": 2.7203800949845775e-05} +{"train_loss": 0.0006692985771223903, "global_step": 46634, "epoch": 391, "lr": 2.7201829127179436e-05} +{"train_loss": 0.0015370375476777554, "global_step": 46635, "epoch": 391, "lr": 2.7199857349274882e-05} +{"train_loss": 0.0006143914069980383, "global_step": 46636, "epoch": 391, "lr": 2.7197885616135955e-05} +{"train_loss": 0.0015021533472463489, "global_step": 46637, "epoch": 391, "lr": 2.719591392776657e-05} +{"train_loss": 0.0007780523155815899, "global_step": 46638, "epoch": 391, "lr": 2.7193942284170564e-05} +{"train_loss": 0.001162606873549521, "global_step": 46639, "epoch": 391, "lr": 2.7191970685351797e-05} +{"train_loss": 0.000929902889765799, "global_step": 46640, "epoch": 391, "lr": 2.7189999131314182e-05} +{"train_loss": 0.0014090993208810687, "global_step": 46641, "epoch": 391, "lr": 2.718802762206154e-05} +{"train_loss": 0.0016555656911805272, "global_step": 46642, "epoch": 391, "lr": 2.7186056157597795e-05} +{"train_loss": 0.0009668940911069512, "global_step": 46643, "epoch": 391, "lr": 2.7184084737926775e-05} +{"train_loss": 0.0016479713376611471, "global_step": 46644, "epoch": 391, "lr": 2.718211336305238e-05} +{"train_loss": 0.0011592627270147204, "global_step": 46645, "epoch": 391, "lr": 2.718014203297847e-05} +{"train_loss": 0.0014352974249050021, "global_step": 46646, "epoch": 391, "lr": 2.7178170747708893e-05} +{"train_loss": 0.0013225372418949083, "global_step": 46647, "epoch": 391, "lr": 2.7176199507247557e-05, "val_loss": 0.016071341931819916} +{"train_loss": 0.0011624221224337816, "global_step": 46648, "epoch": 392, "lr": 2.71742283115983e-05} +{"train_loss": 0.001465755165554583, "global_step": 46649, "epoch": 392, "lr": 2.7172257160765024e-05} +{"train_loss": 0.001130971359089017, "global_step": 46650, "epoch": 392, "lr": 2.717028605475156e-05} +{"train_loss": 0.001157707767561078, "global_step": 46651, "epoch": 392, "lr": 2.7168314993561828e-05} +{"train_loss": 0.0007196919177658856, "global_step": 46652, "epoch": 392, "lr": 2.716634397719966e-05} +{"train_loss": 0.0022602155804634094, "global_step": 46653, "epoch": 392, "lr": 2.7164373005668924e-05} +{"train_loss": 0.0008879800443537533, "global_step": 46654, "epoch": 392, "lr": 2.716240207897352e-05} +{"train_loss": 0.001384591800160706, "global_step": 46655, "epoch": 392, "lr": 2.7160431197117282e-05} +{"train_loss": 0.0008560116402804852, "global_step": 46656, "epoch": 392, "lr": 2.715846036010411e-05} +{"train_loss": 0.0015982930781319737, "global_step": 46657, "epoch": 392, "lr": 2.7156489567937847e-05} +{"train_loss": 0.0010042916983366013, "global_step": 46658, "epoch": 392, "lr": 2.7154518820622397e-05} +{"train_loss": 0.0011955187655985355, "global_step": 46659, "epoch": 392, "lr": 2.7152548118161587e-05} +{"train_loss": 0.0010864147916436195, "global_step": 46660, "epoch": 392, "lr": 2.7150577460559323e-05} +{"train_loss": 0.00195394572801888, "global_step": 46661, "epoch": 392, "lr": 2.7148606847819447e-05} +{"train_loss": 0.0008975986274890602, "global_step": 46662, "epoch": 392, "lr": 2.714663627994586e-05} +{"train_loss": 0.0017355151940137148, "global_step": 46663, "epoch": 392, "lr": 2.7144665756942383e-05} +{"train_loss": 0.0010035679442808032, "global_step": 46664, "epoch": 392, "lr": 2.7142695278812936e-05} +{"train_loss": 0.0006984648061916232, "global_step": 46665, "epoch": 392, "lr": 2.714072484556135e-05} +{"train_loss": 0.0015458691632375121, "global_step": 46666, "epoch": 392, "lr": 2.7138754457191525e-05} +{"train_loss": 0.0014290024992078543, "global_step": 46667, "epoch": 392, "lr": 2.7136784113707292e-05} +{"train_loss": 0.0007992413593456149, "global_step": 46668, "epoch": 392, "lr": 2.713481381511256e-05} +{"train_loss": 0.0009898412972688675, "global_step": 46669, "epoch": 392, "lr": 2.7132843561411164e-05} +{"train_loss": 0.0009736242354847491, "global_step": 46670, "epoch": 392, "lr": 2.7130873352607e-05} +{"train_loss": 0.0008141238940879703, "global_step": 46671, "epoch": 392, "lr": 2.7128903188703923e-05} +{"train_loss": 0.0010709423804655671, "global_step": 46672, "epoch": 392, "lr": 2.712693306970579e-05} +{"train_loss": 0.001756693352945149, "global_step": 46673, "epoch": 392, "lr": 2.7124962995616493e-05} +{"train_loss": 0.0017975984374061227, "global_step": 46674, "epoch": 392, "lr": 2.712299296643987e-05} +{"train_loss": 0.0012438241392374039, "global_step": 46675, "epoch": 392, "lr": 2.7121022982179822e-05} +{"train_loss": 0.0013140100054442883, "global_step": 46676, "epoch": 392, "lr": 2.7119053042840203e-05} +{"train_loss": 0.002075585536658764, "global_step": 46677, "epoch": 392, "lr": 2.7117083148424867e-05} +{"train_loss": 0.001614549313671887, "global_step": 46678, "epoch": 392, "lr": 2.7115113298937707e-05} +{"train_loss": 0.0016212278278544545, "global_step": 46679, "epoch": 392, "lr": 2.7113143494382554e-05} +{"train_loss": 0.0006733244517818093, "global_step": 46680, "epoch": 392, "lr": 2.711117373476332e-05} +{"train_loss": 0.0011233504628762603, "global_step": 46681, "epoch": 392, "lr": 2.7109204020083834e-05} +{"train_loss": 0.0011712632840499282, "global_step": 46682, "epoch": 392, "lr": 2.7107234350348e-05} +{"train_loss": 0.0007769965450279415, "global_step": 46683, "epoch": 392, "lr": 2.7105264725559665e-05} +{"train_loss": 0.0018779350211843848, "global_step": 46684, "epoch": 392, "lr": 2.7103295145722672e-05} +{"train_loss": 0.0014793508453294635, "global_step": 46685, "epoch": 392, "lr": 2.7101325610840943e-05} +{"train_loss": 0.0017955461516976357, "global_step": 46686, "epoch": 392, "lr": 2.7099356120918283e-05} +{"train_loss": 0.0015444796299561858, "global_step": 46687, "epoch": 392, "lr": 2.709738667595862e-05} +{"train_loss": 0.0008526922320015728, "global_step": 46688, "epoch": 392, "lr": 2.7095417275965768e-05} +{"train_loss": 0.0008835170301608741, "global_step": 46689, "epoch": 392, "lr": 2.709344792094364e-05} +{"train_loss": 0.0010847595985978842, "global_step": 46690, "epoch": 392, "lr": 2.7091478610896072e-05} +{"train_loss": 0.0016493265284225345, "global_step": 46691, "epoch": 392, "lr": 2.7089509345826923e-05} +{"train_loss": 0.002083301544189453, "global_step": 46692, "epoch": 392, "lr": 2.708754012574008e-05} +{"train_loss": 0.0014669910306110978, "global_step": 46693, "epoch": 392, "lr": 2.7085570950639417e-05} +{"train_loss": 0.0013742257142439485, "global_step": 46694, "epoch": 392, "lr": 2.708360182052877e-05} +{"train_loss": 0.000994181726127863, "global_step": 46695, "epoch": 392, "lr": 2.7081632735412042e-05} +{"train_loss": 0.0015120255993679166, "global_step": 46696, "epoch": 392, "lr": 2.7079663695293063e-05} +{"train_loss": 0.0013325994368642569, "global_step": 46697, "epoch": 392, "lr": 2.7077694700175727e-05} +{"train_loss": 0.0007668526377528906, "global_step": 46698, "epoch": 392, "lr": 2.7075725750063874e-05} +{"train_loss": 0.0007905059028416872, "global_step": 46699, "epoch": 392, "lr": 2.7073756844961407e-05} +{"train_loss": 0.001123428693972528, "global_step": 46700, "epoch": 392, "lr": 2.707178798487215e-05} +{"train_loss": 0.000613158568739891, "global_step": 46701, "epoch": 392, "lr": 2.7069819169800004e-05} +{"train_loss": 0.0021054591052234173, "global_step": 46702, "epoch": 392, "lr": 2.7067850399748816e-05} +{"train_loss": 0.0005358365597203374, "global_step": 46703, "epoch": 392, "lr": 2.7065881674722437e-05} +{"train_loss": 0.0018054104875773191, "global_step": 46704, "epoch": 392, "lr": 2.7063912994724773e-05} +{"train_loss": 0.0015949283260852098, "global_step": 46705, "epoch": 392, "lr": 2.706194435975964e-05} +{"train_loss": 0.002449375344440341, "global_step": 46706, "epoch": 392, "lr": 2.7059975769830946e-05} +{"train_loss": 0.001075143227353692, "global_step": 46707, "epoch": 392, "lr": 2.7058007224942545e-05} +{"train_loss": 0.001686889212578535, "global_step": 46708, "epoch": 392, "lr": 2.7056038725098276e-05} +{"train_loss": 0.0007981792441569269, "global_step": 46709, "epoch": 392, "lr": 2.705407027030204e-05} +{"train_loss": 0.0011017289943993092, "global_step": 46710, "epoch": 392, "lr": 2.7052101860557665e-05} +{"train_loss": 0.0014874936314299703, "global_step": 46711, "epoch": 392, "lr": 2.7050133495869056e-05} +{"train_loss": 0.0013182469410821795, "global_step": 46712, "epoch": 392, "lr": 2.7048165176240042e-05} +{"train_loss": 0.0019001722102984786, "global_step": 46713, "epoch": 392, "lr": 2.7046196901674525e-05} +{"train_loss": 0.0010180785320699215, "global_step": 46714, "epoch": 392, "lr": 2.7044228672176342e-05} +{"train_loss": 0.000555211678147316, "global_step": 46715, "epoch": 392, "lr": 2.7042260487749348e-05} +{"train_loss": 0.0009827062021940947, "global_step": 46716, "epoch": 392, "lr": 2.7040292348397446e-05} +{"train_loss": 0.00175512267742306, "global_step": 46717, "epoch": 392, "lr": 2.7038324254124447e-05} +{"train_loss": 0.0019108925480395555, "global_step": 46718, "epoch": 392, "lr": 2.7036356204934272e-05} +{"train_loss": 0.0017334894509986043, "global_step": 46719, "epoch": 392, "lr": 2.703438820083074e-05} +{"train_loss": 0.0011732366401702166, "global_step": 46720, "epoch": 392, "lr": 2.7032420241817746e-05} +{"train_loss": 0.0013164394767954946, "global_step": 46721, "epoch": 392, "lr": 2.7030452327899146e-05} +{"train_loss": 0.0011943186400458217, "global_step": 46722, "epoch": 392, "lr": 2.702848445907878e-05} +{"train_loss": 0.0014042335096746683, "global_step": 46723, "epoch": 392, "lr": 2.702651663536055e-05} +{"train_loss": 0.0014715137658640742, "global_step": 46724, "epoch": 392, "lr": 2.7024548856748276e-05} +{"train_loss": 0.0016532535664737225, "global_step": 46725, "epoch": 392, "lr": 2.702258112324587e-05} +{"train_loss": 0.0008043723646551371, "global_step": 46726, "epoch": 392, "lr": 2.702061343485715e-05} +{"train_loss": 0.0012860955903306603, "global_step": 46727, "epoch": 392, "lr": 2.7018645791586007e-05} +{"train_loss": 0.0011389516294002533, "global_step": 46728, "epoch": 392, "lr": 2.7016678193436306e-05} +{"train_loss": 0.0011561050778254867, "global_step": 46729, "epoch": 392, "lr": 2.701471064041189e-05} +{"train_loss": 0.0015925507759675384, "global_step": 46730, "epoch": 392, "lr": 2.701274313251665e-05} +{"train_loss": 0.0013423687778413296, "global_step": 46731, "epoch": 392, "lr": 2.7010775669754417e-05} +{"train_loss": 0.0006458871066570282, "global_step": 46732, "epoch": 392, "lr": 2.7008808252129087e-05} +{"train_loss": 0.0012680350337177515, "global_step": 46733, "epoch": 392, "lr": 2.70068408796445e-05} +{"train_loss": 0.0013540020445361733, "global_step": 46734, "epoch": 392, "lr": 2.7004873552304515e-05} +{"train_loss": 0.0009690864244475961, "global_step": 46735, "epoch": 392, "lr": 2.700290627011302e-05} +{"train_loss": 0.0008383735548704863, "global_step": 46736, "epoch": 392, "lr": 2.7000939033073842e-05} +{"train_loss": 0.0016734824748709798, "global_step": 46737, "epoch": 392, "lr": 2.6998971841190877e-05} +{"train_loss": 0.0012714150361716747, "global_step": 46738, "epoch": 392, "lr": 2.6997004694467965e-05} +{"train_loss": 0.0009109603124670684, "global_step": 46739, "epoch": 392, "lr": 2.6995037592908988e-05} +{"train_loss": 0.0008687312947586179, "global_step": 46740, "epoch": 392, "lr": 2.6993070536517806e-05} +{"train_loss": 0.0013356679119169712, "global_step": 46741, "epoch": 392, "lr": 2.6991103525298244e-05} +{"train_loss": 0.0014968299074098468, "global_step": 46742, "epoch": 392, "lr": 2.6989136559254212e-05} +{"train_loss": 0.0011152984807267785, "global_step": 46743, "epoch": 392, "lr": 2.6987169638389532e-05} +{"train_loss": 0.0013012909330427647, "global_step": 46744, "epoch": 392, "lr": 2.6985202762708113e-05} +{"train_loss": 0.0009990923572331667, "global_step": 46745, "epoch": 392, "lr": 2.698323593221378e-05} +{"train_loss": 0.000772819563280791, "global_step": 46746, "epoch": 392, "lr": 2.6981269146910394e-05} +{"train_loss": 0.0012463823659345508, "global_step": 46747, "epoch": 392, "lr": 2.6979302406801844e-05} +{"train_loss": 0.0015485396143049002, "global_step": 46748, "epoch": 392, "lr": 2.697733571189195e-05} +{"train_loss": 0.0020244454499334097, "global_step": 46749, "epoch": 392, "lr": 2.697536906218462e-05} +{"train_loss": 0.0010168071603402495, "global_step": 46750, "epoch": 392, "lr": 2.6973402457683672e-05} +{"train_loss": 0.001025970559567213, "global_step": 46751, "epoch": 392, "lr": 2.6971435898393007e-05} +{"train_loss": 0.000706588092725724, "global_step": 46752, "epoch": 392, "lr": 2.696946938431647e-05} +{"train_loss": 0.0012583924690261483, "global_step": 46753, "epoch": 392, "lr": 2.69675029154579e-05} +{"train_loss": 0.0008193796966224909, "global_step": 46754, "epoch": 392, "lr": 2.6965536491821197e-05} +{"train_loss": 0.0011652745306491852, "global_step": 46755, "epoch": 392, "lr": 2.6963570113410175e-05} +{"train_loss": 0.0015339170349761844, "global_step": 46756, "epoch": 392, "lr": 2.696160378022875e-05} +{"train_loss": 0.0023644864559173584, "global_step": 46757, "epoch": 392, "lr": 2.6959637492280732e-05} +{"train_loss": 0.0004965715343132615, "global_step": 46758, "epoch": 392, "lr": 2.6957671249570027e-05} +{"train_loss": 0.0014360479544848204, "global_step": 46759, "epoch": 392, "lr": 2.6955705052100455e-05} +{"train_loss": 0.0012773287016898394, "global_step": 46760, "epoch": 392, "lr": 2.6953738899875907e-05} +{"train_loss": 0.0012914566323161125, "global_step": 46761, "epoch": 392, "lr": 2.6951772792900215e-05} +{"train_loss": 0.001406033174134791, "global_step": 46762, "epoch": 392, "lr": 2.694980673117725e-05} +{"train_loss": 0.0013110575964674354, "global_step": 46763, "epoch": 392, "lr": 2.6947840714710903e-05} +{"train_loss": 0.0008778289193287492, "global_step": 46764, "epoch": 392, "lr": 2.6945874743505007e-05} +{"train_loss": 0.0014803048688918352, "global_step": 46765, "epoch": 392, "lr": 2.69439088175634e-05} +{"train_loss": 0.0012783622031663584, "global_step": 46766, "epoch": 392, "lr": 2.6941942936889985e-05, "val_loss": 0.021694883704185486} +{"train_loss": 0.0010398918529972434, "global_step": 46767, "epoch": 393, "lr": 2.693997710148859e-05} +{"train_loss": 0.0014051215257495642, "global_step": 46768, "epoch": 393, "lr": 2.69380113113631e-05} +{"train_loss": 0.0017882655374705791, "global_step": 46769, "epoch": 393, "lr": 2.693604556651733e-05} +{"train_loss": 0.0011057943338528275, "global_step": 46770, "epoch": 393, "lr": 2.693407986695521e-05} +{"train_loss": 0.0009720218367874622, "global_step": 46771, "epoch": 393, "lr": 2.6932114212680548e-05} +{"train_loss": 0.0017613726668059826, "global_step": 46772, "epoch": 393, "lr": 2.6930148603697196e-05} +{"train_loss": 0.0008807323174551129, "global_step": 46773, "epoch": 393, "lr": 2.692818304000906e-05} +{"train_loss": 0.0014072732301428914, "global_step": 46774, "epoch": 393, "lr": 2.6926217521619944e-05} +{"train_loss": 0.0006527452496811748, "global_step": 46775, "epoch": 393, "lr": 2.6924252048533756e-05} +{"train_loss": 0.0004338718135841191, "global_step": 46776, "epoch": 393, "lr": 2.6922286620754333e-05} +{"train_loss": 0.0013733819359913468, "global_step": 46777, "epoch": 393, "lr": 2.6920321238285518e-05} +{"train_loss": 0.0018346356227993965, "global_step": 46778, "epoch": 393, "lr": 2.691835590113121e-05} +{"train_loss": 0.0008410230511799455, "global_step": 46779, "epoch": 393, "lr": 2.6916390609295215e-05} +{"train_loss": 0.0008614641265012324, "global_step": 46780, "epoch": 393, "lr": 2.691442536278145e-05} +{"train_loss": 0.0008509281324222684, "global_step": 46781, "epoch": 393, "lr": 2.6912460161593718e-05} +{"train_loss": 0.0013163031544536352, "global_step": 46782, "epoch": 393, "lr": 2.6910495005735926e-05} +{"train_loss": 0.0004790517268702388, "global_step": 46783, "epoch": 393, "lr": 2.6908529895211908e-05} +{"train_loss": 0.0009945498313754797, "global_step": 46784, "epoch": 393, "lr": 2.6906564830025504e-05} +{"train_loss": 0.0009676865884102881, "global_step": 46785, "epoch": 393, "lr": 2.690459981018062e-05} +{"train_loss": 0.0016978397034108639, "global_step": 46786, "epoch": 393, "lr": 2.690263483568106e-05} +{"train_loss": 0.001435319078154862, "global_step": 46787, "epoch": 393, "lr": 2.6900669906530734e-05} +{"train_loss": 0.0006181984208524227, "global_step": 46788, "epoch": 393, "lr": 2.689870502273345e-05} +{"train_loss": 0.001265080412849784, "global_step": 46789, "epoch": 393, "lr": 2.689674018429311e-05} +{"train_loss": 0.0009079320589080453, "global_step": 46790, "epoch": 393, "lr": 2.6894775391213538e-05} +{"train_loss": 0.0010020865593105555, "global_step": 46791, "epoch": 393, "lr": 2.6892810643498623e-05} +{"train_loss": 0.000692998815793544, "global_step": 46792, "epoch": 393, "lr": 2.689084594115219e-05} +{"train_loss": 0.0009415626409463584, "global_step": 46793, "epoch": 393, "lr": 2.6888881284178125e-05} +{"train_loss": 0.0009701855015009642, "global_step": 46794, "epoch": 393, "lr": 2.688691667258026e-05} +{"train_loss": 0.0007416016305796802, "global_step": 46795, "epoch": 393, "lr": 2.6884952106362482e-05} +{"train_loss": 0.0005846992135047913, "global_step": 46796, "epoch": 393, "lr": 2.688298758552861e-05} +{"train_loss": 0.0007417045999318361, "global_step": 46797, "epoch": 393, "lr": 2.6881023110082538e-05} +{"train_loss": 0.0006141301128081977, "global_step": 46798, "epoch": 393, "lr": 2.687905868002809e-05} +{"train_loss": 0.0012363584246486425, "global_step": 46799, "epoch": 393, "lr": 2.6877094295369165e-05} +{"train_loss": 0.0007649962208233774, "global_step": 46800, "epoch": 393, "lr": 2.687512995610957e-05} +{"train_loss": 0.00215217936784029, "global_step": 46801, "epoch": 393, "lr": 2.6873165662253208e-05} +{"train_loss": 0.0009951300453394651, "global_step": 46802, "epoch": 393, "lr": 2.6871201413803913e-05} +{"train_loss": 0.0009972923435270786, "global_step": 46803, "epoch": 393, "lr": 2.686923721076553e-05} +{"train_loss": 0.0013378240400925279, "global_step": 46804, "epoch": 393, "lr": 2.6867273053141938e-05} +{"train_loss": 0.0015969143714755774, "global_step": 46805, "epoch": 393, "lr": 2.686530894093697e-05} +{"train_loss": 0.0009949048981070518, "global_step": 46806, "epoch": 393, "lr": 2.6863344874154516e-05} +{"train_loss": 0.0005536543903872371, "global_step": 46807, "epoch": 393, "lr": 2.686138085279839e-05} +{"train_loss": 0.001555100199766457, "global_step": 46808, "epoch": 393, "lr": 2.6859416876872494e-05} +{"train_loss": 0.0013282232685014606, "global_step": 46809, "epoch": 393, "lr": 2.6857452946380663e-05} +{"train_loss": 0.0007218638202175498, "global_step": 46810, "epoch": 393, "lr": 2.685548906132672e-05} +{"train_loss": 0.0007144420524127781, "global_step": 46811, "epoch": 393, "lr": 2.6853525221714582e-05} +{"train_loss": 0.0015223186928778887, "global_step": 46812, "epoch": 393, "lr": 2.6851561427548055e-05} +{"train_loss": 0.0007768023642711341, "global_step": 46813, "epoch": 393, "lr": 2.6849597678831028e-05} +{"train_loss": 0.0017303850036114454, "global_step": 46814, "epoch": 393, "lr": 2.6847633975567345e-05} +{"train_loss": 0.0010508885607123375, "global_step": 46815, "epoch": 393, "lr": 2.684567031776084e-05} +{"train_loss": 0.0015070372028276324, "global_step": 46816, "epoch": 393, "lr": 2.6843706705415406e-05} +{"train_loss": 0.0006872428930364549, "global_step": 46817, "epoch": 393, "lr": 2.6841743138534863e-05} +{"train_loss": 0.0009570826659910381, "global_step": 46818, "epoch": 393, "lr": 2.6839779617123102e-05} +{"train_loss": 0.0012822296703234315, "global_step": 46819, "epoch": 393, "lr": 2.6837816141183936e-05} +{"train_loss": 0.0017125329468399286, "global_step": 46820, "epoch": 393, "lr": 2.6835852710721267e-05} +{"train_loss": 0.0012191056739538908, "global_step": 46821, "epoch": 393, "lr": 2.6833889325738924e-05} +{"train_loss": 0.0006925574271008372, "global_step": 46822, "epoch": 393, "lr": 2.6831925986240747e-05} +{"train_loss": 0.0009413470979779959, "global_step": 46823, "epoch": 393, "lr": 2.6829962692230627e-05} +{"train_loss": 0.00055061059538275, "global_step": 46824, "epoch": 393, "lr": 2.682799944371238e-05} +{"train_loss": 0.0012046487536281347, "global_step": 46825, "epoch": 393, "lr": 2.6826036240689883e-05} +{"train_loss": 0.0009496191632933915, "global_step": 46826, "epoch": 393, "lr": 2.6824073083167006e-05} +{"train_loss": 0.000912882445845753, "global_step": 46827, "epoch": 393, "lr": 2.682210997114757e-05} +{"train_loss": 0.0007993402541615069, "global_step": 46828, "epoch": 393, "lr": 2.6820146904635457e-05} +{"train_loss": 0.0008717437740415335, "global_step": 46829, "epoch": 393, "lr": 2.681818388363449e-05} +{"train_loss": 0.0005549995694309473, "global_step": 46830, "epoch": 393, "lr": 2.6816220908148564e-05} +{"train_loss": 0.001533573609776795, "global_step": 46831, "epoch": 393, "lr": 2.681425797818149e-05} +{"train_loss": 0.0007083627278916538, "global_step": 46832, "epoch": 393, "lr": 2.6812295093737173e-05} +{"train_loss": 0.001111808349378407, "global_step": 46833, "epoch": 393, "lr": 2.6810332254819427e-05} +{"train_loss": 0.0014644534094259143, "global_step": 46834, "epoch": 393, "lr": 2.68083694614321e-05} +{"train_loss": 0.0012997171143069863, "global_step": 46835, "epoch": 393, "lr": 2.680640671357908e-05} +{"train_loss": 0.0006986440275795758, "global_step": 46836, "epoch": 393, "lr": 2.6804444011264184e-05} +{"train_loss": 0.0018333822954446077, "global_step": 46837, "epoch": 393, "lr": 2.6802481354491306e-05} +{"train_loss": 0.0013672009808942676, "global_step": 46838, "epoch": 393, "lr": 2.6800518743264247e-05} +{"train_loss": 0.001443622400984168, "global_step": 46839, "epoch": 393, "lr": 2.679855617758692e-05} +{"train_loss": 0.0011424595722928643, "global_step": 46840, "epoch": 393, "lr": 2.6796593657463153e-05} +{"train_loss": 0.0009207711555063725, "global_step": 46841, "epoch": 393, "lr": 2.679463118289677e-05} +{"train_loss": 0.0008492097840644419, "global_step": 46842, "epoch": 393, "lr": 2.679266875389167e-05} +{"train_loss": 0.0017735506407916546, "global_step": 46843, "epoch": 393, "lr": 2.679070637045167e-05} +{"train_loss": 0.000916203367523849, "global_step": 46844, "epoch": 393, "lr": 2.6788744032580648e-05} +{"train_loss": 0.0010580437956377864, "global_step": 46845, "epoch": 393, "lr": 2.6786781740282453e-05} +{"train_loss": 0.0009678017231635749, "global_step": 46846, "epoch": 393, "lr": 2.6784819493560915e-05} +{"train_loss": 0.0006891285302117467, "global_step": 46847, "epoch": 393, "lr": 2.678285729241992e-05} +{"train_loss": 0.0011277933372184634, "global_step": 46848, "epoch": 393, "lr": 2.6780895136863288e-05} +{"train_loss": 0.0016441417392343283, "global_step": 46849, "epoch": 393, "lr": 2.6778933026894904e-05} +{"train_loss": 0.00039812090108171105, "global_step": 46850, "epoch": 393, "lr": 2.6776970962518587e-05} +{"train_loss": 0.0010707753244787455, "global_step": 46851, "epoch": 393, "lr": 2.6775008943738223e-05} +{"train_loss": 0.00038492915336973965, "global_step": 46852, "epoch": 393, "lr": 2.6773046970557648e-05} +{"train_loss": 0.0018455820390954614, "global_step": 46853, "epoch": 393, "lr": 2.67710850429807e-05} +{"train_loss": 0.0014379690401256084, "global_step": 46854, "epoch": 393, "lr": 2.6769123161011257e-05} +{"train_loss": 0.0007310806540772319, "global_step": 46855, "epoch": 393, "lr": 2.6767161324653146e-05} +{"train_loss": 0.0008897521183826029, "global_step": 46856, "epoch": 393, "lr": 2.6765199533910247e-05} +{"train_loss": 0.0017323218053206801, "global_step": 46857, "epoch": 393, "lr": 2.6763237788786377e-05} +{"train_loss": 0.0010610469616949558, "global_step": 46858, "epoch": 393, "lr": 2.6761276089285426e-05} +{"train_loss": 0.0016638332745060325, "global_step": 46859, "epoch": 393, "lr": 2.675931443541121e-05} +{"train_loss": 0.0011051963083446026, "global_step": 46860, "epoch": 393, "lr": 2.6757352827167596e-05} +{"train_loss": 0.0020189916249364614, "global_step": 46861, "epoch": 393, "lr": 2.675539126455846e-05} +{"train_loss": 0.002074682619422674, "global_step": 46862, "epoch": 393, "lr": 2.6753429747587606e-05} +{"train_loss": 0.0013924246886745095, "global_step": 46863, "epoch": 393, "lr": 2.6751468276258927e-05} +{"train_loss": 0.0007480377680622041, "global_step": 46864, "epoch": 393, "lr": 2.6749506850576257e-05} +{"train_loss": 0.0006683752289973199, "global_step": 46865, "epoch": 393, "lr": 2.6747545470543435e-05} +{"train_loss": 0.0015155154978856444, "global_step": 46866, "epoch": 393, "lr": 2.674558413616433e-05} +{"train_loss": 0.0008552801446057856, "global_step": 46867, "epoch": 393, "lr": 2.674362284744277e-05} +{"train_loss": 0.0010957787744700909, "global_step": 46868, "epoch": 393, "lr": 2.674166160438265e-05} +{"train_loss": 0.0008782354416325688, "global_step": 46869, "epoch": 393, "lr": 2.6739700406987765e-05} +{"train_loss": 0.0011698103044182062, "global_step": 46870, "epoch": 393, "lr": 2.6737739255262018e-05} +{"train_loss": 0.002157842507585883, "global_step": 46871, "epoch": 393, "lr": 2.6735778149209233e-05} +{"train_loss": 0.0006178845069371164, "global_step": 46872, "epoch": 393, "lr": 2.6733817088833236e-05} +{"train_loss": 0.0014489018358290195, "global_step": 46873, "epoch": 393, "lr": 2.6731856074137928e-05} +{"train_loss": 0.0007043768418952823, "global_step": 46874, "epoch": 393, "lr": 2.6729895105127122e-05} +{"train_loss": 0.001036363304592669, "global_step": 46875, "epoch": 393, "lr": 2.6727934181804694e-05} +{"train_loss": 0.0006336534861475229, "global_step": 46876, "epoch": 393, "lr": 2.672597330417448e-05} +{"train_loss": 0.0012342262780293822, "global_step": 46877, "epoch": 393, "lr": 2.6724012472240312e-05} +{"train_loss": 0.0006796049419790506, "global_step": 46878, "epoch": 393, "lr": 2.6722051686006077e-05} +{"train_loss": 0.001056341570802033, "global_step": 46879, "epoch": 393, "lr": 2.672009094547559e-05} +{"train_loss": 0.0009670160943642259, "global_step": 46880, "epoch": 393, "lr": 2.671813025065274e-05} +{"train_loss": 0.001836986979469657, "global_step": 46881, "epoch": 393, "lr": 2.671616960154133e-05} +{"train_loss": 0.001210009679198265, "global_step": 46882, "epoch": 393, "lr": 2.6714208998145252e-05} +{"train_loss": 0.0012286596465855837, "global_step": 46883, "epoch": 393, "lr": 2.6712248440468333e-05} +{"train_loss": 0.0013612067559733987, "global_step": 46884, "epoch": 393, "lr": 2.6710287928514415e-05} +{"train_loss": 0.001113000009629578, "global_step": 46885, "epoch": 393, "lr": 2.6708327462287374e-05, "val_loss": 0.01185697689652443} +{"train_loss": 0.0012446003966033459, "global_step": 46886, "epoch": 394, "lr": 2.6706367041791025e-05} +{"train_loss": 0.0013307721819728613, "global_step": 46887, "epoch": 394, "lr": 2.670440666702926e-05} +{"train_loss": 0.0007007710519246757, "global_step": 46888, "epoch": 394, "lr": 2.670244633800588e-05} +{"train_loss": 0.0011730295373126864, "global_step": 46889, "epoch": 394, "lr": 2.6700486054724777e-05} +{"train_loss": 0.0008101413259282708, "global_step": 46890, "epoch": 394, "lr": 2.6698525817189758e-05} +{"train_loss": 0.0010203944984823465, "global_step": 46891, "epoch": 394, "lr": 2.669656562540472e-05} +{"train_loss": 0.0014803532976657152, "global_step": 46892, "epoch": 394, "lr": 2.669460547937346e-05} +{"train_loss": 0.0016221572877839208, "global_step": 46893, "epoch": 394, "lr": 2.6692645379099877e-05} +{"train_loss": 0.0007246798486448824, "global_step": 46894, "epoch": 394, "lr": 2.6690685324587773e-05} +{"train_loss": 0.00108504225499928, "global_step": 46895, "epoch": 394, "lr": 2.6688725315841035e-05} +{"train_loss": 0.0009368450846523046, "global_step": 46896, "epoch": 394, "lr": 2.668676535286348e-05} +{"train_loss": 0.0014743661740794778, "global_step": 46897, "epoch": 394, "lr": 2.668480543565899e-05} +{"train_loss": 0.0005979180568829179, "global_step": 46898, "epoch": 394, "lr": 2.6682845564231368e-05} +{"train_loss": 0.0013559613144025207, "global_step": 46899, "epoch": 394, "lr": 2.668088573858451e-05} +{"train_loss": 0.0011433627223595977, "global_step": 46900, "epoch": 394, "lr": 2.6678925958722222e-05} +{"train_loss": 0.001543280086480081, "global_step": 46901, "epoch": 394, "lr": 2.6676966224648394e-05} +{"train_loss": 0.0008457062649540603, "global_step": 46902, "epoch": 394, "lr": 2.6675006536366854e-05} +{"train_loss": 0.0009214857127517462, "global_step": 46903, "epoch": 394, "lr": 2.6673046893881414e-05} +{"train_loss": 0.0011734366416931152, "global_step": 46904, "epoch": 394, "lr": 2.6671087297195984e-05} +{"train_loss": 0.0013774533290416002, "global_step": 46905, "epoch": 394, "lr": 2.666912774631436e-05} +{"train_loss": 0.000876205216627568, "global_step": 46906, "epoch": 394, "lr": 2.6667168241240435e-05} +{"train_loss": 0.001097878091968596, "global_step": 46907, "epoch": 394, "lr": 2.6665208781978007e-05} +{"train_loss": 0.0008375314064323902, "global_step": 46908, "epoch": 394, "lr": 2.6663249368530974e-05} +{"train_loss": 0.0008540167473256588, "global_step": 46909, "epoch": 394, "lr": 2.6661290000903148e-05} +{"train_loss": 0.0016243498539552093, "global_step": 46910, "epoch": 394, "lr": 2.6659330679098372e-05} +{"train_loss": 0.0007017204770818353, "global_step": 46911, "epoch": 394, "lr": 2.665737140312053e-05} +{"train_loss": 0.0009643008233979344, "global_step": 46912, "epoch": 394, "lr": 2.665541217297342e-05} +{"train_loss": 0.0015323824482038617, "global_step": 46913, "epoch": 394, "lr": 2.6653452988660932e-05} +{"train_loss": 0.0006039226427674294, "global_step": 46914, "epoch": 394, "lr": 2.6651493850186903e-05} +{"train_loss": 0.0007573342300020158, "global_step": 46915, "epoch": 394, "lr": 2.664953475755515e-05} +{"train_loss": 0.0007466470706276596, "global_step": 46916, "epoch": 394, "lr": 2.6647575710769558e-05} +{"train_loss": 0.0007756907725706697, "global_step": 46917, "epoch": 394, "lr": 2.664561670983393e-05} +{"train_loss": 0.0009372841450385749, "global_step": 46918, "epoch": 394, "lr": 2.6643657754752173e-05} +{"train_loss": 0.0006263842224143445, "global_step": 46919, "epoch": 394, "lr": 2.664169884552806e-05} +{"train_loss": 0.000614015618339181, "global_step": 46920, "epoch": 394, "lr": 2.6639739982165512e-05} +{"train_loss": 0.000996243441477418, "global_step": 46921, "epoch": 394, "lr": 2.663778116466833e-05} +{"train_loss": 0.0007256536628119648, "global_step": 46922, "epoch": 394, "lr": 2.6635822393040354e-05} +{"train_loss": 0.0009412596700713038, "global_step": 46923, "epoch": 394, "lr": 2.6633863667285442e-05} +{"train_loss": 0.001564991776831448, "global_step": 46924, "epoch": 394, "lr": 2.6631904987407465e-05} +{"train_loss": 0.00177941529545933, "global_step": 46925, "epoch": 394, "lr": 2.6629946353410223e-05} +{"train_loss": 0.0006810618797317147, "global_step": 46926, "epoch": 394, "lr": 2.6627987765297606e-05} +{"train_loss": 0.0009494603145867586, "global_step": 46927, "epoch": 394, "lr": 2.6626029223073416e-05} +{"train_loss": 0.000924907042644918, "global_step": 46928, "epoch": 394, "lr": 2.6624070726741546e-05} +{"train_loss": 0.0005203175242058933, "global_step": 46929, "epoch": 394, "lr": 2.662211227630579e-05} +{"train_loss": 0.0017020829254761338, "global_step": 46930, "epoch": 394, "lr": 2.6620153871770044e-05} +{"train_loss": 0.0007991577149368823, "global_step": 46931, "epoch": 394, "lr": 2.66181955131381e-05} +{"train_loss": 0.0009800931438803673, "global_step": 46932, "epoch": 394, "lr": 2.6616237200413862e-05} +{"train_loss": 0.0017277778824791312, "global_step": 46933, "epoch": 394, "lr": 2.6614278933601134e-05} +{"train_loss": 0.0008562167640775442, "global_step": 46934, "epoch": 394, "lr": 2.6612320712703758e-05} +{"train_loss": 0.0011616580886766315, "global_step": 46935, "epoch": 394, "lr": 2.6610362537725607e-05} +{"train_loss": 0.0008842853712849319, "global_step": 46936, "epoch": 394, "lr": 2.6608404408670495e-05} +{"train_loss": 0.001494478085078299, "global_step": 46937, "epoch": 394, "lr": 2.66064463255423e-05} +{"train_loss": 0.0006874798564240336, "global_step": 46938, "epoch": 394, "lr": 2.6604488288344824e-05} +{"train_loss": 0.0011734433937817812, "global_step": 46939, "epoch": 394, "lr": 2.6602530297081963e-05} +{"train_loss": 0.002558824373409152, "global_step": 46940, "epoch": 394, "lr": 2.660057235175753e-05} +{"train_loss": 0.001143197761848569, "global_step": 46941, "epoch": 394, "lr": 2.6598614452375352e-05} +{"train_loss": 0.0008149346685968339, "global_step": 46942, "epoch": 394, "lr": 2.6596656598939316e-05} +{"train_loss": 0.0011095269583165646, "global_step": 46943, "epoch": 394, "lr": 2.6594698791453226e-05} +{"train_loss": 0.0022533710580319166, "global_step": 46944, "epoch": 394, "lr": 2.6592741029920964e-05} +{"train_loss": 0.000793601619079709, "global_step": 46945, "epoch": 394, "lr": 2.6590783314346358e-05} +{"train_loss": 0.0011948299361392856, "global_step": 46946, "epoch": 394, "lr": 2.6588825644733216e-05} +{"train_loss": 0.001260361517779529, "global_step": 46947, "epoch": 394, "lr": 2.6586868021085442e-05} +{"train_loss": 0.0010739592835307121, "global_step": 46948, "epoch": 394, "lr": 2.658491044340683e-05} +{"train_loss": 0.0015726308338344097, "global_step": 46949, "epoch": 394, "lr": 2.6582952911701265e-05} +{"train_loss": 0.001044680830091238, "global_step": 46950, "epoch": 394, "lr": 2.6580995425972556e-05} +{"train_loss": 0.0011362566146999598, "global_step": 46951, "epoch": 394, "lr": 2.6579037986224576e-05} +{"train_loss": 0.0008915705839172006, "global_step": 46952, "epoch": 394, "lr": 2.6577080592461144e-05} +{"train_loss": 0.0015517548890784383, "global_step": 46953, "epoch": 394, "lr": 2.6575123244686106e-05} +{"train_loss": 0.0005690354737453163, "global_step": 46954, "epoch": 394, "lr": 2.657316594290332e-05} +{"train_loss": 0.0012984350323677063, "global_step": 46955, "epoch": 394, "lr": 2.6571208687116612e-05} +{"train_loss": 0.00226135877892375, "global_step": 46956, "epoch": 394, "lr": 2.656925147732984e-05} +{"train_loss": 0.0022988030686974525, "global_step": 46957, "epoch": 394, "lr": 2.6567294313546832e-05} +{"train_loss": 0.0009660848299972713, "global_step": 46958, "epoch": 394, "lr": 2.6565337195771424e-05} +{"train_loss": 0.00153815106023103, "global_step": 46959, "epoch": 394, "lr": 2.6563380124007503e-05} +{"train_loss": 0.0008216539863497019, "global_step": 46960, "epoch": 394, "lr": 2.656142309825886e-05} +{"train_loss": 0.0008686644141562283, "global_step": 46961, "epoch": 394, "lr": 2.6559466118529375e-05} +{"train_loss": 0.0005472059710882604, "global_step": 46962, "epoch": 394, "lr": 2.655750918482286e-05} +{"train_loss": 0.0021344551350921392, "global_step": 46963, "epoch": 394, "lr": 2.6555552297143182e-05} +{"train_loss": 0.0011601266451179981, "global_step": 46964, "epoch": 394, "lr": 2.655359545549418e-05} +{"train_loss": 0.0005372154409997165, "global_step": 46965, "epoch": 394, "lr": 2.655163865987966e-05} +{"train_loss": 0.0013615459902212024, "global_step": 46966, "epoch": 394, "lr": 2.6549681910303526e-05} +{"train_loss": 0.0008085203007794917, "global_step": 46967, "epoch": 394, "lr": 2.6547725206769557e-05} +{"train_loss": 0.00132356071844697, "global_step": 46968, "epoch": 394, "lr": 2.6545768549281647e-05} +{"train_loss": 0.0007150140008889139, "global_step": 46969, "epoch": 394, "lr": 2.654381193784359e-05} +{"train_loss": 0.0006966253858990967, "global_step": 46970, "epoch": 394, "lr": 2.654185537245928e-05} +{"train_loss": 0.001130604767240584, "global_step": 46971, "epoch": 394, "lr": 2.653989885313252e-05} +{"train_loss": 0.0009452425874769688, "global_step": 46972, "epoch": 394, "lr": 2.6537942379867152e-05} +{"train_loss": 0.0005312638240866363, "global_step": 46973, "epoch": 394, "lr": 2.6535985952667043e-05} +{"train_loss": 0.0006616130121983588, "global_step": 46974, "epoch": 394, "lr": 2.6534029571536003e-05} +{"train_loss": 0.0023806216195225716, "global_step": 46975, "epoch": 394, "lr": 2.6532073236477907e-05} +{"train_loss": 0.0007784842746332288, "global_step": 46976, "epoch": 394, "lr": 2.6530116947496553e-05} +{"train_loss": 0.001345828757621348, "global_step": 46977, "epoch": 394, "lr": 2.6528160704595834e-05} +{"train_loss": 0.0010158105287700891, "global_step": 46978, "epoch": 394, "lr": 2.6526204507779563e-05} +{"train_loss": 0.0011692920234054327, "global_step": 46979, "epoch": 394, "lr": 2.652424835705156e-05} +{"train_loss": 0.001113839796744287, "global_step": 46980, "epoch": 394, "lr": 2.6522292252415703e-05} +{"train_loss": 0.0005613424000330269, "global_step": 46981, "epoch": 394, "lr": 2.6520336193875805e-05} +{"train_loss": 0.0010156536009162664, "global_step": 46982, "epoch": 394, "lr": 2.651838018143573e-05} +{"train_loss": 0.0012944007758051157, "global_step": 46983, "epoch": 394, "lr": 2.6516424215099312e-05} +{"train_loss": 0.0018963939510285854, "global_step": 46984, "epoch": 394, "lr": 2.6514468294870364e-05} +{"train_loss": 0.0012380158295854926, "global_step": 46985, "epoch": 394, "lr": 2.6512512420752778e-05} +{"train_loss": 0.0008331853314302862, "global_step": 46986, "epoch": 394, "lr": 2.6510556592750336e-05} +{"train_loss": 0.0011318748584017158, "global_step": 46987, "epoch": 394, "lr": 2.6508600810866923e-05} +{"train_loss": 0.0008633707766421139, "global_step": 46988, "epoch": 394, "lr": 2.650664507510635e-05} +{"train_loss": 0.0014183998573571444, "global_step": 46989, "epoch": 394, "lr": 2.650468938547248e-05} +{"train_loss": 0.0017335254233330488, "global_step": 46990, "epoch": 394, "lr": 2.6502733741969132e-05} +{"train_loss": 0.0005146529874764383, "global_step": 46991, "epoch": 394, "lr": 2.6500778144600174e-05} +{"train_loss": 0.0004923531669192016, "global_step": 46992, "epoch": 394, "lr": 2.649882259336941e-05} +{"train_loss": 0.0014117996906861663, "global_step": 46993, "epoch": 394, "lr": 2.649686708828069e-05} +{"train_loss": 0.0015934635885059834, "global_step": 46994, "epoch": 394, "lr": 2.6494911629337883e-05} +{"train_loss": 0.000807910633739084, "global_step": 46995, "epoch": 394, "lr": 2.6492956216544784e-05} +{"train_loss": 0.001311123138293624, "global_step": 46996, "epoch": 394, "lr": 2.6491000849905278e-05} +{"train_loss": 0.0008833332685753703, "global_step": 46997, "epoch": 394, "lr": 2.6489045529423185e-05} +{"train_loss": 0.0010322821326553822, "global_step": 46998, "epoch": 394, "lr": 2.648709025510231e-05} +{"train_loss": 0.001758383703418076, "global_step": 46999, "epoch": 394, "lr": 2.6485135026946545e-05} +{"train_loss": 0.0015813957434147596, "global_step": 47000, "epoch": 394, "lr": 2.648317984495968e-05} +{"train_loss": 0.0026103456038981676, "global_step": 47001, "epoch": 394, "lr": 2.6481224709145615e-05} +{"train_loss": 0.0014309425605461001, "global_step": 47002, "epoch": 394, "lr": 2.6479269619508135e-05} +{"train_loss": 0.0006762210396118462, "global_step": 47003, "epoch": 394, "lr": 2.647731457605108e-05} +{"train_loss": 0.0011393565639556081, "global_step": 47004, "epoch": 394, "lr": 2.647535957877833e-05, "val_loss": 0.0396842360496521} +{"train_loss": 0.001131367520429194, "global_step": 47005, "epoch": 395, "lr": 2.6473404627693678e-05} +{"train_loss": 0.001768792630173266, "global_step": 47006, "epoch": 395, "lr": 2.6471449722801e-05} +{"train_loss": 0.001280739321373403, "global_step": 47007, "epoch": 395, "lr": 2.6469494864104095e-05} +{"train_loss": 0.0017159322742372751, "global_step": 47008, "epoch": 395, "lr": 2.6467540051606847e-05} +{"train_loss": 0.000868937757331878, "global_step": 47009, "epoch": 395, "lr": 2.6465585285313065e-05} +{"train_loss": 0.0010428887326270342, "global_step": 47010, "epoch": 395, "lr": 2.6463630565226584e-05} +{"train_loss": 0.0013449740363284945, "global_step": 47011, "epoch": 395, "lr": 2.6461675891351255e-05} +{"train_loss": 0.0020459662191569805, "global_step": 47012, "epoch": 395, "lr": 2.6459721263690895e-05} +{"train_loss": 0.0018418836407363415, "global_step": 47013, "epoch": 395, "lr": 2.6457766682249385e-05} +{"train_loss": 0.0013883005594834685, "global_step": 47014, "epoch": 395, "lr": 2.6455812147030528e-05} +{"train_loss": 0.002516884356737137, "global_step": 47015, "epoch": 395, "lr": 2.645385765803815e-05} +{"train_loss": 0.0010298355482518673, "global_step": 47016, "epoch": 395, "lr": 2.6451903215276125e-05} +{"train_loss": 0.002838935935869813, "global_step": 47017, "epoch": 395, "lr": 2.6449948818748254e-05} +{"train_loss": 0.0012044641189277172, "global_step": 47018, "epoch": 395, "lr": 2.6447994468458414e-05} +{"train_loss": 0.001291975611820817, "global_step": 47019, "epoch": 395, "lr": 2.6446040164410403e-05} +{"train_loss": 0.0015270878793671727, "global_step": 47020, "epoch": 395, "lr": 2.6444085906608083e-05} +{"train_loss": 0.0012911538360640407, "global_step": 47021, "epoch": 395, "lr": 2.6442131695055277e-05} +{"train_loss": 0.001567575614899397, "global_step": 47022, "epoch": 395, "lr": 2.644017752975585e-05} +{"train_loss": 0.001595569308847189, "global_step": 47023, "epoch": 395, "lr": 2.643822341071359e-05} +{"train_loss": 0.0011680808383971453, "global_step": 47024, "epoch": 395, "lr": 2.6436269337932385e-05} +{"train_loss": 0.0012415031669661403, "global_step": 47025, "epoch": 395, "lr": 2.6434315311416023e-05} +{"train_loss": 0.001877854228951037, "global_step": 47026, "epoch": 395, "lr": 2.6432361331168386e-05} +{"train_loss": 0.001051992061547935, "global_step": 47027, "epoch": 395, "lr": 2.6430407397193267e-05} +{"train_loss": 0.0015776860527694225, "global_step": 47028, "epoch": 395, "lr": 2.6428453509494554e-05} +{"train_loss": 0.0007404859061352909, "global_step": 47029, "epoch": 395, "lr": 2.6426499668076033e-05} +{"train_loss": 0.0007501017535105348, "global_step": 47030, "epoch": 395, "lr": 2.6424545872941575e-05} +{"train_loss": 0.001452495576813817, "global_step": 47031, "epoch": 395, "lr": 2.642259212409499e-05} +{"train_loss": 0.0012342326808720827, "global_step": 47032, "epoch": 395, "lr": 2.642063842154014e-05} +{"train_loss": 0.001927569624967873, "global_step": 47033, "epoch": 395, "lr": 2.6418684765280855e-05} +{"train_loss": 0.0013505916576832533, "global_step": 47034, "epoch": 395, "lr": 2.6416731155320935e-05} +{"train_loss": 0.0014050289755687118, "global_step": 47035, "epoch": 395, "lr": 2.6414777591664264e-05} +{"train_loss": 0.0015865814639255404, "global_step": 47036, "epoch": 395, "lr": 2.6412824074314647e-05} +{"train_loss": 0.0013355988776311278, "global_step": 47037, "epoch": 395, "lr": 2.641087060327594e-05} +{"train_loss": 0.0011048737214878201, "global_step": 47038, "epoch": 395, "lr": 2.640891717855195e-05} +{"train_loss": 0.0008491979097016156, "global_step": 47039, "epoch": 395, "lr": 2.6406963800146555e-05} +{"train_loss": 0.0007722949958406389, "global_step": 47040, "epoch": 395, "lr": 2.6405010468063562e-05} +{"train_loss": 0.0007958973874337971, "global_step": 47041, "epoch": 395, "lr": 2.640305718230679e-05} +{"train_loss": 0.002547777956351638, "global_step": 47042, "epoch": 395, "lr": 2.6401103942880118e-05} +{"train_loss": 0.001425521564669907, "global_step": 47043, "epoch": 395, "lr": 2.6399150749787337e-05} +{"train_loss": 0.0007995286141522229, "global_step": 47044, "epoch": 395, "lr": 2.639719760303232e-05} +{"train_loss": 0.0011735795997083187, "global_step": 47045, "epoch": 395, "lr": 2.6395244502618866e-05} +{"train_loss": 0.0010819938033819199, "global_step": 47046, "epoch": 395, "lr": 2.6393291448550843e-05} +{"train_loss": 0.0007120058289729059, "global_step": 47047, "epoch": 395, "lr": 2.639133844083207e-05} +{"train_loss": 0.0015251991571858525, "global_step": 47048, "epoch": 395, "lr": 2.6389385479466365e-05} +{"train_loss": 0.002006996190175414, "global_step": 47049, "epoch": 395, "lr": 2.6387432564457604e-05} +{"train_loss": 0.002172471722587943, "global_step": 47050, "epoch": 395, "lr": 2.6385479695809566e-05} +{"train_loss": 0.001494710217230022, "global_step": 47051, "epoch": 395, "lr": 2.6383526873526142e-05} +{"train_loss": 0.0022726028691977262, "global_step": 47052, "epoch": 395, "lr": 2.638157409761114e-05} +{"train_loss": 0.0009347631130367517, "global_step": 47053, "epoch": 395, "lr": 2.6379621368068374e-05} +{"train_loss": 0.0010130226146429777, "global_step": 47054, "epoch": 395, "lr": 2.6377668684901702e-05} +{"train_loss": 0.0007263675215654075, "global_step": 47055, "epoch": 395, "lr": 2.6375716048114967e-05} +{"train_loss": 0.0008410097798332572, "global_step": 47056, "epoch": 395, "lr": 2.6373763457711977e-05} +{"train_loss": 0.0012408376205712557, "global_step": 47057, "epoch": 395, "lr": 2.6371810913696593e-05} +{"train_loss": 0.0021831111516803503, "global_step": 47058, "epoch": 395, "lr": 2.6369858416072614e-05} +{"train_loss": 0.0013062318321317434, "global_step": 47059, "epoch": 395, "lr": 2.636790596484391e-05} +{"train_loss": 0.0008652390097267926, "global_step": 47060, "epoch": 395, "lr": 2.6365953560014277e-05} +{"train_loss": 0.001338184461928904, "global_step": 47061, "epoch": 395, "lr": 2.6364001201587597e-05} +{"train_loss": 0.001596302492544055, "global_step": 47062, "epoch": 395, "lr": 2.636204888956766e-05} +{"train_loss": 0.0012394110672175884, "global_step": 47063, "epoch": 395, "lr": 2.636009662395832e-05} +{"train_loss": 0.0014679358573630452, "global_step": 47064, "epoch": 395, "lr": 2.6358144404763413e-05} +{"train_loss": 0.0008134887320920825, "global_step": 47065, "epoch": 395, "lr": 2.6356192231986744e-05} +{"train_loss": 0.001162425964139402, "global_step": 47066, "epoch": 395, "lr": 2.6354240105632183e-05} +{"train_loss": 0.0007541306549683213, "global_step": 47067, "epoch": 395, "lr": 2.6352288025703532e-05} +{"train_loss": 0.0006318177911452949, "global_step": 47068, "epoch": 395, "lr": 2.6350335992204643e-05} +{"train_loss": 0.0011261086910963058, "global_step": 47069, "epoch": 395, "lr": 2.6348384005139338e-05} +{"train_loss": 0.000997787807136774, "global_step": 47070, "epoch": 395, "lr": 2.6346432064511462e-05} +{"train_loss": 0.0017019377555698156, "global_step": 47071, "epoch": 395, "lr": 2.6344480170324848e-05} +{"train_loss": 0.0010687721660360694, "global_step": 47072, "epoch": 395, "lr": 2.6342528322583293e-05} +{"train_loss": 0.0009601966594345868, "global_step": 47073, "epoch": 395, "lr": 2.6340576521290684e-05} +{"train_loss": 0.00195758743211627, "global_step": 47074, "epoch": 395, "lr": 2.6338624766450804e-05} +{"train_loss": 0.001271416898816824, "global_step": 47075, "epoch": 395, "lr": 2.6336673058067518e-05} +{"train_loss": 0.001023684861138463, "global_step": 47076, "epoch": 395, "lr": 2.6334721396144636e-05} +{"train_loss": 0.00236651417799294, "global_step": 47077, "epoch": 395, "lr": 2.6332769780686017e-05} +{"train_loss": 0.000932593597099185, "global_step": 47078, "epoch": 395, "lr": 2.6330818211695473e-05} +{"train_loss": 0.0011083504650741816, "global_step": 47079, "epoch": 395, "lr": 2.6328866689176823e-05} +{"train_loss": 0.0007422679918818176, "global_step": 47080, "epoch": 395, "lr": 2.6326915213133935e-05} +{"train_loss": 0.0013246494345366955, "global_step": 47081, "epoch": 395, "lr": 2.63249637835706e-05} +{"train_loss": 0.0012224126840010285, "global_step": 47082, "epoch": 395, "lr": 2.6323012400490687e-05} +{"train_loss": 0.0006423724698834121, "global_step": 47083, "epoch": 395, "lr": 2.6321061063898005e-05} +{"train_loss": 0.0015116229187697172, "global_step": 47084, "epoch": 395, "lr": 2.631910977379638e-05} +{"train_loss": 0.0012546376092359424, "global_step": 47085, "epoch": 395, "lr": 2.6317158530189666e-05} +{"train_loss": 0.0006338576204143465, "global_step": 47086, "epoch": 395, "lr": 2.631520733308166e-05} +{"train_loss": 0.0010386088397353888, "global_step": 47087, "epoch": 395, "lr": 2.6313256182476237e-05} +{"train_loss": 0.0006937014986760914, "global_step": 47088, "epoch": 395, "lr": 2.6311305078377185e-05} +{"train_loss": 0.0009957186412066221, "global_step": 47089, "epoch": 395, "lr": 2.6309354020788374e-05} +{"train_loss": 0.0012511506211012602, "global_step": 47090, "epoch": 395, "lr": 2.6307403009713594e-05} +{"train_loss": 0.0007491956930607557, "global_step": 47091, "epoch": 395, "lr": 2.6305452045156705e-05} +{"train_loss": 0.0007942990050651133, "global_step": 47092, "epoch": 395, "lr": 2.6303501127121545e-05} +{"train_loss": 0.0014433579053729773, "global_step": 47093, "epoch": 395, "lr": 2.6301550255611906e-05} +{"train_loss": 0.0007735329563729465, "global_step": 47094, "epoch": 395, "lr": 2.629959943063166e-05} +{"train_loss": 0.00040766908205114305, "global_step": 47095, "epoch": 395, "lr": 2.6297648652184604e-05} +{"train_loss": 0.0019476659363135695, "global_step": 47096, "epoch": 395, "lr": 2.6295697920274597e-05} +{"train_loss": 0.0020863176323473454, "global_step": 47097, "epoch": 395, "lr": 2.6293747234905452e-05} +{"train_loss": 0.0007424826617352664, "global_step": 47098, "epoch": 395, "lr": 2.6291796596080992e-05} +{"train_loss": 0.0011588344350457191, "global_step": 47099, "epoch": 395, "lr": 2.6289846003805075e-05} +{"train_loss": 0.0010617473162710667, "global_step": 47100, "epoch": 395, "lr": 2.6287895458081485e-05} +{"train_loss": 0.0017729897517710924, "global_step": 47101, "epoch": 395, "lr": 2.6285944958914106e-05} +{"train_loss": 0.001829962944611907, "global_step": 47102, "epoch": 395, "lr": 2.6283994506306736e-05} +{"train_loss": 0.0009876226540654898, "global_step": 47103, "epoch": 395, "lr": 2.6282044100263192e-05} +{"train_loss": 0.0005349960993044078, "global_step": 47104, "epoch": 395, "lr": 2.6280093740787338e-05} +{"train_loss": 0.0016585198463872075, "global_step": 47105, "epoch": 395, "lr": 2.627814342788297e-05} +{"train_loss": 0.001991000957787037, "global_step": 47106, "epoch": 395, "lr": 2.6276193161553945e-05} +{"train_loss": 0.0023366413079202175, "global_step": 47107, "epoch": 395, "lr": 2.6274242941804067e-05} +{"train_loss": 0.0010713402880355716, "global_step": 47108, "epoch": 395, "lr": 2.6272292768637196e-05} +{"train_loss": 0.0008864520350471139, "global_step": 47109, "epoch": 395, "lr": 2.6270342642057144e-05} +{"train_loss": 0.001201435225084424, "global_step": 47110, "epoch": 395, "lr": 2.6268392562067722e-05} +{"train_loss": 0.00143105024471879, "global_step": 47111, "epoch": 395, "lr": 2.6266442528672786e-05} +{"train_loss": 0.0013635189970955253, "global_step": 47112, "epoch": 395, "lr": 2.6264492541876145e-05} +{"train_loss": 0.0008754423470236361, "global_step": 47113, "epoch": 395, "lr": 2.626254260168165e-05} +{"train_loss": 0.0007388755911961198, "global_step": 47114, "epoch": 395, "lr": 2.62605927080931e-05} +{"train_loss": 0.0005445417482405901, "global_step": 47115, "epoch": 395, "lr": 2.6258642861114363e-05} +{"train_loss": 0.00164636573754251, "global_step": 47116, "epoch": 395, "lr": 2.6256693060749237e-05} +{"train_loss": 0.0014621432637795806, "global_step": 47117, "epoch": 395, "lr": 2.625474330700155e-05} +{"train_loss": 0.0012394211953505874, "global_step": 47118, "epoch": 395, "lr": 2.6252793599875148e-05} +{"train_loss": 0.0008309450349770486, "global_step": 47119, "epoch": 395, "lr": 2.6250843939373827e-05} +{"train_loss": 0.002085480373352766, "global_step": 47120, "epoch": 395, "lr": 2.6248894325501462e-05} +{"train_loss": 0.0009451870573684573, "global_step": 47121, "epoch": 395, "lr": 2.624694475826184e-05} +{"train_loss": 0.0006638693739660084, "global_step": 47122, "epoch": 395, "lr": 2.624499523765881e-05} +{"train_loss": 0.0012825431295831007, "global_step": 47123, "epoch": 395, "lr": 2.6243045763696183e-05, "val_loss": 0.023752715438604355, "train_action_mse_error": 1.6748921552789398e-05} +{"train_loss": 0.0011874487390741706, "global_step": 47124, "epoch": 396, "lr": 2.6241096336377818e-05} +{"train_loss": 0.0009167447569780052, "global_step": 47125, "epoch": 396, "lr": 2.62391469557075e-05} +{"train_loss": 0.001509655499830842, "global_step": 47126, "epoch": 396, "lr": 2.623719762168908e-05} +{"train_loss": 0.0018169181421399117, "global_step": 47127, "epoch": 396, "lr": 2.6235248334326402e-05} +{"train_loss": 0.0005040310206823051, "global_step": 47128, "epoch": 396, "lr": 2.6233299093623276e-05} +{"train_loss": 0.0006216242909431458, "global_step": 47129, "epoch": 396, "lr": 2.6231349899583513e-05} +{"train_loss": 0.0010143944527953863, "global_step": 47130, "epoch": 396, "lr": 2.6229400752210963e-05} +{"train_loss": 0.0011318903416395187, "global_step": 47131, "epoch": 396, "lr": 2.6227451651509437e-05} +{"train_loss": 0.0009143711067736149, "global_step": 47132, "epoch": 396, "lr": 2.6225502597482787e-05} +{"train_loss": 0.0012983347987756133, "global_step": 47133, "epoch": 396, "lr": 2.622355359013482e-05} +{"train_loss": 0.001044035772792995, "global_step": 47134, "epoch": 396, "lr": 2.6221604629469344e-05} +{"train_loss": 0.0008311585988849401, "global_step": 47135, "epoch": 396, "lr": 2.621965571549023e-05} +{"train_loss": 0.0004379594756755978, "global_step": 47136, "epoch": 396, "lr": 2.621770684820126e-05} +{"train_loss": 0.0010179246310144663, "global_step": 47137, "epoch": 396, "lr": 2.6215758027606307e-05} +{"train_loss": 0.001364843687042594, "global_step": 47138, "epoch": 396, "lr": 2.6213809253709144e-05} +{"train_loss": 0.0007102342788130045, "global_step": 47139, "epoch": 396, "lr": 2.621186052651365e-05} +{"train_loss": 0.0017527062445878983, "global_step": 47140, "epoch": 396, "lr": 2.6209911846023628e-05} +{"train_loss": 0.0008243684424087405, "global_step": 47141, "epoch": 396, "lr": 2.620796321224288e-05} +{"train_loss": 0.00117450300604105, "global_step": 47142, "epoch": 396, "lr": 2.6206014625175273e-05} +{"train_loss": 0.0008250985993072391, "global_step": 47143, "epoch": 396, "lr": 2.6204066084824596e-05} +{"train_loss": 0.0013542140368372202, "global_step": 47144, "epoch": 396, "lr": 2.6202117591194707e-05} +{"train_loss": 0.0010070782154798508, "global_step": 47145, "epoch": 396, "lr": 2.6200169144289412e-05} +{"train_loss": 0.002648745197802782, "global_step": 47146, "epoch": 396, "lr": 2.619822074411255e-05} +{"train_loss": 0.0006291637546382844, "global_step": 47147, "epoch": 396, "lr": 2.619627239066794e-05} +{"train_loss": 0.0008308525430038571, "global_step": 47148, "epoch": 396, "lr": 2.6194324083959393e-05} +{"train_loss": 0.0017172542866319418, "global_step": 47149, "epoch": 396, "lr": 2.6192375823990763e-05} +{"train_loss": 0.001032196800224483, "global_step": 47150, "epoch": 396, "lr": 2.619042761076584e-05} +{"train_loss": 0.0013433523708954453, "global_step": 47151, "epoch": 396, "lr": 2.6188479444288484e-05} +{"train_loss": 0.001980602741241455, "global_step": 47152, "epoch": 396, "lr": 2.6186531324562492e-05} +{"train_loss": 0.0010961467633023858, "global_step": 47153, "epoch": 396, "lr": 2.618458325159172e-05} +{"train_loss": 0.001505353138782084, "global_step": 47154, "epoch": 396, "lr": 2.6182635225379954e-05} +{"train_loss": 0.0007890098495408893, "global_step": 47155, "epoch": 396, "lr": 2.6180687245931055e-05} +{"train_loss": 0.0023334743455052376, "global_step": 47156, "epoch": 396, "lr": 2.6178739313248817e-05} +{"train_loss": 0.0015366773586720228, "global_step": 47157, "epoch": 396, "lr": 2.61767914273371e-05} +{"train_loss": 0.0010867052478715777, "global_step": 47158, "epoch": 396, "lr": 2.6174843588199682e-05} +{"train_loss": 0.0009402403375133872, "global_step": 47159, "epoch": 396, "lr": 2.6172895795840435e-05} +{"train_loss": 0.0010140037629753351, "global_step": 47160, "epoch": 396, "lr": 2.6170948050263144e-05} +{"train_loss": 0.0005756858736276627, "global_step": 47161, "epoch": 396, "lr": 2.6169000351471673e-05} +{"train_loss": 0.0015296993078663945, "global_step": 47162, "epoch": 396, "lr": 2.61670526994698e-05} +{"train_loss": 0.0013610734604299068, "global_step": 47163, "epoch": 396, "lr": 2.6165105094261392e-05} +{"train_loss": 0.0011739465408027172, "global_step": 47164, "epoch": 396, "lr": 2.6163157535850237e-05} +{"train_loss": 0.001460022758692503, "global_step": 47165, "epoch": 396, "lr": 2.6161210024240196e-05} +{"train_loss": 0.002116276416927576, "global_step": 47166, "epoch": 396, "lr": 2.615926255943507e-05} +{"train_loss": 0.0008281025220640004, "global_step": 47167, "epoch": 396, "lr": 2.6157315141438665e-05} +{"train_loss": 0.0018002265132963657, "global_step": 47168, "epoch": 396, "lr": 2.6155367770254845e-05} +{"train_loss": 0.0017023537075147033, "global_step": 47169, "epoch": 396, "lr": 2.6153420445887394e-05} +{"train_loss": 0.000566593836992979, "global_step": 47170, "epoch": 396, "lr": 2.6151473168340173e-05} +{"train_loss": 0.0009855114622041583, "global_step": 47171, "epoch": 396, "lr": 2.6149525937616988e-05} +{"train_loss": 0.0017694731941446662, "global_step": 47172, "epoch": 396, "lr": 2.6147578753721636e-05} +{"train_loss": 0.0018737646751105785, "global_step": 47173, "epoch": 396, "lr": 2.6145631616657994e-05} +{"train_loss": 0.001524721970781684, "global_step": 47174, "epoch": 396, "lr": 2.614368452642983e-05} +{"train_loss": 0.0013463885989040136, "global_step": 47175, "epoch": 396, "lr": 2.614173748304101e-05} +{"train_loss": 0.0017994921654462814, "global_step": 47176, "epoch": 396, "lr": 2.6139790486495324e-05} +{"train_loss": 0.0010035457089543343, "global_step": 47177, "epoch": 396, "lr": 2.613784353679663e-05} +{"train_loss": 0.0007606388535350561, "global_step": 47178, "epoch": 396, "lr": 2.6135896633948732e-05} +{"train_loss": 0.0007001128396950662, "global_step": 47179, "epoch": 396, "lr": 2.6133949777955423e-05} +{"train_loss": 0.0010339750442653894, "global_step": 47180, "epoch": 396, "lr": 2.6132002968820583e-05} +{"train_loss": 0.0008450334426015615, "global_step": 47181, "epoch": 396, "lr": 2.613005620654798e-05} +{"train_loss": 0.0010732263326644897, "global_step": 47182, "epoch": 396, "lr": 2.6128109491141483e-05} +{"train_loss": 0.0017832723679021, "global_step": 47183, "epoch": 396, "lr": 2.6126162822604893e-05} +{"train_loss": 0.0012154957512393594, "global_step": 47184, "epoch": 396, "lr": 2.612421620094202e-05} +{"train_loss": 0.0011161210713908076, "global_step": 47185, "epoch": 396, "lr": 2.6122269626156703e-05} +{"train_loss": 0.0015943293692544103, "global_step": 47186, "epoch": 396, "lr": 2.6120323098252753e-05} +{"train_loss": 0.0009400423732586205, "global_step": 47187, "epoch": 396, "lr": 2.6118376617233988e-05} +{"train_loss": 0.0014221802121028304, "global_step": 47188, "epoch": 396, "lr": 2.6116430183104262e-05} +{"train_loss": 0.0013234760845080018, "global_step": 47189, "epoch": 396, "lr": 2.6114483795867352e-05} +{"train_loss": 0.001952237682417035, "global_step": 47190, "epoch": 396, "lr": 2.6112537455527118e-05} +{"train_loss": 0.001495991600677371, "global_step": 47191, "epoch": 396, "lr": 2.6110591162087356e-05} +{"train_loss": 0.0007001494523137808, "global_step": 47192, "epoch": 396, "lr": 2.6108644915551905e-05} +{"train_loss": 0.0014595927204936743, "global_step": 47193, "epoch": 396, "lr": 2.6106698715924566e-05} +{"train_loss": 0.0016260930569842458, "global_step": 47194, "epoch": 396, "lr": 2.6104752563209184e-05} +{"train_loss": 0.0006683783722110093, "global_step": 47195, "epoch": 396, "lr": 2.610280645740955e-05} +{"train_loss": 0.0013492503203451633, "global_step": 47196, "epoch": 396, "lr": 2.6100860398529527e-05} +{"train_loss": 0.0011581324506551027, "global_step": 47197, "epoch": 396, "lr": 2.6098914386572905e-05} +{"train_loss": 0.0012350640026852489, "global_step": 47198, "epoch": 396, "lr": 2.6096968421543493e-05} +{"train_loss": 0.0010108489077538252, "global_step": 47199, "epoch": 396, "lr": 2.6095022503445156e-05} +{"train_loss": 0.0016376853454858065, "global_step": 47200, "epoch": 396, "lr": 2.6093076632281655e-05} +{"train_loss": 0.0016467149835079908, "global_step": 47201, "epoch": 396, "lr": 2.6091130808056876e-05} +{"train_loss": 0.000834582548122853, "global_step": 47202, "epoch": 396, "lr": 2.6089185030774597e-05} +{"train_loss": 0.0008750956039875746, "global_step": 47203, "epoch": 396, "lr": 2.6087239300438636e-05} +{"train_loss": 0.0010991401504725218, "global_step": 47204, "epoch": 396, "lr": 2.6085293617052846e-05} +{"train_loss": 0.0006827290635555983, "global_step": 47205, "epoch": 396, "lr": 2.608334798062101e-05} +{"train_loss": 0.0012399120023474097, "global_step": 47206, "epoch": 396, "lr": 2.608140239114698e-05} +{"train_loss": 0.0006438609561882913, "global_step": 47207, "epoch": 396, "lr": 2.6079456848634544e-05} +{"train_loss": 0.0013941008364781737, "global_step": 47208, "epoch": 396, "lr": 2.6077511353087553e-05} +{"train_loss": 0.0012196848401799798, "global_step": 47209, "epoch": 396, "lr": 2.6075565904509814e-05} +{"train_loss": 0.0012403368018567562, "global_step": 47210, "epoch": 396, "lr": 2.6073620502905126e-05} +{"train_loss": 0.0007303972379304469, "global_step": 47211, "epoch": 396, "lr": 2.6071675148277354e-05} +{"train_loss": 0.0010384422494098544, "global_step": 47212, "epoch": 396, "lr": 2.606972984063027e-05} +{"train_loss": 0.0005712926504202187, "global_step": 47213, "epoch": 396, "lr": 2.606778457996773e-05} +{"train_loss": 0.0011503323912620544, "global_step": 47214, "epoch": 396, "lr": 2.606583936629352e-05} +{"train_loss": 0.000720494834240526, "global_step": 47215, "epoch": 396, "lr": 2.60638941996115e-05} +{"train_loss": 0.001245957799255848, "global_step": 47216, "epoch": 396, "lr": 2.6061949079925462e-05} +{"train_loss": 0.0014196560950949788, "global_step": 47217, "epoch": 396, "lr": 2.6060004007239213e-05} +{"train_loss": 0.001209729234687984, "global_step": 47218, "epoch": 396, "lr": 2.605805898155661e-05} +{"train_loss": 0.00053738261340186, "global_step": 47219, "epoch": 396, "lr": 2.6056114002881428e-05} +{"train_loss": 0.0006895902333781123, "global_step": 47220, "epoch": 396, "lr": 2.6054169071217528e-05} +{"train_loss": 0.0009725371492095292, "global_step": 47221, "epoch": 396, "lr": 2.6052224186568687e-05} +{"train_loss": 0.0009708528523333371, "global_step": 47222, "epoch": 396, "lr": 2.605027934893875e-05} +{"train_loss": 0.0014136132085695863, "global_step": 47223, "epoch": 396, "lr": 2.6048334558331544e-05} +{"train_loss": 0.0018744581611827016, "global_step": 47224, "epoch": 396, "lr": 2.604638981475086e-05} +{"train_loss": 0.0009570723632350564, "global_step": 47225, "epoch": 396, "lr": 2.604444511820055e-05} +{"train_loss": 0.0005915160290896893, "global_step": 47226, "epoch": 396, "lr": 2.6042500468684394e-05} +{"train_loss": 0.0011449300218373537, "global_step": 47227, "epoch": 396, "lr": 2.604055586620624e-05} +{"train_loss": 0.0012905587209388614, "global_step": 47228, "epoch": 396, "lr": 2.6038611310769905e-05} +{"train_loss": 0.0014212795067578554, "global_step": 47229, "epoch": 396, "lr": 2.6036666802379174e-05} +{"train_loss": 0.0009752093465067446, "global_step": 47230, "epoch": 396, "lr": 2.6034722341037908e-05} +{"train_loss": 0.000891014002263546, "global_step": 47231, "epoch": 396, "lr": 2.6032777926749884e-05} +{"train_loss": 0.0014708484522998333, "global_step": 47232, "epoch": 396, "lr": 2.6030833559518952e-05} +{"train_loss": 0.002057368168607354, "global_step": 47233, "epoch": 396, "lr": 2.602888923934891e-05} +{"train_loss": 0.000749667757190764, "global_step": 47234, "epoch": 396, "lr": 2.6026944966243595e-05} +{"train_loss": 0.000596972880885005, "global_step": 47235, "epoch": 396, "lr": 2.6025000740206818e-05} +{"train_loss": 0.002332446863874793, "global_step": 47236, "epoch": 396, "lr": 2.6023056561242365e-05} +{"train_loss": 0.0007776651764288545, "global_step": 47237, "epoch": 396, "lr": 2.60211124293541e-05} +{"train_loss": 0.0006553190178237855, "global_step": 47238, "epoch": 396, "lr": 2.601916834454581e-05} +{"train_loss": 0.0004999390803277493, "global_step": 47239, "epoch": 396, "lr": 2.6017224306821325e-05} +{"train_loss": 0.0014710940886288881, "global_step": 47240, "epoch": 396, "lr": 2.6015280316184463e-05} +{"train_loss": 0.0013067485997453332, "global_step": 47241, "epoch": 396, "lr": 2.601333637263902e-05} +{"train_loss": 0.0011838819318501857, "global_step": 47242, "epoch": 396, "lr": 2.6011392476188846e-05, "val_loss": 0.026511529460549355} +{"train_loss": 0.0005423956317827106, "global_step": 47243, "epoch": 397, "lr": 2.6009448626837717e-05} +{"train_loss": 0.0008937788661569357, "global_step": 47244, "epoch": 397, "lr": 2.60075048245895e-05} +{"train_loss": 0.0017804972594603896, "global_step": 47245, "epoch": 397, "lr": 2.6005561069447957e-05} +{"train_loss": 0.0008680530590936542, "global_step": 47246, "epoch": 397, "lr": 2.6003617361416954e-05} +{"train_loss": 0.0014895459171384573, "global_step": 47247, "epoch": 397, "lr": 2.6001673700500284e-05} +{"train_loss": 0.001166131580248475, "global_step": 47248, "epoch": 397, "lr": 2.5999730086701747e-05} +{"train_loss": 0.0011788828996941447, "global_step": 47249, "epoch": 397, "lr": 2.599778652002519e-05} +{"train_loss": 0.0018253220478072762, "global_step": 47250, "epoch": 397, "lr": 2.59958430004744e-05} +{"train_loss": 0.0009176124003715813, "global_step": 47251, "epoch": 397, "lr": 2.5993899528053224e-05} +{"train_loss": 0.0008406527922488749, "global_step": 47252, "epoch": 397, "lr": 2.5991956102765446e-05} +{"train_loss": 0.0007076540496200323, "global_step": 47253, "epoch": 397, "lr": 2.5990012724614914e-05} +{"train_loss": 0.0007032401626929641, "global_step": 47254, "epoch": 397, "lr": 2.5988069393605407e-05} +{"train_loss": 0.0008293571299873292, "global_step": 47255, "epoch": 397, "lr": 2.5986126109740782e-05} +{"train_loss": 0.0011513192439451814, "global_step": 47256, "epoch": 397, "lr": 2.5984182873024816e-05} +{"train_loss": 0.0014731402043253183, "global_step": 47257, "epoch": 397, "lr": 2.598223968346134e-05} +{"train_loss": 0.0009628191473893821, "global_step": 47258, "epoch": 397, "lr": 2.5980296541054182e-05} +{"train_loss": 0.0012822155840694904, "global_step": 47259, "epoch": 397, "lr": 2.5978353445807152e-05} +{"train_loss": 0.001430418691597879, "global_step": 47260, "epoch": 397, "lr": 2.5976410397724037e-05} +{"train_loss": 0.0019075488671660423, "global_step": 47261, "epoch": 397, "lr": 2.5974467396808698e-05} +{"train_loss": 0.0018915035761892796, "global_step": 47262, "epoch": 397, "lr": 2.5972524443064905e-05} +{"train_loss": 0.0016729930648580194, "global_step": 47263, "epoch": 397, "lr": 2.5970581536496506e-05} +{"train_loss": 0.0006435270188376307, "global_step": 47264, "epoch": 397, "lr": 2.5968638677107294e-05} +{"train_loss": 0.0019236202351748943, "global_step": 47265, "epoch": 397, "lr": 2.5966695864901103e-05} +{"train_loss": 0.0009234050521627069, "global_step": 47266, "epoch": 397, "lr": 2.596475309988174e-05} +{"train_loss": 0.001381336827762425, "global_step": 47267, "epoch": 397, "lr": 2.5962810382052993e-05} +{"train_loss": 0.0018455618992447853, "global_step": 47268, "epoch": 397, "lr": 2.5960867711418724e-05} +{"train_loss": 0.0012584840878844261, "global_step": 47269, "epoch": 397, "lr": 2.5958925087982706e-05} +{"train_loss": 0.0029188981279730797, "global_step": 47270, "epoch": 397, "lr": 2.5956982511748785e-05} +{"train_loss": 0.0009752808837220073, "global_step": 47271, "epoch": 397, "lr": 2.5955039982720762e-05} +{"train_loss": 0.0009025328909046948, "global_step": 47272, "epoch": 397, "lr": 2.595309750090243e-05} +{"train_loss": 0.0016166107961907983, "global_step": 47273, "epoch": 397, "lr": 2.5951155066297638e-05} +{"train_loss": 0.0007838107994757593, "global_step": 47274, "epoch": 397, "lr": 2.5949212678910173e-05} +{"train_loss": 0.0010651471093297005, "global_step": 47275, "epoch": 397, "lr": 2.5947270338743867e-05} +{"train_loss": 0.0008392469608224928, "global_step": 47276, "epoch": 397, "lr": 2.594532804580252e-05} +{"train_loss": 0.0014126804890111089, "global_step": 47277, "epoch": 397, "lr": 2.594338580008996e-05} +{"train_loss": 0.001017751987092197, "global_step": 47278, "epoch": 397, "lr": 2.5941443601609995e-05} +{"train_loss": 0.001101430389098823, "global_step": 47279, "epoch": 397, "lr": 2.5939501450366423e-05} +{"train_loss": 0.0014277251902967691, "global_step": 47280, "epoch": 397, "lr": 2.5937559346363077e-05} +{"train_loss": 0.0006433958187699318, "global_step": 47281, "epoch": 397, "lr": 2.593561728960375e-05} +{"train_loss": 0.0008837534114718437, "global_step": 47282, "epoch": 397, "lr": 2.5933675280092285e-05} +{"train_loss": 0.0013649823376908898, "global_step": 47283, "epoch": 397, "lr": 2.593173331783246e-05} +{"train_loss": 0.001389116863720119, "global_step": 47284, "epoch": 397, "lr": 2.592979140282812e-05} +{"train_loss": 0.0006616676109842956, "global_step": 47285, "epoch": 397, "lr": 2.592784953508305e-05} +{"train_loss": 0.001605499885044992, "global_step": 47286, "epoch": 397, "lr": 2.592590771460109e-05} +{"train_loss": 0.0005997907719574869, "global_step": 47287, "epoch": 397, "lr": 2.592396594138602e-05} +{"train_loss": 0.000716166221536696, "global_step": 47288, "epoch": 397, "lr": 2.5922024215441694e-05} +{"train_loss": 0.001081592170521617, "global_step": 47289, "epoch": 397, "lr": 2.5920082536771874e-05} +{"train_loss": 0.0007749580545350909, "global_step": 47290, "epoch": 397, "lr": 2.5918140905380427e-05} +{"train_loss": 0.0009297703509218991, "global_step": 47291, "epoch": 397, "lr": 2.5916199321271118e-05} +{"train_loss": 0.0007474024896509945, "global_step": 47292, "epoch": 397, "lr": 2.5914257784447793e-05} +{"train_loss": 0.0008829477010294795, "global_step": 47293, "epoch": 397, "lr": 2.591231629491423e-05} +{"train_loss": 0.0011249718954786658, "global_step": 47294, "epoch": 397, "lr": 2.591037485267428e-05} +{"train_loss": 0.0013265347806736827, "global_step": 47295, "epoch": 397, "lr": 2.5908433457731717e-05} +{"train_loss": 0.0010895085288211703, "global_step": 47296, "epoch": 397, "lr": 2.59064921100904e-05} +{"train_loss": 0.0011786592658609152, "global_step": 47297, "epoch": 397, "lr": 2.5904550809754098e-05} +{"train_loss": 0.0016444918001070619, "global_step": 47298, "epoch": 397, "lr": 2.590260955672662e-05} +{"train_loss": 0.0010763885220512748, "global_step": 47299, "epoch": 397, "lr": 2.5900668351011815e-05} +{"train_loss": 0.000850555719807744, "global_step": 47300, "epoch": 397, "lr": 2.5898727192613453e-05} +{"train_loss": 0.0013255577068775892, "global_step": 47301, "epoch": 397, "lr": 2.5896786081535386e-05} +{"train_loss": 0.0008236166322603822, "global_step": 47302, "epoch": 397, "lr": 2.5894845017781388e-05} +{"train_loss": 0.0010724370367825031, "global_step": 47303, "epoch": 397, "lr": 2.5892904001355302e-05} +{"train_loss": 0.0005845390260219574, "global_step": 47304, "epoch": 397, "lr": 2.5890963032260922e-05} +{"train_loss": 0.0007773342658765614, "global_step": 47305, "epoch": 397, "lr": 2.5889022110502044e-05} +{"train_loss": 0.0017444074619561434, "global_step": 47306, "epoch": 397, "lr": 2.5887081236082512e-05} +{"train_loss": 0.001451403135433793, "global_step": 47307, "epoch": 397, "lr": 2.5885140409006105e-05} +{"train_loss": 0.0006920213927514851, "global_step": 47308, "epoch": 397, "lr": 2.5883199629276667e-05} +{"train_loss": 0.000740662741009146, "global_step": 47309, "epoch": 397, "lr": 2.5881258896897988e-05} +{"train_loss": 0.0010214070789515972, "global_step": 47310, "epoch": 397, "lr": 2.587931821187386e-05} +{"train_loss": 0.0012329377932474017, "global_step": 47311, "epoch": 397, "lr": 2.587737757420813e-05} +{"train_loss": 0.0017123590223491192, "global_step": 47312, "epoch": 397, "lr": 2.5875436983904576e-05} +{"train_loss": 0.001335892011411488, "global_step": 47313, "epoch": 397, "lr": 2.5873496440967048e-05} +{"train_loss": 0.0006693597533740103, "global_step": 47314, "epoch": 397, "lr": 2.5871555945399305e-05} +{"train_loss": 0.0013906644890084863, "global_step": 47315, "epoch": 397, "lr": 2.5869615497205214e-05} +{"train_loss": 0.0007918124902062118, "global_step": 47316, "epoch": 397, "lr": 2.5867675096388542e-05} +{"train_loss": 0.000962959136813879, "global_step": 47317, "epoch": 397, "lr": 2.5865734742953108e-05} +{"train_loss": 0.0012331996113061905, "global_step": 47318, "epoch": 397, "lr": 2.5863794436902733e-05} +{"train_loss": 0.0015717089409008622, "global_step": 47319, "epoch": 397, "lr": 2.5861854178241202e-05} +{"train_loss": 0.000708055857103318, "global_step": 47320, "epoch": 397, "lr": 2.5859913966972343e-05} +{"train_loss": 0.0007199825486168265, "global_step": 47321, "epoch": 397, "lr": 2.5857973803099982e-05} +{"train_loss": 0.0007193852798081934, "global_step": 47322, "epoch": 397, "lr": 2.585603368662789e-05} +{"train_loss": 0.0010943622328341007, "global_step": 47323, "epoch": 397, "lr": 2.5854093617559915e-05} +{"train_loss": 0.000930923328269273, "global_step": 47324, "epoch": 397, "lr": 2.585215359589983e-05} +{"train_loss": 0.001640619128011167, "global_step": 47325, "epoch": 397, "lr": 2.5850213621651487e-05} +{"train_loss": 0.000832802033983171, "global_step": 47326, "epoch": 397, "lr": 2.5848273694818644e-05} +{"train_loss": 0.001292065135203302, "global_step": 47327, "epoch": 397, "lr": 2.5846333815405154e-05} +{"train_loss": 0.0006068022921681404, "global_step": 47328, "epoch": 397, "lr": 2.5844393983414807e-05} +{"train_loss": 0.0007094588363543153, "global_step": 47329, "epoch": 397, "lr": 2.5842454198851396e-05} +{"train_loss": 0.0007357579306699336, "global_step": 47330, "epoch": 397, "lr": 2.5840514461718763e-05} +{"train_loss": 0.0004887848044745624, "global_step": 47331, "epoch": 397, "lr": 2.583857477202068e-05} +{"train_loss": 0.0011425806442275643, "global_step": 47332, "epoch": 397, "lr": 2.583663512976099e-05} +{"train_loss": 0.0008573413360863924, "global_step": 47333, "epoch": 397, "lr": 2.583469553494347e-05} +{"train_loss": 0.0009142688359133899, "global_step": 47334, "epoch": 397, "lr": 2.583275598757196e-05} +{"train_loss": 0.002305693458765745, "global_step": 47335, "epoch": 397, "lr": 2.5830816487650255e-05} +{"train_loss": 0.0013406940270215273, "global_step": 47336, "epoch": 397, "lr": 2.5828877035182143e-05} +{"train_loss": 0.0010720209684222937, "global_step": 47337, "epoch": 397, "lr": 2.5826937630171462e-05} +{"train_loss": 0.0013958461349830031, "global_step": 47338, "epoch": 397, "lr": 2.5824998272621988e-05} +{"train_loss": 0.0006195784662850201, "global_step": 47339, "epoch": 397, "lr": 2.5823058962537567e-05} +{"train_loss": 0.0012343775015324354, "global_step": 47340, "epoch": 397, "lr": 2.5821119699921987e-05} +{"train_loss": 0.0015518424334004521, "global_step": 47341, "epoch": 397, "lr": 2.5819180484779037e-05} +{"train_loss": 0.0010974680772051215, "global_step": 47342, "epoch": 397, "lr": 2.581724131711256e-05} +{"train_loss": 0.0017939262324944139, "global_step": 47343, "epoch": 397, "lr": 2.5815302196926326e-05} +{"train_loss": 0.0009803386637941003, "global_step": 47344, "epoch": 397, "lr": 2.5813363124224186e-05} +{"train_loss": 0.0007602323894388974, "global_step": 47345, "epoch": 397, "lr": 2.5811424099009902e-05} +{"train_loss": 0.001022422220557928, "global_step": 47346, "epoch": 397, "lr": 2.5809485121287325e-05} +{"train_loss": 0.0012646786635741591, "global_step": 47347, "epoch": 397, "lr": 2.5807546191060234e-05} +{"train_loss": 0.0008287150994874537, "global_step": 47348, "epoch": 397, "lr": 2.5805607308332425e-05} +{"train_loss": 0.0006120430189184844, "global_step": 47349, "epoch": 397, "lr": 2.580366847310774e-05} +{"train_loss": 0.0011848281137645245, "global_step": 47350, "epoch": 397, "lr": 2.5801729685389947e-05} +{"train_loss": 0.0015152596170082688, "global_step": 47351, "epoch": 397, "lr": 2.579979094518289e-05} +{"train_loss": 0.0011781741632148623, "global_step": 47352, "epoch": 397, "lr": 2.5797852252490345e-05} +{"train_loss": 0.0008985439781099558, "global_step": 47353, "epoch": 397, "lr": 2.5795913607316145e-05} +{"train_loss": 0.0010928453411906958, "global_step": 47354, "epoch": 397, "lr": 2.579397500966407e-05} +{"train_loss": 0.0008457001531496644, "global_step": 47355, "epoch": 397, "lr": 2.5792036459537934e-05} +{"train_loss": 0.0012926316121593118, "global_step": 47356, "epoch": 397, "lr": 2.5790097956941568e-05} +{"train_loss": 0.0010275065433233976, "global_step": 47357, "epoch": 397, "lr": 2.578815950187874e-05} +{"train_loss": 0.0011722453637048602, "global_step": 47358, "epoch": 397, "lr": 2.5786221094353292e-05} +{"train_loss": 0.000755283806938678, "global_step": 47359, "epoch": 397, "lr": 2.5784282734369014e-05} +{"train_loss": 0.000595216522924602, "global_step": 47360, "epoch": 397, "lr": 2.5782344421929682e-05} +{"train_loss": 0.001119666312676424, "global_step": 47361, "epoch": 397, "lr": 2.578040615703916e-05, "val_loss": 0.026805629953742027} +{"train_loss": 0.0012611824786290526, "global_step": 47362, "epoch": 398, "lr": 2.57784679397012e-05} +{"train_loss": 0.0005785675020888448, "global_step": 47363, "epoch": 398, "lr": 2.577652976991965e-05} +{"train_loss": 0.0012487221974879503, "global_step": 47364, "epoch": 398, "lr": 2.5774591647698276e-05} +{"train_loss": 0.0012641046196222305, "global_step": 47365, "epoch": 398, "lr": 2.5772653573040922e-05} +{"train_loss": 0.0012632978614419699, "global_step": 47366, "epoch": 398, "lr": 2.5770715545951374e-05} +{"train_loss": 0.0012246135156601667, "global_step": 47367, "epoch": 398, "lr": 2.5768777566433422e-05} +{"train_loss": 0.001698449021205306, "global_step": 47368, "epoch": 398, "lr": 2.5766839634490902e-05} +{"train_loss": 0.000569476280361414, "global_step": 47369, "epoch": 398, "lr": 2.5764901750127585e-05} +{"train_loss": 0.0009276459459215403, "global_step": 47370, "epoch": 398, "lr": 2.5762963913347315e-05} +{"train_loss": 0.0013378997100517154, "global_step": 47371, "epoch": 398, "lr": 2.5761026124153875e-05} +{"train_loss": 0.0006796721718274057, "global_step": 47372, "epoch": 398, "lr": 2.575908838255105e-05} +{"train_loss": 0.0014500502729788423, "global_step": 47373, "epoch": 398, "lr": 2.5757150688542686e-05} +{"train_loss": 0.0013247125316411257, "global_step": 47374, "epoch": 398, "lr": 2.5755213042132543e-05} +{"train_loss": 0.0010466156527400017, "global_step": 47375, "epoch": 398, "lr": 2.5753275443324476e-05} +{"train_loss": 0.0009998880559578538, "global_step": 47376, "epoch": 398, "lr": 2.575133789212224e-05} +{"train_loss": 0.001061889692209661, "global_step": 47377, "epoch": 398, "lr": 2.5749400388529677e-05} +{"train_loss": 0.0011789655545726418, "global_step": 47378, "epoch": 398, "lr": 2.5747462932550583e-05} +{"train_loss": 0.0007115901098586619, "global_step": 47379, "epoch": 398, "lr": 2.574552552418873e-05} +{"train_loss": 0.0012433006195351481, "global_step": 47380, "epoch": 398, "lr": 2.5743588163447963e-05} +{"train_loss": 0.0009275999036617577, "global_step": 47381, "epoch": 398, "lr": 2.5741650850332054e-05} +{"train_loss": 0.0012320751557126641, "global_step": 47382, "epoch": 398, "lr": 2.5739713584844838e-05} +{"train_loss": 0.0008022625697776675, "global_step": 47383, "epoch": 398, "lr": 2.573777636699009e-05} +{"train_loss": 0.0012369956821203232, "global_step": 47384, "epoch": 398, "lr": 2.5735839196771637e-05} +{"train_loss": 0.0007230188930407166, "global_step": 47385, "epoch": 398, "lr": 2.5733902074193262e-05} +{"train_loss": 0.0009539228631183505, "global_step": 47386, "epoch": 398, "lr": 2.573196499925879e-05} +{"train_loss": 0.0008806175319477916, "global_step": 47387, "epoch": 398, "lr": 2.5730027971971994e-05} +{"train_loss": 0.0006759038078598678, "global_step": 47388, "epoch": 398, "lr": 2.5728090992336717e-05} +{"train_loss": 0.0009002662263810635, "global_step": 47389, "epoch": 398, "lr": 2.5726154060356717e-05} +{"train_loss": 0.0011360300704836845, "global_step": 47390, "epoch": 398, "lr": 2.5724217176035842e-05} +{"train_loss": 0.0008116710232570767, "global_step": 47391, "epoch": 398, "lr": 2.5722280339377853e-05} +{"train_loss": 0.001057203859090805, "global_step": 47392, "epoch": 398, "lr": 2.5720343550386596e-05} +{"train_loss": 0.0008804210228845477, "global_step": 47393, "epoch": 398, "lr": 2.571840680906582e-05} +{"train_loss": 0.002155168680474162, "global_step": 47394, "epoch": 398, "lr": 2.5716470115419387e-05} +{"train_loss": 0.0008824812830425799, "global_step": 47395, "epoch": 398, "lr": 2.5714533469451053e-05} +{"train_loss": 0.000982479308731854, "global_step": 47396, "epoch": 398, "lr": 2.5712596871164652e-05} +{"train_loss": 0.0004503340751398355, "global_step": 47397, "epoch": 398, "lr": 2.5710660320563974e-05} +{"train_loss": 0.001835030852816999, "global_step": 47398, "epoch": 398, "lr": 2.5708723817652803e-05} +{"train_loss": 0.0009436095715500414, "global_step": 47399, "epoch": 398, "lr": 2.570678736243497e-05} +{"train_loss": 0.001589416991919279, "global_step": 47400, "epoch": 398, "lr": 2.570485095491425e-05} +{"train_loss": 0.0008545168675482273, "global_step": 47401, "epoch": 398, "lr": 2.570291459509448e-05} +{"train_loss": 0.0011773374862968922, "global_step": 47402, "epoch": 398, "lr": 2.5700978282979416e-05} +{"train_loss": 0.0007356232381425798, "global_step": 47403, "epoch": 398, "lr": 2.5699042018572916e-05} +{"train_loss": 0.0016240167897194624, "global_step": 47404, "epoch": 398, "lr": 2.569710580187874e-05} +{"train_loss": 0.0017109360778704286, "global_step": 47405, "epoch": 398, "lr": 2.5695169632900683e-05} +{"train_loss": 0.0023961092811077833, "global_step": 47406, "epoch": 398, "lr": 2.5693233511642588e-05} +{"train_loss": 0.0011128488695248961, "global_step": 47407, "epoch": 398, "lr": 2.569129743810821e-05} +{"train_loss": 0.0009346992010250688, "global_step": 47408, "epoch": 398, "lr": 2.5689361412301393e-05} +{"train_loss": 0.0013020177138969302, "global_step": 47409, "epoch": 398, "lr": 2.5687425434225913e-05} +{"train_loss": 0.0008745866362005472, "global_step": 47410, "epoch": 398, "lr": 2.568548950388556e-05} +{"train_loss": 0.002043620217591524, "global_step": 47411, "epoch": 398, "lr": 2.5683553621284173e-05} +{"train_loss": 0.0008734801085665822, "global_step": 47412, "epoch": 398, "lr": 2.5681617786425505e-05} +{"train_loss": 0.0013062783982604742, "global_step": 47413, "epoch": 398, "lr": 2.567968199931341e-05} +{"train_loss": 0.0010787718929350376, "global_step": 47414, "epoch": 398, "lr": 2.567774625995163e-05} +{"train_loss": 0.000740588060580194, "global_step": 47415, "epoch": 398, "lr": 2.5675810568344027e-05} +{"train_loss": 0.0007200597319751978, "global_step": 47416, "epoch": 398, "lr": 2.5673874924494368e-05} +{"train_loss": 0.0006548762903548777, "global_step": 47417, "epoch": 398, "lr": 2.5671939328406435e-05} +{"train_loss": 0.0019361830782145262, "global_step": 47418, "epoch": 398, "lr": 2.567000378008405e-05} +{"train_loss": 0.002036121441051364, "global_step": 47419, "epoch": 398, "lr": 2.5668068279531032e-05} +{"train_loss": 0.0010402689222246408, "global_step": 47420, "epoch": 398, "lr": 2.566613282675115e-05} +{"train_loss": 0.0010044430382549763, "global_step": 47421, "epoch": 398, "lr": 2.5664197421748227e-05} +{"train_loss": 0.0019609928131103516, "global_step": 47422, "epoch": 398, "lr": 2.5662262064526044e-05} +{"train_loss": 0.0010471483692526817, "global_step": 47423, "epoch": 398, "lr": 2.5660326755088415e-05} +{"train_loss": 0.0011894631898030639, "global_step": 47424, "epoch": 398, "lr": 2.565839149343913e-05} +{"train_loss": 0.0015493982937186956, "global_step": 47425, "epoch": 398, "lr": 2.5656456279581998e-05} +{"train_loss": 0.0010063889203593135, "global_step": 47426, "epoch": 398, "lr": 2.5654521113520803e-05} +{"train_loss": 0.0011588383931666613, "global_step": 47427, "epoch": 398, "lr": 2.565258599525937e-05} +{"train_loss": 0.00202456908300519, "global_step": 47428, "epoch": 398, "lr": 2.5650650924801483e-05} +{"train_loss": 0.0012375739170238376, "global_step": 47429, "epoch": 398, "lr": 2.564871590215092e-05} +{"train_loss": 0.001685547293163836, "global_step": 47430, "epoch": 398, "lr": 2.564678092731153e-05} +{"train_loss": 0.0007843897328712046, "global_step": 47431, "epoch": 398, "lr": 2.564484600028706e-05} +{"train_loss": 0.0010592907201498747, "global_step": 47432, "epoch": 398, "lr": 2.564291112108135e-05} +{"train_loss": 0.0010336076375097036, "global_step": 47433, "epoch": 398, "lr": 2.564097628969816e-05} +{"train_loss": 0.0010130687151104212, "global_step": 47434, "epoch": 398, "lr": 2.5639041506141338e-05} +{"train_loss": 0.0014018018264323473, "global_step": 47435, "epoch": 398, "lr": 2.5637106770414655e-05} +{"train_loss": 0.0009894935647025704, "global_step": 47436, "epoch": 398, "lr": 2.5635172082521885e-05} +{"train_loss": 0.0008319006883539259, "global_step": 47437, "epoch": 398, "lr": 2.5633237442466872e-05} +{"train_loss": 0.001903796917758882, "global_step": 47438, "epoch": 398, "lr": 2.5631302850253375e-05} +{"train_loss": 0.0007918298942968249, "global_step": 47439, "epoch": 398, "lr": 2.5629368305885232e-05} +{"train_loss": 0.001254184520803392, "global_step": 47440, "epoch": 398, "lr": 2.562743380936622e-05} +{"train_loss": 0.0012719391379505396, "global_step": 47441, "epoch": 398, "lr": 2.5625499360700122e-05} +{"train_loss": 0.0014868384459987283, "global_step": 47442, "epoch": 398, "lr": 2.5623564959890768e-05} +{"train_loss": 0.0010748282074928284, "global_step": 47443, "epoch": 398, "lr": 2.5621630606941917e-05} +{"train_loss": 0.002128623891621828, "global_step": 47444, "epoch": 398, "lr": 2.561969630185741e-05} +{"train_loss": 0.0009422729490324855, "global_step": 47445, "epoch": 398, "lr": 2.5617762044641015e-05} +{"train_loss": 0.000992529559880495, "global_step": 47446, "epoch": 398, "lr": 2.5615827835296547e-05} +{"train_loss": 0.0010557505302131176, "global_step": 47447, "epoch": 398, "lr": 2.5613893673827804e-05} +{"train_loss": 0.0023170216009020805, "global_step": 47448, "epoch": 398, "lr": 2.561195956023855e-05} +{"train_loss": 0.002232051221653819, "global_step": 47449, "epoch": 398, "lr": 2.561002549453263e-05} +{"train_loss": 0.0013410166138783097, "global_step": 47450, "epoch": 398, "lr": 2.5608091476713804e-05} +{"train_loss": 0.0017230059020221233, "global_step": 47451, "epoch": 398, "lr": 2.56061575067859e-05} +{"train_loss": 0.0010838123271241784, "global_step": 47452, "epoch": 398, "lr": 2.560422358475268e-05} +{"train_loss": 0.0005386794218793511, "global_step": 47453, "epoch": 398, "lr": 2.560228971061796e-05} +{"train_loss": 0.0015615519369021058, "global_step": 47454, "epoch": 398, "lr": 2.5600355884385562e-05} +{"train_loss": 0.0009501128224655986, "global_step": 47455, "epoch": 398, "lr": 2.5598422106059234e-05} +{"train_loss": 0.0006898342981003225, "global_step": 47456, "epoch": 398, "lr": 2.5596488375642814e-05} +{"train_loss": 0.0010058118496090174, "global_step": 47457, "epoch": 398, "lr": 2.5594554693140073e-05} +{"train_loss": 0.0012417740654200315, "global_step": 47458, "epoch": 398, "lr": 2.5592621058554822e-05} +{"train_loss": 0.0007780904415994883, "global_step": 47459, "epoch": 398, "lr": 2.559068747189086e-05} +{"train_loss": 0.0010177299845963717, "global_step": 47460, "epoch": 398, "lr": 2.558875393315196e-05} +{"train_loss": 0.001922032330185175, "global_step": 47461, "epoch": 398, "lr": 2.5586820442341945e-05} +{"train_loss": 0.0014037369983270764, "global_step": 47462, "epoch": 398, "lr": 2.5584886999464584e-05} +{"train_loss": 0.0013371718814596534, "global_step": 47463, "epoch": 398, "lr": 2.5582953604523708e-05} +{"train_loss": 0.000850263109896332, "global_step": 47464, "epoch": 398, "lr": 2.558102025752308e-05} +{"train_loss": 0.0010949639836326241, "global_step": 47465, "epoch": 398, "lr": 2.5579086958466524e-05} +{"train_loss": 0.0009269803413189948, "global_step": 47466, "epoch": 398, "lr": 2.5577153707357822e-05} +{"train_loss": 0.0016760649159550667, "global_step": 47467, "epoch": 398, "lr": 2.5575220504200746e-05} +{"train_loss": 0.0008194606634788215, "global_step": 47468, "epoch": 398, "lr": 2.5573287348999142e-05} +{"train_loss": 0.0008170662331394851, "global_step": 47469, "epoch": 398, "lr": 2.5571354241756757e-05} +{"train_loss": 0.0013614065246656537, "global_step": 47470, "epoch": 398, "lr": 2.5569421182477426e-05} +{"train_loss": 0.0009727589786052704, "global_step": 47471, "epoch": 398, "lr": 2.556748817116491e-05} +{"train_loss": 0.0015442983713001013, "global_step": 47472, "epoch": 398, "lr": 2.5565555207823032e-05} +{"train_loss": 0.0022726983297616243, "global_step": 47473, "epoch": 398, "lr": 2.5563622292455585e-05} +{"train_loss": 0.0006904163165017962, "global_step": 47474, "epoch": 398, "lr": 2.5561689425066333e-05} +{"train_loss": 0.001040448434650898, "global_step": 47475, "epoch": 398, "lr": 2.5559756605659113e-05} +{"train_loss": 0.0005151483928784728, "global_step": 47476, "epoch": 398, "lr": 2.5557823834237675e-05} +{"train_loss": 0.0015149236423894763, "global_step": 47477, "epoch": 398, "lr": 2.5555891110805864e-05} +{"train_loss": 0.0020475205965340137, "global_step": 47478, "epoch": 398, "lr": 2.555395843536745e-05} +{"train_loss": 0.0009552415576763451, "global_step": 47479, "epoch": 398, "lr": 2.5552025807926206e-05} +{"train_loss": 0.0011931010876574844, "global_step": 47480, "epoch": 398, "lr": 2.555009322848596e-05, "val_loss": 0.021691108122467995} +{"train_loss": 0.0016314869280904531, "global_step": 47481, "epoch": 399, "lr": 2.554816069705048e-05} +{"train_loss": 0.0012987282825633883, "global_step": 47482, "epoch": 399, "lr": 2.5546228213623596e-05} +{"train_loss": 0.0011250956449657679, "global_step": 47483, "epoch": 399, "lr": 2.554429577820906e-05} +{"train_loss": 0.0010546417906880379, "global_step": 47484, "epoch": 399, "lr": 2.554236339081071e-05} +{"train_loss": 0.0008600427536293864, "global_step": 47485, "epoch": 399, "lr": 2.554043105143229e-05} +{"train_loss": 0.0017253505066037178, "global_step": 47486, "epoch": 399, "lr": 2.553849876007764e-05} +{"train_loss": 0.001407415489666164, "global_step": 47487, "epoch": 399, "lr": 2.5536566516750514e-05} +{"train_loss": 0.0015473717357963324, "global_step": 47488, "epoch": 399, "lr": 2.553463432145473e-05} +{"train_loss": 0.001085128984414041, "global_step": 47489, "epoch": 399, "lr": 2.55327021741941e-05} +{"train_loss": 0.0010289627825841308, "global_step": 47490, "epoch": 399, "lr": 2.5530770074972388e-05} +{"train_loss": 0.0013972752494737506, "global_step": 47491, "epoch": 399, "lr": 2.5528838023793378e-05} +{"train_loss": 0.001715615508146584, "global_step": 47492, "epoch": 399, "lr": 2.55269060206609e-05} +{"train_loss": 0.0010567307472229004, "global_step": 47493, "epoch": 399, "lr": 2.552497406557871e-05} +{"train_loss": 0.0007079893257468939, "global_step": 47494, "epoch": 399, "lr": 2.5523042158550637e-05} +{"train_loss": 0.0010962308151647449, "global_step": 47495, "epoch": 399, "lr": 2.5521110299580435e-05} +{"train_loss": 0.0018576052971184254, "global_step": 47496, "epoch": 399, "lr": 2.551917848867194e-05} +{"train_loss": 0.00045330930151976645, "global_step": 47497, "epoch": 399, "lr": 2.5517246725828925e-05} +{"train_loss": 0.0008392900344915688, "global_step": 47498, "epoch": 399, "lr": 2.5515315011055153e-05} +{"train_loss": 0.0013444948708638549, "global_step": 47499, "epoch": 399, "lr": 2.5513383344354467e-05} +{"train_loss": 0.0009788665920495987, "global_step": 47500, "epoch": 399, "lr": 2.5511451725730616e-05} +{"train_loss": 0.0012749439338222146, "global_step": 47501, "epoch": 399, "lr": 2.550952015518744e-05} +{"train_loss": 0.001273138215765357, "global_step": 47502, "epoch": 399, "lr": 2.5507588632728675e-05} +{"train_loss": 0.0007835050346329808, "global_step": 47503, "epoch": 399, "lr": 2.550565715835817e-05} +{"train_loss": 0.000777779845520854, "global_step": 47504, "epoch": 399, "lr": 2.5503725732079686e-05} +{"train_loss": 0.0008522571879439056, "global_step": 47505, "epoch": 399, "lr": 2.5501794353897003e-05} +{"train_loss": 0.0013499690685421228, "global_step": 47506, "epoch": 399, "lr": 2.5499863023813947e-05} +{"train_loss": 0.0008992847288027406, "global_step": 47507, "epoch": 399, "lr": 2.5497931741834274e-05} +{"train_loss": 0.0011651149252429605, "global_step": 47508, "epoch": 399, "lr": 2.5496000507961814e-05} +{"train_loss": 0.0011435856577008963, "global_step": 47509, "epoch": 399, "lr": 2.549406932220034e-05} +{"train_loss": 0.0008142187143675983, "global_step": 47510, "epoch": 399, "lr": 2.5492138184553622e-05} +{"train_loss": 0.0009427437325939536, "global_step": 47511, "epoch": 399, "lr": 2.5490207095025487e-05} +{"train_loss": 0.0006983331986702979, "global_step": 47512, "epoch": 399, "lr": 2.54882760536197e-05} +{"train_loss": 0.000724820070900023, "global_step": 47513, "epoch": 399, "lr": 2.5486345060340083e-05} +{"train_loss": 0.0011186363408342004, "global_step": 47514, "epoch": 399, "lr": 2.5484414115190387e-05} +{"train_loss": 0.0010999541264027357, "global_step": 47515, "epoch": 399, "lr": 2.5482483218174446e-05} +{"train_loss": 0.0007641966221854091, "global_step": 47516, "epoch": 399, "lr": 2.5480552369296007e-05} +{"train_loss": 0.000958516146056354, "global_step": 47517, "epoch": 399, "lr": 2.5478621568558903e-05} +{"train_loss": 0.001405238755978644, "global_step": 47518, "epoch": 399, "lr": 2.547669081596689e-05} +{"train_loss": 0.0011523566208779812, "global_step": 47519, "epoch": 399, "lr": 2.5474760111523793e-05} +{"train_loss": 0.0009562202612869442, "global_step": 47520, "epoch": 399, "lr": 2.5472829455233365e-05} +{"train_loss": 0.0007145099225454032, "global_step": 47521, "epoch": 399, "lr": 2.5470898847099434e-05} +{"train_loss": 0.0006291814497672021, "global_step": 47522, "epoch": 399, "lr": 2.5468968287125757e-05} +{"train_loss": 0.0011112963547930121, "global_step": 47523, "epoch": 399, "lr": 2.5467037775316155e-05} +{"train_loss": 0.0005157201085239649, "global_step": 47524, "epoch": 399, "lr": 2.5465107311674386e-05} +{"train_loss": 0.0015116401482373476, "global_step": 47525, "epoch": 399, "lr": 2.546317689620428e-05} +{"train_loss": 0.0005433046608231962, "global_step": 47526, "epoch": 399, "lr": 2.5461246528909577e-05} +{"train_loss": 0.0017007929272949696, "global_step": 47527, "epoch": 399, "lr": 2.5459316209794122e-05} +{"train_loss": 0.0008510330226272345, "global_step": 47528, "epoch": 399, "lr": 2.5457385938861676e-05} +{"train_loss": 0.0008779350901022553, "global_step": 47529, "epoch": 399, "lr": 2.5455455716116007e-05} +{"train_loss": 0.0009294482879340649, "global_step": 47530, "epoch": 399, "lr": 2.545352554156095e-05} +{"train_loss": 0.0016105271643027663, "global_step": 47531, "epoch": 399, "lr": 2.545159541520026e-05} +{"train_loss": 0.001158646191470325, "global_step": 47532, "epoch": 399, "lr": 2.5449665337037753e-05} +{"train_loss": 0.0017600659048184752, "global_step": 47533, "epoch": 399, "lr": 2.544773530707719e-05} +{"train_loss": 0.0010305863106623292, "global_step": 47534, "epoch": 399, "lr": 2.544580532532239e-05} +{"train_loss": 0.0007278069970197976, "global_step": 47535, "epoch": 399, "lr": 2.5443875391777126e-05} +{"train_loss": 0.001004511839710176, "global_step": 47536, "epoch": 399, "lr": 2.544194550644518e-05} +{"train_loss": 0.00084211170906201, "global_step": 47537, "epoch": 399, "lr": 2.5440015669330363e-05} +{"train_loss": 0.0017051586182788014, "global_step": 47538, "epoch": 399, "lr": 2.5438085880436435e-05} +{"train_loss": 0.001269438536837697, "global_step": 47539, "epoch": 399, "lr": 2.543615613976722e-05} +{"train_loss": 0.0004097922646906227, "global_step": 47540, "epoch": 399, "lr": 2.5434226447326464e-05} +{"train_loss": 0.0013021095655858517, "global_step": 47541, "epoch": 399, "lr": 2.5432296803118005e-05} +{"train_loss": 0.0010545740369707346, "global_step": 47542, "epoch": 399, "lr": 2.54303672071456e-05} +{"train_loss": 0.0008100449340417981, "global_step": 47543, "epoch": 399, "lr": 2.542843765941303e-05} +{"train_loss": 0.0012224589008837938, "global_step": 47544, "epoch": 399, "lr": 2.5426508159924116e-05} +{"train_loss": 0.000859769235830754, "global_step": 47545, "epoch": 399, "lr": 2.542457870868261e-05} +{"train_loss": 0.0010812337277457118, "global_step": 47546, "epoch": 399, "lr": 2.5422649305692338e-05} +{"train_loss": 0.0007838188321329653, "global_step": 47547, "epoch": 399, "lr": 2.542071995095706e-05} +{"train_loss": 0.0006681086961179972, "global_step": 47548, "epoch": 399, "lr": 2.541879064448056e-05} +{"train_loss": 0.0007063735974952579, "global_step": 47549, "epoch": 399, "lr": 2.5416861386266665e-05} +{"train_loss": 0.0010294753592461348, "global_step": 47550, "epoch": 399, "lr": 2.5414932176319107e-05} +{"train_loss": 0.0016631616745144129, "global_step": 47551, "epoch": 399, "lr": 2.5413003014641707e-05} +{"train_loss": 0.001132428995333612, "global_step": 47552, "epoch": 399, "lr": 2.5411073901238263e-05} +{"train_loss": 0.0008107467438094318, "global_step": 47553, "epoch": 399, "lr": 2.5409144836112535e-05} +{"train_loss": 0.0008818574133329093, "global_step": 47554, "epoch": 399, "lr": 2.5407215819268336e-05} +{"train_loss": 0.0009186795214191079, "global_step": 47555, "epoch": 399, "lr": 2.540528685070943e-05} +{"train_loss": 0.0004658376856241375, "global_step": 47556, "epoch": 399, "lr": 2.540335793043963e-05} +{"train_loss": 0.0005554615054279566, "global_step": 47557, "epoch": 399, "lr": 2.54014290584627e-05} +{"train_loss": 0.0006058607250452042, "global_step": 47558, "epoch": 399, "lr": 2.539950023478245e-05} +{"train_loss": 0.0006700857193209231, "global_step": 47559, "epoch": 399, "lr": 2.5397571459402647e-05} +{"train_loss": 0.0010630604811012745, "global_step": 47560, "epoch": 399, "lr": 2.5395642732327064e-05} +{"train_loss": 0.0006800983683206141, "global_step": 47561, "epoch": 399, "lr": 2.5393714053559535e-05} +{"train_loss": 0.0008107750909402966, "global_step": 47562, "epoch": 399, "lr": 2.5391785423103798e-05} +{"train_loss": 0.0005673759733326733, "global_step": 47563, "epoch": 399, "lr": 2.5389856840963677e-05} +{"train_loss": 0.000912549439817667, "global_step": 47564, "epoch": 399, "lr": 2.5387928307142927e-05} +{"train_loss": 0.000946558138821274, "global_step": 47565, "epoch": 399, "lr": 2.538599982164537e-05} +{"train_loss": 0.0007752536912448704, "global_step": 47566, "epoch": 399, "lr": 2.5384071384474767e-05} +{"train_loss": 0.0009971251711249352, "global_step": 47567, "epoch": 399, "lr": 2.5382142995634893e-05} +{"train_loss": 0.0012140123872086406, "global_step": 47568, "epoch": 399, "lr": 2.5380214655129576e-05} +{"train_loss": 0.0011407278943806887, "global_step": 47569, "epoch": 399, "lr": 2.5378286362962555e-05} +{"train_loss": 0.0009198314510285854, "global_step": 47570, "epoch": 399, "lr": 2.5376358119137656e-05} +{"train_loss": 0.0009118226589635015, "global_step": 47571, "epoch": 399, "lr": 2.5374429923658626e-05} +{"train_loss": 0.0006805226439610124, "global_step": 47572, "epoch": 399, "lr": 2.53725017765293e-05} +{"train_loss": 0.0005554463132284582, "global_step": 47573, "epoch": 399, "lr": 2.537057367775343e-05} +{"train_loss": 0.0008395373006351292, "global_step": 47574, "epoch": 399, "lr": 2.5368645627334786e-05} +{"train_loss": 0.0015061352169141173, "global_step": 47575, "epoch": 399, "lr": 2.5366717625277193e-05} +{"train_loss": 0.001137835206463933, "global_step": 47576, "epoch": 399, "lr": 2.5364789671584405e-05} +{"train_loss": 0.0011658936273306608, "global_step": 47577, "epoch": 399, "lr": 2.536286176626024e-05} +{"train_loss": 0.001018740702420473, "global_step": 47578, "epoch": 399, "lr": 2.536093390930846e-05} +{"train_loss": 0.0008259156602434814, "global_step": 47579, "epoch": 399, "lr": 2.535900610073283e-05} +{"train_loss": 0.001183277228847146, "global_step": 47580, "epoch": 399, "lr": 2.5357078340537187e-05} +{"train_loss": 0.0011332551948726177, "global_step": 47581, "epoch": 399, "lr": 2.5355150628725266e-05} +{"train_loss": 0.0013442026684060693, "global_step": 47582, "epoch": 399, "lr": 2.5353222965300895e-05} +{"train_loss": 0.0010203862329944968, "global_step": 47583, "epoch": 399, "lr": 2.535129535026781e-05} +{"train_loss": 0.0011888447916135192, "global_step": 47584, "epoch": 399, "lr": 2.5349367783629852e-05} +{"train_loss": 0.0008454301860183477, "global_step": 47585, "epoch": 399, "lr": 2.5347440265390754e-05} +{"train_loss": 0.0007787419017404318, "global_step": 47586, "epoch": 399, "lr": 2.5345512795554326e-05} +{"train_loss": 0.0033670852426439524, "global_step": 47587, "epoch": 399, "lr": 2.534358537412436e-05} +{"train_loss": 0.0011817425256595016, "global_step": 47588, "epoch": 399, "lr": 2.534165800110462e-05} +{"train_loss": 0.001412952900864184, "global_step": 47589, "epoch": 399, "lr": 2.533973067649892e-05} +{"train_loss": 0.0008329209522344172, "global_step": 47590, "epoch": 399, "lr": 2.5337803400311e-05} +{"train_loss": 0.0010564711410552263, "global_step": 47591, "epoch": 399, "lr": 2.5335876172544687e-05} +{"train_loss": 0.0011400677030906081, "global_step": 47592, "epoch": 399, "lr": 2.533394899320375e-05} +{"train_loss": 0.001202595653012395, "global_step": 47593, "epoch": 399, "lr": 2.5332021862291942e-05} +{"train_loss": 0.0014709128299728036, "global_step": 47594, "epoch": 399, "lr": 2.53300947798131e-05} +{"train_loss": 0.001108457800000906, "global_step": 47595, "epoch": 399, "lr": 2.5328167745770964e-05} +{"train_loss": 0.0013155096676200628, "global_step": 47596, "epoch": 399, "lr": 2.532624076016935e-05} +{"train_loss": 0.0013984109973534942, "global_step": 47597, "epoch": 399, "lr": 2.5324313823012024e-05} +{"train_loss": 0.0007426876109093428, "global_step": 47598, "epoch": 399, "lr": 2.5322386934302757e-05} +{"train_loss": 0.0010617743860128015, "global_step": 47599, "epoch": 399, "lr": 2.5320460094045367e-05, "val_loss": 0.018352404236793518} +{"train_loss": 0.0012586511438712478, "global_step": 47600, "epoch": 400, "lr": 2.5318533302243597e-05} +{"train_loss": 0.0016886318335309625, "global_step": 47601, "epoch": 400, "lr": 2.5316606558901267e-05} +{"train_loss": 0.0009134316351264715, "global_step": 47602, "epoch": 400, "lr": 2.5314679864022124e-05} +{"train_loss": 0.0012395965168252587, "global_step": 47603, "epoch": 400, "lr": 2.5312753217609985e-05} +{"train_loss": 0.0023596042301505804, "global_step": 47604, "epoch": 400, "lr": 2.5310826619668626e-05} +{"train_loss": 0.0008844526018947363, "global_step": 47605, "epoch": 400, "lr": 2.5308900070201797e-05} +{"train_loss": 0.0009915719274431467, "global_step": 47606, "epoch": 400, "lr": 2.5306973569213323e-05} +{"train_loss": 0.0007585913990624249, "global_step": 47607, "epoch": 400, "lr": 2.5305047116706955e-05} +{"train_loss": 0.0013731119688600302, "global_step": 47608, "epoch": 400, "lr": 2.53031207126865e-05} +{"train_loss": 0.0020776749588549137, "global_step": 47609, "epoch": 400, "lr": 2.5301194357155716e-05} +{"train_loss": 0.0011076971422880888, "global_step": 47610, "epoch": 400, "lr": 2.529926805011842e-05} +{"train_loss": 0.0016870065592229366, "global_step": 47611, "epoch": 400, "lr": 2.5297341791578366e-05} +{"train_loss": 0.0007558568613603711, "global_step": 47612, "epoch": 400, "lr": 2.5295415581539323e-05} +{"train_loss": 0.0008720509358681738, "global_step": 47613, "epoch": 400, "lr": 2.5293489420005113e-05} +{"train_loss": 0.001515062409453094, "global_step": 47614, "epoch": 400, "lr": 2.529156330697948e-05} +{"train_loss": 0.0007882847567088902, "global_step": 47615, "epoch": 400, "lr": 2.5289637242466234e-05} +{"train_loss": 0.0026655804831534624, "global_step": 47616, "epoch": 400, "lr": 2.5287711226469134e-05} +{"train_loss": 0.0009496152051724494, "global_step": 47617, "epoch": 400, "lr": 2.528578525899199e-05} +{"train_loss": 0.0013653734931722283, "global_step": 47618, "epoch": 400, "lr": 2.5283859340038552e-05} +{"train_loss": 0.0006285684066824615, "global_step": 47619, "epoch": 400, "lr": 2.528193346961263e-05} +{"train_loss": 0.0007634651265107095, "global_step": 47620, "epoch": 400, "lr": 2.5280007647717974e-05} +{"train_loss": 0.0013240582775324583, "global_step": 47621, "epoch": 400, "lr": 2.527808187435837e-05} +{"train_loss": 0.0007628321181982756, "global_step": 47622, "epoch": 400, "lr": 2.5276156149537643e-05} +{"train_loss": 0.0017581876600161195, "global_step": 47623, "epoch": 400, "lr": 2.5274230473259542e-05} +{"train_loss": 0.0012836616951972246, "global_step": 47624, "epoch": 400, "lr": 2.5272304845527827e-05} +{"train_loss": 0.0006382793071679771, "global_step": 47625, "epoch": 400, "lr": 2.5270379266346316e-05} +{"train_loss": 0.000770045502576977, "global_step": 47626, "epoch": 400, "lr": 2.5268453735718756e-05} +{"train_loss": 0.0015405674930661917, "global_step": 47627, "epoch": 400, "lr": 2.526652825364897e-05} +{"train_loss": 0.0017206233460456133, "global_step": 47628, "epoch": 400, "lr": 2.5264602820140702e-05} +{"train_loss": 0.0013638024684041739, "global_step": 47629, "epoch": 400, "lr": 2.5262677435197734e-05} +{"train_loss": 0.001341720693744719, "global_step": 47630, "epoch": 400, "lr": 2.526075209882387e-05} +{"train_loss": 0.00048759407945908606, "global_step": 47631, "epoch": 400, "lr": 2.5258826811022857e-05} +{"train_loss": 0.0019423237536102533, "global_step": 47632, "epoch": 400, "lr": 2.525690157179852e-05} +{"train_loss": 0.0009907626081258059, "global_step": 47633, "epoch": 400, "lr": 2.5254976381154583e-05} +{"train_loss": 0.0012780827237293124, "global_step": 47634, "epoch": 400, "lr": 2.5253051239094883e-05} +{"train_loss": 0.0006729409797117114, "global_step": 47635, "epoch": 400, "lr": 2.5251126145623172e-05} +{"train_loss": 0.0006222085212357342, "global_step": 47636, "epoch": 400, "lr": 2.5249201100743214e-05} +{"train_loss": 0.0012163285864517093, "global_step": 47637, "epoch": 400, "lr": 2.5247276104458816e-05} +{"train_loss": 0.0009801434352993965, "global_step": 47638, "epoch": 400, "lr": 2.5245351156773733e-05} +{"train_loss": 0.0007864154758863151, "global_step": 47639, "epoch": 400, "lr": 2.5243426257691784e-05} +{"train_loss": 0.000997979543171823, "global_step": 47640, "epoch": 400, "lr": 2.5241501407216695e-05} +{"train_loss": 0.002035569166764617, "global_step": 47641, "epoch": 400, "lr": 2.5239576605352295e-05} +{"train_loss": 0.0011568180052563548, "global_step": 47642, "epoch": 400, "lr": 2.523765185210234e-05} +{"train_loss": 0.0012061572633683681, "global_step": 47643, "epoch": 400, "lr": 2.5235727147470588e-05} +{"train_loss": 0.0010280952556058764, "global_step": 47644, "epoch": 400, "lr": 2.5233802491460867e-05} +{"train_loss": 0.0007277103723026812, "global_step": 47645, "epoch": 400, "lr": 2.5231877884076905e-05} +{"train_loss": 0.00212489883415401, "global_step": 47646, "epoch": 400, "lr": 2.5229953325322525e-05} +{"train_loss": 0.0008340918575413525, "global_step": 47647, "epoch": 400, "lr": 2.5228028815201466e-05} +{"train_loss": 0.0013744138414040208, "global_step": 47648, "epoch": 400, "lr": 2.5226104353717543e-05} +{"train_loss": 0.0009945272468030453, "global_step": 47649, "epoch": 400, "lr": 2.5224179940874505e-05} +{"train_loss": 0.0006030883523635566, "global_step": 47650, "epoch": 400, "lr": 2.5222255576676156e-05} +{"train_loss": 0.0007968733552843332, "global_step": 47651, "epoch": 400, "lr": 2.522033126112624e-05} +{"train_loss": 0.0009315020870417356, "global_step": 47652, "epoch": 400, "lr": 2.5218406994228583e-05} +{"train_loss": 0.0012907085474580526, "global_step": 47653, "epoch": 400, "lr": 2.521648277598691e-05} +{"train_loss": 0.0008163749007508159, "global_step": 47654, "epoch": 400, "lr": 2.521455860640505e-05} +{"train_loss": 0.001267016283236444, "global_step": 47655, "epoch": 400, "lr": 2.521263448548673e-05} +{"train_loss": 0.0013037921162322164, "global_step": 47656, "epoch": 400, "lr": 2.5210710413235777e-05} +{"train_loss": 0.0009788144379854202, "global_step": 47657, "epoch": 400, "lr": 2.5208786389655925e-05} +{"train_loss": 0.00047960938536562026, "global_step": 47658, "epoch": 400, "lr": 2.5206862414750997e-05} +{"train_loss": 0.0017951417248696089, "global_step": 47659, "epoch": 400, "lr": 2.520493848852472e-05} +{"train_loss": 0.0008732854039408267, "global_step": 47660, "epoch": 400, "lr": 2.5203014610980925e-05} +{"train_loss": 0.0007188037852756679, "global_step": 47661, "epoch": 400, "lr": 2.5201090782123353e-05} +{"train_loss": 0.0019373451359570026, "global_step": 47662, "epoch": 400, "lr": 2.5199167001955776e-05} +{"train_loss": 0.0015317774377763271, "global_step": 47663, "epoch": 400, "lr": 2.5197243270482002e-05} +{"train_loss": 0.0009863111190497875, "global_step": 47664, "epoch": 400, "lr": 2.5195319587705768e-05} +{"train_loss": 0.0007408103556372225, "global_step": 47665, "epoch": 400, "lr": 2.51933959536309e-05} +{"train_loss": 0.0013206338044255972, "global_step": 47666, "epoch": 400, "lr": 2.5191472368261148e-05} +{"train_loss": 0.0016131808515638113, "global_step": 47667, "epoch": 400, "lr": 2.518954883160027e-05} +{"train_loss": 0.0005308108520694077, "global_step": 47668, "epoch": 400, "lr": 2.5187625343652076e-05} +{"train_loss": 0.0007526044500991702, "global_step": 47669, "epoch": 400, "lr": 2.518570190442031e-05} +{"train_loss": 0.0008691528928466141, "global_step": 47670, "epoch": 400, "lr": 2.5183778513908795e-05} +{"train_loss": 0.0012177701573818922, "global_step": 47671, "epoch": 400, "lr": 2.5181855172121256e-05} +{"train_loss": 0.001392801757901907, "global_step": 47672, "epoch": 400, "lr": 2.5179931879061513e-05} +{"train_loss": 0.001588710700161755, "global_step": 47673, "epoch": 400, "lr": 2.5178008634733318e-05} +{"train_loss": 0.0009643696830607951, "global_step": 47674, "epoch": 400, "lr": 2.517608543914044e-05} +{"train_loss": 0.0006947379442863166, "global_step": 47675, "epoch": 400, "lr": 2.5174162292286675e-05} +{"train_loss": 0.0010598934022709727, "global_step": 47676, "epoch": 400, "lr": 2.5172239194175777e-05} +{"train_loss": 0.0007086948025971651, "global_step": 47677, "epoch": 400, "lr": 2.5170316144811557e-05} +{"train_loss": 0.0012491614324972034, "global_step": 47678, "epoch": 400, "lr": 2.5168393144197766e-05} +{"train_loss": 0.0005495757213793695, "global_step": 47679, "epoch": 400, "lr": 2.5166470192338155e-05} +{"train_loss": 0.0008128983317874372, "global_step": 47680, "epoch": 400, "lr": 2.5164547289236555e-05} +{"train_loss": 0.0010144109837710857, "global_step": 47681, "epoch": 400, "lr": 2.516262443489669e-05} +{"train_loss": 0.0007201107800938189, "global_step": 47682, "epoch": 400, "lr": 2.516070162932236e-05} +{"train_loss": 0.0008967696339823306, "global_step": 47683, "epoch": 400, "lr": 2.5158778872517364e-05} +{"train_loss": 0.0008809471037238836, "global_step": 47684, "epoch": 400, "lr": 2.5156856164485422e-05} +{"train_loss": 0.001052956678904593, "global_step": 47685, "epoch": 400, "lr": 2.515493350523036e-05} +{"train_loss": 0.00065345608163625, "global_step": 47686, "epoch": 400, "lr": 2.5153010894755917e-05} +{"train_loss": 0.000811027770396322, "global_step": 47687, "epoch": 400, "lr": 2.51510883330659e-05} +{"train_loss": 0.0012595744337886572, "global_step": 47688, "epoch": 400, "lr": 2.5149165820164043e-05} +{"train_loss": 0.0006475734990090132, "global_step": 47689, "epoch": 400, "lr": 2.514724335605417e-05} +{"train_loss": 0.00112624978646636, "global_step": 47690, "epoch": 400, "lr": 2.5145320940740015e-05} +{"train_loss": 0.0009475370752625167, "global_step": 47691, "epoch": 400, "lr": 2.5143398574225375e-05} +{"train_loss": 0.0005636553978547454, "global_step": 47692, "epoch": 400, "lr": 2.514147625651402e-05} +{"train_loss": 0.0006919010193087161, "global_step": 47693, "epoch": 400, "lr": 2.51395539876097e-05} +{"train_loss": 0.0014190493384376168, "global_step": 47694, "epoch": 400, "lr": 2.5137631767516235e-05} +{"train_loss": 0.0003903034667018801, "global_step": 47695, "epoch": 400, "lr": 2.5135709596237346e-05} +{"train_loss": 0.0007103766547515988, "global_step": 47696, "epoch": 400, "lr": 2.513378747377686e-05} +{"train_loss": 0.0007612673798575997, "global_step": 47697, "epoch": 400, "lr": 2.513186540013852e-05} +{"train_loss": 0.0014929421013221145, "global_step": 47698, "epoch": 400, "lr": 2.512994337532609e-05} +{"train_loss": 0.0011847078567370772, "global_step": 47699, "epoch": 400, "lr": 2.512802139934338e-05} +{"train_loss": 0.0006323228008113801, "global_step": 47700, "epoch": 400, "lr": 2.5126099472194126e-05} +{"train_loss": 0.0011138389818370342, "global_step": 47701, "epoch": 400, "lr": 2.5124177593882138e-05} +{"train_loss": 0.0007400678587146103, "global_step": 47702, "epoch": 400, "lr": 2.512225576441114e-05} +{"train_loss": 0.001052101724781096, "global_step": 47703, "epoch": 400, "lr": 2.512033398378496e-05} +{"train_loss": 0.0014875452034175396, "global_step": 47704, "epoch": 400, "lr": 2.511841225200735e-05} +{"train_loss": 0.0012014290550723672, "global_step": 47705, "epoch": 400, "lr": 2.5116490569082052e-05} +{"train_loss": 0.0010544512188062072, "global_step": 47706, "epoch": 400, "lr": 2.5114568935012895e-05} +{"train_loss": 0.0011218024883419275, "global_step": 47707, "epoch": 400, "lr": 2.5112647349803597e-05} +{"train_loss": 0.001142539898864925, "global_step": 47708, "epoch": 400, "lr": 2.511072581345798e-05} +{"train_loss": 0.0010048574768006802, "global_step": 47709, "epoch": 400, "lr": 2.5108804325979773e-05} +{"train_loss": 0.0014529484324157238, "global_step": 47710, "epoch": 400, "lr": 2.510688288737279e-05} +{"train_loss": 0.0006458999705500901, "global_step": 47711, "epoch": 400, "lr": 2.5104961497640782e-05} +{"train_loss": 0.0007732811500318348, "global_step": 47712, "epoch": 400, "lr": 2.5103040156787506e-05} +{"train_loss": 0.0012680958025157452, "global_step": 47713, "epoch": 400, "lr": 2.5101118864816765e-05} +{"train_loss": 0.0008540484705008566, "global_step": 47714, "epoch": 400, "lr": 2.50991976217323e-05} +{"train_loss": 0.0011901205871254206, "global_step": 47715, "epoch": 400, "lr": 2.509727642753792e-05} +{"train_loss": 0.000893547257874161, "global_step": 47716, "epoch": 400, "lr": 2.509535528223736e-05} +{"train_loss": 0.0010900124907493591, "global_step": 47717, "epoch": 400, "lr": 2.509343418583441e-05} +{"train_loss": 0.0010977846263622191, "global_step": 47718, "epoch": 400, "lr": 2.5091513138332855e-05, "val_loss": 0.03897673264145851, "train_action_mse_error": 1.4711062249261886e-05} +{"train_loss": 0.000722344615496695, "global_step": 47719, "epoch": 401, "lr": 2.5089592139736434e-05} +{"train_loss": 0.00047632999485358596, "global_step": 47720, "epoch": 401, "lr": 2.5087671190048956e-05} +{"train_loss": 0.001152589451521635, "global_step": 47721, "epoch": 401, "lr": 2.508575028927416e-05} +{"train_loss": 0.001587117905728519, "global_step": 47722, "epoch": 401, "lr": 2.5083829437415852e-05} +{"train_loss": 0.0012876272667199373, "global_step": 47723, "epoch": 401, "lr": 2.508190863447778e-05} +{"train_loss": 0.0007613493944518268, "global_step": 47724, "epoch": 401, "lr": 2.5079987880463696e-05} +{"train_loss": 0.0013189584715291858, "global_step": 47725, "epoch": 401, "lr": 2.507806717537742e-05} +{"train_loss": 0.0010562086245045066, "global_step": 47726, "epoch": 401, "lr": 2.5076146519222667e-05} +{"train_loss": 0.001029908424243331, "global_step": 47727, "epoch": 401, "lr": 2.5074225912003264e-05} +{"train_loss": 0.000969761866144836, "global_step": 47728, "epoch": 401, "lr": 2.5072305353722935e-05} +{"train_loss": 0.0006894280668348074, "global_step": 47729, "epoch": 401, "lr": 2.5070384844385487e-05} +{"train_loss": 0.0015347112203016877, "global_step": 47730, "epoch": 401, "lr": 2.5068464383994683e-05} +{"train_loss": 0.0012834989465773106, "global_step": 47731, "epoch": 401, "lr": 2.5066543972554257e-05} +{"train_loss": 0.0007335231057368219, "global_step": 47732, "epoch": 401, "lr": 2.5064623610068033e-05} +{"train_loss": 0.0009515965357422829, "global_step": 47733, "epoch": 401, "lr": 2.5062703296539734e-05} +{"train_loss": 0.0018657197942957282, "global_step": 47734, "epoch": 401, "lr": 2.506078303197318e-05} +{"train_loss": 0.0011197762796655297, "global_step": 47735, "epoch": 401, "lr": 2.5058862816372107e-05} +{"train_loss": 0.00048554842942394316, "global_step": 47736, "epoch": 401, "lr": 2.5056942649740277e-05} +{"train_loss": 0.0015950415981933475, "global_step": 47737, "epoch": 401, "lr": 2.505502253208149e-05} +{"train_loss": 0.0007800066377967596, "global_step": 47738, "epoch": 401, "lr": 2.5053102463399485e-05} +{"train_loss": 0.0011289685498923063, "global_step": 47739, "epoch": 401, "lr": 2.5051182443698063e-05} +{"train_loss": 0.0009170022094622254, "global_step": 47740, "epoch": 401, "lr": 2.5049262472980965e-05} +{"train_loss": 0.0010103065287694335, "global_step": 47741, "epoch": 401, "lr": 2.5047342551251995e-05} +{"train_loss": 0.0010982755338773131, "global_step": 47742, "epoch": 401, "lr": 2.5045422678514895e-05} +{"train_loss": 0.0011719330213963985, "global_step": 47743, "epoch": 401, "lr": 2.5043502854773426e-05} +{"train_loss": 0.001478621968999505, "global_step": 47744, "epoch": 401, "lr": 2.5041583080031394e-05} +{"train_loss": 0.0007670024642720819, "global_step": 47745, "epoch": 401, "lr": 2.5039663354292532e-05} +{"train_loss": 0.001822328777052462, "global_step": 47746, "epoch": 401, "lr": 2.503774367756063e-05} +{"train_loss": 0.0016607734141871333, "global_step": 47747, "epoch": 401, "lr": 2.5035824049839446e-05} +{"train_loss": 0.0012483219616115093, "global_step": 47748, "epoch": 401, "lr": 2.5033904471132768e-05} +{"train_loss": 0.00143349205609411, "global_step": 47749, "epoch": 401, "lr": 2.503198494144433e-05} +{"train_loss": 0.0008649307419545949, "global_step": 47750, "epoch": 401, "lr": 2.503006546077795e-05} +{"train_loss": 0.0007238698308356106, "global_step": 47751, "epoch": 401, "lr": 2.5028146029137345e-05} +{"train_loss": 0.000987047329545021, "global_step": 47752, "epoch": 401, "lr": 2.502622664652632e-05} +{"train_loss": 0.0007475184975191951, "global_step": 47753, "epoch": 401, "lr": 2.5024307312948614e-05} +{"train_loss": 0.0012873937375843525, "global_step": 47754, "epoch": 401, "lr": 2.502238802840804e-05} +{"train_loss": 0.0012739647645503283, "global_step": 47755, "epoch": 401, "lr": 2.5020468792908312e-05} +{"train_loss": 0.0007063884986564517, "global_step": 47756, "epoch": 401, "lr": 2.5018549606453244e-05} +{"train_loss": 0.0013904634397476912, "global_step": 47757, "epoch": 401, "lr": 2.501663046904657e-05} +{"train_loss": 0.0007560327067039907, "global_step": 47758, "epoch": 401, "lr": 2.501471138069209e-05} +{"train_loss": 0.0007416882435791194, "global_step": 47759, "epoch": 401, "lr": 2.5012792341393533e-05} +{"train_loss": 0.001382677466608584, "global_step": 47760, "epoch": 401, "lr": 2.501087335115471e-05} +{"train_loss": 0.0018548730295151472, "global_step": 47761, "epoch": 401, "lr": 2.5008954409979367e-05} +{"train_loss": 0.0011891908943653107, "global_step": 47762, "epoch": 401, "lr": 2.5007035517871257e-05} +{"train_loss": 0.0019393612165004015, "global_step": 47763, "epoch": 401, "lr": 2.5005116674834177e-05} +{"train_loss": 0.0012911116937175393, "global_step": 47764, "epoch": 401, "lr": 2.5003197880871866e-05} +{"train_loss": 0.00040403305320069194, "global_step": 47765, "epoch": 401, "lr": 2.500127913598812e-05} +{"train_loss": 0.0010865736985579133, "global_step": 47766, "epoch": 401, "lr": 2.4999360440186692e-05} +{"train_loss": 0.0016528762644156814, "global_step": 47767, "epoch": 401, "lr": 2.499744179347133e-05} +{"train_loss": 0.0012172393035143614, "global_step": 47768, "epoch": 401, "lr": 2.499552319584584e-05} +{"train_loss": 0.0011494581121951342, "global_step": 47769, "epoch": 401, "lr": 2.499360464731395e-05} +{"train_loss": 0.0013892716960981488, "global_step": 47770, "epoch": 401, "lr": 2.4991686147879462e-05} +{"train_loss": 0.0007987517165020108, "global_step": 47771, "epoch": 401, "lr": 2.4989767697546112e-05} +{"train_loss": 0.0013722884468734264, "global_step": 47772, "epoch": 401, "lr": 2.49878492963177e-05} +{"train_loss": 0.002633815398439765, "global_step": 47773, "epoch": 401, "lr": 2.4985930944197973e-05} +{"train_loss": 0.0009592653368599713, "global_step": 47774, "epoch": 401, "lr": 2.4984012641190673e-05} +{"train_loss": 0.0012061186134815216, "global_step": 47775, "epoch": 401, "lr": 2.4982094387299614e-05} +{"train_loss": 0.0012172282440587878, "global_step": 47776, "epoch": 401, "lr": 2.4980176182528525e-05} +{"train_loss": 0.0011833818862214684, "global_step": 47777, "epoch": 401, "lr": 2.4978258026881203e-05} +{"train_loss": 0.0008598056738264859, "global_step": 47778, "epoch": 401, "lr": 2.497633992036138e-05} +{"train_loss": 0.00084352632984519, "global_step": 47779, "epoch": 401, "lr": 2.4974421862972857e-05} +{"train_loss": 0.0006859650602564216, "global_step": 47780, "epoch": 401, "lr": 2.497250385471937e-05} +{"train_loss": 0.0022187470458447933, "global_step": 47781, "epoch": 401, "lr": 2.497058589560471e-05} +{"train_loss": 0.0013939967611804605, "global_step": 47782, "epoch": 401, "lr": 2.4968667985632616e-05} +{"train_loss": 0.0020744623616337776, "global_step": 47783, "epoch": 401, "lr": 2.4966750124806886e-05} +{"train_loss": 0.0011702715419232845, "global_step": 47784, "epoch": 401, "lr": 2.4964832313131248e-05} +{"train_loss": 0.0006686753476969898, "global_step": 47785, "epoch": 401, "lr": 2.4962914550609508e-05} +{"train_loss": 0.00172447320073843, "global_step": 47786, "epoch": 401, "lr": 2.4960996837245386e-05} +{"train_loss": 0.0011484769638627768, "global_step": 47787, "epoch": 401, "lr": 2.4959079173042697e-05} +{"train_loss": 0.0012173735303804278, "global_step": 47788, "epoch": 401, "lr": 2.495716155800516e-05} +{"train_loss": 0.0009338500676676631, "global_step": 47789, "epoch": 401, "lr": 2.4955243992136578e-05} +{"train_loss": 0.0005608405917882919, "global_step": 47790, "epoch": 401, "lr": 2.495332647544068e-05} +{"train_loss": 0.0006451585795730352, "global_step": 47791, "epoch": 401, "lr": 2.4951409007921274e-05} +{"train_loss": 0.0009880171855911613, "global_step": 47792, "epoch": 401, "lr": 2.494949158958209e-05} +{"train_loss": 0.0005475009675137699, "global_step": 47793, "epoch": 401, "lr": 2.4947574220426894e-05} +{"train_loss": 0.0010814613196998835, "global_step": 47794, "epoch": 401, "lr": 2.4945656900459473e-05} +{"train_loss": 0.0013648240128532052, "global_step": 47795, "epoch": 401, "lr": 2.494373962968356e-05} +{"train_loss": 0.0010834673885256052, "global_step": 47796, "epoch": 401, "lr": 2.494182240810296e-05} +{"train_loss": 0.0013096821494400501, "global_step": 47797, "epoch": 401, "lr": 2.493990523572141e-05} +{"train_loss": 0.000829941825941205, "global_step": 47798, "epoch": 401, "lr": 2.493798811254266e-05} +{"train_loss": 0.0013731698272749782, "global_step": 47799, "epoch": 401, "lr": 2.4936071038570513e-05} +{"train_loss": 0.0010401951149106026, "global_step": 47800, "epoch": 401, "lr": 2.4934154013808697e-05} +{"train_loss": 0.0007686780882067978, "global_step": 47801, "epoch": 401, "lr": 2.493223703826101e-05} +{"train_loss": 0.00079601991456002, "global_step": 47802, "epoch": 401, "lr": 2.493032011193117e-05} +{"train_loss": 0.0008634019177407026, "global_step": 47803, "epoch": 401, "lr": 2.4928403234822993e-05} +{"train_loss": 0.001154900761321187, "global_step": 47804, "epoch": 401, "lr": 2.492648640694022e-05} +{"train_loss": 0.0008690474787726998, "global_step": 47805, "epoch": 401, "lr": 2.4924569628286594e-05} +{"train_loss": 0.0006412392831407487, "global_step": 47806, "epoch": 401, "lr": 2.4922652898865912e-05} +{"train_loss": 0.0010562509996816516, "global_step": 47807, "epoch": 401, "lr": 2.4920736218681906e-05} +{"train_loss": 0.0011257639853283763, "global_step": 47808, "epoch": 401, "lr": 2.491881958773837e-05} +{"train_loss": 0.0016506110550835729, "global_step": 47809, "epoch": 401, "lr": 2.4916903006039033e-05} +{"train_loss": 0.0008692010887898505, "global_step": 47810, "epoch": 401, "lr": 2.4914986473587698e-05} +{"train_loss": 0.000636527722235769, "global_step": 47811, "epoch": 401, "lr": 2.491306999038811e-05} +{"train_loss": 0.0014914697967469692, "global_step": 47812, "epoch": 401, "lr": 2.4911153556444005e-05} +{"train_loss": 0.0015392753994092345, "global_step": 47813, "epoch": 401, "lr": 2.4909237171759193e-05} +{"train_loss": 0.0010743711609393358, "global_step": 47814, "epoch": 401, "lr": 2.4907320836337394e-05} +{"train_loss": 0.0011055304203182459, "global_step": 47815, "epoch": 401, "lr": 2.490540455018239e-05} +{"train_loss": 0.0009757665102370083, "global_step": 47816, "epoch": 401, "lr": 2.4903488313297958e-05} +{"train_loss": 0.0012155931908637285, "global_step": 47817, "epoch": 401, "lr": 2.4901572125687826e-05} +{"train_loss": 0.000925620726775378, "global_step": 47818, "epoch": 401, "lr": 2.48996559873558e-05} +{"train_loss": 0.0009400987182743847, "global_step": 47819, "epoch": 401, "lr": 2.48977398983056e-05} +{"train_loss": 0.0007365565397776663, "global_step": 47820, "epoch": 401, "lr": 2.4895823858541017e-05} +{"train_loss": 0.0013379785232245922, "global_step": 47821, "epoch": 401, "lr": 2.489390786806579e-05} +{"train_loss": 0.00074498396134004, "global_step": 47822, "epoch": 401, "lr": 2.4891991926883706e-05} +{"train_loss": 0.0010975970653817058, "global_step": 47823, "epoch": 401, "lr": 2.4890076034998522e-05} +{"train_loss": 0.0009891949594020844, "global_step": 47824, "epoch": 401, "lr": 2.4888160192413963e-05} +{"train_loss": 0.0006916197598911822, "global_step": 47825, "epoch": 401, "lr": 2.488624439913384e-05} +{"train_loss": 0.0012382455170154572, "global_step": 47826, "epoch": 401, "lr": 2.4884328655161877e-05} +{"train_loss": 0.0010038273176178336, "global_step": 47827, "epoch": 401, "lr": 2.488241296050187e-05} +{"train_loss": 0.0010107560083270073, "global_step": 47828, "epoch": 401, "lr": 2.4880497315157543e-05} +{"train_loss": 0.002174339024350047, "global_step": 47829, "epoch": 401, "lr": 2.4878581719132694e-05} +{"train_loss": 0.0005899292882531881, "global_step": 47830, "epoch": 401, "lr": 2.4876666172431062e-05} +{"train_loss": 0.0005419052322395146, "global_step": 47831, "epoch": 401, "lr": 2.4874750675056396e-05} +{"train_loss": 0.0014572769869118929, "global_step": 47832, "epoch": 401, "lr": 2.4872835227012493e-05} +{"train_loss": 0.001153067103587091, "global_step": 47833, "epoch": 401, "lr": 2.4870919828303075e-05} +{"train_loss": 0.0007208317401818931, "global_step": 47834, "epoch": 401, "lr": 2.486900447893194e-05} +{"train_loss": 0.001411616918630898, "global_step": 47835, "epoch": 401, "lr": 2.486708917890283e-05} +{"train_loss": 0.0005876738578081131, "global_step": 47836, "epoch": 401, "lr": 2.4865173928219483e-05} +{"train_loss": 0.0011144169665454346, "global_step": 47837, "epoch": 401, "lr": 2.4863258726885703e-05, "val_loss": 0.028314128518104553} +{"train_loss": 0.0013924025697633624, "global_step": 47838, "epoch": 402, "lr": 2.486134357490521e-05} +{"train_loss": 0.0012454907409846783, "global_step": 47839, "epoch": 402, "lr": 2.4859428472281805e-05} +{"train_loss": 0.001155841862782836, "global_step": 47840, "epoch": 402, "lr": 2.4857513419019202e-05} +{"train_loss": 0.0006301578832790256, "global_step": 47841, "epoch": 402, "lr": 2.4855598415121206e-05} +{"train_loss": 0.0008526519523002207, "global_step": 47842, "epoch": 402, "lr": 2.485368346059156e-05} +{"train_loss": 0.000532478850800544, "global_step": 47843, "epoch": 402, "lr": 2.4851768555433995e-05} +{"train_loss": 0.001218849210999906, "global_step": 47844, "epoch": 402, "lr": 2.484985369965232e-05} +{"train_loss": 0.0006734589696861804, "global_step": 47845, "epoch": 402, "lr": 2.484793889325025e-05} +{"train_loss": 0.0009085604688152671, "global_step": 47846, "epoch": 402, "lr": 2.4846024136231583e-05} +{"train_loss": 0.0013177369255572557, "global_step": 47847, "epoch": 402, "lr": 2.4844109428600043e-05} +{"train_loss": 0.0010295307729393244, "global_step": 47848, "epoch": 402, "lr": 2.4842194770359424e-05} +{"train_loss": 0.0008743158541619778, "global_step": 47849, "epoch": 402, "lr": 2.4840280161513447e-05} +{"train_loss": 0.0006385009619407356, "global_step": 47850, "epoch": 402, "lr": 2.4838365602065893e-05} +{"train_loss": 0.0009169838158413768, "global_step": 47851, "epoch": 402, "lr": 2.483645109202054e-05} +{"train_loss": 0.0005562951555475593, "global_step": 47852, "epoch": 402, "lr": 2.4834536631381113e-05} +{"train_loss": 0.001296875299885869, "global_step": 47853, "epoch": 402, "lr": 2.48326222201514e-05} +{"train_loss": 0.0006964387139305472, "global_step": 47854, "epoch": 402, "lr": 2.483070785833514e-05} +{"train_loss": 0.0011675003916025162, "global_step": 47855, "epoch": 402, "lr": 2.482879354593608e-05} +{"train_loss": 0.0010052570141851902, "global_step": 47856, "epoch": 402, "lr": 2.4826879282958014e-05} +{"train_loss": 0.0012801806442439556, "global_step": 47857, "epoch": 402, "lr": 2.482496506940466e-05} +{"train_loss": 0.0008293056162074208, "global_step": 47858, "epoch": 402, "lr": 2.482305090527982e-05} +{"train_loss": 0.0011182361049577594, "global_step": 47859, "epoch": 402, "lr": 2.4821136790587207e-05} +{"train_loss": 0.0011085697915405035, "global_step": 47860, "epoch": 402, "lr": 2.4819222725330628e-05} +{"train_loss": 0.000737555674277246, "global_step": 47861, "epoch": 402, "lr": 2.481730870951381e-05} +{"train_loss": 0.0005120796267874539, "global_step": 47862, "epoch": 402, "lr": 2.4815394743140497e-05} +{"train_loss": 0.0010867955861613154, "global_step": 47863, "epoch": 402, "lr": 2.4813480826214484e-05} +{"train_loss": 0.0005022374098189175, "global_step": 47864, "epoch": 402, "lr": 2.4811566958739495e-05} +{"train_loss": 0.0010663935681805015, "global_step": 47865, "epoch": 402, "lr": 2.480965314071932e-05} +{"train_loss": 0.0007075059693306684, "global_step": 47866, "epoch": 402, "lr": 2.48077393721577e-05} +{"train_loss": 0.0015581791521981359, "global_step": 47867, "epoch": 402, "lr": 2.4805825653058374e-05} +{"train_loss": 0.0005507671739906073, "global_step": 47868, "epoch": 402, "lr": 2.4803911983425138e-05} +{"train_loss": 0.0007046338869258761, "global_step": 47869, "epoch": 402, "lr": 2.480199836326171e-05} +{"train_loss": 0.0016424369532614946, "global_step": 47870, "epoch": 402, "lr": 2.4800084792571883e-05} +{"train_loss": 0.0005118500557728112, "global_step": 47871, "epoch": 402, "lr": 2.4798171271359378e-05} +{"train_loss": 0.0006043156026862562, "global_step": 47872, "epoch": 402, "lr": 2.4796257799627987e-05} +{"train_loss": 0.0014199032448232174, "global_step": 47873, "epoch": 402, "lr": 2.4794344377381456e-05} +{"train_loss": 0.0007887238170951605, "global_step": 47874, "epoch": 402, "lr": 2.4792431004623517e-05} +{"train_loss": 0.0009817159734666348, "global_step": 47875, "epoch": 402, "lr": 2.4790517681357967e-05} +{"train_loss": 0.0012120443861931562, "global_step": 47876, "epoch": 402, "lr": 2.4788604407588523e-05} +{"train_loss": 0.0005630283849313855, "global_step": 47877, "epoch": 402, "lr": 2.4786691183318977e-05} +{"train_loss": 0.00170873012393713, "global_step": 47878, "epoch": 402, "lr": 2.4784778008553054e-05} +{"train_loss": 0.0006274229963310063, "global_step": 47879, "epoch": 402, "lr": 2.4782864883294544e-05} +{"train_loss": 0.000539202825166285, "global_step": 47880, "epoch": 402, "lr": 2.4780951807547166e-05} +{"train_loss": 0.0009073970722965896, "global_step": 47881, "epoch": 402, "lr": 2.4779038781314712e-05} +{"train_loss": 0.000595884514041245, "global_step": 47882, "epoch": 402, "lr": 2.4777125804600898e-05} +{"train_loss": 0.000707285653334111, "global_step": 47883, "epoch": 402, "lr": 2.4775212877409526e-05} +{"train_loss": 0.0011709727114066482, "global_step": 47884, "epoch": 402, "lr": 2.477329999974431e-05} +{"train_loss": 0.001471595256589353, "global_step": 47885, "epoch": 402, "lr": 2.4771387171609044e-05} +{"train_loss": 0.0006252806633710861, "global_step": 47886, "epoch": 402, "lr": 2.4769474393007447e-05} +{"train_loss": 0.0013542530359700322, "global_step": 47887, "epoch": 402, "lr": 2.4767561663943306e-05} +{"train_loss": 0.0009728464065119624, "global_step": 47888, "epoch": 402, "lr": 2.4765648984420343e-05} +{"train_loss": 0.0007924309466034174, "global_step": 47889, "epoch": 402, "lr": 2.4763736354442353e-05} +{"train_loss": 0.0005431199679151177, "global_step": 47890, "epoch": 402, "lr": 2.4761823774013053e-05} +{"train_loss": 0.0017921703401952982, "global_step": 47891, "epoch": 402, "lr": 2.475991124313623e-05} +{"train_loss": 0.001507853507064283, "global_step": 47892, "epoch": 402, "lr": 2.4757998761815633e-05} +{"train_loss": 0.0010674982331693172, "global_step": 47893, "epoch": 402, "lr": 2.4756086330054984e-05} +{"train_loss": 0.0007762765744701028, "global_step": 47894, "epoch": 402, "lr": 2.4754173947858085e-05} +{"train_loss": 0.001320683746598661, "global_step": 47895, "epoch": 402, "lr": 2.4752261615228646e-05} +{"train_loss": 0.0013495439197868109, "global_step": 47896, "epoch": 402, "lr": 2.475034933217046e-05} +{"train_loss": 0.00073098239954561, "global_step": 47897, "epoch": 402, "lr": 2.474843709868725e-05} +{"train_loss": 0.0005510690971277654, "global_step": 47898, "epoch": 402, "lr": 2.4746524914782803e-05} +{"train_loss": 0.0019174605840817094, "global_step": 47899, "epoch": 402, "lr": 2.4744612780460863e-05} +{"train_loss": 0.0009779746178537607, "global_step": 47900, "epoch": 402, "lr": 2.474270069572515e-05} +{"train_loss": 0.0014716841978952289, "global_step": 47901, "epoch": 402, "lr": 2.4740788660579473e-05} +{"train_loss": 0.0010863995412364602, "global_step": 47902, "epoch": 402, "lr": 2.4738876675027534e-05} +{"train_loss": 0.0005861383979208767, "global_step": 47903, "epoch": 402, "lr": 2.4736964739073132e-05} +{"train_loss": 0.00048676374717615545, "global_step": 47904, "epoch": 402, "lr": 2.4735052852720003e-05} +{"train_loss": 0.0010497169569134712, "global_step": 47905, "epoch": 402, "lr": 2.4733141015971878e-05} +{"train_loss": 0.0009316029609180987, "global_step": 47906, "epoch": 402, "lr": 2.473122922883255e-05} +{"train_loss": 0.00121119839604944, "global_step": 47907, "epoch": 402, "lr": 2.4729317491305737e-05} +{"train_loss": 0.0006638730992563069, "global_step": 47908, "epoch": 402, "lr": 2.4727405803395226e-05} +{"train_loss": 0.0007997120264917612, "global_step": 47909, "epoch": 402, "lr": 2.4725494165104735e-05} +{"train_loss": 0.0013711083447560668, "global_step": 47910, "epoch": 402, "lr": 2.472358257643806e-05} +{"train_loss": 0.001553127309307456, "global_step": 47911, "epoch": 402, "lr": 2.4721671037398925e-05} +{"train_loss": 0.0011482026893645525, "global_step": 47912, "epoch": 402, "lr": 2.4719759547991067e-05} +{"train_loss": 0.000550081196706742, "global_step": 47913, "epoch": 402, "lr": 2.4717848108218268e-05} +{"train_loss": 0.0008719240431673825, "global_step": 47914, "epoch": 402, "lr": 2.471593671808428e-05} +{"train_loss": 0.0009719883091747761, "global_step": 47915, "epoch": 402, "lr": 2.4714025377592844e-05} +{"train_loss": 0.0008020189707167447, "global_step": 47916, "epoch": 402, "lr": 2.471211408674773e-05} +{"train_loss": 0.0014340373454615474, "global_step": 47917, "epoch": 402, "lr": 2.471020284555266e-05} +{"train_loss": 0.0008891818579286337, "global_step": 47918, "epoch": 402, "lr": 2.4708291654011422e-05} +{"train_loss": 0.0006164064980112016, "global_step": 47919, "epoch": 402, "lr": 2.4706380512127734e-05} +{"train_loss": 0.0006660684593953192, "global_step": 47920, "epoch": 402, "lr": 2.4704469419905385e-05} +{"train_loss": 0.0008151241345331073, "global_step": 47921, "epoch": 402, "lr": 2.470255837734809e-05} +{"train_loss": 0.0013998596696183085, "global_step": 47922, "epoch": 402, "lr": 2.4700647384459636e-05} +{"train_loss": 0.0013681829441338778, "global_step": 47923, "epoch": 402, "lr": 2.4698736441243758e-05} +{"train_loss": 0.000763602729421109, "global_step": 47924, "epoch": 402, "lr": 2.4696825547704188e-05} +{"train_loss": 0.0013697093818336725, "global_step": 47925, "epoch": 402, "lr": 2.469491470384472e-05} +{"train_loss": 0.0010981856612488627, "global_step": 47926, "epoch": 402, "lr": 2.469300390966906e-05} +{"train_loss": 0.0007839599857106805, "global_step": 47927, "epoch": 402, "lr": 2.4691093165181005e-05} +{"train_loss": 0.0012552511179819703, "global_step": 47928, "epoch": 402, "lr": 2.4689182470384265e-05} +{"train_loss": 0.0014821809018030763, "global_step": 47929, "epoch": 402, "lr": 2.4687271825282633e-05} +{"train_loss": 0.0011773256119340658, "global_step": 47930, "epoch": 402, "lr": 2.468536122987984e-05} +{"train_loss": 0.0009432596270926297, "global_step": 47931, "epoch": 402, "lr": 2.468345068417961e-05} +{"train_loss": 0.0015063596656545997, "global_step": 47932, "epoch": 402, "lr": 2.4681540188185744e-05} +{"train_loss": 0.0009892398957163095, "global_step": 47933, "epoch": 402, "lr": 2.4679629741901945e-05} +{"train_loss": 0.0014558107359334826, "global_step": 47934, "epoch": 402, "lr": 2.4677719345332013e-05} +{"train_loss": 0.0010567590361461043, "global_step": 47935, "epoch": 402, "lr": 2.4675808998479667e-05} +{"train_loss": 0.00106864795088768, "global_step": 47936, "epoch": 402, "lr": 2.4673898701348653e-05} +{"train_loss": 0.0009979850146919489, "global_step": 47937, "epoch": 402, "lr": 2.4671988453942745e-05} +{"train_loss": 0.0013558955397456884, "global_step": 47938, "epoch": 402, "lr": 2.4670078256265667e-05} +{"train_loss": 0.0008778667543083429, "global_step": 47939, "epoch": 402, "lr": 2.4668168108321204e-05} +{"train_loss": 0.001490607624873519, "global_step": 47940, "epoch": 402, "lr": 2.4666258010113065e-05} +{"train_loss": 0.0006919993320479989, "global_step": 47941, "epoch": 402, "lr": 2.466434796164504e-05} +{"train_loss": 0.0016024586511775851, "global_step": 47942, "epoch": 402, "lr": 2.4662437962920865e-05} +{"train_loss": 0.0009107107180170715, "global_step": 47943, "epoch": 402, "lr": 2.466052801394426e-05} +{"train_loss": 0.0010172786423936486, "global_step": 47944, "epoch": 402, "lr": 2.465861811471903e-05} +{"train_loss": 0.0012025596806779504, "global_step": 47945, "epoch": 402, "lr": 2.4656708265248875e-05} +{"train_loss": 0.0016434690915048122, "global_step": 47946, "epoch": 402, "lr": 2.4654798465537576e-05} +{"train_loss": 0.0013108913553878665, "global_step": 47947, "epoch": 402, "lr": 2.4652888715588863e-05} +{"train_loss": 0.0006953231641091406, "global_step": 47948, "epoch": 402, "lr": 2.465097901540649e-05} +{"train_loss": 0.0010252195643261075, "global_step": 47949, "epoch": 402, "lr": 2.464906936499423e-05} +{"train_loss": 0.000985123566351831, "global_step": 47950, "epoch": 402, "lr": 2.4647159764355797e-05} +{"train_loss": 0.0010878799948841333, "global_step": 47951, "epoch": 402, "lr": 2.464525021349498e-05} +{"train_loss": 0.0007545098778791726, "global_step": 47952, "epoch": 402, "lr": 2.464334071241548e-05} +{"train_loss": 0.0022285147570073605, "global_step": 47953, "epoch": 402, "lr": 2.4641431261121097e-05} +{"train_loss": 0.0006123822531662881, "global_step": 47954, "epoch": 402, "lr": 2.4639521859615548e-05} +{"train_loss": 0.0008761576027609408, "global_step": 47955, "epoch": 402, "lr": 2.4637612507902574e-05} +{"train_loss": 0.0010239339236487017, "global_step": 47956, "epoch": 402, "lr": 2.4635703205985955e-05, "val_loss": 0.02741367742419243} +{"train_loss": 0.0016248648753389716, "global_step": 47957, "epoch": 403, "lr": 2.4633793953869405e-05} +{"train_loss": 0.0014582795556634665, "global_step": 47958, "epoch": 403, "lr": 2.463188475155671e-05} +{"train_loss": 0.0034574870951473713, "global_step": 47959, "epoch": 403, "lr": 2.462997559905158e-05} +{"train_loss": 0.0007448868709616363, "global_step": 47960, "epoch": 403, "lr": 2.46280664963578e-05} +{"train_loss": 0.0011225396301597357, "global_step": 47961, "epoch": 403, "lr": 2.4626157443479103e-05} +{"train_loss": 0.001153533230535686, "global_step": 47962, "epoch": 403, "lr": 2.462424844041921e-05} +{"train_loss": 0.0012186117237433791, "global_step": 47963, "epoch": 403, "lr": 2.4622339487181923e-05} +{"train_loss": 0.0021111732348799706, "global_step": 47964, "epoch": 403, "lr": 2.4620430583770937e-05} +{"train_loss": 0.0017570207128301263, "global_step": 47965, "epoch": 403, "lr": 2.4618521730190043e-05} +{"train_loss": 0.0005503693246282637, "global_step": 47966, "epoch": 403, "lr": 2.461661292644295e-05} +{"train_loss": 0.0017574274679645896, "global_step": 47967, "epoch": 403, "lr": 2.4614704172533443e-05} +{"train_loss": 0.0015045577893033624, "global_step": 47968, "epoch": 403, "lr": 2.4612795468465255e-05} +{"train_loss": 0.0006737670628353953, "global_step": 47969, "epoch": 403, "lr": 2.4610886814242113e-05} +{"train_loss": 0.0006770914187654853, "global_step": 47970, "epoch": 403, "lr": 2.46089782098678e-05} +{"train_loss": 0.001158841885626316, "global_step": 47971, "epoch": 403, "lr": 2.4607069655346026e-05} +{"train_loss": 0.0011565655004233122, "global_step": 47972, "epoch": 403, "lr": 2.4605161150680584e-05} +{"train_loss": 0.0007270066416822374, "global_step": 47973, "epoch": 403, "lr": 2.4603252695875185e-05} +{"train_loss": 0.0007073808228597045, "global_step": 47974, "epoch": 403, "lr": 2.460134429093357e-05} +{"train_loss": 0.0015164496144279838, "global_step": 47975, "epoch": 403, "lr": 2.4599435935859527e-05} +{"train_loss": 0.0009712465689517558, "global_step": 47976, "epoch": 403, "lr": 2.459752763065675e-05} +{"train_loss": 0.0012708405265584588, "global_step": 47977, "epoch": 403, "lr": 2.4595619375329038e-05} +{"train_loss": 0.0006817136309109628, "global_step": 47978, "epoch": 403, "lr": 2.4593711169880096e-05} +{"train_loss": 0.0007507186965085566, "global_step": 47979, "epoch": 403, "lr": 2.4591803014313704e-05} +{"train_loss": 0.0020258468575775623, "global_step": 47980, "epoch": 403, "lr": 2.458989490863357e-05} +{"train_loss": 0.000976131297647953, "global_step": 47981, "epoch": 403, "lr": 2.4587986852843486e-05} +{"train_loss": 0.0011813284363597631, "global_step": 47982, "epoch": 403, "lr": 2.458607884694715e-05} +{"train_loss": 0.0008046136936172843, "global_step": 47983, "epoch": 403, "lr": 2.4584170890948345e-05} +{"train_loss": 0.0008718233439140022, "global_step": 47984, "epoch": 403, "lr": 2.458226298485081e-05} +{"train_loss": 0.0009332673507742584, "global_step": 47985, "epoch": 403, "lr": 2.45803551286583e-05} +{"train_loss": 0.0022460026666522026, "global_step": 47986, "epoch": 403, "lr": 2.457844732237452e-05} +{"train_loss": 0.0011014429619535804, "global_step": 47987, "epoch": 403, "lr": 2.457653956600326e-05} +{"train_loss": 0.0017093574861064553, "global_step": 47988, "epoch": 403, "lr": 2.4574631859548237e-05} +{"train_loss": 0.0014503394486382604, "global_step": 47989, "epoch": 403, "lr": 2.457272420301322e-05} +{"train_loss": 0.0016792616806924343, "global_step": 47990, "epoch": 403, "lr": 2.4570816596401925e-05} +{"train_loss": 0.0011806783732026815, "global_step": 47991, "epoch": 403, "lr": 2.4568909039718136e-05} +{"train_loss": 0.0010007243836298585, "global_step": 47992, "epoch": 403, "lr": 2.4567001532965578e-05} +{"train_loss": 0.0013621923280879855, "global_step": 47993, "epoch": 403, "lr": 2.456509407614797e-05} +{"train_loss": 0.0008156441617757082, "global_step": 47994, "epoch": 403, "lr": 2.456318666926911e-05} +{"train_loss": 0.0011311676353216171, "global_step": 47995, "epoch": 403, "lr": 2.456127931233269e-05} +{"train_loss": 0.0010940557112917304, "global_step": 47996, "epoch": 403, "lr": 2.4559372005342502e-05} +{"train_loss": 0.0011535314843058586, "global_step": 47997, "epoch": 403, "lr": 2.455746474830225e-05} +{"train_loss": 0.0010869462275877595, "global_step": 47998, "epoch": 403, "lr": 2.4555557541215718e-05} +{"train_loss": 0.0009041076409630477, "global_step": 47999, "epoch": 403, "lr": 2.455365038408663e-05} +{"train_loss": 0.00144009361974895, "global_step": 48000, "epoch": 403, "lr": 2.4551743276918708e-05} +{"train_loss": 0.0010028420947492123, "global_step": 48001, "epoch": 403, "lr": 2.4549836219715744e-05} +{"train_loss": 0.0008963958825916052, "global_step": 48002, "epoch": 403, "lr": 2.4547929212481435e-05} +{"train_loss": 0.0016594722401350737, "global_step": 48003, "epoch": 403, "lr": 2.454602225521957e-05} +{"train_loss": 0.0019072089344263077, "global_step": 48004, "epoch": 403, "lr": 2.4544115347933866e-05} +{"train_loss": 0.0012997040757909417, "global_step": 48005, "epoch": 403, "lr": 2.4542208490628062e-05} +{"train_loss": 0.0018290849402546883, "global_step": 48006, "epoch": 403, "lr": 2.4540301683305923e-05} +{"train_loss": 0.000981462188065052, "global_step": 48007, "epoch": 403, "lr": 2.4538394925971165e-05} +{"train_loss": 0.0011021073441952467, "global_step": 48008, "epoch": 403, "lr": 2.4536488218627564e-05} +{"train_loss": 0.000981776276603341, "global_step": 48009, "epoch": 403, "lr": 2.453458156127883e-05} +{"train_loss": 0.0007661212584935129, "global_step": 48010, "epoch": 403, "lr": 2.4532674953928748e-05} +{"train_loss": 0.0016719194827601314, "global_step": 48011, "epoch": 403, "lr": 2.4530768396581017e-05} +{"train_loss": 0.0016618616646155715, "global_step": 48012, "epoch": 403, "lr": 2.4528861889239418e-05} +{"train_loss": 0.0011841258965432644, "global_step": 48013, "epoch": 403, "lr": 2.452695543190766e-05} +{"train_loss": 0.0020242929458618164, "global_step": 48014, "epoch": 403, "lr": 2.452504902458952e-05} +{"train_loss": 0.0009908227948471904, "global_step": 48015, "epoch": 403, "lr": 2.452314266728871e-05} +{"train_loss": 0.0014642190653830767, "global_step": 48016, "epoch": 403, "lr": 2.4521236360009003e-05} +{"train_loss": 0.000896962417755276, "global_step": 48017, "epoch": 403, "lr": 2.4519330102754112e-05} +{"train_loss": 0.0007663925644010305, "global_step": 48018, "epoch": 403, "lr": 2.451742389552781e-05} +{"train_loss": 0.0013629290042445064, "global_step": 48019, "epoch": 403, "lr": 2.4515517738333805e-05} +{"train_loss": 0.0009102120529860258, "global_step": 48020, "epoch": 403, "lr": 2.4513611631175876e-05} +{"train_loss": 0.001024030614644289, "global_step": 48021, "epoch": 403, "lr": 2.451170557405773e-05} +{"train_loss": 0.001893636304885149, "global_step": 48022, "epoch": 403, "lr": 2.4509799566983148e-05} +{"train_loss": 0.0007382853655144572, "global_step": 48023, "epoch": 403, "lr": 2.4507893609955853e-05} +{"train_loss": 0.0009432791848666966, "global_step": 48024, "epoch": 403, "lr": 2.450598770297956e-05} +{"train_loss": 0.002406100742518902, "global_step": 48025, "epoch": 403, "lr": 2.450408184605806e-05} +{"train_loss": 0.0008173075621016324, "global_step": 48026, "epoch": 403, "lr": 2.4502176039195052e-05} +{"train_loss": 0.00047790579264983535, "global_step": 48027, "epoch": 403, "lr": 2.450027028239431e-05} +{"train_loss": 0.0013272048672661185, "global_step": 48028, "epoch": 403, "lr": 2.449836457565955e-05} +{"train_loss": 0.001317430636845529, "global_step": 48029, "epoch": 403, "lr": 2.4496458918994546e-05} +{"train_loss": 0.0014361821813508868, "global_step": 48030, "epoch": 403, "lr": 2.449455331240302e-05} +{"train_loss": 0.0008510312763974071, "global_step": 48031, "epoch": 403, "lr": 2.4492647755888694e-05} +{"train_loss": 0.0010645186994224787, "global_step": 48032, "epoch": 403, "lr": 2.449074224945535e-05} +{"train_loss": 0.0009263299289159477, "global_step": 48033, "epoch": 403, "lr": 2.4488836793106683e-05} +{"train_loss": 0.0012039433931931853, "global_step": 48034, "epoch": 403, "lr": 2.4486931386846485e-05} +{"train_loss": 0.0015281878877431154, "global_step": 48035, "epoch": 403, "lr": 2.4485026030678454e-05} +{"train_loss": 0.0010410507675260305, "global_step": 48036, "epoch": 403, "lr": 2.4483120724606363e-05} +{"train_loss": 0.0005646058707498014, "global_step": 48037, "epoch": 403, "lr": 2.4481215468633937e-05} +{"train_loss": 0.0013358755968511105, "global_step": 48038, "epoch": 403, "lr": 2.4479310262764903e-05} +{"train_loss": 0.0015653872396796942, "global_step": 48039, "epoch": 403, "lr": 2.447740510700303e-05} +{"train_loss": 0.0009944298071786761, "global_step": 48040, "epoch": 403, "lr": 2.4475500001352037e-05} +{"train_loss": 0.0011359022464603186, "global_step": 48041, "epoch": 403, "lr": 2.447359494581568e-05} +{"train_loss": 0.0010330576915293932, "global_step": 48042, "epoch": 403, "lr": 2.44716899403977e-05} +{"train_loss": 0.0012534551788121462, "global_step": 48043, "epoch": 403, "lr": 2.4469784985101808e-05} +{"train_loss": 0.0011714271968230605, "global_step": 48044, "epoch": 403, "lr": 2.4467880079931787e-05} +{"train_loss": 0.0013134476030245423, "global_step": 48045, "epoch": 403, "lr": 2.4465975224891334e-05} +{"train_loss": 0.0005488229217007756, "global_step": 48046, "epoch": 403, "lr": 2.4464070419984214e-05} +{"train_loss": 0.0005818411591462791, "global_step": 48047, "epoch": 403, "lr": 2.4462165665214176e-05} +{"train_loss": 0.0012317454675212502, "global_step": 48048, "epoch": 403, "lr": 2.4460260960584935e-05} +{"train_loss": 0.0008280971669591963, "global_step": 48049, "epoch": 403, "lr": 2.445835630610026e-05} +{"train_loss": 0.001497536664828658, "global_step": 48050, "epoch": 403, "lr": 2.4456451701763854e-05} +{"train_loss": 0.0006697383360005915, "global_step": 48051, "epoch": 403, "lr": 2.4454547147579492e-05} +{"train_loss": 0.0019448046805337071, "global_step": 48052, "epoch": 403, "lr": 2.445264264355088e-05} +{"train_loss": 0.0020876023918390274, "global_step": 48053, "epoch": 403, "lr": 2.44507381896818e-05} +{"train_loss": 0.0008415274787694216, "global_step": 48054, "epoch": 403, "lr": 2.4448833785975962e-05} +{"train_loss": 0.0009205690585076809, "global_step": 48055, "epoch": 403, "lr": 2.4446929432437086e-05} +{"train_loss": 0.0013177160872146487, "global_step": 48056, "epoch": 403, "lr": 2.4445025129068962e-05} +{"train_loss": 0.001472483854740858, "global_step": 48057, "epoch": 403, "lr": 2.4443120875875274e-05} +{"train_loss": 0.0009579223114997149, "global_step": 48058, "epoch": 403, "lr": 2.444121667285981e-05} +{"train_loss": 0.0007945242105051875, "global_step": 48059, "epoch": 403, "lr": 2.443931252002627e-05} +{"train_loss": 0.0006803296855650842, "global_step": 48060, "epoch": 403, "lr": 2.443740841737843e-05} +{"train_loss": 0.0005834948387928307, "global_step": 48061, "epoch": 403, "lr": 2.443550436492e-05} +{"train_loss": 0.0014773235889151692, "global_step": 48062, "epoch": 403, "lr": 2.4433600362654706e-05} +{"train_loss": 0.0019007568480446935, "global_step": 48063, "epoch": 403, "lr": 2.443169641058633e-05} +{"train_loss": 0.0007094747852534056, "global_step": 48064, "epoch": 403, "lr": 2.442979250871857e-05} +{"train_loss": 0.0010495062451809645, "global_step": 48065, "epoch": 403, "lr": 2.4427888657055198e-05} +{"train_loss": 0.0018831792986020446, "global_step": 48066, "epoch": 403, "lr": 2.4425984855599916e-05} +{"train_loss": 0.0011558759724721313, "global_step": 48067, "epoch": 403, "lr": 2.4424081104356496e-05} +{"train_loss": 0.0015588923124596477, "global_step": 48068, "epoch": 403, "lr": 2.442217740332866e-05} +{"train_loss": 0.0011809407733380795, "global_step": 48069, "epoch": 403, "lr": 2.442027375252013e-05} +{"train_loss": 0.0008495367947034538, "global_step": 48070, "epoch": 403, "lr": 2.4418370151934676e-05} +{"train_loss": 0.000985364313237369, "global_step": 48071, "epoch": 403, "lr": 2.4416466601576005e-05} +{"train_loss": 0.0014212240930646658, "global_step": 48072, "epoch": 403, "lr": 2.4414563101447886e-05} +{"train_loss": 0.0009499574662186205, "global_step": 48073, "epoch": 403, "lr": 2.441265965155404e-05} +{"train_loss": 0.0005963437142781913, "global_step": 48074, "epoch": 403, "lr": 2.4410756251898176e-05} +{"train_loss": 0.0012071998290983693, "global_step": 48075, "epoch": 403, "lr": 2.4408852902484086e-05, "val_loss": 0.012589371763169765} +{"train_loss": 0.0007424290524795651, "global_step": 48076, "epoch": 404, "lr": 2.4406949603315455e-05} +{"train_loss": 0.0010728653287515044, "global_step": 48077, "epoch": 404, "lr": 2.4405046354396064e-05} +{"train_loss": 0.002022080821916461, "global_step": 48078, "epoch": 404, "lr": 2.4403143155729617e-05} +{"train_loss": 0.001609539962373674, "global_step": 48079, "epoch": 404, "lr": 2.4401240007319875e-05} +{"train_loss": 0.0008596297120675445, "global_step": 48080, "epoch": 404, "lr": 2.439933690917055e-05} +{"train_loss": 0.0008459256496280432, "global_step": 48081, "epoch": 404, "lr": 2.439743386128539e-05} +{"train_loss": 0.0029516678769141436, "global_step": 48082, "epoch": 404, "lr": 2.4395530863668155e-05} +{"train_loss": 0.0009120465256273746, "global_step": 48083, "epoch": 404, "lr": 2.4393627916322536e-05} +{"train_loss": 0.0012993296841159463, "global_step": 48084, "epoch": 404, "lr": 2.4391725019252314e-05} +{"train_loss": 0.0006845044554211199, "global_step": 48085, "epoch": 404, "lr": 2.4389822172461185e-05} +{"train_loss": 0.0005328095867298543, "global_step": 48086, "epoch": 404, "lr": 2.4387919375952923e-05} +{"train_loss": 0.0010707095498219132, "global_step": 48087, "epoch": 404, "lr": 2.4386016629731246e-05} +{"train_loss": 0.0006465993938036263, "global_step": 48088, "epoch": 404, "lr": 2.4384113933799866e-05} +{"train_loss": 0.0012925422051921487, "global_step": 48089, "epoch": 404, "lr": 2.4382211288162565e-05} +{"train_loss": 0.0010776798008009791, "global_step": 48090, "epoch": 404, "lr": 2.438030869282304e-05} +{"train_loss": 0.0012766586150974035, "global_step": 48091, "epoch": 404, "lr": 2.4378406147785054e-05} +{"train_loss": 0.001360816997475922, "global_step": 48092, "epoch": 404, "lr": 2.437650365305233e-05} +{"train_loss": 0.0013315592659637332, "global_step": 48093, "epoch": 404, "lr": 2.437460120862859e-05} +{"train_loss": 0.0012225644895806909, "global_step": 48094, "epoch": 404, "lr": 2.4372698814517598e-05} +{"train_loss": 0.0009562508203089237, "global_step": 48095, "epoch": 404, "lr": 2.4370796470723056e-05} +{"train_loss": 0.0012997477315366268, "global_step": 48096, "epoch": 404, "lr": 2.4368894177248736e-05} +{"train_loss": 0.0009660260402597487, "global_step": 48097, "epoch": 404, "lr": 2.4366991934098333e-05} +{"train_loss": 0.0008075365331023932, "global_step": 48098, "epoch": 404, "lr": 2.4365089741275627e-05} +{"train_loss": 0.0005883380654267967, "global_step": 48099, "epoch": 404, "lr": 2.436318759878432e-05} +{"train_loss": 0.0005361835355870426, "global_step": 48100, "epoch": 404, "lr": 2.4361285506628145e-05} +{"train_loss": 0.0011447620345279574, "global_step": 48101, "epoch": 404, "lr": 2.4359383464810864e-05} +{"train_loss": 0.0013218536041676998, "global_step": 48102, "epoch": 404, "lr": 2.435748147333617e-05} +{"train_loss": 0.0010389866074547172, "global_step": 48103, "epoch": 404, "lr": 2.4355579532207847e-05} +{"train_loss": 0.001024962984956801, "global_step": 48104, "epoch": 404, "lr": 2.4353677641429578e-05} +{"train_loss": 0.0016385216731578112, "global_step": 48105, "epoch": 404, "lr": 2.435177580100515e-05} +{"train_loss": 0.001036804635077715, "global_step": 48106, "epoch": 404, "lr": 2.4349874010938266e-05} +{"train_loss": 0.002159902360290289, "global_step": 48107, "epoch": 404, "lr": 2.4347972271232643e-05} +{"train_loss": 0.0011911230394616723, "global_step": 48108, "epoch": 404, "lr": 2.434607058189206e-05} +{"train_loss": 0.0008686127839609981, "global_step": 48109, "epoch": 404, "lr": 2.4344168942920203e-05} +{"train_loss": 0.0010711493669077754, "global_step": 48110, "epoch": 404, "lr": 2.4342267354320853e-05} +{"train_loss": 0.0009504021145403385, "global_step": 48111, "epoch": 404, "lr": 2.4340365816097694e-05} +{"train_loss": 0.0012519104639068246, "global_step": 48112, "epoch": 404, "lr": 2.4338464328254512e-05} +{"train_loss": 0.0008620813023298979, "global_step": 48113, "epoch": 404, "lr": 2.433656289079499e-05} +{"train_loss": 0.0009961915202438831, "global_step": 48114, "epoch": 404, "lr": 2.4334661503722907e-05} +{"train_loss": 0.0011394203174859285, "global_step": 48115, "epoch": 404, "lr": 2.433276016704195e-05} +{"train_loss": 0.001333273365162313, "global_step": 48116, "epoch": 404, "lr": 2.433085888075588e-05} +{"train_loss": 0.0014734008582308888, "global_step": 48117, "epoch": 404, "lr": 2.4328957644868446e-05} +{"train_loss": 0.0007376488065347075, "global_step": 48118, "epoch": 404, "lr": 2.432705645938336e-05} +{"train_loss": 0.0007460943306796253, "global_step": 48119, "epoch": 404, "lr": 2.4325155324304337e-05} +{"train_loss": 0.0010383896296843886, "global_step": 48120, "epoch": 404, "lr": 2.432325423963515e-05} +{"train_loss": 0.0008879347005859017, "global_step": 48121, "epoch": 404, "lr": 2.4321353205379488e-05} +{"train_loss": 0.0008418841171078384, "global_step": 48122, "epoch": 404, "lr": 2.4319452221541124e-05} +{"train_loss": 0.0015451220097020268, "global_step": 48123, "epoch": 404, "lr": 2.4317551288123775e-05} +{"train_loss": 0.0011770869605243206, "global_step": 48124, "epoch": 404, "lr": 2.431565040513115e-05} +{"train_loss": 0.0005689628887921572, "global_step": 48125, "epoch": 404, "lr": 2.431374957256702e-05} +{"train_loss": 0.0017547496827319264, "global_step": 48126, "epoch": 404, "lr": 2.4311848790435078e-05} +{"train_loss": 0.0006760807591490448, "global_step": 48127, "epoch": 404, "lr": 2.4309948058739096e-05} +{"train_loss": 0.0014355072053149343, "global_step": 48128, "epoch": 404, "lr": 2.4308047377482774e-05} +{"train_loss": 0.0012860022252425551, "global_step": 48129, "epoch": 404, "lr": 2.4306146746669867e-05} +{"train_loss": 0.0007748638745397329, "global_step": 48130, "epoch": 404, "lr": 2.43042461663041e-05} +{"train_loss": 0.0009142431663349271, "global_step": 48131, "epoch": 404, "lr": 2.4302345636389178e-05} +{"train_loss": 0.0005969344056211412, "global_step": 48132, "epoch": 404, "lr": 2.4300445156928874e-05} +{"train_loss": 0.0015778766246512532, "global_step": 48133, "epoch": 404, "lr": 2.4298544727926886e-05} +{"train_loss": 0.0009575272561050951, "global_step": 48134, "epoch": 404, "lr": 2.4296644349386977e-05} +{"train_loss": 0.0010534990578889847, "global_step": 48135, "epoch": 404, "lr": 2.4294744021312843e-05} +{"train_loss": 0.000677071395330131, "global_step": 48136, "epoch": 404, "lr": 2.429284374370825e-05} +{"train_loss": 0.0006100303726270795, "global_step": 48137, "epoch": 404, "lr": 2.429094351657691e-05} +{"train_loss": 0.0011125083547085524, "global_step": 48138, "epoch": 404, "lr": 2.428904333992254e-05} +{"train_loss": 0.0006273610633797944, "global_step": 48139, "epoch": 404, "lr": 2.4287143213748904e-05} +{"train_loss": 0.0005378592177294195, "global_step": 48140, "epoch": 404, "lr": 2.4285243138059693e-05} +{"train_loss": 0.0008216843707486987, "global_step": 48141, "epoch": 404, "lr": 2.4283343112858686e-05} +{"train_loss": 0.001451259246096015, "global_step": 48142, "epoch": 404, "lr": 2.428144313814956e-05} +{"train_loss": 0.0004675712843891233, "global_step": 48143, "epoch": 404, "lr": 2.4279543213936102e-05} +{"train_loss": 0.0009526953799650073, "global_step": 48144, "epoch": 404, "lr": 2.4277643340221985e-05} +{"train_loss": 0.0013331760419532657, "global_step": 48145, "epoch": 404, "lr": 2.427574351701099e-05} +{"train_loss": 0.0010163233382627368, "global_step": 48146, "epoch": 404, "lr": 2.4273843744306806e-05} +{"train_loss": 0.0016968389973044395, "global_step": 48147, "epoch": 404, "lr": 2.4271944022113195e-05} +{"train_loss": 0.0013932624133303761, "global_step": 48148, "epoch": 404, "lr": 2.427004435043386e-05} +{"train_loss": 0.0010991833405569196, "global_step": 48149, "epoch": 404, "lr": 2.426814472927256e-05} +{"train_loss": 0.0007925491081550717, "global_step": 48150, "epoch": 404, "lr": 2.4266245158632996e-05} +{"train_loss": 0.0009594758157618344, "global_step": 48151, "epoch": 404, "lr": 2.4264345638518925e-05} +{"train_loss": 0.0005176023114472628, "global_step": 48152, "epoch": 404, "lr": 2.4262446168934046e-05} +{"train_loss": 0.0005675125867128372, "global_step": 48153, "epoch": 404, "lr": 2.426054674988212e-05} +{"train_loss": 0.001850826432928443, "global_step": 48154, "epoch": 404, "lr": 2.425864738136684e-05} +{"train_loss": 0.0008370063733309507, "global_step": 48155, "epoch": 404, "lr": 2.4256748063391975e-05} +{"train_loss": 0.0005825675907544792, "global_step": 48156, "epoch": 404, "lr": 2.425484879596124e-05} +{"train_loss": 0.0006415524403564632, "global_step": 48157, "epoch": 404, "lr": 2.4252949579078333e-05} +{"train_loss": 0.0008649509400129318, "global_step": 48158, "epoch": 404, "lr": 2.4251050412747035e-05} +{"train_loss": 0.0011253682896494865, "global_step": 48159, "epoch": 404, "lr": 2.4249151296971023e-05} +{"train_loss": 0.0008343977970071137, "global_step": 48160, "epoch": 404, "lr": 2.4247252231754075e-05} +{"train_loss": 0.0008522268617525697, "global_step": 48161, "epoch": 404, "lr": 2.4245353217099892e-05} +{"train_loss": 0.0006789040053263307, "global_step": 48162, "epoch": 404, "lr": 2.4243454253012194e-05} +{"train_loss": 0.0014709780225530267, "global_step": 48163, "epoch": 404, "lr": 2.4241555339494738e-05} +{"train_loss": 0.0006155832088552415, "global_step": 48164, "epoch": 404, "lr": 2.4239656476551216e-05} +{"train_loss": 0.0017029459122568369, "global_step": 48165, "epoch": 404, "lr": 2.423775766418539e-05} +{"train_loss": 0.0007296589901670814, "global_step": 48166, "epoch": 404, "lr": 2.4235858902400965e-05} +{"train_loss": 0.0009563789353705943, "global_step": 48167, "epoch": 404, "lr": 2.4233960191201692e-05} +{"train_loss": 0.0019009282113984227, "global_step": 48168, "epoch": 404, "lr": 2.423206153059129e-05} +{"train_loss": 0.000684591825120151, "global_step": 48169, "epoch": 404, "lr": 2.4230162920573456e-05} +{"train_loss": 0.0008798312628641725, "global_step": 48170, "epoch": 404, "lr": 2.4228264361151963e-05} +{"train_loss": 0.0006137012969702482, "global_step": 48171, "epoch": 404, "lr": 2.4226365852330508e-05} +{"train_loss": 0.0008636500569991767, "global_step": 48172, "epoch": 404, "lr": 2.4224467394112848e-05} +{"train_loss": 0.0007287220214493573, "global_step": 48173, "epoch": 404, "lr": 2.4222568986502692e-05} +{"train_loss": 0.0008995272219181061, "global_step": 48174, "epoch": 404, "lr": 2.4220670629503744e-05} +{"train_loss": 0.0005359374335967004, "global_step": 48175, "epoch": 404, "lr": 2.4218772323119775e-05} +{"train_loss": 0.0008824162068776786, "global_step": 48176, "epoch": 404, "lr": 2.421687406735448e-05} +{"train_loss": 0.0017738534370437264, "global_step": 48177, "epoch": 404, "lr": 2.4214975862211614e-05} +{"train_loss": 0.0011254720157012343, "global_step": 48178, "epoch": 404, "lr": 2.4213077707694866e-05} +{"train_loss": 0.0007488100090995431, "global_step": 48179, "epoch": 404, "lr": 2.4211179603807987e-05} +{"train_loss": 0.0012110028183087707, "global_step": 48180, "epoch": 404, "lr": 2.420928155055472e-05} +{"train_loss": 0.0005334898014552891, "global_step": 48181, "epoch": 404, "lr": 2.4207383547938754e-05} +{"train_loss": 0.0013909434201195836, "global_step": 48182, "epoch": 404, "lr": 2.4205485595963857e-05} +{"train_loss": 0.0004727629420813173, "global_step": 48183, "epoch": 404, "lr": 2.4203587694633713e-05} +{"train_loss": 0.0010187445441260934, "global_step": 48184, "epoch": 404, "lr": 2.4201689843952084e-05} +{"train_loss": 0.0005032363114878535, "global_step": 48185, "epoch": 404, "lr": 2.419979204392267e-05} +{"train_loss": 0.0007566332933492959, "global_step": 48186, "epoch": 404, "lr": 2.4197894294549217e-05} +{"train_loss": 0.0006009959033690393, "global_step": 48187, "epoch": 404, "lr": 2.4195996595835453e-05} +{"train_loss": 0.0014445931883528829, "global_step": 48188, "epoch": 404, "lr": 2.4194098947785064e-05} +{"train_loss": 0.0013654647627845407, "global_step": 48189, "epoch": 404, "lr": 2.4192201350401828e-05} +{"train_loss": 0.0010188421001657844, "global_step": 48190, "epoch": 404, "lr": 2.419030380368943e-05} +{"train_loss": 0.0006397819379344583, "global_step": 48191, "epoch": 404, "lr": 2.418840630765163e-05} +{"train_loss": 0.0008462133700959384, "global_step": 48192, "epoch": 404, "lr": 2.4186508862292135e-05} +{"train_loss": 0.0010151745518669486, "global_step": 48193, "epoch": 404, "lr": 2.4184611467614654e-05} +{"train_loss": 0.001035675238191831, "global_step": 48194, "epoch": 404, "lr": 2.418271412362295e-05, "val_loss": 0.021721303462982178} +{"train_loss": 0.0008062665001489222, "global_step": 48195, "epoch": 405, "lr": 2.4180816830320714e-05} +{"train_loss": 0.0007141534588299692, "global_step": 48196, "epoch": 405, "lr": 2.4178919587711695e-05} +{"train_loss": 0.0005751277785748243, "global_step": 48197, "epoch": 405, "lr": 2.4177022395799597e-05} +{"train_loss": 0.0006466444465331733, "global_step": 48198, "epoch": 405, "lr": 2.4175125254588177e-05} +{"train_loss": 0.0016082179499790072, "global_step": 48199, "epoch": 405, "lr": 2.4173228164081135e-05} +{"train_loss": 0.0008812496671453118, "global_step": 48200, "epoch": 405, "lr": 2.417133112428218e-05} +{"train_loss": 0.001816421514376998, "global_step": 48201, "epoch": 405, "lr": 2.416943413519508e-05} +{"train_loss": 0.0005915178917348385, "global_step": 48202, "epoch": 405, "lr": 2.416753719682352e-05} +{"train_loss": 0.0008193362154997885, "global_step": 48203, "epoch": 405, "lr": 2.4165640309171255e-05} +{"train_loss": 0.0010936380131170154, "global_step": 48204, "epoch": 405, "lr": 2.4163743472241978e-05} +{"train_loss": 0.0006337384111247957, "global_step": 48205, "epoch": 405, "lr": 2.4161846686039447e-05} +{"train_loss": 0.0010550713632255793, "global_step": 48206, "epoch": 405, "lr": 2.4159949950567373e-05} +{"train_loss": 0.00130168697796762, "global_step": 48207, "epoch": 405, "lr": 2.4158053265829456e-05} +{"train_loss": 0.0009301576646976173, "global_step": 48208, "epoch": 405, "lr": 2.4156156631829462e-05} +{"train_loss": 0.0004922669613733888, "global_step": 48209, "epoch": 405, "lr": 2.415426004857107e-05} +{"train_loss": 0.0009717287612147629, "global_step": 48210, "epoch": 405, "lr": 2.4152363516058054e-05} +{"train_loss": 0.0007913622539490461, "global_step": 48211, "epoch": 405, "lr": 2.4150467034294082e-05} +{"train_loss": 0.0009234750177711248, "global_step": 48212, "epoch": 405, "lr": 2.4148570603282932e-05} +{"train_loss": 0.0016459062462672591, "global_step": 48213, "epoch": 405, "lr": 2.414667422302828e-05} +{"train_loss": 0.0012012380175292492, "global_step": 48214, "epoch": 405, "lr": 2.414477789353387e-05} +{"train_loss": 0.0006903065950609744, "global_step": 48215, "epoch": 405, "lr": 2.414288161480345e-05} +{"train_loss": 0.0006382821593433619, "global_step": 48216, "epoch": 405, "lr": 2.4140985386840696e-05} +{"train_loss": 0.000787709781434387, "global_step": 48217, "epoch": 405, "lr": 2.413908920964938e-05} +{"train_loss": 0.0008875725325196981, "global_step": 48218, "epoch": 405, "lr": 2.413719308323319e-05} +{"train_loss": 0.0009467258933000267, "global_step": 48219, "epoch": 405, "lr": 2.4135297007595847e-05} +{"train_loss": 0.0009180041961371899, "global_step": 48220, "epoch": 405, "lr": 2.4133400982741102e-05} +{"train_loss": 0.001484410371631384, "global_step": 48221, "epoch": 405, "lr": 2.413150500867264e-05} +{"train_loss": 0.0007479008636437356, "global_step": 48222, "epoch": 405, "lr": 2.412960908539422e-05} +{"train_loss": 0.0007533382158726454, "global_step": 48223, "epoch": 405, "lr": 2.4127713212909536e-05} +{"train_loss": 0.001303474185988307, "global_step": 48224, "epoch": 405, "lr": 2.4125817391222345e-05} +{"train_loss": 0.0007126877317205071, "global_step": 48225, "epoch": 405, "lr": 2.4123921620336338e-05} +{"train_loss": 0.0009322239784523845, "global_step": 48226, "epoch": 405, "lr": 2.4122025900255235e-05} +{"train_loss": 0.001635993947274983, "global_step": 48227, "epoch": 405, "lr": 2.4120130230982786e-05} +{"train_loss": 0.0007881683413870633, "global_step": 48228, "epoch": 405, "lr": 2.4118234612522672e-05} +{"train_loss": 0.0011313017457723618, "global_step": 48229, "epoch": 405, "lr": 2.4116339044878667e-05} +{"train_loss": 0.0007893444853834808, "global_step": 48230, "epoch": 405, "lr": 2.411444352805446e-05} +{"train_loss": 0.0007521061925217509, "global_step": 48231, "epoch": 405, "lr": 2.4112548062053757e-05} +{"train_loss": 0.000866080925334245, "global_step": 48232, "epoch": 405, "lr": 2.411065264688032e-05} +{"train_loss": 0.002030980307608843, "global_step": 48233, "epoch": 405, "lr": 2.4108757282537836e-05} +{"train_loss": 0.001086648553609848, "global_step": 48234, "epoch": 405, "lr": 2.410686196903006e-05} +{"train_loss": 0.0011294608702883124, "global_step": 48235, "epoch": 405, "lr": 2.410496670636067e-05} +{"train_loss": 0.0006930239032953978, "global_step": 48236, "epoch": 405, "lr": 2.4103071494533434e-05} +{"train_loss": 0.001396323787048459, "global_step": 48237, "epoch": 405, "lr": 2.410117633355205e-05} +{"train_loss": 0.000852189667057246, "global_step": 48238, "epoch": 405, "lr": 2.4099281223420223e-05} +{"train_loss": 0.0006127403466962278, "global_step": 48239, "epoch": 405, "lr": 2.4097386164141706e-05} +{"train_loss": 0.0009137484012171626, "global_step": 48240, "epoch": 405, "lr": 2.4095491155720186e-05} +{"train_loss": 0.0006987006054259837, "global_step": 48241, "epoch": 405, "lr": 2.409359619815942e-05} +{"train_loss": 0.0016743711894378066, "global_step": 48242, "epoch": 405, "lr": 2.4091701291463086e-05} +{"train_loss": 0.0009526263456791639, "global_step": 48243, "epoch": 405, "lr": 2.4089806435634954e-05} +{"train_loss": 0.0015991718973964453, "global_step": 48244, "epoch": 405, "lr": 2.40879116306787e-05} +{"train_loss": 0.0008873339393176138, "global_step": 48245, "epoch": 405, "lr": 2.4086016876598083e-05} +{"train_loss": 0.000783325347583741, "global_step": 48246, "epoch": 405, "lr": 2.4084122173396778e-05} +{"train_loss": 0.0008674088167026639, "global_step": 48247, "epoch": 405, "lr": 2.4082227521078554e-05} +{"train_loss": 0.0012513173278421164, "global_step": 48248, "epoch": 405, "lr": 2.408033291964709e-05} +{"train_loss": 0.0014544854639098048, "global_step": 48249, "epoch": 405, "lr": 2.4078438369106144e-05} +{"train_loss": 0.0006215148023329675, "global_step": 48250, "epoch": 405, "lr": 2.4076543869459388e-05} +{"train_loss": 0.0004127350985072553, "global_step": 48251, "epoch": 405, "lr": 2.4074649420710595e-05} +{"train_loss": 0.0006245612166821957, "global_step": 48252, "epoch": 405, "lr": 2.4072755022863436e-05} +{"train_loss": 0.001340832095593214, "global_step": 48253, "epoch": 405, "lr": 2.407086067592167e-05} +{"train_loss": 0.0009078108705580235, "global_step": 48254, "epoch": 405, "lr": 2.406896637988898e-05} +{"train_loss": 0.000676055031362921, "global_step": 48255, "epoch": 405, "lr": 2.4067072134769124e-05} +{"train_loss": 0.0007371055544354022, "global_step": 48256, "epoch": 405, "lr": 2.4065177940565803e-05} +{"train_loss": 0.0008114937227219343, "global_step": 48257, "epoch": 405, "lr": 2.4063283797282715e-05} +{"train_loss": 0.0010417664889246225, "global_step": 48258, "epoch": 405, "lr": 2.4061389704923614e-05} +{"train_loss": 0.00044891380821354687, "global_step": 48259, "epoch": 405, "lr": 2.405949566349219e-05} +{"train_loss": 0.001305280369706452, "global_step": 48260, "epoch": 405, "lr": 2.405760167299219e-05} +{"train_loss": 0.001084908377379179, "global_step": 48261, "epoch": 405, "lr": 2.405570773342732e-05} +{"train_loss": 0.0007825045031495392, "global_step": 48262, "epoch": 405, "lr": 2.4053813844801275e-05} +{"train_loss": 0.0010363142937421799, "global_step": 48263, "epoch": 405, "lr": 2.405192000711781e-05} +{"train_loss": 0.0011544395238161087, "global_step": 48264, "epoch": 405, "lr": 2.405002622038062e-05} +{"train_loss": 0.0007630468462593853, "global_step": 48265, "epoch": 405, "lr": 2.404813248459344e-05} +{"train_loss": 0.0013049698900431395, "global_step": 48266, "epoch": 405, "lr": 2.404623879975996e-05} +{"train_loss": 0.0010706763714551926, "global_step": 48267, "epoch": 405, "lr": 2.404434516588394e-05} +{"train_loss": 0.0009402200812473893, "global_step": 48268, "epoch": 405, "lr": 2.404245158296908e-05} +{"train_loss": 0.0007544556283392012, "global_step": 48269, "epoch": 405, "lr": 2.4040558051019068e-05} +{"train_loss": 0.0013115270994603634, "global_step": 48270, "epoch": 405, "lr": 2.403866457003767e-05} +{"train_loss": 0.0007027185638435185, "global_step": 48271, "epoch": 405, "lr": 2.4036771140028557e-05} +{"train_loss": 0.0014470380265265703, "global_step": 48272, "epoch": 405, "lr": 2.403487776099549e-05} +{"train_loss": 0.0007209049072116613, "global_step": 48273, "epoch": 405, "lr": 2.4032984432942146e-05} +{"train_loss": 0.0014087938470765948, "global_step": 48274, "epoch": 405, "lr": 2.4031091155872287e-05} +{"train_loss": 0.0008593458915129304, "global_step": 48275, "epoch": 405, "lr": 2.4029197929789583e-05} +{"train_loss": 0.001419262494891882, "global_step": 48276, "epoch": 405, "lr": 2.4027304754697795e-05} +{"train_loss": 0.0009449447388760746, "global_step": 48277, "epoch": 405, "lr": 2.4025411630600602e-05} +{"train_loss": 0.0005568019114434719, "global_step": 48278, "epoch": 405, "lr": 2.4023518557501755e-05} +{"train_loss": 0.0007100565126165748, "global_step": 48279, "epoch": 405, "lr": 2.4021625535404934e-05} +{"train_loss": 0.0007969085709191859, "global_step": 48280, "epoch": 405, "lr": 2.4019732564313896e-05} +{"train_loss": 0.0009244741522707045, "global_step": 48281, "epoch": 405, "lr": 2.401783964423232e-05} +{"train_loss": 0.0009571430273354053, "global_step": 48282, "epoch": 405, "lr": 2.401594677516396e-05} +{"train_loss": 0.0007213813369162381, "global_step": 48283, "epoch": 405, "lr": 2.401405395711249e-05} +{"train_loss": 0.0007071025320328772, "global_step": 48284, "epoch": 405, "lr": 2.401216119008167e-05} +{"train_loss": 0.0005093241925351322, "global_step": 48285, "epoch": 405, "lr": 2.4010268474075178e-05} +{"train_loss": 0.0005231759278103709, "global_step": 48286, "epoch": 405, "lr": 2.400837580909676e-05} +{"train_loss": 0.0012074646074324846, "global_step": 48287, "epoch": 405, "lr": 2.4006483195150124e-05} +{"train_loss": 0.0011202309979125857, "global_step": 48288, "epoch": 405, "lr": 2.400459063223896e-05} +{"train_loss": 0.0011443940456956625, "global_step": 48289, "epoch": 405, "lr": 2.400269812036703e-05} +{"train_loss": 0.001338298781774938, "global_step": 48290, "epoch": 405, "lr": 2.4000805659538e-05} +{"train_loss": 0.000587714952416718, "global_step": 48291, "epoch": 405, "lr": 2.3998913249755627e-05} +{"train_loss": 0.00074121227953583, "global_step": 48292, "epoch": 405, "lr": 2.399702089102362e-05} +{"train_loss": 0.0007396434084512293, "global_step": 48293, "epoch": 405, "lr": 2.3995128583345655e-05} +{"train_loss": 0.0019340832950547338, "global_step": 48294, "epoch": 405, "lr": 2.3993236326725498e-05} +{"train_loss": 0.0009410027996636927, "global_step": 48295, "epoch": 405, "lr": 2.3991344121166832e-05} +{"train_loss": 0.0006987362285144627, "global_step": 48296, "epoch": 405, "lr": 2.3989451966673394e-05} +{"train_loss": 0.00047000651829876006, "global_step": 48297, "epoch": 405, "lr": 2.398755986324887e-05} +{"train_loss": 0.0006214636377990246, "global_step": 48298, "epoch": 405, "lr": 2.3985667810897017e-05} +{"train_loss": 0.0006540563772432506, "global_step": 48299, "epoch": 405, "lr": 2.3983775809621522e-05} +{"train_loss": 0.000983875128440559, "global_step": 48300, "epoch": 405, "lr": 2.3981883859426085e-05} +{"train_loss": 0.0011286120861768723, "global_step": 48301, "epoch": 405, "lr": 2.397999196031446e-05} +{"train_loss": 0.0010822783224284649, "global_step": 48302, "epoch": 405, "lr": 2.3978100112290318e-05} +{"train_loss": 0.0009964685887098312, "global_step": 48303, "epoch": 405, "lr": 2.3976208315357418e-05} +{"train_loss": 0.0005833089235238731, "global_step": 48304, "epoch": 405, "lr": 2.3974316569519433e-05} +{"train_loss": 0.0014527760213240981, "global_step": 48305, "epoch": 405, "lr": 2.397242487478012e-05} +{"train_loss": 0.0006556513253599405, "global_step": 48306, "epoch": 405, "lr": 2.3970533231143166e-05} +{"train_loss": 0.0009343040292151272, "global_step": 48307, "epoch": 405, "lr": 2.3968641638612273e-05} +{"train_loss": 0.0007723195012658834, "global_step": 48308, "epoch": 405, "lr": 2.396675009719119e-05} +{"train_loss": 0.0006757472874596715, "global_step": 48309, "epoch": 405, "lr": 2.396485860688359e-05} +{"train_loss": 0.0013308136258274317, "global_step": 48310, "epoch": 405, "lr": 2.3962967167693212e-05} +{"train_loss": 0.0012416810495778918, "global_step": 48311, "epoch": 405, "lr": 2.3961075779623783e-05} +{"train_loss": 0.000752126972656697, "global_step": 48312, "epoch": 405, "lr": 2.3959184442678977e-05} +{"train_loss": 0.0009549289634607795, "global_step": 48313, "epoch": 405, "lr": 2.3957293156862553e-05, "val_loss": 0.02137674205005169, "train_action_mse_error": 1.2651261386054102e-05} +{"train_loss": 0.001521450001746416, "global_step": 48314, "epoch": 406, "lr": 2.395540192217819e-05} +{"train_loss": 0.0011733472347259521, "global_step": 48315, "epoch": 406, "lr": 2.395351073862962e-05} +{"train_loss": 0.0004115591000299901, "global_step": 48316, "epoch": 406, "lr": 2.3951619606220537e-05} +{"train_loss": 0.0011045014252886176, "global_step": 48317, "epoch": 406, "lr": 2.3949728524954685e-05} +{"train_loss": 0.0008544399170204997, "global_step": 48318, "epoch": 406, "lr": 2.3947837494835756e-05} +{"train_loss": 0.0018523299368098378, "global_step": 48319, "epoch": 406, "lr": 2.3945946515867446e-05} +{"train_loss": 0.00065179931698367, "global_step": 48320, "epoch": 406, "lr": 2.3944055588053505e-05} +{"train_loss": 0.0010293202940374613, "global_step": 48321, "epoch": 406, "lr": 2.3942164711397606e-05} +{"train_loss": 0.0016475921729579568, "global_step": 48322, "epoch": 406, "lr": 2.3940273885903507e-05} +{"train_loss": 0.0009791224729269743, "global_step": 48323, "epoch": 406, "lr": 2.3938383111574874e-05} +{"train_loss": 0.000602641433943063, "global_step": 48324, "epoch": 406, "lr": 2.393649238841546e-05} +{"train_loss": 0.0007190920296125114, "global_step": 48325, "epoch": 406, "lr": 2.3934601716428963e-05} +{"train_loss": 0.0018890221836045384, "global_step": 48326, "epoch": 406, "lr": 2.3932711095619065e-05} +{"train_loss": 0.0007201106054708362, "global_step": 48327, "epoch": 406, "lr": 2.393082052598953e-05} +{"train_loss": 0.0010160432429984212, "global_step": 48328, "epoch": 406, "lr": 2.392893000754402e-05} +{"train_loss": 0.0006126039079390466, "global_step": 48329, "epoch": 406, "lr": 2.3927039540286287e-05} +{"train_loss": 0.0008546601166017354, "global_step": 48330, "epoch": 406, "lr": 2.392514912422003e-05} +{"train_loss": 0.0011117213871330023, "global_step": 48331, "epoch": 406, "lr": 2.3923258759348944e-05} +{"train_loss": 0.0010194155620411038, "global_step": 48332, "epoch": 406, "lr": 2.3921368445676763e-05} +{"train_loss": 0.0010781139135360718, "global_step": 48333, "epoch": 406, "lr": 2.3919478183207172e-05} +{"train_loss": 0.0005001925746910274, "global_step": 48334, "epoch": 406, "lr": 2.391758797194392e-05} +{"train_loss": 0.0007856186712160707, "global_step": 48335, "epoch": 406, "lr": 2.391569781189068e-05} +{"train_loss": 0.0009067418286576867, "global_step": 48336, "epoch": 406, "lr": 2.39138077030512e-05} +{"train_loss": 0.0007576059433631599, "global_step": 48337, "epoch": 406, "lr": 2.3911917645429172e-05} +{"train_loss": 0.0019020724575966597, "global_step": 48338, "epoch": 406, "lr": 2.3910027639028283e-05} +{"train_loss": 0.0009603711077943444, "global_step": 48339, "epoch": 406, "lr": 2.3908137683852287e-05} +{"train_loss": 0.0020564596634358168, "global_step": 48340, "epoch": 406, "lr": 2.390624777990486e-05} +{"train_loss": 0.0008998127887025476, "global_step": 48341, "epoch": 406, "lr": 2.3904357927189745e-05} +{"train_loss": 0.0012536880094558, "global_step": 48342, "epoch": 406, "lr": 2.3902468125710615e-05} +{"train_loss": 0.0010698104742914438, "global_step": 48343, "epoch": 406, "lr": 2.3900578375471223e-05} +{"train_loss": 0.0011017053620889783, "global_step": 48344, "epoch": 406, "lr": 2.3898688676475232e-05} +{"train_loss": 0.0011301739141345024, "global_step": 48345, "epoch": 406, "lr": 2.3896799028726386e-05} +{"train_loss": 0.0011269710958003998, "global_step": 48346, "epoch": 406, "lr": 2.3894909432228402e-05} +{"train_loss": 0.0007500083884224296, "global_step": 48347, "epoch": 406, "lr": 2.3893019886984952e-05} +{"train_loss": 0.0007684627780690789, "global_step": 48348, "epoch": 406, "lr": 2.389113039299979e-05} +{"train_loss": 0.0009393749642185867, "global_step": 48349, "epoch": 406, "lr": 2.3889240950276605e-05} +{"train_loss": 0.0010569714941084385, "global_step": 48350, "epoch": 406, "lr": 2.388735155881908e-05} +{"train_loss": 0.0008852998726069927, "global_step": 48351, "epoch": 406, "lr": 2.3885462218630977e-05} +{"train_loss": 0.000772730796597898, "global_step": 48352, "epoch": 406, "lr": 2.388357292971596e-05} +{"train_loss": 0.0009782519191503525, "global_step": 48353, "epoch": 406, "lr": 2.3881683692077772e-05} +{"train_loss": 0.001127399387769401, "global_step": 48354, "epoch": 406, "lr": 2.3879794505720094e-05} +{"train_loss": 0.0012921225279569626, "global_step": 48355, "epoch": 406, "lr": 2.3877905370646663e-05} +{"train_loss": 0.0009911188390105963, "global_step": 48356, "epoch": 406, "lr": 2.3876016286861176e-05} +{"train_loss": 0.0012097981525585055, "global_step": 48357, "epoch": 406, "lr": 2.3874127254367324e-05} +{"train_loss": 0.0011787888361141086, "global_step": 48358, "epoch": 406, "lr": 2.3872238273168846e-05} +{"train_loss": 0.000450901803560555, "global_step": 48359, "epoch": 406, "lr": 2.387034934326942e-05} +{"train_loss": 0.0016503434162586927, "global_step": 48360, "epoch": 406, "lr": 2.3868460464672792e-05} +{"train_loss": 0.0007155899656936526, "global_step": 48361, "epoch": 406, "lr": 2.3866571637382647e-05} +{"train_loss": 0.0005656589055433869, "global_step": 48362, "epoch": 406, "lr": 2.386468286140268e-05} +{"train_loss": 0.0007483705412596464, "global_step": 48363, "epoch": 406, "lr": 2.3862794136736632e-05} +{"train_loss": 0.0012867576442658901, "global_step": 48364, "epoch": 406, "lr": 2.3860905463388182e-05} +{"train_loss": 0.0014811980072408915, "global_step": 48365, "epoch": 406, "lr": 2.3859016841361066e-05} +{"train_loss": 0.0007881178171373904, "global_step": 48366, "epoch": 406, "lr": 2.3857128270658962e-05} +{"train_loss": 0.00116146809887141, "global_step": 48367, "epoch": 406, "lr": 2.3855239751285608e-05} +{"train_loss": 0.0012024708557873964, "global_step": 48368, "epoch": 406, "lr": 2.38533512832447e-05} +{"train_loss": 0.0010861600749194622, "global_step": 48369, "epoch": 406, "lr": 2.3851462866539926e-05} +{"train_loss": 0.0017079288372769952, "global_step": 48370, "epoch": 406, "lr": 2.384957450117503e-05} +{"train_loss": 0.0016970306169241667, "global_step": 48371, "epoch": 406, "lr": 2.384768618715368e-05} +{"train_loss": 0.0009550068061798811, "global_step": 48372, "epoch": 406, "lr": 2.3845797924479622e-05} +{"train_loss": 0.0009352266788482666, "global_step": 48373, "epoch": 406, "lr": 2.3843909713156532e-05} +{"train_loss": 0.0013093124143779278, "global_step": 48374, "epoch": 406, "lr": 2.384202155318814e-05} +{"train_loss": 0.000978608150035143, "global_step": 48375, "epoch": 406, "lr": 2.3840133444578133e-05} +{"train_loss": 0.0013714295346289873, "global_step": 48376, "epoch": 406, "lr": 2.3838245387330248e-05} +{"train_loss": 0.00100510916672647, "global_step": 48377, "epoch": 406, "lr": 2.3836357381448155e-05} +{"train_loss": 0.0013079473283141851, "global_step": 48378, "epoch": 406, "lr": 2.3834469426935595e-05} +{"train_loss": 0.0008425142150372267, "global_step": 48379, "epoch": 406, "lr": 2.3832581523796238e-05} +{"train_loss": 0.00038109428714960814, "global_step": 48380, "epoch": 406, "lr": 2.3830693672033832e-05} +{"train_loss": 0.0009431240614503622, "global_step": 48381, "epoch": 406, "lr": 2.382880587165205e-05} +{"train_loss": 0.0014305730583146214, "global_step": 48382, "epoch": 406, "lr": 2.3826918122654623e-05} +{"train_loss": 0.00065685308072716, "global_step": 48383, "epoch": 406, "lr": 2.382503042504523e-05} +{"train_loss": 0.0011622700840234756, "global_step": 48384, "epoch": 406, "lr": 2.382314277882762e-05} +{"train_loss": 0.0009409001795575023, "global_step": 48385, "epoch": 406, "lr": 2.382125518400544e-05} +{"train_loss": 0.0007880821358412504, "global_step": 48386, "epoch": 406, "lr": 2.3819367640582457e-05} +{"train_loss": 0.000883915345184505, "global_step": 48387, "epoch": 406, "lr": 2.3817480148562344e-05} +{"train_loss": 0.0006570901605300605, "global_step": 48388, "epoch": 406, "lr": 2.3815592707948793e-05} +{"train_loss": 0.0005118487169966102, "global_step": 48389, "epoch": 406, "lr": 2.3813705318745548e-05} +{"train_loss": 0.0010884411167353392, "global_step": 48390, "epoch": 406, "lr": 2.381181798095628e-05} +{"train_loss": 0.0010813995031639934, "global_step": 48391, "epoch": 406, "lr": 2.3809930694584726e-05} +{"train_loss": 0.0013262914726510644, "global_step": 48392, "epoch": 406, "lr": 2.3808043459634556e-05} +{"train_loss": 0.001377374050207436, "global_step": 48393, "epoch": 406, "lr": 2.380615627610951e-05} +{"train_loss": 0.0006671037408523262, "global_step": 48394, "epoch": 406, "lr": 2.380426914401328e-05} +{"train_loss": 0.0008968344191089272, "global_step": 48395, "epoch": 406, "lr": 2.380238206334955e-05} +{"train_loss": 0.0006820952985435724, "global_step": 48396, "epoch": 406, "lr": 2.380049503412206e-05} +{"train_loss": 0.0007717133848927915, "global_step": 48397, "epoch": 406, "lr": 2.3798608056334486e-05} +{"train_loss": 0.0010709615889936686, "global_step": 48398, "epoch": 406, "lr": 2.379672112999056e-05} +{"train_loss": 0.00137520139105618, "global_step": 48399, "epoch": 406, "lr": 2.3794834255093978e-05} +{"train_loss": 0.0014074151404201984, "global_step": 48400, "epoch": 406, "lr": 2.3792947431648416e-05} +{"train_loss": 0.0010318788699805737, "global_step": 48401, "epoch": 406, "lr": 2.379106065965762e-05} +{"train_loss": 0.0008235270506702363, "global_step": 48402, "epoch": 406, "lr": 2.3789173939125265e-05} +{"train_loss": 0.000571640906855464, "global_step": 48403, "epoch": 406, "lr": 2.3787287270055076e-05} +{"train_loss": 0.0008265638607554138, "global_step": 48404, "epoch": 406, "lr": 2.3785400652450734e-05} +{"train_loss": 0.001281693927012384, "global_step": 48405, "epoch": 406, "lr": 2.3783514086315976e-05} +{"train_loss": 0.0006052490207366645, "global_step": 48406, "epoch": 406, "lr": 2.3781627571654486e-05} +{"train_loss": 0.0016591610619798303, "global_step": 48407, "epoch": 406, "lr": 2.377974110846995e-05} +{"train_loss": 0.0013866354711353779, "global_step": 48408, "epoch": 406, "lr": 2.3777854696766093e-05} +{"train_loss": 0.0014100096886977553, "global_step": 48409, "epoch": 406, "lr": 2.3775968336546634e-05} +{"train_loss": 0.0012457153061404824, "global_step": 48410, "epoch": 406, "lr": 2.377408202781524e-05} +{"train_loss": 0.0014115560334175825, "global_step": 48411, "epoch": 406, "lr": 2.3772195770575656e-05} +{"train_loss": 0.0009778481908142567, "global_step": 48412, "epoch": 406, "lr": 2.3770309564831544e-05} +{"train_loss": 0.0005571970250457525, "global_step": 48413, "epoch": 406, "lr": 2.376842341058664e-05} +{"train_loss": 0.0010106355184689164, "global_step": 48414, "epoch": 406, "lr": 2.3766537307844626e-05} +{"train_loss": 0.0014945643488317728, "global_step": 48415, "epoch": 406, "lr": 2.3764651256609227e-05} +{"train_loss": 0.0006035112892277539, "global_step": 48416, "epoch": 406, "lr": 2.3762765256884113e-05} +{"train_loss": 0.0005595576367340982, "global_step": 48417, "epoch": 406, "lr": 2.3760879308673023e-05} +{"train_loss": 0.0006146441446617246, "global_step": 48418, "epoch": 406, "lr": 2.3758993411979646e-05} +{"train_loss": 0.0007488679839298129, "global_step": 48419, "epoch": 406, "lr": 2.3757107566807664e-05} +{"train_loss": 0.0015876558609306812, "global_step": 48420, "epoch": 406, "lr": 2.375522177316082e-05} +{"train_loss": 0.0008663392509333789, "global_step": 48421, "epoch": 406, "lr": 2.3753336031042765e-05} +{"train_loss": 0.000636194134131074, "global_step": 48422, "epoch": 406, "lr": 2.375145034045726e-05} +{"train_loss": 0.0009334752103313804, "global_step": 48423, "epoch": 406, "lr": 2.374956470140795e-05} +{"train_loss": 0.0013662801356986165, "global_step": 48424, "epoch": 406, "lr": 2.374767911389859e-05} +{"train_loss": 0.0010948153212666512, "global_step": 48425, "epoch": 406, "lr": 2.3745793577932856e-05} +{"train_loss": 0.0007303092861548066, "global_step": 48426, "epoch": 406, "lr": 2.3743908093514433e-05} +{"train_loss": 0.0010633973870426416, "global_step": 48427, "epoch": 406, "lr": 2.3742022660647055e-05} +{"train_loss": 0.0005192344542592764, "global_step": 48428, "epoch": 406, "lr": 2.37401372793344e-05} +{"train_loss": 0.001833977410569787, "global_step": 48429, "epoch": 406, "lr": 2.3738251949580192e-05} +{"train_loss": 0.0008799356874078512, "global_step": 48430, "epoch": 406, "lr": 2.373636667138813e-05} +{"train_loss": 0.0005658945883624256, "global_step": 48431, "epoch": 406, "lr": 2.373448144476188e-05} +{"train_loss": 0.001026697939373318, "global_step": 48432, "epoch": 406, "lr": 2.3732596269705187e-05, "val_loss": 0.013327976688742638} +{"train_loss": 0.0015810843324288726, "global_step": 48433, "epoch": 407, "lr": 2.373071114622172e-05} +{"train_loss": 0.0004370007663965225, "global_step": 48434, "epoch": 407, "lr": 2.3728826074315215e-05} +{"train_loss": 0.0007147029391489923, "global_step": 48435, "epoch": 407, "lr": 2.3726941053989328e-05} +{"train_loss": 0.0011993887601420283, "global_step": 48436, "epoch": 407, "lr": 2.372505608524781e-05} +{"train_loss": 0.001048050238750875, "global_step": 48437, "epoch": 407, "lr": 2.3723171168094333e-05} +{"train_loss": 0.0009050738299265504, "global_step": 48438, "epoch": 407, "lr": 2.3721286302532587e-05} +{"train_loss": 0.0012021384900435805, "global_step": 48439, "epoch": 407, "lr": 2.3719401488566305e-05} +{"train_loss": 0.0018983861664310098, "global_step": 48440, "epoch": 407, "lr": 2.3717516726199152e-05} +{"train_loss": 0.0008016180945560336, "global_step": 48441, "epoch": 407, "lr": 2.371563201543487e-05} +{"train_loss": 0.0010211672633886337, "global_step": 48442, "epoch": 407, "lr": 2.371374735627711e-05} +{"train_loss": 0.0009642102522775531, "global_step": 48443, "epoch": 407, "lr": 2.3711862748729602e-05} +{"train_loss": 0.0009086339850910008, "global_step": 48444, "epoch": 407, "lr": 2.3709978192796067e-05} +{"train_loss": 0.0007754503167234361, "global_step": 48445, "epoch": 407, "lr": 2.3708093688480155e-05} +{"train_loss": 0.002067224821075797, "global_step": 48446, "epoch": 407, "lr": 2.3706209235785615e-05} +{"train_loss": 0.0010075990576297045, "global_step": 48447, "epoch": 407, "lr": 2.37043248347161e-05} +{"train_loss": 0.0005864924169145525, "global_step": 48448, "epoch": 407, "lr": 2.370244048527536e-05} +{"train_loss": 0.0008794496534392238, "global_step": 48449, "epoch": 407, "lr": 2.3700556187467064e-05} +{"train_loss": 0.00114451942499727, "global_step": 48450, "epoch": 407, "lr": 2.36986719412949e-05} +{"train_loss": 0.000755380024202168, "global_step": 48451, "epoch": 407, "lr": 2.36967877467626e-05} +{"train_loss": 0.00045001960825175047, "global_step": 48452, "epoch": 407, "lr": 2.369490360387383e-05} +{"train_loss": 0.0010447045788168907, "global_step": 48453, "epoch": 407, "lr": 2.3693019512632326e-05} +{"train_loss": 0.0009958611335605383, "global_step": 48454, "epoch": 407, "lr": 2.3691135473041748e-05} +{"train_loss": 0.0009619603515602648, "global_step": 48455, "epoch": 407, "lr": 2.3689251485105835e-05} +{"train_loss": 0.000693617039360106, "global_step": 48456, "epoch": 407, "lr": 2.3687367548828265e-05} +{"train_loss": 0.0009188773692585528, "global_step": 48457, "epoch": 407, "lr": 2.3685483664212716e-05} +{"train_loss": 0.0009790671756491065, "global_step": 48458, "epoch": 407, "lr": 2.368359983126293e-05} +{"train_loss": 0.0014073000056669116, "global_step": 48459, "epoch": 407, "lr": 2.3681716049982565e-05} +{"train_loss": 0.0005133522790856659, "global_step": 48460, "epoch": 407, "lr": 2.3679832320375363e-05} +{"train_loss": 0.0008776073809713125, "global_step": 48461, "epoch": 407, "lr": 2.367794864244497e-05} +{"train_loss": 0.0009750278550200164, "global_step": 48462, "epoch": 407, "lr": 2.3676065016195137e-05} +{"train_loss": 0.000590847572311759, "global_step": 48463, "epoch": 407, "lr": 2.3674181441629534e-05} +{"train_loss": 0.0011406209086999297, "global_step": 48464, "epoch": 407, "lr": 2.3672297918751852e-05} +{"train_loss": 0.0010381632018834352, "global_step": 48465, "epoch": 407, "lr": 2.3670414447565814e-05} +{"train_loss": 0.001221485435962677, "global_step": 48466, "epoch": 407, "lr": 2.3668531028075087e-05} +{"train_loss": 0.0007927202386781573, "global_step": 48467, "epoch": 407, "lr": 2.3666647660283402e-05} +{"train_loss": 0.0014544681180268526, "global_step": 48468, "epoch": 407, "lr": 2.366476434419444e-05} +{"train_loss": 0.0009277864010073245, "global_step": 48469, "epoch": 407, "lr": 2.3662881079811888e-05} +{"train_loss": 0.0011899200035259128, "global_step": 48470, "epoch": 407, "lr": 2.3660997867139467e-05} +{"train_loss": 0.0009083148906938732, "global_step": 48471, "epoch": 407, "lr": 2.3659114706180845e-05} +{"train_loss": 0.0015247842529788613, "global_step": 48472, "epoch": 407, "lr": 2.365723159693976e-05} +{"train_loss": 0.0007759861182421446, "global_step": 48473, "epoch": 407, "lr": 2.3655348539419863e-05} +{"train_loss": 0.0015408038161695004, "global_step": 48474, "epoch": 407, "lr": 2.3653465533624896e-05} +{"train_loss": 0.0011960746487602592, "global_step": 48475, "epoch": 407, "lr": 2.365158257955852e-05} +{"train_loss": 0.0011822028318420053, "global_step": 48476, "epoch": 407, "lr": 2.3649699677224463e-05} +{"train_loss": 0.0011275768047198653, "global_step": 48477, "epoch": 407, "lr": 2.3647816826626383e-05} +{"train_loss": 0.0009746527066454291, "global_step": 48478, "epoch": 407, "lr": 2.3645934027768003e-05} +{"train_loss": 0.0008600295404903591, "global_step": 48479, "epoch": 407, "lr": 2.3644051280653036e-05} +{"train_loss": 0.0004582699039019644, "global_step": 48480, "epoch": 407, "lr": 2.364216858528515e-05} +{"train_loss": 0.0010610789759084582, "global_step": 48481, "epoch": 407, "lr": 2.364028594166804e-05} +{"train_loss": 0.0012993920827284455, "global_step": 48482, "epoch": 407, "lr": 2.3638403349805426e-05} +{"train_loss": 0.0015088203363120556, "global_step": 48483, "epoch": 407, "lr": 2.3636520809700974e-05} +{"train_loss": 0.0014061803231015801, "global_step": 48484, "epoch": 407, "lr": 2.3634638321358415e-05} +{"train_loss": 0.001010129926726222, "global_step": 48485, "epoch": 407, "lr": 2.363275588478141e-05} +{"train_loss": 0.0014948182506486773, "global_step": 48486, "epoch": 407, "lr": 2.3630873499973693e-05} +{"train_loss": 0.0021580045577138662, "global_step": 48487, "epoch": 407, "lr": 2.3628991166938934e-05} +{"train_loss": 0.0011266922811046243, "global_step": 48488, "epoch": 407, "lr": 2.3627108885680816e-05} +{"train_loss": 0.0011778147891163826, "global_step": 48489, "epoch": 407, "lr": 2.362522665620307e-05} +{"train_loss": 0.0010017342865467072, "global_step": 48490, "epoch": 407, "lr": 2.3623344478509358e-05} +{"train_loss": 0.001005028490908444, "global_step": 48491, "epoch": 407, "lr": 2.3621462352603407e-05} +{"train_loss": 0.0012477762065827847, "global_step": 48492, "epoch": 407, "lr": 2.361958027848888e-05} +{"train_loss": 0.0017571947537362576, "global_step": 48493, "epoch": 407, "lr": 2.3617698256169506e-05} +{"train_loss": 0.0013517428888007998, "global_step": 48494, "epoch": 407, "lr": 2.361581628564897e-05} +{"train_loss": 0.001073228195309639, "global_step": 48495, "epoch": 407, "lr": 2.361393436693093e-05} +{"train_loss": 0.0012694424949586391, "global_step": 48496, "epoch": 407, "lr": 2.3612052500019133e-05} +{"train_loss": 0.0019481825875118375, "global_step": 48497, "epoch": 407, "lr": 2.361017068491724e-05} +{"train_loss": 0.0013720437418669462, "global_step": 48498, "epoch": 407, "lr": 2.3608288921628967e-05} +{"train_loss": 0.0013428275706246495, "global_step": 48499, "epoch": 407, "lr": 2.3606407210158006e-05} +{"train_loss": 0.0011542362626641989, "global_step": 48500, "epoch": 407, "lr": 2.3604525550508016e-05} +{"train_loss": 0.000775318534579128, "global_step": 48501, "epoch": 407, "lr": 2.360264394268275e-05} +{"train_loss": 0.0013876012526452541, "global_step": 48502, "epoch": 407, "lr": 2.360076238668585e-05} +{"train_loss": 0.001251920941285789, "global_step": 48503, "epoch": 407, "lr": 2.359888088252105e-05} +{"train_loss": 0.0013266371097415686, "global_step": 48504, "epoch": 407, "lr": 2.3596999430192007e-05} +{"train_loss": 0.0008739193435758352, "global_step": 48505, "epoch": 407, "lr": 2.3595118029702457e-05} +{"train_loss": 0.001409892807714641, "global_step": 48506, "epoch": 407, "lr": 2.3593236681056053e-05} +{"train_loss": 0.0008520213887095451, "global_step": 48507, "epoch": 407, "lr": 2.3591355384256526e-05} +{"train_loss": 0.001869875704869628, "global_step": 48508, "epoch": 407, "lr": 2.358947413930753e-05} +{"train_loss": 0.0010652225464582443, "global_step": 48509, "epoch": 407, "lr": 2.35875929462128e-05} +{"train_loss": 0.0006600522319786251, "global_step": 48510, "epoch": 407, "lr": 2.358571180497599e-05} +{"train_loss": 0.0006521186442114413, "global_step": 48511, "epoch": 407, "lr": 2.3583830715600835e-05} +{"train_loss": 0.0021102253813296556, "global_step": 48512, "epoch": 407, "lr": 2.3581949678090982e-05} +{"train_loss": 0.0008221757016144693, "global_step": 48513, "epoch": 407, "lr": 2.3580068692450174e-05} +{"train_loss": 0.0010583073599264026, "global_step": 48514, "epoch": 407, "lr": 2.3578187758682053e-05} +{"train_loss": 0.001261481549590826, "global_step": 48515, "epoch": 407, "lr": 2.357630687679036e-05} +{"train_loss": 0.0005502953426912427, "global_step": 48516, "epoch": 407, "lr": 2.3574426046778747e-05} +{"train_loss": 0.0013170860474929214, "global_step": 48517, "epoch": 407, "lr": 2.357254526865094e-05} +{"train_loss": 0.001499651581980288, "global_step": 48518, "epoch": 407, "lr": 2.3570664542410625e-05} +{"train_loss": 0.001081235008314252, "global_step": 48519, "epoch": 407, "lr": 2.3568783868061462e-05} +{"train_loss": 0.001075098174624145, "global_step": 48520, "epoch": 407, "lr": 2.3566903245607192e-05} +{"train_loss": 0.0011365411337465048, "global_step": 48521, "epoch": 407, "lr": 2.3565022675051458e-05} +{"train_loss": 0.0012806039303541183, "global_step": 48522, "epoch": 407, "lr": 2.3563142156398e-05} +{"train_loss": 0.0012522382894530892, "global_step": 48523, "epoch": 407, "lr": 2.3561261689650466e-05} +{"train_loss": 0.0010858754394575953, "global_step": 48524, "epoch": 407, "lr": 2.355938127481259e-05} +{"train_loss": 0.0014519670512527227, "global_step": 48525, "epoch": 407, "lr": 2.3557500911888047e-05} +{"train_loss": 0.0010464392835274339, "global_step": 48526, "epoch": 407, "lr": 2.3555620600880507e-05} +{"train_loss": 0.0013478343607857823, "global_step": 48527, "epoch": 407, "lr": 2.3553740341793702e-05} +{"train_loss": 0.001891672844067216, "global_step": 48528, "epoch": 407, "lr": 2.3551860134631277e-05} +{"train_loss": 0.0005928058526478708, "global_step": 48529, "epoch": 407, "lr": 2.3549979979396976e-05} +{"train_loss": 0.0011420436203479767, "global_step": 48530, "epoch": 407, "lr": 2.3548099876094437e-05} +{"train_loss": 0.0017558503895998001, "global_step": 48531, "epoch": 407, "lr": 2.35462198247274e-05} +{"train_loss": 0.0007970469305291772, "global_step": 48532, "epoch": 407, "lr": 2.3544339825299533e-05} +{"train_loss": 0.0009235344477929175, "global_step": 48533, "epoch": 407, "lr": 2.354245987781451e-05} +{"train_loss": 0.0006949635571800172, "global_step": 48534, "epoch": 407, "lr": 2.354057998227606e-05} +{"train_loss": 0.000612115312833339, "global_step": 48535, "epoch": 407, "lr": 2.3538700138687837e-05} +{"train_loss": 0.0018682265654206276, "global_step": 48536, "epoch": 407, "lr": 2.3536820347053562e-05} +{"train_loss": 0.0014174855314195156, "global_step": 48537, "epoch": 407, "lr": 2.353494060737692e-05} +{"train_loss": 0.0007057801703922451, "global_step": 48538, "epoch": 407, "lr": 2.353306091966157e-05} +{"train_loss": 0.0006103237974457443, "global_step": 48539, "epoch": 407, "lr": 2.353118128391125e-05} +{"train_loss": 0.0007124508847482502, "global_step": 48540, "epoch": 407, "lr": 2.352930170012961e-05} +{"train_loss": 0.0010906595271080732, "global_step": 48541, "epoch": 407, "lr": 2.3527422168320356e-05} +{"train_loss": 0.0008393424213863909, "global_step": 48542, "epoch": 407, "lr": 2.3525542688487203e-05} +{"train_loss": 0.0009190078708343208, "global_step": 48543, "epoch": 407, "lr": 2.3523663260633795e-05} +{"train_loss": 0.0007693831576034427, "global_step": 48544, "epoch": 407, "lr": 2.3521783884763866e-05} +{"train_loss": 0.0010715530952438712, "global_step": 48545, "epoch": 407, "lr": 2.3519904560881066e-05} +{"train_loss": 0.0011149164056405425, "global_step": 48546, "epoch": 407, "lr": 2.3518025288989125e-05} +{"train_loss": 0.0005932719795964658, "global_step": 48547, "epoch": 407, "lr": 2.3516146069091694e-05} +{"train_loss": 0.0015649388078600168, "global_step": 48548, "epoch": 407, "lr": 2.3514266901192495e-05} +{"train_loss": 0.0006753301713615656, "global_step": 48549, "epoch": 407, "lr": 2.3512387785295202e-05} +{"train_loss": 0.0010488445404917002, "global_step": 48550, "epoch": 407, "lr": 2.3510508721403497e-05} +{"train_loss": 0.0011095934441829678, "global_step": 48551, "epoch": 407, "lr": 2.3508629709521092e-05, "val_loss": 0.019561562687158585} +{"train_loss": 0.0018378265667706728, "global_step": 48552, "epoch": 408, "lr": 2.350675074965164e-05} +{"train_loss": 0.0003436191182117909, "global_step": 48553, "epoch": 408, "lr": 2.3504871841798876e-05} +{"train_loss": 0.0009883528109639883, "global_step": 48554, "epoch": 408, "lr": 2.3502992985966442e-05} +{"train_loss": 0.000920899910852313, "global_step": 48555, "epoch": 408, "lr": 2.3501114182158073e-05} +{"train_loss": 0.0010486211394891143, "global_step": 48556, "epoch": 408, "lr": 2.3499235430377436e-05} +{"train_loss": 0.0010381679749116302, "global_step": 48557, "epoch": 408, "lr": 2.3497356730628194e-05} +{"train_loss": 0.0010452400892972946, "global_step": 48558, "epoch": 408, "lr": 2.3495478082914085e-05} +{"train_loss": 0.0008281494956463575, "global_step": 48559, "epoch": 408, "lr": 2.3493599487238754e-05} +{"train_loss": 0.0010647609597072005, "global_step": 48560, "epoch": 408, "lr": 2.3491720943605927e-05} +{"train_loss": 0.0006917790160514414, "global_step": 48561, "epoch": 408, "lr": 2.3489842452019256e-05} +{"train_loss": 0.000751387735363096, "global_step": 48562, "epoch": 408, "lr": 2.3487964012482465e-05} +{"train_loss": 0.001019003801047802, "global_step": 48563, "epoch": 408, "lr": 2.3486085624999226e-05} +{"train_loss": 0.0009483620524406433, "global_step": 48564, "epoch": 408, "lr": 2.3484207289573202e-05} +{"train_loss": 0.0011542547727003694, "global_step": 48565, "epoch": 408, "lr": 2.3482329006208124e-05} +{"train_loss": 0.0008511964115314186, "global_step": 48566, "epoch": 408, "lr": 2.3480450774907648e-05} +{"train_loss": 0.0006729513988830149, "global_step": 48567, "epoch": 408, "lr": 2.3478572595675486e-05} +{"train_loss": 0.0012480623554438353, "global_step": 48568, "epoch": 408, "lr": 2.3476694468515314e-05} +{"train_loss": 0.0020407186821103096, "global_step": 48569, "epoch": 408, "lr": 2.34748163934308e-05} +{"train_loss": 0.0007156370556913316, "global_step": 48570, "epoch": 408, "lr": 2.3472938370425672e-05} +{"train_loss": 0.0008467541192658246, "global_step": 48571, "epoch": 408, "lr": 2.3471060399503574e-05} +{"train_loss": 0.0004893823061138391, "global_step": 48572, "epoch": 408, "lr": 2.3469182480668232e-05} +{"train_loss": 0.001338211353868246, "global_step": 48573, "epoch": 408, "lr": 2.3467304613923303e-05} +{"train_loss": 0.0009037834824994206, "global_step": 48574, "epoch": 408, "lr": 2.3465426799272498e-05} +{"train_loss": 0.001406187890097499, "global_step": 48575, "epoch": 408, "lr": 2.346354903671948e-05} +{"train_loss": 0.0011791546130552888, "global_step": 48576, "epoch": 408, "lr": 2.3461671326267943e-05} +{"train_loss": 0.0008855939959175885, "global_step": 48577, "epoch": 408, "lr": 2.3459793667921603e-05} +{"train_loss": 0.0009216618491336703, "global_step": 48578, "epoch": 408, "lr": 2.34579160616841e-05} +{"train_loss": 0.0005731940036639571, "global_step": 48579, "epoch": 408, "lr": 2.3456038507559165e-05} +{"train_loss": 0.0010498109040781856, "global_step": 48580, "epoch": 408, "lr": 2.345416100555044e-05} +{"train_loss": 0.001145601854659617, "global_step": 48581, "epoch": 408, "lr": 2.345228355566166e-05} +{"train_loss": 0.0010881794150918722, "global_step": 48582, "epoch": 408, "lr": 2.3450406157896477e-05} +{"train_loss": 0.0004509214195422828, "global_step": 48583, "epoch": 408, "lr": 2.344852881225857e-05} +{"train_loss": 0.0008652739925310016, "global_step": 48584, "epoch": 408, "lr": 2.344665151875166e-05} +{"train_loss": 0.0011028305161744356, "global_step": 48585, "epoch": 408, "lr": 2.3444774277379396e-05} +{"train_loss": 0.0007961808005347848, "global_step": 48586, "epoch": 408, "lr": 2.3442897088145495e-05} +{"train_loss": 0.0014772370923310518, "global_step": 48587, "epoch": 408, "lr": 2.3441019951053628e-05} +{"train_loss": 0.001001014024950564, "global_step": 48588, "epoch": 408, "lr": 2.343914286610746e-05} +{"train_loss": 0.0003802308638114482, "global_step": 48589, "epoch": 408, "lr": 2.3437265833310723e-05} +{"train_loss": 0.0009423868032172322, "global_step": 48590, "epoch": 408, "lr": 2.343538885266705e-05} +{"train_loss": 0.0009632176952436566, "global_step": 48591, "epoch": 408, "lr": 2.3433511924180178e-05} +{"train_loss": 0.0007940625655464828, "global_step": 48592, "epoch": 408, "lr": 2.343163504785375e-05} +{"train_loss": 0.0007592173642478883, "global_step": 48593, "epoch": 408, "lr": 2.3429758223691483e-05} +{"train_loss": 0.0014358015032485127, "global_step": 48594, "epoch": 408, "lr": 2.3427881451697047e-05} +{"train_loss": 0.0005019742529839277, "global_step": 48595, "epoch": 408, "lr": 2.342600473187411e-05} +{"train_loss": 0.000954320072196424, "global_step": 48596, "epoch": 408, "lr": 2.342412806422639e-05} +{"train_loss": 0.0010674160439521074, "global_step": 48597, "epoch": 408, "lr": 2.3422251448757537e-05} +{"train_loss": 0.0007580003002658486, "global_step": 48598, "epoch": 408, "lr": 2.3420374885471274e-05} +{"train_loss": 0.001060903538018465, "global_step": 48599, "epoch": 408, "lr": 2.3418498374371267e-05} +{"train_loss": 0.0014958957908675075, "global_step": 48600, "epoch": 408, "lr": 2.3416621915461178e-05} +{"train_loss": 0.0007048427360132337, "global_step": 48601, "epoch": 408, "lr": 2.341474550874473e-05} +{"train_loss": 0.0007252299692481756, "global_step": 48602, "epoch": 408, "lr": 2.341286915422557e-05} +{"train_loss": 0.00070276262704283, "global_step": 48603, "epoch": 408, "lr": 2.341099285190742e-05} +{"train_loss": 0.0011744233779609203, "global_step": 48604, "epoch": 408, "lr": 2.340911660179393e-05} +{"train_loss": 0.0011728149838745594, "global_step": 48605, "epoch": 408, "lr": 2.3407240403888814e-05} +{"train_loss": 0.001048564212396741, "global_step": 48606, "epoch": 408, "lr": 2.3405364258195723e-05} +{"train_loss": 0.0012298058718442917, "global_step": 48607, "epoch": 408, "lr": 2.3403488164718375e-05} +{"train_loss": 0.0008094173390418291, "global_step": 48608, "epoch": 408, "lr": 2.3401612123460415e-05} +{"train_loss": 0.0008400571532547474, "global_step": 48609, "epoch": 408, "lr": 2.339973613442557e-05} +{"train_loss": 0.001052630483172834, "global_step": 48610, "epoch": 408, "lr": 2.339786019761748e-05} +{"train_loss": 0.0007199803949333727, "global_step": 48611, "epoch": 408, "lr": 2.3395984313039854e-05} +{"train_loss": 0.0010072977747768164, "global_step": 48612, "epoch": 408, "lr": 2.339410848069639e-05} +{"train_loss": 0.0008302871719934046, "global_step": 48613, "epoch": 408, "lr": 2.339223270059075e-05} +{"train_loss": 0.0019260153640061617, "global_step": 48614, "epoch": 408, "lr": 2.3390356972726597e-05} +{"train_loss": 0.0011128876358270645, "global_step": 48615, "epoch": 408, "lr": 2.3388481297107655e-05} +{"train_loss": 0.0009178720647469163, "global_step": 48616, "epoch": 408, "lr": 2.3386605673737573e-05} +{"train_loss": 0.0016341173322871327, "global_step": 48617, "epoch": 408, "lr": 2.3384730102620063e-05} +{"train_loss": 0.000948929984588176, "global_step": 48618, "epoch": 408, "lr": 2.338285458375879e-05} +{"train_loss": 0.0010940969223156571, "global_step": 48619, "epoch": 408, "lr": 2.338097911715742e-05} +{"train_loss": 0.0006134122377261519, "global_step": 48620, "epoch": 408, "lr": 2.337910370281967e-05} +{"train_loss": 0.0008757201139815152, "global_step": 48621, "epoch": 408, "lr": 2.337722834074919e-05} +{"train_loss": 0.0010880227200686932, "global_step": 48622, "epoch": 408, "lr": 2.3375353030949698e-05} +{"train_loss": 0.0009597546886652708, "global_step": 48623, "epoch": 408, "lr": 2.337347777342484e-05} +{"train_loss": 0.0015154731227084994, "global_step": 48624, "epoch": 408, "lr": 2.3371602568178324e-05} +{"train_loss": 0.0011342985089868307, "global_step": 48625, "epoch": 408, "lr": 2.3369727415213828e-05} +{"train_loss": 0.0007754240068607032, "global_step": 48626, "epoch": 408, "lr": 2.336785231453501e-05} +{"train_loss": 0.0005807889392599463, "global_step": 48627, "epoch": 408, "lr": 2.3365977266145582e-05} +{"train_loss": 0.0013227761955931783, "global_step": 48628, "epoch": 408, "lr": 2.33641022700492e-05} +{"train_loss": 0.0010749527718871832, "global_step": 48629, "epoch": 408, "lr": 2.3362227326249568e-05} +{"train_loss": 0.000901304476428777, "global_step": 48630, "epoch": 408, "lr": 2.3360352434750342e-05} +{"train_loss": 0.0014957728562876582, "global_step": 48631, "epoch": 408, "lr": 2.335847759555524e-05} +{"train_loss": 0.0007611170294694602, "global_step": 48632, "epoch": 408, "lr": 2.3356602808667916e-05} +{"train_loss": 0.0016539307544007897, "global_step": 48633, "epoch": 408, "lr": 2.3354728074092037e-05} +{"train_loss": 0.0016254946822300553, "global_step": 48634, "epoch": 408, "lr": 2.3352853391831325e-05} +{"train_loss": 0.0013304247986525297, "global_step": 48635, "epoch": 408, "lr": 2.335097876188942e-05} +{"train_loss": 0.0007219834951683879, "global_step": 48636, "epoch": 408, "lr": 2.3349104184270036e-05} +{"train_loss": 0.001534900045953691, "global_step": 48637, "epoch": 408, "lr": 2.3347229658976842e-05} +{"train_loss": 0.000677852367516607, "global_step": 48638, "epoch": 408, "lr": 2.3345355186013496e-05} +{"train_loss": 0.0012981456238776445, "global_step": 48639, "epoch": 408, "lr": 2.3343480765383697e-05} +{"train_loss": 0.0009370144689455628, "global_step": 48640, "epoch": 408, "lr": 2.3341606397091143e-05} +{"train_loss": 0.0010503161465749145, "global_step": 48641, "epoch": 408, "lr": 2.3339732081139482e-05} +{"train_loss": 0.0005905920988880098, "global_step": 48642, "epoch": 408, "lr": 2.333785781753242e-05} +{"train_loss": 0.0007058237097226083, "global_step": 48643, "epoch": 408, "lr": 2.3335983606273615e-05} +{"train_loss": 0.0020258906297385693, "global_step": 48644, "epoch": 408, "lr": 2.3334109447366775e-05} +{"train_loss": 0.0009259170619770885, "global_step": 48645, "epoch": 408, "lr": 2.333223534081554e-05} +{"train_loss": 0.0009671307634562254, "global_step": 48646, "epoch": 408, "lr": 2.333036128662363e-05} +{"train_loss": 0.00040852141682989895, "global_step": 48647, "epoch": 408, "lr": 2.3328487284794693e-05} +{"train_loss": 0.0012813403736799955, "global_step": 48648, "epoch": 408, "lr": 2.3326613335332436e-05} +{"train_loss": 0.0009227544069290161, "global_step": 48649, "epoch": 408, "lr": 2.3324739438240512e-05} +{"train_loss": 0.0015350423054769635, "global_step": 48650, "epoch": 408, "lr": 2.3322865593522624e-05} +{"train_loss": 0.0005077673122286797, "global_step": 48651, "epoch": 408, "lr": 2.3320991801182442e-05} +{"train_loss": 0.0011911015026271343, "global_step": 48652, "epoch": 408, "lr": 2.331911806122362e-05} +{"train_loss": 0.0008220045710913837, "global_step": 48653, "epoch": 408, "lr": 2.3317244373649884e-05} +{"train_loss": 0.0009048777283169329, "global_step": 48654, "epoch": 408, "lr": 2.3315370738464863e-05} +{"train_loss": 0.0008795050089247525, "global_step": 48655, "epoch": 408, "lr": 2.3313497155672287e-05} +{"train_loss": 0.0004615859652403742, "global_step": 48656, "epoch": 408, "lr": 2.3311623625275803e-05} +{"train_loss": 0.0011673838598653674, "global_step": 48657, "epoch": 408, "lr": 2.3309750147279075e-05} +{"train_loss": 0.0008993376977741718, "global_step": 48658, "epoch": 408, "lr": 2.3307876721685822e-05} +{"train_loss": 0.0012954117264598608, "global_step": 48659, "epoch": 408, "lr": 2.3306003348499683e-05} +{"train_loss": 0.001732605742290616, "global_step": 48660, "epoch": 408, "lr": 2.3304130027724376e-05} +{"train_loss": 0.0008429500740021467, "global_step": 48661, "epoch": 408, "lr": 2.3302256759363535e-05} +{"train_loss": 0.0010652675991877913, "global_step": 48662, "epoch": 408, "lr": 2.3300383543420877e-05} +{"train_loss": 0.0010370195377618074, "global_step": 48663, "epoch": 408, "lr": 2.329851037990007e-05} +{"train_loss": 0.001014572218991816, "global_step": 48664, "epoch": 408, "lr": 2.3296637268804762e-05} +{"train_loss": 0.0009414370288141072, "global_step": 48665, "epoch": 408, "lr": 2.3294764210138677e-05} +{"train_loss": 0.0006450123619288206, "global_step": 48666, "epoch": 408, "lr": 2.3292891203905442e-05} +{"train_loss": 0.0005245031206868589, "global_step": 48667, "epoch": 408, "lr": 2.3291018250108785e-05} +{"train_loss": 0.0009667817503213882, "global_step": 48668, "epoch": 408, "lr": 2.328914534875237e-05} +{"train_loss": 0.0010381134925410151, "global_step": 48669, "epoch": 408, "lr": 2.328727249983983e-05} +{"train_loss": 0.0010015641218305666, "global_step": 48670, "epoch": 408, "lr": 2.3285399703374905e-05, "val_loss": 0.01780783012509346} +{"train_loss": 0.0011188823264092207, "global_step": 48671, "epoch": 409, "lr": 2.3283526959361225e-05} +{"train_loss": 0.0005105237942188978, "global_step": 48672, "epoch": 409, "lr": 2.32816542678025e-05} +{"train_loss": 0.0016427823575213552, "global_step": 48673, "epoch": 409, "lr": 2.3279781628702373e-05} +{"train_loss": 0.0007019921322353184, "global_step": 48674, "epoch": 409, "lr": 2.3277909042064545e-05} +{"train_loss": 0.0010659362887963653, "global_step": 48675, "epoch": 409, "lr": 2.3276036507892702e-05} +{"train_loss": 0.0008946495363488793, "global_step": 48676, "epoch": 409, "lr": 2.3274164026190492e-05} +{"train_loss": 0.0009454782120883465, "global_step": 48677, "epoch": 409, "lr": 2.327229159696162e-05} +{"train_loss": 0.0007907532854005694, "global_step": 48678, "epoch": 409, "lr": 2.3270419220209734e-05} +{"train_loss": 0.0011766450479626656, "global_step": 48679, "epoch": 409, "lr": 2.3268546895938538e-05} +{"train_loss": 0.0009738720837049186, "global_step": 48680, "epoch": 409, "lr": 2.326667462415168e-05} +{"train_loss": 0.0010253324871882796, "global_step": 48681, "epoch": 409, "lr": 2.3264802404852865e-05} +{"train_loss": 0.0007217710372060537, "global_step": 48682, "epoch": 409, "lr": 2.3262930238045754e-05} +{"train_loss": 0.0011918561067432165, "global_step": 48683, "epoch": 409, "lr": 2.326105812373401e-05} +{"train_loss": 0.0022896593436598778, "global_step": 48684, "epoch": 409, "lr": 2.3259186061921335e-05} +{"train_loss": 0.0007369658560492098, "global_step": 48685, "epoch": 409, "lr": 2.3257314052611375e-05} +{"train_loss": 0.0006765794241800904, "global_step": 48686, "epoch": 409, "lr": 2.3255442095807838e-05} +{"train_loss": 0.0006478283321484923, "global_step": 48687, "epoch": 409, "lr": 2.325357019151439e-05} +{"train_loss": 0.001258647651411593, "global_step": 48688, "epoch": 409, "lr": 2.3251698339734674e-05} +{"train_loss": 0.0010467758402228355, "global_step": 48689, "epoch": 409, "lr": 2.3249826540472415e-05} +{"train_loss": 0.0011698671150952578, "global_step": 48690, "epoch": 409, "lr": 2.3247954793731237e-05} +{"train_loss": 0.0011503882706165314, "global_step": 48691, "epoch": 409, "lr": 2.3246083099514866e-05} +{"train_loss": 0.0005524844746105373, "global_step": 48692, "epoch": 409, "lr": 2.3244211457826933e-05} +{"train_loss": 0.0010887053795158863, "global_step": 48693, "epoch": 409, "lr": 2.324233986867115e-05} +{"train_loss": 0.0014185429317876697, "global_step": 48694, "epoch": 409, "lr": 2.3240468332051174e-05} +{"train_loss": 0.0006354641518555582, "global_step": 48695, "epoch": 409, "lr": 2.323859684797066e-05} +{"train_loss": 0.001186480512842536, "global_step": 48696, "epoch": 409, "lr": 2.3236725416433326e-05} +{"train_loss": 0.0007084142998792231, "global_step": 48697, "epoch": 409, "lr": 2.3234854037442798e-05} +{"train_loss": 0.000418611743953079, "global_step": 48698, "epoch": 409, "lr": 2.32329827110028e-05} +{"train_loss": 0.001398490509018302, "global_step": 48699, "epoch": 409, "lr": 2.3231111437116955e-05} +{"train_loss": 0.0009957667207345366, "global_step": 48700, "epoch": 409, "lr": 2.3229240215788983e-05} +{"train_loss": 0.0008861397509463131, "global_step": 48701, "epoch": 409, "lr": 2.3227369047022542e-05} +{"train_loss": 0.0005771050928160548, "global_step": 48702, "epoch": 409, "lr": 2.322549793082128e-05} +{"train_loss": 0.0008981011342257261, "global_step": 48703, "epoch": 409, "lr": 2.3223626867188913e-05} +{"train_loss": 0.000533119251485914, "global_step": 48704, "epoch": 409, "lr": 2.3221755856129074e-05} +{"train_loss": 0.0014852957101538777, "global_step": 48705, "epoch": 409, "lr": 2.321988489764547e-05} +{"train_loss": 0.0007917560869827867, "global_step": 48706, "epoch": 409, "lr": 2.321801399174175e-05} +{"train_loss": 0.0014717418234795332, "global_step": 48707, "epoch": 409, "lr": 2.3216143138421613e-05} +{"train_loss": 0.0006895202677696943, "global_step": 48708, "epoch": 409, "lr": 2.3214272337688698e-05} +{"train_loss": 0.0008446783758699894, "global_step": 48709, "epoch": 409, "lr": 2.32124015895467e-05} +{"train_loss": 0.0006785162840969861, "global_step": 48710, "epoch": 409, "lr": 2.321053089399931e-05} +{"train_loss": 0.0006541854236274958, "global_step": 48711, "epoch": 409, "lr": 2.3208660251050158e-05} +{"train_loss": 0.0007736137486062944, "global_step": 48712, "epoch": 409, "lr": 2.320678966070296e-05} +{"train_loss": 0.0005916781956329942, "global_step": 48713, "epoch": 409, "lr": 2.3204919122961365e-05} +{"train_loss": 0.001237859483808279, "global_step": 48714, "epoch": 409, "lr": 2.3203048637829032e-05} +{"train_loss": 0.0007893291767686605, "global_step": 48715, "epoch": 409, "lr": 2.3201178205309677e-05} +{"train_loss": 0.001023204647935927, "global_step": 48716, "epoch": 409, "lr": 2.3199307825406918e-05} +{"train_loss": 0.0007381944451481104, "global_step": 48717, "epoch": 409, "lr": 2.3197437498124474e-05} +{"train_loss": 0.0006390696507878602, "global_step": 48718, "epoch": 409, "lr": 2.319556722346598e-05} +{"train_loss": 0.0010488474508747458, "global_step": 48719, "epoch": 409, "lr": 2.3193697001435145e-05} +{"train_loss": 0.00041724517359398305, "global_step": 48720, "epoch": 409, "lr": 2.3191826832035624e-05} +{"train_loss": 0.001131789293140173, "global_step": 48721, "epoch": 409, "lr": 2.3189956715271066e-05} +{"train_loss": 0.0008757126634009182, "global_step": 48722, "epoch": 409, "lr": 2.318808665114518e-05} +{"train_loss": 0.0009524484048597515, "global_step": 48723, "epoch": 409, "lr": 2.3186216639661608e-05} +{"train_loss": 0.0007532282033935189, "global_step": 48724, "epoch": 409, "lr": 2.318434668082405e-05} +{"train_loss": 0.0007263016304932535, "global_step": 48725, "epoch": 409, "lr": 2.3182476774636165e-05} +{"train_loss": 0.0005901927361264825, "global_step": 48726, "epoch": 409, "lr": 2.31806069211016e-05} +{"train_loss": 0.0013813454424962401, "global_step": 48727, "epoch": 409, "lr": 2.317873712022407e-05} +{"train_loss": 0.0010754414834082127, "global_step": 48728, "epoch": 409, "lr": 2.3176867372007205e-05} +{"train_loss": 0.0013465817319229245, "global_step": 48729, "epoch": 409, "lr": 2.3174997676454714e-05} +{"train_loss": 0.0006408184999600053, "global_step": 48730, "epoch": 409, "lr": 2.317312803357023e-05} +{"train_loss": 0.0007885636878199875, "global_step": 48731, "epoch": 409, "lr": 2.3171258443357463e-05} +{"train_loss": 0.0011571662034839392, "global_step": 48732, "epoch": 409, "lr": 2.3169388905820062e-05} +{"train_loss": 0.001268535852432251, "global_step": 48733, "epoch": 409, "lr": 2.316751942096168e-05} +{"train_loss": 0.000978986150585115, "global_step": 48734, "epoch": 409, "lr": 2.3165649988786026e-05} +{"train_loss": 0.0008327207760885358, "global_step": 48735, "epoch": 409, "lr": 2.3163780609296737e-05} +{"train_loss": 0.0016530639259144664, "global_step": 48736, "epoch": 409, "lr": 2.3161911282497512e-05} +{"train_loss": 0.000539586297236383, "global_step": 48737, "epoch": 409, "lr": 2.3160042008391986e-05} +{"train_loss": 0.0005641779280267656, "global_step": 48738, "epoch": 409, "lr": 2.3158172786983873e-05} +{"train_loss": 0.0011251317337155342, "global_step": 48739, "epoch": 409, "lr": 2.3156303618276804e-05} +{"train_loss": 0.0008607252966612577, "global_step": 48740, "epoch": 409, "lr": 2.315443450227448e-05} +{"train_loss": 0.00044719086145050824, "global_step": 48741, "epoch": 409, "lr": 2.3152565438980534e-05} +{"train_loss": 0.0012693305034190416, "global_step": 48742, "epoch": 409, "lr": 2.3150696428398684e-05} +{"train_loss": 0.0013175738276913762, "global_step": 48743, "epoch": 409, "lr": 2.3148827470532547e-05} +{"train_loss": 0.0011975483503192663, "global_step": 48744, "epoch": 409, "lr": 2.314695856538584e-05} +{"train_loss": 0.0012035061372444034, "global_step": 48745, "epoch": 409, "lr": 2.3145089712962193e-05} +{"train_loss": 0.000673106755129993, "global_step": 48746, "epoch": 409, "lr": 2.3143220913265313e-05} +{"train_loss": 0.0009941415628418326, "global_step": 48747, "epoch": 409, "lr": 2.314135216629883e-05} +{"train_loss": 0.00134165002964437, "global_step": 48748, "epoch": 409, "lr": 2.313948347206645e-05} +{"train_loss": 0.0011597818229347467, "global_step": 48749, "epoch": 409, "lr": 2.313761483057181e-05} +{"train_loss": 0.0005298957694321871, "global_step": 48750, "epoch": 409, "lr": 2.3135746241818608e-05} +{"train_loss": 0.001055512810125947, "global_step": 48751, "epoch": 409, "lr": 2.3133877705810497e-05} +{"train_loss": 0.0005559908458963037, "global_step": 48752, "epoch": 409, "lr": 2.3132009222551133e-05} +{"train_loss": 0.0011614018585532904, "global_step": 48753, "epoch": 409, "lr": 2.3130140792044212e-05} +{"train_loss": 0.0013307419139891863, "global_step": 48754, "epoch": 409, "lr": 2.3128272414293373e-05} +{"train_loss": 0.0008848664001561701, "global_step": 48755, "epoch": 409, "lr": 2.3126404089302318e-05} +{"train_loss": 0.0007893304573372006, "global_step": 48756, "epoch": 409, "lr": 2.31245358170747e-05} +{"train_loss": 0.001304272678680718, "global_step": 48757, "epoch": 409, "lr": 2.3122667597614163e-05} +{"train_loss": 0.001037227688357234, "global_step": 48758, "epoch": 409, "lr": 2.312079943092442e-05} +{"train_loss": 0.0007025062222965062, "global_step": 48759, "epoch": 409, "lr": 2.3118931317009092e-05} +{"train_loss": 0.0008606454939581454, "global_step": 48760, "epoch": 409, "lr": 2.311706325587189e-05} +{"train_loss": 0.0011144103482365608, "global_step": 48761, "epoch": 409, "lr": 2.3115195247516446e-05} +{"train_loss": 0.0010519959032535553, "global_step": 48762, "epoch": 409, "lr": 2.3113327291946458e-05} +{"train_loss": 0.0015255495673045516, "global_step": 48763, "epoch": 409, "lr": 2.3111459389165586e-05} +{"train_loss": 0.0007909138803370297, "global_step": 48764, "epoch": 409, "lr": 2.3109591539177466e-05} +{"train_loss": 0.0019095921888947487, "global_step": 48765, "epoch": 409, "lr": 2.3107723741985814e-05} +{"train_loss": 0.0009130642865784466, "global_step": 48766, "epoch": 409, "lr": 2.3105855997594252e-05} +{"train_loss": 0.0009110475657507777, "global_step": 48767, "epoch": 409, "lr": 2.3103988306006487e-05} +{"train_loss": 0.0006894228863529861, "global_step": 48768, "epoch": 409, "lr": 2.310212066722615e-05} +{"train_loss": 0.0006741301040165126, "global_step": 48769, "epoch": 409, "lr": 2.3100253081256946e-05} +{"train_loss": 0.001274215872399509, "global_step": 48770, "epoch": 409, "lr": 2.3098385548102496e-05} +{"train_loss": 0.0007404776988551021, "global_step": 48771, "epoch": 409, "lr": 2.3096518067766516e-05} +{"train_loss": 0.0011788562405854464, "global_step": 48772, "epoch": 409, "lr": 2.309465064025263e-05} +{"train_loss": 0.0014844225952401757, "global_step": 48773, "epoch": 409, "lr": 2.3092783265564538e-05} +{"train_loss": 0.0004701942962128669, "global_step": 48774, "epoch": 409, "lr": 2.3090915943705875e-05} +{"train_loss": 0.0014649169752374291, "global_step": 48775, "epoch": 409, "lr": 2.308904867468034e-05} +{"train_loss": 0.0008775885216891766, "global_step": 48776, "epoch": 409, "lr": 2.3087181458491568e-05} +{"train_loss": 0.0013717201072722673, "global_step": 48777, "epoch": 409, "lr": 2.3085314295143263e-05} +{"train_loss": 0.0011920295655727386, "global_step": 48778, "epoch": 409, "lr": 2.308344718463904e-05} +{"train_loss": 0.0005484719295054674, "global_step": 48779, "epoch": 409, "lr": 2.3081580126982617e-05} +{"train_loss": 0.0016907398821786046, "global_step": 48780, "epoch": 409, "lr": 2.3079713122177615e-05} +{"train_loss": 0.0014332651626318693, "global_step": 48781, "epoch": 409, "lr": 2.307784617022774e-05} +{"train_loss": 0.000591220916248858, "global_step": 48782, "epoch": 409, "lr": 2.307597927113664e-05} +{"train_loss": 0.0006143368664197624, "global_step": 48783, "epoch": 409, "lr": 2.307411242490795e-05} +{"train_loss": 0.0014111163327470422, "global_step": 48784, "epoch": 409, "lr": 2.3072245631545393e-05} +{"train_loss": 0.0011789468117058277, "global_step": 48785, "epoch": 409, "lr": 2.307037889105258e-05} +{"train_loss": 0.0007026947569102049, "global_step": 48786, "epoch": 409, "lr": 2.3068512203433225e-05} +{"train_loss": 0.0015727670397609472, "global_step": 48787, "epoch": 409, "lr": 2.3066645568690965e-05} +{"train_loss": 0.0011439563240855932, "global_step": 48788, "epoch": 409, "lr": 2.306477898682945e-05} +{"train_loss": 0.0009825157521081258, "global_step": 48789, "epoch": 409, "lr": 2.3062912457852386e-05, "val_loss": 0.014504333958029747} +{"train_loss": 0.0005853980546817183, "global_step": 48790, "epoch": 410, "lr": 2.3061045981763395e-05} +{"train_loss": 0.0009465559851378202, "global_step": 48791, "epoch": 410, "lr": 2.305917955856618e-05} +{"train_loss": 0.000823172100353986, "global_step": 48792, "epoch": 410, "lr": 2.3057313188264368e-05} +{"train_loss": 0.0009295346098951995, "global_step": 48793, "epoch": 410, "lr": 2.3055446870861663e-05} +{"train_loss": 0.0011974438093602657, "global_step": 48794, "epoch": 410, "lr": 2.3053580606361713e-05} +{"train_loss": 0.0010813131229951978, "global_step": 48795, "epoch": 410, "lr": 2.3051714394768155e-05} +{"train_loss": 0.0009655642206780612, "global_step": 48796, "epoch": 410, "lr": 2.3049848236084697e-05} +{"train_loss": 0.0008151204092428088, "global_step": 48797, "epoch": 410, "lr": 2.3047982130314966e-05} +{"train_loss": 0.0015534913400188088, "global_step": 48798, "epoch": 410, "lr": 2.304611607746266e-05} +{"train_loss": 0.0015713418833911419, "global_step": 48799, "epoch": 410, "lr": 2.3044250077531408e-05} +{"train_loss": 0.003998441621661186, "global_step": 48800, "epoch": 410, "lr": 2.304238413052491e-05} +{"train_loss": 0.0007719978457316756, "global_step": 48801, "epoch": 410, "lr": 2.3040518236446808e-05} +{"train_loss": 0.001533384551294148, "global_step": 48802, "epoch": 410, "lr": 2.303865239530075e-05} +{"train_loss": 0.001752139301970601, "global_step": 48803, "epoch": 410, "lr": 2.303678660709044e-05} +{"train_loss": 0.0008150351932272315, "global_step": 48804, "epoch": 410, "lr": 2.3034920871819493e-05} +{"train_loss": 0.000774173648096621, "global_step": 48805, "epoch": 410, "lr": 2.3033055189491602e-05} +{"train_loss": 0.0014393202727660537, "global_step": 48806, "epoch": 410, "lr": 2.303118956011045e-05} +{"train_loss": 0.0013495705788955092, "global_step": 48807, "epoch": 410, "lr": 2.3029323983679653e-05} +{"train_loss": 0.0011092436034232378, "global_step": 48808, "epoch": 410, "lr": 2.3027458460202915e-05} +{"train_loss": 0.0009195745224133134, "global_step": 48809, "epoch": 410, "lr": 2.3025592989683863e-05} +{"train_loss": 0.0009759714012034237, "global_step": 48810, "epoch": 410, "lr": 2.3023727572126197e-05} +{"train_loss": 0.0016446284716948867, "global_step": 48811, "epoch": 410, "lr": 2.3021862207533535e-05} +{"train_loss": 0.0016150918090716004, "global_step": 48812, "epoch": 410, "lr": 2.301999689590959e-05} +{"train_loss": 0.001446417300030589, "global_step": 48813, "epoch": 410, "lr": 2.3018131637257995e-05} +{"train_loss": 0.0014760843478143215, "global_step": 48814, "epoch": 410, "lr": 2.30162664315824e-05} +{"train_loss": 0.0012085831258445978, "global_step": 48815, "epoch": 410, "lr": 2.30144012788865e-05} +{"train_loss": 0.0010789311490952969, "global_step": 48816, "epoch": 410, "lr": 2.301253617917392e-05} +{"train_loss": 0.0013860552571713924, "global_step": 48817, "epoch": 410, "lr": 2.3010671132448364e-05} +{"train_loss": 0.0013971029547974467, "global_step": 48818, "epoch": 410, "lr": 2.300880613871345e-05} +{"train_loss": 0.0018547106301411986, "global_step": 48819, "epoch": 410, "lr": 2.3006941197972888e-05} +{"train_loss": 0.0007883777725510299, "global_step": 48820, "epoch": 410, "lr": 2.3005076310230305e-05} +{"train_loss": 0.0009695652406662703, "global_step": 48821, "epoch": 410, "lr": 2.3003211475489355e-05} +{"train_loss": 0.0015114150010049343, "global_step": 48822, "epoch": 410, "lr": 2.3001346693753735e-05} +{"train_loss": 0.001985573209822178, "global_step": 48823, "epoch": 410, "lr": 2.2999481965027063e-05} +{"train_loss": 0.0020826891995966434, "global_step": 48824, "epoch": 410, "lr": 2.2997617289313046e-05} +{"train_loss": 0.0013431862462311983, "global_step": 48825, "epoch": 410, "lr": 2.2995752666615322e-05} +{"train_loss": 0.0006641830550506711, "global_step": 48826, "epoch": 410, "lr": 2.299388809693753e-05} +{"train_loss": 0.0014167234767228365, "global_step": 48827, "epoch": 410, "lr": 2.299202358028338e-05} +{"train_loss": 0.0019903031643480062, "global_step": 48828, "epoch": 410, "lr": 2.2990159116656484e-05} +{"train_loss": 0.0017096720403060317, "global_step": 48829, "epoch": 410, "lr": 2.2988294706060544e-05} +{"train_loss": 0.0016535553149878979, "global_step": 48830, "epoch": 410, "lr": 2.2986430348499183e-05} +{"train_loss": 0.0007797732832841575, "global_step": 48831, "epoch": 410, "lr": 2.2984566043976098e-05} +{"train_loss": 0.0008675383287481964, "global_step": 48832, "epoch": 410, "lr": 2.2982701792494927e-05} +{"train_loss": 0.0010070650605484843, "global_step": 48833, "epoch": 410, "lr": 2.2980837594059324e-05} +{"train_loss": 0.0013836942380294204, "global_step": 48834, "epoch": 410, "lr": 2.2978973448672974e-05} +{"train_loss": 0.001613973523490131, "global_step": 48835, "epoch": 410, "lr": 2.2977109356339505e-05} +{"train_loss": 0.0014261358883231878, "global_step": 48836, "epoch": 410, "lr": 2.297524531706261e-05} +{"train_loss": 0.0009112341795116663, "global_step": 48837, "epoch": 410, "lr": 2.2973381330845923e-05} +{"train_loss": 0.0009866362670436502, "global_step": 48838, "epoch": 410, "lr": 2.2971517397693128e-05} +{"train_loss": 0.0012004387099295855, "global_step": 48839, "epoch": 410, "lr": 2.2969653517607854e-05} +{"train_loss": 0.000983507139608264, "global_step": 48840, "epoch": 410, "lr": 2.2967789690593792e-05} +{"train_loss": 0.0007767543429508805, "global_step": 48841, "epoch": 410, "lr": 2.2965925916654575e-05} +{"train_loss": 0.001317374175414443, "global_step": 48842, "epoch": 410, "lr": 2.2964062195793867e-05} +{"train_loss": 0.0011268083471804857, "global_step": 48843, "epoch": 410, "lr": 2.2962198528015355e-05} +{"train_loss": 0.001124397269450128, "global_step": 48844, "epoch": 410, "lr": 2.2960334913322678e-05} +{"train_loss": 0.0008725054794922471, "global_step": 48845, "epoch": 410, "lr": 2.295847135171948e-05} +{"train_loss": 0.0008965418674051762, "global_step": 48846, "epoch": 410, "lr": 2.295660784320945e-05} +{"train_loss": 0.0010046219686046243, "global_step": 48847, "epoch": 410, "lr": 2.2954744387796213e-05} +{"train_loss": 0.001080170040950179, "global_step": 48848, "epoch": 410, "lr": 2.2952880985483464e-05} +{"train_loss": 0.0011045117862522602, "global_step": 48849, "epoch": 410, "lr": 2.295101763627483e-05} +{"train_loss": 0.001424384769052267, "global_step": 48850, "epoch": 410, "lr": 2.2949154340173996e-05} +{"train_loss": 0.0010398707818239927, "global_step": 48851, "epoch": 410, "lr": 2.2947291097184608e-05} +{"train_loss": 0.0007622435223311186, "global_step": 48852, "epoch": 410, "lr": 2.2945427907310308e-05} +{"train_loss": 0.000962608668487519, "global_step": 48853, "epoch": 410, "lr": 2.2943564770554786e-05} +{"train_loss": 0.0008147654589265585, "global_step": 48854, "epoch": 410, "lr": 2.2941701686921667e-05} +{"train_loss": 0.0021029480267316103, "global_step": 48855, "epoch": 410, "lr": 2.293983865641464e-05} +{"train_loss": 0.0012548111844807863, "global_step": 48856, "epoch": 410, "lr": 2.2937975679037353e-05} +{"train_loss": 0.001036008121445775, "global_step": 48857, "epoch": 410, "lr": 2.2936112754793443e-05} +{"train_loss": 0.0011936444789171219, "global_step": 48858, "epoch": 410, "lr": 2.2934249883686603e-05} +{"train_loss": 0.0008550483617000282, "global_step": 48859, "epoch": 410, "lr": 2.293238706572045e-05} +{"train_loss": 0.0007609936874359846, "global_step": 48860, "epoch": 410, "lr": 2.2930524300898682e-05} +{"train_loss": 0.0011487507726997137, "global_step": 48861, "epoch": 410, "lr": 2.292866158922492e-05} +{"train_loss": 0.002113890368491411, "global_step": 48862, "epoch": 410, "lr": 2.292679893070286e-05} +{"train_loss": 0.001361230737529695, "global_step": 48863, "epoch": 410, "lr": 2.2924936325336132e-05} +{"train_loss": 0.0013085937825962901, "global_step": 48864, "epoch": 410, "lr": 2.2923073773128384e-05} +{"train_loss": 0.0011025099083781242, "global_step": 48865, "epoch": 410, "lr": 2.2921211274083304e-05} +{"train_loss": 0.0012626645620912313, "global_step": 48866, "epoch": 410, "lr": 2.2919348828204517e-05} +{"train_loss": 0.0015634658047929406, "global_step": 48867, "epoch": 410, "lr": 2.2917486435495715e-05} +{"train_loss": 0.0013797773281112313, "global_step": 48868, "epoch": 410, "lr": 2.2915624095960515e-05} +{"train_loss": 0.001380997127853334, "global_step": 48869, "epoch": 410, "lr": 2.2913761809602606e-05} +{"train_loss": 0.0022374067921191454, "global_step": 48870, "epoch": 410, "lr": 2.2911899576425623e-05} +{"train_loss": 0.0014685214264318347, "global_step": 48871, "epoch": 410, "lr": 2.291003739643325e-05} +{"train_loss": 0.0010182014666497707, "global_step": 48872, "epoch": 410, "lr": 2.2908175269629097e-05} +{"train_loss": 0.0013317731209099293, "global_step": 48873, "epoch": 410, "lr": 2.290631319601687e-05} +{"train_loss": 0.0019932554569095373, "global_step": 48874, "epoch": 410, "lr": 2.2904451175600182e-05} +{"train_loss": 0.0016775216208770871, "global_step": 48875, "epoch": 410, "lr": 2.2902589208382736e-05} +{"train_loss": 0.0007577748619951308, "global_step": 48876, "epoch": 410, "lr": 2.2900727294368137e-05} +{"train_loss": 0.001109711010940373, "global_step": 48877, "epoch": 410, "lr": 2.2898865433560085e-05} +{"train_loss": 0.0015363955171778798, "global_step": 48878, "epoch": 410, "lr": 2.2897003625962192e-05} +{"train_loss": 0.0012675253674387932, "global_step": 48879, "epoch": 410, "lr": 2.2895141871578162e-05} +{"train_loss": 0.0010616601211950183, "global_step": 48880, "epoch": 410, "lr": 2.2893280170411603e-05} +{"train_loss": 0.0012683654204010963, "global_step": 48881, "epoch": 410, "lr": 2.2891418522466214e-05} +{"train_loss": 0.0016386115457862616, "global_step": 48882, "epoch": 410, "lr": 2.288955692774562e-05} +{"train_loss": 0.001835011993534863, "global_step": 48883, "epoch": 410, "lr": 2.2887695386253476e-05} +{"train_loss": 0.001408131094649434, "global_step": 48884, "epoch": 410, "lr": 2.288583389799346e-05} +{"train_loss": 0.0014109923504292965, "global_step": 48885, "epoch": 410, "lr": 2.2883972462969195e-05} +{"train_loss": 0.0008982953149825335, "global_step": 48886, "epoch": 410, "lr": 2.288211108118437e-05} +{"train_loss": 0.002139034913852811, "global_step": 48887, "epoch": 410, "lr": 2.2880249752642607e-05} +{"train_loss": 0.001338039175607264, "global_step": 48888, "epoch": 410, "lr": 2.287838847734759e-05} +{"train_loss": 0.0017050305614247918, "global_step": 48889, "epoch": 410, "lr": 2.2876527255302965e-05} +{"train_loss": 0.0014464699197560549, "global_step": 48890, "epoch": 410, "lr": 2.2874666086512357e-05} +{"train_loss": 0.002282944740727544, "global_step": 48891, "epoch": 410, "lr": 2.2872804970979468e-05} +{"train_loss": 0.0008081435807980597, "global_step": 48892, "epoch": 410, "lr": 2.287094390870791e-05} +{"train_loss": 0.0016333163948729634, "global_step": 48893, "epoch": 410, "lr": 2.2869082899701373e-05} +{"train_loss": 0.0013696622336283326, "global_step": 48894, "epoch": 410, "lr": 2.286722194396349e-05} +{"train_loss": 0.0010975933400914073, "global_step": 48895, "epoch": 410, "lr": 2.2865361041497902e-05} +{"train_loss": 0.0011782279470935464, "global_step": 48896, "epoch": 410, "lr": 2.2863500192308296e-05} +{"train_loss": 0.0012879220303148031, "global_step": 48897, "epoch": 410, "lr": 2.286163939639829e-05} +{"train_loss": 0.0009730422752909362, "global_step": 48898, "epoch": 410, "lr": 2.2859778653771573e-05} +{"train_loss": 0.0010378779843449593, "global_step": 48899, "epoch": 410, "lr": 2.2857917964431765e-05} +{"train_loss": 0.0008772040600888431, "global_step": 48900, "epoch": 410, "lr": 2.2856057328382553e-05} +{"train_loss": 0.001257808180525899, "global_step": 48901, "epoch": 410, "lr": 2.285419674562757e-05} +{"train_loss": 0.000632688170298934, "global_step": 48902, "epoch": 410, "lr": 2.2852336216170455e-05} +{"train_loss": 0.0008345873211510479, "global_step": 48903, "epoch": 410, "lr": 2.285047574001488e-05} +{"train_loss": 0.0012218470219522715, "global_step": 48904, "epoch": 410, "lr": 2.2848615317164512e-05} +{"train_loss": 0.001226125517860055, "global_step": 48905, "epoch": 410, "lr": 2.2846754947622965e-05} +{"train_loss": 0.0013751661172136664, "global_step": 48906, "epoch": 410, "lr": 2.2844894631393943e-05} +{"train_loss": 0.0009459852008149028, "global_step": 48907, "epoch": 410, "lr": 2.284303436848104e-05} +{"train_loss": 0.001282805238435624, "global_step": 48908, "epoch": 410, "lr": 2.284117415888796e-05, "val_loss": 0.042005106806755066, "train_action_mse_error": 1.2999309547012672e-05} +{"train_loss": 0.0007093900931067765, "global_step": 48909, "epoch": 411, "lr": 2.2839314002618316e-05} +{"train_loss": 0.0009580153855495155, "global_step": 48910, "epoch": 411, "lr": 2.2837453899675792e-05} +{"train_loss": 0.0006986925145611167, "global_step": 48911, "epoch": 411, "lr": 2.2835593850064014e-05} +{"train_loss": 0.001908833859488368, "global_step": 48912, "epoch": 411, "lr": 2.2833733853786654e-05} +{"train_loss": 0.0010051591088995337, "global_step": 48913, "epoch": 411, "lr": 2.2831873910847363e-05} +{"train_loss": 0.0016388302901759744, "global_step": 48914, "epoch": 411, "lr": 2.283001402124976e-05} +{"train_loss": 0.0009625147213228047, "global_step": 48915, "epoch": 411, "lr": 2.2828154184997546e-05} +{"train_loss": 0.0012510732049122453, "global_step": 48916, "epoch": 411, "lr": 2.2826294402094328e-05} +{"train_loss": 0.0008268191595561802, "global_step": 48917, "epoch": 411, "lr": 2.28244346725438e-05} +{"train_loss": 0.000995954847894609, "global_step": 48918, "epoch": 411, "lr": 2.2822574996349565e-05} +{"train_loss": 0.0012145321816205978, "global_step": 48919, "epoch": 411, "lr": 2.2820715373515327e-05} +{"train_loss": 0.0013214542996138334, "global_step": 48920, "epoch": 411, "lr": 2.2818855804044703e-05} +{"train_loss": 0.0020741091575473547, "global_step": 48921, "epoch": 411, "lr": 2.281699628794134e-05} +{"train_loss": 0.0009418957051821053, "global_step": 48922, "epoch": 411, "lr": 2.2815136825208916e-05} +{"train_loss": 0.000680704484693706, "global_step": 48923, "epoch": 411, "lr": 2.2813277415851047e-05} +{"train_loss": 0.0008965365123003721, "global_step": 48924, "epoch": 411, "lr": 2.2811418059871425e-05} +{"train_loss": 0.0011775970924645662, "global_step": 48925, "epoch": 411, "lr": 2.2809558757273673e-05} +{"train_loss": 0.0011303265346214175, "global_step": 48926, "epoch": 411, "lr": 2.2807699508061437e-05} +{"train_loss": 0.0010386558715254068, "global_step": 48927, "epoch": 411, "lr": 2.280584031223839e-05} +{"train_loss": 0.0011284834472462535, "global_step": 48928, "epoch": 411, "lr": 2.280398116980816e-05} +{"train_loss": 0.0013256649253889918, "global_step": 48929, "epoch": 411, "lr": 2.2802122080774417e-05} +{"train_loss": 0.00084255775436759, "global_step": 48930, "epoch": 411, "lr": 2.2800263045140786e-05} +{"train_loss": 0.0008711391710676253, "global_step": 48931, "epoch": 411, "lr": 2.2798404062910956e-05} +{"train_loss": 0.0012300421949476004, "global_step": 48932, "epoch": 411, "lr": 2.279654513408855e-05} +{"train_loss": 0.0006373043870553374, "global_step": 48933, "epoch": 411, "lr": 2.27946862586772e-05} +{"train_loss": 0.0017385846003890038, "global_step": 48934, "epoch": 411, "lr": 2.2792827436680596e-05} +{"train_loss": 0.0013909728731960058, "global_step": 48935, "epoch": 411, "lr": 2.279096866810235e-05} +{"train_loss": 0.001324419747106731, "global_step": 48936, "epoch": 411, "lr": 2.2789109952946153e-05} +{"train_loss": 0.00145576277282089, "global_step": 48937, "epoch": 411, "lr": 2.278725129121561e-05} +{"train_loss": 0.0010034749284386635, "global_step": 48938, "epoch": 411, "lr": 2.2785392682914393e-05} +{"train_loss": 0.001794806681573391, "global_step": 48939, "epoch": 411, "lr": 2.278353412804617e-05} +{"train_loss": 0.0011605710024014115, "global_step": 48940, "epoch": 411, "lr": 2.2781675626614545e-05} +{"train_loss": 0.0010529316496104002, "global_step": 48941, "epoch": 411, "lr": 2.277981717862322e-05} +{"train_loss": 0.001209471607580781, "global_step": 48942, "epoch": 411, "lr": 2.2777958784075793e-05} +{"train_loss": 0.0015188403194770217, "global_step": 48943, "epoch": 411, "lr": 2.277610044297595e-05} +{"train_loss": 0.0011796712642535567, "global_step": 48944, "epoch": 411, "lr": 2.277424215532733e-05} +{"train_loss": 0.000891088682692498, "global_step": 48945, "epoch": 411, "lr": 2.2772383921133557e-05} +{"train_loss": 0.0011618302669376135, "global_step": 48946, "epoch": 411, "lr": 2.277052574039832e-05} +{"train_loss": 0.0014827201375737786, "global_step": 48947, "epoch": 411, "lr": 2.2768667613125223e-05} +{"train_loss": 0.0012790629407390952, "global_step": 48948, "epoch": 411, "lr": 2.276680953931796e-05} +{"train_loss": 0.00045102735748514533, "global_step": 48949, "epoch": 411, "lr": 2.276495151898014e-05} +{"train_loss": 0.0009648351697251201, "global_step": 48950, "epoch": 411, "lr": 2.2763093552115445e-05} +{"train_loss": 0.0010090263094753027, "global_step": 48951, "epoch": 411, "lr": 2.276123563872751e-05} +{"train_loss": 0.0018251842120662332, "global_step": 48952, "epoch": 411, "lr": 2.2759377778819952e-05} +{"train_loss": 0.0010533600579947233, "global_step": 48953, "epoch": 411, "lr": 2.275751997239647e-05} +{"train_loss": 0.0014022968243807554, "global_step": 48954, "epoch": 411, "lr": 2.2755662219460666e-05} +{"train_loss": 0.0008696820586919785, "global_step": 48955, "epoch": 411, "lr": 2.2753804520016227e-05} +{"train_loss": 0.0023321628104895353, "global_step": 48956, "epoch": 411, "lr": 2.2751946874066767e-05} +{"train_loss": 0.0006317083025351167, "global_step": 48957, "epoch": 411, "lr": 2.2750089281615962e-05} +{"train_loss": 0.0007917190669104457, "global_step": 48958, "epoch": 411, "lr": 2.2748231742667448e-05} +{"train_loss": 0.0011939292307943106, "global_step": 48959, "epoch": 411, "lr": 2.274637425722485e-05} +{"train_loss": 0.001679366105236113, "global_step": 48960, "epoch": 411, "lr": 2.2744516825291857e-05} +{"train_loss": 0.0008891806937754154, "global_step": 48961, "epoch": 411, "lr": 2.2742659446872068e-05} +{"train_loss": 0.0005721052293665707, "global_step": 48962, "epoch": 411, "lr": 2.274080212196918e-05} +{"train_loss": 0.0012233619345352054, "global_step": 48963, "epoch": 411, "lr": 2.2738944850586807e-05} +{"train_loss": 0.0006396195967681706, "global_step": 48964, "epoch": 411, "lr": 2.2737087632728594e-05} +{"train_loss": 0.0008024538983590901, "global_step": 48965, "epoch": 411, "lr": 2.273523046839821e-05} +{"train_loss": 0.001162828179076314, "global_step": 48966, "epoch": 411, "lr": 2.273337335759927e-05} +{"train_loss": 0.0015999599127098918, "global_step": 48967, "epoch": 411, "lr": 2.2731516300335458e-05} +{"train_loss": 0.0016482502687722445, "global_step": 48968, "epoch": 411, "lr": 2.2729659296610384e-05} +{"train_loss": 0.0014466632856056094, "global_step": 48969, "epoch": 411, "lr": 2.2727802346427722e-05} +{"train_loss": 0.0012329415185377002, "global_step": 48970, "epoch": 411, "lr": 2.27259454497911e-05} +{"train_loss": 0.0011623043101280928, "global_step": 48971, "epoch": 411, "lr": 2.272408860670418e-05} +{"train_loss": 0.0011969057377427816, "global_step": 48972, "epoch": 411, "lr": 2.272223181717058e-05} +{"train_loss": 0.001281153759919107, "global_step": 48973, "epoch": 411, "lr": 2.272037508119396e-05} +{"train_loss": 0.0010178722441196442, "global_step": 48974, "epoch": 411, "lr": 2.2718518398778e-05} +{"train_loss": 0.0012522590113803744, "global_step": 48975, "epoch": 411, "lr": 2.2716661769926307e-05} +{"train_loss": 0.001405168790370226, "global_step": 48976, "epoch": 411, "lr": 2.2714805194642515e-05} +{"train_loss": 0.0008813682943582535, "global_step": 48977, "epoch": 411, "lr": 2.2712948672930308e-05} +{"train_loss": 0.0007410863181576133, "global_step": 48978, "epoch": 411, "lr": 2.271109220479329e-05} +{"train_loss": 0.0007696828106418252, "global_step": 48979, "epoch": 411, "lr": 2.2709235790235145e-05} +{"train_loss": 0.0009694487089291215, "global_step": 48980, "epoch": 411, "lr": 2.2707379429259484e-05} +{"train_loss": 0.0005879273521713912, "global_step": 48981, "epoch": 411, "lr": 2.2705523121869987e-05} +{"train_loss": 0.0013199766399338841, "global_step": 48982, "epoch": 411, "lr": 2.270366686807028e-05} +{"train_loss": 0.0006181804346852005, "global_step": 48983, "epoch": 411, "lr": 2.2701810667863982e-05} +{"train_loss": 0.000686759827658534, "global_step": 48984, "epoch": 411, "lr": 2.2699954521254786e-05} +{"train_loss": 0.0014879214577376842, "global_step": 48985, "epoch": 411, "lr": 2.2698098428246295e-05} +{"train_loss": 0.0011113815708085895, "global_step": 48986, "epoch": 411, "lr": 2.2696242388842187e-05} +{"train_loss": 0.001740792184136808, "global_step": 48987, "epoch": 411, "lr": 2.2694386403046068e-05} +{"train_loss": 0.0010788548970595002, "global_step": 48988, "epoch": 411, "lr": 2.269253047086163e-05} +{"train_loss": 0.0010954330209642649, "global_step": 48989, "epoch": 411, "lr": 2.269067459229249e-05} +{"train_loss": 0.0009069584193639457, "global_step": 48990, "epoch": 411, "lr": 2.2688818767342273e-05} +{"train_loss": 0.0012798983370885253, "global_step": 48991, "epoch": 411, "lr": 2.268696299601466e-05} +{"train_loss": 0.0007895809249021113, "global_step": 48992, "epoch": 411, "lr": 2.268510727831326e-05} +{"train_loss": 0.0012249154970049858, "global_step": 48993, "epoch": 411, "lr": 2.268325161424175e-05} +{"train_loss": 0.0007057617767713964, "global_step": 48994, "epoch": 411, "lr": 2.2681396003803756e-05} +{"train_loss": 0.0013150755548849702, "global_step": 48995, "epoch": 411, "lr": 2.2679540447002913e-05} +{"train_loss": 0.0007358862785622478, "global_step": 48996, "epoch": 411, "lr": 2.267768494384288e-05} +{"train_loss": 0.0012983579654246569, "global_step": 48997, "epoch": 411, "lr": 2.2675829494327283e-05} +{"train_loss": 0.0010764000471681356, "global_step": 48998, "epoch": 411, "lr": 2.2673974098459793e-05} +{"train_loss": 0.0009816070087254047, "global_step": 48999, "epoch": 411, "lr": 2.2672118756244014e-05} +{"train_loss": 0.0014300666516646743, "global_step": 49000, "epoch": 411, "lr": 2.2670263467683632e-05} +{"train_loss": 0.0007077775080688298, "global_step": 49001, "epoch": 411, "lr": 2.2668408232782245e-05} +{"train_loss": 0.001000691088847816, "global_step": 49002, "epoch": 411, "lr": 2.2666553051543543e-05} +{"train_loss": 0.0019646151922643185, "global_step": 49003, "epoch": 411, "lr": 2.2664697923971123e-05} +{"train_loss": 0.0007507299305871129, "global_step": 49004, "epoch": 411, "lr": 2.2662842850068667e-05} +{"train_loss": 0.0006664200336672366, "global_step": 49005, "epoch": 411, "lr": 2.266098782983978e-05} +{"train_loss": 0.001147991861216724, "global_step": 49006, "epoch": 411, "lr": 2.2659132863288142e-05} +{"train_loss": 0.0007974534528329968, "global_step": 49007, "epoch": 411, "lr": 2.2657277950417355e-05} +{"train_loss": 0.0009521197061985731, "global_step": 49008, "epoch": 411, "lr": 2.26554230912311e-05} +{"train_loss": 0.0012111507821828127, "global_step": 49009, "epoch": 411, "lr": 2.265356828573298e-05} +{"train_loss": 0.000810150639154017, "global_step": 49010, "epoch": 411, "lr": 2.2651713533926677e-05} +{"train_loss": 0.0006778478855267167, "global_step": 49011, "epoch": 411, "lr": 2.2649858835815795e-05} +{"train_loss": 0.001590930507518351, "global_step": 49012, "epoch": 411, "lr": 2.2648004191404016e-05} +{"train_loss": 0.0009542275220155716, "global_step": 49013, "epoch": 411, "lr": 2.2646149600694954e-05} +{"train_loss": 0.0007755826809443533, "global_step": 49014, "epoch": 411, "lr": 2.2644295063692238e-05} +{"train_loss": 0.0005674985586665571, "global_step": 49015, "epoch": 411, "lr": 2.2642440580399543e-05} +{"train_loss": 0.0009530571987852454, "global_step": 49016, "epoch": 411, "lr": 2.2640586150820474e-05} +{"train_loss": 0.0007026963285170496, "global_step": 49017, "epoch": 411, "lr": 2.2638731774958716e-05} +{"train_loss": 0.0009091364918276668, "global_step": 49018, "epoch": 411, "lr": 2.263687745281786e-05} +{"train_loss": 0.0004979124641977251, "global_step": 49019, "epoch": 411, "lr": 2.2635023184401592e-05} +{"train_loss": 0.0006021644803695381, "global_step": 49020, "epoch": 411, "lr": 2.263316896971353e-05} +{"train_loss": 0.0016596881905570626, "global_step": 49021, "epoch": 411, "lr": 2.2631314808757303e-05} +{"train_loss": 0.0006796265370212495, "global_step": 49022, "epoch": 411, "lr": 2.262946070153658e-05} +{"train_loss": 0.000816613610368222, "global_step": 49023, "epoch": 411, "lr": 2.2627606648054974e-05} +{"train_loss": 0.0012552167754620314, "global_step": 49024, "epoch": 411, "lr": 2.262575264831615e-05} +{"train_loss": 0.0007232091156765819, "global_step": 49025, "epoch": 411, "lr": 2.262389870232372e-05} +{"train_loss": 0.0007273549563251436, "global_step": 49026, "epoch": 411, "lr": 2.262204481008136e-05} +{"train_loss": 0.0010890919356137327, "global_step": 49027, "epoch": 411, "lr": 2.2620190971592693e-05, "val_loss": 0.019437456503510475} +{"train_loss": 0.0012776494259014726, "global_step": 49028, "epoch": 412, "lr": 2.2618337186861334e-05} +{"train_loss": 0.0009745280258357525, "global_step": 49029, "epoch": 412, "lr": 2.2616483455890963e-05} +{"train_loss": 0.00040649910806678236, "global_step": 49030, "epoch": 412, "lr": 2.2614629778685182e-05} +{"train_loss": 0.0006798420217819512, "global_step": 49031, "epoch": 412, "lr": 2.2612776155247667e-05} +{"train_loss": 0.0018920816946774721, "global_step": 49032, "epoch": 412, "lr": 2.2610922585582046e-05} +{"train_loss": 0.0007986038108356297, "global_step": 49033, "epoch": 412, "lr": 2.2609069069691928e-05} +{"train_loss": 0.0012355432845652103, "global_step": 49034, "epoch": 412, "lr": 2.2607215607580996e-05} +{"train_loss": 0.0006052801618352532, "global_step": 49035, "epoch": 412, "lr": 2.2605362199252854e-05} +{"train_loss": 0.0010134333278983831, "global_step": 49036, "epoch": 412, "lr": 2.2603508844711152e-05} +{"train_loss": 0.0009028366766870022, "global_step": 49037, "epoch": 412, "lr": 2.2601655543959555e-05} +{"train_loss": 0.0006532840197905898, "global_step": 49038, "epoch": 412, "lr": 2.2599802297001666e-05} +{"train_loss": 0.0003802727733273059, "global_step": 49039, "epoch": 412, "lr": 2.2597949103841147e-05} +{"train_loss": 0.001175092300400138, "global_step": 49040, "epoch": 412, "lr": 2.2596095964481616e-05} +{"train_loss": 0.0015185985248535872, "global_step": 49041, "epoch": 412, "lr": 2.2594242878926742e-05} +{"train_loss": 0.0009503129404038191, "global_step": 49042, "epoch": 412, "lr": 2.259238984718012e-05} +{"train_loss": 0.0014323515351861715, "global_step": 49043, "epoch": 412, "lr": 2.259053686924544e-05} +{"train_loss": 0.0016263077268376946, "global_step": 49044, "epoch": 412, "lr": 2.2588683945126304e-05} +{"train_loss": 0.000763804535381496, "global_step": 49045, "epoch": 412, "lr": 2.2586831074826342e-05} +{"train_loss": 0.000918289995752275, "global_step": 49046, "epoch": 412, "lr": 2.2584978258349228e-05} +{"train_loss": 0.0007020848570391536, "global_step": 49047, "epoch": 412, "lr": 2.258312549569856e-05} +{"train_loss": 0.0011291017290204763, "global_step": 49048, "epoch": 412, "lr": 2.2581272786878016e-05} +{"train_loss": 0.0012351120822131634, "global_step": 49049, "epoch": 412, "lr": 2.2579420131891193e-05} +{"train_loss": 0.000563952955417335, "global_step": 49050, "epoch": 412, "lr": 2.2577567530741773e-05} +{"train_loss": 0.0010147042339667678, "global_step": 49051, "epoch": 412, "lr": 2.2575714983433366e-05} +{"train_loss": 0.0006829726626165211, "global_step": 49052, "epoch": 412, "lr": 2.2573862489969593e-05} +{"train_loss": 0.0005457113729789853, "global_step": 49053, "epoch": 412, "lr": 2.257201005035413e-05} +{"train_loss": 0.001165861845947802, "global_step": 49054, "epoch": 412, "lr": 2.257015766459058e-05} +{"train_loss": 0.0006458710413426161, "global_step": 49055, "epoch": 412, "lr": 2.256830533268261e-05} +{"train_loss": 0.0007799130980856717, "global_step": 49056, "epoch": 412, "lr": 2.2566453054633825e-05} +{"train_loss": 0.0008610563818365335, "global_step": 49057, "epoch": 412, "lr": 2.2564600830447897e-05} +{"train_loss": 0.0008038229425437748, "global_step": 49058, "epoch": 412, "lr": 2.2562748660128447e-05} +{"train_loss": 0.000902810599654913, "global_step": 49059, "epoch": 412, "lr": 2.2560896543679083e-05} +{"train_loss": 0.0013431697152554989, "global_step": 49060, "epoch": 412, "lr": 2.255904448110349e-05} +{"train_loss": 0.0009652922162786126, "global_step": 49061, "epoch": 412, "lr": 2.2557192472405263e-05} +{"train_loss": 0.001189711969345808, "global_step": 49062, "epoch": 412, "lr": 2.2555340517588075e-05} +{"train_loss": 0.0010475432500243187, "global_step": 49063, "epoch": 412, "lr": 2.2553488616655545e-05} +{"train_loss": 0.0006850750651210546, "global_step": 49064, "epoch": 412, "lr": 2.255163676961129e-05} +{"train_loss": 0.0014921404654160142, "global_step": 49065, "epoch": 412, "lr": 2.254978497645898e-05} +{"train_loss": 0.0008658214355818927, "global_step": 49066, "epoch": 412, "lr": 2.2547933237202217e-05} +{"train_loss": 0.0013734160456806421, "global_step": 49067, "epoch": 412, "lr": 2.254608155184467e-05} +{"train_loss": 0.0010946240508928895, "global_step": 49068, "epoch": 412, "lr": 2.2544229920389944e-05} +{"train_loss": 0.0007609677268192172, "global_step": 49069, "epoch": 412, "lr": 2.2542378342841708e-05} +{"train_loss": 0.0007589463493786752, "global_step": 49070, "epoch": 412, "lr": 2.2540526819203554e-05} +{"train_loss": 0.000700540782418102, "global_step": 49071, "epoch": 412, "lr": 2.253867534947915e-05} +{"train_loss": 0.0006484646582975984, "global_step": 49072, "epoch": 412, "lr": 2.253682393367214e-05} +{"train_loss": 0.00045082453289069235, "global_step": 49073, "epoch": 412, "lr": 2.2534972571786122e-05} +{"train_loss": 0.001952435588464141, "global_step": 49074, "epoch": 412, "lr": 2.253312126382477e-05} +{"train_loss": 0.001834510825574398, "global_step": 49075, "epoch": 412, "lr": 2.2531270009791677e-05} +{"train_loss": 0.000673124857712537, "global_step": 49076, "epoch": 412, "lr": 2.2529418809690528e-05} +{"train_loss": 0.0010519431671127677, "global_step": 49077, "epoch": 412, "lr": 2.2527567663524923e-05} +{"train_loss": 0.0008075562072917819, "global_step": 49078, "epoch": 412, "lr": 2.252571657129849e-05} +{"train_loss": 0.0006187792751006782, "global_step": 49079, "epoch": 412, "lr": 2.2523865533014893e-05} +{"train_loss": 0.0008565144380554557, "global_step": 49080, "epoch": 412, "lr": 2.2522014548677732e-05} +{"train_loss": 0.0008264844072982669, "global_step": 49081, "epoch": 412, "lr": 2.252016361829068e-05} +{"train_loss": 0.0007165346760302782, "global_step": 49082, "epoch": 412, "lr": 2.251831274185735e-05} +{"train_loss": 0.0011207275092601776, "global_step": 49083, "epoch": 412, "lr": 2.251646191938136e-05} +{"train_loss": 0.0011122089345008135, "global_step": 49084, "epoch": 412, "lr": 2.2514611150866376e-05} +{"train_loss": 0.000727277307305485, "global_step": 49085, "epoch": 412, "lr": 2.2512760436316005e-05} +{"train_loss": 0.0011490234173834324, "global_step": 49086, "epoch": 412, "lr": 2.2510909775733908e-05} +{"train_loss": 0.0005747355753555894, "global_step": 49087, "epoch": 412, "lr": 2.250905916912368e-05} +{"train_loss": 0.0009042990859597921, "global_step": 49088, "epoch": 412, "lr": 2.2507208616489e-05} +{"train_loss": 0.0010575703345239162, "global_step": 49089, "epoch": 412, "lr": 2.2505358117833475e-05} +{"train_loss": 0.0010373461991548538, "global_step": 49090, "epoch": 412, "lr": 2.2503507673160724e-05} +{"train_loss": 0.0011879528174176812, "global_step": 49091, "epoch": 412, "lr": 2.250165728247442e-05} +{"train_loss": 0.0007549001602455974, "global_step": 49092, "epoch": 412, "lr": 2.249980694577815e-05} +{"train_loss": 0.0004328879003878683, "global_step": 49093, "epoch": 412, "lr": 2.24979566630756e-05} +{"train_loss": 0.0007715618121437728, "global_step": 49094, "epoch": 412, "lr": 2.2496106434370367e-05} +{"train_loss": 0.0006415386451408267, "global_step": 49095, "epoch": 412, "lr": 2.249425625966607e-05} +{"train_loss": 0.0005666887736879289, "global_step": 49096, "epoch": 412, "lr": 2.249240613896638e-05} +{"train_loss": 0.0018818035023286939, "global_step": 49097, "epoch": 412, "lr": 2.24905560722749e-05} +{"train_loss": 0.0009651887812651694, "global_step": 49098, "epoch": 412, "lr": 2.2488706059595287e-05} +{"train_loss": 0.0004043404187541455, "global_step": 49099, "epoch": 412, "lr": 2.2486856100931148e-05} +{"train_loss": 0.0009506577625870705, "global_step": 49100, "epoch": 412, "lr": 2.248500619628614e-05} +{"train_loss": 0.0007088318816386163, "global_step": 49101, "epoch": 412, "lr": 2.248315634566387e-05} +{"train_loss": 0.0008556748507544398, "global_step": 49102, "epoch": 412, "lr": 2.2481306549067997e-05} +{"train_loss": 0.0013781243469566107, "global_step": 49103, "epoch": 412, "lr": 2.247945680650212e-05} +{"train_loss": 0.0007377646979875863, "global_step": 49104, "epoch": 412, "lr": 2.2477607117969913e-05} +{"train_loss": 0.0010877640452235937, "global_step": 49105, "epoch": 412, "lr": 2.2475757483474956e-05} +{"train_loss": 0.0010944200912490487, "global_step": 49106, "epoch": 412, "lr": 2.2473907903020918e-05} +{"train_loss": 0.0009912305977195501, "global_step": 49107, "epoch": 412, "lr": 2.2472058376611438e-05} +{"train_loss": 0.0006511799292638898, "global_step": 49108, "epoch": 412, "lr": 2.2470208904250127e-05} +{"train_loss": 0.000986855593509972, "global_step": 49109, "epoch": 412, "lr": 2.2468359485940604e-05} +{"train_loss": 0.0009282520622946322, "global_step": 49110, "epoch": 412, "lr": 2.246651012168653e-05} +{"train_loss": 0.0008772885194048285, "global_step": 49111, "epoch": 412, "lr": 2.2464660811491505e-05} +{"train_loss": 0.000537471380084753, "global_step": 49112, "epoch": 412, "lr": 2.2462811555359196e-05} +{"train_loss": 0.0005906703299842775, "global_step": 49113, "epoch": 412, "lr": 2.2460962353293217e-05} +{"train_loss": 0.0009800315601751208, "global_step": 49114, "epoch": 412, "lr": 2.2459113205297177e-05} +{"train_loss": 0.0009424814488738775, "global_step": 49115, "epoch": 412, "lr": 2.2457264111374744e-05} +{"train_loss": 0.001077192253433168, "global_step": 49116, "epoch": 412, "lr": 2.2455415071529513e-05} +{"train_loss": 0.0010156750213354826, "global_step": 49117, "epoch": 412, "lr": 2.2453566085765147e-05} +{"train_loss": 0.0008206017664633691, "global_step": 49118, "epoch": 412, "lr": 2.2451717154085244e-05} +{"train_loss": 0.0007198493112809956, "global_step": 49119, "epoch": 412, "lr": 2.2449868276493468e-05} +{"train_loss": 0.0007850563270039856, "global_step": 49120, "epoch": 412, "lr": 2.2448019452993435e-05} +{"train_loss": 0.0011270480463281274, "global_step": 49121, "epoch": 412, "lr": 2.244617068358875e-05} +{"train_loss": 0.0013410442043095827, "global_step": 49122, "epoch": 412, "lr": 2.244432196828309e-05} +{"train_loss": 0.0008062129491008818, "global_step": 49123, "epoch": 412, "lr": 2.2442473307080042e-05} +{"train_loss": 0.0006064933841116726, "global_step": 49124, "epoch": 412, "lr": 2.2440624699983266e-05} +{"train_loss": 0.0007036091992631555, "global_step": 49125, "epoch": 412, "lr": 2.2438776146996365e-05} +{"train_loss": 0.0007339725852943957, "global_step": 49126, "epoch": 412, "lr": 2.2436927648122997e-05} +{"train_loss": 0.0005246557993814349, "global_step": 49127, "epoch": 412, "lr": 2.2435079203366777e-05} +{"train_loss": 0.0007270794594660401, "global_step": 49128, "epoch": 412, "lr": 2.243323081273132e-05} +{"train_loss": 0.0008047098526731133, "global_step": 49129, "epoch": 412, "lr": 2.2431382476220287e-05} +{"train_loss": 0.0011578126577660441, "global_step": 49130, "epoch": 412, "lr": 2.2429534193837265e-05} +{"train_loss": 0.0005780308274552226, "global_step": 49131, "epoch": 412, "lr": 2.2427685965585933e-05} +{"train_loss": 0.0010905629023909569, "global_step": 49132, "epoch": 412, "lr": 2.242583779146989e-05} +{"train_loss": 0.00139840436168015, "global_step": 49133, "epoch": 412, "lr": 2.2423989671492752e-05} +{"train_loss": 0.0006514946580864489, "global_step": 49134, "epoch": 412, "lr": 2.2422141605658158e-05} +{"train_loss": 0.0007620810647495091, "global_step": 49135, "epoch": 412, "lr": 2.2420293593969766e-05} +{"train_loss": 0.00036762974923476577, "global_step": 49136, "epoch": 412, "lr": 2.2418445636431163e-05} +{"train_loss": 0.0008107683388516307, "global_step": 49137, "epoch": 412, "lr": 2.2416597733046012e-05} +{"train_loss": 0.0011743073118850589, "global_step": 49138, "epoch": 412, "lr": 2.241474988381791e-05} +{"train_loss": 0.0006016495754010975, "global_step": 49139, "epoch": 412, "lr": 2.2412902088750515e-05} +{"train_loss": 0.00092626380501315, "global_step": 49140, "epoch": 412, "lr": 2.2411054347847423e-05} +{"train_loss": 0.0006561611080542207, "global_step": 49141, "epoch": 412, "lr": 2.2409206661112297e-05} +{"train_loss": 0.0007523095118813217, "global_step": 49142, "epoch": 412, "lr": 2.2407359028548723e-05} +{"train_loss": 0.001012385473586619, "global_step": 49143, "epoch": 412, "lr": 2.2405511450160377e-05} +{"train_loss": 0.0006877265986986458, "global_step": 49144, "epoch": 412, "lr": 2.2403663925950837e-05} +{"train_loss": 0.0014286184450611472, "global_step": 49145, "epoch": 412, "lr": 2.2401816455923775e-05} +{"train_loss": 0.0009180448077200371, "global_step": 49146, "epoch": 412, "lr": 2.2399969040082796e-05, "val_loss": 0.03173544630408287} +{"train_loss": 0.0007228804170154035, "global_step": 49147, "epoch": 413, "lr": 2.2398121678431516e-05} +{"train_loss": 0.0007854936993680894, "global_step": 49148, "epoch": 413, "lr": 2.239627437097359e-05} +{"train_loss": 0.0009515078854747117, "global_step": 49149, "epoch": 413, "lr": 2.2394427117712613e-05} +{"train_loss": 0.0004332686075940728, "global_step": 49150, "epoch": 413, "lr": 2.2392579918652245e-05} +{"train_loss": 0.0009645593818277121, "global_step": 49151, "epoch": 413, "lr": 2.2390732773796097e-05} +{"train_loss": 0.0007799466256983578, "global_step": 49152, "epoch": 413, "lr": 2.238888568314778e-05} +{"train_loss": 0.000645425810944289, "global_step": 49153, "epoch": 413, "lr": 2.2387038646710954e-05} +{"train_loss": 0.0010067140683531761, "global_step": 49154, "epoch": 413, "lr": 2.2385191664489208e-05} +{"train_loss": 0.0011078168172389269, "global_step": 49155, "epoch": 413, "lr": 2.2383344736486206e-05} +{"train_loss": 0.0005879612872377038, "global_step": 49156, "epoch": 413, "lr": 2.238149786270554e-05} +{"train_loss": 0.0007610521861352026, "global_step": 49157, "epoch": 413, "lr": 2.2379651043150868e-05} +{"train_loss": 0.001164724351838231, "global_step": 49158, "epoch": 413, "lr": 2.2377804277825803e-05} +{"train_loss": 0.0024394707288593054, "global_step": 49159, "epoch": 413, "lr": 2.2375957566733953e-05} +{"train_loss": 0.0011576386168599129, "global_step": 49160, "epoch": 413, "lr": 2.237411090987897e-05} +{"train_loss": 0.0005650336970575154, "global_step": 49161, "epoch": 413, "lr": 2.237226430726445e-05} +{"train_loss": 0.0009023395832628012, "global_step": 49162, "epoch": 413, "lr": 2.2370417758894065e-05} +{"train_loss": 0.0012307623401284218, "global_step": 49163, "epoch": 413, "lr": 2.2368571264771405e-05} +{"train_loss": 0.0006832216749899089, "global_step": 49164, "epoch": 413, "lr": 2.2366724824900088e-05} +{"train_loss": 0.0008997159311547875, "global_step": 49165, "epoch": 413, "lr": 2.236487843928377e-05} +{"train_loss": 0.001097154337912798, "global_step": 49166, "epoch": 413, "lr": 2.2363032107926045e-05} +{"train_loss": 0.0008339174673892558, "global_step": 49167, "epoch": 413, "lr": 2.2361185830830573e-05} +{"train_loss": 0.0009965975768864155, "global_step": 49168, "epoch": 413, "lr": 2.235933960800094e-05} +{"train_loss": 0.0011952024651691318, "global_step": 49169, "epoch": 413, "lr": 2.2357493439440796e-05} +{"train_loss": 0.0008700262405909598, "global_step": 49170, "epoch": 413, "lr": 2.235564732515377e-05} +{"train_loss": 0.0007135117193683982, "global_step": 49171, "epoch": 413, "lr": 2.2353801265143466e-05} +{"train_loss": 0.0009607698884792626, "global_step": 49172, "epoch": 413, "lr": 2.2351955259413533e-05} +{"train_loss": 0.001366621465422213, "global_step": 49173, "epoch": 413, "lr": 2.2350109307967565e-05} +{"train_loss": 0.0005982471047900617, "global_step": 49174, "epoch": 413, "lr": 2.2348263410809224e-05} +{"train_loss": 0.0005863153492100537, "global_step": 49175, "epoch": 413, "lr": 2.2346417567942096e-05} +{"train_loss": 0.0011164448224008083, "global_step": 49176, "epoch": 413, "lr": 2.2344571779369838e-05} +{"train_loss": 0.000595410238020122, "global_step": 49177, "epoch": 413, "lr": 2.2342726045096058e-05} +{"train_loss": 0.0009344082209281623, "global_step": 49178, "epoch": 413, "lr": 2.2340880365124367e-05} +{"train_loss": 0.0014732970157638192, "global_step": 49179, "epoch": 413, "lr": 2.2339034739458415e-05} +{"train_loss": 0.0006617492763325572, "global_step": 49180, "epoch": 413, "lr": 2.2337189168101796e-05} +{"train_loss": 0.0006956100696697831, "global_step": 49181, "epoch": 413, "lr": 2.233534365105817e-05} +{"train_loss": 0.0005877296207472682, "global_step": 49182, "epoch": 413, "lr": 2.2333498188331142e-05} +{"train_loss": 0.0011373147135600448, "global_step": 49183, "epoch": 413, "lr": 2.2331652779924316e-05} +{"train_loss": 0.0009582660277374089, "global_step": 49184, "epoch": 413, "lr": 2.2329807425841352e-05} +{"train_loss": 0.0008779552881605923, "global_step": 49185, "epoch": 413, "lr": 2.2327962126085838e-05} +{"train_loss": 0.0005532747018150985, "global_step": 49186, "epoch": 413, "lr": 2.2326116880661436e-05} +{"train_loss": 0.0008790323045104742, "global_step": 49187, "epoch": 413, "lr": 2.2324271689571718e-05} +{"train_loss": 0.0018229493871331215, "global_step": 49188, "epoch": 413, "lr": 2.2322426552820362e-05} +{"train_loss": 0.0005314563750289381, "global_step": 49189, "epoch": 413, "lr": 2.232058147041096e-05} +{"train_loss": 0.00039724077214486897, "global_step": 49190, "epoch": 413, "lr": 2.2318736442347126e-05} +{"train_loss": 0.0007559768273495138, "global_step": 49191, "epoch": 413, "lr": 2.2316891468632513e-05} +{"train_loss": 0.0006763646961189806, "global_step": 49192, "epoch": 413, "lr": 2.2315046549270707e-05} +{"train_loss": 0.0015429664636030793, "global_step": 49193, "epoch": 413, "lr": 2.2313201684265366e-05} +{"train_loss": 0.0016916062450036407, "global_step": 49194, "epoch": 413, "lr": 2.2311356873620076e-05} +{"train_loss": 0.0011496326187625527, "global_step": 49195, "epoch": 413, "lr": 2.2309512117338505e-05} +{"train_loss": 0.0010082665830850601, "global_step": 49196, "epoch": 413, "lr": 2.230766741542424e-05} +{"train_loss": 0.0008853877661749721, "global_step": 49197, "epoch": 413, "lr": 2.2305822767880896e-05} +{"train_loss": 0.0010967039270326495, "global_step": 49198, "epoch": 413, "lr": 2.230397817471213e-05} +{"train_loss": 0.0007971450104378164, "global_step": 49199, "epoch": 413, "lr": 2.2302133635921523e-05} +{"train_loss": 0.0007984457770362496, "global_step": 49200, "epoch": 413, "lr": 2.2300289151512738e-05} +{"train_loss": 0.0019895886071026325, "global_step": 49201, "epoch": 413, "lr": 2.229844472148936e-05} +{"train_loss": 0.0005961357383057475, "global_step": 49202, "epoch": 413, "lr": 2.229660034585504e-05} +{"train_loss": 0.0009666403639130294, "global_step": 49203, "epoch": 413, "lr": 2.2294756024613366e-05} +{"train_loss": 0.0006413862574845552, "global_step": 49204, "epoch": 413, "lr": 2.2292911757767982e-05} +{"train_loss": 0.0007766283233650029, "global_step": 49205, "epoch": 413, "lr": 2.2291067545322526e-05} +{"train_loss": 0.001093048951588571, "global_step": 49206, "epoch": 413, "lr": 2.2289223387280576e-05} +{"train_loss": 0.0012478588614612818, "global_step": 49207, "epoch": 413, "lr": 2.2287379283645793e-05} +{"train_loss": 0.0018888188060373068, "global_step": 49208, "epoch": 413, "lr": 2.2285535234421783e-05} +{"train_loss": 0.0014713505515828729, "global_step": 49209, "epoch": 413, "lr": 2.2283691239612146e-05} +{"train_loss": 0.0010952986776828766, "global_step": 49210, "epoch": 413, "lr": 2.2281847299220537e-05} +{"train_loss": 0.001397608662955463, "global_step": 49211, "epoch": 413, "lr": 2.2280003413250544e-05} +{"train_loss": 0.0016953985905274749, "global_step": 49212, "epoch": 413, "lr": 2.227815958170582e-05} +{"train_loss": 0.0015806978335604072, "global_step": 49213, "epoch": 413, "lr": 2.2276315804589966e-05} +{"train_loss": 0.001399433589540422, "global_step": 49214, "epoch": 413, "lr": 2.227447208190659e-05} +{"train_loss": 0.0012054736725986004, "global_step": 49215, "epoch": 413, "lr": 2.2272628413659335e-05} +{"train_loss": 0.000945286825299263, "global_step": 49216, "epoch": 413, "lr": 2.2270784799851802e-05} +{"train_loss": 0.0007686310564167798, "global_step": 49217, "epoch": 413, "lr": 2.226894124048764e-05} +{"train_loss": 0.0011698686284944415, "global_step": 49218, "epoch": 413, "lr": 2.2267097735570426e-05} +{"train_loss": 0.0009995285654440522, "global_step": 49219, "epoch": 413, "lr": 2.2265254285103822e-05} +{"train_loss": 0.0012269795406609774, "global_step": 49220, "epoch": 413, "lr": 2.2263410889091428e-05} +{"train_loss": 0.0010981080122292042, "global_step": 49221, "epoch": 413, "lr": 2.2261567547536842e-05} +{"train_loss": 0.0017383844824507833, "global_step": 49222, "epoch": 413, "lr": 2.225972426044373e-05} +{"train_loss": 0.001773205236531794, "global_step": 49223, "epoch": 413, "lr": 2.2257881027815665e-05} +{"train_loss": 0.0010954394238069654, "global_step": 49224, "epoch": 413, "lr": 2.2256037849656303e-05} +{"train_loss": 0.001395367900840938, "global_step": 49225, "epoch": 413, "lr": 2.225419472596923e-05} +{"train_loss": 0.0022213254123926163, "global_step": 49226, "epoch": 413, "lr": 2.2252351656758102e-05} +{"train_loss": 0.0011113905347883701, "global_step": 49227, "epoch": 413, "lr": 2.2250508642026513e-05} +{"train_loss": 0.0008532305364497006, "global_step": 49228, "epoch": 413, "lr": 2.224866568177807e-05} +{"train_loss": 0.0010380697203800082, "global_step": 49229, "epoch": 413, "lr": 2.2246822776016423e-05} +{"train_loss": 0.0008533618529327214, "global_step": 49230, "epoch": 413, "lr": 2.2244979924745165e-05} +{"train_loss": 0.0014453165931627154, "global_step": 49231, "epoch": 413, "lr": 2.2243137127967934e-05} +{"train_loss": 0.0008123992593027651, "global_step": 49232, "epoch": 413, "lr": 2.2241294385688314e-05} +{"train_loss": 0.0008006798452697694, "global_step": 49233, "epoch": 413, "lr": 2.2239451697909973e-05} +{"train_loss": 0.002379022538661957, "global_step": 49234, "epoch": 413, "lr": 2.2237609064636484e-05} +{"train_loss": 0.0008043841226026416, "global_step": 49235, "epoch": 413, "lr": 2.22357664858715e-05} +{"train_loss": 0.0010003144852817059, "global_step": 49236, "epoch": 413, "lr": 2.223392396161861e-05} +{"train_loss": 0.0007054102024994791, "global_step": 49237, "epoch": 413, "lr": 2.2232081491881456e-05} +{"train_loss": 0.000942897517234087, "global_step": 49238, "epoch": 413, "lr": 2.2230239076663623e-05} +{"train_loss": 0.0009254214819520712, "global_step": 49239, "epoch": 413, "lr": 2.2228396715968776e-05} +{"train_loss": 0.0009581777267158031, "global_step": 49240, "epoch": 413, "lr": 2.2226554409800475e-05} +{"train_loss": 0.0013862851774320006, "global_step": 49241, "epoch": 413, "lr": 2.2224712158162397e-05} +{"train_loss": 0.0017714325804263353, "global_step": 49242, "epoch": 413, "lr": 2.2222869961058106e-05} +{"train_loss": 0.0008775522001087666, "global_step": 49243, "epoch": 413, "lr": 2.2221027818491257e-05} +{"train_loss": 0.002291859593242407, "global_step": 49244, "epoch": 413, "lr": 2.2219185730465443e-05} +{"train_loss": 0.000986883882433176, "global_step": 49245, "epoch": 413, "lr": 2.22173436969843e-05} +{"train_loss": 0.0008608114439994097, "global_step": 49246, "epoch": 413, "lr": 2.2215501718051436e-05} +{"train_loss": 0.0007267860928550363, "global_step": 49247, "epoch": 413, "lr": 2.221365979367045e-05} +{"train_loss": 0.0005768173723481596, "global_step": 49248, "epoch": 413, "lr": 2.221181792384499e-05} +{"train_loss": 0.00090557592920959, "global_step": 49249, "epoch": 413, "lr": 2.220997610857864e-05} +{"train_loss": 0.0004339040315244347, "global_step": 49250, "epoch": 413, "lr": 2.2208134347875054e-05} +{"train_loss": 0.0012458947021514177, "global_step": 49251, "epoch": 413, "lr": 2.2206292641737825e-05} +{"train_loss": 0.0013835302088409662, "global_step": 49252, "epoch": 413, "lr": 2.220445099017055e-05} +{"train_loss": 0.0006577790481969714, "global_step": 49253, "epoch": 413, "lr": 2.2202609393176886e-05} +{"train_loss": 0.0014959723921492696, "global_step": 49254, "epoch": 413, "lr": 2.2200767850760413e-05} +{"train_loss": 0.000898077036254108, "global_step": 49255, "epoch": 413, "lr": 2.2198926362924778e-05} +{"train_loss": 0.001099246321246028, "global_step": 49256, "epoch": 413, "lr": 2.2197084929673562e-05} +{"train_loss": 0.0013140789233148098, "global_step": 49257, "epoch": 413, "lr": 2.219524355101042e-05} +{"train_loss": 0.0006894484395161271, "global_step": 49258, "epoch": 413, "lr": 2.2193402226938946e-05} +{"train_loss": 0.0010621848050504923, "global_step": 49259, "epoch": 413, "lr": 2.2191560957462737e-05} +{"train_loss": 0.0009540270548313856, "global_step": 49260, "epoch": 413, "lr": 2.2189719742585447e-05} +{"train_loss": 0.001539427088573575, "global_step": 49261, "epoch": 413, "lr": 2.218787858231065e-05} +{"train_loss": 0.0012380587868392467, "global_step": 49262, "epoch": 413, "lr": 2.2186037476642003e-05} +{"train_loss": 0.0011188037460669875, "global_step": 49263, "epoch": 413, "lr": 2.218419642558308e-05} +{"train_loss": 0.0006046305643394589, "global_step": 49264, "epoch": 413, "lr": 2.2182355429137537e-05} +{"train_loss": 0.0010554676400027982, "global_step": 49265, "epoch": 413, "lr": 2.218051448730896e-05, "val_loss": 0.020293913781642914} +{"train_loss": 0.0014180843718349934, "global_step": 49266, "epoch": 414, "lr": 2.2178673600100964e-05} +{"train_loss": 0.0004212948842905462, "global_step": 49267, "epoch": 414, "lr": 2.2176832767517165e-05} +{"train_loss": 0.0014549982734024525, "global_step": 49268, "epoch": 414, "lr": 2.2174991989561195e-05} +{"train_loss": 0.0006426044274121523, "global_step": 49269, "epoch": 414, "lr": 2.217315126623664e-05} +{"train_loss": 0.0019024352077394724, "global_step": 49270, "epoch": 414, "lr": 2.217131059754715e-05} +{"train_loss": 0.0012958415318280458, "global_step": 49271, "epoch": 414, "lr": 2.2169469983496305e-05} +{"train_loss": 0.0009547554072923958, "global_step": 49272, "epoch": 414, "lr": 2.2167629424087743e-05} +{"train_loss": 0.0012874004896730185, "global_step": 49273, "epoch": 414, "lr": 2.2165788919325052e-05} +{"train_loss": 0.0012672810116782784, "global_step": 49274, "epoch": 414, "lr": 2.2163948469211876e-05} +{"train_loss": 0.0009557168232277036, "global_step": 49275, "epoch": 414, "lr": 2.2162108073751797e-05} +{"train_loss": 0.0008304341463372111, "global_step": 49276, "epoch": 414, "lr": 2.2160267732948463e-05} +{"train_loss": 0.0010673294309526682, "global_step": 49277, "epoch": 414, "lr": 2.2158427446805473e-05} +{"train_loss": 0.0009113285923376679, "global_step": 49278, "epoch": 414, "lr": 2.2156587215326412e-05} +{"train_loss": 0.0019758245907723904, "global_step": 49279, "epoch": 414, "lr": 2.215474703851494e-05} +{"train_loss": 0.0006947586662136018, "global_step": 49280, "epoch": 414, "lr": 2.2152906916374628e-05} +{"train_loss": 0.0005596132832579315, "global_step": 49281, "epoch": 414, "lr": 2.2151066848909124e-05} +{"train_loss": 0.0015226674731820822, "global_step": 49282, "epoch": 414, "lr": 2.2149226836122027e-05} +{"train_loss": 0.0007211622432805598, "global_step": 49283, "epoch": 414, "lr": 2.2147386878016934e-05} +{"train_loss": 0.0010786037892103195, "global_step": 49284, "epoch": 414, "lr": 2.214554697459748e-05} +{"train_loss": 0.0005883377161808312, "global_step": 49285, "epoch": 414, "lr": 2.2143707125867258e-05} +{"train_loss": 0.0006245259428396821, "global_step": 49286, "epoch": 414, "lr": 2.2141867331829906e-05} +{"train_loss": 0.0008832355961203575, "global_step": 49287, "epoch": 414, "lr": 2.2140027592489005e-05} +{"train_loss": 0.000909275549929589, "global_step": 49288, "epoch": 414, "lr": 2.21381879078482e-05} +{"train_loss": 0.001079465844668448, "global_step": 49289, "epoch": 414, "lr": 2.213634827791109e-05} +{"train_loss": 0.0011827056296169758, "global_step": 49290, "epoch": 414, "lr": 2.2134508702681262e-05} +{"train_loss": 0.0006759489770047367, "global_step": 49291, "epoch": 414, "lr": 2.2132669182162364e-05} +{"train_loss": 0.0009195655584335327, "global_step": 49292, "epoch": 414, "lr": 2.213082971635798e-05} +{"train_loss": 0.0011427849531173706, "global_step": 49293, "epoch": 414, "lr": 2.2128990305271752e-05} +{"train_loss": 0.00046999950427562, "global_step": 49294, "epoch": 414, "lr": 2.2127150948907254e-05} +{"train_loss": 0.0011578958947211504, "global_step": 49295, "epoch": 414, "lr": 2.212531164726813e-05} +{"train_loss": 0.0015781287802383304, "global_step": 49296, "epoch": 414, "lr": 2.2123472400357992e-05} +{"train_loss": 0.0012773022754117846, "global_step": 49297, "epoch": 414, "lr": 2.212163320818041e-05} +{"train_loss": 0.00043367178295738995, "global_step": 49298, "epoch": 414, "lr": 2.2119794070739043e-05} +{"train_loss": 0.0022725295275449753, "global_step": 49299, "epoch": 414, "lr": 2.2117954988037466e-05} +{"train_loss": 0.000805486342869699, "global_step": 49300, "epoch": 414, "lr": 2.211611596007932e-05} +{"train_loss": 0.0015737202484160662, "global_step": 49301, "epoch": 414, "lr": 2.2114276986868184e-05} +{"train_loss": 0.0006262611714191735, "global_step": 49302, "epoch": 414, "lr": 2.2112438068407688e-05} +{"train_loss": 0.0014551411150023341, "global_step": 49303, "epoch": 414, "lr": 2.2110599204701455e-05} +{"train_loss": 0.0005718858446925879, "global_step": 49304, "epoch": 414, "lr": 2.2108760395753063e-05} +{"train_loss": 0.0013618377270177007, "global_step": 49305, "epoch": 414, "lr": 2.2106921641566164e-05} +{"train_loss": 0.0013460804475471377, "global_step": 49306, "epoch": 414, "lr": 2.2105082942144322e-05} +{"train_loss": 0.000543701637070626, "global_step": 49307, "epoch": 414, "lr": 2.2103244297491187e-05} +{"train_loss": 0.0006272789323702455, "global_step": 49308, "epoch": 414, "lr": 2.2101405707610357e-05} +{"train_loss": 0.0014114551013335586, "global_step": 49309, "epoch": 414, "lr": 2.2099567172505413e-05} +{"train_loss": 0.0010318222921341658, "global_step": 49310, "epoch": 414, "lr": 2.209772869218001e-05} +{"train_loss": 0.0012077197898179293, "global_step": 49311, "epoch": 414, "lr": 2.2095890266637714e-05} +{"train_loss": 0.0012383176945149899, "global_step": 49312, "epoch": 414, "lr": 2.2094051895882173e-05} +{"train_loss": 0.0006539632449857891, "global_step": 49313, "epoch": 414, "lr": 2.2092213579916964e-05} +{"train_loss": 0.0011547848116606474, "global_step": 49314, "epoch": 414, "lr": 2.209037531874573e-05} +{"train_loss": 0.000804168579634279, "global_step": 49315, "epoch": 414, "lr": 2.2088537112372065e-05} +{"train_loss": 0.0005976575776003301, "global_step": 49316, "epoch": 414, "lr": 2.2086698960799556e-05} +{"train_loss": 0.000774455489590764, "global_step": 49317, "epoch": 414, "lr": 2.2084860864031848e-05} +{"train_loss": 0.0010996285127475858, "global_step": 49318, "epoch": 414, "lr": 2.2083022822072518e-05} +{"train_loss": 0.0006400784477591515, "global_step": 49319, "epoch": 414, "lr": 2.2081184834925205e-05} +{"train_loss": 0.0006791019695810974, "global_step": 49320, "epoch": 414, "lr": 2.2079346902593507e-05} +{"train_loss": 0.0008590755169279873, "global_step": 49321, "epoch": 414, "lr": 2.2077509025081006e-05} +{"train_loss": 0.0009586343076080084, "global_step": 49322, "epoch": 414, "lr": 2.207567120239135e-05} +{"train_loss": 0.0009841760620474815, "global_step": 49323, "epoch": 414, "lr": 2.2073833434528118e-05} +{"train_loss": 0.0008562662405893207, "global_step": 49324, "epoch": 414, "lr": 2.2071995721494944e-05} +{"train_loss": 0.0006684325053356588, "global_step": 49325, "epoch": 414, "lr": 2.207015806329541e-05} +{"train_loss": 0.001088937046006322, "global_step": 49326, "epoch": 414, "lr": 2.206832045993315e-05} +{"train_loss": 0.0007980733644217253, "global_step": 49327, "epoch": 414, "lr": 2.2066482911411758e-05} +{"train_loss": 0.0007486572139896452, "global_step": 49328, "epoch": 414, "lr": 2.2064645417734825e-05} +{"train_loss": 0.0015570748364552855, "global_step": 49329, "epoch": 414, "lr": 2.2062807978905996e-05} +{"train_loss": 0.0007324308389797807, "global_step": 49330, "epoch": 414, "lr": 2.2060970594928843e-05} +{"train_loss": 0.0007665802258998156, "global_step": 49331, "epoch": 414, "lr": 2.2059133265807003e-05} +{"train_loss": 0.0016792917158454657, "global_step": 49332, "epoch": 414, "lr": 2.2057295991544052e-05} +{"train_loss": 0.0007421955233439803, "global_step": 49333, "epoch": 414, "lr": 2.2055458772143638e-05} +{"train_loss": 0.0010323491878807545, "global_step": 49334, "epoch": 414, "lr": 2.2053621607609326e-05} +{"train_loss": 0.0014350154669955373, "global_step": 49335, "epoch": 414, "lr": 2.2051784497944755e-05} +{"train_loss": 0.000495361047796905, "global_step": 49336, "epoch": 414, "lr": 2.204994744315351e-05} +{"train_loss": 0.0009963297052308917, "global_step": 49337, "epoch": 414, "lr": 2.20481104432392e-05} +{"train_loss": 0.0005392660386860371, "global_step": 49338, "epoch": 414, "lr": 2.2046273498205456e-05} +{"train_loss": 0.0014942358247935772, "global_step": 49339, "epoch": 414, "lr": 2.2044436608055873e-05} +{"train_loss": 0.0011403950629755855, "global_step": 49340, "epoch": 414, "lr": 2.204259977279403e-05} +{"train_loss": 0.000828488206025213, "global_step": 49341, "epoch": 414, "lr": 2.2040762992423574e-05} +{"train_loss": 0.0010168281150981784, "global_step": 49342, "epoch": 414, "lr": 2.203892626694808e-05} +{"train_loss": 0.00053870101692155, "global_step": 49343, "epoch": 414, "lr": 2.203708959637118e-05} +{"train_loss": 0.0007095237378962338, "global_step": 49344, "epoch": 414, "lr": 2.2035252980696448e-05} +{"train_loss": 0.0010001298505812883, "global_step": 49345, "epoch": 414, "lr": 2.2033416419927533e-05} +{"train_loss": 0.0008076228550635278, "global_step": 49346, "epoch": 414, "lr": 2.2031579914068012e-05} +{"train_loss": 0.0006022014422342181, "global_step": 49347, "epoch": 414, "lr": 2.2029743463121476e-05} +{"train_loss": 0.0009822878055274487, "global_step": 49348, "epoch": 414, "lr": 2.2027907067091574e-05} +{"train_loss": 0.0006755624781362712, "global_step": 49349, "epoch": 414, "lr": 2.2026070725981867e-05} +{"train_loss": 0.0007263661245815456, "global_step": 49350, "epoch": 414, "lr": 2.2024234439795998e-05} +{"train_loss": 0.0008687176741659641, "global_step": 49351, "epoch": 414, "lr": 2.2022398208537566e-05} +{"train_loss": 0.001022364478558302, "global_step": 49352, "epoch": 414, "lr": 2.2020562032210135e-05} +{"train_loss": 0.0009137961897067726, "global_step": 49353, "epoch": 414, "lr": 2.2018725910817366e-05} +{"train_loss": 0.0007626915466971695, "global_step": 49354, "epoch": 414, "lr": 2.201688984436282e-05} +{"train_loss": 0.000677314237691462, "global_step": 49355, "epoch": 414, "lr": 2.201505383285014e-05} +{"train_loss": 0.0005625946796499193, "global_step": 49356, "epoch": 414, "lr": 2.2013217876282893e-05} +{"train_loss": 0.0006921397289261222, "global_step": 49357, "epoch": 414, "lr": 2.2011381974664724e-05} +{"train_loss": 0.001082852017134428, "global_step": 49358, "epoch": 414, "lr": 2.200954612799921e-05} +{"train_loss": 0.0005940904375165701, "global_step": 49359, "epoch": 414, "lr": 2.200771033628995e-05} +{"train_loss": 0.0008712399867363274, "global_step": 49360, "epoch": 414, "lr": 2.2005874599540577e-05} +{"train_loss": 0.0007179456879384816, "global_step": 49361, "epoch": 414, "lr": 2.2004038917754654e-05} +{"train_loss": 0.0018059748690575361, "global_step": 49362, "epoch": 414, "lr": 2.2002203290935837e-05} +{"train_loss": 0.001138209248892963, "global_step": 49363, "epoch": 414, "lr": 2.200036771908768e-05} +{"train_loss": 0.0013011576374992728, "global_step": 49364, "epoch": 414, "lr": 2.199853220221383e-05} +{"train_loss": 0.00114549754653126, "global_step": 49365, "epoch": 414, "lr": 2.1996696740317846e-05} +{"train_loss": 0.0006097507430240512, "global_step": 49366, "epoch": 414, "lr": 2.199486133340338e-05} +{"train_loss": 0.0019453219138085842, "global_step": 49367, "epoch": 414, "lr": 2.1993025981473992e-05} +{"train_loss": 0.0007647521561011672, "global_step": 49368, "epoch": 414, "lr": 2.1991190684533325e-05} +{"train_loss": 0.0005036514485254884, "global_step": 49369, "epoch": 414, "lr": 2.198935544258494e-05} +{"train_loss": 0.0006682387320324779, "global_step": 49370, "epoch": 414, "lr": 2.1987520255632487e-05} +{"train_loss": 0.002186670433729887, "global_step": 49371, "epoch": 414, "lr": 2.1985685123679527e-05} +{"train_loss": 0.0008036231156438589, "global_step": 49372, "epoch": 414, "lr": 2.1983850046729698e-05} +{"train_loss": 0.0007805601926520467, "global_step": 49373, "epoch": 414, "lr": 2.1982015024786568e-05} +{"train_loss": 0.0004744384787045419, "global_step": 49374, "epoch": 414, "lr": 2.198018005785378e-05} +{"train_loss": 0.0009597738389857113, "global_step": 49375, "epoch": 414, "lr": 2.1978345145934885e-05} +{"train_loss": 0.0006416453397832811, "global_step": 49376, "epoch": 414, "lr": 2.1976510289033547e-05} +{"train_loss": 0.0005432524485513568, "global_step": 49377, "epoch": 414, "lr": 2.197467548715333e-05} +{"train_loss": 0.0008685553329996765, "global_step": 49378, "epoch": 414, "lr": 2.1972840740297828e-05} +{"train_loss": 0.0008873823098838329, "global_step": 49379, "epoch": 414, "lr": 2.1971006048470678e-05} +{"train_loss": 0.0009318155352957547, "global_step": 49380, "epoch": 414, "lr": 2.1969171411675445e-05} +{"train_loss": 0.0009941424941644073, "global_step": 49381, "epoch": 414, "lr": 2.1967336829915764e-05} +{"train_loss": 0.0014340609777718782, "global_step": 49382, "epoch": 414, "lr": 2.1965502303195207e-05} +{"train_loss": 0.0009492874378338456, "global_step": 49383, "epoch": 414, "lr": 2.196366783151741e-05} +{"train_loss": 0.0009720680710346978, "global_step": 49384, "epoch": 414, "lr": 2.196183341488595e-05, "val_loss": 0.019253289327025414} +{"train_loss": 0.0008436237112618983, "global_step": 49385, "epoch": 415, "lr": 2.1959999053304424e-05} +{"train_loss": 0.001413022051565349, "global_step": 49386, "epoch": 415, "lr": 2.195816474677646e-05} +{"train_loss": 0.0007585983257740736, "global_step": 49387, "epoch": 415, "lr": 2.195633049530562e-05} +{"train_loss": 0.0006528896046802402, "global_step": 49388, "epoch": 415, "lr": 2.1954496298895556e-05} +{"train_loss": 0.001217854442074895, "global_step": 49389, "epoch": 415, "lr": 2.1952662157549843e-05} +{"train_loss": 0.0016131580341607332, "global_step": 49390, "epoch": 415, "lr": 2.1950828071272056e-05} +{"train_loss": 0.001500180340372026, "global_step": 49391, "epoch": 415, "lr": 2.194899404006584e-05} +{"train_loss": 0.0008057954837568104, "global_step": 49392, "epoch": 415, "lr": 2.1947160063934765e-05} +{"train_loss": 0.0008762910729274154, "global_step": 49393, "epoch": 415, "lr": 2.1945326142882457e-05} +{"train_loss": 0.0007116932538338006, "global_step": 49394, "epoch": 415, "lr": 2.1943492276912488e-05} +{"train_loss": 0.0009816109668463469, "global_step": 49395, "epoch": 415, "lr": 2.194165846602849e-05} +{"train_loss": 0.0007914781454019248, "global_step": 49396, "epoch": 415, "lr": 2.1939824710234052e-05} +{"train_loss": 0.0006321938126347959, "global_step": 49397, "epoch": 415, "lr": 2.193799100953275e-05} +{"train_loss": 0.0010035254526883364, "global_step": 49398, "epoch": 415, "lr": 2.1936157363928205e-05} +{"train_loss": 0.0011126581812277436, "global_step": 49399, "epoch": 415, "lr": 2.1934323773424036e-05} +{"train_loss": 0.000557536375708878, "global_step": 49400, "epoch": 415, "lr": 2.1932490238023807e-05} +{"train_loss": 0.0012023367453366518, "global_step": 49401, "epoch": 415, "lr": 2.193065675773115e-05} +{"train_loss": 0.000359695142833516, "global_step": 49402, "epoch": 415, "lr": 2.192882333254963e-05} +{"train_loss": 0.0009118749876506627, "global_step": 49403, "epoch": 415, "lr": 2.1926989962482893e-05} +{"train_loss": 0.0005583873717114329, "global_step": 49404, "epoch": 415, "lr": 2.1925156647534483e-05} +{"train_loss": 0.0005454655038192868, "global_step": 49405, "epoch": 415, "lr": 2.1923323387708054e-05} +{"train_loss": 0.000429864798206836, "global_step": 49406, "epoch": 415, "lr": 2.192149018300716e-05} +{"train_loss": 0.001351867918856442, "global_step": 49407, "epoch": 415, "lr": 2.191965703343544e-05} +{"train_loss": 0.0015916728880256414, "global_step": 49408, "epoch": 415, "lr": 2.1917823938996468e-05} +{"train_loss": 0.0014121894491836429, "global_step": 49409, "epoch": 415, "lr": 2.1915990899693834e-05} +{"train_loss": 0.001120291417464614, "global_step": 49410, "epoch": 415, "lr": 2.191415791553117e-05} +{"train_loss": 0.0008553695515729487, "global_step": 49411, "epoch": 415, "lr": 2.191232498651204e-05} +{"train_loss": 0.0015047439374029636, "global_step": 49412, "epoch": 415, "lr": 2.1910492112640076e-05} +{"train_loss": 0.0014252857072278857, "global_step": 49413, "epoch": 415, "lr": 2.1908659293918837e-05} +{"train_loss": 0.0009444795432500541, "global_step": 49414, "epoch": 415, "lr": 2.1906826530351966e-05} +{"train_loss": 0.0012742880498990417, "global_step": 49415, "epoch": 415, "lr": 2.1904993821943044e-05} +{"train_loss": 0.0012831168714910746, "global_step": 49416, "epoch": 415, "lr": 2.190316116869564e-05} +{"train_loss": 0.0010772872483357787, "global_step": 49417, "epoch": 415, "lr": 2.19013285706134e-05} +{"train_loss": 0.0014649364165961742, "global_step": 49418, "epoch": 415, "lr": 2.189949602769988e-05} +{"train_loss": 0.0008572421502321959, "global_step": 49419, "epoch": 415, "lr": 2.1897663539958714e-05} +{"train_loss": 0.0009825456654652953, "global_step": 49420, "epoch": 415, "lr": 2.1895831107393484e-05} +{"train_loss": 0.000831533398013562, "global_step": 49421, "epoch": 415, "lr": 2.189399873000777e-05} +{"train_loss": 0.0010604917770251632, "global_step": 49422, "epoch": 415, "lr": 2.1892166407805202e-05} +{"train_loss": 0.0006662945379503071, "global_step": 49423, "epoch": 415, "lr": 2.1890334140789353e-05} +{"train_loss": 0.00079157022992149, "global_step": 49424, "epoch": 415, "lr": 2.188850192896384e-05} +{"train_loss": 0.0004872554272878915, "global_step": 49425, "epoch": 415, "lr": 2.1886669772332234e-05} +{"train_loss": 0.0007934703608043492, "global_step": 49426, "epoch": 415, "lr": 2.1884837670898167e-05} +{"train_loss": 0.001266780192963779, "global_step": 49427, "epoch": 415, "lr": 2.1883005624665214e-05} +{"train_loss": 0.0006150317494757473, "global_step": 49428, "epoch": 415, "lr": 2.1881173633636965e-05} +{"train_loss": 0.0019885629881173372, "global_step": 49429, "epoch": 415, "lr": 2.187934169781704e-05} +{"train_loss": 0.0007222950225695968, "global_step": 49430, "epoch": 415, "lr": 2.187750981720901e-05} +{"train_loss": 0.0010153286857530475, "global_step": 49431, "epoch": 415, "lr": 2.1875677991816494e-05} +{"train_loss": 0.0007403765921480954, "global_step": 49432, "epoch": 415, "lr": 2.1873846221643067e-05} +{"train_loss": 0.0010023096110671759, "global_step": 49433, "epoch": 415, "lr": 2.187201450669234e-05} +{"train_loss": 0.0010130467126145959, "global_step": 49434, "epoch": 415, "lr": 2.1870182846967922e-05} +{"train_loss": 0.0014226891798898578, "global_step": 49435, "epoch": 415, "lr": 2.1868351242473378e-05} +{"train_loss": 0.0009915126720443368, "global_step": 49436, "epoch": 415, "lr": 2.1866519693212343e-05} +{"train_loss": 0.0006129624089226127, "global_step": 49437, "epoch": 415, "lr": 2.186468819918837e-05} +{"train_loss": 0.0006681777886115015, "global_step": 49438, "epoch": 415, "lr": 2.1862856760405092e-05} +{"train_loss": 0.0007697200635448098, "global_step": 49439, "epoch": 415, "lr": 2.186102537686609e-05} +{"train_loss": 0.0008886900031939149, "global_step": 49440, "epoch": 415, "lr": 2.1859194048574943e-05} +{"train_loss": 0.0009251259034499526, "global_step": 49441, "epoch": 415, "lr": 2.1857362775535277e-05} +{"train_loss": 0.0005911675398238003, "global_step": 49442, "epoch": 415, "lr": 2.1855531557750653e-05} +{"train_loss": 0.0005483863642439246, "global_step": 49443, "epoch": 415, "lr": 2.1853700395224706e-05} +{"train_loss": 0.0007844097563065588, "global_step": 49444, "epoch": 415, "lr": 2.1851869287960995e-05} +{"train_loss": 0.0014151646755635738, "global_step": 49445, "epoch": 415, "lr": 2.185003823596315e-05} +{"train_loss": 0.0007856524898670614, "global_step": 49446, "epoch": 415, "lr": 2.184820723923474e-05} +{"train_loss": 0.0006807340541854501, "global_step": 49447, "epoch": 415, "lr": 2.1846376297779358e-05} +{"train_loss": 0.0010093626333400607, "global_step": 49448, "epoch": 415, "lr": 2.1844545411600625e-05} +{"train_loss": 0.0007657954702153802, "global_step": 49449, "epoch": 415, "lr": 2.18427145807021e-05} +{"train_loss": 0.0012980062747374177, "global_step": 49450, "epoch": 415, "lr": 2.1840883805087415e-05} +{"train_loss": 0.0011469287564978004, "global_step": 49451, "epoch": 415, "lr": 2.1839053084760124e-05} +{"train_loss": 0.0011319521581754088, "global_step": 49452, "epoch": 415, "lr": 2.183722241972387e-05} +{"train_loss": 0.0013443637872114778, "global_step": 49453, "epoch": 415, "lr": 2.1835391809982215e-05} +{"train_loss": 0.0005294204456731677, "global_step": 49454, "epoch": 415, "lr": 2.183356125553874e-05} +{"train_loss": 0.0013048541732132435, "global_step": 49455, "epoch": 415, "lr": 2.183173075639708e-05} +{"train_loss": 0.0009815033990889788, "global_step": 49456, "epoch": 415, "lr": 2.1829900312560784e-05} +{"train_loss": 0.0012906950432807207, "global_step": 49457, "epoch": 415, "lr": 2.1828069924033494e-05} +{"train_loss": 0.0007901726057752967, "global_step": 49458, "epoch": 415, "lr": 2.1826239590818777e-05} +{"train_loss": 0.00045166120980866253, "global_step": 49459, "epoch": 415, "lr": 2.1824409312920207e-05} +{"train_loss": 0.0009507509530521929, "global_step": 49460, "epoch": 415, "lr": 2.1822579090341423e-05} +{"train_loss": 0.000872568809427321, "global_step": 49461, "epoch": 415, "lr": 2.1820748923085976e-05} +{"train_loss": 0.000991466804407537, "global_step": 49462, "epoch": 415, "lr": 2.181891881115749e-05} +{"train_loss": 0.0008053054916672409, "global_step": 49463, "epoch": 415, "lr": 2.1817088754559533e-05} +{"train_loss": 0.0006835308158770204, "global_step": 49464, "epoch": 415, "lr": 2.181525875329573e-05} +{"train_loss": 0.0008671797695569694, "global_step": 49465, "epoch": 415, "lr": 2.1813428807369634e-05} +{"train_loss": 0.0009784128051251173, "global_step": 49466, "epoch": 415, "lr": 2.181159891678488e-05} +{"train_loss": 0.0008163070888258517, "global_step": 49467, "epoch": 415, "lr": 2.180976908154502e-05} +{"train_loss": 0.001096912077628076, "global_step": 49468, "epoch": 415, "lr": 2.1807939301653686e-05} +{"train_loss": 0.0009981401963159442, "global_step": 49469, "epoch": 415, "lr": 2.1806109577114436e-05} +{"train_loss": 0.0009491026867181063, "global_step": 49470, "epoch": 415, "lr": 2.1804279907930892e-05} +{"train_loss": 0.0006189016858115792, "global_step": 49471, "epoch": 415, "lr": 2.1802450294106614e-05} +{"train_loss": 0.0007099391659721732, "global_step": 49472, "epoch": 415, "lr": 2.1800620735645232e-05} +{"train_loss": 0.0014232790563255548, "global_step": 49473, "epoch": 415, "lr": 2.1798791232550298e-05} +{"train_loss": 0.000633794057648629, "global_step": 49474, "epoch": 415, "lr": 2.179696178482545e-05} +{"train_loss": 0.0009662818629294634, "global_step": 49475, "epoch": 415, "lr": 2.1795132392474225e-05} +{"train_loss": 0.0006384763983078301, "global_step": 49476, "epoch": 415, "lr": 2.179330305550027e-05} +{"train_loss": 0.0006637452752329409, "global_step": 49477, "epoch": 415, "lr": 2.1791473773907152e-05} +{"train_loss": 0.0011437184875831008, "global_step": 49478, "epoch": 415, "lr": 2.178964454769844e-05} +{"train_loss": 0.0005802097148261964, "global_step": 49479, "epoch": 415, "lr": 2.178781537687776e-05} +{"train_loss": 0.0007276644464582205, "global_step": 49480, "epoch": 415, "lr": 2.1785986261448682e-05} +{"train_loss": 0.0009264030959457159, "global_step": 49481, "epoch": 415, "lr": 2.178415720141482e-05} +{"train_loss": 0.0009275325573980808, "global_step": 49482, "epoch": 415, "lr": 2.1782328196779733e-05} +{"train_loss": 0.0016039892798289657, "global_step": 49483, "epoch": 415, "lr": 2.178049924754705e-05} +{"train_loss": 0.0009748133015818894, "global_step": 49484, "epoch": 415, "lr": 2.177867035372034e-05} +{"train_loss": 0.0004425467341206968, "global_step": 49485, "epoch": 415, "lr": 2.1776841515303176e-05} +{"train_loss": 0.0009149552788585424, "global_step": 49486, "epoch": 415, "lr": 2.1775012732299187e-05} +{"train_loss": 0.0006487630307674408, "global_step": 49487, "epoch": 415, "lr": 2.177318400471193e-05} +{"train_loss": 0.000583539716899395, "global_step": 49488, "epoch": 415, "lr": 2.177135533254503e-05} +{"train_loss": 0.0013680014526471496, "global_step": 49489, "epoch": 415, "lr": 2.176952671580205e-05} +{"train_loss": 0.0006566078518517315, "global_step": 49490, "epoch": 415, "lr": 2.1767698154486578e-05} +{"train_loss": 0.0010422330815345049, "global_step": 49491, "epoch": 415, "lr": 2.1765869648602228e-05} +{"train_loss": 0.0011443032417446375, "global_step": 49492, "epoch": 415, "lr": 2.1764041198152563e-05} +{"train_loss": 0.0005550780333578587, "global_step": 49493, "epoch": 415, "lr": 2.1762212803141204e-05} +{"train_loss": 0.0008547946927137673, "global_step": 49494, "epoch": 415, "lr": 2.1760384463571698e-05} +{"train_loss": 0.0012027887860313058, "global_step": 49495, "epoch": 415, "lr": 2.1758556179447686e-05} +{"train_loss": 0.0012422007275745273, "global_step": 49496, "epoch": 415, "lr": 2.175672795077271e-05} +{"train_loss": 0.0012971553951501846, "global_step": 49497, "epoch": 415, "lr": 2.1754899777550402e-05} +{"train_loss": 0.0004922754596918821, "global_step": 49498, "epoch": 415, "lr": 2.1753071659784308e-05} +{"train_loss": 0.0006133446004241705, "global_step": 49499, "epoch": 415, "lr": 2.175124359747806e-05} +{"train_loss": 0.0011799382045865059, "global_step": 49500, "epoch": 415, "lr": 2.1749415590635213e-05} +{"train_loss": 0.0005974267842248082, "global_step": 49501, "epoch": 415, "lr": 2.1747587639259387e-05} +{"train_loss": 0.0011067077284678817, "global_step": 49502, "epoch": 415, "lr": 2.174575974335413e-05} +{"train_loss": 0.000942595476458757, "global_step": 49503, "epoch": 415, "lr": 2.1743931902923083e-05, "val_loss": 0.04498045891523361, "train_action_mse_error": 1.668081313255243e-05} +{"train_loss": 0.0005587643245235085, "global_step": 49504, "epoch": 416, "lr": 2.1742104117969786e-05} +{"train_loss": 0.0012315241619944572, "global_step": 49505, "epoch": 416, "lr": 2.1740276388497865e-05} +{"train_loss": 0.0012730711605399847, "global_step": 49506, "epoch": 416, "lr": 2.173844871451087e-05} +{"train_loss": 0.0009804106084629893, "global_step": 49507, "epoch": 416, "lr": 2.1736621096012437e-05} +{"train_loss": 0.0006748057785443962, "global_step": 49508, "epoch": 416, "lr": 2.1734793533006126e-05} +{"train_loss": 0.0011691659456118941, "global_step": 49509, "epoch": 416, "lr": 2.173296602549551e-05} +{"train_loss": 0.0008688835077919066, "global_step": 49510, "epoch": 416, "lr": 2.1731138573484213e-05} +{"train_loss": 0.0012368677416816354, "global_step": 49511, "epoch": 416, "lr": 2.1729311176975787e-05} +{"train_loss": 0.0009217338520102203, "global_step": 49512, "epoch": 416, "lr": 2.172748383597386e-05} +{"train_loss": 0.0005987115437164903, "global_step": 49513, "epoch": 416, "lr": 2.1725656550481976e-05} +{"train_loss": 0.0007116986671462655, "global_step": 49514, "epoch": 416, "lr": 2.1723829320503765e-05} +{"train_loss": 0.0008494814392179251, "global_step": 49515, "epoch": 416, "lr": 2.172200214604279e-05} +{"train_loss": 0.0009424779564142227, "global_step": 49516, "epoch": 416, "lr": 2.172017502710263e-05} +{"train_loss": 0.0010536302579566836, "global_step": 49517, "epoch": 416, "lr": 2.17183479636869e-05} +{"train_loss": 0.0008749524131417274, "global_step": 49518, "epoch": 416, "lr": 2.1716520955799153e-05} +{"train_loss": 0.0012076436541974545, "global_step": 49519, "epoch": 416, "lr": 2.171469400344302e-05} +{"train_loss": 0.0010099367937073112, "global_step": 49520, "epoch": 416, "lr": 2.1712867106622058e-05} +{"train_loss": 0.0012917598942294717, "global_step": 49521, "epoch": 416, "lr": 2.1711040265339842e-05} +{"train_loss": 0.0006711507448926568, "global_step": 49522, "epoch": 416, "lr": 2.1709213479599993e-05} +{"train_loss": 0.0018376160878688097, "global_step": 49523, "epoch": 416, "lr": 2.1707386749406068e-05} +{"train_loss": 0.0012905651237815619, "global_step": 49524, "epoch": 416, "lr": 2.1705560074761677e-05} +{"train_loss": 0.0007720206631347537, "global_step": 49525, "epoch": 416, "lr": 2.1703733455670384e-05} +{"train_loss": 0.0007521443767473102, "global_step": 49526, "epoch": 416, "lr": 2.1701906892135804e-05} +{"train_loss": 0.0009672587621025741, "global_step": 49527, "epoch": 416, "lr": 2.1700080384161505e-05} +{"train_loss": 0.000942094309721142, "global_step": 49528, "epoch": 416, "lr": 2.1698253931751055e-05} +{"train_loss": 0.0007418991881422698, "global_step": 49529, "epoch": 416, "lr": 2.169642753490808e-05} +{"train_loss": 0.0009314027847722173, "global_step": 49530, "epoch": 416, "lr": 2.1694601193636133e-05} +{"train_loss": 0.0007914782618172467, "global_step": 49531, "epoch": 416, "lr": 2.1692774907938806e-05} +{"train_loss": 0.0008229219820350409, "global_step": 49532, "epoch": 416, "lr": 2.1690948677819712e-05} +{"train_loss": 0.0013151222374290228, "global_step": 49533, "epoch": 416, "lr": 2.16891225032824e-05} +{"train_loss": 0.0010542579693719745, "global_step": 49534, "epoch": 416, "lr": 2.1687296384330487e-05} +{"train_loss": 0.0010887939715757966, "global_step": 49535, "epoch": 416, "lr": 2.1685470320967522e-05} +{"train_loss": 0.000904584361705929, "global_step": 49536, "epoch": 416, "lr": 2.168364431319713e-05} +{"train_loss": 0.0013863296480849385, "global_step": 49537, "epoch": 416, "lr": 2.168181836102286e-05} +{"train_loss": 0.0007093914900906384, "global_step": 49538, "epoch": 416, "lr": 2.1679992464448335e-05} +{"train_loss": 0.0010092180455103517, "global_step": 49539, "epoch": 416, "lr": 2.1678166623477112e-05} +{"train_loss": 0.0007356765563599765, "global_step": 49540, "epoch": 416, "lr": 2.1676340838112773e-05} +{"train_loss": 0.00198121415451169, "global_step": 49541, "epoch": 416, "lr": 2.1674515108358928e-05} +{"train_loss": 0.0007063787779770792, "global_step": 49542, "epoch": 416, "lr": 2.1672689434219128e-05} +{"train_loss": 0.0011572742369025946, "global_step": 49543, "epoch": 416, "lr": 2.1670863815696995e-05} +{"train_loss": 0.0012159149628132582, "global_step": 49544, "epoch": 416, "lr": 2.1669038252796074e-05} +{"train_loss": 0.0009315124480053782, "global_step": 49545, "epoch": 416, "lr": 2.1667212745519993e-05} +{"train_loss": 0.0007214698125608265, "global_step": 49546, "epoch": 416, "lr": 2.1665387293872306e-05} +{"train_loss": 0.0003328250895719975, "global_step": 49547, "epoch": 416, "lr": 2.1663561897856595e-05} +{"train_loss": 0.0009676235495135188, "global_step": 49548, "epoch": 416, "lr": 2.1661736557476464e-05} +{"train_loss": 0.0008094465592876077, "global_step": 49549, "epoch": 416, "lr": 2.1659911272735467e-05} +{"train_loss": 0.0010013363789767027, "global_step": 49550, "epoch": 416, "lr": 2.1658086043637227e-05} +{"train_loss": 0.0006863073213025928, "global_step": 49551, "epoch": 416, "lr": 2.165626087018529e-05} +{"train_loss": 0.0014718238962814212, "global_step": 49552, "epoch": 416, "lr": 2.1654435752383273e-05} +{"train_loss": 0.001018333830870688, "global_step": 49553, "epoch": 416, "lr": 2.1652610690234742e-05} +{"train_loss": 0.0007019350887276232, "global_step": 49554, "epoch": 416, "lr": 2.165078568374327e-05} +{"train_loss": 0.0013021953636780381, "global_step": 49555, "epoch": 416, "lr": 2.164896073291246e-05} +{"train_loss": 0.0007465318194590509, "global_step": 49556, "epoch": 416, "lr": 2.1647135837745875e-05} +{"train_loss": 0.0005122944712638855, "global_step": 49557, "epoch": 416, "lr": 2.1645310998247127e-05} +{"train_loss": 0.0007182068075053394, "global_step": 49558, "epoch": 416, "lr": 2.164348621441978e-05} +{"train_loss": 0.001646077842451632, "global_step": 49559, "epoch": 416, "lr": 2.16416614862674e-05} +{"train_loss": 0.0007400305476039648, "global_step": 49560, "epoch": 416, "lr": 2.1639836813793607e-05} +{"train_loss": 0.0004920685314573348, "global_step": 49561, "epoch": 416, "lr": 2.1638012197001945e-05} +{"train_loss": 0.0018149021780118346, "global_step": 49562, "epoch": 416, "lr": 2.163618763589604e-05} +{"train_loss": 0.0006858020205982029, "global_step": 49563, "epoch": 416, "lr": 2.1634363130479425e-05} +{"train_loss": 0.000988644897006452, "global_step": 49564, "epoch": 416, "lr": 2.1632538680755725e-05} +{"train_loss": 0.0016762297600507736, "global_step": 49565, "epoch": 416, "lr": 2.1630714286728494e-05} +{"train_loss": 0.0008794381283223629, "global_step": 49566, "epoch": 416, "lr": 2.162888994840132e-05} +{"train_loss": 0.0008426179992966354, "global_step": 49567, "epoch": 416, "lr": 2.1627065665777806e-05} +{"train_loss": 0.0010479615302756429, "global_step": 49568, "epoch": 416, "lr": 2.1625241438861505e-05} +{"train_loss": 0.0007297068368643522, "global_step": 49569, "epoch": 416, "lr": 2.1623417267656025e-05} +{"train_loss": 0.002022814704105258, "global_step": 49570, "epoch": 416, "lr": 2.1621593152164916e-05} +{"train_loss": 0.0007886941893957555, "global_step": 49571, "epoch": 416, "lr": 2.1619769092391794e-05} +{"train_loss": 0.0014407713897526264, "global_step": 49572, "epoch": 416, "lr": 2.161794508834023e-05} +{"train_loss": 0.0008459946839138865, "global_step": 49573, "epoch": 416, "lr": 2.1616121140013772e-05} +{"train_loss": 0.0008912245975807309, "global_step": 49574, "epoch": 416, "lr": 2.1614297247416053e-05} +{"train_loss": 0.001017073867842555, "global_step": 49575, "epoch": 416, "lr": 2.1612473410550605e-05} +{"train_loss": 0.0010747105116024613, "global_step": 49576, "epoch": 416, "lr": 2.1610649629421052e-05} +{"train_loss": 0.0017022719839587808, "global_step": 49577, "epoch": 416, "lr": 2.160882590403096e-05} +{"train_loss": 0.0011018222430720925, "global_step": 49578, "epoch": 416, "lr": 2.1607002234383883e-05} +{"train_loss": 0.0008527925238013268, "global_step": 49579, "epoch": 416, "lr": 2.160517862048344e-05} +{"train_loss": 0.000707930710632354, "global_step": 49580, "epoch": 416, "lr": 2.160335506233318e-05} +{"train_loss": 0.001071292906999588, "global_step": 49581, "epoch": 416, "lr": 2.1601531559936715e-05} +{"train_loss": 0.0013767494820058346, "global_step": 49582, "epoch": 416, "lr": 2.1599708113297597e-05} +{"train_loss": 0.0008256600704044104, "global_step": 49583, "epoch": 416, "lr": 2.1597884722419427e-05} +{"train_loss": 0.0015596834709867835, "global_step": 49584, "epoch": 416, "lr": 2.1596061387305783e-05} +{"train_loss": 0.0014972921926528215, "global_step": 49585, "epoch": 416, "lr": 2.1594238107960212e-05} +{"train_loss": 0.0007819244056008756, "global_step": 49586, "epoch": 416, "lr": 2.1592414884386346e-05} +{"train_loss": 0.0010942919179797173, "global_step": 49587, "epoch": 416, "lr": 2.1590591716587717e-05} +{"train_loss": 0.0011530108749866486, "global_step": 49588, "epoch": 416, "lr": 2.1588768604567945e-05} +{"train_loss": 0.0013660669792443514, "global_step": 49589, "epoch": 416, "lr": 2.1586945548330588e-05} +{"train_loss": 0.0010042060166597366, "global_step": 49590, "epoch": 416, "lr": 2.1585122547879218e-05} +{"train_loss": 0.0006936801946721971, "global_step": 49591, "epoch": 416, "lr": 2.1583299603217432e-05} +{"train_loss": 0.0017429515719413757, "global_step": 49592, "epoch": 416, "lr": 2.1581476714348788e-05} +{"train_loss": 0.0004293177044019103, "global_step": 49593, "epoch": 416, "lr": 2.1579653881276894e-05} +{"train_loss": 0.0006052767857909203, "global_step": 49594, "epoch": 416, "lr": 2.15778311040053e-05} +{"train_loss": 0.0010931864380836487, "global_step": 49595, "epoch": 416, "lr": 2.157600838253761e-05} +{"train_loss": 0.001323765842244029, "global_step": 49596, "epoch": 416, "lr": 2.1574185716877377e-05} +{"train_loss": 0.0007429170073010027, "global_step": 49597, "epoch": 416, "lr": 2.157236310702821e-05} +{"train_loss": 0.001344232470728457, "global_step": 49598, "epoch": 416, "lr": 2.1570540552993658e-05} +{"train_loss": 0.0007405454525724053, "global_step": 49599, "epoch": 416, "lr": 2.156871805477732e-05} +{"train_loss": 0.0014899310190230608, "global_step": 49600, "epoch": 416, "lr": 2.156689561238276e-05} +{"train_loss": 0.0013102074153721333, "global_step": 49601, "epoch": 416, "lr": 2.1565073225813553e-05} +{"train_loss": 0.0009324726415798068, "global_step": 49602, "epoch": 416, "lr": 2.1563250895073313e-05} +{"train_loss": 0.001068205339834094, "global_step": 49603, "epoch": 416, "lr": 2.1561428620165587e-05} +{"train_loss": 0.0010681338608264923, "global_step": 49604, "epoch": 416, "lr": 2.1559606401093942e-05} +{"train_loss": 0.0008377536432817578, "global_step": 49605, "epoch": 416, "lr": 2.1557784237861988e-05} +{"train_loss": 0.0009285960113629699, "global_step": 49606, "epoch": 416, "lr": 2.1555962130473267e-05} +{"train_loss": 0.0008494858630001545, "global_step": 49607, "epoch": 416, "lr": 2.1554140078931396e-05} +{"train_loss": 0.0010678945109248161, "global_step": 49608, "epoch": 416, "lr": 2.155231808323993e-05} +{"train_loss": 0.0012253200402483344, "global_step": 49609, "epoch": 416, "lr": 2.1550496143402433e-05} +{"train_loss": 0.0008983876323327422, "global_step": 49610, "epoch": 416, "lr": 2.1548674259422514e-05} +{"train_loss": 0.0009919945150613785, "global_step": 49611, "epoch": 416, "lr": 2.1546852431303716e-05} +{"train_loss": 0.0009225425310432911, "global_step": 49612, "epoch": 416, "lr": 2.1545030659049648e-05} +{"train_loss": 0.00101237534545362, "global_step": 49613, "epoch": 416, "lr": 2.1543208942663857e-05} +{"train_loss": 0.0014287964440882206, "global_step": 49614, "epoch": 416, "lr": 2.1541387282149956e-05} +{"train_loss": 0.0009056013659574091, "global_step": 49615, "epoch": 416, "lr": 2.1539565677511497e-05} +{"train_loss": 0.0008889900054782629, "global_step": 49616, "epoch": 416, "lr": 2.153774412875204e-05} +{"train_loss": 0.0007089052232913673, "global_step": 49617, "epoch": 416, "lr": 2.1535922635875204e-05} +{"train_loss": 0.0014715221477672458, "global_step": 49618, "epoch": 416, "lr": 2.1534101198884522e-05} +{"train_loss": 0.0012455536052584648, "global_step": 49619, "epoch": 416, "lr": 2.1532279817783612e-05} +{"train_loss": 0.0012080160668119788, "global_step": 49620, "epoch": 416, "lr": 2.153045849257601e-05} +{"train_loss": 0.0007064781384542584, "global_step": 49621, "epoch": 416, "lr": 2.152863722326533e-05} +{"train_loss": 0.0010215308560751098, "global_step": 49622, "epoch": 416, "lr": 2.152681600985513e-05, "val_loss": 0.02512139268219471} +{"train_loss": 0.0010519070783630013, "global_step": 49623, "epoch": 417, "lr": 2.152499485234896e-05} +{"train_loss": 0.0014436285709962249, "global_step": 49624, "epoch": 417, "lr": 2.1523173750750448e-05} +{"train_loss": 0.0006661987281404436, "global_step": 49625, "epoch": 417, "lr": 2.152135270506312e-05} +{"train_loss": 0.0008402667008340359, "global_step": 49626, "epoch": 417, "lr": 2.151953171529059e-05} +{"train_loss": 0.0011978503316640854, "global_step": 49627, "epoch": 417, "lr": 2.151771078143642e-05} +{"train_loss": 0.0009479301515966654, "global_step": 49628, "epoch": 417, "lr": 2.151588990350416e-05} +{"train_loss": 0.0009823122527450323, "global_step": 49629, "epoch": 417, "lr": 2.1514069081497407e-05} +{"train_loss": 0.001674120663665235, "global_step": 49630, "epoch": 417, "lr": 2.1512248315419757e-05} +{"train_loss": 0.0009541545296087861, "global_step": 49631, "epoch": 417, "lr": 2.1510427605274745e-05} +{"train_loss": 0.0022261752746999264, "global_step": 49632, "epoch": 417, "lr": 2.1508606951065984e-05} +{"train_loss": 0.0007607212173752487, "global_step": 49633, "epoch": 417, "lr": 2.150678635279701e-05} +{"train_loss": 0.000848052091896534, "global_step": 49634, "epoch": 417, "lr": 2.1504965810471433e-05} +{"train_loss": 0.0009671044535934925, "global_step": 49635, "epoch": 417, "lr": 2.15031453240928e-05} +{"train_loss": 0.001620507682673633, "global_step": 49636, "epoch": 417, "lr": 2.150132489366471e-05} +{"train_loss": 0.0010516648180782795, "global_step": 49637, "epoch": 417, "lr": 2.1499504519190706e-05} +{"train_loss": 0.00046072143595665693, "global_step": 49638, "epoch": 417, "lr": 2.1497684200674396e-05} +{"train_loss": 0.0016223021084442735, "global_step": 49639, "epoch": 417, "lr": 2.1495863938119327e-05} +{"train_loss": 0.0015586641384288669, "global_step": 49640, "epoch": 417, "lr": 2.1494043731529094e-05} +{"train_loss": 0.0012178680626675487, "global_step": 49641, "epoch": 417, "lr": 2.1492223580907267e-05} +{"train_loss": 0.0004945595865137875, "global_step": 49642, "epoch": 417, "lr": 2.1490403486257388e-05} +{"train_loss": 0.0008486562292091548, "global_step": 49643, "epoch": 417, "lr": 2.148858344758308e-05} +{"train_loss": 0.0010809075320139527, "global_step": 49644, "epoch": 417, "lr": 2.148676346488787e-05} +{"train_loss": 0.0009003687300719321, "global_step": 49645, "epoch": 417, "lr": 2.148494353817538e-05} +{"train_loss": 0.0012132865376770496, "global_step": 49646, "epoch": 417, "lr": 2.1483123667449153e-05} +{"train_loss": 0.001342037576250732, "global_step": 49647, "epoch": 417, "lr": 2.1481303852712742e-05} +{"train_loss": 0.0010757895652204752, "global_step": 49648, "epoch": 417, "lr": 2.1479484093969763e-05} +{"train_loss": 0.0010806489735841751, "global_step": 49649, "epoch": 417, "lr": 2.147766439122376e-05} +{"train_loss": 0.0008817087509669363, "global_step": 49650, "epoch": 417, "lr": 2.147584474447833e-05} +{"train_loss": 0.000619799189735204, "global_step": 49651, "epoch": 417, "lr": 2.1474025153737015e-05} +{"train_loss": 0.0006789324688725173, "global_step": 49652, "epoch": 417, "lr": 2.1472205619003415e-05} +{"train_loss": 0.0012076059356331825, "global_step": 49653, "epoch": 417, "lr": 2.1470386140281103e-05} +{"train_loss": 0.0007789506344124675, "global_step": 49654, "epoch": 417, "lr": 2.1468566717573614e-05} +{"train_loss": 0.0014653842663392425, "global_step": 49655, "epoch": 417, "lr": 2.1466747350884565e-05} +{"train_loss": 0.0008788141421973705, "global_step": 49656, "epoch": 417, "lr": 2.1464928040217492e-05} +{"train_loss": 0.000780379050411284, "global_step": 49657, "epoch": 417, "lr": 2.1463108785576004e-05} +{"train_loss": 0.0011599110439419746, "global_step": 49658, "epoch": 417, "lr": 2.1461289586963645e-05} +{"train_loss": 0.0010630638571456075, "global_step": 49659, "epoch": 417, "lr": 2.145947044438399e-05} +{"train_loss": 0.0009267614223062992, "global_step": 49660, "epoch": 417, "lr": 2.1457651357840624e-05} +{"train_loss": 0.0012134917778894305, "global_step": 49661, "epoch": 417, "lr": 2.1455832327337095e-05} +{"train_loss": 0.0011529442854225636, "global_step": 49662, "epoch": 417, "lr": 2.1454013352877006e-05} +{"train_loss": 0.0009659925126470625, "global_step": 49663, "epoch": 417, "lr": 2.1452194434463895e-05} +{"train_loss": 0.0014387042028829455, "global_step": 49664, "epoch": 417, "lr": 2.1450375572101356e-05} +{"train_loss": 0.0010042211506515741, "global_step": 49665, "epoch": 417, "lr": 2.1448556765792967e-05} +{"train_loss": 0.0011495903600007296, "global_step": 49666, "epoch": 417, "lr": 2.144673801554227e-05} +{"train_loss": 0.0017253003316000104, "global_step": 49667, "epoch": 417, "lr": 2.144491932135287e-05} +{"train_loss": 0.0010887101525440812, "global_step": 49668, "epoch": 417, "lr": 2.14431006832283e-05} +{"train_loss": 0.0016883165808394551, "global_step": 49669, "epoch": 417, "lr": 2.144128210117217e-05} +{"train_loss": 0.0010560407536104321, "global_step": 49670, "epoch": 417, "lr": 2.143946357518802e-05} +{"train_loss": 0.001022518496029079, "global_step": 49671, "epoch": 417, "lr": 2.1437645105279442e-05} +{"train_loss": 0.0014839478535577655, "global_step": 49672, "epoch": 417, "lr": 2.1435826691449997e-05} +{"train_loss": 0.0006994324503466487, "global_step": 49673, "epoch": 417, "lr": 2.1434008333703236e-05} +{"train_loss": 0.0015394393121823668, "global_step": 49674, "epoch": 417, "lr": 2.143219003204277e-05} +{"train_loss": 0.0007263189763762057, "global_step": 49675, "epoch": 417, "lr": 2.1430371786472133e-05} +{"train_loss": 0.0010694705415517092, "global_step": 49676, "epoch": 417, "lr": 2.1428553596994915e-05} +{"train_loss": 0.001094405073672533, "global_step": 49677, "epoch": 417, "lr": 2.142673546361469e-05} +{"train_loss": 0.001394235179759562, "global_step": 49678, "epoch": 417, "lr": 2.1424917386334992e-05} +{"train_loss": 0.001252639340236783, "global_step": 49679, "epoch": 417, "lr": 2.142309936515944e-05} +{"train_loss": 0.0009170385310426354, "global_step": 49680, "epoch": 417, "lr": 2.142128140009156e-05} +{"train_loss": 0.00086238794028759, "global_step": 49681, "epoch": 417, "lr": 2.1419463491134957e-05} +{"train_loss": 0.0014007198624312878, "global_step": 49682, "epoch": 417, "lr": 2.141764563829316e-05} +{"train_loss": 0.0009338975651189685, "global_step": 49683, "epoch": 417, "lr": 2.141582784156979e-05} +{"train_loss": 0.000988614745438099, "global_step": 49684, "epoch": 417, "lr": 2.1414010100968383e-05} +{"train_loss": 0.0015284873079508543, "global_step": 49685, "epoch": 417, "lr": 2.14121924164925e-05} +{"train_loss": 0.0013722380390390754, "global_step": 49686, "epoch": 417, "lr": 2.1410374788145736e-05} +{"train_loss": 0.0010256606619805098, "global_step": 49687, "epoch": 417, "lr": 2.140855721593163e-05} +{"train_loss": 0.0011246632784605026, "global_step": 49688, "epoch": 417, "lr": 2.1406739699853783e-05} +{"train_loss": 0.00041079852962866426, "global_step": 49689, "epoch": 417, "lr": 2.1404922239915735e-05} +{"train_loss": 0.001119977212511003, "global_step": 49690, "epoch": 417, "lr": 2.1403104836121085e-05} +{"train_loss": 0.0011296870652586222, "global_step": 49691, "epoch": 417, "lr": 2.1401287488473383e-05} +{"train_loss": 0.001255576964467764, "global_step": 49692, "epoch": 417, "lr": 2.1399470196976172e-05} +{"train_loss": 0.0011257920414209366, "global_step": 49693, "epoch": 417, "lr": 2.1397652961633075e-05} +{"train_loss": 0.0014714394928887486, "global_step": 49694, "epoch": 417, "lr": 2.1395835782447605e-05} +{"train_loss": 0.0011171214282512665, "global_step": 49695, "epoch": 417, "lr": 2.1394018659423377e-05} +{"train_loss": 0.0013306032633408904, "global_step": 49696, "epoch": 417, "lr": 2.1392201592563922e-05} +{"train_loss": 0.0010033291764557362, "global_step": 49697, "epoch": 417, "lr": 2.1390384581872835e-05} +{"train_loss": 0.001840274897404015, "global_step": 49698, "epoch": 417, "lr": 2.1388567627353655e-05} +{"train_loss": 0.0011429921723902225, "global_step": 49699, "epoch": 417, "lr": 2.1386750729009968e-05} +{"train_loss": 0.000813713064417243, "global_step": 49700, "epoch": 417, "lr": 2.1384933886845355e-05} +{"train_loss": 0.001433784724213183, "global_step": 49701, "epoch": 417, "lr": 2.1383117100863347e-05} +{"train_loss": 0.0005697104497812688, "global_step": 49702, "epoch": 417, "lr": 2.1381300371067555e-05} +{"train_loss": 0.00105666508898139, "global_step": 49703, "epoch": 417, "lr": 2.1379483697461522e-05} +{"train_loss": 0.0010370572563260794, "global_step": 49704, "epoch": 417, "lr": 2.137766708004879e-05} +{"train_loss": 0.001079833833500743, "global_step": 49705, "epoch": 417, "lr": 2.1375850518832972e-05} +{"train_loss": 0.001319030998274684, "global_step": 49706, "epoch": 417, "lr": 2.13740340138176e-05} +{"train_loss": 0.001077587017789483, "global_step": 49707, "epoch": 417, "lr": 2.1372217565006268e-05} +{"train_loss": 0.0008465040009468794, "global_step": 49708, "epoch": 417, "lr": 2.1370401172402532e-05} +{"train_loss": 0.0017315333243459463, "global_step": 49709, "epoch": 417, "lr": 2.1368584836009932e-05} +{"train_loss": 0.0018237648764625192, "global_step": 49710, "epoch": 417, "lr": 2.136676855583208e-05} +{"train_loss": 0.0009626212413422763, "global_step": 49711, "epoch": 417, "lr": 2.1364952331872494e-05} +{"train_loss": 0.0017435216577723622, "global_step": 49712, "epoch": 417, "lr": 2.136313616413479e-05} +{"train_loss": 0.000458346214145422, "global_step": 49713, "epoch": 417, "lr": 2.1361320052622484e-05} +{"train_loss": 0.0005908257444389164, "global_step": 49714, "epoch": 417, "lr": 2.135950399733919e-05} +{"train_loss": 0.0007838791934773326, "global_step": 49715, "epoch": 417, "lr": 2.135768799828845e-05} +{"train_loss": 0.0009755823411978781, "global_step": 49716, "epoch": 417, "lr": 2.1355872055473807e-05} +{"train_loss": 0.0009032076923176646, "global_step": 49717, "epoch": 417, "lr": 2.1354056168898874e-05} +{"train_loss": 0.0005742776556871831, "global_step": 49718, "epoch": 417, "lr": 2.1352240338567165e-05} +{"train_loss": 0.0012427305337041616, "global_step": 49719, "epoch": 417, "lr": 2.1350424564482296e-05} +{"train_loss": 0.0007836807053536177, "global_step": 49720, "epoch": 417, "lr": 2.1348608846647784e-05} +{"train_loss": 0.0010857436573132873, "global_step": 49721, "epoch": 417, "lr": 2.1346793185067237e-05} +{"train_loss": 0.0016548237763345242, "global_step": 49722, "epoch": 417, "lr": 2.1344977579744206e-05} +{"train_loss": 0.001745280809700489, "global_step": 49723, "epoch": 417, "lr": 2.134316203068223e-05} +{"train_loss": 0.0008093338692560792, "global_step": 49724, "epoch": 417, "lr": 2.134134653788491e-05} +{"train_loss": 0.0007010411936789751, "global_step": 49725, "epoch": 417, "lr": 2.1339531101355775e-05} +{"train_loss": 0.0011375721078366041, "global_step": 49726, "epoch": 417, "lr": 2.1337715721098428e-05} +{"train_loss": 0.001214152667671442, "global_step": 49727, "epoch": 417, "lr": 2.133590039711639e-05} +{"train_loss": 0.001007281243801117, "global_step": 49728, "epoch": 417, "lr": 2.1334085129413277e-05} +{"train_loss": 0.002631568117067218, "global_step": 49729, "epoch": 417, "lr": 2.1332269917992608e-05} +{"train_loss": 0.001303924829699099, "global_step": 49730, "epoch": 417, "lr": 2.1330454762857977e-05} +{"train_loss": 0.0009030386572703719, "global_step": 49731, "epoch": 417, "lr": 2.1328639664012917e-05} +{"train_loss": 0.0006822912837378681, "global_step": 49732, "epoch": 417, "lr": 2.132682462146103e-05} +{"train_loss": 0.0011483699781820178, "global_step": 49733, "epoch": 417, "lr": 2.1325009635205838e-05} +{"train_loss": 0.0015089587541297078, "global_step": 49734, "epoch": 417, "lr": 2.1323194705250948e-05} +{"train_loss": 0.0006226630648598075, "global_step": 49735, "epoch": 417, "lr": 2.1321379831599886e-05} +{"train_loss": 0.0005884991842322052, "global_step": 49736, "epoch": 417, "lr": 2.1319565014256245e-05} +{"train_loss": 0.0014956489903852344, "global_step": 49737, "epoch": 417, "lr": 2.1317750253223557e-05} +{"train_loss": 0.0012048403732478619, "global_step": 49738, "epoch": 417, "lr": 2.1315935548505417e-05} +{"train_loss": 0.0018557598814368248, "global_step": 49739, "epoch": 417, "lr": 2.131412090010536e-05} +{"train_loss": 0.0011874549090862274, "global_step": 49740, "epoch": 417, "lr": 2.1312306308026976e-05} +{"train_loss": 0.0011303943509486417, "global_step": 49741, "epoch": 417, "lr": 2.1310491772273817e-05, "val_loss": 0.014325682073831558} +{"train_loss": 0.0008754439186304808, "global_step": 49742, "epoch": 418, "lr": 2.1308677292849422e-05} +{"train_loss": 0.0010348138166591525, "global_step": 49743, "epoch": 418, "lr": 2.1306862869757395e-05} +{"train_loss": 0.0020838407799601555, "global_step": 49744, "epoch": 418, "lr": 2.1305048503001257e-05} +{"train_loss": 0.0007495652534998953, "global_step": 49745, "epoch": 418, "lr": 2.130323419258461e-05} +{"train_loss": 0.0009315789211541414, "global_step": 49746, "epoch": 418, "lr": 2.1301419938510992e-05} +{"train_loss": 0.0008051848853938282, "global_step": 49747, "epoch": 418, "lr": 2.1299605740783955e-05} +{"train_loss": 0.0015462531009688973, "global_step": 49748, "epoch": 418, "lr": 2.1297791599407097e-05} +{"train_loss": 0.0009980732575058937, "global_step": 49749, "epoch": 418, "lr": 2.1295977514383937e-05} +{"train_loss": 0.0010106334229931235, "global_step": 49750, "epoch": 418, "lr": 2.1294163485718076e-05} +{"train_loss": 0.001180659281089902, "global_step": 49751, "epoch": 418, "lr": 2.1292349513413046e-05} +{"train_loss": 0.0010778889991343021, "global_step": 49752, "epoch": 418, "lr": 2.1290535597472434e-05} +{"train_loss": 0.0020390236750245094, "global_step": 49753, "epoch": 418, "lr": 2.128872173789979e-05} +{"train_loss": 0.0009889951907098293, "global_step": 49754, "epoch": 418, "lr": 2.1286907934698652e-05} +{"train_loss": 0.0008435534546151757, "global_step": 49755, "epoch": 418, "lr": 2.1285094187872623e-05} +{"train_loss": 0.0011842147214338183, "global_step": 49756, "epoch": 418, "lr": 2.128328049742523e-05} +{"train_loss": 0.0010222221026197076, "global_step": 49757, "epoch": 418, "lr": 2.1281466863360063e-05} +{"train_loss": 0.0010301906149834394, "global_step": 49758, "epoch": 418, "lr": 2.1279653285680646e-05} +{"train_loss": 0.0004580099484883249, "global_step": 49759, "epoch": 418, "lr": 2.1277839764390583e-05} +{"train_loss": 0.001027693971991539, "global_step": 49760, "epoch": 418, "lr": 2.1276026299493414e-05} +{"train_loss": 0.0008728434913791716, "global_step": 49761, "epoch": 418, "lr": 2.127421289099268e-05} +{"train_loss": 0.0005928419413976371, "global_step": 49762, "epoch": 418, "lr": 2.1272399538891957e-05} +{"train_loss": 0.0016204832354560494, "global_step": 49763, "epoch": 418, "lr": 2.127058624319483e-05} +{"train_loss": 0.0007401908515021205, "global_step": 49764, "epoch": 418, "lr": 2.1268773003904813e-05} +{"train_loss": 0.00042461632983759046, "global_step": 49765, "epoch": 418, "lr": 2.1266959821025518e-05} +{"train_loss": 0.0006942079635336995, "global_step": 49766, "epoch": 418, "lr": 2.126514669456045e-05} +{"train_loss": 0.0006939831655472517, "global_step": 49767, "epoch": 418, "lr": 2.126333362451322e-05} +{"train_loss": 0.0006661209044978023, "global_step": 49768, "epoch": 418, "lr": 2.126152061088735e-05} +{"train_loss": 0.0006146999076008797, "global_step": 49769, "epoch": 418, "lr": 2.1259707653686427e-05} +{"train_loss": 0.0014526373706758022, "global_step": 49770, "epoch": 418, "lr": 2.1257894752913982e-05} +{"train_loss": 0.0009979305323213339, "global_step": 49771, "epoch": 418, "lr": 2.1256081908573604e-05} +{"train_loss": 0.00041090097511187196, "global_step": 49772, "epoch": 418, "lr": 2.1254269120668845e-05} +{"train_loss": 0.0008282954222522676, "global_step": 49773, "epoch": 418, "lr": 2.1252456389203233e-05} +{"train_loss": 0.0013192537007853389, "global_step": 49774, "epoch": 418, "lr": 2.1250643714180373e-05} +{"train_loss": 0.0005521131097339094, "global_step": 49775, "epoch": 418, "lr": 2.124883109560379e-05} +{"train_loss": 0.001258905977010727, "global_step": 49776, "epoch": 418, "lr": 2.1247018533477065e-05} +{"train_loss": 0.000475080480100587, "global_step": 49777, "epoch": 418, "lr": 2.124520602780375e-05} +{"train_loss": 0.0007705622701905668, "global_step": 49778, "epoch": 418, "lr": 2.1243393578587384e-05} +{"train_loss": 0.0008741557830944657, "global_step": 49779, "epoch": 418, "lr": 2.124158118583156e-05} +{"train_loss": 0.0005323991645127535, "global_step": 49780, "epoch": 418, "lr": 2.1239768849539797e-05} +{"train_loss": 0.001263667712919414, "global_step": 49781, "epoch": 418, "lr": 2.12379565697157e-05} +{"train_loss": 0.000655852141790092, "global_step": 49782, "epoch": 418, "lr": 2.123614434636278e-05} +{"train_loss": 0.0016055010491982102, "global_step": 49783, "epoch": 418, "lr": 2.123433217948464e-05} +{"train_loss": 0.000932984403334558, "global_step": 49784, "epoch": 418, "lr": 2.123252006908481e-05} +{"train_loss": 0.0008750759880058467, "global_step": 49785, "epoch": 418, "lr": 2.1230708015166838e-05} +{"train_loss": 0.0011088543105870485, "global_step": 49786, "epoch": 418, "lr": 2.1228896017734317e-05} +{"train_loss": 0.0005337590118870139, "global_step": 49787, "epoch": 418, "lr": 2.1227084076790765e-05} +{"train_loss": 0.0006425354513339698, "global_step": 49788, "epoch": 418, "lr": 2.1225272192339778e-05} +{"train_loss": 0.0012593622086569667, "global_step": 49789, "epoch": 418, "lr": 2.122346036438487e-05} +{"train_loss": 0.0007991746533662081, "global_step": 49790, "epoch": 418, "lr": 2.1221648592929655e-05} +{"train_loss": 0.0005573331727646291, "global_step": 49791, "epoch": 418, "lr": 2.121983687797765e-05} +{"train_loss": 0.0010012895800173283, "global_step": 49792, "epoch": 418, "lr": 2.1218025219532404e-05} +{"train_loss": 0.0009875595569610596, "global_step": 49793, "epoch": 418, "lr": 2.1216213617597506e-05} +{"train_loss": 0.0008863914990797639, "global_step": 49794, "epoch": 418, "lr": 2.1214402072176487e-05} +{"train_loss": 0.0006060742889530957, "global_step": 49795, "epoch": 418, "lr": 2.1212590583272922e-05} +{"train_loss": 0.0016347606433555484, "global_step": 49796, "epoch": 418, "lr": 2.1210779150890347e-05} +{"train_loss": 0.0004657902172766626, "global_step": 49797, "epoch": 418, "lr": 2.1208967775032334e-05} +{"train_loss": 0.0006806242163293064, "global_step": 49798, "epoch": 418, "lr": 2.1207156455702454e-05} +{"train_loss": 0.0012213371228426695, "global_step": 49799, "epoch": 418, "lr": 2.1205345192904223e-05} +{"train_loss": 0.0010256365640088916, "global_step": 49800, "epoch": 418, "lr": 2.1203533986641244e-05} +{"train_loss": 0.0010447631357237697, "global_step": 49801, "epoch": 418, "lr": 2.120172283691703e-05} +{"train_loss": 0.000481747614685446, "global_step": 49802, "epoch": 418, "lr": 2.1199911743735172e-05} +{"train_loss": 0.0008021030225791037, "global_step": 49803, "epoch": 418, "lr": 2.1198100707099218e-05} +{"train_loss": 0.0009745113202370703, "global_step": 49804, "epoch": 418, "lr": 2.119628972701269e-05} +{"train_loss": 0.0006039759027771652, "global_step": 49805, "epoch": 418, "lr": 2.119447880347919e-05} +{"train_loss": 0.0009623558144085109, "global_step": 49806, "epoch": 418, "lr": 2.1192667936502236e-05} +{"train_loss": 0.0006679336656816304, "global_step": 49807, "epoch": 418, "lr": 2.119085712608542e-05} +{"train_loss": 0.0009199511841870844, "global_step": 49808, "epoch": 418, "lr": 2.1189046372232263e-05} +{"train_loss": 0.0011916373623535037, "global_step": 49809, "epoch": 418, "lr": 2.1187235674946347e-05} +{"train_loss": 0.00100581010337919, "global_step": 49810, "epoch": 418, "lr": 2.118542503423122e-05} +{"train_loss": 0.0011037278454750776, "global_step": 49811, "epoch": 418, "lr": 2.118361445009041e-05} +{"train_loss": 0.0009881812147796154, "global_step": 49812, "epoch": 418, "lr": 2.1181803922527523e-05} +{"train_loss": 0.000923950516153127, "global_step": 49813, "epoch": 418, "lr": 2.1179993451546056e-05} +{"train_loss": 0.0004345775523688644, "global_step": 49814, "epoch": 418, "lr": 2.117818303714961e-05} +{"train_loss": 0.0003371747152414173, "global_step": 49815, "epoch": 418, "lr": 2.117637267934173e-05} +{"train_loss": 0.0006017790292389691, "global_step": 49816, "epoch": 418, "lr": 2.1174562378125945e-05} +{"train_loss": 0.0011333785951137543, "global_step": 49817, "epoch": 418, "lr": 2.117275213350584e-05} +{"train_loss": 0.0010817889124155045, "global_step": 49818, "epoch": 418, "lr": 2.117094194548494e-05} +{"train_loss": 0.0005424643750302494, "global_step": 49819, "epoch": 418, "lr": 2.1169131814066833e-05} +{"train_loss": 0.001238231430761516, "global_step": 49820, "epoch": 418, "lr": 2.1167321739255042e-05} +{"train_loss": 0.000430135551141575, "global_step": 49821, "epoch": 418, "lr": 2.116551172105315e-05} +{"train_loss": 0.0015335590578615665, "global_step": 49822, "epoch": 418, "lr": 2.1163701759464694e-05} +{"train_loss": 0.0005498267128132284, "global_step": 49823, "epoch": 418, "lr": 2.116189185449321e-05} +{"train_loss": 0.0008350194548256695, "global_step": 49824, "epoch": 418, "lr": 2.116008200614229e-05} +{"train_loss": 0.0011896403739228845, "global_step": 49825, "epoch": 418, "lr": 2.1158272214415447e-05} +{"train_loss": 0.0005221033934503794, "global_step": 49826, "epoch": 418, "lr": 2.115646247931628e-05} +{"train_loss": 0.0013863173080608249, "global_step": 49827, "epoch": 418, "lr": 2.1154652800848294e-05} +{"train_loss": 0.00046591449063271284, "global_step": 49828, "epoch": 418, "lr": 2.1152843179015087e-05} +{"train_loss": 0.0008755248272791505, "global_step": 49829, "epoch": 418, "lr": 2.115103361382017e-05} +{"train_loss": 0.0015128630911931396, "global_step": 49830, "epoch": 418, "lr": 2.1149224105267133e-05} +{"train_loss": 0.0008963603177107871, "global_step": 49831, "epoch": 418, "lr": 2.11474146533595e-05} +{"train_loss": 0.0009108544327318668, "global_step": 49832, "epoch": 418, "lr": 2.1145605258100832e-05} +{"train_loss": 0.002090137917548418, "global_step": 49833, "epoch": 418, "lr": 2.1143795919494704e-05} +{"train_loss": 0.0017344742082059383, "global_step": 49834, "epoch": 418, "lr": 2.1141986637544647e-05} +{"train_loss": 0.0008575530373491347, "global_step": 49835, "epoch": 418, "lr": 2.1140177412254197e-05} +{"train_loss": 0.0010623799171298742, "global_step": 49836, "epoch": 418, "lr": 2.113836824362695e-05} +{"train_loss": 0.0005489870673045516, "global_step": 49837, "epoch": 418, "lr": 2.113655913166641e-05} +{"train_loss": 0.0007400619215331972, "global_step": 49838, "epoch": 418, "lr": 2.1134750076376174e-05} +{"train_loss": 0.001028992235660553, "global_step": 49839, "epoch": 418, "lr": 2.1132941077759753e-05} +{"train_loss": 0.0009236258338205516, "global_step": 49840, "epoch": 418, "lr": 2.1131132135820736e-05} +{"train_loss": 0.0004715413670055568, "global_step": 49841, "epoch": 418, "lr": 2.112932325056266e-05} +{"train_loss": 0.0015579656464979053, "global_step": 49842, "epoch": 418, "lr": 2.1127514421989052e-05} +{"train_loss": 0.0014005147386342287, "global_step": 49843, "epoch": 418, "lr": 2.1125705650103507e-05} +{"train_loss": 0.001288103754632175, "global_step": 49844, "epoch": 418, "lr": 2.112389693490953e-05} +{"train_loss": 0.0005530172493308783, "global_step": 49845, "epoch": 418, "lr": 2.1122088276410716e-05} +{"train_loss": 0.0007408075616694987, "global_step": 49846, "epoch": 418, "lr": 2.11202796746106e-05} +{"train_loss": 0.0007796298596076667, "global_step": 49847, "epoch": 418, "lr": 2.111847112951271e-05} +{"train_loss": 0.0010831296676769853, "global_step": 49848, "epoch": 418, "lr": 2.1116662641120634e-05} +{"train_loss": 0.0017334643052890897, "global_step": 49849, "epoch": 418, "lr": 2.111485420943789e-05} +{"train_loss": 0.0013334477553144097, "global_step": 49850, "epoch": 418, "lr": 2.1113045834468053e-05} +{"train_loss": 0.0013582578394562006, "global_step": 49851, "epoch": 418, "lr": 2.1111237516214655e-05} +{"train_loss": 0.0009266838314943016, "global_step": 49852, "epoch": 418, "lr": 2.1109429254681273e-05} +{"train_loss": 0.0012256358750164509, "global_step": 49853, "epoch": 418, "lr": 2.1107621049871435e-05} +{"train_loss": 0.002333930227905512, "global_step": 49854, "epoch": 418, "lr": 2.1105812901788684e-05} +{"train_loss": 0.0015439963899552822, "global_step": 49855, "epoch": 418, "lr": 2.1104004810436595e-05} +{"train_loss": 0.0005426742136478424, "global_step": 49856, "epoch": 418, "lr": 2.1102196775818695e-05} +{"train_loss": 0.0008868139120750129, "global_step": 49857, "epoch": 418, "lr": 2.1100388797938558e-05} +{"train_loss": 0.000547198171261698, "global_step": 49858, "epoch": 418, "lr": 2.10985808767997e-05} +{"train_loss": 0.0005742686917074025, "global_step": 49859, "epoch": 418, "lr": 2.1096773012405713e-05} +{"train_loss": 0.0009675066631498645, "global_step": 49860, "epoch": 418, "lr": 2.1094965204760103e-05, "val_loss": 0.011764134280383587} +{"train_loss": 0.0006381116108968854, "global_step": 49861, "epoch": 419, "lr": 2.109315745386646e-05} +{"train_loss": 0.0007775667472742498, "global_step": 49862, "epoch": 419, "lr": 2.1091349759728296e-05} +{"train_loss": 0.0015568082453683019, "global_step": 49863, "epoch": 419, "lr": 2.10895421223492e-05} +{"train_loss": 0.0019643171690404415, "global_step": 49864, "epoch": 419, "lr": 2.1087734541732672e-05} +{"train_loss": 0.0016744837630540133, "global_step": 49865, "epoch": 419, "lr": 2.1085927017882314e-05} +{"train_loss": 0.0011979888658970594, "global_step": 49866, "epoch": 419, "lr": 2.1084119550801628e-05} +{"train_loss": 0.0015100711025297642, "global_step": 49867, "epoch": 419, "lr": 2.1082312140494203e-05} +{"train_loss": 0.0012618610635399818, "global_step": 49868, "epoch": 419, "lr": 2.108050478696355e-05} +{"train_loss": 0.0019991479348391294, "global_step": 49869, "epoch": 419, "lr": 2.1078697490213258e-05} +{"train_loss": 0.0008966724271886051, "global_step": 49870, "epoch": 419, "lr": 2.1076890250246832e-05} +{"train_loss": 0.0009908243082463741, "global_step": 49871, "epoch": 419, "lr": 2.1075083067067863e-05} +{"train_loss": 0.0012062665773555636, "global_step": 49872, "epoch": 419, "lr": 2.1073275940679875e-05} +{"train_loss": 0.0011446804273873568, "global_step": 49873, "epoch": 419, "lr": 2.10714688710864e-05} +{"train_loss": 0.0009353805216960609, "global_step": 49874, "epoch": 419, "lr": 2.1069661858291027e-05} +{"train_loss": 0.0007490211864933372, "global_step": 49875, "epoch": 419, "lr": 2.106785490229727e-05} +{"train_loss": 0.0014042857801541686, "global_step": 49876, "epoch": 419, "lr": 2.1066048003108695e-05} +{"train_loss": 0.0009282567189075053, "global_step": 49877, "epoch": 419, "lr": 2.106424116072883e-05} +{"train_loss": 0.0012487559579312801, "global_step": 49878, "epoch": 419, "lr": 2.106243437516126e-05} +{"train_loss": 0.0008328264229930937, "global_step": 49879, "epoch": 419, "lr": 2.1060627646409504e-05} +{"train_loss": 0.0008170216460712254, "global_step": 49880, "epoch": 419, "lr": 2.1058820974477095e-05} +{"train_loss": 0.000688812171574682, "global_step": 49881, "epoch": 419, "lr": 2.1057014359367616e-05} +{"train_loss": 0.0008997998083941638, "global_step": 49882, "epoch": 419, "lr": 2.105520780108458e-05} +{"train_loss": 0.0014299761969596148, "global_step": 49883, "epoch": 419, "lr": 2.105340129963157e-05} +{"train_loss": 0.0010892899008467793, "global_step": 49884, "epoch": 419, "lr": 2.1051594855012113e-05} +{"train_loss": 0.0012691979063674808, "global_step": 49885, "epoch": 419, "lr": 2.1049788467229744e-05} +{"train_loss": 0.0012669970747083426, "global_step": 49886, "epoch": 419, "lr": 2.1047982136288035e-05} +{"train_loss": 0.0012718592770397663, "global_step": 49887, "epoch": 419, "lr": 2.1046175862190504e-05} +{"train_loss": 0.00218117143958807, "global_step": 49888, "epoch": 419, "lr": 2.1044369644940732e-05} +{"train_loss": 0.000938732351642102, "global_step": 49889, "epoch": 419, "lr": 2.1042563484542226e-05} +{"train_loss": 0.0014078806852921844, "global_step": 49890, "epoch": 419, "lr": 2.104075738099857e-05} +{"train_loss": 0.0011873252224177122, "global_step": 49891, "epoch": 419, "lr": 2.1038951334313295e-05} +{"train_loss": 0.0011643623001873493, "global_step": 49892, "epoch": 419, "lr": 2.1037145344489928e-05} +{"train_loss": 0.0011102192802354693, "global_step": 49893, "epoch": 419, "lr": 2.1035339411532033e-05} +{"train_loss": 0.0010364451445639133, "global_step": 49894, "epoch": 419, "lr": 2.103353353544317e-05} +{"train_loss": 0.0007334850379265845, "global_step": 49895, "epoch": 419, "lr": 2.103172771622685e-05} +{"train_loss": 0.0010273701045662165, "global_step": 49896, "epoch": 419, "lr": 2.1029921953886663e-05} +{"train_loss": 0.0011753980070352554, "global_step": 49897, "epoch": 419, "lr": 2.1028116248426107e-05} +{"train_loss": 0.0005636299028992653, "global_step": 49898, "epoch": 419, "lr": 2.1026310599848763e-05} +{"train_loss": 0.0008176890551112592, "global_step": 49899, "epoch": 419, "lr": 2.1024505008158152e-05} +{"train_loss": 0.0019958699122071266, "global_step": 49900, "epoch": 419, "lr": 2.1022699473357842e-05} +{"train_loss": 0.0013954929308965802, "global_step": 49901, "epoch": 419, "lr": 2.1020893995451353e-05} +{"train_loss": 0.0010259903501719236, "global_step": 49902, "epoch": 419, "lr": 2.1019088574442258e-05} +{"train_loss": 0.0008008488221094012, "global_step": 49903, "epoch": 419, "lr": 2.1017283210334086e-05} +{"train_loss": 0.0008949808543547988, "global_step": 49904, "epoch": 419, "lr": 2.1015477903130367e-05} +{"train_loss": 0.0007056320318952203, "global_step": 49905, "epoch": 419, "lr": 2.101367265283467e-05} +{"train_loss": 0.0008303623180836439, "global_step": 49906, "epoch": 419, "lr": 2.1011867459450523e-05} +{"train_loss": 0.0009207972325384617, "global_step": 49907, "epoch": 419, "lr": 2.101006232298149e-05} +{"train_loss": 0.0005572105874307454, "global_step": 49908, "epoch": 419, "lr": 2.1008257243431085e-05} +{"train_loss": 0.0006653897580690682, "global_step": 49909, "epoch": 419, "lr": 2.1006452220802887e-05} +{"train_loss": 0.0011376688489690423, "global_step": 49910, "epoch": 419, "lr": 2.1004647255100422e-05} +{"train_loss": 0.0013007170055061579, "global_step": 49911, "epoch": 419, "lr": 2.1002842346327218e-05} +{"train_loss": 0.0014125212328508496, "global_step": 49912, "epoch": 419, "lr": 2.1001037494486853e-05} +{"train_loss": 0.00046685762936249375, "global_step": 49913, "epoch": 419, "lr": 2.0999232699582832e-05} +{"train_loss": 0.0006865102332085371, "global_step": 49914, "epoch": 419, "lr": 2.099742796161874e-05} +{"train_loss": 0.0009905562037602067, "global_step": 49915, "epoch": 419, "lr": 2.0995623280598104e-05} +{"train_loss": 0.001519315061159432, "global_step": 49916, "epoch": 419, "lr": 2.0993818656524437e-05} +{"train_loss": 0.0007994204643182456, "global_step": 49917, "epoch": 419, "lr": 2.099201408940133e-05} +{"train_loss": 0.0010184708517044783, "global_step": 49918, "epoch": 419, "lr": 2.099020957923229e-05} +{"train_loss": 0.0006877181585878134, "global_step": 49919, "epoch": 419, "lr": 2.098840512602089e-05} +{"train_loss": 0.0006758218514733016, "global_step": 49920, "epoch": 419, "lr": 2.0986600729770634e-05} +{"train_loss": 0.0007903901278041303, "global_step": 49921, "epoch": 419, "lr": 2.0984796390485108e-05} +{"train_loss": 0.00040262783295474946, "global_step": 49922, "epoch": 419, "lr": 2.0982992108167836e-05} +{"train_loss": 0.0005894641508348286, "global_step": 49923, "epoch": 419, "lr": 2.098118788282234e-05} +{"train_loss": 0.0009023156017065048, "global_step": 49924, "epoch": 419, "lr": 2.09793837144522e-05} +{"train_loss": 0.0008835041080601513, "global_step": 49925, "epoch": 419, "lr": 2.0977579603060926e-05} +{"train_loss": 0.0006718937656842172, "global_step": 49926, "epoch": 419, "lr": 2.0975775548652088e-05} +{"train_loss": 0.0008872948819771409, "global_step": 49927, "epoch": 419, "lr": 2.0973971551229195e-05} +{"train_loss": 0.0005170137737877667, "global_step": 49928, "epoch": 419, "lr": 2.0972167610795823e-05} +{"train_loss": 0.0010324427857995033, "global_step": 49929, "epoch": 419, "lr": 2.0970363727355486e-05} +{"train_loss": 0.000730907719116658, "global_step": 49930, "epoch": 419, "lr": 2.096855990091174e-05} +{"train_loss": 0.0006731221219524741, "global_step": 49931, "epoch": 419, "lr": 2.0966756131468136e-05} +{"train_loss": 0.0006333388737402856, "global_step": 49932, "epoch": 419, "lr": 2.096495241902819e-05} +{"train_loss": 0.0006969990790821612, "global_step": 49933, "epoch": 419, "lr": 2.0963148763595476e-05} +{"train_loss": 0.0005273397546261549, "global_step": 49934, "epoch": 419, "lr": 2.0961345165173517e-05} +{"train_loss": 0.0011374112218618393, "global_step": 49935, "epoch": 419, "lr": 2.0959541623765837e-05} +{"train_loss": 0.0005718323518522084, "global_step": 49936, "epoch": 419, "lr": 2.0957738139376014e-05} +{"train_loss": 0.0007829836686141789, "global_step": 49937, "epoch": 419, "lr": 2.095593471200755e-05} +{"train_loss": 0.0008374864119105041, "global_step": 49938, "epoch": 419, "lr": 2.0954131341664025e-05} +{"train_loss": 0.0005514348158612847, "global_step": 49939, "epoch": 419, "lr": 2.095232802834894e-05} +{"train_loss": 0.0010040317429229617, "global_step": 49940, "epoch": 419, "lr": 2.095052477206587e-05} +{"train_loss": 0.0005942294374108315, "global_step": 49941, "epoch": 419, "lr": 2.094872157281835e-05} +{"train_loss": 0.0008609390933997929, "global_step": 49942, "epoch": 419, "lr": 2.0946918430609887e-05} +{"train_loss": 0.0011912414338439703, "global_step": 49943, "epoch": 419, "lr": 2.0945115345444066e-05} +{"train_loss": 0.0005841106176376343, "global_step": 49944, "epoch": 419, "lr": 2.0943312317324386e-05} +{"train_loss": 0.0005333365988917649, "global_step": 49945, "epoch": 419, "lr": 2.094150934625443e-05} +{"train_loss": 0.0005893263733014464, "global_step": 49946, "epoch": 419, "lr": 2.09397064322377e-05} +{"train_loss": 0.0007748848292976618, "global_step": 49947, "epoch": 419, "lr": 2.093790357527776e-05} +{"train_loss": 0.0007338094292208552, "global_step": 49948, "epoch": 419, "lr": 2.0936100775378152e-05} +{"train_loss": 0.001013073488138616, "global_step": 49949, "epoch": 419, "lr": 2.093429803254238e-05} +{"train_loss": 0.0005585750914178789, "global_step": 49950, "epoch": 419, "lr": 2.0932495346774035e-05} +{"train_loss": 0.001075361855328083, "global_step": 49951, "epoch": 419, "lr": 2.09306927180766e-05} +{"train_loss": 0.0008050810429267585, "global_step": 49952, "epoch": 419, "lr": 2.0928890146453672e-05} +{"train_loss": 0.0009294273913837969, "global_step": 49953, "epoch": 419, "lr": 2.092708763190876e-05} +{"train_loss": 0.0008516745874658227, "global_step": 49954, "epoch": 419, "lr": 2.0925285174445385e-05} +{"train_loss": 0.0009465755429118872, "global_step": 49955, "epoch": 419, "lr": 2.0923482774067128e-05} +{"train_loss": 0.00041001258068718016, "global_step": 49956, "epoch": 419, "lr": 2.0921680430777486e-05} +{"train_loss": 0.0007185955764725804, "global_step": 49957, "epoch": 419, "lr": 2.0919878144580036e-05} +{"train_loss": 0.0006127304513938725, "global_step": 49958, "epoch": 419, "lr": 2.091807591547828e-05} +{"train_loss": 0.0007185134454630315, "global_step": 49959, "epoch": 419, "lr": 2.0916273743475788e-05} +{"train_loss": 0.0008873340557329357, "global_step": 49960, "epoch": 419, "lr": 2.0914471628576078e-05} +{"train_loss": 0.0007894137524999678, "global_step": 49961, "epoch": 419, "lr": 2.0912669570782705e-05} +{"train_loss": 0.000679522636346519, "global_step": 49962, "epoch": 419, "lr": 2.0910867570099184e-05} +{"train_loss": 0.0007923489320091903, "global_step": 49963, "epoch": 419, "lr": 2.0909065626529085e-05} +{"train_loss": 0.0006491284584626555, "global_step": 49964, "epoch": 419, "lr": 2.090726374007591e-05} +{"train_loss": 0.0008176051778718829, "global_step": 49965, "epoch": 419, "lr": 2.090546191074323e-05} +{"train_loss": 0.0008158363634720445, "global_step": 49966, "epoch": 419, "lr": 2.0903660138534554e-05} +{"train_loss": 0.0011761587811633945, "global_step": 49967, "epoch": 419, "lr": 2.0901858423453447e-05} +{"train_loss": 0.0011240739841014147, "global_step": 49968, "epoch": 419, "lr": 2.0900056765503413e-05} +{"train_loss": 0.0007839949103072286, "global_step": 49969, "epoch": 419, "lr": 2.089825516468803e-05} +{"train_loss": 0.0007930038846097887, "global_step": 49970, "epoch": 419, "lr": 2.089645362101079e-05} +{"train_loss": 0.0009267092682421207, "global_step": 49971, "epoch": 419, "lr": 2.089465213447528e-05} +{"train_loss": 0.0016753652598708868, "global_step": 49972, "epoch": 419, "lr": 2.0892850705085005e-05} +{"train_loss": 0.0017380891367793083, "global_step": 49973, "epoch": 419, "lr": 2.0891049332843492e-05} +{"train_loss": 0.001645639888010919, "global_step": 49974, "epoch": 419, "lr": 2.0889248017754313e-05} +{"train_loss": 0.001865097670815885, "global_step": 49975, "epoch": 419, "lr": 2.0887446759820966e-05} +{"train_loss": 0.0005151999648660421, "global_step": 49976, "epoch": 419, "lr": 2.088564555904703e-05} +{"train_loss": 0.0010085311951115727, "global_step": 49977, "epoch": 419, "lr": 2.0883844415435995e-05} +{"train_loss": 0.0008499691030010581, "global_step": 49978, "epoch": 419, "lr": 2.088204332899144e-05} +{"train_loss": 0.0009704704725128762, "global_step": 49979, "epoch": 419, "lr": 2.0880242299716878e-05, "val_loss": 0.013186819851398468} +{"train_loss": 0.000821173598524183, "global_step": 49980, "epoch": 420, "lr": 2.087844132761584e-05} +{"train_loss": 0.000448618084192276, "global_step": 49981, "epoch": 420, "lr": 2.0876640412691883e-05} +{"train_loss": 0.0010181679390370846, "global_step": 49982, "epoch": 420, "lr": 2.0874839554948515e-05} +{"train_loss": 0.0015530358068645, "global_step": 49983, "epoch": 420, "lr": 2.0873038754389307e-05} +{"train_loss": 0.0006388102774508297, "global_step": 49984, "epoch": 420, "lr": 2.0871238011017773e-05} +{"train_loss": 0.001039945986121893, "global_step": 49985, "epoch": 420, "lr": 2.086943732483744e-05} +{"train_loss": 0.0014954576035961509, "global_step": 49986, "epoch": 420, "lr": 2.0867636695851862e-05} +{"train_loss": 0.0009040497243404388, "global_step": 49987, "epoch": 420, "lr": 2.0865836124064558e-05} +{"train_loss": 0.0009965284261852503, "global_step": 49988, "epoch": 420, "lr": 2.086403560947909e-05} +{"train_loss": 0.001133828773163259, "global_step": 49989, "epoch": 420, "lr": 2.0862235152098946e-05} +{"train_loss": 0.001116111408919096, "global_step": 49990, "epoch": 420, "lr": 2.086043475192772e-05} +{"train_loss": 0.00045907465391792357, "global_step": 49991, "epoch": 420, "lr": 2.0858634408968896e-05} +{"train_loss": 0.0011537600075826049, "global_step": 49992, "epoch": 420, "lr": 2.0856834123226048e-05} +{"train_loss": 0.0013626186409965158, "global_step": 49993, "epoch": 420, "lr": 2.0855033894702674e-05} +{"train_loss": 0.0007940256618894637, "global_step": 49994, "epoch": 420, "lr": 2.0853233723402345e-05} +{"train_loss": 0.0007487384718842804, "global_step": 49995, "epoch": 420, "lr": 2.0851433609328562e-05} +{"train_loss": 0.0010764173930510879, "global_step": 49996, "epoch": 420, "lr": 2.084963355248489e-05} +{"train_loss": 0.0010778912110254169, "global_step": 49997, "epoch": 420, "lr": 2.0847833552874835e-05} +{"train_loss": 0.0013029301771894097, "global_step": 49998, "epoch": 420, "lr": 2.0846033610501958e-05} +{"train_loss": 0.001494328840635717, "global_step": 49999, "epoch": 420, "lr": 2.084423372536976e-05} +{"train_loss": 0.0006950954557396472, "global_step": 50000, "epoch": 420, "lr": 2.0842433897481815e-05} +{"train_loss": 0.0016043710056692362, "global_step": 50001, "epoch": 420, "lr": 2.084063412684162e-05} +{"train_loss": 0.000955062685534358, "global_step": 50002, "epoch": 420, "lr": 2.083883441345274e-05} +{"train_loss": 0.0010357442079111934, "global_step": 50003, "epoch": 420, "lr": 2.0837034757318697e-05} +{"train_loss": 0.0006011262885294855, "global_step": 50004, "epoch": 420, "lr": 2.0835235158442994e-05} +{"train_loss": 0.0013629578752443194, "global_step": 50005, "epoch": 420, "lr": 2.0833435616829218e-05} +{"train_loss": 0.0010296410182490945, "global_step": 50006, "epoch": 420, "lr": 2.0831636132480853e-05} +{"train_loss": 0.0009357777889817953, "global_step": 50007, "epoch": 420, "lr": 2.0829836705401473e-05} +{"train_loss": 0.0011604542378336191, "global_step": 50008, "epoch": 420, "lr": 2.0828037335594575e-05} +{"train_loss": 0.001008115243166685, "global_step": 50009, "epoch": 420, "lr": 2.0826238023063726e-05} +{"train_loss": 0.0006897636339999735, "global_step": 50010, "epoch": 420, "lr": 2.0824438767812443e-05} +{"train_loss": 0.0007986334967426956, "global_step": 50011, "epoch": 420, "lr": 2.0822639569844237e-05} +{"train_loss": 0.0009086335776373744, "global_step": 50012, "epoch": 420, "lr": 2.0820840429162682e-05} +{"train_loss": 0.0008835020125843585, "global_step": 50013, "epoch": 420, "lr": 2.0819041345771267e-05} +{"train_loss": 0.0011648659128695726, "global_step": 50014, "epoch": 420, "lr": 2.0817242319673568e-05} +{"train_loss": 0.001200465951114893, "global_step": 50015, "epoch": 420, "lr": 2.0815443350873097e-05} +{"train_loss": 0.0011543447617441416, "global_step": 50016, "epoch": 420, "lr": 2.0813644439373365e-05} +{"train_loss": 0.0007310596411116421, "global_step": 50017, "epoch": 420, "lr": 2.0811845585177942e-05} +{"train_loss": 0.00046683367691002786, "global_step": 50018, "epoch": 420, "lr": 2.0810046788290326e-05} +{"train_loss": 0.0009319488890469074, "global_step": 50019, "epoch": 420, "lr": 2.080824804871408e-05} +{"train_loss": 0.0016836051363497972, "global_step": 50020, "epoch": 420, "lr": 2.0806449366452706e-05} +{"train_loss": 0.0005968500627204776, "global_step": 50021, "epoch": 420, "lr": 2.0804650741509766e-05} +{"train_loss": 0.0006005887989886105, "global_step": 50022, "epoch": 420, "lr": 2.0802852173888775e-05} +{"train_loss": 0.000735882727894932, "global_step": 50023, "epoch": 420, "lr": 2.0801053663593246e-05} +{"train_loss": 0.0007413545972667634, "global_step": 50024, "epoch": 420, "lr": 2.0799255210626746e-05} +{"train_loss": 0.0008946076268330216, "global_step": 50025, "epoch": 420, "lr": 2.0797456814992772e-05} +{"train_loss": 0.001031308900564909, "global_step": 50026, "epoch": 420, "lr": 2.0795658476694872e-05} +{"train_loss": 0.0005616014241240919, "global_step": 50027, "epoch": 420, "lr": 2.0793860195736593e-05} +{"train_loss": 0.0005384184187278152, "global_step": 50028, "epoch": 420, "lr": 2.0792061972121435e-05} +{"train_loss": 0.0009924067417159677, "global_step": 50029, "epoch": 420, "lr": 2.0790263805852955e-05} +{"train_loss": 0.0005616911803372204, "global_step": 50030, "epoch": 420, "lr": 2.078846569693466e-05} +{"train_loss": 0.0014899318339303136, "global_step": 50031, "epoch": 420, "lr": 2.0786667645370105e-05} +{"train_loss": 0.0008261848124675453, "global_step": 50032, "epoch": 420, "lr": 2.0784869651162792e-05} +{"train_loss": 0.0007484440575353801, "global_step": 50033, "epoch": 420, "lr": 2.0783071714316283e-05} +{"train_loss": 0.0009543965570628643, "global_step": 50034, "epoch": 420, "lr": 2.078127383483409e-05} +{"train_loss": 0.0007527709822170436, "global_step": 50035, "epoch": 420, "lr": 2.077947601271973e-05} +{"train_loss": 0.0010497968178242445, "global_step": 50036, "epoch": 420, "lr": 2.077767824797676e-05} +{"train_loss": 0.0009510646341368556, "global_step": 50037, "epoch": 420, "lr": 2.0775880540608683e-05} +{"train_loss": 0.0005777503247372806, "global_step": 50038, "epoch": 420, "lr": 2.0774082890619056e-05} +{"train_loss": 0.0007448414107784629, "global_step": 50039, "epoch": 420, "lr": 2.0772285298011378e-05} +{"train_loss": 0.001432333723641932, "global_step": 50040, "epoch": 420, "lr": 2.077048776278922e-05} +{"train_loss": 0.0008163026650436223, "global_step": 50041, "epoch": 420, "lr": 2.0768690284956076e-05} +{"train_loss": 0.0008913531200960279, "global_step": 50042, "epoch": 420, "lr": 2.0766892864515474e-05} +{"train_loss": 0.0005592580419033766, "global_step": 50043, "epoch": 420, "lr": 2.0765095501470978e-05} +{"train_loss": 0.0009855100652202964, "global_step": 50044, "epoch": 420, "lr": 2.0763298195826065e-05} +{"train_loss": 0.0011398742208257318, "global_step": 50045, "epoch": 420, "lr": 2.0761500947584318e-05} +{"train_loss": 0.0004978993674740195, "global_step": 50046, "epoch": 420, "lr": 2.0759703756749215e-05} +{"train_loss": 0.0007161240791901946, "global_step": 50047, "epoch": 420, "lr": 2.0757906623324336e-05} +{"train_loss": 0.0004277163534425199, "global_step": 50048, "epoch": 420, "lr": 2.075610954731318e-05} +{"train_loss": 0.0006707512075081468, "global_step": 50049, "epoch": 420, "lr": 2.075431252871926e-05} +{"train_loss": 0.0005671213148161769, "global_step": 50050, "epoch": 420, "lr": 2.0752515567546138e-05} +{"train_loss": 0.0008112283539958298, "global_step": 50051, "epoch": 420, "lr": 2.0750718663797315e-05} +{"train_loss": 0.0017183185555040836, "global_step": 50052, "epoch": 420, "lr": 2.0748921817476347e-05} +{"train_loss": 0.0014142629224807024, "global_step": 50053, "epoch": 420, "lr": 2.0747125028586744e-05} +{"train_loss": 0.0007165762363001704, "global_step": 50054, "epoch": 420, "lr": 2.0745328297132022e-05} +{"train_loss": 0.0006895724218338728, "global_step": 50055, "epoch": 420, "lr": 2.0743531623115736e-05} +{"train_loss": 0.0006941045285202563, "global_step": 50056, "epoch": 420, "lr": 2.074173500654138e-05} +{"train_loss": 0.00048066378803923726, "global_step": 50057, "epoch": 420, "lr": 2.073993844741253e-05} +{"train_loss": 0.0013623697450384498, "global_step": 50058, "epoch": 420, "lr": 2.0738141945732654e-05} +{"train_loss": 0.0007556673954240978, "global_step": 50059, "epoch": 420, "lr": 2.0736345501505335e-05} +{"train_loss": 0.00042099482379853725, "global_step": 50060, "epoch": 420, "lr": 2.073454911473406e-05} +{"train_loss": 0.0005036129732616246, "global_step": 50061, "epoch": 420, "lr": 2.0732752785422367e-05} +{"train_loss": 0.0005394776817411184, "global_step": 50062, "epoch": 420, "lr": 2.07309565135738e-05} +{"train_loss": 0.0009398470283485949, "global_step": 50063, "epoch": 420, "lr": 2.0729160299191863e-05} +{"train_loss": 0.0006376251112669706, "global_step": 50064, "epoch": 420, "lr": 2.0727364142280108e-05} +{"train_loss": 0.0011040779063478112, "global_step": 50065, "epoch": 420, "lr": 2.072556804284203e-05} +{"train_loss": 0.0004100686637684703, "global_step": 50066, "epoch": 420, "lr": 2.0723772000881185e-05} +{"train_loss": 0.0009379197144880891, "global_step": 50067, "epoch": 420, "lr": 2.072197601640109e-05} +{"train_loss": 0.00047546427231281996, "global_step": 50068, "epoch": 420, "lr": 2.072018008940525e-05} +{"train_loss": 0.0012002673465758562, "global_step": 50069, "epoch": 420, "lr": 2.0718384219897225e-05} +{"train_loss": 0.0004620934196282178, "global_step": 50070, "epoch": 420, "lr": 2.0716588407880504e-05} +{"train_loss": 0.0004185716388747096, "global_step": 50071, "epoch": 420, "lr": 2.0714792653358656e-05} +{"train_loss": 0.000872443022672087, "global_step": 50072, "epoch": 420, "lr": 2.071299695633518e-05} +{"train_loss": 0.0014062527334317565, "global_step": 50073, "epoch": 420, "lr": 2.0711201316813587e-05} +{"train_loss": 0.0015645845560356975, "global_step": 50074, "epoch": 420, "lr": 2.0709405734797442e-05} +{"train_loss": 0.000492995954118669, "global_step": 50075, "epoch": 420, "lr": 2.070761021029023e-05} +{"train_loss": 0.0010148652363568544, "global_step": 50076, "epoch": 420, "lr": 2.0705814743295514e-05} +{"train_loss": 0.0010986935812979937, "global_step": 50077, "epoch": 420, "lr": 2.0704019333816788e-05} +{"train_loss": 0.0009089571540243924, "global_step": 50078, "epoch": 420, "lr": 2.07022239818576e-05} +{"train_loss": 0.000780594942625612, "global_step": 50079, "epoch": 420, "lr": 2.070042868742147e-05} +{"train_loss": 0.00046014500549063087, "global_step": 50080, "epoch": 420, "lr": 2.06986334505119e-05} +{"train_loss": 0.00070671591674909, "global_step": 50081, "epoch": 420, "lr": 2.069683827113245e-05} +{"train_loss": 0.0009884909959509969, "global_step": 50082, "epoch": 420, "lr": 2.0695043149286608e-05} +{"train_loss": 0.0007631810731254518, "global_step": 50083, "epoch": 420, "lr": 2.069324808497794e-05} +{"train_loss": 0.0010976673802360892, "global_step": 50084, "epoch": 420, "lr": 2.0691453078209945e-05} +{"train_loss": 0.0011745276860892773, "global_step": 50085, "epoch": 420, "lr": 2.0689658128986134e-05} +{"train_loss": 0.0005172464298084378, "global_step": 50086, "epoch": 420, "lr": 2.068786323731006e-05} +{"train_loss": 0.0006130992551334202, "global_step": 50087, "epoch": 420, "lr": 2.0686068403185227e-05} +{"train_loss": 0.0004574533086270094, "global_step": 50088, "epoch": 420, "lr": 2.068427362661518e-05} +{"train_loss": 0.000637257588095963, "global_step": 50089, "epoch": 420, "lr": 2.0682478907603413e-05} +{"train_loss": 0.0011881062528118491, "global_step": 50090, "epoch": 420, "lr": 2.068068424615348e-05} +{"train_loss": 0.0013071635039523244, "global_step": 50091, "epoch": 420, "lr": 2.0678889642268878e-05} +{"train_loss": 0.0007099455106072128, "global_step": 50092, "epoch": 420, "lr": 2.0677095095953165e-05} +{"train_loss": 0.0008197155548259616, "global_step": 50093, "epoch": 420, "lr": 2.0675300607209817e-05} +{"train_loss": 0.0009041015873663127, "global_step": 50094, "epoch": 420, "lr": 2.0673506176042406e-05} +{"train_loss": 0.0008132130606099963, "global_step": 50095, "epoch": 420, "lr": 2.0671711802454414e-05} +{"train_loss": 0.0013300542486831546, "global_step": 50096, "epoch": 420, "lr": 2.066991748644938e-05} +{"train_loss": 0.0007278143311850727, "global_step": 50097, "epoch": 420, "lr": 2.066812322803085e-05} +{"train_loss": 0.000899689513436683, "global_step": 50098, "epoch": 420, "lr": 2.066632902720233e-05, "val_loss": 0.013143684715032578, "train_action_mse_error": 1.2064802831446286e-05} +{"train_loss": 0.000832661404274404, "global_step": 50099, "epoch": 421, "lr": 2.0664534883967312e-05} +{"train_loss": 0.0011448018485680223, "global_step": 50100, "epoch": 421, "lr": 2.0662740798329373e-05} +{"train_loss": 0.0010867308592423797, "global_step": 50101, "epoch": 421, "lr": 2.0660946770291982e-05} +{"train_loss": 0.0011264578206464648, "global_step": 50102, "epoch": 421, "lr": 2.065915279985871e-05} +{"train_loss": 0.0009438375709578395, "global_step": 50103, "epoch": 421, "lr": 2.0657358887033057e-05} +{"train_loss": 0.0003577653260435909, "global_step": 50104, "epoch": 421, "lr": 2.065556503181853e-05} +{"train_loss": 0.0009443674935027957, "global_step": 50105, "epoch": 421, "lr": 2.0653771234218684e-05} +{"train_loss": 0.0005789531278423965, "global_step": 50106, "epoch": 421, "lr": 2.0651977494236994e-05} +{"train_loss": 0.0016359480796381831, "global_step": 50107, "epoch": 421, "lr": 2.065018381187704e-05} +{"train_loss": 0.0006049916264601052, "global_step": 50108, "epoch": 421, "lr": 2.064839018714229e-05} +{"train_loss": 0.0005953361978754401, "global_step": 50109, "epoch": 421, "lr": 2.0646596620036312e-05} +{"train_loss": 0.0015000138664618134, "global_step": 50110, "epoch": 421, "lr": 2.0644803110562605e-05} +{"train_loss": 0.0008108435431495309, "global_step": 50111, "epoch": 421, "lr": 2.0643009658724675e-05} +{"train_loss": 0.0006840772111900151, "global_step": 50112, "epoch": 421, "lr": 2.0641216264526074e-05} +{"train_loss": 0.0009869098430499434, "global_step": 50113, "epoch": 421, "lr": 2.063942292797029e-05} +{"train_loss": 0.0009728279546834528, "global_step": 50114, "epoch": 421, "lr": 2.0637629649060886e-05} +{"train_loss": 0.0006044122856110334, "global_step": 50115, "epoch": 421, "lr": 2.0635836427801337e-05} +{"train_loss": 0.0007211233605630696, "global_step": 50116, "epoch": 421, "lr": 2.06340432641952e-05} +{"train_loss": 0.00039852128247730434, "global_step": 50117, "epoch": 421, "lr": 2.0632250158245987e-05} +{"train_loss": 0.0009579267934896052, "global_step": 50118, "epoch": 421, "lr": 2.0630457109957197e-05} +{"train_loss": 0.0012133627897128463, "global_step": 50119, "epoch": 421, "lr": 2.062866411933238e-05} +{"train_loss": 0.0007508023409172893, "global_step": 50120, "epoch": 421, "lr": 2.062687118637503e-05} +{"train_loss": 0.0008825303521007299, "global_step": 50121, "epoch": 421, "lr": 2.0625078311088693e-05} +{"train_loss": 0.0007496914477087557, "global_step": 50122, "epoch": 421, "lr": 2.062328549347688e-05} +{"train_loss": 0.001212645904161036, "global_step": 50123, "epoch": 421, "lr": 2.0621492733543086e-05} +{"train_loss": 0.0010083923116326332, "global_step": 50124, "epoch": 421, "lr": 2.0619700031290856e-05} +{"train_loss": 0.0005658463342115283, "global_step": 50125, "epoch": 421, "lr": 2.0617907386723724e-05} +{"train_loss": 0.0007375831482931972, "global_step": 50126, "epoch": 421, "lr": 2.061611479984517e-05} +{"train_loss": 0.0011101447744295, "global_step": 50127, "epoch": 421, "lr": 2.061432227065876e-05} +{"train_loss": 0.0009032356319949031, "global_step": 50128, "epoch": 421, "lr": 2.061252979916796e-05} +{"train_loss": 0.0010762816527858377, "global_step": 50129, "epoch": 421, "lr": 2.061073738537635e-05} +{"train_loss": 0.0012076114071533084, "global_step": 50130, "epoch": 421, "lr": 2.0608945029287392e-05} +{"train_loss": 0.0006713585462421179, "global_step": 50131, "epoch": 421, "lr": 2.060715273090465e-05} +{"train_loss": 0.0010388449300080538, "global_step": 50132, "epoch": 421, "lr": 2.0605360490231602e-05} +{"train_loss": 0.0006775886286050081, "global_step": 50133, "epoch": 421, "lr": 2.060356830727181e-05} +{"train_loss": 0.0008864502306096256, "global_step": 50134, "epoch": 421, "lr": 2.0601776182028747e-05} +{"train_loss": 0.0006002903101034462, "global_step": 50135, "epoch": 421, "lr": 2.0599984114505982e-05} +{"train_loss": 0.0008386039990000427, "global_step": 50136, "epoch": 421, "lr": 2.0598192104707005e-05} +{"train_loss": 0.00039208366069942713, "global_step": 50137, "epoch": 421, "lr": 2.0596400152635315e-05} +{"train_loss": 0.0012331928592175245, "global_step": 50138, "epoch": 421, "lr": 2.0594608258294474e-05} +{"train_loss": 0.0013326221378520131, "global_step": 50139, "epoch": 421, "lr": 2.059281642168796e-05} +{"train_loss": 0.0008600826840847731, "global_step": 50140, "epoch": 421, "lr": 2.0591024642819323e-05} +{"train_loss": 0.0008378222119063139, "global_step": 50141, "epoch": 421, "lr": 2.058923292169207e-05} +{"train_loss": 0.0011113942600786686, "global_step": 50142, "epoch": 421, "lr": 2.0587441258309698e-05} +{"train_loss": 0.001457634032703936, "global_step": 50143, "epoch": 421, "lr": 2.0585649652675765e-05} +{"train_loss": 0.0008777683833613992, "global_step": 50144, "epoch": 421, "lr": 2.058385810479374e-05} +{"train_loss": 0.0007483337540179491, "global_step": 50145, "epoch": 421, "lr": 2.0582066614667196e-05} +{"train_loss": 0.0020931754261255264, "global_step": 50146, "epoch": 421, "lr": 2.058027518229959e-05} +{"train_loss": 0.0004598027444444597, "global_step": 50147, "epoch": 421, "lr": 2.0578483807694497e-05} +{"train_loss": 0.001468182890675962, "global_step": 50148, "epoch": 421, "lr": 2.057669249085541e-05} +{"train_loss": 0.0007733640377409756, "global_step": 50149, "epoch": 421, "lr": 2.057490123178582e-05} +{"train_loss": 0.0008677414152771235, "global_step": 50150, "epoch": 421, "lr": 2.057311003048929e-05} +{"train_loss": 0.0005309638800099492, "global_step": 50151, "epoch": 421, "lr": 2.0571318886969294e-05} +{"train_loss": 0.0006205591489560902, "global_step": 50152, "epoch": 421, "lr": 2.0569527801229387e-05} +{"train_loss": 0.0013589441077783704, "global_step": 50153, "epoch": 421, "lr": 2.0567736773273066e-05} +{"train_loss": 0.001403294620104134, "global_step": 50154, "epoch": 421, "lr": 2.0565945803103835e-05} +{"train_loss": 0.0017019517254084349, "global_step": 50155, "epoch": 421, "lr": 2.0564154890725244e-05} +{"train_loss": 0.0006621910142712295, "global_step": 50156, "epoch": 421, "lr": 2.0562364036140768e-05} +{"train_loss": 0.0008962757419794798, "global_step": 50157, "epoch": 421, "lr": 2.056057323935397e-05} +{"train_loss": 0.001044252305291593, "global_step": 50158, "epoch": 421, "lr": 2.0558782500368316e-05} +{"train_loss": 0.000991986133158207, "global_step": 50159, "epoch": 421, "lr": 2.0556991819187348e-05} +{"train_loss": 0.0014537220122292638, "global_step": 50160, "epoch": 421, "lr": 2.0555201195814605e-05} +{"train_loss": 0.0009591634152457118, "global_step": 50161, "epoch": 421, "lr": 2.0553410630253556e-05} +{"train_loss": 0.0011790357530117035, "global_step": 50162, "epoch": 421, "lr": 2.0551620122507757e-05} +{"train_loss": 0.0006958363228477538, "global_step": 50163, "epoch": 421, "lr": 2.0549829672580688e-05} +{"train_loss": 0.0012473695678636432, "global_step": 50164, "epoch": 421, "lr": 2.0548039280475906e-05} +{"train_loss": 0.0008001524256542325, "global_step": 50165, "epoch": 421, "lr": 2.0546248946196878e-05} +{"train_loss": 0.0013984005199745297, "global_step": 50166, "epoch": 421, "lr": 2.0544458669747164e-05} +{"train_loss": 0.001503542298451066, "global_step": 50167, "epoch": 421, "lr": 2.054266845113026e-05} +{"train_loss": 0.0015192389255389571, "global_step": 50168, "epoch": 421, "lr": 2.054087829034966e-05} +{"train_loss": 0.0010638876119628549, "global_step": 50169, "epoch": 421, "lr": 2.053908818740891e-05} +{"train_loss": 0.0011933688074350357, "global_step": 50170, "epoch": 421, "lr": 2.05372981423115e-05} +{"train_loss": 0.0007929709390737116, "global_step": 50171, "epoch": 421, "lr": 2.0535508155060977e-05} +{"train_loss": 0.0010525485267862678, "global_step": 50172, "epoch": 421, "lr": 2.0533718225660835e-05} +{"train_loss": 0.000940402620472014, "global_step": 50173, "epoch": 421, "lr": 2.053192835411457e-05} +{"train_loss": 0.0019089069683104753, "global_step": 50174, "epoch": 421, "lr": 2.0530138540425735e-05} +{"train_loss": 0.0014515664661303163, "global_step": 50175, "epoch": 421, "lr": 2.0528348784597806e-05} +{"train_loss": 0.0006866302574053407, "global_step": 50176, "epoch": 421, "lr": 2.0526559086634332e-05} +{"train_loss": 0.0008307358948513865, "global_step": 50177, "epoch": 421, "lr": 2.05247694465388e-05} +{"train_loss": 0.000785393116530031, "global_step": 50178, "epoch": 421, "lr": 2.0522979864314746e-05} +{"train_loss": 0.0009653914603404701, "global_step": 50179, "epoch": 421, "lr": 2.0521190339965667e-05} +{"train_loss": 0.001022959011606872, "global_step": 50180, "epoch": 421, "lr": 2.0519400873495072e-05} +{"train_loss": 0.000801676360424608, "global_step": 50181, "epoch": 421, "lr": 2.05176114649065e-05} +{"train_loss": 0.0015784924617037177, "global_step": 50182, "epoch": 421, "lr": 2.0515822114203427e-05} +{"train_loss": 0.001098123611882329, "global_step": 50183, "epoch": 421, "lr": 2.0514032821389406e-05} +{"train_loss": 0.0015479180729016662, "global_step": 50184, "epoch": 421, "lr": 2.0512243586467917e-05} +{"train_loss": 0.0010240377159789205, "global_step": 50185, "epoch": 421, "lr": 2.0510454409442503e-05} +{"train_loss": 0.0012056240811944008, "global_step": 50186, "epoch": 421, "lr": 2.050866529031666e-05} +{"train_loss": 0.0008354065357707441, "global_step": 50187, "epoch": 421, "lr": 2.0506876229093887e-05} +{"train_loss": 0.0013030065456405282, "global_step": 50188, "epoch": 421, "lr": 2.0505087225777725e-05} +{"train_loss": 0.0006289253360591829, "global_step": 50189, "epoch": 421, "lr": 2.0503298280371658e-05} +{"train_loss": 0.002388865454122424, "global_step": 50190, "epoch": 421, "lr": 2.0501509392879232e-05} +{"train_loss": 0.0012420470593497157, "global_step": 50191, "epoch": 421, "lr": 2.049972056330392e-05} +{"train_loss": 0.0010814645793288946, "global_step": 50192, "epoch": 421, "lr": 2.049793179164928e-05} +{"train_loss": 0.0004898158367723227, "global_step": 50193, "epoch": 421, "lr": 2.0496143077918774e-05} +{"train_loss": 0.0012991512194275856, "global_step": 50194, "epoch": 421, "lr": 2.049435442211594e-05} +{"train_loss": 0.001110708573833108, "global_step": 50195, "epoch": 421, "lr": 2.0492565824244307e-05} +{"train_loss": 0.0009895074181258678, "global_step": 50196, "epoch": 421, "lr": 2.0490777284307355e-05} +{"train_loss": 0.001140680513344705, "global_step": 50197, "epoch": 421, "lr": 2.0488988802308622e-05} +{"train_loss": 0.0007819146267138422, "global_step": 50198, "epoch": 421, "lr": 2.0487200378251608e-05} +{"train_loss": 0.0009405822493135929, "global_step": 50199, "epoch": 421, "lr": 2.048541201213981e-05} +{"train_loss": 0.0009545347420498729, "global_step": 50200, "epoch": 421, "lr": 2.0483623703976768e-05} +{"train_loss": 0.0008043023408390582, "global_step": 50201, "epoch": 421, "lr": 2.0481835453765958e-05} +{"train_loss": 0.0011091354535892606, "global_step": 50202, "epoch": 421, "lr": 2.0480047261510925e-05} +{"train_loss": 0.000961101264692843, "global_step": 50203, "epoch": 421, "lr": 2.047825912721517e-05} +{"train_loss": 0.0009084113989956677, "global_step": 50204, "epoch": 421, "lr": 2.0476471050882177e-05} +{"train_loss": 0.0004439375479705632, "global_step": 50205, "epoch": 421, "lr": 2.04746830325155e-05} +{"train_loss": 0.0010504074161872268, "global_step": 50206, "epoch": 421, "lr": 2.0472895072118613e-05} +{"train_loss": 0.00065426534274593, "global_step": 50207, "epoch": 421, "lr": 2.047110716969506e-05} +{"train_loss": 0.0007734231185168028, "global_step": 50208, "epoch": 421, "lr": 2.0469319325248308e-05} +{"train_loss": 0.0015620398335158825, "global_step": 50209, "epoch": 421, "lr": 2.046753153878192e-05} +{"train_loss": 0.0011356031754985452, "global_step": 50210, "epoch": 421, "lr": 2.0465743810299372e-05} +{"train_loss": 0.0008780153002589941, "global_step": 50211, "epoch": 421, "lr": 2.0463956139804162e-05} +{"train_loss": 0.0010096487822011113, "global_step": 50212, "epoch": 421, "lr": 2.046216852729984e-05} +{"train_loss": 0.00039501668652519584, "global_step": 50213, "epoch": 421, "lr": 2.046038097278988e-05} +{"train_loss": 0.0008183395839296281, "global_step": 50214, "epoch": 421, "lr": 2.0458593476277822e-05} +{"train_loss": 0.0010890269186347723, "global_step": 50215, "epoch": 421, "lr": 2.045680603776714e-05} +{"train_loss": 0.0006769311730749905, "global_step": 50216, "epoch": 421, "lr": 2.0455018657261377e-05} +{"train_loss": 0.0009931897506814356, "global_step": 50217, "epoch": 421, "lr": 2.0453231334764034e-05, "val_loss": 0.03964858129620552} +{"train_loss": 0.00036960787838324904, "global_step": 50218, "epoch": 422, "lr": 2.0451444070278597e-05} +{"train_loss": 0.002052122727036476, "global_step": 50219, "epoch": 422, "lr": 2.044965686380861e-05} +{"train_loss": 0.0007067260448820889, "global_step": 50220, "epoch": 422, "lr": 2.0447869715357542e-05} +{"train_loss": 0.0012038646964356303, "global_step": 50221, "epoch": 422, "lr": 2.0446082624928946e-05} +{"train_loss": 0.0005315413582138717, "global_step": 50222, "epoch": 422, "lr": 2.0444295592526296e-05} +{"train_loss": 0.0009255400509573519, "global_step": 50223, "epoch": 422, "lr": 2.0442508618153127e-05} +{"train_loss": 0.0014080952387303114, "global_step": 50224, "epoch": 422, "lr": 2.0440721701812916e-05} +{"train_loss": 0.0012524935882538557, "global_step": 50225, "epoch": 422, "lr": 2.043893484350921e-05} +{"train_loss": 0.0006388374022208154, "global_step": 50226, "epoch": 422, "lr": 2.043714804324548e-05} +{"train_loss": 0.000886276422534138, "global_step": 50227, "epoch": 422, "lr": 2.0435361301025268e-05} +{"train_loss": 0.0005792547017335892, "global_step": 50228, "epoch": 422, "lr": 2.0433574616852048e-05} +{"train_loss": 0.0013739526038989425, "global_step": 50229, "epoch": 422, "lr": 2.043178799072936e-05} +{"train_loss": 0.0007534709293395281, "global_step": 50230, "epoch": 422, "lr": 2.0430001422660684e-05} +{"train_loss": 0.000742388772778213, "global_step": 50231, "epoch": 422, "lr": 2.0428214912649558e-05} +{"train_loss": 0.0009649948915466666, "global_step": 50232, "epoch": 422, "lr": 2.0426428460699453e-05} +{"train_loss": 0.001120012835599482, "global_step": 50233, "epoch": 422, "lr": 2.042464206681392e-05} +{"train_loss": 0.0011497270315885544, "global_step": 50234, "epoch": 422, "lr": 2.042285573099642e-05} +{"train_loss": 0.0018280553631484509, "global_step": 50235, "epoch": 422, "lr": 2.0421069453250503e-05} +{"train_loss": 0.0005117523251101375, "global_step": 50236, "epoch": 422, "lr": 2.0419283233579652e-05} +{"train_loss": 0.0005966074531897902, "global_step": 50237, "epoch": 422, "lr": 2.0417497071987362e-05} +{"train_loss": 0.0009032438974827528, "global_step": 50238, "epoch": 422, "lr": 2.0415710968477176e-05} +{"train_loss": 0.0009259486105293036, "global_step": 50239, "epoch": 422, "lr": 2.041392492305256e-05} +{"train_loss": 0.0008502007694914937, "global_step": 50240, "epoch": 422, "lr": 2.041213893571706e-05} +{"train_loss": 0.0006003160960972309, "global_step": 50241, "epoch": 422, "lr": 2.0410353006474166e-05} +{"train_loss": 0.0013726202305406332, "global_step": 50242, "epoch": 422, "lr": 2.0408567135327367e-05} +{"train_loss": 0.0005792606389150023, "global_step": 50243, "epoch": 422, "lr": 2.04067813222802e-05} +{"train_loss": 0.0008489129249937832, "global_step": 50244, "epoch": 422, "lr": 2.0404995567336137e-05} +{"train_loss": 0.0012941461754962802, "global_step": 50245, "epoch": 422, "lr": 2.0403209870498724e-05} +{"train_loss": 0.0011454790364950895, "global_step": 50246, "epoch": 422, "lr": 2.0401424231771426e-05} +{"train_loss": 0.0019276211969554424, "global_step": 50247, "epoch": 422, "lr": 2.039963865115779e-05} +{"train_loss": 0.0008274040301330388, "global_step": 50248, "epoch": 422, "lr": 2.0397853128661297e-05} +{"train_loss": 0.0003756754449568689, "global_step": 50249, "epoch": 422, "lr": 2.0396067664285446e-05} +{"train_loss": 0.0005381518276408315, "global_step": 50250, "epoch": 422, "lr": 2.0394282258033764e-05} +{"train_loss": 0.0006468830397352576, "global_step": 50251, "epoch": 422, "lr": 2.0392496909909732e-05} +{"train_loss": 0.0003637341724243015, "global_step": 50252, "epoch": 422, "lr": 2.0390711619916886e-05} +{"train_loss": 0.0012812053319066763, "global_step": 50253, "epoch": 422, "lr": 2.03889263880587e-05} +{"train_loss": 0.0007565731648355722, "global_step": 50254, "epoch": 422, "lr": 2.0387141214338708e-05} +{"train_loss": 0.0014163207961246371, "global_step": 50255, "epoch": 422, "lr": 2.03853560987604e-05} +{"train_loss": 0.00038019896601326764, "global_step": 50256, "epoch": 422, "lr": 2.038357104132726e-05} +{"train_loss": 0.0012410887284204364, "global_step": 50257, "epoch": 422, "lr": 2.0381786042042823e-05} +{"train_loss": 0.001204057247377932, "global_step": 50258, "epoch": 422, "lr": 2.0380001100910597e-05} +{"train_loss": 0.001175474375486374, "global_step": 50259, "epoch": 422, "lr": 2.0378216217934054e-05} +{"train_loss": 0.000693463662173599, "global_step": 50260, "epoch": 422, "lr": 2.037643139311674e-05} +{"train_loss": 0.0008266883669421077, "global_step": 50261, "epoch": 422, "lr": 2.0374646626462124e-05} +{"train_loss": 0.0008380713989026845, "global_step": 50262, "epoch": 422, "lr": 2.037286191797374e-05} +{"train_loss": 0.0015821197303012013, "global_step": 50263, "epoch": 422, "lr": 2.037107726765506e-05} +{"train_loss": 0.0008640094310976565, "global_step": 50264, "epoch": 422, "lr": 2.0369292675509615e-05} +{"train_loss": 0.0011610999936237931, "global_step": 50265, "epoch": 422, "lr": 2.0367508141540886e-05} +{"train_loss": 0.0012958202278241515, "global_step": 50266, "epoch": 422, "lr": 2.0365723665752406e-05} +{"train_loss": 0.0008045971626415849, "global_step": 50267, "epoch": 422, "lr": 2.0363939248147663e-05} +{"train_loss": 0.0006122658960521221, "global_step": 50268, "epoch": 422, "lr": 2.036215488873014e-05} +{"train_loss": 0.0009028984932228923, "global_step": 50269, "epoch": 422, "lr": 2.0360370587503374e-05} +{"train_loss": 0.0016361812595278025, "global_step": 50270, "epoch": 422, "lr": 2.035858634447084e-05} +{"train_loss": 0.0008094057557173073, "global_step": 50271, "epoch": 422, "lr": 2.0356802159636075e-05} +{"train_loss": 0.0004459234478417784, "global_step": 50272, "epoch": 422, "lr": 2.035501803300256e-05} +{"train_loss": 0.0010883875656872988, "global_step": 50273, "epoch": 422, "lr": 2.0353233964573782e-05} +{"train_loss": 0.0019800381269305944, "global_step": 50274, "epoch": 422, "lr": 2.035144995435328e-05} +{"train_loss": 0.000991259585134685, "global_step": 50275, "epoch": 422, "lr": 2.034966600234452e-05} +{"train_loss": 0.0004966523847542703, "global_step": 50276, "epoch": 422, "lr": 2.0347882108551036e-05} +{"train_loss": 0.0010256931418552995, "global_step": 50277, "epoch": 422, "lr": 2.0346098272976306e-05} +{"train_loss": 0.0008588331402279437, "global_step": 50278, "epoch": 422, "lr": 2.0344314495623863e-05} +{"train_loss": 0.0010350296506658196, "global_step": 50279, "epoch": 422, "lr": 2.0342530776497186e-05} +{"train_loss": 0.0012571923434734344, "global_step": 50280, "epoch": 422, "lr": 2.0340747115599762e-05} +{"train_loss": 0.0011631710221990943, "global_step": 50281, "epoch": 422, "lr": 2.0338963512935138e-05} +{"train_loss": 0.001216944307088852, "global_step": 50282, "epoch": 422, "lr": 2.0337179968506764e-05} +{"train_loss": 0.0007725032628513873, "global_step": 50283, "epoch": 422, "lr": 2.0335396482318193e-05} +{"train_loss": 0.0007757878629490733, "global_step": 50284, "epoch": 422, "lr": 2.033361305437288e-05} +{"train_loss": 0.0014782422222197056, "global_step": 50285, "epoch": 422, "lr": 2.033182968467437e-05} +{"train_loss": 0.0005039675161242485, "global_step": 50286, "epoch": 422, "lr": 2.0330046373226135e-05} +{"train_loss": 0.0005609862855635583, "global_step": 50287, "epoch": 422, "lr": 2.0328263120031672e-05} +{"train_loss": 0.00048370062722824514, "global_step": 50288, "epoch": 422, "lr": 2.032647992509451e-05} +{"train_loss": 0.0011070583714172244, "global_step": 50289, "epoch": 422, "lr": 2.032469678841812e-05} +{"train_loss": 0.0009092586115002632, "global_step": 50290, "epoch": 422, "lr": 2.0322913710006036e-05} +{"train_loss": 0.002558087930083275, "global_step": 50291, "epoch": 422, "lr": 2.0321130689861718e-05} +{"train_loss": 0.0007972128223627806, "global_step": 50292, "epoch": 422, "lr": 2.0319347727988693e-05} +{"train_loss": 0.0008335460443049669, "global_step": 50293, "epoch": 422, "lr": 2.0317564824390474e-05} +{"train_loss": 0.00047918566269800067, "global_step": 50294, "epoch": 422, "lr": 2.0315781979070524e-05} +{"train_loss": 0.0007748646894469857, "global_step": 50295, "epoch": 422, "lr": 2.031399919203239e-05} +{"train_loss": 0.001212128670886159, "global_step": 50296, "epoch": 422, "lr": 2.031221646327952e-05} +{"train_loss": 0.0012504600454121828, "global_step": 50297, "epoch": 422, "lr": 2.031043379281547e-05} +{"train_loss": 0.0012186298845335841, "global_step": 50298, "epoch": 422, "lr": 2.0308651180643705e-05} +{"train_loss": 0.0007100357324816287, "global_step": 50299, "epoch": 422, "lr": 2.030686862676771e-05} +{"train_loss": 0.0013063255464658141, "global_step": 50300, "epoch": 422, "lr": 2.0305086131191033e-05} +{"train_loss": 0.0007254004012793303, "global_step": 50301, "epoch": 422, "lr": 2.0303303693917126e-05} +{"train_loss": 0.0004588455776683986, "global_step": 50302, "epoch": 422, "lr": 2.0301521314949523e-05} +{"train_loss": 0.0009000666323117912, "global_step": 50303, "epoch": 422, "lr": 2.0299738994291694e-05} +{"train_loss": 0.0008945711888372898, "global_step": 50304, "epoch": 422, "lr": 2.0297956731947178e-05} +{"train_loss": 0.0015995710855349898, "global_step": 50305, "epoch": 422, "lr": 2.0296174527919443e-05} +{"train_loss": 0.0012483586324378848, "global_step": 50306, "epoch": 422, "lr": 2.029439238221198e-05} +{"train_loss": 0.0009265989647246897, "global_step": 50307, "epoch": 422, "lr": 2.0292610294828323e-05} +{"train_loss": 0.0007396127912215889, "global_step": 50308, "epoch": 422, "lr": 2.0290828265771938e-05} +{"train_loss": 0.0012225895188748837, "global_step": 50309, "epoch": 422, "lr": 2.028904629504635e-05} +{"train_loss": 0.0009199230698868632, "global_step": 50310, "epoch": 422, "lr": 2.0287264382655048e-05} +{"train_loss": 0.000900902901776135, "global_step": 50311, "epoch": 422, "lr": 2.0285482528601507e-05} +{"train_loss": 0.0012773150810971856, "global_step": 50312, "epoch": 422, "lr": 2.0283700732889264e-05} +{"train_loss": 0.0011831031879410148, "global_step": 50313, "epoch": 422, "lr": 2.0281918995521786e-05} +{"train_loss": 0.0008488766034133732, "global_step": 50314, "epoch": 422, "lr": 2.0280137316502606e-05} +{"train_loss": 0.0005813819589093328, "global_step": 50315, "epoch": 422, "lr": 2.0278355695835177e-05} +{"train_loss": 0.0006113041308708489, "global_step": 50316, "epoch": 422, "lr": 2.0276574133523042e-05} +{"train_loss": 0.0009016233962029219, "global_step": 50317, "epoch": 422, "lr": 2.027479262956968e-05} +{"train_loss": 0.0009076475980691612, "global_step": 50318, "epoch": 422, "lr": 2.0273011183978562e-05} +{"train_loss": 0.0009645771933719516, "global_step": 50319, "epoch": 422, "lr": 2.0271229796753237e-05} +{"train_loss": 0.0011807698756456375, "global_step": 50320, "epoch": 422, "lr": 2.0269448467897155e-05} +{"train_loss": 0.0008999492856673896, "global_step": 50321, "epoch": 422, "lr": 2.0267667197413855e-05} +{"train_loss": 0.0009342360426671803, "global_step": 50322, "epoch": 422, "lr": 2.0265885985306794e-05} +{"train_loss": 0.0009161126799881458, "global_step": 50323, "epoch": 422, "lr": 2.0264104831579504e-05} +{"train_loss": 0.0010346004273742437, "global_step": 50324, "epoch": 422, "lr": 2.026232373623545e-05} +{"train_loss": 0.0004560858360491693, "global_step": 50325, "epoch": 422, "lr": 2.026054269927817e-05} +{"train_loss": 0.00042586366180330515, "global_step": 50326, "epoch": 422, "lr": 2.0258761720711112e-05} +{"train_loss": 0.0010338245192542672, "global_step": 50327, "epoch": 422, "lr": 2.02569808005378e-05} +{"train_loss": 0.000900896149687469, "global_step": 50328, "epoch": 422, "lr": 2.025519993876175e-05} +{"train_loss": 0.0012787000741809607, "global_step": 50329, "epoch": 422, "lr": 2.0253419135386436e-05} +{"train_loss": 0.0013916476164013147, "global_step": 50330, "epoch": 422, "lr": 2.025163839041534e-05} +{"train_loss": 0.0008742857608012855, "global_step": 50331, "epoch": 422, "lr": 2.024985770385199e-05} +{"train_loss": 0.0008287362870760262, "global_step": 50332, "epoch": 422, "lr": 2.0248077075699847e-05} +{"train_loss": 0.0009828540496528149, "global_step": 50333, "epoch": 422, "lr": 2.024629650596244e-05} +{"train_loss": 0.001010689651593566, "global_step": 50334, "epoch": 422, "lr": 2.0244515994643238e-05} +{"train_loss": 0.0012661811197176576, "global_step": 50335, "epoch": 422, "lr": 2.0242735541745767e-05} +{"train_loss": 0.0009712035530012007, "global_step": 50336, "epoch": 422, "lr": 2.0240955147273505e-05, "val_loss": 0.00843335222452879} +{"train_loss": 0.0008795025642029941, "global_step": 50337, "epoch": 423, "lr": 2.023917481122993e-05} +{"train_loss": 0.001166980597190559, "global_step": 50338, "epoch": 423, "lr": 2.0237394533618577e-05} +{"train_loss": 0.0004813850682694465, "global_step": 50339, "epoch": 423, "lr": 2.0235614314442897e-05} +{"train_loss": 0.0008144346647895873, "global_step": 50340, "epoch": 423, "lr": 2.0233834153706433e-05} +{"train_loss": 0.0011841589584946632, "global_step": 50341, "epoch": 423, "lr": 2.0232054051412647e-05} +{"train_loss": 0.0004334668628871441, "global_step": 50342, "epoch": 423, "lr": 2.023027400756503e-05} +{"train_loss": 0.0013372352113947272, "global_step": 50343, "epoch": 423, "lr": 2.022849402216711e-05} +{"train_loss": 0.001476968522183597, "global_step": 50344, "epoch": 423, "lr": 2.022671409522234e-05} +{"train_loss": 0.0007838004385121167, "global_step": 50345, "epoch": 423, "lr": 2.0224934226734253e-05} +{"train_loss": 0.0016543257515877485, "global_step": 50346, "epoch": 423, "lr": 2.0223154416706312e-05} +{"train_loss": 0.0009757122024893761, "global_step": 50347, "epoch": 423, "lr": 2.022137466514204e-05} +{"train_loss": 0.000813074060715735, "global_step": 50348, "epoch": 423, "lr": 2.021959497204492e-05} +{"train_loss": 0.0009229022543877363, "global_step": 50349, "epoch": 423, "lr": 2.0217815337418426e-05} +{"train_loss": 0.0009688174468465149, "global_step": 50350, "epoch": 423, "lr": 2.0216035761266087e-05} +{"train_loss": 0.0006018394487909973, "global_step": 50351, "epoch": 423, "lr": 2.021425624359136e-05} +{"train_loss": 0.001389045501127839, "global_step": 50352, "epoch": 423, "lr": 2.0212476784397782e-05} +{"train_loss": 0.0005183297325856984, "global_step": 50353, "epoch": 423, "lr": 2.0210697383688803e-05} +{"train_loss": 0.0005721740308217704, "global_step": 50354, "epoch": 423, "lr": 2.0208918041467956e-05} +{"train_loss": 0.0010674099903553724, "global_step": 50355, "epoch": 423, "lr": 2.0207138757738696e-05} +{"train_loss": 0.0007015792070887983, "global_step": 50356, "epoch": 423, "lr": 2.0205359532504555e-05} +{"train_loss": 0.0008375716279260814, "global_step": 50357, "epoch": 423, "lr": 2.0203580365768985e-05} +{"train_loss": 0.0012071409728378057, "global_step": 50358, "epoch": 423, "lr": 2.0201801257535526e-05} +{"train_loss": 0.0008929118630476296, "global_step": 50359, "epoch": 423, "lr": 2.0200022207807628e-05} +{"train_loss": 0.0011568976333364844, "global_step": 50360, "epoch": 423, "lr": 2.019824321658882e-05} +{"train_loss": 0.0012871677754446864, "global_step": 50361, "epoch": 423, "lr": 2.0196464283882554e-05} +{"train_loss": 0.0008112503564916551, "global_step": 50362, "epoch": 423, "lr": 2.019468540969237e-05} +{"train_loss": 0.0014484182465821505, "global_step": 50363, "epoch": 423, "lr": 2.019290659402172e-05} +{"train_loss": 0.0009375849622301757, "global_step": 50364, "epoch": 423, "lr": 2.019112783687413e-05} +{"train_loss": 0.001249168417416513, "global_step": 50365, "epoch": 423, "lr": 2.0189349138253054e-05} +{"train_loss": 0.0004895874299108982, "global_step": 50366, "epoch": 423, "lr": 2.018757049816203e-05} +{"train_loss": 0.00167156255338341, "global_step": 50367, "epoch": 423, "lr": 2.0185791916604525e-05} +{"train_loss": 0.000689237262122333, "global_step": 50368, "epoch": 423, "lr": 2.018401339358401e-05} +{"train_loss": 0.0017279062885791063, "global_step": 50369, "epoch": 423, "lr": 2.018223492910402e-05} +{"train_loss": 0.0005226815119385719, "global_step": 50370, "epoch": 423, "lr": 2.0180456523168013e-05} +{"train_loss": 0.001337712979875505, "global_step": 50371, "epoch": 423, "lr": 2.0178678175779503e-05} +{"train_loss": 0.000679199758451432, "global_step": 50372, "epoch": 423, "lr": 2.0176899886941962e-05} +{"train_loss": 0.000858164916280657, "global_step": 50373, "epoch": 423, "lr": 2.0175121656658908e-05} +{"train_loss": 0.0005314933368936181, "global_step": 50374, "epoch": 423, "lr": 2.0173343484933816e-05} +{"train_loss": 0.0005908077582716942, "global_step": 50375, "epoch": 423, "lr": 2.0171565371770156e-05} +{"train_loss": 0.0005925424629822373, "global_step": 50376, "epoch": 423, "lr": 2.0169787317171462e-05} +{"train_loss": 0.0007059838972054422, "global_step": 50377, "epoch": 423, "lr": 2.0168009321141184e-05} +{"train_loss": 0.0008639765437692404, "global_step": 50378, "epoch": 423, "lr": 2.0166231383682854e-05} +{"train_loss": 0.0011577971745282412, "global_step": 50379, "epoch": 423, "lr": 2.0164453504799942e-05} +{"train_loss": 0.0011822812957689166, "global_step": 50380, "epoch": 423, "lr": 2.0162675684495914e-05} +{"train_loss": 0.0003900631272699684, "global_step": 50381, "epoch": 423, "lr": 2.016089792277431e-05} +{"train_loss": 0.001360225724056363, "global_step": 50382, "epoch": 423, "lr": 2.0159120219638567e-05} +{"train_loss": 0.0007462852518074214, "global_step": 50383, "epoch": 423, "lr": 2.015734257509223e-05} +{"train_loss": 0.0009413036168552935, "global_step": 50384, "epoch": 423, "lr": 2.0155564989138742e-05} +{"train_loss": 0.0010087564587593079, "global_step": 50385, "epoch": 423, "lr": 2.0153787461781632e-05} +{"train_loss": 0.0007493150187656283, "global_step": 50386, "epoch": 423, "lr": 2.0152009993024372e-05} +{"train_loss": 0.0008910303586162627, "global_step": 50387, "epoch": 423, "lr": 2.0150232582870432e-05} +{"train_loss": 0.0008439820958301425, "global_step": 50388, "epoch": 423, "lr": 2.0148455231323345e-05} +{"train_loss": 0.0008490296895615757, "global_step": 50389, "epoch": 423, "lr": 2.014667793838655e-05} +{"train_loss": 0.0006409201305359602, "global_step": 50390, "epoch": 423, "lr": 2.0144900704063568e-05} +{"train_loss": 0.0003877451235894114, "global_step": 50391, "epoch": 423, "lr": 2.0143123528357905e-05} +{"train_loss": 0.0011705178767442703, "global_step": 50392, "epoch": 423, "lr": 2.0141346411273004e-05} +{"train_loss": 0.0008586206240579486, "global_step": 50393, "epoch": 423, "lr": 2.0139569352812405e-05} +{"train_loss": 0.0008735598530620337, "global_step": 50394, "epoch": 423, "lr": 2.013779235297955e-05} +{"train_loss": 0.0008057165541686118, "global_step": 50395, "epoch": 423, "lr": 2.0136015411777965e-05} +{"train_loss": 0.0005594018730334938, "global_step": 50396, "epoch": 423, "lr": 2.0134238529211107e-05} +{"train_loss": 0.0014461787650361657, "global_step": 50397, "epoch": 423, "lr": 2.0132461705282503e-05} +{"train_loss": 0.0004827010852750391, "global_step": 50398, "epoch": 423, "lr": 2.0130684939995616e-05} +{"train_loss": 0.001439312589354813, "global_step": 50399, "epoch": 423, "lr": 2.0128908233353923e-05} +{"train_loss": 0.0010389355011284351, "global_step": 50400, "epoch": 423, "lr": 2.0127131585360936e-05} +{"train_loss": 0.0011224951595067978, "global_step": 50401, "epoch": 423, "lr": 2.012535499602013e-05} +{"train_loss": 0.0010686763562262058, "global_step": 50402, "epoch": 423, "lr": 2.0123578465335007e-05} +{"train_loss": 0.0004329560324549675, "global_step": 50403, "epoch": 423, "lr": 2.012180199330903e-05} +{"train_loss": 0.001170406467281282, "global_step": 50404, "epoch": 423, "lr": 2.0120025579945718e-05} +{"train_loss": 0.0009298993973061442, "global_step": 50405, "epoch": 423, "lr": 2.011824922524855e-05} +{"train_loss": 0.0015598890604451299, "global_step": 50406, "epoch": 423, "lr": 2.0116472929220987e-05} +{"train_loss": 0.0009632844012230635, "global_step": 50407, "epoch": 423, "lr": 2.0114696691866552e-05} +{"train_loss": 0.0011547007597982883, "global_step": 50408, "epoch": 423, "lr": 2.0112920513188697e-05} +{"train_loss": 0.0008409014553762972, "global_step": 50409, "epoch": 423, "lr": 2.0111144393190958e-05} +{"train_loss": 0.000988735817372799, "global_step": 50410, "epoch": 423, "lr": 2.0109368331876782e-05} +{"train_loss": 0.0010324183385819197, "global_step": 50411, "epoch": 423, "lr": 2.0107592329249657e-05} +{"train_loss": 0.0006972806877456605, "global_step": 50412, "epoch": 423, "lr": 2.01058163853131e-05} +{"train_loss": 0.0013745875330641866, "global_step": 50413, "epoch": 423, "lr": 2.0104040500070555e-05} +{"train_loss": 0.0010952105512842536, "global_step": 50414, "epoch": 423, "lr": 2.010226467352555e-05} +{"train_loss": 0.0011695767752826214, "global_step": 50415, "epoch": 423, "lr": 2.010048890568154e-05} +{"train_loss": 0.0007306397310458124, "global_step": 50416, "epoch": 423, "lr": 2.0098713196542046e-05} +{"train_loss": 0.000923836778383702, "global_step": 50417, "epoch": 423, "lr": 2.0096937546110532e-05} +{"train_loss": 0.0013286963803693652, "global_step": 50418, "epoch": 423, "lr": 2.0095161954390467e-05} +{"train_loss": 0.000830678385682404, "global_step": 50419, "epoch": 423, "lr": 2.0093386421385374e-05} +{"train_loss": 0.0009758693049661815, "global_step": 50420, "epoch": 423, "lr": 2.0091610947098706e-05} +{"train_loss": 0.001022354350425303, "global_step": 50421, "epoch": 423, "lr": 2.0089835531533985e-05} +{"train_loss": 0.0014908857410773635, "global_step": 50422, "epoch": 423, "lr": 2.0088060174694656e-05} +{"train_loss": 0.001317808753810823, "global_step": 50423, "epoch": 423, "lr": 2.0086284876584237e-05} +{"train_loss": 0.0007505248067900538, "global_step": 50424, "epoch": 423, "lr": 2.0084509637206195e-05} +{"train_loss": 0.0008873327751643956, "global_step": 50425, "epoch": 423, "lr": 2.0082734456564016e-05} +{"train_loss": 0.0006932999822311103, "global_step": 50426, "epoch": 423, "lr": 2.008095933466121e-05} +{"train_loss": 0.0006132301641628146, "global_step": 50427, "epoch": 423, "lr": 2.0079184271501228e-05} +{"train_loss": 0.0010698098922148347, "global_step": 50428, "epoch": 423, "lr": 2.0077409267087588e-05} +{"train_loss": 0.0010822077747434378, "global_step": 50429, "epoch": 423, "lr": 2.007563432142376e-05} +{"train_loss": 0.0008622887544333935, "global_step": 50430, "epoch": 423, "lr": 2.0073859434513203e-05} +{"train_loss": 0.0007369531667791307, "global_step": 50431, "epoch": 423, "lr": 2.007208460635945e-05} +{"train_loss": 0.0009261479135602713, "global_step": 50432, "epoch": 423, "lr": 2.0070309836965938e-05} +{"train_loss": 0.00124540482647717, "global_step": 50433, "epoch": 423, "lr": 2.0068535126336196e-05} +{"train_loss": 0.0007038694457150996, "global_step": 50434, "epoch": 423, "lr": 2.0066760474473674e-05} +{"train_loss": 0.0006340509280562401, "global_step": 50435, "epoch": 423, "lr": 2.0064985881381882e-05} +{"train_loss": 0.0006473303656093776, "global_step": 50436, "epoch": 423, "lr": 2.006321134706429e-05} +{"train_loss": 0.0007027409155853093, "global_step": 50437, "epoch": 423, "lr": 2.0061436871524376e-05} +{"train_loss": 0.000769364065490663, "global_step": 50438, "epoch": 423, "lr": 2.0059662454765643e-05} +{"train_loss": 0.0008218438015319407, "global_step": 50439, "epoch": 423, "lr": 2.005788809679155e-05} +{"train_loss": 0.0009465623879805207, "global_step": 50440, "epoch": 423, "lr": 2.005611379760561e-05} +{"train_loss": 0.0009225344401784241, "global_step": 50441, "epoch": 423, "lr": 2.0054339557211272e-05} +{"train_loss": 0.001211586408317089, "global_step": 50442, "epoch": 423, "lr": 2.005256537561206e-05} +{"train_loss": 0.0010323176393285394, "global_step": 50443, "epoch": 423, "lr": 2.0050791252811433e-05} +{"train_loss": 0.0009109743987210095, "global_step": 50444, "epoch": 423, "lr": 2.0049017188812864e-05} +{"train_loss": 0.0005709761753678322, "global_step": 50445, "epoch": 423, "lr": 2.0047243183619868e-05} +{"train_loss": 0.0007529647555202246, "global_step": 50446, "epoch": 423, "lr": 2.0045469237235885e-05} +{"train_loss": 0.000913037802092731, "global_step": 50447, "epoch": 423, "lr": 2.004369534966445e-05} +{"train_loss": 0.0008016845677047968, "global_step": 50448, "epoch": 423, "lr": 2.0041921520909013e-05} +{"train_loss": 0.0009876529220491648, "global_step": 50449, "epoch": 423, "lr": 2.0040147750973048e-05} +{"train_loss": 0.0009834103984758258, "global_step": 50450, "epoch": 423, "lr": 2.003837403986007e-05} +{"train_loss": 0.0011217654682695866, "global_step": 50451, "epoch": 423, "lr": 2.0036600387573522e-05} +{"train_loss": 0.0007514211465604603, "global_step": 50452, "epoch": 423, "lr": 2.003482679411693e-05} +{"train_loss": 0.0006241329829208553, "global_step": 50453, "epoch": 423, "lr": 2.0033053259493735e-05} +{"train_loss": 0.0012741696555167437, "global_step": 50454, "epoch": 423, "lr": 2.0031279783707458e-05} +{"train_loss": 0.0009400417647684509, "global_step": 50455, "epoch": 423, "lr": 2.002950636676154e-05, "val_loss": 0.07002357393503189} +{"train_loss": 0.0008798030321486294, "global_step": 50456, "epoch": 424, "lr": 2.0027733008659504e-05} +{"train_loss": 0.0005202160682529211, "global_step": 50457, "epoch": 424, "lr": 2.0025959709404797e-05} +{"train_loss": 0.0006305056740529835, "global_step": 50458, "epoch": 424, "lr": 2.002418646900093e-05} +{"train_loss": 0.0007806267240084708, "global_step": 50459, "epoch": 424, "lr": 2.0022413287451353e-05} +{"train_loss": 0.0014309725956991315, "global_step": 50460, "epoch": 424, "lr": 2.0020640164759586e-05} +{"train_loss": 0.0007232745410874486, "global_step": 50461, "epoch": 424, "lr": 2.0018867100929067e-05} +{"train_loss": 0.0006978029850870371, "global_step": 50462, "epoch": 424, "lr": 2.001709409596332e-05} +{"train_loss": 0.0014029109152033925, "global_step": 50463, "epoch": 424, "lr": 2.0015321149865785e-05} +{"train_loss": 0.0008863841649144888, "global_step": 50464, "epoch": 424, "lr": 2.001354826263998e-05} +{"train_loss": 0.0005583523889072239, "global_step": 50465, "epoch": 424, "lr": 2.001177543428936e-05} +{"train_loss": 0.0013115155743435025, "global_step": 50466, "epoch": 424, "lr": 2.0010002664817423e-05} +{"train_loss": 0.0012108053779229522, "global_step": 50467, "epoch": 424, "lr": 2.000822995422765e-05} +{"train_loss": 0.0005579095450229943, "global_step": 50468, "epoch": 424, "lr": 2.000645730252349e-05} +{"train_loss": 0.0021316546481102705, "global_step": 50469, "epoch": 424, "lr": 2.0004684709708464e-05} +{"train_loss": 0.0008635582635179162, "global_step": 50470, "epoch": 424, "lr": 2.0002912175786022e-05} +{"train_loss": 0.0008486607694067061, "global_step": 50471, "epoch": 424, "lr": 2.0001139700759675e-05} +{"train_loss": 0.0007476414320990443, "global_step": 50472, "epoch": 424, "lr": 1.9999367284632866e-05} +{"train_loss": 0.0008752085850574076, "global_step": 50473, "epoch": 424, "lr": 1.9997594927409106e-05} +{"train_loss": 0.0009608555119484663, "global_step": 50474, "epoch": 424, "lr": 1.999582262909187e-05} +{"train_loss": 0.0005584545433521271, "global_step": 50475, "epoch": 424, "lr": 1.9994050389684614e-05} +{"train_loss": 0.001792475930415094, "global_step": 50476, "epoch": 424, "lr": 1.999227820919085e-05} +{"train_loss": 0.001138465479016304, "global_step": 50477, "epoch": 424, "lr": 1.9990506087614026e-05} +{"train_loss": 0.0012621262576431036, "global_step": 50478, "epoch": 424, "lr": 1.998873402495765e-05} +{"train_loss": 0.00095232023159042, "global_step": 50479, "epoch": 424, "lr": 1.9986962021225192e-05} +{"train_loss": 0.0007575061754323542, "global_step": 50480, "epoch": 424, "lr": 1.9985190076420108e-05} +{"train_loss": 0.0005555048119276762, "global_step": 50481, "epoch": 424, "lr": 1.9983418190545915e-05} +{"train_loss": 0.001361967297270894, "global_step": 50482, "epoch": 424, "lr": 1.9981646363606055e-05} +{"train_loss": 0.000741025258321315, "global_step": 50483, "epoch": 424, "lr": 1.9979874595604048e-05} +{"train_loss": 0.0009999125031754375, "global_step": 50484, "epoch": 424, "lr": 1.9978102886543327e-05} +{"train_loss": 0.001495095668360591, "global_step": 50485, "epoch": 424, "lr": 1.9976331236427416e-05} +{"train_loss": 0.0006125633371993899, "global_step": 50486, "epoch": 424, "lr": 1.997455964525975e-05} +{"train_loss": 0.0007732104859314859, "global_step": 50487, "epoch": 424, "lr": 1.9972788113043845e-05} +{"train_loss": 0.0009704228723421693, "global_step": 50488, "epoch": 424, "lr": 1.9971016639783148e-05} +{"train_loss": 0.0010367775103077292, "global_step": 50489, "epoch": 424, "lr": 1.9969245225481165e-05} +{"train_loss": 0.000658526667393744, "global_step": 50490, "epoch": 424, "lr": 1.9967473870141345e-05} +{"train_loss": 0.0015857808757573366, "global_step": 50491, "epoch": 424, "lr": 1.9965702573767203e-05} +{"train_loss": 0.0010416508885100484, "global_step": 50492, "epoch": 424, "lr": 1.9963931336362172e-05} +{"train_loss": 0.001027816440910101, "global_step": 50493, "epoch": 424, "lr": 1.9962160157929778e-05} +{"train_loss": 0.0005536070675589144, "global_step": 50494, "epoch": 424, "lr": 1.996038903847345e-05} +{"train_loss": 0.000907857553102076, "global_step": 50495, "epoch": 424, "lr": 1.9958617977996708e-05} +{"train_loss": 0.000870200979989022, "global_step": 50496, "epoch": 424, "lr": 1.995684697650299e-05} +{"train_loss": 0.0008799682254903018, "global_step": 50497, "epoch": 424, "lr": 1.9955076033995812e-05} +{"train_loss": 0.0006227507255971432, "global_step": 50498, "epoch": 424, "lr": 1.9953305150478637e-05} +{"train_loss": 0.000406592182116583, "global_step": 50499, "epoch": 424, "lr": 1.9951534325954914e-05} +{"train_loss": 0.001361427246592939, "global_step": 50500, "epoch": 424, "lr": 1.9949763560428164e-05} +{"train_loss": 0.0006401780992746353, "global_step": 50501, "epoch": 424, "lr": 1.9947992853901826e-05} +{"train_loss": 0.0007441674824804068, "global_step": 50502, "epoch": 424, "lr": 1.9946222206379407e-05} +{"train_loss": 0.0005322018987499177, "global_step": 50503, "epoch": 424, "lr": 1.9944451617864353e-05} +{"train_loss": 0.001519621815532446, "global_step": 50504, "epoch": 424, "lr": 1.9942681088360176e-05} +{"train_loss": 0.0008630674565210938, "global_step": 50505, "epoch": 424, "lr": 1.9940910617870333e-05} +{"train_loss": 0.0014671270037069917, "global_step": 50506, "epoch": 424, "lr": 1.9939140206398287e-05} +{"train_loss": 0.0005191047675907612, "global_step": 50507, "epoch": 424, "lr": 1.993736985394754e-05} +{"train_loss": 0.000785650045145303, "global_step": 50508, "epoch": 424, "lr": 1.9935599560521546e-05} +{"train_loss": 0.0008622726309113204, "global_step": 50509, "epoch": 424, "lr": 1.99338293261238e-05} +{"train_loss": 0.0007204801077023149, "global_step": 50510, "epoch": 424, "lr": 1.993205915075777e-05} +{"train_loss": 0.001021934556774795, "global_step": 50511, "epoch": 424, "lr": 1.9930289034426913e-05} +{"train_loss": 0.0008370800642296672, "global_step": 50512, "epoch": 424, "lr": 1.9928518977134735e-05} +{"train_loss": 0.0011672942200675607, "global_step": 50513, "epoch": 424, "lr": 1.9926748978884686e-05} +{"train_loss": 0.0008113079820759594, "global_step": 50514, "epoch": 424, "lr": 1.9924979039680264e-05} +{"train_loss": 0.0008306154632009566, "global_step": 50515, "epoch": 424, "lr": 1.992320915952492e-05} +{"train_loss": 0.0007858144235797226, "global_step": 50516, "epoch": 424, "lr": 1.9921439338422153e-05} +{"train_loss": 0.0006723151891492307, "global_step": 50517, "epoch": 424, "lr": 1.991966957637543e-05} +{"train_loss": 0.0004885055241174996, "global_step": 50518, "epoch": 424, "lr": 1.9917899873388206e-05} +{"train_loss": 0.0013385441852733493, "global_step": 50519, "epoch": 424, "lr": 1.9916130229463993e-05} +{"train_loss": 0.0012767025036737323, "global_step": 50520, "epoch": 424, "lr": 1.9914360644606216e-05} +{"train_loss": 0.0006653408636339009, "global_step": 50521, "epoch": 424, "lr": 1.9912591118818385e-05} +{"train_loss": 0.0006472666864283383, "global_step": 50522, "epoch": 424, "lr": 1.9910821652103985e-05} +{"train_loss": 0.0007005760562606156, "global_step": 50523, "epoch": 424, "lr": 1.9909052244466452e-05} +{"train_loss": 0.001337396795861423, "global_step": 50524, "epoch": 424, "lr": 1.9907282895909302e-05} +{"train_loss": 0.0004972130991518497, "global_step": 50525, "epoch": 424, "lr": 1.9905513606435966e-05} +{"train_loss": 0.00045255577424541116, "global_step": 50526, "epoch": 424, "lr": 1.9903744376049954e-05} +{"train_loss": 0.0010558393551036716, "global_step": 50527, "epoch": 424, "lr": 1.990197520475471e-05} +{"train_loss": 0.0007764638867229223, "global_step": 50528, "epoch": 424, "lr": 1.990020609255374e-05} +{"train_loss": 0.0006069038063287735, "global_step": 50529, "epoch": 424, "lr": 1.9898437039450495e-05} +{"train_loss": 0.0009449017234146595, "global_step": 50530, "epoch": 424, "lr": 1.9896668045448442e-05} +{"train_loss": 0.0011235865531489253, "global_step": 50531, "epoch": 424, "lr": 1.989489911055108e-05} +{"train_loss": 0.0006249031284824014, "global_step": 50532, "epoch": 424, "lr": 1.9893130234761852e-05} +{"train_loss": 0.0004732478701043874, "global_step": 50533, "epoch": 424, "lr": 1.989136141808426e-05} +{"train_loss": 0.0009601498604752123, "global_step": 50534, "epoch": 424, "lr": 1.988959266052175e-05} +{"train_loss": 0.0007477535982616246, "global_step": 50535, "epoch": 424, "lr": 1.9887823962077822e-05} +{"train_loss": 0.00091221381444484, "global_step": 50536, "epoch": 424, "lr": 1.9886055322755938e-05} +{"train_loss": 0.0013707666657865047, "global_step": 50537, "epoch": 424, "lr": 1.9884286742559545e-05} +{"train_loss": 0.0011018837103620172, "global_step": 50538, "epoch": 424, "lr": 1.9882518221492157e-05} +{"train_loss": 0.0008428104920312762, "global_step": 50539, "epoch": 424, "lr": 1.988074975955721e-05} +{"train_loss": 0.0006116597214713693, "global_step": 50540, "epoch": 424, "lr": 1.9878981356758214e-05} +{"train_loss": 0.0009978264570236206, "global_step": 50541, "epoch": 424, "lr": 1.9877213013098594e-05} +{"train_loss": 0.001122629619203508, "global_step": 50542, "epoch": 424, "lr": 1.987544472858187e-05} +{"train_loss": 0.0009519399609416723, "global_step": 50543, "epoch": 424, "lr": 1.9873676503211496e-05} +{"train_loss": 0.0014162039151415229, "global_step": 50544, "epoch": 424, "lr": 1.987190833699092e-05} +{"train_loss": 0.0006942013860680163, "global_step": 50545, "epoch": 424, "lr": 1.9870140229923652e-05} +{"train_loss": 0.0007903825026005507, "global_step": 50546, "epoch": 424, "lr": 1.9868372182013124e-05} +{"train_loss": 0.001179405371658504, "global_step": 50547, "epoch": 424, "lr": 1.9866604193262844e-05} +{"train_loss": 0.000574657169636339, "global_step": 50548, "epoch": 424, "lr": 1.9864836263676273e-05} +{"train_loss": 0.0007588567095808685, "global_step": 50549, "epoch": 424, "lr": 1.986306839325685e-05} +{"train_loss": 0.0013686452293768525, "global_step": 50550, "epoch": 424, "lr": 1.98613005820081e-05} +{"train_loss": 0.0006299111410044134, "global_step": 50551, "epoch": 424, "lr": 1.985953282993345e-05} +{"train_loss": 0.0008616411942057312, "global_step": 50552, "epoch": 424, "lr": 1.9857765137036394e-05} +{"train_loss": 0.0005235158605501056, "global_step": 50553, "epoch": 424, "lr": 1.9855997503320384e-05} +{"train_loss": 0.0013017759192734957, "global_step": 50554, "epoch": 424, "lr": 1.985422992878892e-05} +{"train_loss": 0.0007172178593464196, "global_step": 50555, "epoch": 424, "lr": 1.9852462413445438e-05} +{"train_loss": 0.0010965291876345873, "global_step": 50556, "epoch": 424, "lr": 1.985069495729344e-05} +{"train_loss": 0.0013376724673435092, "global_step": 50557, "epoch": 424, "lr": 1.9848927560336367e-05} +{"train_loss": 0.000987619161605835, "global_step": 50558, "epoch": 424, "lr": 1.9847160222577703e-05} +{"train_loss": 0.0006018236745148897, "global_step": 50559, "epoch": 424, "lr": 1.9845392944020937e-05} +{"train_loss": 0.0007116060587577522, "global_step": 50560, "epoch": 424, "lr": 1.98436257246695e-05} +{"train_loss": 0.0005981535068713129, "global_step": 50561, "epoch": 424, "lr": 1.9841858564526906e-05} +{"train_loss": 0.0007681691204197705, "global_step": 50562, "epoch": 424, "lr": 1.9840091463596594e-05} +{"train_loss": 0.000859603111166507, "global_step": 50563, "epoch": 424, "lr": 1.9838324421882027e-05} +{"train_loss": 0.002122861333191395, "global_step": 50564, "epoch": 424, "lr": 1.9836557439386698e-05} +{"train_loss": 0.0006932577816769481, "global_step": 50565, "epoch": 424, "lr": 1.9834790516114056e-05} +{"train_loss": 0.0004981269012205303, "global_step": 50566, "epoch": 424, "lr": 1.9833023652067594e-05} +{"train_loss": 0.0011011017486453056, "global_step": 50567, "epoch": 424, "lr": 1.9831256847250774e-05} +{"train_loss": 0.0008509145700372756, "global_step": 50568, "epoch": 424, "lr": 1.982949010166703e-05} +{"train_loss": 0.0008228343212977052, "global_step": 50569, "epoch": 424, "lr": 1.982772341531988e-05} +{"train_loss": 0.001118411310017109, "global_step": 50570, "epoch": 424, "lr": 1.9825956788212756e-05} +{"train_loss": 0.0009636408649384975, "global_step": 50571, "epoch": 424, "lr": 1.9824190220349165e-05} +{"train_loss": 0.00042584867333061993, "global_step": 50572, "epoch": 424, "lr": 1.982242371173253e-05} +{"train_loss": 0.0010813288390636444, "global_step": 50573, "epoch": 424, "lr": 1.982065726236636e-05} +{"train_loss": 0.0009149114154729241, "global_step": 50574, "epoch": 424, "lr": 1.9818890872254102e-05, "val_loss": 0.019690748304128647} +{"train_loss": 0.0013271714560687542, "global_step": 50575, "epoch": 425, "lr": 1.9817124541399214e-05} +{"train_loss": 0.0008446081192232668, "global_step": 50576, "epoch": 425, "lr": 1.981535826980519e-05} +{"train_loss": 0.0008061063126660883, "global_step": 50577, "epoch": 425, "lr": 1.9813592057475472e-05} +{"train_loss": 0.0017001715023070574, "global_step": 50578, "epoch": 425, "lr": 1.9811825904413562e-05} +{"train_loss": 0.001386850024573505, "global_step": 50579, "epoch": 425, "lr": 1.98100598106229e-05} +{"train_loss": 0.0015108303632587194, "global_step": 50580, "epoch": 425, "lr": 1.9808293776106944e-05} +{"train_loss": 0.0016901149647310376, "global_step": 50581, "epoch": 425, "lr": 1.9806527800869196e-05} +{"train_loss": 0.0011609464418143034, "global_step": 50582, "epoch": 425, "lr": 1.9804761884913088e-05} +{"train_loss": 0.0008744849474169314, "global_step": 50583, "epoch": 425, "lr": 1.980299602824212e-05} +{"train_loss": 0.0010106703266501427, "global_step": 50584, "epoch": 425, "lr": 1.980123023085973e-05} +{"train_loss": 0.0009157527820207179, "global_step": 50585, "epoch": 425, "lr": 1.979946449276941e-05} +{"train_loss": 0.0008861126261763275, "global_step": 50586, "epoch": 425, "lr": 1.9797698813974603e-05} +{"train_loss": 0.0007519074133597314, "global_step": 50587, "epoch": 425, "lr": 1.97959331944788e-05} +{"train_loss": 0.0007738514104858041, "global_step": 50588, "epoch": 425, "lr": 1.9794167634285444e-05} +{"train_loss": 0.0004067980917170644, "global_step": 50589, "epoch": 425, "lr": 1.9792402133398025e-05} +{"train_loss": 0.0006953711854293942, "global_step": 50590, "epoch": 425, "lr": 1.979063669181998e-05} +{"train_loss": 0.0007743118912912905, "global_step": 50591, "epoch": 425, "lr": 1.978887130955481e-05} +{"train_loss": 0.0010604658164083958, "global_step": 50592, "epoch": 425, "lr": 1.9787105986605948e-05} +{"train_loss": 0.0007488208939321339, "global_step": 50593, "epoch": 425, "lr": 1.9785340722976893e-05} +{"train_loss": 0.0011932303896173835, "global_step": 50594, "epoch": 425, "lr": 1.9783575518671077e-05} +{"train_loss": 0.000488544290419668, "global_step": 50595, "epoch": 425, "lr": 1.9781810373692e-05} +{"train_loss": 0.0010559530928730965, "global_step": 50596, "epoch": 425, "lr": 1.978004528804309e-05} +{"train_loss": 0.0006687511340714991, "global_step": 50597, "epoch": 425, "lr": 1.977828026172785e-05} +{"train_loss": 0.0006668950663879514, "global_step": 50598, "epoch": 425, "lr": 1.9776515294749733e-05} +{"train_loss": 0.0015039329882711172, "global_step": 50599, "epoch": 425, "lr": 1.9774750387112172e-05} +{"train_loss": 0.0006977983866818249, "global_step": 50600, "epoch": 425, "lr": 1.9772985538818682e-05} +{"train_loss": 0.0010974027682095766, "global_step": 50601, "epoch": 425, "lr": 1.9771220749872694e-05} +{"train_loss": 0.0008903826819732785, "global_step": 50602, "epoch": 425, "lr": 1.9769456020277695e-05} +{"train_loss": 0.0004231906495988369, "global_step": 50603, "epoch": 425, "lr": 1.9767691350037127e-05} +{"train_loss": 0.0014494943898171186, "global_step": 50604, "epoch": 425, "lr": 1.9765926739154476e-05} +{"train_loss": 0.0009968902450054884, "global_step": 50605, "epoch": 425, "lr": 1.9764162187633206e-05} +{"train_loss": 0.000666784297209233, "global_step": 50606, "epoch": 425, "lr": 1.9762397695476755e-05} +{"train_loss": 0.0010965712135657668, "global_step": 50607, "epoch": 425, "lr": 1.9760633262688622e-05} +{"train_loss": 0.000793446961324662, "global_step": 50608, "epoch": 425, "lr": 1.9758868889272235e-05} +{"train_loss": 0.0007002718630246818, "global_step": 50609, "epoch": 425, "lr": 1.97571045752311e-05} +{"train_loss": 0.0010090343421325088, "global_step": 50610, "epoch": 425, "lr": 1.9755340320568638e-05} +{"train_loss": 0.0006783285643905401, "global_step": 50611, "epoch": 425, "lr": 1.9753576125288354e-05} +{"train_loss": 0.0004714613314718008, "global_step": 50612, "epoch": 425, "lr": 1.9751811989393686e-05} +{"train_loss": 0.0007999439258128405, "global_step": 50613, "epoch": 425, "lr": 1.9750047912888093e-05} +{"train_loss": 0.0007250115158967674, "global_step": 50614, "epoch": 425, "lr": 1.9748283895775067e-05} +{"train_loss": 0.0009668669663369656, "global_step": 50615, "epoch": 425, "lr": 1.9746519938058032e-05} +{"train_loss": 0.00099473656155169, "global_step": 50616, "epoch": 425, "lr": 1.9744756039740493e-05} +{"train_loss": 0.0009474585531279445, "global_step": 50617, "epoch": 425, "lr": 1.9742992200825893e-05} +{"train_loss": 0.00153727934230119, "global_step": 50618, "epoch": 425, "lr": 1.9741228421317674e-05} +{"train_loss": 0.0007754709804430604, "global_step": 50619, "epoch": 425, "lr": 1.973946470121933e-05} +{"train_loss": 0.0010091037256643176, "global_step": 50620, "epoch": 425, "lr": 1.9737701040534323e-05} +{"train_loss": 0.0010897595202550292, "global_step": 50621, "epoch": 425, "lr": 1.973593743926609e-05} +{"train_loss": 0.0005351649015210569, "global_step": 50622, "epoch": 425, "lr": 1.973417389741813e-05} +{"train_loss": 0.0009006813052110374, "global_step": 50623, "epoch": 425, "lr": 1.9732410414993867e-05} +{"train_loss": 0.0011190014192834496, "global_step": 50624, "epoch": 425, "lr": 1.9730646991996805e-05} +{"train_loss": 0.0008415182237513363, "global_step": 50625, "epoch": 425, "lr": 1.9728883628430363e-05} +{"train_loss": 0.0008316586608998477, "global_step": 50626, "epoch": 425, "lr": 1.9727120324298044e-05} +{"train_loss": 0.0011519133113324642, "global_step": 50627, "epoch": 425, "lr": 1.9725357079603267e-05} +{"train_loss": 0.0011905240826308727, "global_step": 50628, "epoch": 425, "lr": 1.9723593894349535e-05} +{"train_loss": 0.00042996747652068734, "global_step": 50629, "epoch": 425, "lr": 1.9721830768540295e-05} +{"train_loss": 0.000717008369974792, "global_step": 50630, "epoch": 425, "lr": 1.972006770217899e-05} +{"train_loss": 0.0008856384665705264, "global_step": 50631, "epoch": 425, "lr": 1.9718304695269114e-05} +{"train_loss": 0.0009800182888284326, "global_step": 50632, "epoch": 425, "lr": 1.971654174781409e-05} +{"train_loss": 0.0005916044465266168, "global_step": 50633, "epoch": 425, "lr": 1.971477885981742e-05} +{"train_loss": 0.0006040857988409698, "global_step": 50634, "epoch": 425, "lr": 1.971301603128253e-05} +{"train_loss": 0.0009960721945390105, "global_step": 50635, "epoch": 425, "lr": 1.9711253262212913e-05} +{"train_loss": 0.0007252380601130426, "global_step": 50636, "epoch": 425, "lr": 1.9709490552612014e-05} +{"train_loss": 0.0006182160577736795, "global_step": 50637, "epoch": 425, "lr": 1.970772790248328e-05} +{"train_loss": 0.0010649095056578517, "global_step": 50638, "epoch": 425, "lr": 1.97059653118302e-05} +{"train_loss": 0.0006986187654547393, "global_step": 50639, "epoch": 425, "lr": 1.9704202780656205e-05} +{"train_loss": 0.0008539273403584957, "global_step": 50640, "epoch": 425, "lr": 1.9702440308964794e-05} +{"train_loss": 0.0010991679737344384, "global_step": 50641, "epoch": 425, "lr": 1.9700677896759378e-05} +{"train_loss": 0.0008504713186994195, "global_step": 50642, "epoch": 425, "lr": 1.9698915544043468e-05} +{"train_loss": 0.0008284256909973919, "global_step": 50643, "epoch": 425, "lr": 1.9697153250820493e-05} +{"train_loss": 0.0008772214059717953, "global_step": 50644, "epoch": 425, "lr": 1.9695391017093907e-05} +{"train_loss": 0.0010045765666291118, "global_step": 50645, "epoch": 425, "lr": 1.9693628842867203e-05} +{"train_loss": 0.0005691006081178784, "global_step": 50646, "epoch": 425, "lr": 1.96918667281438e-05} +{"train_loss": 0.0013156214263290167, "global_step": 50647, "epoch": 425, "lr": 1.9690104672927196e-05} +{"train_loss": 0.0008798250928521156, "global_step": 50648, "epoch": 425, "lr": 1.968834267722084e-05} +{"train_loss": 0.0008252388215623796, "global_step": 50649, "epoch": 425, "lr": 1.968658074102816e-05} +{"train_loss": 0.000609966111369431, "global_step": 50650, "epoch": 425, "lr": 1.968481886435266e-05} +{"train_loss": 0.0007859386969357729, "global_step": 50651, "epoch": 425, "lr": 1.968305704719776e-05} +{"train_loss": 0.00046495249262079597, "global_step": 50652, "epoch": 425, "lr": 1.9681295289566958e-05} +{"train_loss": 0.0007405172218568623, "global_step": 50653, "epoch": 425, "lr": 1.9679533591463677e-05} +{"train_loss": 0.0008209199295379221, "global_step": 50654, "epoch": 425, "lr": 1.967777195289139e-05} +{"train_loss": 0.0005639342125505209, "global_step": 50655, "epoch": 425, "lr": 1.9676010373853577e-05} +{"train_loss": 0.0006698080105707049, "global_step": 50656, "epoch": 425, "lr": 1.967424885435366e-05} +{"train_loss": 0.0008032082696445286, "global_step": 50657, "epoch": 425, "lr": 1.9672487394395135e-05} +{"train_loss": 0.0006642274674959481, "global_step": 50658, "epoch": 425, "lr": 1.967072599398142e-05} +{"train_loss": 0.0011068818857893348, "global_step": 50659, "epoch": 425, "lr": 1.966896465311602e-05} +{"train_loss": 0.0006902147433720529, "global_step": 50660, "epoch": 425, "lr": 1.966720337180234e-05} +{"train_loss": 0.0013740337453782558, "global_step": 50661, "epoch": 425, "lr": 1.966544215004389e-05} +{"train_loss": 0.0006844153976999223, "global_step": 50662, "epoch": 425, "lr": 1.9663680987844102e-05} +{"train_loss": 0.000465253135189414, "global_step": 50663, "epoch": 425, "lr": 1.9661919885206416e-05} +{"train_loss": 0.000783436989877373, "global_step": 50664, "epoch": 425, "lr": 1.9660158842134326e-05} +{"train_loss": 0.0009059914154931903, "global_step": 50665, "epoch": 425, "lr": 1.9658397858631254e-05} +{"train_loss": 0.001418420346453786, "global_step": 50666, "epoch": 425, "lr": 1.96566369347007e-05} +{"train_loss": 0.0006952023832127452, "global_step": 50667, "epoch": 425, "lr": 1.9654876070346095e-05} +{"train_loss": 0.0007655321969650686, "global_step": 50668, "epoch": 425, "lr": 1.9653115265570875e-05} +{"train_loss": 0.0010409923270344734, "global_step": 50669, "epoch": 425, "lr": 1.9651354520378544e-05} +{"train_loss": 0.001033899374306202, "global_step": 50670, "epoch": 425, "lr": 1.964959383477252e-05} +{"train_loss": 0.0010096521582454443, "global_step": 50671, "epoch": 425, "lr": 1.9647833208756293e-05} +{"train_loss": 0.0005851071327924728, "global_step": 50672, "epoch": 425, "lr": 1.9646072642333285e-05} +{"train_loss": 0.0007358562434092164, "global_step": 50673, "epoch": 425, "lr": 1.9644312135506986e-05} +{"train_loss": 0.0009828782640397549, "global_step": 50674, "epoch": 425, "lr": 1.9642551688280843e-05} +{"train_loss": 0.0009032065281644464, "global_step": 50675, "epoch": 425, "lr": 1.9640791300658284e-05} +{"train_loss": 0.0008318615728057921, "global_step": 50676, "epoch": 425, "lr": 1.963903097264281e-05} +{"train_loss": 0.0008436136995442212, "global_step": 50677, "epoch": 425, "lr": 1.963727070423783e-05} +{"train_loss": 0.0006082881009206176, "global_step": 50678, "epoch": 425, "lr": 1.9635510495446846e-05} +{"train_loss": 0.001450620940886438, "global_step": 50679, "epoch": 425, "lr": 1.9633750346273277e-05} +{"train_loss": 0.0013565027620643377, "global_step": 50680, "epoch": 425, "lr": 1.9631990256720613e-05} +{"train_loss": 0.0006900860462337732, "global_step": 50681, "epoch": 425, "lr": 1.963023022679229e-05} +{"train_loss": 0.001202849205583334, "global_step": 50682, "epoch": 425, "lr": 1.962847025649175e-05} +{"train_loss": 0.0003664691757876426, "global_step": 50683, "epoch": 425, "lr": 1.962671034582248e-05} +{"train_loss": 0.0005904013523831964, "global_step": 50684, "epoch": 425, "lr": 1.96249504947879e-05} +{"train_loss": 0.001585109275765717, "global_step": 50685, "epoch": 425, "lr": 1.9623190703391502e-05} +{"train_loss": 0.000651558511890471, "global_step": 50686, "epoch": 425, "lr": 1.9621430971636712e-05} +{"train_loss": 0.00044290474033914506, "global_step": 50687, "epoch": 425, "lr": 1.961967129952701e-05} +{"train_loss": 0.0008683069609105587, "global_step": 50688, "epoch": 425, "lr": 1.9617911687065822e-05} +{"train_loss": 0.0006407614564523101, "global_step": 50689, "epoch": 425, "lr": 1.9616152134256615e-05} +{"train_loss": 0.0009920790325850248, "global_step": 50690, "epoch": 425, "lr": 1.9614392641102864e-05} +{"train_loss": 0.0006574906292371452, "global_step": 50691, "epoch": 425, "lr": 1.9612633207607995e-05} +{"train_loss": 0.0011392714222893119, "global_step": 50692, "epoch": 425, "lr": 1.961087383377549e-05} +{"train_loss": 0.0008884237011886758, "global_step": 50693, "epoch": 425, "lr": 1.9609114519608784e-05, "val_loss": 0.06875632703304291, "train_action_mse_error": 1.4198098142514937e-05} +{"train_loss": 0.0006177018512971699, "global_step": 50694, "epoch": 426, "lr": 1.9607355265111322e-05} +{"train_loss": 0.0009144331561401486, "global_step": 50695, "epoch": 426, "lr": 1.9605596070286587e-05} +{"train_loss": 0.0007275072275660932, "global_step": 50696, "epoch": 426, "lr": 1.9603836935138e-05} +{"train_loss": 0.0006572582060471177, "global_step": 50697, "epoch": 426, "lr": 1.9602077859669043e-05} +{"train_loss": 0.0006813200889155269, "global_step": 50698, "epoch": 426, "lr": 1.9600318843883166e-05} +{"train_loss": 0.0005683537456206977, "global_step": 50699, "epoch": 426, "lr": 1.9598559887783797e-05} +{"train_loss": 0.0009219280909746885, "global_step": 50700, "epoch": 426, "lr": 1.959680099137442e-05} +{"train_loss": 0.0006420755526050925, "global_step": 50701, "epoch": 426, "lr": 1.9595042154658465e-05} +{"train_loss": 0.0006157752359285951, "global_step": 50702, "epoch": 426, "lr": 1.959328337763941e-05} +{"train_loss": 0.0006267050630412996, "global_step": 50703, "epoch": 426, "lr": 1.959152466032068e-05} +{"train_loss": 0.0006389611517079175, "global_step": 50704, "epoch": 426, "lr": 1.9589766002705756e-05} +{"train_loss": 0.000474532280350104, "global_step": 50705, "epoch": 426, "lr": 1.958800740479808e-05} +{"train_loss": 0.0003795181692112237, "global_step": 50706, "epoch": 426, "lr": 1.9586248866601086e-05} +{"train_loss": 0.001540651312097907, "global_step": 50707, "epoch": 426, "lr": 1.958449038811826e-05} +{"train_loss": 0.001210915856063366, "global_step": 50708, "epoch": 426, "lr": 1.9582731969353026e-05} +{"train_loss": 0.0005102597060613334, "global_step": 50709, "epoch": 426, "lr": 1.9580973610308855e-05} +{"train_loss": 0.000489126134198159, "global_step": 50710, "epoch": 426, "lr": 1.9579215310989178e-05} +{"train_loss": 0.000673956295941025, "global_step": 50711, "epoch": 426, "lr": 1.957745707139748e-05} +{"train_loss": 0.0011837518541142344, "global_step": 50712, "epoch": 426, "lr": 1.9575698891537198e-05} +{"train_loss": 0.0003574084839783609, "global_step": 50713, "epoch": 426, "lr": 1.9573940771411765e-05} +{"train_loss": 0.0010608070297166705, "global_step": 50714, "epoch": 426, "lr": 1.957218271102466e-05} +{"train_loss": 0.0005409064469859004, "global_step": 50715, "epoch": 426, "lr": 1.957042471037931e-05} +{"train_loss": 0.0007347495411522686, "global_step": 50716, "epoch": 426, "lr": 1.9568666769479195e-05} +{"train_loss": 0.0015231323195621371, "global_step": 50717, "epoch": 426, "lr": 1.9566908888327734e-05} +{"train_loss": 0.00036981209996156394, "global_step": 50718, "epoch": 426, "lr": 1.9565151066928416e-05} +{"train_loss": 0.0007018253090791404, "global_step": 50719, "epoch": 426, "lr": 1.9563393305284654e-05} +{"train_loss": 0.00121829635463655, "global_step": 50720, "epoch": 426, "lr": 1.9561635603399937e-05} +{"train_loss": 0.0007195848156698048, "global_step": 50721, "epoch": 426, "lr": 1.9559877961277674e-05} +{"train_loss": 0.0015754825435578823, "global_step": 50722, "epoch": 426, "lr": 1.9558120378921358e-05} +{"train_loss": 0.0005290606641210616, "global_step": 50723, "epoch": 426, "lr": 1.9556362856334403e-05} +{"train_loss": 0.0008195914560928941, "global_step": 50724, "epoch": 426, "lr": 1.9554605393520297e-05} +{"train_loss": 0.0006629123818129301, "global_step": 50725, "epoch": 426, "lr": 1.9552847990482455e-05} +{"train_loss": 0.0003518140292726457, "global_step": 50726, "epoch": 426, "lr": 1.9551090647224356e-05} +{"train_loss": 0.0005560882855206728, "global_step": 50727, "epoch": 426, "lr": 1.9549333363749422e-05} +{"train_loss": 0.0012357395607978106, "global_step": 50728, "epoch": 426, "lr": 1.9547576140061136e-05} +{"train_loss": 0.0007661322015337646, "global_step": 50729, "epoch": 426, "lr": 1.954581897616291e-05} +{"train_loss": 0.0007960272487252951, "global_step": 50730, "epoch": 426, "lr": 1.954406187205824e-05} +{"train_loss": 0.0007007693056948483, "global_step": 50731, "epoch": 426, "lr": 1.9542304827750546e-05} +{"train_loss": 0.0011717919260263443, "global_step": 50732, "epoch": 426, "lr": 1.9540547843243263e-05} +{"train_loss": 0.0006180992349982262, "global_step": 50733, "epoch": 426, "lr": 1.9538790918539878e-05} +{"train_loss": 0.0006325493450276554, "global_step": 50734, "epoch": 426, "lr": 1.953703405364381e-05} +{"train_loss": 0.0006275557680055499, "global_step": 50735, "epoch": 426, "lr": 1.9535277248558538e-05} +{"train_loss": 0.0014722902560606599, "global_step": 50736, "epoch": 426, "lr": 1.953352050328749e-05} +{"train_loss": 0.0009745082934387028, "global_step": 50737, "epoch": 426, "lr": 1.9531763817834102e-05} +{"train_loss": 0.0011433804174885154, "global_step": 50738, "epoch": 426, "lr": 1.9530007192201866e-05} +{"train_loss": 0.0008013630867935717, "global_step": 50739, "epoch": 426, "lr": 1.952825062639418e-05} +{"train_loss": 0.0006389227928593755, "global_step": 50740, "epoch": 426, "lr": 1.952649412041454e-05} +{"train_loss": 0.0011928159510716796, "global_step": 50741, "epoch": 426, "lr": 1.9524737674266352e-05} +{"train_loss": 0.0005696261650882661, "global_step": 50742, "epoch": 426, "lr": 1.9522981287953107e-05} +{"train_loss": 0.0011128493351861835, "global_step": 50743, "epoch": 426, "lr": 1.952122496147823e-05} +{"train_loss": 0.0005168546340428293, "global_step": 50744, "epoch": 426, "lr": 1.9519468694845156e-05} +{"train_loss": 0.0008466959116049111, "global_step": 50745, "epoch": 426, "lr": 1.9517712488057366e-05} +{"train_loss": 0.000825761235319078, "global_step": 50746, "epoch": 426, "lr": 1.9515956341118275e-05} +{"train_loss": 0.0005769659765064716, "global_step": 50747, "epoch": 426, "lr": 1.951420025403136e-05} +{"train_loss": 0.0004957120981998742, "global_step": 50748, "epoch": 426, "lr": 1.951244422680004e-05} +{"train_loss": 0.0006053642136976123, "global_step": 50749, "epoch": 426, "lr": 1.95106882594278e-05} +{"train_loss": 0.0010627307929098606, "global_step": 50750, "epoch": 426, "lr": 1.9508932351918062e-05} +{"train_loss": 0.0003562714555300772, "global_step": 50751, "epoch": 426, "lr": 1.950717650427426e-05} +{"train_loss": 0.0011321024503558874, "global_step": 50752, "epoch": 426, "lr": 1.950542071649986e-05} +{"train_loss": 0.0009717194479890168, "global_step": 50753, "epoch": 426, "lr": 1.950366498859833e-05} +{"train_loss": 0.0012781450059264898, "global_step": 50754, "epoch": 426, "lr": 1.9501909320573075e-05} +{"train_loss": 0.0008556183893233538, "global_step": 50755, "epoch": 426, "lr": 1.9500153712427575e-05} +{"train_loss": 0.0003197255136910826, "global_step": 50756, "epoch": 426, "lr": 1.9498398164165255e-05} +{"train_loss": 0.0007516665500588715, "global_step": 50757, "epoch": 426, "lr": 1.9496642675789588e-05} +{"train_loss": 0.00032687641214579344, "global_step": 50758, "epoch": 426, "lr": 1.9494887247303988e-05} +{"train_loss": 0.0006205906975083053, "global_step": 50759, "epoch": 426, "lr": 1.9493131878711928e-05} +{"train_loss": 0.0007675564265809953, "global_step": 50760, "epoch": 426, "lr": 1.9491376570016835e-05} +{"train_loss": 0.0011481612455099821, "global_step": 50761, "epoch": 426, "lr": 1.948962132122218e-05} +{"train_loss": 0.0008709745015949011, "global_step": 50762, "epoch": 426, "lr": 1.9487866132331395e-05} +{"train_loss": 0.0004867670650128275, "global_step": 50763, "epoch": 426, "lr": 1.94861110033479e-05} +{"train_loss": 0.0007355874986387789, "global_step": 50764, "epoch": 426, "lr": 1.9484355934275196e-05} +{"train_loss": 0.0006842355360276997, "global_step": 50765, "epoch": 426, "lr": 1.948260092511667e-05} +{"train_loss": 0.0008103580330498517, "global_step": 50766, "epoch": 426, "lr": 1.948084597587582e-05} +{"train_loss": 0.0011438996298238635, "global_step": 50767, "epoch": 426, "lr": 1.9479091086556067e-05} +{"train_loss": 0.0009970193495973945, "global_step": 50768, "epoch": 426, "lr": 1.9477336257160845e-05} +{"train_loss": 0.0007549553993158042, "global_step": 50769, "epoch": 426, "lr": 1.9475581487693624e-05} +{"train_loss": 0.0006524295313283801, "global_step": 50770, "epoch": 426, "lr": 1.9473826778157823e-05} +{"train_loss": 0.0005365373799577355, "global_step": 50771, "epoch": 426, "lr": 1.9472072128556917e-05} +{"train_loss": 0.0004065929097123444, "global_step": 50772, "epoch": 426, "lr": 1.9470317538894316e-05} +{"train_loss": 0.00046084943460300565, "global_step": 50773, "epoch": 426, "lr": 1.9468563009173513e-05} +{"train_loss": 0.0006734667695127428, "global_step": 50774, "epoch": 426, "lr": 1.9466808539397913e-05} +{"train_loss": 0.0005930010229349136, "global_step": 50775, "epoch": 426, "lr": 1.9465054129570964e-05} +{"train_loss": 0.0007046341779641807, "global_step": 50776, "epoch": 426, "lr": 1.9463299779696133e-05} +{"train_loss": 0.0019398696022108197, "global_step": 50777, "epoch": 426, "lr": 1.946154548977683e-05} +{"train_loss": 0.0005243827472440898, "global_step": 50778, "epoch": 426, "lr": 1.945979125981654e-05} +{"train_loss": 0.0009115315042436123, "global_step": 50779, "epoch": 426, "lr": 1.945803708981867e-05} +{"train_loss": 0.0005994471139274538, "global_step": 50780, "epoch": 426, "lr": 1.94562829797867e-05} +{"train_loss": 0.0004630348994396627, "global_step": 50781, "epoch": 426, "lr": 1.9454528929724052e-05} +{"train_loss": 0.0006026716437190771, "global_step": 50782, "epoch": 426, "lr": 1.9452774939634157e-05} +{"train_loss": 0.0007437544409185648, "global_step": 50783, "epoch": 426, "lr": 1.9451021009520493e-05} +{"train_loss": 0.000863761524669826, "global_step": 50784, "epoch": 426, "lr": 1.9449267139386468e-05} +{"train_loss": 0.0008210517698898911, "global_step": 50785, "epoch": 426, "lr": 1.9447513329235563e-05} +{"train_loss": 0.0007759842555969954, "global_step": 50786, "epoch": 426, "lr": 1.9445759579071178e-05} +{"train_loss": 0.0015826841117814183, "global_step": 50787, "epoch": 426, "lr": 1.944400588889678e-05} +{"train_loss": 0.0010260601993650198, "global_step": 50788, "epoch": 426, "lr": 1.9442252258715836e-05} +{"train_loss": 0.0014440041268244386, "global_step": 50789, "epoch": 426, "lr": 1.9440498688531744e-05} +{"train_loss": 0.00044911657460033894, "global_step": 50790, "epoch": 426, "lr": 1.9438745178347985e-05} +{"train_loss": 0.00041879230411723256, "global_step": 50791, "epoch": 426, "lr": 1.943699172816797e-05} +{"train_loss": 0.0007579055964015424, "global_step": 50792, "epoch": 426, "lr": 1.943523833799517e-05} +{"train_loss": 0.0005510028568096459, "global_step": 50793, "epoch": 426, "lr": 1.943348500783302e-05} +{"train_loss": 0.0007930430001579225, "global_step": 50794, "epoch": 426, "lr": 1.943173173768493e-05} +{"train_loss": 0.000653261668048799, "global_step": 50795, "epoch": 426, "lr": 1.9429978527554395e-05} +{"train_loss": 0.0007654256769455969, "global_step": 50796, "epoch": 426, "lr": 1.942822537744481e-05} +{"train_loss": 0.000902252912055701, "global_step": 50797, "epoch": 426, "lr": 1.942647228735966e-05} +{"train_loss": 0.0015257903141900897, "global_step": 50798, "epoch": 426, "lr": 1.9424719257302344e-05} +{"train_loss": 0.0009658327326178551, "global_step": 50799, "epoch": 426, "lr": 1.942296628727634e-05} +{"train_loss": 0.0007730049546808004, "global_step": 50800, "epoch": 426, "lr": 1.9421213377285082e-05} +{"train_loss": 0.00036154751433059573, "global_step": 50801, "epoch": 426, "lr": 1.941946052733198e-05} +{"train_loss": 0.0006252906168811023, "global_step": 50802, "epoch": 426, "lr": 1.9417707737420522e-05} +{"train_loss": 0.001187743153423071, "global_step": 50803, "epoch": 426, "lr": 1.941595500755411e-05} +{"train_loss": 0.0007862380007281899, "global_step": 50804, "epoch": 426, "lr": 1.941420233773622e-05} +{"train_loss": 0.0011372625594958663, "global_step": 50805, "epoch": 426, "lr": 1.941244972797027e-05} +{"train_loss": 0.0009466136689297855, "global_step": 50806, "epoch": 426, "lr": 1.9410697178259702e-05} +{"train_loss": 0.00079290138091892, "global_step": 50807, "epoch": 426, "lr": 1.940894468860797e-05} +{"train_loss": 0.001242846599780023, "global_step": 50808, "epoch": 426, "lr": 1.9407192259018492e-05} +{"train_loss": 0.0006327616283670068, "global_step": 50809, "epoch": 426, "lr": 1.940543988949474e-05} +{"train_loss": 0.00042505550663918257, "global_step": 50810, "epoch": 426, "lr": 1.9403687580040125e-05} +{"train_loss": 0.0008879480883479118, "global_step": 50811, "epoch": 426, "lr": 1.9401935330658116e-05} +{"train_loss": 0.0007957107054378774, "global_step": 50812, "epoch": 426, "lr": 1.9400183141352134e-05, "val_loss": 0.0367237851023674} +{"train_loss": 0.0007781682070344687, "global_step": 50813, "epoch": 427, "lr": 1.939843101212561e-05} +{"train_loss": 0.0015782794216647744, "global_step": 50814, "epoch": 427, "lr": 1.9396678942982017e-05} +{"train_loss": 0.0010637248633429408, "global_step": 50815, "epoch": 427, "lr": 1.9394926933924756e-05} +{"train_loss": 0.0004197148373350501, "global_step": 50816, "epoch": 427, "lr": 1.9393174984957302e-05} +{"train_loss": 0.0004769067745655775, "global_step": 50817, "epoch": 427, "lr": 1.9391423096083062e-05} +{"train_loss": 0.0007100683287717402, "global_step": 50818, "epoch": 427, "lr": 1.9389671267305508e-05} +{"train_loss": 0.0006987799424678087, "global_step": 50819, "epoch": 427, "lr": 1.9387919498628055e-05} +{"train_loss": 0.0015251566655933857, "global_step": 50820, "epoch": 427, "lr": 1.938616779005416e-05} +{"train_loss": 0.0007951685693114996, "global_step": 50821, "epoch": 427, "lr": 1.9384416141587243e-05} +{"train_loss": 0.000748041900806129, "global_step": 50822, "epoch": 427, "lr": 1.938266455323075e-05} +{"train_loss": 0.0004711463989224285, "global_step": 50823, "epoch": 427, "lr": 1.938091302498814e-05} +{"train_loss": 0.0008767537656240165, "global_step": 50824, "epoch": 427, "lr": 1.937916155686284e-05} +{"train_loss": 0.0004444051010068506, "global_step": 50825, "epoch": 427, "lr": 1.9377410148858267e-05} +{"train_loss": 0.00061744824051857, "global_step": 50826, "epoch": 427, "lr": 1.9375658800977896e-05} +{"train_loss": 0.0009368098108097911, "global_step": 50827, "epoch": 427, "lr": 1.9373907513225127e-05} +{"train_loss": 0.0007681773276999593, "global_step": 50828, "epoch": 427, "lr": 1.9372156285603437e-05} +{"train_loss": 0.0006664030370302498, "global_step": 50829, "epoch": 427, "lr": 1.937040511811623e-05} +{"train_loss": 0.0007111456943675876, "global_step": 50830, "epoch": 427, "lr": 1.9368654010766972e-05} +{"train_loss": 0.0006995013682171702, "global_step": 50831, "epoch": 427, "lr": 1.93669029635591e-05} +{"train_loss": 0.0008674172568134964, "global_step": 50832, "epoch": 427, "lr": 1.9365151976496016e-05} +{"train_loss": 0.00045055957161821425, "global_step": 50833, "epoch": 427, "lr": 1.9363401049581203e-05} +{"train_loss": 0.0007117765489965677, "global_step": 50834, "epoch": 427, "lr": 1.936165018281806e-05} +{"train_loss": 0.0006909029907546937, "global_step": 50835, "epoch": 427, "lr": 1.935989937621006e-05} +{"train_loss": 0.0008604524191468954, "global_step": 50836, "epoch": 427, "lr": 1.935814862976063e-05} +{"train_loss": 0.0006926209316588938, "global_step": 50837, "epoch": 427, "lr": 1.9356397943473183e-05} +{"train_loss": 0.0005238840822130442, "global_step": 50838, "epoch": 427, "lr": 1.9354647317351188e-05} +{"train_loss": 0.0007833718555048108, "global_step": 50839, "epoch": 427, "lr": 1.9352896751398053e-05} +{"train_loss": 0.000548811221960932, "global_step": 50840, "epoch": 427, "lr": 1.9351146245617248e-05} +{"train_loss": 0.00047699749120511115, "global_step": 50841, "epoch": 427, "lr": 1.9349395800012178e-05} +{"train_loss": 0.00048765013343654573, "global_step": 50842, "epoch": 427, "lr": 1.9347645414586308e-05} +{"train_loss": 0.0004174509958829731, "global_step": 50843, "epoch": 427, "lr": 1.9345895089343064e-05} +{"train_loss": 0.0004101695667486638, "global_step": 50844, "epoch": 427, "lr": 1.9344144824285864e-05} +{"train_loss": 0.0017499823588877916, "global_step": 50845, "epoch": 427, "lr": 1.9342394619418176e-05} +{"train_loss": 0.0005367903504520655, "global_step": 50846, "epoch": 427, "lr": 1.9340644474743406e-05} +{"train_loss": 0.001126733492128551, "global_step": 50847, "epoch": 427, "lr": 1.9338894390265022e-05} +{"train_loss": 0.0009836307726800442, "global_step": 50848, "epoch": 427, "lr": 1.9337144365986425e-05} +{"train_loss": 0.0011267511872574687, "global_step": 50849, "epoch": 427, "lr": 1.9335394401911084e-05} +{"train_loss": 0.0002995489339809865, "global_step": 50850, "epoch": 427, "lr": 1.9333644498042408e-05} +{"train_loss": 0.0007822156185284257, "global_step": 50851, "epoch": 427, "lr": 1.933189465438386e-05} +{"train_loss": 0.0008331550634466112, "global_step": 50852, "epoch": 427, "lr": 1.9330144870938836e-05} +{"train_loss": 0.0007743145688436925, "global_step": 50853, "epoch": 427, "lr": 1.9328395147710822e-05} +{"train_loss": 0.0005042634438723326, "global_step": 50854, "epoch": 427, "lr": 1.932664548470321e-05} +{"train_loss": 0.0009779164101928473, "global_step": 50855, "epoch": 427, "lr": 1.9324895881919464e-05} +{"train_loss": 0.0008421273087151349, "global_step": 50856, "epoch": 427, "lr": 1.9323146339362995e-05} +{"train_loss": 0.0011813441524282098, "global_step": 50857, "epoch": 427, "lr": 1.9321396857037267e-05} +{"train_loss": 0.0008006394491530955, "global_step": 50858, "epoch": 427, "lr": 1.931964743494568e-05} +{"train_loss": 0.0014398513594642282, "global_step": 50859, "epoch": 427, "lr": 1.9317898073091704e-05} +{"train_loss": 0.0008733239956200123, "global_step": 50860, "epoch": 427, "lr": 1.9316148771478748e-05} +{"train_loss": 0.0005781198851764202, "global_step": 50861, "epoch": 427, "lr": 1.9314399530110267e-05} +{"train_loss": 0.0008230138919316232, "global_step": 50862, "epoch": 427, "lr": 1.9312650348989686e-05} +{"train_loss": 0.0005764259258285165, "global_step": 50863, "epoch": 427, "lr": 1.9310901228120414e-05} +{"train_loss": 0.0007067606202326715, "global_step": 50864, "epoch": 427, "lr": 1.9309152167505932e-05} +{"train_loss": 0.000864281493704766, "global_step": 50865, "epoch": 427, "lr": 1.9307403167149635e-05} +{"train_loss": 0.0004436922026798129, "global_step": 50866, "epoch": 427, "lr": 1.9305654227054986e-05} +{"train_loss": 0.0010851469123736024, "global_step": 50867, "epoch": 427, "lr": 1.9303905347225392e-05} +{"train_loss": 0.0008254334679804742, "global_step": 50868, "epoch": 427, "lr": 1.9302156527664317e-05} +{"train_loss": 0.0006873974925838411, "global_step": 50869, "epoch": 427, "lr": 1.9300407768375172e-05} +{"train_loss": 0.0013743246672675014, "global_step": 50870, "epoch": 427, "lr": 1.9298659069361387e-05} +{"train_loss": 0.0009313856135122478, "global_step": 50871, "epoch": 427, "lr": 1.929691043062642e-05} +{"train_loss": 0.0007267420296557248, "global_step": 50872, "epoch": 427, "lr": 1.929516185217367e-05} +{"train_loss": 0.001076441491022706, "global_step": 50873, "epoch": 427, "lr": 1.929341333400661e-05} +{"train_loss": 0.0009685197146609426, "global_step": 50874, "epoch": 427, "lr": 1.9291664876128653e-05} +{"train_loss": 0.0011453169863671064, "global_step": 50875, "epoch": 427, "lr": 1.9289916478543207e-05} +{"train_loss": 0.0005877023795619607, "global_step": 50876, "epoch": 427, "lr": 1.9288168141253754e-05} +{"train_loss": 0.000631809642072767, "global_step": 50877, "epoch": 427, "lr": 1.928641986426368e-05} +{"train_loss": 0.0007186147850006819, "global_step": 50878, "epoch": 427, "lr": 1.9284671647576457e-05} +{"train_loss": 0.0008958809776231647, "global_step": 50879, "epoch": 427, "lr": 1.9282923491195488e-05} +{"train_loss": 0.0006862807204015553, "global_step": 50880, "epoch": 427, "lr": 1.928117539512423e-05} +{"train_loss": 0.0011274887947365642, "global_step": 50881, "epoch": 427, "lr": 1.92794273593661e-05} +{"train_loss": 0.0008654982084408402, "global_step": 50882, "epoch": 427, "lr": 1.927767938392452e-05} +{"train_loss": 0.0011381754884496331, "global_step": 50883, "epoch": 427, "lr": 1.9275931468802942e-05} +{"train_loss": 0.0008300618501380086, "global_step": 50884, "epoch": 427, "lr": 1.927418361400478e-05} +{"train_loss": 0.0007283826125785708, "global_step": 50885, "epoch": 427, "lr": 1.9272435819533478e-05} +{"train_loss": 0.0006178960902616382, "global_step": 50886, "epoch": 427, "lr": 1.927068808539248e-05} +{"train_loss": 0.0008092031930573285, "global_step": 50887, "epoch": 427, "lr": 1.9268940411585185e-05} +{"train_loss": 0.0010144629050046206, "global_step": 50888, "epoch": 427, "lr": 1.9267192798115062e-05} +{"train_loss": 0.0010885358788073063, "global_step": 50889, "epoch": 427, "lr": 1.9265445244985503e-05} +{"train_loss": 0.0016160925151780248, "global_step": 50890, "epoch": 427, "lr": 1.9263697752199977e-05} +{"train_loss": 0.0006674457690678537, "global_step": 50891, "epoch": 427, "lr": 1.9261950319761886e-05} +{"train_loss": 0.0009131776168942451, "global_step": 50892, "epoch": 427, "lr": 1.9260202947674676e-05} +{"train_loss": 0.0009049890213645995, "global_step": 50893, "epoch": 427, "lr": 1.9258455635941785e-05} +{"train_loss": 0.0009767881128937006, "global_step": 50894, "epoch": 427, "lr": 1.925670838456661e-05} +{"train_loss": 0.0016300949500873685, "global_step": 50895, "epoch": 427, "lr": 1.9254961193552617e-05} +{"train_loss": 0.0006699446821585298, "global_step": 50896, "epoch": 427, "lr": 1.9253214062903213e-05} +{"train_loss": 0.0009637202601879835, "global_step": 50897, "epoch": 427, "lr": 1.9251466992621852e-05} +{"train_loss": 0.0010499429190531373, "global_step": 50898, "epoch": 427, "lr": 1.9249719982711933e-05} +{"train_loss": 0.001343972864560783, "global_step": 50899, "epoch": 427, "lr": 1.924797303317692e-05} +{"train_loss": 0.0005683833151124418, "global_step": 50900, "epoch": 427, "lr": 1.924622614402023e-05} +{"train_loss": 0.0010304456809535623, "global_step": 50901, "epoch": 427, "lr": 1.9244479315245267e-05} +{"train_loss": 0.0009294679621234536, "global_step": 50902, "epoch": 427, "lr": 1.9242732546855508e-05} +{"train_loss": 0.0021232974249869585, "global_step": 50903, "epoch": 427, "lr": 1.9240985838854336e-05} +{"train_loss": 0.001108219032175839, "global_step": 50904, "epoch": 427, "lr": 1.9239239191245217e-05} +{"train_loss": 0.0006128665991127491, "global_step": 50905, "epoch": 427, "lr": 1.923749260403157e-05} +{"train_loss": 0.0016389403026551008, "global_step": 50906, "epoch": 427, "lr": 1.92357460772168e-05} +{"train_loss": 0.0010477884206920862, "global_step": 50907, "epoch": 427, "lr": 1.9233999610804376e-05} +{"train_loss": 0.0011129085905849934, "global_step": 50908, "epoch": 427, "lr": 1.9232253204797683e-05} +{"train_loss": 0.0006916362326592207, "global_step": 50909, "epoch": 427, "lr": 1.9230506859200197e-05} +{"train_loss": 0.0013372768880799413, "global_step": 50910, "epoch": 427, "lr": 1.9228760574015304e-05} +{"train_loss": 0.0012104756897315383, "global_step": 50911, "epoch": 427, "lr": 1.922701434924647e-05} +{"train_loss": 0.0010545726399868727, "global_step": 50912, "epoch": 427, "lr": 1.922526818489711e-05} +{"train_loss": 0.0018589015817269683, "global_step": 50913, "epoch": 427, "lr": 1.9223522080970624e-05} +{"train_loss": 0.0006803999422118068, "global_step": 50914, "epoch": 427, "lr": 1.9221776037470485e-05} +{"train_loss": 0.0004972356837242842, "global_step": 50915, "epoch": 427, "lr": 1.9220030054400086e-05} +{"train_loss": 0.0008346362737938762, "global_step": 50916, "epoch": 427, "lr": 1.921828413176288e-05} +{"train_loss": 0.0021483823657035828, "global_step": 50917, "epoch": 427, "lr": 1.9216538269562274e-05} +{"train_loss": 0.0005573040107265115, "global_step": 50918, "epoch": 427, "lr": 1.9214792467801717e-05} +{"train_loss": 0.0008897960069589317, "global_step": 50919, "epoch": 427, "lr": 1.9213046726484614e-05} +{"train_loss": 0.0018448734190315008, "global_step": 50920, "epoch": 427, "lr": 1.9211301045614404e-05} +{"train_loss": 0.000532700156327337, "global_step": 50921, "epoch": 427, "lr": 1.920955542519453e-05} +{"train_loss": 0.0006886043702252209, "global_step": 50922, "epoch": 427, "lr": 1.9207809865228388e-05} +{"train_loss": 0.001456945901736617, "global_step": 50923, "epoch": 427, "lr": 1.920606436571944e-05} +{"train_loss": 0.0011225573252886534, "global_step": 50924, "epoch": 427, "lr": 1.9204318926671094e-05} +{"train_loss": 0.002280622720718384, "global_step": 50925, "epoch": 427, "lr": 1.920257354808676e-05} +{"train_loss": 0.0018647420220077038, "global_step": 50926, "epoch": 427, "lr": 1.9200828229969903e-05} +{"train_loss": 0.0013868758687749505, "global_step": 50927, "epoch": 427, "lr": 1.919908297232391e-05} +{"train_loss": 0.0008503125282004476, "global_step": 50928, "epoch": 427, "lr": 1.9197337775152242e-05} +{"train_loss": 0.0007467906107194722, "global_step": 50929, "epoch": 427, "lr": 1.91955926384583e-05} +{"train_loss": 0.0007663509459234774, "global_step": 50930, "epoch": 427, "lr": 1.9193847562245533e-05} +{"train_loss": 0.0009199686885513991, "global_step": 50931, "epoch": 427, "lr": 1.9192102546517354e-05, "val_loss": 0.03558734059333801} +{"train_loss": 0.0011184788309037685, "global_step": 50932, "epoch": 428, "lr": 1.9190357591277174e-05} +{"train_loss": 0.0013429060345515609, "global_step": 50933, "epoch": 428, "lr": 1.918861269652845e-05} +{"train_loss": 0.0006790809566155076, "global_step": 50934, "epoch": 428, "lr": 1.918686786227458e-05} +{"train_loss": 0.0009623332880437374, "global_step": 50935, "epoch": 428, "lr": 1.918512308851902e-05} +{"train_loss": 0.0007341656018979847, "global_step": 50936, "epoch": 428, "lr": 1.918337837526518e-05} +{"train_loss": 0.0013579793740063906, "global_step": 50937, "epoch": 428, "lr": 1.9181633722516468e-05} +{"train_loss": 0.0015100097516551614, "global_step": 50938, "epoch": 428, "lr": 1.917988913027634e-05} +{"train_loss": 0.0013267487520352006, "global_step": 50939, "epoch": 428, "lr": 1.9178144598548187e-05} +{"train_loss": 0.0014675385318696499, "global_step": 50940, "epoch": 428, "lr": 1.9176400127335474e-05} +{"train_loss": 0.000935328018385917, "global_step": 50941, "epoch": 428, "lr": 1.917465571664159e-05} +{"train_loss": 0.0007959824870340526, "global_step": 50942, "epoch": 428, "lr": 1.917291136646999e-05} +{"train_loss": 0.0013978072674944997, "global_step": 50943, "epoch": 428, "lr": 1.9171167076824093e-05} +{"train_loss": 0.0007437834283336997, "global_step": 50944, "epoch": 428, "lr": 1.9169422847707297e-05} +{"train_loss": 0.0008017610525712371, "global_step": 50945, "epoch": 428, "lr": 1.9167678679123058e-05} +{"train_loss": 0.0015183842042461038, "global_step": 50946, "epoch": 428, "lr": 1.9165934571074772e-05} +{"train_loss": 0.0009484232868999243, "global_step": 50947, "epoch": 428, "lr": 1.9164190523565896e-05} +{"train_loss": 0.0008580462890677154, "global_step": 50948, "epoch": 428, "lr": 1.916244653659982e-05} +{"train_loss": 0.001214205869473517, "global_step": 50949, "epoch": 428, "lr": 1.9160702610180004e-05} +{"train_loss": 0.0006773084751330316, "global_step": 50950, "epoch": 428, "lr": 1.9158958744309842e-05} +{"train_loss": 0.0009689618018455803, "global_step": 50951, "epoch": 428, "lr": 1.915721493899278e-05} +{"train_loss": 0.001010193140245974, "global_step": 50952, "epoch": 428, "lr": 1.9155471194232218e-05} +{"train_loss": 0.0005851290188729763, "global_step": 50953, "epoch": 428, "lr": 1.9153727510031605e-05} +{"train_loss": 0.001410283730365336, "global_step": 50954, "epoch": 428, "lr": 1.9151983886394337e-05} +{"train_loss": 0.0011346213286742568, "global_step": 50955, "epoch": 428, "lr": 1.9150240323323875e-05} +{"train_loss": 0.0009406207245774567, "global_step": 50956, "epoch": 428, "lr": 1.9148496820823597e-05} +{"train_loss": 0.0007211074116639793, "global_step": 50957, "epoch": 428, "lr": 1.914675337889697e-05} +{"train_loss": 0.0006061068852432072, "global_step": 50958, "epoch": 428, "lr": 1.914500999754738e-05} +{"train_loss": 0.0004981363308615983, "global_step": 50959, "epoch": 428, "lr": 1.9143266676778282e-05} +{"train_loss": 0.0016436275327578187, "global_step": 50960, "epoch": 428, "lr": 1.9141523416593066e-05} +{"train_loss": 0.0011455750791355968, "global_step": 50961, "epoch": 428, "lr": 1.913978021699519e-05} +{"train_loss": 0.000671000627335161, "global_step": 50962, "epoch": 428, "lr": 1.9138037077988058e-05} +{"train_loss": 0.0006244637188501656, "global_step": 50963, "epoch": 428, "lr": 1.913629399957508e-05} +{"train_loss": 0.0009120696340687573, "global_step": 50964, "epoch": 428, "lr": 1.9134550981759702e-05} +{"train_loss": 0.0011678223963826895, "global_step": 50965, "epoch": 428, "lr": 1.9132808024545324e-05} +{"train_loss": 0.0008574249804951251, "global_step": 50966, "epoch": 428, "lr": 1.9131065127935394e-05} +{"train_loss": 0.0005477085942402482, "global_step": 50967, "epoch": 428, "lr": 1.9129322291933304e-05} +{"train_loss": 0.0006298319203779101, "global_step": 50968, "epoch": 428, "lr": 1.9127579516542503e-05} +{"train_loss": 0.0006812017527408898, "global_step": 50969, "epoch": 428, "lr": 1.912583680176641e-05} +{"train_loss": 0.0008415190386585891, "global_step": 50970, "epoch": 428, "lr": 1.912409414760842e-05} +{"train_loss": 0.0004031364223919809, "global_step": 50971, "epoch": 428, "lr": 1.9122351554071984e-05} +{"train_loss": 0.0005064983270131052, "global_step": 50972, "epoch": 428, "lr": 1.9120609021160495e-05} +{"train_loss": 0.0008621248416602612, "global_step": 50973, "epoch": 428, "lr": 1.9118866548877412e-05} +{"train_loss": 0.0011505272705107927, "global_step": 50974, "epoch": 428, "lr": 1.9117124137226133e-05} +{"train_loss": 0.0008677885634824634, "global_step": 50975, "epoch": 428, "lr": 1.9115381786210067e-05} +{"train_loss": 0.0005602810997515917, "global_step": 50976, "epoch": 428, "lr": 1.911363949583267e-05} +{"train_loss": 0.00043278539669699967, "global_step": 50977, "epoch": 428, "lr": 1.9111897266097316e-05} +{"train_loss": 0.0008210462983697653, "global_step": 50978, "epoch": 428, "lr": 1.9110155097007477e-05} +{"train_loss": 0.0009026592597365379, "global_step": 50979, "epoch": 428, "lr": 1.9108412988566526e-05} +{"train_loss": 0.0008537915418855846, "global_step": 50980, "epoch": 428, "lr": 1.910667094077792e-05} +{"train_loss": 0.0009636594913899899, "global_step": 50981, "epoch": 428, "lr": 1.9104928953645075e-05} +{"train_loss": 0.0007554657640866935, "global_step": 50982, "epoch": 428, "lr": 1.9103187027171375e-05} +{"train_loss": 0.0007695152889937162, "global_step": 50983, "epoch": 428, "lr": 1.910144516136027e-05} +{"train_loss": 0.000602992600761354, "global_step": 50984, "epoch": 428, "lr": 1.9099703356215194e-05} +{"train_loss": 0.0006086343782953918, "global_step": 50985, "epoch": 428, "lr": 1.909796161173953e-05} +{"train_loss": 0.0008618426509201527, "global_step": 50986, "epoch": 428, "lr": 1.9096219927936737e-05} +{"train_loss": 0.0013054447481408715, "global_step": 50987, "epoch": 428, "lr": 1.9094478304810198e-05} +{"train_loss": 0.0010893228463828564, "global_step": 50988, "epoch": 428, "lr": 1.9092736742363364e-05} +{"train_loss": 0.0011811056174337864, "global_step": 50989, "epoch": 428, "lr": 1.9090995240599624e-05} +{"train_loss": 0.0004313944955356419, "global_step": 50990, "epoch": 428, "lr": 1.9089253799522427e-05} +{"train_loss": 0.0008062254055403173, "global_step": 50991, "epoch": 428, "lr": 1.908751241913516e-05} +{"train_loss": 0.0008295942679978907, "global_step": 50992, "epoch": 428, "lr": 1.908577109944128e-05} +{"train_loss": 0.0008252860861830413, "global_step": 50993, "epoch": 428, "lr": 1.9084029840444184e-05} +{"train_loss": 0.000774784421082586, "global_step": 50994, "epoch": 428, "lr": 1.9082288642147277e-05} +{"train_loss": 0.0008777747862040997, "global_step": 50995, "epoch": 428, "lr": 1.9080547504554013e-05} +{"train_loss": 0.0014214011607691646, "global_step": 50996, "epoch": 428, "lr": 1.9078806427667766e-05} +{"train_loss": 0.0010922827059403062, "global_step": 50997, "epoch": 428, "lr": 1.9077065411492002e-05} +{"train_loss": 0.0012564403004944324, "global_step": 50998, "epoch": 428, "lr": 1.9075324456030097e-05} +{"train_loss": 0.0011446344433352351, "global_step": 50999, "epoch": 428, "lr": 1.907358356128551e-05} +{"train_loss": 0.0005241259350441396, "global_step": 51000, "epoch": 428, "lr": 1.9071842727261636e-05} +{"train_loss": 0.0005904001300223172, "global_step": 51001, "epoch": 428, "lr": 1.9070101953961873e-05} +{"train_loss": 0.0009212506120093167, "global_step": 51002, "epoch": 428, "lr": 1.906836124138968e-05} +{"train_loss": 0.0006899281870573759, "global_step": 51003, "epoch": 428, "lr": 1.906662058954844e-05} +{"train_loss": 0.001626321580260992, "global_step": 51004, "epoch": 428, "lr": 1.9064879998441598e-05} +{"train_loss": 0.0007003759383223951, "global_step": 51005, "epoch": 428, "lr": 1.9063139468072565e-05} +{"train_loss": 0.0006892821402288973, "global_step": 51006, "epoch": 428, "lr": 1.906139899844473e-05} +{"train_loss": 0.0019212592160329223, "global_step": 51007, "epoch": 428, "lr": 1.9059658589561557e-05} +{"train_loss": 0.000602112035267055, "global_step": 51008, "epoch": 428, "lr": 1.9057918241426415e-05} +{"train_loss": 0.0006078698206692934, "global_step": 51009, "epoch": 428, "lr": 1.9056177954042766e-05} +{"train_loss": 0.0006439354619942605, "global_step": 51010, "epoch": 428, "lr": 1.905443772741399e-05} +{"train_loss": 0.0012203423539176583, "global_step": 51011, "epoch": 428, "lr": 1.905269756154353e-05} +{"train_loss": 0.0005821635131724179, "global_step": 51012, "epoch": 428, "lr": 1.9050957456434796e-05} +{"train_loss": 0.0006440931465476751, "global_step": 51013, "epoch": 428, "lr": 1.9049217412091182e-05} +{"train_loss": 0.0007335337577387691, "global_step": 51014, "epoch": 428, "lr": 1.904747742851614e-05} +{"train_loss": 0.0010675740195438266, "global_step": 51015, "epoch": 428, "lr": 1.9045737505713057e-05} +{"train_loss": 0.0006284731207415462, "global_step": 51016, "epoch": 428, "lr": 1.9043997643685373e-05} +{"train_loss": 0.0008155083633027971, "global_step": 51017, "epoch": 428, "lr": 1.9042257842436477e-05} +{"train_loss": 0.0008980847778730094, "global_step": 51018, "epoch": 428, "lr": 1.90405181019698e-05} +{"train_loss": 0.0008536347304470837, "global_step": 51019, "epoch": 428, "lr": 1.903877842228878e-05} +{"train_loss": 0.0012570933904498816, "global_step": 51020, "epoch": 428, "lr": 1.903703880339679e-05} +{"train_loss": 0.000595290504861623, "global_step": 51021, "epoch": 428, "lr": 1.9035299245297283e-05} +{"train_loss": 0.0014751312555745244, "global_step": 51022, "epoch": 428, "lr": 1.903355974799364e-05} +{"train_loss": 0.0006162876961752772, "global_step": 51023, "epoch": 428, "lr": 1.9031820311489313e-05} +{"train_loss": 0.00033093217643909156, "global_step": 51024, "epoch": 428, "lr": 1.9030080935787697e-05} +{"train_loss": 0.0007289108471013606, "global_step": 51025, "epoch": 428, "lr": 1.9028341620892194e-05} +{"train_loss": 0.0012207487598061562, "global_step": 51026, "epoch": 428, "lr": 1.9026602366806246e-05} +{"train_loss": 0.0017030499875545502, "global_step": 51027, "epoch": 428, "lr": 1.9024863173533243e-05} +{"train_loss": 0.0008717217715457082, "global_step": 51028, "epoch": 428, "lr": 1.9023124041076622e-05} +{"train_loss": 0.0015631492715328932, "global_step": 51029, "epoch": 428, "lr": 1.9021384969439776e-05} +{"train_loss": 0.0007628396851941943, "global_step": 51030, "epoch": 428, "lr": 1.9019645958626146e-05} +{"train_loss": 0.0008522931020706892, "global_step": 51031, "epoch": 428, "lr": 1.9017907008639135e-05} +{"train_loss": 0.0010420128237456083, "global_step": 51032, "epoch": 428, "lr": 1.9016168119482137e-05} +{"train_loss": 0.0018738474464043975, "global_step": 51033, "epoch": 428, "lr": 1.90144292911586e-05} +{"train_loss": 0.001052135950885713, "global_step": 51034, "epoch": 428, "lr": 1.9012690523671893e-05} +{"train_loss": 0.0007673344807699323, "global_step": 51035, "epoch": 428, "lr": 1.9010951817025484e-05} +{"train_loss": 0.001382337766699493, "global_step": 51036, "epoch": 428, "lr": 1.9009213171222746e-05} +{"train_loss": 0.0005183719913475215, "global_step": 51037, "epoch": 428, "lr": 1.9007474586267115e-05} +{"train_loss": 0.0004187033628113568, "global_step": 51038, "epoch": 428, "lr": 1.9005736062162005e-05} +{"train_loss": 0.001178272650577128, "global_step": 51039, "epoch": 428, "lr": 1.90039975989108e-05} +{"train_loss": 0.0011576475808396935, "global_step": 51040, "epoch": 428, "lr": 1.9002259196516953e-05} +{"train_loss": 0.0006471797241829336, "global_step": 51041, "epoch": 428, "lr": 1.900052085498384e-05} +{"train_loss": 0.0007837967132218182, "global_step": 51042, "epoch": 428, "lr": 1.899878257431491e-05} +{"train_loss": 0.0005572584341280162, "global_step": 51043, "epoch": 428, "lr": 1.899704435451356e-05} +{"train_loss": 0.0006203072261996567, "global_step": 51044, "epoch": 428, "lr": 1.8995306195583178e-05} +{"train_loss": 0.0005534541560336947, "global_step": 51045, "epoch": 428, "lr": 1.8993568097527224e-05} +{"train_loss": 0.001595007604919374, "global_step": 51046, "epoch": 428, "lr": 1.8991830060349063e-05} +{"train_loss": 0.0008911495679058135, "global_step": 51047, "epoch": 428, "lr": 1.899009208405215e-05} +{"train_loss": 0.001684992341324687, "global_step": 51048, "epoch": 428, "lr": 1.8988354168639866e-05} +{"train_loss": 0.000678449054248631, "global_step": 51049, "epoch": 428, "lr": 1.8986616314115652e-05} +{"train_loss": 0.0009264355146780046, "global_step": 51050, "epoch": 428, "lr": 1.8984878520482886e-05, "val_loss": 0.030110685154795647} +{"train_loss": 0.0008728321408852935, "global_step": 51051, "epoch": 429, "lr": 1.8983140787745012e-05} +{"train_loss": 0.0011733885621652007, "global_step": 51052, "epoch": 429, "lr": 1.898140311590541e-05} +{"train_loss": 0.000582988141104579, "global_step": 51053, "epoch": 429, "lr": 1.897966550496751e-05} +{"train_loss": 0.0011471484322100878, "global_step": 51054, "epoch": 429, "lr": 1.8977927954934737e-05} +{"train_loss": 0.0012428141199052334, "global_step": 51055, "epoch": 429, "lr": 1.8976190465810478e-05} +{"train_loss": 0.0004426462692208588, "global_step": 51056, "epoch": 429, "lr": 1.8974453037598167e-05} +{"train_loss": 0.001063237083144486, "global_step": 51057, "epoch": 429, "lr": 1.8972715670301207e-05} +{"train_loss": 0.0006711958558298647, "global_step": 51058, "epoch": 429, "lr": 1.897097836392298e-05} +{"train_loss": 0.000775064923800528, "global_step": 51059, "epoch": 429, "lr": 1.8969241118466946e-05} +{"train_loss": 0.0007262391154654324, "global_step": 51060, "epoch": 429, "lr": 1.896750393393647e-05} +{"train_loss": 0.001393610960803926, "global_step": 51061, "epoch": 429, "lr": 1.8965766810335005e-05} +{"train_loss": 0.0010083102388307452, "global_step": 51062, "epoch": 429, "lr": 1.896402974766594e-05} +{"train_loss": 0.0010303979506716132, "global_step": 51063, "epoch": 429, "lr": 1.8962292745932668e-05} +{"train_loss": 0.0006622516666539013, "global_step": 51064, "epoch": 429, "lr": 1.896055580513864e-05} +{"train_loss": 0.0008382794912904501, "global_step": 51065, "epoch": 429, "lr": 1.8958818925287226e-05} +{"train_loss": 0.0010611715260893106, "global_step": 51066, "epoch": 429, "lr": 1.8957082106381872e-05} +{"train_loss": 0.0002868917945306748, "global_step": 51067, "epoch": 429, "lr": 1.895534534842595e-05} +{"train_loss": 0.0009280737722292542, "global_step": 51068, "epoch": 429, "lr": 1.8953608651422915e-05} +{"train_loss": 0.0007821241742931306, "global_step": 51069, "epoch": 429, "lr": 1.895187201537615e-05} +{"train_loss": 0.0008923318819142878, "global_step": 51070, "epoch": 429, "lr": 1.8950135440289046e-05} +{"train_loss": 0.0005210306844674051, "global_step": 51071, "epoch": 429, "lr": 1.8948398926165056e-05} +{"train_loss": 0.0011480484390631318, "global_step": 51072, "epoch": 429, "lr": 1.8946662473007547e-05} +{"train_loss": 0.0005074182408861816, "global_step": 51073, "epoch": 429, "lr": 1.8944926080819964e-05} +{"train_loss": 0.00044523068936541677, "global_step": 51074, "epoch": 429, "lr": 1.8943189749605705e-05} +{"train_loss": 0.0006435620598495007, "global_step": 51075, "epoch": 429, "lr": 1.8941453479368155e-05} +{"train_loss": 0.0005865970742888749, "global_step": 51076, "epoch": 429, "lr": 1.8939717270110764e-05} +{"train_loss": 0.0012343967100605369, "global_step": 51077, "epoch": 429, "lr": 1.89379811218369e-05} +{"train_loss": 0.0019036850426346064, "global_step": 51078, "epoch": 429, "lr": 1.893624503455001e-05} +{"train_loss": 0.000541305635124445, "global_step": 51079, "epoch": 429, "lr": 1.8934509008253466e-05} +{"train_loss": 0.0006383787258528173, "global_step": 51080, "epoch": 429, "lr": 1.893277304295071e-05} +{"train_loss": 0.0009667414706200361, "global_step": 51081, "epoch": 429, "lr": 1.8931037138645118e-05} +{"train_loss": 0.0017562522552907467, "global_step": 51082, "epoch": 429, "lr": 1.8929301295340136e-05} +{"train_loss": 0.0008919706451706588, "global_step": 51083, "epoch": 429, "lr": 1.892756551303913e-05} +{"train_loss": 0.0005516941309906542, "global_step": 51084, "epoch": 429, "lr": 1.8925829791745552e-05} +{"train_loss": 0.00048093526856973767, "global_step": 51085, "epoch": 429, "lr": 1.8924094131462767e-05} +{"train_loss": 0.0004090672009624541, "global_step": 51086, "epoch": 429, "lr": 1.892235853219422e-05} +{"train_loss": 0.000750515318941325, "global_step": 51087, "epoch": 429, "lr": 1.8920622993943287e-05} +{"train_loss": 0.0008005283307284117, "global_step": 51088, "epoch": 429, "lr": 1.891888751671341e-05} +{"train_loss": 0.0008636676939204335, "global_step": 51089, "epoch": 429, "lr": 1.891715210050795e-05} +{"train_loss": 0.0009191095014102757, "global_step": 51090, "epoch": 429, "lr": 1.8915416745330368e-05} +{"train_loss": 0.0007365570636466146, "global_step": 51091, "epoch": 429, "lr": 1.8913681451184022e-05} +{"train_loss": 0.0006296400679275393, "global_step": 51092, "epoch": 429, "lr": 1.8911946218072363e-05} +{"train_loss": 0.0005109020858071744, "global_step": 51093, "epoch": 429, "lr": 1.8910211045998772e-05} +{"train_loss": 0.0016858649905771017, "global_step": 51094, "epoch": 429, "lr": 1.890847593496664e-05} +{"train_loss": 0.0009416928514838219, "global_step": 51095, "epoch": 429, "lr": 1.890674088497942e-05} +{"train_loss": 0.0005132269579917192, "global_step": 51096, "epoch": 429, "lr": 1.8905005896040467e-05} +{"train_loss": 0.0013842176413163543, "global_step": 51097, "epoch": 429, "lr": 1.8903270968153235e-05} +{"train_loss": 0.0008944808505475521, "global_step": 51098, "epoch": 429, "lr": 1.890153610132109e-05} +{"train_loss": 0.0011155912652611732, "global_step": 51099, "epoch": 429, "lr": 1.8899801295547476e-05} +{"train_loss": 0.0006830070051364601, "global_step": 51100, "epoch": 429, "lr": 1.8898066550835776e-05} +{"train_loss": 0.0007587881991639733, "global_step": 51101, "epoch": 429, "lr": 1.8896331867189382e-05} +{"train_loss": 0.0026371756102889776, "global_step": 51102, "epoch": 429, "lr": 1.8894597244611733e-05} +{"train_loss": 0.0006886707851663232, "global_step": 51103, "epoch": 429, "lr": 1.8892862683106206e-05} +{"train_loss": 0.0012268621940165758, "global_step": 51104, "epoch": 429, "lr": 1.8891128182676237e-05} +{"train_loss": 0.00023455523478332907, "global_step": 51105, "epoch": 429, "lr": 1.8889393743325194e-05} +{"train_loss": 0.0004565741401165724, "global_step": 51106, "epoch": 429, "lr": 1.8887659365056526e-05} +{"train_loss": 0.0006849508499726653, "global_step": 51107, "epoch": 429, "lr": 1.888592504787361e-05} +{"train_loss": 0.001179786748252809, "global_step": 51108, "epoch": 429, "lr": 1.8884190791779837e-05} +{"train_loss": 0.0005188779905438423, "global_step": 51109, "epoch": 429, "lr": 1.8882456596778653e-05} +{"train_loss": 0.0007555870688520372, "global_step": 51110, "epoch": 429, "lr": 1.8880722462873423e-05} +{"train_loss": 0.0006231433944776654, "global_step": 51111, "epoch": 429, "lr": 1.8878988390067587e-05} +{"train_loss": 0.001221368322148919, "global_step": 51112, "epoch": 429, "lr": 1.887725437836453e-05} +{"train_loss": 0.000855836144182831, "global_step": 51113, "epoch": 429, "lr": 1.8875520427767644e-05} +{"train_loss": 0.0010527835693210363, "global_step": 51114, "epoch": 429, "lr": 1.8873786538280348e-05} +{"train_loss": 0.0008030807948671281, "global_step": 51115, "epoch": 429, "lr": 1.8872052709906062e-05} +{"train_loss": 0.0006607171380892396, "global_step": 51116, "epoch": 429, "lr": 1.887031894264816e-05} +{"train_loss": 0.0007485813111998141, "global_step": 51117, "epoch": 429, "lr": 1.8868585236510078e-05} +{"train_loss": 0.0009042666060850024, "global_step": 51118, "epoch": 429, "lr": 1.886685159149519e-05} +{"train_loss": 0.0005230683600530028, "global_step": 51119, "epoch": 429, "lr": 1.8865118007606924e-05} +{"train_loss": 0.0004501711227931082, "global_step": 51120, "epoch": 429, "lr": 1.8863384484848655e-05} +{"train_loss": 0.0007684872252866626, "global_step": 51121, "epoch": 429, "lr": 1.8861651023223826e-05} +{"train_loss": 0.0007256051758304238, "global_step": 51122, "epoch": 429, "lr": 1.8859917622735796e-05} +{"train_loss": 0.0008612179080955684, "global_step": 51123, "epoch": 429, "lr": 1.8858184283388013e-05} +{"train_loss": 0.0007374587003141642, "global_step": 51124, "epoch": 429, "lr": 1.8856451005183856e-05} +{"train_loss": 0.0009017880074679852, "global_step": 51125, "epoch": 429, "lr": 1.8854717788126713e-05} +{"train_loss": 0.0006787523743696511, "global_step": 51126, "epoch": 429, "lr": 1.8852984632220022e-05} +{"train_loss": 0.0008186163031496108, "global_step": 51127, "epoch": 429, "lr": 1.8851251537467145e-05} +{"train_loss": 0.0008730305125936866, "global_step": 51128, "epoch": 429, "lr": 1.8849518503871534e-05} +{"train_loss": 0.000730007654055953, "global_step": 51129, "epoch": 429, "lr": 1.8847785531436547e-05} +{"train_loss": 0.00041582639096304774, "global_step": 51130, "epoch": 429, "lr": 1.8846052620165616e-05} +{"train_loss": 0.0008822213858366013, "global_step": 51131, "epoch": 429, "lr": 1.8844319770062142e-05} +{"train_loss": 0.0004155034839641303, "global_step": 51132, "epoch": 429, "lr": 1.884258698112949e-05} +{"train_loss": 0.0007036744500510395, "global_step": 51133, "epoch": 429, "lr": 1.8840854253371114e-05} +{"train_loss": 0.0019990878645330667, "global_step": 51134, "epoch": 429, "lr": 1.883912158679037e-05} +{"train_loss": 0.000594781362451613, "global_step": 51135, "epoch": 429, "lr": 1.8837388981390703e-05} +{"train_loss": 0.001316202338784933, "global_step": 51136, "epoch": 429, "lr": 1.8835656437175476e-05} +{"train_loss": 0.0005824238178320229, "global_step": 51137, "epoch": 429, "lr": 1.883392395414812e-05} +{"train_loss": 0.0013801159802824259, "global_step": 51138, "epoch": 429, "lr": 1.8832191532312033e-05} +{"train_loss": 0.001305204234085977, "global_step": 51139, "epoch": 429, "lr": 1.8830459171670583e-05} +{"train_loss": 0.0010501580545678735, "global_step": 51140, "epoch": 429, "lr": 1.882872687222722e-05} +{"train_loss": 0.00039125062176026404, "global_step": 51141, "epoch": 429, "lr": 1.88269946339853e-05} +{"train_loss": 0.00035012204898521304, "global_step": 51142, "epoch": 429, "lr": 1.8825262456948268e-05} +{"train_loss": 0.0007981077651493251, "global_step": 51143, "epoch": 429, "lr": 1.8823530341119493e-05} +{"train_loss": 0.0006518197478726506, "global_step": 51144, "epoch": 429, "lr": 1.882179828650238e-05} +{"train_loss": 0.0004867904935963452, "global_step": 51145, "epoch": 429, "lr": 1.8820066293100345e-05} +{"train_loss": 0.0009872163645923138, "global_step": 51146, "epoch": 429, "lr": 1.8818334360916763e-05} +{"train_loss": 0.0016428525559604168, "global_step": 51147, "epoch": 429, "lr": 1.8816602489955066e-05} +{"train_loss": 0.000526556046679616, "global_step": 51148, "epoch": 429, "lr": 1.8814870680218627e-05} +{"train_loss": 0.0005337955080904067, "global_step": 51149, "epoch": 429, "lr": 1.881313893171085e-05} +{"train_loss": 0.0008928300812840462, "global_step": 51150, "epoch": 429, "lr": 1.8811407244435165e-05} +{"train_loss": 0.0007859041797928512, "global_step": 51151, "epoch": 429, "lr": 1.8809675618394935e-05} +{"train_loss": 0.000747902609873563, "global_step": 51152, "epoch": 429, "lr": 1.8807944053593584e-05} +{"train_loss": 0.0005408236756920815, "global_step": 51153, "epoch": 429, "lr": 1.880621255003449e-05} +{"train_loss": 0.0007781149470247328, "global_step": 51154, "epoch": 429, "lr": 1.8804481107721084e-05} +{"train_loss": 0.0006825461168773472, "global_step": 51155, "epoch": 429, "lr": 1.8802749726656727e-05} +{"train_loss": 0.0008914695936255157, "global_step": 51156, "epoch": 429, "lr": 1.8801018406844857e-05} +{"train_loss": 0.0006280415691435337, "global_step": 51157, "epoch": 429, "lr": 1.879928714828885e-05} +{"train_loss": 0.0006554360152222216, "global_step": 51158, "epoch": 429, "lr": 1.8797555950992097e-05} +{"train_loss": 0.0006342334672808647, "global_step": 51159, "epoch": 429, "lr": 1.8795824814958025e-05} +{"train_loss": 0.0017395960167050362, "global_step": 51160, "epoch": 429, "lr": 1.879409374019e-05} +{"train_loss": 0.0011680475436151028, "global_step": 51161, "epoch": 429, "lr": 1.8792362726691455e-05} +{"train_loss": 0.0006092164549045265, "global_step": 51162, "epoch": 429, "lr": 1.8790631774465772e-05} +{"train_loss": 0.0005961178685538471, "global_step": 51163, "epoch": 429, "lr": 1.878890088351633e-05} +{"train_loss": 0.0004997688811272383, "global_step": 51164, "epoch": 429, "lr": 1.8787170053846565e-05} +{"train_loss": 0.0006495195557363331, "global_step": 51165, "epoch": 429, "lr": 1.8785439285459842e-05} +{"train_loss": 0.0010552656603977084, "global_step": 51166, "epoch": 429, "lr": 1.8783708578359588e-05} +{"train_loss": 0.0007931768777780235, "global_step": 51167, "epoch": 429, "lr": 1.878197793254917e-05} +{"train_loss": 0.0007450805860571563, "global_step": 51168, "epoch": 429, "lr": 1.8780247348032027e-05} +{"train_loss": 0.0008407520073291869, "global_step": 51169, "epoch": 429, "lr": 1.8778516824811526e-05, "val_loss": 0.019807368516921997} +{"train_loss": 0.0005524693406186998, "global_step": 51170, "epoch": 430, "lr": 1.8776786362891057e-05} +{"train_loss": 0.0008170433575287461, "global_step": 51171, "epoch": 430, "lr": 1.8775055962274053e-05} +{"train_loss": 0.0005465211579576135, "global_step": 51172, "epoch": 430, "lr": 1.8773325622963866e-05} +{"train_loss": 0.0009062878089025617, "global_step": 51173, "epoch": 430, "lr": 1.8771595344963944e-05} +{"train_loss": 0.0008466330473311245, "global_step": 51174, "epoch": 430, "lr": 1.8769865128277636e-05} +{"train_loss": 0.001218221615999937, "global_step": 51175, "epoch": 430, "lr": 1.8768134972908376e-05} +{"train_loss": 0.0008714800351299345, "global_step": 51176, "epoch": 430, "lr": 1.876640487885955e-05} +{"train_loss": 0.0008456538198515773, "global_step": 51177, "epoch": 430, "lr": 1.8764674846134532e-05} +{"train_loss": 0.0006142406491562724, "global_step": 51178, "epoch": 430, "lr": 1.876294487473676e-05} +{"train_loss": 0.0004989773733541369, "global_step": 51179, "epoch": 430, "lr": 1.8761214964669582e-05} +{"train_loss": 0.0016985677648335695, "global_step": 51180, "epoch": 430, "lr": 1.8759485115936447e-05} +{"train_loss": 0.001513528055511415, "global_step": 51181, "epoch": 430, "lr": 1.8757755328540704e-05} +{"train_loss": 0.00029983074637129903, "global_step": 51182, "epoch": 430, "lr": 1.8756025602485787e-05} +{"train_loss": 0.0007991077727638185, "global_step": 51183, "epoch": 430, "lr": 1.8754295937775062e-05} +{"train_loss": 0.0004860689223278314, "global_step": 51184, "epoch": 430, "lr": 1.875256633441196e-05} +{"train_loss": 0.0014111417112872005, "global_step": 51185, "epoch": 430, "lr": 1.875083679239983e-05} +{"train_loss": 0.0008069117902778089, "global_step": 51186, "epoch": 430, "lr": 1.8749107311742096e-05} +{"train_loss": 0.0009242835221812129, "global_step": 51187, "epoch": 430, "lr": 1.874737789244217e-05} +{"train_loss": 0.0011957361130043864, "global_step": 51188, "epoch": 430, "lr": 1.8745648534503425e-05} +{"train_loss": 0.0006449948996305466, "global_step": 51189, "epoch": 430, "lr": 1.8743919237929248e-05} +{"train_loss": 0.001523494254797697, "global_step": 51190, "epoch": 430, "lr": 1.874219000272306e-05} +{"train_loss": 0.0006416192045435309, "global_step": 51191, "epoch": 430, "lr": 1.8740460828888223e-05} +{"train_loss": 0.0004859110922552645, "global_step": 51192, "epoch": 430, "lr": 1.8738731716428177e-05} +{"train_loss": 0.0011165037285536528, "global_step": 51193, "epoch": 430, "lr": 1.8737002665346287e-05} +{"train_loss": 0.0009670707513578236, "global_step": 51194, "epoch": 430, "lr": 1.873527367564593e-05} +{"train_loss": 0.0008287749369628727, "global_step": 51195, "epoch": 430, "lr": 1.8733544747330545e-05} +{"train_loss": 0.000860123080201447, "global_step": 51196, "epoch": 430, "lr": 1.873181588040349e-05} +{"train_loss": 0.0009403515723533928, "global_step": 51197, "epoch": 430, "lr": 1.8730087074868185e-05} +{"train_loss": 0.0006562984199263155, "global_step": 51198, "epoch": 430, "lr": 1.8728358330728002e-05} +{"train_loss": 0.00042361736996099353, "global_step": 51199, "epoch": 430, "lr": 1.872662964798636e-05} +{"train_loss": 0.0010798336006700993, "global_step": 51200, "epoch": 430, "lr": 1.872490102664664e-05} +{"train_loss": 0.001447894494049251, "global_step": 51201, "epoch": 430, "lr": 1.8723172466712224e-05} +{"train_loss": 0.0009785759029909968, "global_step": 51202, "epoch": 430, "lr": 1.8721443968186524e-05} +{"train_loss": 0.0006306840223260224, "global_step": 51203, "epoch": 430, "lr": 1.8719715531072918e-05} +{"train_loss": 0.0005198921426199377, "global_step": 51204, "epoch": 430, "lr": 1.871798715537483e-05} +{"train_loss": 0.0006029847427271307, "global_step": 51205, "epoch": 430, "lr": 1.8716258841095603e-05} +{"train_loss": 0.001075667212717235, "global_step": 51206, "epoch": 430, "lr": 1.8714530588238683e-05} +{"train_loss": 0.0005066664307378232, "global_step": 51207, "epoch": 430, "lr": 1.8712802396807438e-05} +{"train_loss": 0.0009101255564019084, "global_step": 51208, "epoch": 430, "lr": 1.871107426680525e-05} +{"train_loss": 0.0006232658633962274, "global_step": 51209, "epoch": 430, "lr": 1.870934619823554e-05} +{"train_loss": 0.0009039817377924919, "global_step": 51210, "epoch": 430, "lr": 1.8707618191101668e-05} +{"train_loss": 0.0006071394309401512, "global_step": 51211, "epoch": 430, "lr": 1.870589024540706e-05} +{"train_loss": 0.0008377584745176136, "global_step": 51212, "epoch": 430, "lr": 1.870416236115508e-05} +{"train_loss": 0.001083380077034235, "global_step": 51213, "epoch": 430, "lr": 1.8702434538349146e-05} +{"train_loss": 0.0011399356881156564, "global_step": 51214, "epoch": 430, "lr": 1.8700706776992628e-05} +{"train_loss": 0.0007293982780538499, "global_step": 51215, "epoch": 430, "lr": 1.869897907708894e-05} +{"train_loss": 0.0008410828304477036, "global_step": 51216, "epoch": 430, "lr": 1.8697251438641444e-05} +{"train_loss": 0.000885080429725349, "global_step": 51217, "epoch": 430, "lr": 1.869552386165357e-05} +{"train_loss": 0.0010103946551680565, "global_step": 51218, "epoch": 430, "lr": 1.8693796346128673e-05} +{"train_loss": 0.00046151745482347906, "global_step": 51219, "epoch": 430, "lr": 1.869206889207018e-05} +{"train_loss": 0.0007334190304391086, "global_step": 51220, "epoch": 430, "lr": 1.869034149948145e-05} +{"train_loss": 0.0007829631795175374, "global_step": 51221, "epoch": 430, "lr": 1.8688614168365902e-05} +{"train_loss": 0.0011660433374345303, "global_step": 51222, "epoch": 430, "lr": 1.86868868987269e-05} +{"train_loss": 0.0008585180039517581, "global_step": 51223, "epoch": 430, "lr": 1.8685159690567872e-05} +{"train_loss": 0.000722824246622622, "global_step": 51224, "epoch": 430, "lr": 1.8683432543892167e-05} +{"train_loss": 0.0009642558288760483, "global_step": 51225, "epoch": 430, "lr": 1.8681705458703213e-05} +{"train_loss": 0.001434107543900609, "global_step": 51226, "epoch": 430, "lr": 1.867997843500438e-05} +{"train_loss": 0.0007674474618397653, "global_step": 51227, "epoch": 430, "lr": 1.8678251472799052e-05} +{"train_loss": 0.0008597516571171582, "global_step": 51228, "epoch": 430, "lr": 1.867652457209065e-05} +{"train_loss": 0.0007564548286609352, "global_step": 51229, "epoch": 430, "lr": 1.867479773288252e-05} +{"train_loss": 0.0007306354818865657, "global_step": 51230, "epoch": 430, "lr": 1.8673070955178103e-05} +{"train_loss": 0.0007591423927806318, "global_step": 51231, "epoch": 430, "lr": 1.8671344238980763e-05} +{"train_loss": 0.0008131553186103702, "global_step": 51232, "epoch": 430, "lr": 1.8669617584293876e-05} +{"train_loss": 0.0006213149754330516, "global_step": 51233, "epoch": 430, "lr": 1.8667890991120855e-05} +{"train_loss": 0.0011680286843329668, "global_step": 51234, "epoch": 430, "lr": 1.8666164459465073e-05} +{"train_loss": 0.00035465750261209905, "global_step": 51235, "epoch": 430, "lr": 1.8664437989329947e-05} +{"train_loss": 0.0009969600941985846, "global_step": 51236, "epoch": 430, "lr": 1.8662711580718833e-05} +{"train_loss": 0.0009703589603304863, "global_step": 51237, "epoch": 430, "lr": 1.8660985233635152e-05} +{"train_loss": 0.0009581684716977179, "global_step": 51238, "epoch": 430, "lr": 1.865925894808228e-05} +{"train_loss": 0.0006432257941924036, "global_step": 51239, "epoch": 430, "lr": 1.8657532724063587e-05} +{"train_loss": 0.0007067916449159384, "global_step": 51240, "epoch": 430, "lr": 1.8655806561582497e-05} +{"train_loss": 0.0005430844612419605, "global_step": 51241, "epoch": 430, "lr": 1.8654080460642365e-05} +{"train_loss": 0.0010460148332640529, "global_step": 51242, "epoch": 430, "lr": 1.8652354421246614e-05} +{"train_loss": 0.0011008259607478976, "global_step": 51243, "epoch": 430, "lr": 1.8650628443398614e-05} +{"train_loss": 0.0004953540628775954, "global_step": 51244, "epoch": 430, "lr": 1.864890252710174e-05} +{"train_loss": 0.0008625468472018838, "global_step": 51245, "epoch": 430, "lr": 1.8647176672359416e-05} +{"train_loss": 0.001279982621781528, "global_step": 51246, "epoch": 430, "lr": 1.864545087917499e-05} +{"train_loss": 0.0009399562259204686, "global_step": 51247, "epoch": 430, "lr": 1.8643725147551876e-05} +{"train_loss": 0.0011227099457755685, "global_step": 51248, "epoch": 430, "lr": 1.864199947749347e-05} +{"train_loss": 0.001371652469970286, "global_step": 51249, "epoch": 430, "lr": 1.864027386900314e-05} +{"train_loss": 0.0008917675004340708, "global_step": 51250, "epoch": 430, "lr": 1.8638548322084294e-05} +{"train_loss": 0.000529192853718996, "global_step": 51251, "epoch": 430, "lr": 1.8636822836740285e-05} +{"train_loss": 0.001012293854728341, "global_step": 51252, "epoch": 430, "lr": 1.8635097412974544e-05} +{"train_loss": 0.0005860136006958783, "global_step": 51253, "epoch": 430, "lr": 1.8633372050790427e-05} +{"train_loss": 0.00084808433894068, "global_step": 51254, "epoch": 430, "lr": 1.8631646750191344e-05} +{"train_loss": 0.0010399038437753916, "global_step": 51255, "epoch": 430, "lr": 1.8629921511180653e-05} +{"train_loss": 0.0011384121607989073, "global_step": 51256, "epoch": 430, "lr": 1.8628196333761784e-05} +{"train_loss": 0.0010017389431595802, "global_step": 51257, "epoch": 430, "lr": 1.862647121793809e-05} +{"train_loss": 0.0006095426506362855, "global_step": 51258, "epoch": 430, "lr": 1.862474616371296e-05} +{"train_loss": 0.001536638243123889, "global_step": 51259, "epoch": 430, "lr": 1.8623021171089798e-05} +{"train_loss": 0.0007535980548709631, "global_step": 51260, "epoch": 430, "lr": 1.8621296240071973e-05} +{"train_loss": 0.0007300712750293314, "global_step": 51261, "epoch": 430, "lr": 1.8619571370662893e-05} +{"train_loss": 0.0007039343472570181, "global_step": 51262, "epoch": 430, "lr": 1.8617846562865932e-05} +{"train_loss": 0.0007820792379789054, "global_step": 51263, "epoch": 430, "lr": 1.8616121816684462e-05} +{"train_loss": 0.001480798702687025, "global_step": 51264, "epoch": 430, "lr": 1.86143971321219e-05} +{"train_loss": 0.0008194891270250082, "global_step": 51265, "epoch": 430, "lr": 1.86126725091816e-05} +{"train_loss": 0.0009680129587650299, "global_step": 51266, "epoch": 430, "lr": 1.8610947947866982e-05} +{"train_loss": 0.001274524605832994, "global_step": 51267, "epoch": 430, "lr": 1.860922344818139e-05} +{"train_loss": 0.001340529415756464, "global_step": 51268, "epoch": 430, "lr": 1.860749901012826e-05} +{"train_loss": 0.0008810834842734039, "global_step": 51269, "epoch": 430, "lr": 1.8605774633710948e-05} +{"train_loss": 0.0011056492803618312, "global_step": 51270, "epoch": 430, "lr": 1.8604050318932825e-05} +{"train_loss": 0.00047673459630459547, "global_step": 51271, "epoch": 430, "lr": 1.8602326065797317e-05} +{"train_loss": 0.001620544702745974, "global_step": 51272, "epoch": 430, "lr": 1.8600601874307766e-05} +{"train_loss": 0.00096878845943138, "global_step": 51273, "epoch": 430, "lr": 1.8598877744467597e-05} +{"train_loss": 0.000903164385817945, "global_step": 51274, "epoch": 430, "lr": 1.8597153676280162e-05} +{"train_loss": 0.0010909491684287786, "global_step": 51275, "epoch": 430, "lr": 1.859542966974887e-05} +{"train_loss": 0.0005785573157481849, "global_step": 51276, "epoch": 430, "lr": 1.8593705724877103e-05} +{"train_loss": 0.0008557009277865291, "global_step": 51277, "epoch": 430, "lr": 1.8591981841668222e-05} +{"train_loss": 0.0006315039936453104, "global_step": 51278, "epoch": 430, "lr": 1.8590258020125644e-05} +{"train_loss": 0.0007041131611913443, "global_step": 51279, "epoch": 430, "lr": 1.8588534260252726e-05} +{"train_loss": 0.0009765769354999065, "global_step": 51280, "epoch": 430, "lr": 1.858681056205288e-05} +{"train_loss": 0.0014566644094884396, "global_step": 51281, "epoch": 430, "lr": 1.858508692552946e-05} +{"train_loss": 0.001051721628755331, "global_step": 51282, "epoch": 430, "lr": 1.858336335068586e-05} +{"train_loss": 0.0014690173557028174, "global_step": 51283, "epoch": 430, "lr": 1.8581639837525496e-05} +{"train_loss": 0.0010009710676968098, "global_step": 51284, "epoch": 430, "lr": 1.85799163860517e-05} +{"train_loss": 0.000586240435950458, "global_step": 51285, "epoch": 430, "lr": 1.85781929962679e-05} +{"train_loss": 0.000435137510066852, "global_step": 51286, "epoch": 430, "lr": 1.8576469668177447e-05} +{"train_loss": 0.0009173320140689611, "global_step": 51287, "epoch": 430, "lr": 1.8574746401783756e-05} +{"train_loss": 0.0008900990316393872, "global_step": 51288, "epoch": 430, "lr": 1.8573023197090194e-05, "val_loss": 0.021421490237116814, "train_action_mse_error": 8.779022209637333e-06} +{"train_loss": 0.0016262925928458571, "global_step": 51289, "epoch": 431, "lr": 1.8571300054100123e-05} +{"train_loss": 0.0009125311626121402, "global_step": 51290, "epoch": 431, "lr": 1.8569576972816964e-05} +{"train_loss": 0.0005359826027415693, "global_step": 51291, "epoch": 431, "lr": 1.856785395324407e-05} +{"train_loss": 0.0017026246059685946, "global_step": 51292, "epoch": 431, "lr": 1.856613099538485e-05} +{"train_loss": 0.0005732694990001619, "global_step": 51293, "epoch": 431, "lr": 1.8564408099242652e-05} +{"train_loss": 0.0010681188432499766, "global_step": 51294, "epoch": 431, "lr": 1.8562685264820907e-05} +{"train_loss": 0.000866011600010097, "global_step": 51295, "epoch": 431, "lr": 1.8560962492122964e-05} +{"train_loss": 0.001140911364927888, "global_step": 51296, "epoch": 431, "lr": 1.85592397811522e-05} +{"train_loss": 0.0011546977329999208, "global_step": 51297, "epoch": 431, "lr": 1.8557517131912022e-05} +{"train_loss": 0.001011543208733201, "global_step": 51298, "epoch": 431, "lr": 1.8555794544405785e-05} +{"train_loss": 0.0017006113193929195, "global_step": 51299, "epoch": 431, "lr": 1.8554072018636903e-05} +{"train_loss": 0.0007393386913463473, "global_step": 51300, "epoch": 431, "lr": 1.8552349554608743e-05} +{"train_loss": 0.0006701861275359988, "global_step": 51301, "epoch": 431, "lr": 1.8550627152324668e-05} +{"train_loss": 0.0007221478153951466, "global_step": 51302, "epoch": 431, "lr": 1.854890481178809e-05} +{"train_loss": 0.0010358800645917654, "global_step": 51303, "epoch": 431, "lr": 1.8547182533002365e-05} +{"train_loss": 0.0010358173167333007, "global_step": 51304, "epoch": 431, "lr": 1.8545460315970904e-05} +{"train_loss": 0.0006614265730604529, "global_step": 51305, "epoch": 431, "lr": 1.854373816069705e-05} +{"train_loss": 0.0012365367729216814, "global_step": 51306, "epoch": 431, "lr": 1.854201606718422e-05} +{"train_loss": 0.0008190549560822546, "global_step": 51307, "epoch": 431, "lr": 1.8540294035435786e-05} +{"train_loss": 0.0012935306876897812, "global_step": 51308, "epoch": 431, "lr": 1.8538572065455107e-05} +{"train_loss": 0.0012474119430407882, "global_step": 51309, "epoch": 431, "lr": 1.8536850157245594e-05} +{"train_loss": 0.0009194531594403088, "global_step": 51310, "epoch": 431, "lr": 1.85351283108106e-05} +{"train_loss": 0.0006840751157142222, "global_step": 51311, "epoch": 431, "lr": 1.8533406526153534e-05} +{"train_loss": 0.0007955717155709863, "global_step": 51312, "epoch": 431, "lr": 1.853168480327775e-05} +{"train_loss": 0.001231308444403112, "global_step": 51313, "epoch": 431, "lr": 1.8529963142186656e-05} +{"train_loss": 0.0008753496804274619, "global_step": 51314, "epoch": 431, "lr": 1.85282415428836e-05} +{"train_loss": 0.0005474485806189477, "global_step": 51315, "epoch": 431, "lr": 1.8526520005372e-05} +{"train_loss": 0.0007075938046909869, "global_step": 51316, "epoch": 431, "lr": 1.8524798529655198e-05} +{"train_loss": 0.0007185140275396407, "global_step": 51317, "epoch": 431, "lr": 1.8523077115736586e-05} +{"train_loss": 0.0007512716110795736, "global_step": 51318, "epoch": 431, "lr": 1.8521355763619567e-05} +{"train_loss": 0.000857686682138592, "global_step": 51319, "epoch": 431, "lr": 1.8519634473307507e-05} +{"train_loss": 0.0007293774979189038, "global_step": 51320, "epoch": 431, "lr": 1.8517913244803763e-05} +{"train_loss": 0.0012893788516521454, "global_step": 51321, "epoch": 431, "lr": 1.851619207811175e-05} +{"train_loss": 0.0005987021140754223, "global_step": 51322, "epoch": 431, "lr": 1.851447097323481e-05} +{"train_loss": 0.0010828380472958088, "global_step": 51323, "epoch": 431, "lr": 1.8512749930176364e-05} +{"train_loss": 0.0008579202694818377, "global_step": 51324, "epoch": 431, "lr": 1.851102894893975e-05} +{"train_loss": 0.0005179020809009671, "global_step": 51325, "epoch": 431, "lr": 1.8509308029528383e-05} +{"train_loss": 0.0011565969325602055, "global_step": 51326, "epoch": 431, "lr": 1.8507587171945628e-05} +{"train_loss": 0.0003959422174375504, "global_step": 51327, "epoch": 431, "lr": 1.8505866376194846e-05} +{"train_loss": 0.0003651607839856297, "global_step": 51328, "epoch": 431, "lr": 1.850414564227944e-05} +{"train_loss": 0.0011485794093459845, "global_step": 51329, "epoch": 431, "lr": 1.850242497020277e-05} +{"train_loss": 0.0005192166427150369, "global_step": 51330, "epoch": 431, "lr": 1.8500704359968235e-05} +{"train_loss": 0.0008933457429520786, "global_step": 51331, "epoch": 431, "lr": 1.8498983811579208e-05} +{"train_loss": 0.0005744636291638017, "global_step": 51332, "epoch": 431, "lr": 1.849726332503904e-05} +{"train_loss": 0.0006844071904197335, "global_step": 51333, "epoch": 431, "lr": 1.8495542900351148e-05} +{"train_loss": 0.0010007828241214156, "global_step": 51334, "epoch": 431, "lr": 1.8493822537518874e-05} +{"train_loss": 0.0006910223164595664, "global_step": 51335, "epoch": 431, "lr": 1.8492102236545627e-05} +{"train_loss": 0.0004172132757958025, "global_step": 51336, "epoch": 431, "lr": 1.8490381997434756e-05} +{"train_loss": 0.0008052291814237833, "global_step": 51337, "epoch": 431, "lr": 1.8488661820189675e-05} +{"train_loss": 0.0005526866880245507, "global_step": 51338, "epoch": 431, "lr": 1.8486941704813737e-05} +{"train_loss": 0.0015657524345442653, "global_step": 51339, "epoch": 431, "lr": 1.848522165131031e-05} +{"train_loss": 0.0007900199270807207, "global_step": 51340, "epoch": 431, "lr": 1.8483501659682788e-05} +{"train_loss": 0.0009198146872222424, "global_step": 51341, "epoch": 431, "lr": 1.848178172993454e-05} +{"train_loss": 0.0009220990468747914, "global_step": 51342, "epoch": 431, "lr": 1.8480061862068954e-05} +{"train_loss": 0.0008964758599177003, "global_step": 51343, "epoch": 431, "lr": 1.8478342056089387e-05} +{"train_loss": 0.0005121334688737988, "global_step": 51344, "epoch": 431, "lr": 1.8476622311999242e-05} +{"train_loss": 0.001451768446713686, "global_step": 51345, "epoch": 431, "lr": 1.8474902629801865e-05} +{"train_loss": 0.0008463316480629146, "global_step": 51346, "epoch": 431, "lr": 1.8473183009500672e-05} +{"train_loss": 0.0005182040622457862, "global_step": 51347, "epoch": 431, "lr": 1.847146345109899e-05} +{"train_loss": 0.0007083977689035237, "global_step": 51348, "epoch": 431, "lr": 1.8469743954600244e-05} +{"train_loss": 0.0010599041124805808, "global_step": 51349, "epoch": 431, "lr": 1.8468024520007766e-05} +{"train_loss": 0.0012936270795762539, "global_step": 51350, "epoch": 431, "lr": 1.8466305147324976e-05} +{"train_loss": 0.0006683241226710379, "global_step": 51351, "epoch": 431, "lr": 1.8464585836555202e-05} +{"train_loss": 0.00092030392261222, "global_step": 51352, "epoch": 431, "lr": 1.8462866587701867e-05} +{"train_loss": 0.0008473534835502505, "global_step": 51353, "epoch": 431, "lr": 1.846114740076831e-05} +{"train_loss": 0.001023868564516306, "global_step": 51354, "epoch": 431, "lr": 1.8459428275757927e-05} +{"train_loss": 0.0007124108378775418, "global_step": 51355, "epoch": 431, "lr": 1.845770921267408e-05} +{"train_loss": 0.0012208630796521902, "global_step": 51356, "epoch": 431, "lr": 1.8455990211520163e-05} +{"train_loss": 0.0008264740463346243, "global_step": 51357, "epoch": 431, "lr": 1.8454271272299545e-05} +{"train_loss": 0.0004064531240146607, "global_step": 51358, "epoch": 431, "lr": 1.8452552395015572e-05} +{"train_loss": 0.0003710336168296635, "global_step": 51359, "epoch": 431, "lr": 1.8450833579671663e-05} +{"train_loss": 0.0006861541769467294, "global_step": 51360, "epoch": 431, "lr": 1.844911482627115e-05} +{"train_loss": 0.0006526780780404806, "global_step": 51361, "epoch": 431, "lr": 1.844739613481745e-05} +{"train_loss": 0.0006150074768811464, "global_step": 51362, "epoch": 431, "lr": 1.8445677505313902e-05} +{"train_loss": 0.0007973170140758157, "global_step": 51363, "epoch": 431, "lr": 1.8443958937763905e-05} +{"train_loss": 0.0008459786185994744, "global_step": 51364, "epoch": 431, "lr": 1.8442240432170833e-05} +{"train_loss": 0.000549637246876955, "global_step": 51365, "epoch": 431, "lr": 1.8440521988538022e-05} +{"train_loss": 0.0011791236465796828, "global_step": 51366, "epoch": 431, "lr": 1.84388036068689e-05} +{"train_loss": 0.0005030384054407477, "global_step": 51367, "epoch": 431, "lr": 1.8437085287166794e-05} +{"train_loss": 0.0005688815144822001, "global_step": 51368, "epoch": 431, "lr": 1.843536702943512e-05} +{"train_loss": 0.0005560217541642487, "global_step": 51369, "epoch": 431, "lr": 1.843364883367723e-05} +{"train_loss": 0.0006296911160461605, "global_step": 51370, "epoch": 431, "lr": 1.8431930699896478e-05} +{"train_loss": 0.0005588577478192747, "global_step": 51371, "epoch": 431, "lr": 1.8430212628096277e-05} +{"train_loss": 0.0009006025502458215, "global_step": 51372, "epoch": 431, "lr": 1.8428494618279962e-05} +{"train_loss": 0.000540778215508908, "global_step": 51373, "epoch": 431, "lr": 1.8426776670450947e-05} +{"train_loss": 0.0016081619542092085, "global_step": 51374, "epoch": 431, "lr": 1.8425058784612558e-05} +{"train_loss": 0.0009809902403503656, "global_step": 51375, "epoch": 431, "lr": 1.8423340960768215e-05} +{"train_loss": 0.0007228752947412431, "global_step": 51376, "epoch": 431, "lr": 1.8421623198921266e-05} +{"train_loss": 0.0007529042195528746, "global_step": 51377, "epoch": 431, "lr": 1.841990549907507e-05} +{"train_loss": 0.0004891820135526359, "global_step": 51378, "epoch": 431, "lr": 1.841818786123303e-05} +{"train_loss": 0.001055204658769071, "global_step": 51379, "epoch": 431, "lr": 1.8416470285398492e-05} +{"train_loss": 0.0004938071360811591, "global_step": 51380, "epoch": 431, "lr": 1.8414752771574838e-05} +{"train_loss": 0.0009295002673752606, "global_step": 51381, "epoch": 431, "lr": 1.8413035319765458e-05} +{"train_loss": 0.0005594601389020681, "global_step": 51382, "epoch": 431, "lr": 1.84113179299737e-05} +{"train_loss": 0.0004747035272885114, "global_step": 51383, "epoch": 431, "lr": 1.8409600602202953e-05} +{"train_loss": 0.0011195670813322067, "global_step": 51384, "epoch": 431, "lr": 1.8407883336456568e-05} +{"train_loss": 0.0007830031681805849, "global_step": 51385, "epoch": 431, "lr": 1.840616613273794e-05} +{"train_loss": 0.0008515882072970271, "global_step": 51386, "epoch": 431, "lr": 1.8404448991050416e-05} +{"train_loss": 0.0007734609534963965, "global_step": 51387, "epoch": 431, "lr": 1.8402731911397396e-05} +{"train_loss": 0.0013152702013030648, "global_step": 51388, "epoch": 431, "lr": 1.840101489378224e-05} +{"train_loss": 0.00036346932756714523, "global_step": 51389, "epoch": 431, "lr": 1.83992979382083e-05} +{"train_loss": 0.0008705329964868724, "global_step": 51390, "epoch": 431, "lr": 1.8397581044678975e-05} +{"train_loss": 0.0008028302108868957, "global_step": 51391, "epoch": 431, "lr": 1.8395864213197606e-05} +{"train_loss": 0.0005475271609611809, "global_step": 51392, "epoch": 431, "lr": 1.8394147443767594e-05} +{"train_loss": 0.0006896395934745669, "global_step": 51393, "epoch": 431, "lr": 1.839243073639229e-05} +{"train_loss": 0.0005005607381463051, "global_step": 51394, "epoch": 431, "lr": 1.8390714091075085e-05} +{"train_loss": 0.0006563328788615763, "global_step": 51395, "epoch": 431, "lr": 1.8388997507819333e-05} +{"train_loss": 0.0008116266108117998, "global_step": 51396, "epoch": 431, "lr": 1.8387280986628393e-05} +{"train_loss": 0.0007288674241863191, "global_step": 51397, "epoch": 431, "lr": 1.8385564527505665e-05} +{"train_loss": 0.0007638122187927365, "global_step": 51398, "epoch": 431, "lr": 1.8383848130454485e-05} +{"train_loss": 0.00101371668279171, "global_step": 51399, "epoch": 431, "lr": 1.8382131795478263e-05} +{"train_loss": 0.0008007815922610462, "global_step": 51400, "epoch": 431, "lr": 1.8380415522580347e-05} +{"train_loss": 0.000481293594930321, "global_step": 51401, "epoch": 431, "lr": 1.8378699311764084e-05} +{"train_loss": 0.0011199023574590683, "global_step": 51402, "epoch": 431, "lr": 1.837698316303289e-05} +{"train_loss": 0.0009741750545799732, "global_step": 51403, "epoch": 431, "lr": 1.837526707639009e-05} +{"train_loss": 0.0012024848256260157, "global_step": 51404, "epoch": 431, "lr": 1.8373551051839093e-05} +{"train_loss": 0.0009587703971192241, "global_step": 51405, "epoch": 431, "lr": 1.837183508938323e-05} +{"train_loss": 0.0005767300608567894, "global_step": 51406, "epoch": 431, "lr": 1.8370119189025913e-05} +{"train_loss": 0.0008391589327410114, "global_step": 51407, "epoch": 431, "lr": 1.8368403350770486e-05, "val_loss": 0.04015824571251869} +{"train_loss": 0.00135669088922441, "global_step": 51408, "epoch": 432, "lr": 1.83666875746203e-05} +{"train_loss": 0.000924720661714673, "global_step": 51409, "epoch": 432, "lr": 1.836497186057876e-05} +{"train_loss": 0.0006641451618634164, "global_step": 51410, "epoch": 432, "lr": 1.8363256208649203e-05} +{"train_loss": 0.0005872657638974488, "global_step": 51411, "epoch": 432, "lr": 1.8361540618835034e-05} +{"train_loss": 0.0006150025292299688, "global_step": 51412, "epoch": 432, "lr": 1.8359825091139578e-05} +{"train_loss": 0.0011765885865315795, "global_step": 51413, "epoch": 432, "lr": 1.835810962556624e-05} +{"train_loss": 0.0007232678472064435, "global_step": 51414, "epoch": 432, "lr": 1.835639422211836e-05} +{"train_loss": 0.0010520971845835447, "global_step": 51415, "epoch": 432, "lr": 1.8354678880799315e-05} +{"train_loss": 0.0012527083745226264, "global_step": 51416, "epoch": 432, "lr": 1.83529636016125e-05} +{"train_loss": 0.001270861946977675, "global_step": 51417, "epoch": 432, "lr": 1.8351248384561238e-05} +{"train_loss": 0.0007041257922537625, "global_step": 51418, "epoch": 432, "lr": 1.834953322964894e-05} +{"train_loss": 0.0009036061819642782, "global_step": 51419, "epoch": 432, "lr": 1.8347818136878945e-05} +{"train_loss": 0.000526280899066478, "global_step": 51420, "epoch": 432, "lr": 1.834610310625462e-05} +{"train_loss": 0.0009120505419559777, "global_step": 51421, "epoch": 432, "lr": 1.834438813777935e-05} +{"train_loss": 0.001085013383999467, "global_step": 51422, "epoch": 432, "lr": 1.8342673231456482e-05} +{"train_loss": 0.0007837691809982061, "global_step": 51423, "epoch": 432, "lr": 1.8340958387289404e-05} +{"train_loss": 0.0008328207186423242, "global_step": 51424, "epoch": 432, "lr": 1.8339243605281453e-05} +{"train_loss": 0.0008445500861853361, "global_step": 51425, "epoch": 432, "lr": 1.833752888543604e-05} +{"train_loss": 0.0006776195368729532, "global_step": 51426, "epoch": 432, "lr": 1.8335814227756497e-05} +{"train_loss": 0.00038314072298817337, "global_step": 51427, "epoch": 432, "lr": 1.8334099632246187e-05} +{"train_loss": 0.0003699924563989043, "global_step": 51428, "epoch": 432, "lr": 1.833238509890851e-05} +{"train_loss": 0.0009494755649939179, "global_step": 51429, "epoch": 432, "lr": 1.833067062774679e-05} +{"train_loss": 0.0003641114162746817, "global_step": 51430, "epoch": 432, "lr": 1.8328956218764436e-05} +{"train_loss": 0.0015236630570143461, "global_step": 51431, "epoch": 432, "lr": 1.832724187196479e-05} +{"train_loss": 0.0004777321591973305, "global_step": 51432, "epoch": 432, "lr": 1.8325527587351206e-05} +{"train_loss": 0.0006940289167687297, "global_step": 51433, "epoch": 432, "lr": 1.8323813364927077e-05} +{"train_loss": 0.001105781993828714, "global_step": 51434, "epoch": 432, "lr": 1.8322099204695743e-05} +{"train_loss": 0.0005310281412675977, "global_step": 51435, "epoch": 432, "lr": 1.83203851066606e-05} +{"train_loss": 0.0008176917326636612, "global_step": 51436, "epoch": 432, "lr": 1.8318671070824977e-05} +{"train_loss": 0.0008019845699891448, "global_step": 51437, "epoch": 432, "lr": 1.8316957097192277e-05} +{"train_loss": 0.001411203877069056, "global_step": 51438, "epoch": 432, "lr": 1.8315243185765846e-05} +{"train_loss": 0.0005061781266704202, "global_step": 51439, "epoch": 432, "lr": 1.8313529336549036e-05} +{"train_loss": 0.0006219493225216866, "global_step": 51440, "epoch": 432, "lr": 1.8311815549545243e-05} +{"train_loss": 0.0005718134343624115, "global_step": 51441, "epoch": 432, "lr": 1.8310101824757792e-05} +{"train_loss": 0.0007614076021127403, "global_step": 51442, "epoch": 432, "lr": 1.8308388162190092e-05} +{"train_loss": 0.0006361327250488102, "global_step": 51443, "epoch": 432, "lr": 1.8306674561845466e-05} +{"train_loss": 0.0006310371682047844, "global_step": 51444, "epoch": 432, "lr": 1.830496102372732e-05} +{"train_loss": 0.0008196003036573529, "global_step": 51445, "epoch": 432, "lr": 1.8303247547838975e-05} +{"train_loss": 0.0006312604527920485, "global_step": 51446, "epoch": 432, "lr": 1.830153413418384e-05} +{"train_loss": 0.0009320940007455647, "global_step": 51447, "epoch": 432, "lr": 1.8299820782765236e-05} +{"train_loss": 0.0005503170541487634, "global_step": 51448, "epoch": 432, "lr": 1.8298107493586565e-05} +{"train_loss": 0.0013094408204779029, "global_step": 51449, "epoch": 432, "lr": 1.8296394266651156e-05} +{"train_loss": 0.0010710371425375342, "global_step": 51450, "epoch": 432, "lr": 1.82946811019624e-05} +{"train_loss": 0.00046481381286866963, "global_step": 51451, "epoch": 432, "lr": 1.8292967999523647e-05} +{"train_loss": 0.0007660181727260351, "global_step": 51452, "epoch": 432, "lr": 1.829125495933827e-05} +{"train_loss": 0.0007490954012610018, "global_step": 51453, "epoch": 432, "lr": 1.8289541981409612e-05} +{"train_loss": 0.0010027800453826785, "global_step": 51454, "epoch": 432, "lr": 1.828782906574107e-05} +{"train_loss": 0.0007154581253416836, "global_step": 51455, "epoch": 432, "lr": 1.828611621233597e-05} +{"train_loss": 0.0008820449002087116, "global_step": 51456, "epoch": 432, "lr": 1.828440342119771e-05} +{"train_loss": 0.00040599057683721185, "global_step": 51457, "epoch": 432, "lr": 1.8282690692329636e-05} +{"train_loss": 0.0004073966993018985, "global_step": 51458, "epoch": 432, "lr": 1.828097802573509e-05} +{"train_loss": 0.00087540945969522, "global_step": 51459, "epoch": 432, "lr": 1.8279265421417476e-05} +{"train_loss": 0.0008991938084363937, "global_step": 51460, "epoch": 432, "lr": 1.827755287938011e-05} +{"train_loss": 0.0008115664822980762, "global_step": 51461, "epoch": 432, "lr": 1.827584039962641e-05} +{"train_loss": 0.0005986581672914326, "global_step": 51462, "epoch": 432, "lr": 1.8274127982159682e-05} +{"train_loss": 0.0008133145747706294, "global_step": 51463, "epoch": 432, "lr": 1.827241562698333e-05} +{"train_loss": 0.000730200728867203, "global_step": 51464, "epoch": 432, "lr": 1.8270703334100707e-05} +{"train_loss": 0.001137700630351901, "global_step": 51465, "epoch": 432, "lr": 1.8268991103515147e-05} +{"train_loss": 0.0006192087894305587, "global_step": 51466, "epoch": 432, "lr": 1.8267278935230053e-05} +{"train_loss": 0.0009484890033490956, "global_step": 51467, "epoch": 432, "lr": 1.826556682924875e-05} +{"train_loss": 0.0009341301629319787, "global_step": 51468, "epoch": 432, "lr": 1.826385478557463e-05} +{"train_loss": 0.0007004147628322244, "global_step": 51469, "epoch": 432, "lr": 1.826214280421104e-05} +{"train_loss": 0.001165034482255578, "global_step": 51470, "epoch": 432, "lr": 1.8260430885161327e-05} +{"train_loss": 0.000650701520498842, "global_step": 51471, "epoch": 432, "lr": 1.8258719028428883e-05} +{"train_loss": 0.0007041975040920079, "global_step": 51472, "epoch": 432, "lr": 1.8257007234017037e-05} +{"train_loss": 0.0004200154507998377, "global_step": 51473, "epoch": 432, "lr": 1.825529550192918e-05} +{"train_loss": 0.001076540327630937, "global_step": 51474, "epoch": 432, "lr": 1.825358383216865e-05} +{"train_loss": 0.0012312912149354815, "global_step": 51475, "epoch": 432, "lr": 1.8251872224738824e-05} +{"train_loss": 0.0009240283397957683, "global_step": 51476, "epoch": 432, "lr": 1.8250160679643063e-05} +{"train_loss": 0.0006418332923203707, "global_step": 51477, "epoch": 432, "lr": 1.8248449196884698e-05} +{"train_loss": 0.00041291338857263327, "global_step": 51478, "epoch": 432, "lr": 1.824673777646711e-05} +{"train_loss": 0.002121653174981475, "global_step": 51479, "epoch": 432, "lr": 1.824502641839368e-05} +{"train_loss": 0.0006571730482392013, "global_step": 51480, "epoch": 432, "lr": 1.824331512266773e-05} +{"train_loss": 0.000760834023822099, "global_step": 51481, "epoch": 432, "lr": 1.824160388929265e-05} +{"train_loss": 0.0006453801761381328, "global_step": 51482, "epoch": 432, "lr": 1.823989271827178e-05} +{"train_loss": 0.0005301762139424682, "global_step": 51483, "epoch": 432, "lr": 1.82381816096085e-05} +{"train_loss": 0.0007652316708117723, "global_step": 51484, "epoch": 432, "lr": 1.823647056330614e-05} +{"train_loss": 0.0008398429490625858, "global_step": 51485, "epoch": 432, "lr": 1.8234759579368095e-05} +{"train_loss": 0.000582262349780649, "global_step": 51486, "epoch": 432, "lr": 1.823304865779769e-05} +{"train_loss": 0.0005872728070244193, "global_step": 51487, "epoch": 432, "lr": 1.8231337798598313e-05} +{"train_loss": 0.0007341076270677149, "global_step": 51488, "epoch": 432, "lr": 1.8229627001773314e-05} +{"train_loss": 0.0007661354611627758, "global_step": 51489, "epoch": 432, "lr": 1.822791626732603e-05} +{"train_loss": 0.0008836894412524998, "global_step": 51490, "epoch": 432, "lr": 1.8226205595259853e-05} +{"train_loss": 0.0007217339007183909, "global_step": 51491, "epoch": 432, "lr": 1.822449498557811e-05} +{"train_loss": 0.0008910237811505795, "global_step": 51492, "epoch": 432, "lr": 1.8222784438284196e-05} +{"train_loss": 0.0005000592209398746, "global_step": 51493, "epoch": 432, "lr": 1.8221073953381434e-05} +{"train_loss": 0.0005386802949942648, "global_step": 51494, "epoch": 432, "lr": 1.8219363530873213e-05} +{"train_loss": 0.0005053149652667344, "global_step": 51495, "epoch": 432, "lr": 1.8217653170762877e-05} +{"train_loss": 0.0008476405055262148, "global_step": 51496, "epoch": 432, "lr": 1.8215942873053767e-05} +{"train_loss": 0.0016917191678658128, "global_step": 51497, "epoch": 432, "lr": 1.8214232637749273e-05} +{"train_loss": 0.000926606822758913, "global_step": 51498, "epoch": 432, "lr": 1.821252246485272e-05} +{"train_loss": 0.0005491970223374665, "global_step": 51499, "epoch": 432, "lr": 1.82108123543675e-05} +{"train_loss": 0.0016058444743975997, "global_step": 51500, "epoch": 432, "lr": 1.8209102306296953e-05} +{"train_loss": 0.0005646430654451251, "global_step": 51501, "epoch": 432, "lr": 1.8207392320644423e-05} +{"train_loss": 0.001779654761776328, "global_step": 51502, "epoch": 432, "lr": 1.82056823974133e-05} +{"train_loss": 0.0005066163721494377, "global_step": 51503, "epoch": 432, "lr": 1.8203972536606906e-05} +{"train_loss": 0.0005884125712327659, "global_step": 51504, "epoch": 432, "lr": 1.8202262738228627e-05} +{"train_loss": 0.0005891316686756909, "global_step": 51505, "epoch": 432, "lr": 1.8200553002281796e-05} +{"train_loss": 0.0006041839951649308, "global_step": 51506, "epoch": 432, "lr": 1.8198843328769794e-05} +{"train_loss": 0.0005649614031426609, "global_step": 51507, "epoch": 432, "lr": 1.819713371769597e-05} +{"train_loss": 0.000819855195004493, "global_step": 51508, "epoch": 432, "lr": 1.8195424169063657e-05} +{"train_loss": 0.0006954984273761511, "global_step": 51509, "epoch": 432, "lr": 1.819371468287625e-05} +{"train_loss": 0.00131790351588279, "global_step": 51510, "epoch": 432, "lr": 1.8192005259137067e-05} +{"train_loss": 0.0010830382816493511, "global_step": 51511, "epoch": 432, "lr": 1.81902958978495e-05} +{"train_loss": 0.0010174959897994995, "global_step": 51512, "epoch": 432, "lr": 1.818858659901687e-05} +{"train_loss": 0.0010715483222156763, "global_step": 51513, "epoch": 432, "lr": 1.8186877362642558e-05} +{"train_loss": 0.0009406706085428596, "global_step": 51514, "epoch": 432, "lr": 1.8185168188729927e-05} +{"train_loss": 0.001033150008879602, "global_step": 51515, "epoch": 432, "lr": 1.81834590772823e-05} +{"train_loss": 0.0007160894456319511, "global_step": 51516, "epoch": 432, "lr": 1.8181750028303073e-05} +{"train_loss": 0.000922872219234705, "global_step": 51517, "epoch": 432, "lr": 1.8180041041795564e-05} +{"train_loss": 0.001645793323405087, "global_step": 51518, "epoch": 432, "lr": 1.817833211776316e-05} +{"train_loss": 0.0008076800149865448, "global_step": 51519, "epoch": 432, "lr": 1.8176623256209202e-05} +{"train_loss": 0.000773053674492985, "global_step": 51520, "epoch": 432, "lr": 1.8174914457137027e-05} +{"train_loss": 0.0009645386599004269, "global_step": 51521, "epoch": 432, "lr": 1.8173205720550025e-05} +{"train_loss": 0.0007958255591802299, "global_step": 51522, "epoch": 432, "lr": 1.8171497046451513e-05} +{"train_loss": 0.0008322509820573032, "global_step": 51523, "epoch": 432, "lr": 1.8169788434844886e-05} +{"train_loss": 0.0006283841794356704, "global_step": 51524, "epoch": 432, "lr": 1.8168079885733458e-05} +{"train_loss": 0.0006365052540786564, "global_step": 51525, "epoch": 432, "lr": 1.8166371399120624e-05} +{"train_loss": 0.0008234879923514833, "global_step": 51526, "epoch": 432, "lr": 1.816466297500972e-05, "val_loss": 0.027128903195261955} +{"train_loss": 0.0007750625372864306, "global_step": 51527, "epoch": 433, "lr": 1.8162954613404082e-05} +{"train_loss": 0.0009027239866554737, "global_step": 51528, "epoch": 433, "lr": 1.81612463143071e-05} +{"train_loss": 0.0008546250755898654, "global_step": 51529, "epoch": 433, "lr": 1.8159538077722088e-05} +{"train_loss": 0.0007663361611776054, "global_step": 51530, "epoch": 433, "lr": 1.8157829903652445e-05} +{"train_loss": 0.0008229796658270061, "global_step": 51531, "epoch": 433, "lr": 1.8156121792101476e-05} +{"train_loss": 0.0008038485539145768, "global_step": 51532, "epoch": 433, "lr": 1.8154413743072585e-05} +{"train_loss": 0.0011102849384769797, "global_step": 51533, "epoch": 433, "lr": 1.8152705756569093e-05} +{"train_loss": 0.0005862846155650914, "global_step": 51534, "epoch": 433, "lr": 1.8150997832594347e-05} +{"train_loss": 0.0014672051183879375, "global_step": 51535, "epoch": 433, "lr": 1.8149289971151733e-05} +{"train_loss": 0.0006248123245313764, "global_step": 51536, "epoch": 433, "lr": 1.8147582172244566e-05} +{"train_loss": 0.0007468474213965237, "global_step": 51537, "epoch": 433, "lr": 1.8145874435876237e-05} +{"train_loss": 0.0014364313101395965, "global_step": 51538, "epoch": 433, "lr": 1.814416676205008e-05} +{"train_loss": 0.0006887564668431878, "global_step": 51539, "epoch": 433, "lr": 1.814245915076943e-05} +{"train_loss": 0.0007276012329384685, "global_step": 51540, "epoch": 433, "lr": 1.8140751602037676e-05} +{"train_loss": 0.0007985556731000543, "global_step": 51541, "epoch": 433, "lr": 1.8139044115858133e-05} +{"train_loss": 0.0011181117733940482, "global_step": 51542, "epoch": 433, "lr": 1.81373366922342e-05} +{"train_loss": 0.0005309199332259595, "global_step": 51543, "epoch": 433, "lr": 1.8135629331169173e-05} +{"train_loss": 0.0007569302688352764, "global_step": 51544, "epoch": 433, "lr": 1.8133922032666455e-05} +{"train_loss": 0.0006991446716710925, "global_step": 51545, "epoch": 433, "lr": 1.8132214796729362e-05} +{"train_loss": 0.000437203940236941, "global_step": 51546, "epoch": 433, "lr": 1.8130507623361274e-05} +{"train_loss": 0.0011589945061132312, "global_step": 51547, "epoch": 433, "lr": 1.8128800512565513e-05} +{"train_loss": 0.00045756291365250945, "global_step": 51548, "epoch": 433, "lr": 1.8127093464345453e-05} +{"train_loss": 0.0010625036666169763, "global_step": 51549, "epoch": 433, "lr": 1.8125386478704447e-05} +{"train_loss": 0.0013338739518076181, "global_step": 51550, "epoch": 433, "lr": 1.8123679555645834e-05} +{"train_loss": 0.0005619220901280642, "global_step": 51551, "epoch": 433, "lr": 1.8121972695172978e-05} +{"train_loss": 0.0011151384096592665, "global_step": 51552, "epoch": 433, "lr": 1.812026589728923e-05} +{"train_loss": 0.001002905541099608, "global_step": 51553, "epoch": 433, "lr": 1.811855916199791e-05} +{"train_loss": 0.0010203151032328606, "global_step": 51554, "epoch": 433, "lr": 1.8116852489302417e-05} +{"train_loss": 0.0007691740756854415, "global_step": 51555, "epoch": 433, "lr": 1.8115145879206052e-05} +{"train_loss": 0.0010291755897924304, "global_step": 51556, "epoch": 433, "lr": 1.811343933171222e-05} +{"train_loss": 0.00044329179218038917, "global_step": 51557, "epoch": 433, "lr": 1.8111732846824237e-05} +{"train_loss": 0.0006624992820434272, "global_step": 51558, "epoch": 433, "lr": 1.811002642454544e-05} +{"train_loss": 0.0007608159212395549, "global_step": 51559, "epoch": 433, "lr": 1.810832006487922e-05} +{"train_loss": 0.00041275969124399126, "global_step": 51560, "epoch": 433, "lr": 1.8106613767828888e-05} +{"train_loss": 0.001310918596573174, "global_step": 51561, "epoch": 433, "lr": 1.810490753339783e-05} +{"train_loss": 0.0008817760972306132, "global_step": 51562, "epoch": 433, "lr": 1.8103201361589362e-05} +{"train_loss": 0.0010777951683849096, "global_step": 51563, "epoch": 433, "lr": 1.810149525240687e-05} +{"train_loss": 0.0006181612843647599, "global_step": 51564, "epoch": 433, "lr": 1.8099789205853678e-05} +{"train_loss": 0.0012423157459124923, "global_step": 51565, "epoch": 433, "lr": 1.809808322193313e-05} +{"train_loss": 0.0007560563390143216, "global_step": 51566, "epoch": 433, "lr": 1.8096377300648604e-05} +{"train_loss": 0.0008853076724335551, "global_step": 51567, "epoch": 433, "lr": 1.8094671442003414e-05} +{"train_loss": 0.0009060677839443088, "global_step": 51568, "epoch": 433, "lr": 1.8092965646000948e-05} +{"train_loss": 0.0003648981510195881, "global_step": 51569, "epoch": 433, "lr": 1.809125991264453e-05} +{"train_loss": 0.0014755470911040902, "global_step": 51570, "epoch": 433, "lr": 1.80895542419375e-05} +{"train_loss": 0.0006992522394284606, "global_step": 51571, "epoch": 433, "lr": 1.8087848633883243e-05} +{"train_loss": 0.0011934939539059997, "global_step": 51572, "epoch": 433, "lr": 1.8086143088485064e-05} +{"train_loss": 0.0005602167220786214, "global_step": 51573, "epoch": 433, "lr": 1.8084437605746346e-05} +{"train_loss": 0.0007060354109853506, "global_step": 51574, "epoch": 433, "lr": 1.8082732185670415e-05} +{"train_loss": 0.0010606505675241351, "global_step": 51575, "epoch": 433, "lr": 1.8081026828260644e-05} +{"train_loss": 0.001007568440400064, "global_step": 51576, "epoch": 433, "lr": 1.807932153352035e-05} +{"train_loss": 0.0004025961388833821, "global_step": 51577, "epoch": 433, "lr": 1.8077616301452915e-05} +{"train_loss": 0.0006775843212381005, "global_step": 51578, "epoch": 433, "lr": 1.807591113206165e-05} +{"train_loss": 0.0008455576607957482, "global_step": 51579, "epoch": 433, "lr": 1.8074206025349948e-05} +{"train_loss": 0.0005246895598247647, "global_step": 51580, "epoch": 433, "lr": 1.807250098132111e-05} +{"train_loss": 0.0009638889459893107, "global_step": 51581, "epoch": 433, "lr": 1.8070795999978518e-05} +{"train_loss": 0.0008338087354786694, "global_step": 51582, "epoch": 433, "lr": 1.8069091081325495e-05} +{"train_loss": 0.0012425020104274154, "global_step": 51583, "epoch": 433, "lr": 1.806738622536542e-05} +{"train_loss": 0.0009232659940607846, "global_step": 51584, "epoch": 433, "lr": 1.80656814321016e-05} +{"train_loss": 0.000990701955743134, "global_step": 51585, "epoch": 433, "lr": 1.8063976701537416e-05} +{"train_loss": 0.0005420009256340563, "global_step": 51586, "epoch": 433, "lr": 1.8062272033676192e-05} +{"train_loss": 0.0011692452244460583, "global_step": 51587, "epoch": 433, "lr": 1.8060567428521297e-05} +{"train_loss": 0.0009483470348641276, "global_step": 51588, "epoch": 433, "lr": 1.8058862886076067e-05} +{"train_loss": 0.0005890543689019978, "global_step": 51589, "epoch": 433, "lr": 1.805715840634383e-05} +{"train_loss": 0.0005451078759506345, "global_step": 51590, "epoch": 433, "lr": 1.805545398932797e-05} +{"train_loss": 0.0007642536656931043, "global_step": 51591, "epoch": 433, "lr": 1.8053749635031792e-05} +{"train_loss": 0.0008738667238503695, "global_step": 51592, "epoch": 433, "lr": 1.805204534345868e-05} +{"train_loss": 0.0009268483845517039, "global_step": 51593, "epoch": 433, "lr": 1.805034111461195e-05} +{"train_loss": 0.002009063493460417, "global_step": 51594, "epoch": 433, "lr": 1.804863694849498e-05} +{"train_loss": 0.0006858998094685376, "global_step": 51595, "epoch": 433, "lr": 1.8046932845111093e-05} +{"train_loss": 0.0005620631854981184, "global_step": 51596, "epoch": 433, "lr": 1.8045228804463627e-05} +{"train_loss": 0.001122782938182354, "global_step": 51597, "epoch": 433, "lr": 1.8043524826555956e-05} +{"train_loss": 0.0008389487047679722, "global_step": 51598, "epoch": 433, "lr": 1.8041820911391394e-05} +{"train_loss": 0.0007189253228716552, "global_step": 51599, "epoch": 433, "lr": 1.8040117058973317e-05} +{"train_loss": 0.0005922045675106347, "global_step": 51600, "epoch": 433, "lr": 1.8038413269305037e-05} +{"train_loss": 0.001189502771012485, "global_step": 51601, "epoch": 433, "lr": 1.803670954238994e-05} +{"train_loss": 0.0007271101931110024, "global_step": 51602, "epoch": 433, "lr": 1.803500587823135e-05} +{"train_loss": 0.0013887571403756738, "global_step": 51603, "epoch": 433, "lr": 1.8033302276832588e-05} +{"train_loss": 0.0011056968942284584, "global_step": 51604, "epoch": 433, "lr": 1.8031598738197043e-05} +{"train_loss": 0.001282988116145134, "global_step": 51605, "epoch": 433, "lr": 1.8029895262328016e-05} +{"train_loss": 0.0008737768512219191, "global_step": 51606, "epoch": 433, "lr": 1.8028191849228897e-05} +{"train_loss": 0.0005425799172371626, "global_step": 51607, "epoch": 433, "lr": 1.802648849890301e-05} +{"train_loss": 0.001300507108680904, "global_step": 51608, "epoch": 433, "lr": 1.8024785211353673e-05} +{"train_loss": 0.001065627089701593, "global_step": 51609, "epoch": 433, "lr": 1.8023081986584263e-05} +{"train_loss": 0.00030240684282034636, "global_step": 51610, "epoch": 433, "lr": 1.8021378824598124e-05} +{"train_loss": 0.0010033056605607271, "global_step": 51611, "epoch": 433, "lr": 1.8019675725398577e-05} +{"train_loss": 0.0008794196182861924, "global_step": 51612, "epoch": 433, "lr": 1.8017972688988992e-05} +{"train_loss": 0.0008517448441125453, "global_step": 51613, "epoch": 433, "lr": 1.801626971537269e-05} +{"train_loss": 0.0013222628040239215, "global_step": 51614, "epoch": 433, "lr": 1.8014566804553044e-05} +{"train_loss": 0.0008767584222368896, "global_step": 51615, "epoch": 433, "lr": 1.801286395653336e-05} +{"train_loss": 0.0006981833139434457, "global_step": 51616, "epoch": 433, "lr": 1.8011161171317016e-05} +{"train_loss": 0.0011633004760369658, "global_step": 51617, "epoch": 433, "lr": 1.8009458448907322e-05} +{"train_loss": 0.0009877767879515886, "global_step": 51618, "epoch": 433, "lr": 1.8007755789307656e-05} +{"train_loss": 0.001219390775077045, "global_step": 51619, "epoch": 433, "lr": 1.8006053192521344e-05} +{"train_loss": 0.0011783562367781997, "global_step": 51620, "epoch": 433, "lr": 1.800435065855171e-05} +{"train_loss": 0.0004591377801261842, "global_step": 51621, "epoch": 433, "lr": 1.8002648187402137e-05} +{"train_loss": 0.0003149546682834625, "global_step": 51622, "epoch": 433, "lr": 1.800094577907593e-05} +{"train_loss": 0.0003891474043484777, "global_step": 51623, "epoch": 433, "lr": 1.7999243433576457e-05} +{"train_loss": 0.0008830380393192172, "global_step": 51624, "epoch": 433, "lr": 1.7997541150907038e-05} +{"train_loss": 0.0008086594170890749, "global_step": 51625, "epoch": 433, "lr": 1.7995838931071042e-05} +{"train_loss": 0.0008501183474436402, "global_step": 51626, "epoch": 433, "lr": 1.7994136774071802e-05} +{"train_loss": 0.0005110185011290014, "global_step": 51627, "epoch": 433, "lr": 1.7992434679912636e-05} +{"train_loss": 0.0018234868766739964, "global_step": 51628, "epoch": 433, "lr": 1.799073264859692e-05} +{"train_loss": 0.0009776256047189236, "global_step": 51629, "epoch": 433, "lr": 1.7989030680127967e-05} +{"train_loss": 0.0008637786959297955, "global_step": 51630, "epoch": 433, "lr": 1.7987328774509142e-05} +{"train_loss": 0.0003811339265666902, "global_step": 51631, "epoch": 433, "lr": 1.7985626931743764e-05} +{"train_loss": 0.0008493408095091581, "global_step": 51632, "epoch": 433, "lr": 1.7983925151835207e-05} +{"train_loss": 0.0006487863138318062, "global_step": 51633, "epoch": 433, "lr": 1.7982223434786794e-05} +{"train_loss": 0.0005975427338853478, "global_step": 51634, "epoch": 433, "lr": 1.7980521780601843e-05} +{"train_loss": 0.000764531665481627, "global_step": 51635, "epoch": 433, "lr": 1.7978820189283735e-05} +{"train_loss": 0.0009018887067213655, "global_step": 51636, "epoch": 433, "lr": 1.797711866083578e-05} +{"train_loss": 0.0007573300390504301, "global_step": 51637, "epoch": 433, "lr": 1.797541719526134e-05} +{"train_loss": 0.0007360934396274388, "global_step": 51638, "epoch": 433, "lr": 1.7973715792563756e-05} +{"train_loss": 0.0010588044533506036, "global_step": 51639, "epoch": 433, "lr": 1.797201445274634e-05} +{"train_loss": 0.001852433430030942, "global_step": 51640, "epoch": 433, "lr": 1.7970313175812464e-05} +{"train_loss": 0.0009569154353812337, "global_step": 51641, "epoch": 433, "lr": 1.796861196176544e-05} +{"train_loss": 0.0010322495363652706, "global_step": 51642, "epoch": 433, "lr": 1.7966910810608646e-05} +{"train_loss": 0.0008088789763860404, "global_step": 51643, "epoch": 433, "lr": 1.7965209722345384e-05} +{"train_loss": 0.0013110365252941847, "global_step": 51644, "epoch": 433, "lr": 1.796350869697902e-05} +{"train_loss": 0.0008795284768840408, "global_step": 51645, "epoch": 433, "lr": 1.796180773451287e-05, "val_loss": 0.017544090747833252} +{"train_loss": 0.0007874235743656754, "global_step": 51646, "epoch": 434, "lr": 1.796010683495029e-05} +{"train_loss": 0.0007695619715377688, "global_step": 51647, "epoch": 434, "lr": 1.7958405998294635e-05} +{"train_loss": 0.0005497497040778399, "global_step": 51648, "epoch": 434, "lr": 1.7956705224549208e-05} +{"train_loss": 0.000701691082213074, "global_step": 51649, "epoch": 434, "lr": 1.7955004513717382e-05} +{"train_loss": 0.0005862139514647424, "global_step": 51650, "epoch": 434, "lr": 1.7953303865802467e-05} +{"train_loss": 0.0013740650610998273, "global_step": 51651, "epoch": 434, "lr": 1.795160328080783e-05} +{"train_loss": 0.0005370365688577294, "global_step": 51652, "epoch": 434, "lr": 1.7949902758736804e-05} +{"train_loss": 0.0011567045003175735, "global_step": 51653, "epoch": 434, "lr": 1.7948202299592698e-05} +{"train_loss": 0.0007318214629776776, "global_step": 51654, "epoch": 434, "lr": 1.7946501903378888e-05} +{"train_loss": 0.0009822959545999765, "global_step": 51655, "epoch": 434, "lr": 1.794480157009868e-05} +{"train_loss": 0.0008109158952720463, "global_step": 51656, "epoch": 434, "lr": 1.794310129975545e-05} +{"train_loss": 0.0014787974068894982, "global_step": 51657, "epoch": 434, "lr": 1.794140109235251e-05} +{"train_loss": 0.0009748489246703684, "global_step": 51658, "epoch": 434, "lr": 1.793970094789319e-05} +{"train_loss": 0.0005544906016439199, "global_step": 51659, "epoch": 434, "lr": 1.793800086638086e-05} +{"train_loss": 0.0003480942395981401, "global_step": 51660, "epoch": 434, "lr": 1.793630084781882e-05} +{"train_loss": 0.0008371858857572079, "global_step": 51661, "epoch": 434, "lr": 1.7934600892210452e-05} +{"train_loss": 0.0007375197019428015, "global_step": 51662, "epoch": 434, "lr": 1.7932900999559043e-05} +{"train_loss": 0.0009972803527489305, "global_step": 51663, "epoch": 434, "lr": 1.793120116986798e-05} +{"train_loss": 0.00045042092096991837, "global_step": 51664, "epoch": 434, "lr": 1.7929501403140575e-05} +{"train_loss": 0.0011642685858532786, "global_step": 51665, "epoch": 434, "lr": 1.7927801699380153e-05} +{"train_loss": 0.0013546309201046824, "global_step": 51666, "epoch": 434, "lr": 1.7926102058590082e-05} +{"train_loss": 0.0011431816965341568, "global_step": 51667, "epoch": 434, "lr": 1.7924402480773668e-05} +{"train_loss": 0.0017099601682275534, "global_step": 51668, "epoch": 434, "lr": 1.7922702965934275e-05} +{"train_loss": 0.0008951816707849503, "global_step": 51669, "epoch": 434, "lr": 1.7921003514075214e-05} +{"train_loss": 0.0009341419208794832, "global_step": 51670, "epoch": 434, "lr": 1.7919304125199852e-05} +{"train_loss": 0.0008527747122570872, "global_step": 51671, "epoch": 434, "lr": 1.791760479931151e-05} +{"train_loss": 0.0008595852414146066, "global_step": 51672, "epoch": 434, "lr": 1.7915905536413507e-05} +{"train_loss": 0.000387668696930632, "global_step": 51673, "epoch": 434, "lr": 1.791420633650921e-05} +{"train_loss": 0.0015637603355571628, "global_step": 51674, "epoch": 434, "lr": 1.7912507199601926e-05} +{"train_loss": 0.0006818309775553644, "global_step": 51675, "epoch": 434, "lr": 1.7910808125695024e-05} +{"train_loss": 0.0009993957355618477, "global_step": 51676, "epoch": 434, "lr": 1.79091091147918e-05} +{"train_loss": 0.000441727606812492, "global_step": 51677, "epoch": 434, "lr": 1.7907410166895633e-05} +{"train_loss": 0.0006983358762226999, "global_step": 51678, "epoch": 434, "lr": 1.790571128200982e-05} +{"train_loss": 0.0011655287817120552, "global_step": 51679, "epoch": 434, "lr": 1.7904012460137733e-05} +{"train_loss": 0.0008791007567197084, "global_step": 51680, "epoch": 434, "lr": 1.790231370128267e-05} +{"train_loss": 0.0006268402794376016, "global_step": 51681, "epoch": 434, "lr": 1.7900615005447984e-05} +{"train_loss": 0.0013677258975803852, "global_step": 51682, "epoch": 434, "lr": 1.7898916372637027e-05} +{"train_loss": 0.0006869963835924864, "global_step": 51683, "epoch": 434, "lr": 1.7897217802853123e-05} +{"train_loss": 0.0009715769556351006, "global_step": 51684, "epoch": 434, "lr": 1.7895519296099578e-05} +{"train_loss": 0.0008395213517360389, "global_step": 51685, "epoch": 434, "lr": 1.789382085237977e-05} +{"train_loss": 0.001090462552383542, "global_step": 51686, "epoch": 434, "lr": 1.7892122471697003e-05} +{"train_loss": 0.0011872915783897042, "global_step": 51687, "epoch": 434, "lr": 1.7890424154054635e-05} +{"train_loss": 0.000664097664412111, "global_step": 51688, "epoch": 434, "lr": 1.7888725899455995e-05} +{"train_loss": 0.0008137793047353625, "global_step": 51689, "epoch": 434, "lr": 1.7887027707904385e-05} +{"train_loss": 0.0007295851828530431, "global_step": 51690, "epoch": 434, "lr": 1.7885329579403186e-05} +{"train_loss": 0.0007426138618029654, "global_step": 51691, "epoch": 434, "lr": 1.78836315139557e-05} +{"train_loss": 0.0011426418786868453, "global_step": 51692, "epoch": 434, "lr": 1.7881933511565287e-05} +{"train_loss": 0.0005055909277871251, "global_step": 51693, "epoch": 434, "lr": 1.7880235572235243e-05} +{"train_loss": 0.0004256000684108585, "global_step": 51694, "epoch": 434, "lr": 1.787853769596895e-05} +{"train_loss": 0.0007539538200944662, "global_step": 51695, "epoch": 434, "lr": 1.787683988276971e-05} +{"train_loss": 0.0007992080063559115, "global_step": 51696, "epoch": 434, "lr": 1.787514213264085e-05} +{"train_loss": 0.0006440283032134175, "global_step": 51697, "epoch": 434, "lr": 1.787344444558573e-05} +{"train_loss": 0.0008561817812733352, "global_step": 51698, "epoch": 434, "lr": 1.7871746821607654e-05} +{"train_loss": 0.0008533226209692657, "global_step": 51699, "epoch": 434, "lr": 1.7870049260709993e-05} +{"train_loss": 0.0007548342109657824, "global_step": 51700, "epoch": 434, "lr": 1.7868351762896036e-05} +{"train_loss": 0.0006823143339715898, "global_step": 51701, "epoch": 434, "lr": 1.7866654328169153e-05} +{"train_loss": 0.0006098360172472894, "global_step": 51702, "epoch": 434, "lr": 1.7864956956532663e-05} +{"train_loss": 0.001021742820739746, "global_step": 51703, "epoch": 434, "lr": 1.7863259647989878e-05} +{"train_loss": 0.0009528854861855507, "global_step": 51704, "epoch": 434, "lr": 1.786156240254417e-05} +{"train_loss": 0.0009552751434966922, "global_step": 51705, "epoch": 434, "lr": 1.7859865220198828e-05} +{"train_loss": 0.0006215836037881672, "global_step": 51706, "epoch": 434, "lr": 1.7858168100957234e-05} +{"train_loss": 0.0007328896899707615, "global_step": 51707, "epoch": 434, "lr": 1.785647104482267e-05} +{"train_loss": 0.0007389340898953378, "global_step": 51708, "epoch": 434, "lr": 1.7854774051798507e-05} +{"train_loss": 0.0006641687941737473, "global_step": 51709, "epoch": 434, "lr": 1.7853077121888045e-05} +{"train_loss": 0.0010337040293961763, "global_step": 51710, "epoch": 434, "lr": 1.7851380255094647e-05} +{"train_loss": 0.0009059460717253387, "global_step": 51711, "epoch": 434, "lr": 1.7849683451421618e-05} +{"train_loss": 0.0005821750382892787, "global_step": 51712, "epoch": 434, "lr": 1.784798671087231e-05} +{"train_loss": 0.0006142750498838723, "global_step": 51713, "epoch": 434, "lr": 1.784629003345003e-05} +{"train_loss": 0.0004020057385787368, "global_step": 51714, "epoch": 434, "lr": 1.7844593419158146e-05} +{"train_loss": 0.0019811755046248436, "global_step": 51715, "epoch": 434, "lr": 1.7842896867999947e-05} +{"train_loss": 0.0011455462081357837, "global_step": 51716, "epoch": 434, "lr": 1.7841200379978805e-05} +{"train_loss": 0.0009179339976981282, "global_step": 51717, "epoch": 434, "lr": 1.783950395509801e-05} +{"train_loss": 0.0009251302108168602, "global_step": 51718, "epoch": 434, "lr": 1.7837807593360935e-05} +{"train_loss": 0.0005546333268284798, "global_step": 51719, "epoch": 434, "lr": 1.7836111294770864e-05} +{"train_loss": 0.0005953171639703214, "global_step": 51720, "epoch": 434, "lr": 1.7834415059331172e-05} +{"train_loss": 0.0016401783796027303, "global_step": 51721, "epoch": 434, "lr": 1.7832718887045173e-05} +{"train_loss": 0.0008327626273967326, "global_step": 51722, "epoch": 434, "lr": 1.7831022777916173e-05} +{"train_loss": 0.001594860223121941, "global_step": 51723, "epoch": 434, "lr": 1.7829326731947543e-05} +{"train_loss": 0.0010427095694467425, "global_step": 51724, "epoch": 434, "lr": 1.782763074914257e-05} +{"train_loss": 0.0011548285838216543, "global_step": 51725, "epoch": 434, "lr": 1.782593482950463e-05} +{"train_loss": 0.0007638112874701619, "global_step": 51726, "epoch": 434, "lr": 1.782423897303703e-05} +{"train_loss": 0.0004012025601696223, "global_step": 51727, "epoch": 434, "lr": 1.782254317974308e-05} +{"train_loss": 0.0005586715415120125, "global_step": 51728, "epoch": 434, "lr": 1.7820847449626148e-05} +{"train_loss": 0.0011280489852651954, "global_step": 51729, "epoch": 434, "lr": 1.7819151782689526e-05} +{"train_loss": 0.0005808374844491482, "global_step": 51730, "epoch": 434, "lr": 1.7817456178936577e-05} +{"train_loss": 0.0008421057718805969, "global_step": 51731, "epoch": 434, "lr": 1.78157606383706e-05} +{"train_loss": 0.0007751573575660586, "global_step": 51732, "epoch": 434, "lr": 1.7814065160994953e-05} +{"train_loss": 0.0005807879497297108, "global_step": 51733, "epoch": 434, "lr": 1.7812369746812952e-05} +{"train_loss": 0.0004136688366997987, "global_step": 51734, "epoch": 434, "lr": 1.781067439582791e-05} +{"train_loss": 0.0010234664659947157, "global_step": 51735, "epoch": 434, "lr": 1.7808979108043177e-05} +{"train_loss": 0.0006679263315163553, "global_step": 51736, "epoch": 434, "lr": 1.7807283883462067e-05} +{"train_loss": 0.0010586417047306895, "global_step": 51737, "epoch": 434, "lr": 1.780558872208793e-05} +{"train_loss": 0.0011164047755300999, "global_step": 51738, "epoch": 434, "lr": 1.7803893623924078e-05} +{"train_loss": 0.0006102463230490685, "global_step": 51739, "epoch": 434, "lr": 1.7802198588973828e-05} +{"train_loss": 0.0008370502619072795, "global_step": 51740, "epoch": 434, "lr": 1.7800503617240537e-05} +{"train_loss": 0.00039983689202927053, "global_step": 51741, "epoch": 434, "lr": 1.77988087087275e-05} +{"train_loss": 0.0013760799774900079, "global_step": 51742, "epoch": 434, "lr": 1.7797113863438063e-05} +{"train_loss": 0.0011806790716946125, "global_step": 51743, "epoch": 434, "lr": 1.779541908137557e-05} +{"train_loss": 0.0006261013331823051, "global_step": 51744, "epoch": 434, "lr": 1.7793724362543313e-05} +{"train_loss": 0.001163482666015625, "global_step": 51745, "epoch": 434, "lr": 1.7792029706944653e-05} +{"train_loss": 0.0007197858649305999, "global_step": 51746, "epoch": 434, "lr": 1.7790335114582884e-05} +{"train_loss": 0.0005645655910484493, "global_step": 51747, "epoch": 434, "lr": 1.778864058546137e-05} +{"train_loss": 0.00039324231329374015, "global_step": 51748, "epoch": 434, "lr": 1.7786946119583403e-05} +{"train_loss": 0.0007074628374539316, "global_step": 51749, "epoch": 434, "lr": 1.778525171695234e-05} +{"train_loss": 0.0008202033932320774, "global_step": 51750, "epoch": 434, "lr": 1.7783557377571475e-05} +{"train_loss": 0.0006052967510186136, "global_step": 51751, "epoch": 434, "lr": 1.7781863101444175e-05} +{"train_loss": 0.0005813338793814182, "global_step": 51752, "epoch": 434, "lr": 1.7780168888573746e-05} +{"train_loss": 0.0006556377629749477, "global_step": 51753, "epoch": 434, "lr": 1.777847473896349e-05} +{"train_loss": 0.0008298473549075425, "global_step": 51754, "epoch": 434, "lr": 1.7776780652616776e-05} +{"train_loss": 0.0012133767595514655, "global_step": 51755, "epoch": 434, "lr": 1.7775086629536896e-05} +{"train_loss": 0.0016598632792010903, "global_step": 51756, "epoch": 434, "lr": 1.7773392669727206e-05} +{"train_loss": 0.0008037619991227984, "global_step": 51757, "epoch": 434, "lr": 1.7771698773191013e-05} +{"train_loss": 0.0005678030429407954, "global_step": 51758, "epoch": 434, "lr": 1.7770004939931633e-05} +{"train_loss": 0.0006481613963842392, "global_step": 51759, "epoch": 434, "lr": 1.776831116995242e-05} +{"train_loss": 0.000668743799906224, "global_step": 51760, "epoch": 434, "lr": 1.7766617463256674e-05} +{"train_loss": 0.00056218181271106, "global_step": 51761, "epoch": 434, "lr": 1.7764923819847746e-05} +{"train_loss": 0.0012492351233959198, "global_step": 51762, "epoch": 434, "lr": 1.7763230239728923e-05} +{"train_loss": 0.00033230779808945954, "global_step": 51763, "epoch": 434, "lr": 1.7761536722903577e-05} +{"train_loss": 0.0008531356413316514, "global_step": 51764, "epoch": 434, "lr": 1.7759843269375003e-05, "val_loss": 0.03993133082985878} +{"train_loss": 0.0009170452831313014, "global_step": 51765, "epoch": 435, "lr": 1.7758149879146517e-05} +{"train_loss": 0.0008124327869154513, "global_step": 51766, "epoch": 435, "lr": 1.7756456552221485e-05} +{"train_loss": 0.0008143394952639937, "global_step": 51767, "epoch": 435, "lr": 1.7754763288603177e-05} +{"train_loss": 0.0009420525748282671, "global_step": 51768, "epoch": 435, "lr": 1.775307008829497e-05} +{"train_loss": 0.0008505827281624079, "global_step": 51769, "epoch": 435, "lr": 1.7751376951300147e-05} +{"train_loss": 0.000898448983207345, "global_step": 51770, "epoch": 435, "lr": 1.7749683877622066e-05} +{"train_loss": 0.000463508942630142, "global_step": 51771, "epoch": 435, "lr": 1.7747990867264037e-05} +{"train_loss": 0.0009024001774378121, "global_step": 51772, "epoch": 435, "lr": 1.774629792022936e-05} +{"train_loss": 0.0005451188771985471, "global_step": 51773, "epoch": 435, "lr": 1.7744605036521404e-05} +{"train_loss": 0.00045018165837973356, "global_step": 51774, "epoch": 435, "lr": 1.7742912216143454e-05} +{"train_loss": 0.0009524814086034894, "global_step": 51775, "epoch": 435, "lr": 1.774121945909886e-05} +{"train_loss": 0.00042786344420164824, "global_step": 51776, "epoch": 435, "lr": 1.7739526765390924e-05} +{"train_loss": 0.0009084938792511821, "global_step": 51777, "epoch": 435, "lr": 1.773783413502298e-05} +{"train_loss": 0.0011007969733327627, "global_step": 51778, "epoch": 435, "lr": 1.7736141567998366e-05} +{"train_loss": 0.0004563196562230587, "global_step": 51779, "epoch": 435, "lr": 1.7734449064320373e-05} +{"train_loss": 0.0006012739613652229, "global_step": 51780, "epoch": 435, "lr": 1.7732756623992364e-05} +{"train_loss": 0.0010829837992787361, "global_step": 51781, "epoch": 435, "lr": 1.7731064247017625e-05} +{"train_loss": 0.0008651352254673839, "global_step": 51782, "epoch": 435, "lr": 1.7729371933399507e-05} +{"train_loss": 0.0007268710760399699, "global_step": 51783, "epoch": 435, "lr": 1.7727679683141317e-05} +{"train_loss": 0.0004195748770143837, "global_step": 51784, "epoch": 435, "lr": 1.7725987496246365e-05} +{"train_loss": 0.0015406837919726968, "global_step": 51785, "epoch": 435, "lr": 1.772429537271801e-05} +{"train_loss": 0.000529502343852073, "global_step": 51786, "epoch": 435, "lr": 1.7722603312559532e-05} +{"train_loss": 0.0008486934239044785, "global_step": 51787, "epoch": 435, "lr": 1.772091131577429e-05} +{"train_loss": 0.001017606584355235, "global_step": 51788, "epoch": 435, "lr": 1.7719219382365577e-05} +{"train_loss": 0.000808327691629529, "global_step": 51789, "epoch": 435, "lr": 1.771752751233674e-05} +{"train_loss": 0.0012691995361819863, "global_step": 51790, "epoch": 435, "lr": 1.7715835705691093e-05} +{"train_loss": 0.001213640789501369, "global_step": 51791, "epoch": 435, "lr": 1.7714143962431935e-05} +{"train_loss": 0.0004392221162561327, "global_step": 51792, "epoch": 435, "lr": 1.7712452282562624e-05} +{"train_loss": 0.0003915320266969502, "global_step": 51793, "epoch": 435, "lr": 1.7710760666086446e-05} +{"train_loss": 0.0009087244980037212, "global_step": 51794, "epoch": 435, "lr": 1.7709069113006753e-05} +{"train_loss": 0.0009068006183952093, "global_step": 51795, "epoch": 435, "lr": 1.770737762332686e-05} +{"train_loss": 0.0005175614496693015, "global_step": 51796, "epoch": 435, "lr": 1.770568619705006e-05} +{"train_loss": 0.0008624003967270255, "global_step": 51797, "epoch": 435, "lr": 1.770399483417971e-05} +{"train_loss": 0.0005681447219103575, "global_step": 51798, "epoch": 435, "lr": 1.77023035347191e-05} +{"train_loss": 0.0011719973990693688, "global_step": 51799, "epoch": 435, "lr": 1.7700612298671587e-05} +{"train_loss": 0.0012913221726194024, "global_step": 51800, "epoch": 435, "lr": 1.7698921126040452e-05} +{"train_loss": 0.0005560222780331969, "global_step": 51801, "epoch": 435, "lr": 1.7697230016829053e-05} +{"train_loss": 0.00039067829493433237, "global_step": 51802, "epoch": 435, "lr": 1.7695538971040686e-05} +{"train_loss": 0.0003986795782111585, "global_step": 51803, "epoch": 435, "lr": 1.769384798867867e-05} +{"train_loss": 0.0008641870226711035, "global_step": 51804, "epoch": 435, "lr": 1.7692157069746342e-05} +{"train_loss": 0.0010994855547323823, "global_step": 51805, "epoch": 435, "lr": 1.7690466214247e-05} +{"train_loss": 0.000818939006421715, "global_step": 51806, "epoch": 435, "lr": 1.7688775422183983e-05} +{"train_loss": 0.0008614920079708099, "global_step": 51807, "epoch": 435, "lr": 1.7687084693560598e-05} +{"train_loss": 0.0008943825960159302, "global_step": 51808, "epoch": 435, "lr": 1.768539402838018e-05} +{"train_loss": 0.0015146700898185372, "global_step": 51809, "epoch": 435, "lr": 1.768370342664602e-05} +{"train_loss": 0.0009689770522527397, "global_step": 51810, "epoch": 435, "lr": 1.7682012888361478e-05} +{"train_loss": 0.0005700631299987435, "global_step": 51811, "epoch": 435, "lr": 1.768032241352983e-05} +{"train_loss": 0.0016437205485999584, "global_step": 51812, "epoch": 435, "lr": 1.7678632002154423e-05} +{"train_loss": 0.0007884672959335148, "global_step": 51813, "epoch": 435, "lr": 1.7676941654238578e-05} +{"train_loss": 0.0007149224984459579, "global_step": 51814, "epoch": 435, "lr": 1.7675251369785612e-05} +{"train_loss": 0.0009221069631166756, "global_step": 51815, "epoch": 435, "lr": 1.7673561148798813e-05} +{"train_loss": 0.0006647270638495684, "global_step": 51816, "epoch": 435, "lr": 1.767187099128154e-05} +{"train_loss": 0.0005721919587813318, "global_step": 51817, "epoch": 435, "lr": 1.7670180897237082e-05} +{"train_loss": 0.00043908398947678506, "global_step": 51818, "epoch": 435, "lr": 1.7668490866668785e-05} +{"train_loss": 0.0007846569060347974, "global_step": 51819, "epoch": 435, "lr": 1.766680089957994e-05} +{"train_loss": 0.0009885135805234313, "global_step": 51820, "epoch": 435, "lr": 1.7665110995973888e-05} +{"train_loss": 0.0010245006997138262, "global_step": 51821, "epoch": 435, "lr": 1.766342115585394e-05} +{"train_loss": 0.0005634515546262264, "global_step": 51822, "epoch": 435, "lr": 1.7661731379223385e-05} +{"train_loss": 0.0012541820760816336, "global_step": 51823, "epoch": 435, "lr": 1.766004166608559e-05} +{"train_loss": 0.0007022517966106534, "global_step": 51824, "epoch": 435, "lr": 1.765835201644383e-05} +{"train_loss": 0.0008991868235170841, "global_step": 51825, "epoch": 435, "lr": 1.7656662430301457e-05} +{"train_loss": 0.0007142185932025313, "global_step": 51826, "epoch": 435, "lr": 1.765497290766177e-05} +{"train_loss": 0.001085922122001648, "global_step": 51827, "epoch": 435, "lr": 1.7653283448528075e-05} +{"train_loss": 0.00040294433711096644, "global_step": 51828, "epoch": 435, "lr": 1.7651594052903715e-05} +{"train_loss": 0.0006940164021216333, "global_step": 51829, "epoch": 435, "lr": 1.7649904720791983e-05} +{"train_loss": 0.0012411181814968586, "global_step": 51830, "epoch": 435, "lr": 1.7648215452196216e-05} +{"train_loss": 0.0009015673422254622, "global_step": 51831, "epoch": 435, "lr": 1.764652624711971e-05} +{"train_loss": 0.00043190931319259107, "global_step": 51832, "epoch": 435, "lr": 1.764483710556581e-05} +{"train_loss": 0.0006244543474167585, "global_step": 51833, "epoch": 435, "lr": 1.7643148027537815e-05} +{"train_loss": 0.0004902036744169891, "global_step": 51834, "epoch": 435, "lr": 1.7641459013039024e-05} +{"train_loss": 0.0009803680004552007, "global_step": 51835, "epoch": 435, "lr": 1.763977006207279e-05} +{"train_loss": 0.0012801939155906439, "global_step": 51836, "epoch": 435, "lr": 1.763808117464239e-05} +{"train_loss": 0.0017567361937835813, "global_step": 51837, "epoch": 435, "lr": 1.763639235075118e-05} +{"train_loss": 0.0009115348220802844, "global_step": 51838, "epoch": 435, "lr": 1.763470359040244e-05} +{"train_loss": 0.0016713418299332261, "global_step": 51839, "epoch": 435, "lr": 1.763301489359952e-05} +{"train_loss": 0.0005041905678808689, "global_step": 51840, "epoch": 435, "lr": 1.76313262603457e-05} +{"train_loss": 0.0007222217973321676, "global_step": 51841, "epoch": 435, "lr": 1.7629637690644325e-05} +{"train_loss": 0.0005900812102481723, "global_step": 51842, "epoch": 435, "lr": 1.7627949184498682e-05} +{"train_loss": 0.0007546172710135579, "global_step": 51843, "epoch": 435, "lr": 1.762626074191212e-05} +{"train_loss": 0.0016312736552208662, "global_step": 51844, "epoch": 435, "lr": 1.762457236288792e-05} +{"train_loss": 0.0005165631300769746, "global_step": 51845, "epoch": 435, "lr": 1.7622884047429434e-05} +{"train_loss": 0.0009312852052971721, "global_step": 51846, "epoch": 435, "lr": 1.7621195795539937e-05} +{"train_loss": 0.0005530109629034996, "global_step": 51847, "epoch": 435, "lr": 1.761950760722278e-05} +{"train_loss": 0.0020730653777718544, "global_step": 51848, "epoch": 435, "lr": 1.761781948248124e-05} +{"train_loss": 0.0013023008359596133, "global_step": 51849, "epoch": 435, "lr": 1.761613142131867e-05} +{"train_loss": 0.0005044882418587804, "global_step": 51850, "epoch": 435, "lr": 1.7614443423738352e-05} +{"train_loss": 0.00046165031380951405, "global_step": 51851, "epoch": 435, "lr": 1.761275548974363e-05} +{"train_loss": 0.0007031845743767917, "global_step": 51852, "epoch": 435, "lr": 1.76110676193378e-05} +{"train_loss": 0.0015421457355841994, "global_step": 51853, "epoch": 435, "lr": 1.7609379812524168e-05} +{"train_loss": 0.0005948205944150686, "global_step": 51854, "epoch": 435, "lr": 1.760769206930607e-05} +{"train_loss": 0.0005804732209071517, "global_step": 51855, "epoch": 435, "lr": 1.7606004389686792e-05} +{"train_loss": 0.0011344278464093804, "global_step": 51856, "epoch": 435, "lr": 1.7604316773669683e-05} +{"train_loss": 0.0013481501955538988, "global_step": 51857, "epoch": 435, "lr": 1.7602629221258015e-05} +{"train_loss": 0.000621180864982307, "global_step": 51858, "epoch": 435, "lr": 1.7600941732455144e-05} +{"train_loss": 0.0007834192947484553, "global_step": 51859, "epoch": 435, "lr": 1.7599254307264363e-05} +{"train_loss": 0.0007016587187536061, "global_step": 51860, "epoch": 435, "lr": 1.759756694568897e-05} +{"train_loss": 0.0005262754275463521, "global_step": 51861, "epoch": 435, "lr": 1.7595879647732306e-05} +{"train_loss": 0.0008164736209437251, "global_step": 51862, "epoch": 435, "lr": 1.7594192413397652e-05} +{"train_loss": 0.001161483465693891, "global_step": 51863, "epoch": 435, "lr": 1.7592505242688355e-05} +{"train_loss": 0.0006584872608073056, "global_step": 51864, "epoch": 435, "lr": 1.759081813560772e-05} +{"train_loss": 0.0021914176177233458, "global_step": 51865, "epoch": 435, "lr": 1.7589131092159027e-05} +{"train_loss": 0.0013958272757008672, "global_step": 51866, "epoch": 435, "lr": 1.758744411234563e-05} +{"train_loss": 0.0004584466805681586, "global_step": 51867, "epoch": 435, "lr": 1.758575719617081e-05} +{"train_loss": 0.0014355604071170092, "global_step": 51868, "epoch": 435, "lr": 1.758407034363791e-05} +{"train_loss": 0.0015593102434650064, "global_step": 51869, "epoch": 435, "lr": 1.7582383554750205e-05} +{"train_loss": 0.0005836635245941579, "global_step": 51870, "epoch": 435, "lr": 1.758069682951104e-05} +{"train_loss": 0.0005452174809761345, "global_step": 51871, "epoch": 435, "lr": 1.7579010167923722e-05} +{"train_loss": 0.0004946239641867578, "global_step": 51872, "epoch": 435, "lr": 1.7577323569991528e-05} +{"train_loss": 0.0007254097145050764, "global_step": 51873, "epoch": 435, "lr": 1.7575637035717817e-05} +{"train_loss": 0.0006721740937791765, "global_step": 51874, "epoch": 435, "lr": 1.7573950565105862e-05} +{"train_loss": 0.0005572095979005098, "global_step": 51875, "epoch": 435, "lr": 1.757226415815899e-05} +{"train_loss": 0.001152949407696724, "global_step": 51876, "epoch": 435, "lr": 1.757057781488053e-05} +{"train_loss": 0.0005992157384753227, "global_step": 51877, "epoch": 435, "lr": 1.7568891535273763e-05} +{"train_loss": 0.0013272884534671903, "global_step": 51878, "epoch": 435, "lr": 1.7567205319342023e-05} +{"train_loss": 0.0012558511225506663, "global_step": 51879, "epoch": 435, "lr": 1.7565519167088594e-05} +{"train_loss": 0.0006031885277479887, "global_step": 51880, "epoch": 435, "lr": 1.7563833078516823e-05} +{"train_loss": 0.001353820669464767, "global_step": 51881, "epoch": 435, "lr": 1.7562147053629984e-05} +{"train_loss": 0.0007707321783527732, "global_step": 51882, "epoch": 435, "lr": 1.756046109243142e-05} +{"train_loss": 0.0008771563557313144, "global_step": 51883, "epoch": 435, "lr": 1.755877519492442e-05, "val_loss": 0.029605701565742493, "train_action_mse_error": 9.529989256407134e-06} +{"train_loss": 0.0013065460370853543, "global_step": 51884, "epoch": 436, "lr": 1.755708936111229e-05} +{"train_loss": 0.0009761154651641846, "global_step": 51885, "epoch": 436, "lr": 1.755540359099836e-05} +{"train_loss": 0.0005595794063992798, "global_step": 51886, "epoch": 436, "lr": 1.755371788458592e-05} +{"train_loss": 0.00102817767765373, "global_step": 51887, "epoch": 436, "lr": 1.7552032241878296e-05} +{"train_loss": 0.0005676235887221992, "global_step": 51888, "epoch": 436, "lr": 1.7550346662878775e-05} +{"train_loss": 0.0003347579622641206, "global_step": 51889, "epoch": 436, "lr": 1.75486611475907e-05} +{"train_loss": 0.0007811427349224687, "global_step": 51890, "epoch": 436, "lr": 1.7546975696017366e-05} +{"train_loss": 0.0013914465671405196, "global_step": 51891, "epoch": 436, "lr": 1.7545290308162054e-05} +{"train_loss": 0.0019968815613538027, "global_step": 51892, "epoch": 436, "lr": 1.7543604984028123e-05} +{"train_loss": 0.0004827083903364837, "global_step": 51893, "epoch": 436, "lr": 1.754191972361883e-05} +{"train_loss": 0.0011403470998629928, "global_step": 51894, "epoch": 436, "lr": 1.754023452693753e-05} +{"train_loss": 0.0017511555925011635, "global_step": 51895, "epoch": 436, "lr": 1.7538549393987515e-05} +{"train_loss": 0.0011069081956520677, "global_step": 51896, "epoch": 436, "lr": 1.7536864324772073e-05} +{"train_loss": 0.0008813930326141417, "global_step": 51897, "epoch": 436, "lr": 1.753517931929454e-05} +{"train_loss": 0.0007020612829364836, "global_step": 51898, "epoch": 436, "lr": 1.753349437755821e-05} +{"train_loss": 0.0023082853294909, "global_step": 51899, "epoch": 436, "lr": 1.7531809499566397e-05} +{"train_loss": 0.0011040548561140895, "global_step": 51900, "epoch": 436, "lr": 1.7530124685322397e-05} +{"train_loss": 0.0008801885996945202, "global_step": 51901, "epoch": 436, "lr": 1.752843993482955e-05} +{"train_loss": 0.0004877955070696771, "global_step": 51902, "epoch": 436, "lr": 1.7526755248091136e-05} +{"train_loss": 0.0009874620009213686, "global_step": 51903, "epoch": 436, "lr": 1.752507062511045e-05} +{"train_loss": 0.0014179362915456295, "global_step": 51904, "epoch": 436, "lr": 1.752338606589084e-05} +{"train_loss": 0.0008711150730960071, "global_step": 51905, "epoch": 436, "lr": 1.7521701570435576e-05} +{"train_loss": 0.0007350213127210736, "global_step": 51906, "epoch": 436, "lr": 1.7520017138747996e-05} +{"train_loss": 0.0012753125047311187, "global_step": 51907, "epoch": 436, "lr": 1.7518332770831375e-05} +{"train_loss": 0.0011671280954033136, "global_step": 51908, "epoch": 436, "lr": 1.7516648466689057e-05} +{"train_loss": 0.001116394530981779, "global_step": 51909, "epoch": 436, "lr": 1.751496422632431e-05} +{"train_loss": 0.0005911821499466896, "global_step": 51910, "epoch": 436, "lr": 1.751328004974046e-05} +{"train_loss": 0.000973884598352015, "global_step": 51911, "epoch": 436, "lr": 1.751159593694083e-05} +{"train_loss": 0.0007291196961887181, "global_step": 51912, "epoch": 436, "lr": 1.7509911887928694e-05} +{"train_loss": 0.0006339418468996882, "global_step": 51913, "epoch": 436, "lr": 1.7508227902707393e-05} +{"train_loss": 0.0009555472643114626, "global_step": 51914, "epoch": 436, "lr": 1.7506543981280216e-05} +{"train_loss": 0.0012604810763150454, "global_step": 51915, "epoch": 436, "lr": 1.7504860123650452e-05} +{"train_loss": 0.0005579101270996034, "global_step": 51916, "epoch": 436, "lr": 1.7503176329821436e-05} +{"train_loss": 0.000697451934684068, "global_step": 51917, "epoch": 436, "lr": 1.7501492599796447e-05} +{"train_loss": 0.0007833393174223602, "global_step": 51918, "epoch": 436, "lr": 1.7499808933578827e-05} +{"train_loss": 0.0009433056111447513, "global_step": 51919, "epoch": 436, "lr": 1.749812533117184e-05} +{"train_loss": 0.0008339331252500415, "global_step": 51920, "epoch": 436, "lr": 1.749644179257882e-05} +{"train_loss": 0.0013048147084191442, "global_step": 51921, "epoch": 436, "lr": 1.749475831780307e-05} +{"train_loss": 0.0008219309384003282, "global_step": 51922, "epoch": 436, "lr": 1.749307490684788e-05} +{"train_loss": 0.00043868296779692173, "global_step": 51923, "epoch": 436, "lr": 1.7491391559716575e-05} +{"train_loss": 0.0009074319968931377, "global_step": 51924, "epoch": 436, "lr": 1.7489708276412433e-05} +{"train_loss": 0.0009309885208494961, "global_step": 51925, "epoch": 436, "lr": 1.7488025056938796e-05} +{"train_loss": 0.0014848203863948584, "global_step": 51926, "epoch": 436, "lr": 1.748634190129894e-05} +{"train_loss": 0.0012889313511550426, "global_step": 51927, "epoch": 436, "lr": 1.7484658809496168e-05} +{"train_loss": 0.0008528780308552086, "global_step": 51928, "epoch": 436, "lr": 1.748297578153381e-05} +{"train_loss": 0.0004753650864586234, "global_step": 51929, "epoch": 436, "lr": 1.748129281741514e-05} +{"train_loss": 0.0012642403598874807, "global_step": 51930, "epoch": 436, "lr": 1.747960991714349e-05} +{"train_loss": 0.0005713885184377432, "global_step": 51931, "epoch": 436, "lr": 1.747792708072214e-05} +{"train_loss": 0.001313684624619782, "global_step": 51932, "epoch": 436, "lr": 1.7476244308154416e-05} +{"train_loss": 0.0011654861737042665, "global_step": 51933, "epoch": 436, "lr": 1.7474561599443618e-05} +{"train_loss": 0.0008664968190714717, "global_step": 51934, "epoch": 436, "lr": 1.7472878954593026e-05} +{"train_loss": 0.000992215471342206, "global_step": 51935, "epoch": 436, "lr": 1.7471196373605974e-05} +{"train_loss": 0.0010414572898298502, "global_step": 51936, "epoch": 436, "lr": 1.7469513856485735e-05} +{"train_loss": 0.0011698666494339705, "global_step": 51937, "epoch": 436, "lr": 1.7467831403235653e-05} +{"train_loss": 0.0015017763944342732, "global_step": 51938, "epoch": 436, "lr": 1.746614901385899e-05} +{"train_loss": 0.0007702968432568014, "global_step": 51939, "epoch": 436, "lr": 1.7464466688359084e-05} +{"train_loss": 0.0013627955922856927, "global_step": 51940, "epoch": 436, "lr": 1.7462784426739198e-05} +{"train_loss": 0.0014997596153989434, "global_step": 51941, "epoch": 436, "lr": 1.7461102229002686e-05} +{"train_loss": 0.00072727061342448, "global_step": 51942, "epoch": 436, "lr": 1.74594200951528e-05} +{"train_loss": 0.0009135630680248141, "global_step": 51943, "epoch": 436, "lr": 1.745773802519289e-05} +{"train_loss": 0.00045884266728535295, "global_step": 51944, "epoch": 436, "lr": 1.745605601912621e-05} +{"train_loss": 0.0006729325978085399, "global_step": 51945, "epoch": 436, "lr": 1.7454374076956103e-05} +{"train_loss": 0.0011661862954497337, "global_step": 51946, "epoch": 436, "lr": 1.7452692198685843e-05} +{"train_loss": 0.0012368819443508983, "global_step": 51947, "epoch": 436, "lr": 1.7451010384318767e-05} +{"train_loss": 0.0010365982307121158, "global_step": 51948, "epoch": 436, "lr": 1.744932863385813e-05} +{"train_loss": 0.0007612857152707875, "global_step": 51949, "epoch": 436, "lr": 1.7447646947307277e-05} +{"train_loss": 0.0012098444858565927, "global_step": 51950, "epoch": 436, "lr": 1.7445965324669477e-05} +{"train_loss": 0.00028331304201856256, "global_step": 51951, "epoch": 436, "lr": 1.744428376594806e-05} +{"train_loss": 0.0004742340533994138, "global_step": 51952, "epoch": 436, "lr": 1.7442602271146312e-05} +{"train_loss": 0.0006029789801687002, "global_step": 51953, "epoch": 436, "lr": 1.7440920840267528e-05} +{"train_loss": 0.000981746707111597, "global_step": 51954, "epoch": 436, "lr": 1.743923947331503e-05} +{"train_loss": 0.0012654474703595042, "global_step": 51955, "epoch": 436, "lr": 1.7437558170292083e-05} +{"train_loss": 0.0011647635838016868, "global_step": 51956, "epoch": 436, "lr": 1.743587693120204e-05} +{"train_loss": 0.0018441486172378063, "global_step": 51957, "epoch": 436, "lr": 1.743419575604815e-05} +{"train_loss": 0.0012490914668887854, "global_step": 51958, "epoch": 436, "lr": 1.7432514644833753e-05} +{"train_loss": 0.0004861271590925753, "global_step": 51959, "epoch": 436, "lr": 1.743083359756214e-05} +{"train_loss": 0.001230391557328403, "global_step": 51960, "epoch": 436, "lr": 1.742915261423658e-05} +{"train_loss": 0.0015456194523721933, "global_step": 51961, "epoch": 436, "lr": 1.7427471694860425e-05} +{"train_loss": 0.0010546178091317415, "global_step": 51962, "epoch": 436, "lr": 1.742579083943693e-05} +{"train_loss": 0.0012189006665721536, "global_step": 51963, "epoch": 436, "lr": 1.7424110047969433e-05} +{"train_loss": 0.0007870180415920913, "global_step": 51964, "epoch": 436, "lr": 1.7422429320461214e-05} +{"train_loss": 0.0006217783666215837, "global_step": 51965, "epoch": 436, "lr": 1.7420748656915554e-05} +{"train_loss": 0.001426399452611804, "global_step": 51966, "epoch": 436, "lr": 1.7419068057335795e-05} +{"train_loss": 0.0007225197041407228, "global_step": 51967, "epoch": 436, "lr": 1.74173875217252e-05} +{"train_loss": 0.0009705010452307761, "global_step": 51968, "epoch": 436, "lr": 1.7415707050087094e-05} +{"train_loss": 0.0010361780878156424, "global_step": 51969, "epoch": 436, "lr": 1.7414026642424753e-05} +{"train_loss": 0.0010103508830070496, "global_step": 51970, "epoch": 436, "lr": 1.7412346298741506e-05} +{"train_loss": 0.0007101647206582129, "global_step": 51971, "epoch": 436, "lr": 1.7410666019040633e-05} +{"train_loss": 0.000776593224145472, "global_step": 51972, "epoch": 436, "lr": 1.740898580332542e-05} +{"train_loss": 0.0009727223077788949, "global_step": 51973, "epoch": 436, "lr": 1.7407305651599186e-05} +{"train_loss": 0.001247361651621759, "global_step": 51974, "epoch": 436, "lr": 1.7405625563865242e-05} +{"train_loss": 0.000955378171056509, "global_step": 51975, "epoch": 436, "lr": 1.7403945540126847e-05} +{"train_loss": 0.0010593609185889363, "global_step": 51976, "epoch": 436, "lr": 1.7402265580387343e-05} +{"train_loss": 0.0006142521160654724, "global_step": 51977, "epoch": 436, "lr": 1.740058568464999e-05} +{"train_loss": 0.0013859468745067716, "global_step": 51978, "epoch": 436, "lr": 1.7398905852918123e-05} +{"train_loss": 0.0019029201939702034, "global_step": 51979, "epoch": 436, "lr": 1.7397226085195002e-05} +{"train_loss": 0.0009494480327703059, "global_step": 51980, "epoch": 436, "lr": 1.7395546381483963e-05} +{"train_loss": 0.0006910816882736981, "global_step": 51981, "epoch": 436, "lr": 1.7393866741788267e-05} +{"train_loss": 0.0009298931690864265, "global_step": 51982, "epoch": 436, "lr": 1.7392187166111252e-05} +{"train_loss": 0.000464228680357337, "global_step": 51983, "epoch": 436, "lr": 1.739050765445619e-05} +{"train_loss": 0.0008761436911299825, "global_step": 51984, "epoch": 436, "lr": 1.7388828206826362e-05} +{"train_loss": 0.0004663182480726391, "global_step": 51985, "epoch": 436, "lr": 1.7387148823225107e-05} +{"train_loss": 0.0014821748482063413, "global_step": 51986, "epoch": 436, "lr": 1.7385469503655684e-05} +{"train_loss": 0.0013829813105985522, "global_step": 51987, "epoch": 436, "lr": 1.7383790248121423e-05} +{"train_loss": 0.0013159119989722967, "global_step": 51988, "epoch": 436, "lr": 1.738211105662559e-05} +{"train_loss": 0.0007772815879434347, "global_step": 51989, "epoch": 436, "lr": 1.7380431929171513e-05} +{"train_loss": 0.0005872949259355664, "global_step": 51990, "epoch": 436, "lr": 1.737875286576247e-05} +{"train_loss": 0.000979823642410338, "global_step": 51991, "epoch": 436, "lr": 1.737707386640175e-05} +{"train_loss": 0.0003714430204126984, "global_step": 51992, "epoch": 436, "lr": 1.7375394931092676e-05} +{"train_loss": 0.0007252217037603259, "global_step": 51993, "epoch": 436, "lr": 1.7373716059838507e-05} +{"train_loss": 0.0006232256419025362, "global_step": 51994, "epoch": 436, "lr": 1.7372037252642583e-05} +{"train_loss": 0.0007826322107575834, "global_step": 51995, "epoch": 436, "lr": 1.7370358509508177e-05} +{"train_loss": 0.0006243301322683692, "global_step": 51996, "epoch": 436, "lr": 1.7368679830438567e-05} +{"train_loss": 0.0008914328645914793, "global_step": 51997, "epoch": 436, "lr": 1.7367001215437085e-05} +{"train_loss": 0.0006235265173017979, "global_step": 51998, "epoch": 436, "lr": 1.7365322664506995e-05} +{"train_loss": 0.0005273547139950097, "global_step": 51999, "epoch": 436, "lr": 1.7363644177651623e-05} +{"train_loss": 0.0007706716423854232, "global_step": 52000, "epoch": 436, "lr": 1.7361965754874233e-05} +{"train_loss": 0.0005185675108805299, "global_step": 52001, "epoch": 436, "lr": 1.7360287396178155e-05} +{"train_loss": 0.0009584813427665279, "global_step": 52002, "epoch": 436, "lr": 1.7358609101566658e-05, "val_loss": 0.02670084685087204} +{"train_loss": 0.0005865839193575084, "global_step": 52003, "epoch": 437, "lr": 1.7356930871043037e-05} +{"train_loss": 0.0008337036124430597, "global_step": 52004, "epoch": 437, "lr": 1.735525270461061e-05} +{"train_loss": 0.0009225677349604666, "global_step": 52005, "epoch": 437, "lr": 1.735357460227263e-05} +{"train_loss": 0.0010557303903624415, "global_step": 52006, "epoch": 437, "lr": 1.7351896564032448e-05} +{"train_loss": 0.0006664266693405807, "global_step": 52007, "epoch": 437, "lr": 1.735021858989331e-05} +{"train_loss": 0.0009139229659922421, "global_step": 52008, "epoch": 437, "lr": 1.734854067985852e-05} +{"train_loss": 0.0009666827390901744, "global_step": 52009, "epoch": 437, "lr": 1.734686283393141e-05} +{"train_loss": 0.0005618842551484704, "global_step": 52010, "epoch": 437, "lr": 1.7345185052115227e-05} +{"train_loss": 0.0010154149495065212, "global_step": 52011, "epoch": 437, "lr": 1.73435073344133e-05} +{"train_loss": 0.0004917328478768468, "global_step": 52012, "epoch": 437, "lr": 1.7341829680828888e-05} +{"train_loss": 0.0003315219364594668, "global_step": 52013, "epoch": 437, "lr": 1.7340152091365323e-05} +{"train_loss": 0.0011116386158391833, "global_step": 52014, "epoch": 437, "lr": 1.733847456602588e-05} +{"train_loss": 0.00096537807257846, "global_step": 52015, "epoch": 437, "lr": 1.733679710481384e-05} +{"train_loss": 0.0006301383837126195, "global_step": 52016, "epoch": 437, "lr": 1.7335119707732522e-05} +{"train_loss": 0.0003709843731485307, "global_step": 52017, "epoch": 437, "lr": 1.733344237478519e-05} +{"train_loss": 0.0009090276435017586, "global_step": 52018, "epoch": 437, "lr": 1.7331765105975172e-05} +{"train_loss": 0.0007599715027026832, "global_step": 52019, "epoch": 437, "lr": 1.7330087901305726e-05} +{"train_loss": 0.0007203216082416475, "global_step": 52020, "epoch": 437, "lr": 1.7328410760780178e-05} +{"train_loss": 0.0007274408126249909, "global_step": 52021, "epoch": 437, "lr": 1.7326733684401806e-05} +{"train_loss": 0.0006566172814927995, "global_step": 52022, "epoch": 437, "lr": 1.732505667217389e-05} +{"train_loss": 0.000654747593216598, "global_step": 52023, "epoch": 437, "lr": 1.7323379724099742e-05} +{"train_loss": 0.0010566767305135727, "global_step": 52024, "epoch": 437, "lr": 1.7321702840182635e-05} +{"train_loss": 0.000948118744418025, "global_step": 52025, "epoch": 437, "lr": 1.732002602042589e-05} +{"train_loss": 0.0006622551591135561, "global_step": 52026, "epoch": 437, "lr": 1.7318349264832766e-05} +{"train_loss": 0.0007802791078574955, "global_step": 52027, "epoch": 437, "lr": 1.731667257340659e-05} +{"train_loss": 0.0009658148046582937, "global_step": 52028, "epoch": 437, "lr": 1.731499594615063e-05} +{"train_loss": 0.0007919243071228266, "global_step": 52029, "epoch": 437, "lr": 1.731331938306817e-05} +{"train_loss": 0.0007613387424498796, "global_step": 52030, "epoch": 437, "lr": 1.7311642884162532e-05} +{"train_loss": 0.0006378591060638428, "global_step": 52031, "epoch": 437, "lr": 1.7309966449436975e-05} +{"train_loss": 0.0012373706558719277, "global_step": 52032, "epoch": 437, "lr": 1.7308290078894825e-05} +{"train_loss": 0.00038042411324568093, "global_step": 52033, "epoch": 437, "lr": 1.7306613772539354e-05} +{"train_loss": 0.0004752670938614756, "global_step": 52034, "epoch": 437, "lr": 1.7304937530373833e-05} +{"train_loss": 0.0007660361588932574, "global_step": 52035, "epoch": 437, "lr": 1.7303261352401594e-05} +{"train_loss": 0.0004209244216326624, "global_step": 52036, "epoch": 437, "lr": 1.7301585238625894e-05} +{"train_loss": 0.0005775128374807537, "global_step": 52037, "epoch": 437, "lr": 1.729990918905005e-05} +{"train_loss": 0.0002882404369302094, "global_step": 52038, "epoch": 437, "lr": 1.729823320367733e-05} +{"train_loss": 0.0003842909063678235, "global_step": 52039, "epoch": 437, "lr": 1.7296557282511043e-05} +{"train_loss": 0.0012872982770204544, "global_step": 52040, "epoch": 437, "lr": 1.7294881425554466e-05} +{"train_loss": 0.0007916831527836621, "global_step": 52041, "epoch": 437, "lr": 1.7293205632810904e-05} +{"train_loss": 0.0006782396812923253, "global_step": 52042, "epoch": 437, "lr": 1.7291529904283628e-05} +{"train_loss": 0.0009232402080669999, "global_step": 52043, "epoch": 437, "lr": 1.7289854239975933e-05} +{"train_loss": 0.0006354364450089633, "global_step": 52044, "epoch": 437, "lr": 1.7288178639891133e-05} +{"train_loss": 0.0006015298422425985, "global_step": 52045, "epoch": 437, "lr": 1.7286503104032498e-05} +{"train_loss": 0.0010429477551952004, "global_step": 52046, "epoch": 437, "lr": 1.7284827632403304e-05} +{"train_loss": 0.0009542531333863735, "global_step": 52047, "epoch": 437, "lr": 1.7283152225006875e-05} +{"train_loss": 0.0009940210729837418, "global_step": 52048, "epoch": 437, "lr": 1.7281476881846464e-05} +{"train_loss": 0.0008249005186371505, "global_step": 52049, "epoch": 437, "lr": 1.7279801602925393e-05} +{"train_loss": 0.0012940468732267618, "global_step": 52050, "epoch": 437, "lr": 1.7278126388246917e-05} +{"train_loss": 0.00041635165689513087, "global_step": 52051, "epoch": 437, "lr": 1.7276451237814362e-05} +{"train_loss": 0.0010035258019343019, "global_step": 52052, "epoch": 437, "lr": 1.7274776151631e-05} +{"train_loss": 0.0008011621539480984, "global_step": 52053, "epoch": 437, "lr": 1.7273101129700102e-05} +{"train_loss": 0.0011798676569014788, "global_step": 52054, "epoch": 437, "lr": 1.7271426172024992e-05} +{"train_loss": 0.0008867505821399391, "global_step": 52055, "epoch": 437, "lr": 1.7269751278608924e-05} +{"train_loss": 0.0014216786948964, "global_step": 52056, "epoch": 437, "lr": 1.7268076449455217e-05} +{"train_loss": 0.000679788994602859, "global_step": 52057, "epoch": 437, "lr": 1.726640168456713e-05} +{"train_loss": 0.0006661203224211931, "global_step": 52058, "epoch": 437, "lr": 1.7264726983947982e-05} +{"train_loss": 0.00040887927752919495, "global_step": 52059, "epoch": 437, "lr": 1.7263052347601044e-05} +{"train_loss": 0.0009974879212677479, "global_step": 52060, "epoch": 437, "lr": 1.7261377775529584e-05} +{"train_loss": 0.000785563956014812, "global_step": 52061, "epoch": 437, "lr": 1.725970326773694e-05} +{"train_loss": 0.0012815834488719702, "global_step": 52062, "epoch": 437, "lr": 1.7258028824226348e-05} +{"train_loss": 0.0005868503358215094, "global_step": 52063, "epoch": 437, "lr": 1.7256354445001133e-05} +{"train_loss": 0.001198050333186984, "global_step": 52064, "epoch": 437, "lr": 1.7254680130064567e-05} +{"train_loss": 0.0009438589331693947, "global_step": 52065, "epoch": 437, "lr": 1.7253005879419926e-05} +{"train_loss": 0.0007796852733008564, "global_step": 52066, "epoch": 437, "lr": 1.7251331693070523e-05} +{"train_loss": 0.0009320225799456239, "global_step": 52067, "epoch": 437, "lr": 1.724965757101962e-05} +{"train_loss": 0.00028935945010744035, "global_step": 52068, "epoch": 437, "lr": 1.7247983513270523e-05} +{"train_loss": 0.0005210909293964505, "global_step": 52069, "epoch": 437, "lr": 1.7246309519826497e-05} +{"train_loss": 0.0010081607615575194, "global_step": 52070, "epoch": 437, "lr": 1.7244635590690867e-05} +{"train_loss": 0.0006248379941098392, "global_step": 52071, "epoch": 437, "lr": 1.7242961725866874e-05} +{"train_loss": 0.0007114755571819842, "global_step": 52072, "epoch": 437, "lr": 1.724128792535784e-05} +{"train_loss": 0.0005569333443418145, "global_step": 52073, "epoch": 437, "lr": 1.7239614189167026e-05} +{"train_loss": 0.0005174268153496087, "global_step": 52074, "epoch": 437, "lr": 1.7237940517297745e-05} +{"train_loss": 0.0010080020874738693, "global_step": 52075, "epoch": 437, "lr": 1.723626690975325e-05} +{"train_loss": 0.0009937522700056434, "global_step": 52076, "epoch": 437, "lr": 1.7234593366536862e-05} +{"train_loss": 0.0005020730895921588, "global_step": 52077, "epoch": 437, "lr": 1.7232919887651834e-05} +{"train_loss": 0.0006555115687660873, "global_step": 52078, "epoch": 437, "lr": 1.7231246473101482e-05} +{"train_loss": 0.0010229898616671562, "global_step": 52079, "epoch": 437, "lr": 1.722957312288906e-05} +{"train_loss": 0.0007854222785681486, "global_step": 52080, "epoch": 437, "lr": 1.7227899837017886e-05} +{"train_loss": 0.0010428603272885084, "global_step": 52081, "epoch": 437, "lr": 1.7226226615491215e-05} +{"train_loss": 0.0005571218207478523, "global_step": 52082, "epoch": 437, "lr": 1.722455345831236e-05} +{"train_loss": 0.0006014917744323611, "global_step": 52083, "epoch": 437, "lr": 1.7222880365484596e-05} +{"train_loss": 0.0007248807814903557, "global_step": 52084, "epoch": 437, "lr": 1.7221207337011187e-05} +{"train_loss": 0.0005158357671461999, "global_step": 52085, "epoch": 437, "lr": 1.721953437289545e-05} +{"train_loss": 0.0011977648828178644, "global_step": 52086, "epoch": 437, "lr": 1.7217861473140644e-05} +{"train_loss": 0.0007556205964647233, "global_step": 52087, "epoch": 437, "lr": 1.7216188637750076e-05} +{"train_loss": 0.0004670846392400563, "global_step": 52088, "epoch": 437, "lr": 1.7214515866727006e-05} +{"train_loss": 0.0005946230376139283, "global_step": 52089, "epoch": 437, "lr": 1.721284316007475e-05} +{"train_loss": 0.000512703147251159, "global_step": 52090, "epoch": 437, "lr": 1.7211170517796567e-05} +{"train_loss": 0.0008188943029381335, "global_step": 52091, "epoch": 437, "lr": 1.7209497939895734e-05} +{"train_loss": 0.0012880756985396147, "global_step": 52092, "epoch": 437, "lr": 1.720782542637557e-05} +{"train_loss": 0.00042000567191280425, "global_step": 52093, "epoch": 437, "lr": 1.7206152977239316e-05} +{"train_loss": 0.0005456233629956841, "global_step": 52094, "epoch": 437, "lr": 1.720448059249029e-05} +{"train_loss": 0.0005029845051467419, "global_step": 52095, "epoch": 437, "lr": 1.720280827213175e-05} +{"train_loss": 0.0008922311244532466, "global_step": 52096, "epoch": 437, "lr": 1.720113601616701e-05} +{"train_loss": 0.0005202015745453537, "global_step": 52097, "epoch": 437, "lr": 1.7199463824599333e-05} +{"train_loss": 0.0007873952854424715, "global_step": 52098, "epoch": 437, "lr": 1.7197791697431992e-05} +{"train_loss": 0.0006727611180394888, "global_step": 52099, "epoch": 437, "lr": 1.7196119634668294e-05} +{"train_loss": 0.001138212624937296, "global_step": 52100, "epoch": 437, "lr": 1.71944476363115e-05} +{"train_loss": 0.0006215000757947564, "global_step": 52101, "epoch": 437, "lr": 1.7192775702364915e-05} +{"train_loss": 0.000504534924402833, "global_step": 52102, "epoch": 437, "lr": 1.7191103832831813e-05} +{"train_loss": 0.0008346864487975836, "global_step": 52103, "epoch": 437, "lr": 1.7189432027715453e-05} +{"train_loss": 0.0006803526193834841, "global_step": 52104, "epoch": 437, "lr": 1.7187760287019156e-05} +{"train_loss": 0.0005894684582017362, "global_step": 52105, "epoch": 437, "lr": 1.718608861074617e-05} +{"train_loss": 0.0004015005542896688, "global_step": 52106, "epoch": 437, "lr": 1.7184416998899793e-05} +{"train_loss": 0.0005736759630963206, "global_step": 52107, "epoch": 437, "lr": 1.718274545148333e-05} +{"train_loss": 0.00042757639312185347, "global_step": 52108, "epoch": 437, "lr": 1.7181073968500016e-05} +{"train_loss": 0.0007587891886942089, "global_step": 52109, "epoch": 437, "lr": 1.717940254995318e-05} +{"train_loss": 0.0005186872440390289, "global_step": 52110, "epoch": 437, "lr": 1.717773119584606e-05} +{"train_loss": 0.0007280076970346272, "global_step": 52111, "epoch": 437, "lr": 1.7176059906181974e-05} +{"train_loss": 0.0007221318082883954, "global_step": 52112, "epoch": 437, "lr": 1.7174388680964172e-05} +{"train_loss": 0.000641593593172729, "global_step": 52113, "epoch": 437, "lr": 1.7172717520195963e-05} +{"train_loss": 0.0006814595544710755, "global_step": 52114, "epoch": 437, "lr": 1.717104642388062e-05} +{"train_loss": 0.0006103747291490436, "global_step": 52115, "epoch": 437, "lr": 1.7169375392021407e-05} +{"train_loss": 0.0005465910071507096, "global_step": 52116, "epoch": 437, "lr": 1.7167704424621634e-05} +{"train_loss": 0.0006714810151606798, "global_step": 52117, "epoch": 437, "lr": 1.7166033521684544e-05} +{"train_loss": 0.0006473925895988941, "global_step": 52118, "epoch": 437, "lr": 1.716436268321346e-05} +{"train_loss": 0.000534460530616343, "global_step": 52119, "epoch": 437, "lr": 1.7162691909211626e-05} +{"train_loss": 0.0005173800745978951, "global_step": 52120, "epoch": 437, "lr": 1.7161021199682354e-05} +{"train_loss": 0.0007433798934524769, "global_step": 52121, "epoch": 437, "lr": 1.7159350554628907e-05, "val_loss": 0.018264953047037125} +{"train_loss": 0.0008316330495290458, "global_step": 52122, "epoch": 438, "lr": 1.7157679974054553e-05} +{"train_loss": 0.0006487589562311769, "global_step": 52123, "epoch": 438, "lr": 1.7156009457962598e-05} +{"train_loss": 0.00040634776814840734, "global_step": 52124, "epoch": 438, "lr": 1.7154339006356297e-05} +{"train_loss": 0.0009813811630010605, "global_step": 52125, "epoch": 438, "lr": 1.7152668619238956e-05} +{"train_loss": 0.0008146079489961267, "global_step": 52126, "epoch": 438, "lr": 1.7150998296613825e-05} +{"train_loss": 0.0005245466018095613, "global_step": 52127, "epoch": 438, "lr": 1.7149328038484212e-05} +{"train_loss": 0.0009258650825358927, "global_step": 52128, "epoch": 438, "lr": 1.7147657844853393e-05} +{"train_loss": 0.0005521815037354827, "global_step": 52129, "epoch": 438, "lr": 1.7145987715724615e-05} +{"train_loss": 0.0003816031967289746, "global_step": 52130, "epoch": 438, "lr": 1.71443176511012e-05} +{"train_loss": 0.00038336904253810644, "global_step": 52131, "epoch": 438, "lr": 1.714264765098639e-05} +{"train_loss": 0.0006240297807380557, "global_step": 52132, "epoch": 438, "lr": 1.7140977715383493e-05} +{"train_loss": 0.0005970148486085236, "global_step": 52133, "epoch": 438, "lr": 1.7139307844295784e-05} +{"train_loss": 0.0007038446492515504, "global_step": 52134, "epoch": 438, "lr": 1.7137638037726513e-05} +{"train_loss": 0.000495784217491746, "global_step": 52135, "epoch": 438, "lr": 1.713596829567899e-05} +{"train_loss": 0.000390781118767336, "global_step": 52136, "epoch": 438, "lr": 1.7134298618156474e-05} +{"train_loss": 0.0004294409300200641, "global_step": 52137, "epoch": 438, "lr": 1.7132629005162265e-05} +{"train_loss": 0.00047175181680358946, "global_step": 52138, "epoch": 438, "lr": 1.7130959456699606e-05} +{"train_loss": 0.0007566115236841142, "global_step": 52139, "epoch": 438, "lr": 1.7129289972771816e-05} +{"train_loss": 0.0004998165532015264, "global_step": 52140, "epoch": 438, "lr": 1.712762055338214e-05} +{"train_loss": 0.0006796386442147195, "global_step": 52141, "epoch": 438, "lr": 1.7125951198533868e-05} +{"train_loss": 0.0011243720073252916, "global_step": 52142, "epoch": 438, "lr": 1.7124281908230294e-05} +{"train_loss": 0.0005563717568293214, "global_step": 52143, "epoch": 438, "lr": 1.7122612682474663e-05} +{"train_loss": 0.0007658418617211282, "global_step": 52144, "epoch": 438, "lr": 1.7120943521270295e-05} +{"train_loss": 0.0006402942817658186, "global_step": 52145, "epoch": 438, "lr": 1.7119274424620414e-05} +{"train_loss": 0.0009018019773066044, "global_step": 52146, "epoch": 438, "lr": 1.7117605392528346e-05} +{"train_loss": 0.0003473363758530468, "global_step": 52147, "epoch": 438, "lr": 1.7115936424997346e-05} +{"train_loss": 0.0007018818287178874, "global_step": 52148, "epoch": 438, "lr": 1.7114267522030674e-05} +{"train_loss": 0.001064846059307456, "global_step": 52149, "epoch": 438, "lr": 1.7112598683631642e-05} +{"train_loss": 0.0007284568855538964, "global_step": 52150, "epoch": 438, "lr": 1.7110929909803498e-05} +{"train_loss": 0.0014243164332583547, "global_step": 52151, "epoch": 438, "lr": 1.7109261200549537e-05} +{"train_loss": 0.00112144835293293, "global_step": 52152, "epoch": 438, "lr": 1.7107592555873032e-05} +{"train_loss": 0.0004385763604659587, "global_step": 52153, "epoch": 438, "lr": 1.7105923975777237e-05} +{"train_loss": 0.0006993356510065496, "global_step": 52154, "epoch": 438, "lr": 1.7104255460265467e-05} +{"train_loss": 0.0006795037188567221, "global_step": 52155, "epoch": 438, "lr": 1.7102587009340953e-05} +{"train_loss": 0.0008449294255115092, "global_step": 52156, "epoch": 438, "lr": 1.7100918623007017e-05} +{"train_loss": 0.0007560153608210385, "global_step": 52157, "epoch": 438, "lr": 1.7099250301266896e-05} +{"train_loss": 0.000634950352832675, "global_step": 52158, "epoch": 438, "lr": 1.7097582044123896e-05} +{"train_loss": 0.00040327885653823614, "global_step": 52159, "epoch": 438, "lr": 1.709591385158128e-05} +{"train_loss": 0.0005263268249109387, "global_step": 52160, "epoch": 438, "lr": 1.7094245723642306e-05} +{"train_loss": 0.0005903357523493469, "global_step": 52161, "epoch": 438, "lr": 1.7092577660310277e-05} +{"train_loss": 0.0014981154818087816, "global_step": 52162, "epoch": 438, "lr": 1.7090909661588443e-05} +{"train_loss": 0.0013929040869697928, "global_step": 52163, "epoch": 438, "lr": 1.708924172748011e-05} +{"train_loss": 0.0005141710280440748, "global_step": 52164, "epoch": 438, "lr": 1.708757385798852e-05} +{"train_loss": 0.00040913463453762233, "global_step": 52165, "epoch": 438, "lr": 1.7085906053116974e-05} +{"train_loss": 0.0009891357040032744, "global_step": 52166, "epoch": 438, "lr": 1.7084238312868738e-05} +{"train_loss": 0.0008273391867987812, "global_step": 52167, "epoch": 438, "lr": 1.7082570637247063e-05} +{"train_loss": 0.00035294273402541876, "global_step": 52168, "epoch": 438, "lr": 1.708090302625527e-05} +{"train_loss": 0.0006929203518666327, "global_step": 52169, "epoch": 438, "lr": 1.7079235479896582e-05} +{"train_loss": 0.0002975512470584363, "global_step": 52170, "epoch": 438, "lr": 1.7077567998174315e-05} +{"train_loss": 0.0009790011681616306, "global_step": 52171, "epoch": 438, "lr": 1.7075900581091714e-05} +{"train_loss": 0.0007468298426829278, "global_step": 52172, "epoch": 438, "lr": 1.7074233228652075e-05} +{"train_loss": 0.0005988474003970623, "global_step": 52173, "epoch": 438, "lr": 1.707256594085865e-05} +{"train_loss": 0.0005020538810640574, "global_step": 52174, "epoch": 438, "lr": 1.707089871771474e-05} +{"train_loss": 0.0012221336364746094, "global_step": 52175, "epoch": 438, "lr": 1.7069231559223587e-05} +{"train_loss": 0.0007622587727382779, "global_step": 52176, "epoch": 438, "lr": 1.7067564465388474e-05} +{"train_loss": 0.0004155438218731433, "global_step": 52177, "epoch": 438, "lr": 1.7065897436212702e-05} +{"train_loss": 0.0013057744363322854, "global_step": 52178, "epoch": 438, "lr": 1.7064230471699516e-05} +{"train_loss": 0.001033396227285266, "global_step": 52179, "epoch": 438, "lr": 1.7062563571852187e-05} +{"train_loss": 0.00045559820136986673, "global_step": 52180, "epoch": 438, "lr": 1.7060896736674004e-05} +{"train_loss": 0.0006298834341578186, "global_step": 52181, "epoch": 438, "lr": 1.7059229966168216e-05} +{"train_loss": 0.0005878485972061753, "global_step": 52182, "epoch": 438, "lr": 1.7057563260338134e-05} +{"train_loss": 0.0010766286868602037, "global_step": 52183, "epoch": 438, "lr": 1.7055896619187e-05} +{"train_loss": 0.0007580002420581877, "global_step": 52184, "epoch": 438, "lr": 1.705423004271808e-05} +{"train_loss": 0.0005328709376044571, "global_step": 52185, "epoch": 438, "lr": 1.7052563530934673e-05} +{"train_loss": 0.0011274493299424648, "global_step": 52186, "epoch": 438, "lr": 1.7050897083840024e-05} +{"train_loss": 0.0007494425517506897, "global_step": 52187, "epoch": 438, "lr": 1.7049230701437435e-05} +{"train_loss": 0.0007676993263885379, "global_step": 52188, "epoch": 438, "lr": 1.7047564383730148e-05} +{"train_loss": 0.000516350963152945, "global_step": 52189, "epoch": 438, "lr": 1.7045898130721456e-05} +{"train_loss": 0.000943788792937994, "global_step": 52190, "epoch": 438, "lr": 1.704423194241463e-05} +{"train_loss": 0.0006394030060619116, "global_step": 52191, "epoch": 438, "lr": 1.7042565818812912e-05} +{"train_loss": 0.0008982667932286859, "global_step": 52192, "epoch": 438, "lr": 1.7040899759919615e-05} +{"train_loss": 0.0007215418154373765, "global_step": 52193, "epoch": 438, "lr": 1.7039233765737972e-05} +{"train_loss": 0.0008007065625861287, "global_step": 52194, "epoch": 438, "lr": 1.703756783627129e-05} +{"train_loss": 0.0009224776295013726, "global_step": 52195, "epoch": 438, "lr": 1.7035901971522806e-05} +{"train_loss": 0.0008009471348486841, "global_step": 52196, "epoch": 438, "lr": 1.7034236171495822e-05} +{"train_loss": 0.000753843632992357, "global_step": 52197, "epoch": 438, "lr": 1.703257043619359e-05} +{"train_loss": 0.0011780591448768973, "global_step": 52198, "epoch": 438, "lr": 1.703090476561937e-05} +{"train_loss": 0.0005159103311598301, "global_step": 52199, "epoch": 438, "lr": 1.7029239159776468e-05} +{"train_loss": 0.0010346043854951859, "global_step": 52200, "epoch": 438, "lr": 1.7027573618668107e-05} +{"train_loss": 0.00046266737626865506, "global_step": 52201, "epoch": 438, "lr": 1.7025908142297602e-05} +{"train_loss": 0.0007556175696663558, "global_step": 52202, "epoch": 438, "lr": 1.7024242730668195e-05} +{"train_loss": 0.000720247917342931, "global_step": 52203, "epoch": 438, "lr": 1.7022577383783174e-05} +{"train_loss": 0.0009500302840024233, "global_step": 52204, "epoch": 438, "lr": 1.702091210164578e-05} +{"train_loss": 0.0006427353946492076, "global_step": 52205, "epoch": 438, "lr": 1.701924688425932e-05} +{"train_loss": 0.0006351505871862173, "global_step": 52206, "epoch": 438, "lr": 1.701758173162703e-05} +{"train_loss": 0.0004404506762512028, "global_step": 52207, "epoch": 438, "lr": 1.7015916643752217e-05} +{"train_loss": 0.001232961774803698, "global_step": 52208, "epoch": 438, "lr": 1.7014251620638106e-05} +{"train_loss": 0.0006351897027343512, "global_step": 52209, "epoch": 438, "lr": 1.7012586662288e-05} +{"train_loss": 0.0009525849018245935, "global_step": 52210, "epoch": 438, "lr": 1.7010921768705145e-05} +{"train_loss": 0.0003797212557401508, "global_step": 52211, "epoch": 438, "lr": 1.7009256939892837e-05} +{"train_loss": 0.0004308513307478279, "global_step": 52212, "epoch": 438, "lr": 1.700759217585431e-05} +{"train_loss": 0.0010269569465890527, "global_step": 52213, "epoch": 438, "lr": 1.700592747659287e-05} +{"train_loss": 0.0007928505074232817, "global_step": 52214, "epoch": 438, "lr": 1.7004262842111745e-05} +{"train_loss": 0.0009008741471916437, "global_step": 52215, "epoch": 438, "lr": 1.7002598272414242e-05} +{"train_loss": 0.0005991020007058978, "global_step": 52216, "epoch": 438, "lr": 1.700093376750362e-05} +{"train_loss": 0.0006341547705233097, "global_step": 52217, "epoch": 438, "lr": 1.6999269327383117e-05} +{"train_loss": 0.0007607748848386109, "global_step": 52218, "epoch": 438, "lr": 1.699760495205604e-05} +{"train_loss": 0.00045620021410286427, "global_step": 52219, "epoch": 438, "lr": 1.699594064152562e-05} +{"train_loss": 0.0006275515188463032, "global_step": 52220, "epoch": 438, "lr": 1.6994276395795168e-05} +{"train_loss": 0.0005065671866759658, "global_step": 52221, "epoch": 438, "lr": 1.6992612214867925e-05} +{"train_loss": 0.0004504510434344411, "global_step": 52222, "epoch": 438, "lr": 1.6990948098747143e-05} +{"train_loss": 0.000903571373783052, "global_step": 52223, "epoch": 438, "lr": 1.698928404743613e-05} +{"train_loss": 0.0005962994182482362, "global_step": 52224, "epoch": 438, "lr": 1.698762006093811e-05} +{"train_loss": 0.0008935299701988697, "global_step": 52225, "epoch": 438, "lr": 1.6985956139256387e-05} +{"train_loss": 0.0005158123676665127, "global_step": 52226, "epoch": 438, "lr": 1.69842922823942e-05} +{"train_loss": 0.0008045447175391018, "global_step": 52227, "epoch": 438, "lr": 1.6982628490354836e-05} +{"train_loss": 0.0005317618488334119, "global_step": 52228, "epoch": 438, "lr": 1.698096476314156e-05} +{"train_loss": 0.0007444688235409558, "global_step": 52229, "epoch": 438, "lr": 1.6979301100757616e-05} +{"train_loss": 0.0005999000859446824, "global_step": 52230, "epoch": 438, "lr": 1.6977637503206302e-05} +{"train_loss": 0.0007264941232278943, "global_step": 52231, "epoch": 438, "lr": 1.697597397049085e-05} +{"train_loss": 0.000576846010517329, "global_step": 52232, "epoch": 438, "lr": 1.6974310502614567e-05} +{"train_loss": 0.000781908689532429, "global_step": 52233, "epoch": 438, "lr": 1.697264709958069e-05} +{"train_loss": 0.0006583916838280857, "global_step": 52234, "epoch": 438, "lr": 1.697098376139248e-05} +{"train_loss": 0.001508869114331901, "global_step": 52235, "epoch": 438, "lr": 1.696932048805323e-05} +{"train_loss": 0.000613653683103621, "global_step": 52236, "epoch": 438, "lr": 1.6967657279566175e-05} +{"train_loss": 0.000609667447861284, "global_step": 52237, "epoch": 438, "lr": 1.6965994135934592e-05} +{"train_loss": 0.0007318280404433608, "global_step": 52238, "epoch": 438, "lr": 1.696433105716177e-05} +{"train_loss": 0.0003202673397026956, "global_step": 52239, "epoch": 438, "lr": 1.696266804325094e-05} +{"train_loss": 0.0007227870022795876, "global_step": 52240, "epoch": 438, "lr": 1.6961005094205394e-05, "val_loss": 0.022197408601641655} +{"train_loss": 0.0005352764273993671, "global_step": 52241, "epoch": 439, "lr": 1.6959342210028372e-05} +{"train_loss": 0.0007501802174374461, "global_step": 52242, "epoch": 439, "lr": 1.6957679390723167e-05} +{"train_loss": 0.00040663493564352393, "global_step": 52243, "epoch": 439, "lr": 1.6956016636293016e-05} +{"train_loss": 0.000583754270337522, "global_step": 52244, "epoch": 439, "lr": 1.6954353946741203e-05} +{"train_loss": 0.0005575697869062424, "global_step": 52245, "epoch": 439, "lr": 1.695269132207098e-05} +{"train_loss": 0.0006287816213443875, "global_step": 52246, "epoch": 439, "lr": 1.6951028762285625e-05} +{"train_loss": 0.000996056362055242, "global_step": 52247, "epoch": 439, "lr": 1.6949366267388394e-05} +{"train_loss": 0.0005385911208577454, "global_step": 52248, "epoch": 439, "lr": 1.694770383738254e-05} +{"train_loss": 0.0014252548571676016, "global_step": 52249, "epoch": 439, "lr": 1.6946041472271357e-05} +{"train_loss": 0.0009917484130710363, "global_step": 52250, "epoch": 439, "lr": 1.6944379172058066e-05} +{"train_loss": 0.0003650682920124382, "global_step": 52251, "epoch": 439, "lr": 1.6942716936745978e-05} +{"train_loss": 0.00042610857053659856, "global_step": 52252, "epoch": 439, "lr": 1.694105476633833e-05} +{"train_loss": 0.0007621865370310843, "global_step": 52253, "epoch": 439, "lr": 1.6939392660838372e-05} +{"train_loss": 0.0007518726051785052, "global_step": 52254, "epoch": 439, "lr": 1.6937730620249404e-05} +{"train_loss": 0.0010621023830026388, "global_step": 52255, "epoch": 439, "lr": 1.6936068644574656e-05} +{"train_loss": 0.0005035339272581041, "global_step": 52256, "epoch": 439, "lr": 1.6934406733817414e-05} +{"train_loss": 0.00046111439587548375, "global_step": 52257, "epoch": 439, "lr": 1.6932744887980917e-05} +{"train_loss": 0.0006272950558923185, "global_step": 52258, "epoch": 439, "lr": 1.6931083107068463e-05} +{"train_loss": 0.0010127965360879898, "global_step": 52259, "epoch": 439, "lr": 1.692942139108329e-05} +{"train_loss": 0.0006255667540244758, "global_step": 52260, "epoch": 439, "lr": 1.6927759740028653e-05} +{"train_loss": 0.0007105639670044184, "global_step": 52261, "epoch": 439, "lr": 1.6926098153907836e-05} +{"train_loss": 0.0007922740187495947, "global_step": 52262, "epoch": 439, "lr": 1.6924436632724083e-05} +{"train_loss": 0.00044574064668267965, "global_step": 52263, "epoch": 439, "lr": 1.692277517648068e-05} +{"train_loss": 0.0009483431931585073, "global_step": 52264, "epoch": 439, "lr": 1.692111378518086e-05} +{"train_loss": 0.0007768992218188941, "global_step": 52265, "epoch": 439, "lr": 1.6919452458827907e-05} +{"train_loss": 0.0007610006141476333, "global_step": 52266, "epoch": 439, "lr": 1.6917791197425082e-05} +{"train_loss": 0.0004542878596112132, "global_step": 52267, "epoch": 439, "lr": 1.691613000097562e-05} +{"train_loss": 0.00041549321031197906, "global_step": 52268, "epoch": 439, "lr": 1.6914468869482818e-05} +{"train_loss": 0.0006950774695724249, "global_step": 52269, "epoch": 439, "lr": 1.6912807802949908e-05} +{"train_loss": 0.0003756895021069795, "global_step": 52270, "epoch": 439, "lr": 1.6911146801380183e-05} +{"train_loss": 0.0012159773614257574, "global_step": 52271, "epoch": 439, "lr": 1.6909485864776865e-05} +{"train_loss": 0.0009343950659967959, "global_step": 52272, "epoch": 439, "lr": 1.6907824993143257e-05} +{"train_loss": 0.00038650649366900325, "global_step": 52273, "epoch": 439, "lr": 1.6906164186482583e-05} +{"train_loss": 0.0012590200640261173, "global_step": 52274, "epoch": 439, "lr": 1.6904503444798114e-05} +{"train_loss": 0.0009032851667143404, "global_step": 52275, "epoch": 439, "lr": 1.6902842768093134e-05} +{"train_loss": 0.0005121731664985418, "global_step": 52276, "epoch": 439, "lr": 1.6901182156370875e-05} +{"train_loss": 0.0009118812158703804, "global_step": 52277, "epoch": 439, "lr": 1.6899521609634627e-05} +{"train_loss": 0.000496066699270159, "global_step": 52278, "epoch": 439, "lr": 1.6897861127887626e-05} +{"train_loss": 0.0004718610434792936, "global_step": 52279, "epoch": 439, "lr": 1.6896200711133127e-05} +{"train_loss": 0.0007782381726428866, "global_step": 52280, "epoch": 439, "lr": 1.689454035937441e-05} +{"train_loss": 0.0007135263294912875, "global_step": 52281, "epoch": 439, "lr": 1.689288007261472e-05} +{"train_loss": 0.0006158103351481259, "global_step": 52282, "epoch": 439, "lr": 1.6891219850857332e-05} +{"train_loss": 0.0007118026842363179, "global_step": 52283, "epoch": 439, "lr": 1.6889559694105485e-05} +{"train_loss": 0.001296854461543262, "global_step": 52284, "epoch": 439, "lr": 1.688789960236246e-05} +{"train_loss": 0.0005756912287324667, "global_step": 52285, "epoch": 439, "lr": 1.6886239575631513e-05} +{"train_loss": 0.0008236267021857202, "global_step": 52286, "epoch": 439, "lr": 1.6884579613915874e-05} +{"train_loss": 0.0006472266977652907, "global_step": 52287, "epoch": 439, "lr": 1.688291971721885e-05} +{"train_loss": 0.00035121786640957, "global_step": 52288, "epoch": 439, "lr": 1.6881259885543654e-05} +{"train_loss": 0.000872441625688225, "global_step": 52289, "epoch": 439, "lr": 1.687960011889358e-05} +{"train_loss": 0.0011817626655101776, "global_step": 52290, "epoch": 439, "lr": 1.6877940417271875e-05} +{"train_loss": 0.0006526823854073882, "global_step": 52291, "epoch": 439, "lr": 1.6876280780681782e-05} +{"train_loss": 0.0006034884136170149, "global_step": 52292, "epoch": 439, "lr": 1.6874621209126584e-05} +{"train_loss": 0.0005798631464131176, "global_step": 52293, "epoch": 439, "lr": 1.6872961702609512e-05} +{"train_loss": 0.0006652132724411786, "global_step": 52294, "epoch": 439, "lr": 1.6871302261133865e-05} +{"train_loss": 0.0006274831248447299, "global_step": 52295, "epoch": 439, "lr": 1.686964288470285e-05} +{"train_loss": 0.0011070071486756206, "global_step": 52296, "epoch": 439, "lr": 1.686798357331978e-05} +{"train_loss": 0.0008760071359574795, "global_step": 52297, "epoch": 439, "lr": 1.6866324326987874e-05} +{"train_loss": 0.00036319735227152705, "global_step": 52298, "epoch": 439, "lr": 1.686466514571039e-05} +{"train_loss": 0.0006375660304911435, "global_step": 52299, "epoch": 439, "lr": 1.6863006029490608e-05} +{"train_loss": 0.0006610530545003712, "global_step": 52300, "epoch": 439, "lr": 1.686134697833176e-05} +{"train_loss": 0.0008705995860509574, "global_step": 52301, "epoch": 439, "lr": 1.6859687992237134e-05} +{"train_loss": 0.0010470841079950333, "global_step": 52302, "epoch": 439, "lr": 1.685802907120995e-05} +{"train_loss": 0.0004062796360813081, "global_step": 52303, "epoch": 439, "lr": 1.6856370215253503e-05} +{"train_loss": 0.0007716607651673257, "global_step": 52304, "epoch": 439, "lr": 1.6854711424371018e-05} +{"train_loss": 0.00088074104860425, "global_step": 52305, "epoch": 439, "lr": 1.685305269856578e-05} +{"train_loss": 0.0008132739458233118, "global_step": 52306, "epoch": 439, "lr": 1.6851394037841017e-05} +{"train_loss": 0.0005199016886763275, "global_step": 52307, "epoch": 439, "lr": 1.6849735442200016e-05} +{"train_loss": 0.0009284898405894637, "global_step": 52308, "epoch": 439, "lr": 1.6848076911646e-05} +{"train_loss": 0.000318203994538635, "global_step": 52309, "epoch": 439, "lr": 1.684641844618226e-05} +{"train_loss": 0.000575756304897368, "global_step": 52310, "epoch": 439, "lr": 1.6844760045812023e-05} +{"train_loss": 0.0005683827330358326, "global_step": 52311, "epoch": 439, "lr": 1.6843101710538573e-05} +{"train_loss": 0.0009015368414111435, "global_step": 52312, "epoch": 439, "lr": 1.684144344036513e-05} +{"train_loss": 0.0010312760714441538, "global_step": 52313, "epoch": 439, "lr": 1.6839785235294992e-05} +{"train_loss": 0.0008543686126358807, "global_step": 52314, "epoch": 439, "lr": 1.6838127095331374e-05} +{"train_loss": 0.0003162587236147374, "global_step": 52315, "epoch": 439, "lr": 1.6836469020477563e-05} +{"train_loss": 0.00037014755071140826, "global_step": 52316, "epoch": 439, "lr": 1.6834811010736807e-05} +{"train_loss": 0.0007913518347777426, "global_step": 52317, "epoch": 439, "lr": 1.683315306611234e-05} +{"train_loss": 0.0005398770445026457, "global_step": 52318, "epoch": 439, "lr": 1.683149518660745e-05} +{"train_loss": 0.00042318980558775365, "global_step": 52319, "epoch": 439, "lr": 1.6829837372225353e-05} +{"train_loss": 0.0014303632779046893, "global_step": 52320, "epoch": 439, "lr": 1.6828179622969353e-05} +{"train_loss": 0.0004562872927635908, "global_step": 52321, "epoch": 439, "lr": 1.6826521938842672e-05} +{"train_loss": 0.0007436468731611967, "global_step": 52322, "epoch": 439, "lr": 1.6824864319848555e-05} +{"train_loss": 0.0006191655993461609, "global_step": 52323, "epoch": 439, "lr": 1.682320676599029e-05} +{"train_loss": 0.001267240266315639, "global_step": 52324, "epoch": 439, "lr": 1.6821549277271098e-05} +{"train_loss": 0.0010041272034868598, "global_step": 52325, "epoch": 439, "lr": 1.681989185369427e-05} +{"train_loss": 0.0006916967686265707, "global_step": 52326, "epoch": 439, "lr": 1.6818234495263018e-05} +{"train_loss": 0.0003612186701502651, "global_step": 52327, "epoch": 439, "lr": 1.6816577201980632e-05} +{"train_loss": 0.0012362555135041475, "global_step": 52328, "epoch": 439, "lr": 1.6814919973850357e-05} +{"train_loss": 0.0008539088303223252, "global_step": 52329, "epoch": 439, "lr": 1.6813262810875425e-05} +{"train_loss": 0.0006354939541779459, "global_step": 52330, "epoch": 439, "lr": 1.681160571305912e-05} +{"train_loss": 0.000386538595193997, "global_step": 52331, "epoch": 439, "lr": 1.6809948680404664e-05} +{"train_loss": 0.0007392676780000329, "global_step": 52332, "epoch": 439, "lr": 1.680829171291534e-05} +{"train_loss": 0.0012523360783234239, "global_step": 52333, "epoch": 439, "lr": 1.6806634810594385e-05} +{"train_loss": 0.0008755640010349452, "global_step": 52334, "epoch": 439, "lr": 1.6804977973445062e-05} +{"train_loss": 0.0004585717397276312, "global_step": 52335, "epoch": 439, "lr": 1.6803321201470608e-05} +{"train_loss": 0.00030732122831977904, "global_step": 52336, "epoch": 439, "lr": 1.6801664494674302e-05} +{"train_loss": 0.0006021155277267098, "global_step": 52337, "epoch": 439, "lr": 1.6800007853059364e-05} +{"train_loss": 0.0008132851216942072, "global_step": 52338, "epoch": 439, "lr": 1.6798351276629076e-05} +{"train_loss": 0.0005793593591079116, "global_step": 52339, "epoch": 439, "lr": 1.6796694765386667e-05} +{"train_loss": 0.0010977631900459528, "global_step": 52340, "epoch": 439, "lr": 1.6795038319335414e-05} +{"train_loss": 0.00039624617784284055, "global_step": 52341, "epoch": 439, "lr": 1.6793381938478542e-05} +{"train_loss": 0.0009392359061166644, "global_step": 52342, "epoch": 439, "lr": 1.679172562281933e-05} +{"train_loss": 0.0005784003878943622, "global_step": 52343, "epoch": 439, "lr": 1.6790069372361002e-05} +{"train_loss": 0.0006727631553076208, "global_step": 52344, "epoch": 439, "lr": 1.6788413187106843e-05} +{"train_loss": 0.0011627570493146777, "global_step": 52345, "epoch": 439, "lr": 1.6786757067060065e-05} +{"train_loss": 0.0006873810780234635, "global_step": 52346, "epoch": 439, "lr": 1.6785101012223965e-05} +{"train_loss": 0.0009562431951053441, "global_step": 52347, "epoch": 439, "lr": 1.678344502260177e-05} +{"train_loss": 0.0007213878561742604, "global_step": 52348, "epoch": 439, "lr": 1.6781789098196708e-05} +{"train_loss": 0.0008753665024414659, "global_step": 52349, "epoch": 439, "lr": 1.6780133239012073e-05} +{"train_loss": 0.0005598269635811448, "global_step": 52350, "epoch": 439, "lr": 1.677847744505109e-05} +{"train_loss": 0.0010005392832681537, "global_step": 52351, "epoch": 439, "lr": 1.6776821716317026e-05} +{"train_loss": 0.0008122495491988957, "global_step": 52352, "epoch": 439, "lr": 1.6775166052813123e-05} +{"train_loss": 0.0004445150261744857, "global_step": 52353, "epoch": 439, "lr": 1.6773510454542618e-05} +{"train_loss": 0.0007059540948830545, "global_step": 52354, "epoch": 439, "lr": 1.677185492150879e-05} +{"train_loss": 0.0005965739255771041, "global_step": 52355, "epoch": 439, "lr": 1.6770199453714856e-05} +{"train_loss": 0.0004724652098957449, "global_step": 52356, "epoch": 439, "lr": 1.6768544051164108e-05} +{"train_loss": 0.0005710315308533609, "global_step": 52357, "epoch": 439, "lr": 1.676688871385975e-05} +{"train_loss": 0.001059429137967527, "global_step": 52358, "epoch": 439, "lr": 1.6765233441805077e-05} +{"train_loss": 0.000721726448181234, "global_step": 52359, "epoch": 439, "lr": 1.6763578235003318e-05, "val_loss": 0.019183382391929626} +{"train_loss": 0.0013569575967267156, "global_step": 52360, "epoch": 440, "lr": 1.6761923093457705e-05} +{"train_loss": 0.0005923318094573915, "global_step": 52361, "epoch": 440, "lr": 1.676026801717152e-05} +{"train_loss": 0.0006095569115132093, "global_step": 52362, "epoch": 440, "lr": 1.6758613006147983e-05} +{"train_loss": 0.0007572938338853419, "global_step": 52363, "epoch": 440, "lr": 1.6756958060390377e-05} +{"train_loss": 0.0006038937717676163, "global_step": 52364, "epoch": 440, "lr": 1.675530317990191e-05} +{"train_loss": 0.0007356154383160174, "global_step": 52365, "epoch": 440, "lr": 1.6753648364685874e-05} +{"train_loss": 0.0005363572854548693, "global_step": 52366, "epoch": 440, "lr": 1.6751993614745494e-05} +{"train_loss": 0.0007334329420700669, "global_step": 52367, "epoch": 440, "lr": 1.6750338930084008e-05} +{"train_loss": 0.0008944018045440316, "global_step": 52368, "epoch": 440, "lr": 1.67486843107047e-05} +{"train_loss": 0.0005912911146879196, "global_step": 52369, "epoch": 440, "lr": 1.6747029756610778e-05} +{"train_loss": 0.0006169341504573822, "global_step": 52370, "epoch": 440, "lr": 1.6745375267805508e-05} +{"train_loss": 0.0005848060245625675, "global_step": 52371, "epoch": 440, "lr": 1.674372084429216e-05} +{"train_loss": 0.0016301494324579835, "global_step": 52372, "epoch": 440, "lr": 1.6742066486073943e-05} +{"train_loss": 0.0005403972463682294, "global_step": 52373, "epoch": 440, "lr": 1.6740412193154147e-05} +{"train_loss": 0.0004769825900439173, "global_step": 52374, "epoch": 440, "lr": 1.673875796553598e-05} +{"train_loss": 0.0012412613723427057, "global_step": 52375, "epoch": 440, "lr": 1.6737103803222727e-05} +{"train_loss": 0.0006962938932701945, "global_step": 52376, "epoch": 440, "lr": 1.6735449706217592e-05} +{"train_loss": 0.0013634570641443133, "global_step": 52377, "epoch": 440, "lr": 1.673379567452387e-05} +{"train_loss": 0.0009047037456184626, "global_step": 52378, "epoch": 440, "lr": 1.673214170814479e-05} +{"train_loss": 0.0007854505092836916, "global_step": 52379, "epoch": 440, "lr": 1.6730487807083576e-05} +{"train_loss": 0.0011580794816836715, "global_step": 52380, "epoch": 440, "lr": 1.672883397134351e-05} +{"train_loss": 0.0006759047391824424, "global_step": 52381, "epoch": 440, "lr": 1.6727180200927813e-05} +{"train_loss": 0.0003621565119829029, "global_step": 52382, "epoch": 440, "lr": 1.672552649583975e-05} +{"train_loss": 0.00045776437036693096, "global_step": 52383, "epoch": 440, "lr": 1.672387285608255e-05} +{"train_loss": 0.00024464973830617964, "global_step": 52384, "epoch": 440, "lr": 1.6722219281659484e-05} +{"train_loss": 0.0008709172834642231, "global_step": 52385, "epoch": 440, "lr": 1.6720565772573792e-05} +{"train_loss": 0.0005857654032297432, "global_step": 52386, "epoch": 440, "lr": 1.671891232882869e-05} +{"train_loss": 0.0006691839662380517, "global_step": 52387, "epoch": 440, "lr": 1.6717258950427473e-05} +{"train_loss": 0.0010364297777414322, "global_step": 52388, "epoch": 440, "lr": 1.671560563737334e-05} +{"train_loss": 0.0006535490392707288, "global_step": 52389, "epoch": 440, "lr": 1.6713952389669574e-05} +{"train_loss": 0.0002995128743350506, "global_step": 52390, "epoch": 440, "lr": 1.6712299207319408e-05} +{"train_loss": 0.0011481441324576735, "global_step": 52391, "epoch": 440, "lr": 1.671064609032607e-05} +{"train_loss": 0.001140507636591792, "global_step": 52392, "epoch": 440, "lr": 1.6708993038692837e-05} +{"train_loss": 0.0008620753069408238, "global_step": 52393, "epoch": 440, "lr": 1.6707340052422925e-05} +{"train_loss": 0.0004708393244072795, "global_step": 52394, "epoch": 440, "lr": 1.6705687131519615e-05} +{"train_loss": 0.0013151556486263871, "global_step": 52395, "epoch": 440, "lr": 1.6704034275986107e-05} +{"train_loss": 0.0007189952884800732, "global_step": 52396, "epoch": 440, "lr": 1.670238148582569e-05} +{"train_loss": 0.0013758620480075479, "global_step": 52397, "epoch": 440, "lr": 1.670072876104159e-05} +{"train_loss": 0.00040412350790575147, "global_step": 52398, "epoch": 440, "lr": 1.669907610163704e-05} +{"train_loss": 0.000579402141738683, "global_step": 52399, "epoch": 440, "lr": 1.6697423507615305e-05} +{"train_loss": 0.001276153838261962, "global_step": 52400, "epoch": 440, "lr": 1.6695770978979608e-05} +{"train_loss": 0.0007950977887958288, "global_step": 52401, "epoch": 440, "lr": 1.669411851573322e-05} +{"train_loss": 0.000835651415400207, "global_step": 52402, "epoch": 440, "lr": 1.6692466117879363e-05} +{"train_loss": 0.0007125717820599675, "global_step": 52403, "epoch": 440, "lr": 1.66908137854213e-05} +{"train_loss": 0.0005361530347727239, "global_step": 52404, "epoch": 440, "lr": 1.6689161518362252e-05} +{"train_loss": 0.0005936439265497029, "global_step": 52405, "epoch": 440, "lr": 1.6687509316705474e-05} +{"train_loss": 0.000699688564054668, "global_step": 52406, "epoch": 440, "lr": 1.6685857180454235e-05} +{"train_loss": 0.0006434021051973104, "global_step": 52407, "epoch": 440, "lr": 1.6684205109611734e-05} +{"train_loss": 0.0008269769023172557, "global_step": 52408, "epoch": 440, "lr": 1.6682553104181254e-05} +{"train_loss": 0.0010787942446768284, "global_step": 52409, "epoch": 440, "lr": 1.6680901164166025e-05} +{"train_loss": 0.0008132428047247231, "global_step": 52410, "epoch": 440, "lr": 1.6679249289569267e-05} +{"train_loss": 0.000698255083989352, "global_step": 52411, "epoch": 440, "lr": 1.6677597480394258e-05} +{"train_loss": 0.0007177485385909677, "global_step": 52412, "epoch": 440, "lr": 1.6675945736644216e-05} +{"train_loss": 0.000770923332311213, "global_step": 52413, "epoch": 440, "lr": 1.667429405832241e-05} +{"train_loss": 0.0006581502384506166, "global_step": 52414, "epoch": 440, "lr": 1.6672642445432047e-05} +{"train_loss": 0.0005858847871422768, "global_step": 52415, "epoch": 440, "lr": 1.667099089797641e-05} +{"train_loss": 0.0007542265811935067, "global_step": 52416, "epoch": 440, "lr": 1.6669339415958717e-05} +{"train_loss": 0.0015791093464940786, "global_step": 52417, "epoch": 440, "lr": 1.6667687999382205e-05} +{"train_loss": 0.0010881214402616024, "global_step": 52418, "epoch": 440, "lr": 1.666603664825013e-05} +{"train_loss": 0.001039433293044567, "global_step": 52419, "epoch": 440, "lr": 1.6664385362565733e-05} +{"train_loss": 0.0005054592038504779, "global_step": 52420, "epoch": 440, "lr": 1.666273414233226e-05} +{"train_loss": 0.0006968045490793884, "global_step": 52421, "epoch": 440, "lr": 1.6661082987552945e-05} +{"train_loss": 0.000709863263182342, "global_step": 52422, "epoch": 440, "lr": 1.665943189823102e-05} +{"train_loss": 0.0009304708801209927, "global_step": 52423, "epoch": 440, "lr": 1.6657780874369753e-05} +{"train_loss": 0.0003724828129634261, "global_step": 52424, "epoch": 440, "lr": 1.6656129915972356e-05} +{"train_loss": 0.00041384424548596144, "global_step": 52425, "epoch": 440, "lr": 1.6654479023042102e-05} +{"train_loss": 0.0007791430107317865, "global_step": 52426, "epoch": 440, "lr": 1.66528281955822e-05} +{"train_loss": 0.0006849682540632784, "global_step": 52427, "epoch": 440, "lr": 1.6651177433595923e-05} +{"train_loss": 0.0009730655583553016, "global_step": 52428, "epoch": 440, "lr": 1.6649526737086497e-05} +{"train_loss": 0.000565843190997839, "global_step": 52429, "epoch": 440, "lr": 1.6647876106057142e-05} +{"train_loss": 0.0007539365906268358, "global_step": 52430, "epoch": 440, "lr": 1.664622554051114e-05} +{"train_loss": 0.0014800246572121978, "global_step": 52431, "epoch": 440, "lr": 1.6644575040451693e-05} +{"train_loss": 0.000953500799369067, "global_step": 52432, "epoch": 440, "lr": 1.664292460588207e-05} +{"train_loss": 0.0008954211953096092, "global_step": 52433, "epoch": 440, "lr": 1.6641274236805494e-05} +{"train_loss": 0.000705692102201283, "global_step": 52434, "epoch": 440, "lr": 1.6639623933225223e-05} +{"train_loss": 0.0006000477005727589, "global_step": 52435, "epoch": 440, "lr": 1.663797369514447e-05} +{"train_loss": 0.0006882312591187656, "global_step": 52436, "epoch": 440, "lr": 1.663632352256651e-05} +{"train_loss": 0.0010470662964507937, "global_step": 52437, "epoch": 440, "lr": 1.663467341549455e-05} +{"train_loss": 0.0008238724549300969, "global_step": 52438, "epoch": 440, "lr": 1.6633023373931854e-05} +{"train_loss": 0.00047915420145727694, "global_step": 52439, "epoch": 440, "lr": 1.6631373397881646e-05} +{"train_loss": 0.0012369403848424554, "global_step": 52440, "epoch": 440, "lr": 1.6629723487347176e-05} +{"train_loss": 0.0012047110358253121, "global_step": 52441, "epoch": 440, "lr": 1.662807364233167e-05} +{"train_loss": 0.0005853833863511682, "global_step": 52442, "epoch": 440, "lr": 1.6626423862838392e-05} +{"train_loss": 0.0011739993933588266, "global_step": 52443, "epoch": 440, "lr": 1.662477414887055e-05} +{"train_loss": 0.0006286366260610521, "global_step": 52444, "epoch": 440, "lr": 1.6623124500431408e-05} +{"train_loss": 0.000594054174143821, "global_step": 52445, "epoch": 440, "lr": 1.6621474917524183e-05} +{"train_loss": 0.0009950901148840785, "global_step": 52446, "epoch": 440, "lr": 1.661982540015214e-05} +{"train_loss": 0.000913657306227833, "global_step": 52447, "epoch": 440, "lr": 1.661817594831851e-05} +{"train_loss": 0.0009042115416377783, "global_step": 52448, "epoch": 440, "lr": 1.6616526562026503e-05} +{"train_loss": 0.0004887067480012774, "global_step": 52449, "epoch": 440, "lr": 1.6614877241279398e-05} +{"train_loss": 0.0011812837328761816, "global_step": 52450, "epoch": 440, "lr": 1.6613227986080398e-05} +{"train_loss": 0.0007673578220419586, "global_step": 52451, "epoch": 440, "lr": 1.6611578796432776e-05} +{"train_loss": 0.0007077584741637111, "global_step": 52452, "epoch": 440, "lr": 1.660992967233973e-05} +{"train_loss": 0.0010082563385367393, "global_step": 52453, "epoch": 440, "lr": 1.6608280613804543e-05} +{"train_loss": 0.0012831388739868999, "global_step": 52454, "epoch": 440, "lr": 1.6606631620830426e-05} +{"train_loss": 0.0003683858667500317, "global_step": 52455, "epoch": 440, "lr": 1.6604982693420607e-05} +{"train_loss": 0.0008163590100593865, "global_step": 52456, "epoch": 440, "lr": 1.6603333831578348e-05} +{"train_loss": 0.0015276054618880153, "global_step": 52457, "epoch": 440, "lr": 1.6601685035306864e-05} +{"train_loss": 0.0007627348531968892, "global_step": 52458, "epoch": 440, "lr": 1.6600036304609418e-05} +{"train_loss": 0.0007066216203384101, "global_step": 52459, "epoch": 440, "lr": 1.6598387639489233e-05} +{"train_loss": 0.0006858009728603065, "global_step": 52460, "epoch": 440, "lr": 1.6596739039949526e-05} +{"train_loss": 0.0008143311715684831, "global_step": 52461, "epoch": 440, "lr": 1.659509050599357e-05} +{"train_loss": 0.001682817004621029, "global_step": 52462, "epoch": 440, "lr": 1.6593442037624574e-05} +{"train_loss": 0.0003987097297795117, "global_step": 52463, "epoch": 440, "lr": 1.6591793634845797e-05} +{"train_loss": 0.0004960006335750222, "global_step": 52464, "epoch": 440, "lr": 1.6590145297660448e-05} +{"train_loss": 0.0005642584292218089, "global_step": 52465, "epoch": 440, "lr": 1.6588497026071797e-05} +{"train_loss": 0.0010914584854617715, "global_step": 52466, "epoch": 440, "lr": 1.6586848820083062e-05} +{"train_loss": 0.0006313461344689131, "global_step": 52467, "epoch": 440, "lr": 1.6585200679697467e-05} +{"train_loss": 0.0011977367103099823, "global_step": 52468, "epoch": 440, "lr": 1.6583552604918253e-05} +{"train_loss": 0.0009486828930675983, "global_step": 52469, "epoch": 440, "lr": 1.6581904595748683e-05} +{"train_loss": 0.0010345991468057036, "global_step": 52470, "epoch": 440, "lr": 1.658025665219196e-05} +{"train_loss": 0.0005451598553918302, "global_step": 52471, "epoch": 440, "lr": 1.6578608774251346e-05} +{"train_loss": 0.0012763937702402472, "global_step": 52472, "epoch": 440, "lr": 1.657696096193005e-05} +{"train_loss": 0.0007824117201380432, "global_step": 52473, "epoch": 440, "lr": 1.6575313215231332e-05} +{"train_loss": 0.0010758530115708709, "global_step": 52474, "epoch": 440, "lr": 1.65736655341584e-05} +{"train_loss": 0.0004052701697219163, "global_step": 52475, "epoch": 440, "lr": 1.6572017918714523e-05} +{"train_loss": 0.0009413264924660325, "global_step": 52476, "epoch": 440, "lr": 1.6570370368902904e-05} +{"train_loss": 0.001327354577369988, "global_step": 52477, "epoch": 440, "lr": 1.65687228847268e-05} +{"train_loss": 0.0008194663974225615, "global_step": 52478, "epoch": 440, "lr": 1.6567075466189446e-05, "val_loss": 0.028389085084199905, "train_action_mse_error": 1.091030026145745e-05} +{"train_loss": 0.0005477031227201223, "global_step": 52479, "epoch": 441, "lr": 1.6565428113294047e-05} +{"train_loss": 0.0009777541272342205, "global_step": 52480, "epoch": 441, "lr": 1.656378082604387e-05} +{"train_loss": 0.0010638399980962276, "global_step": 52481, "epoch": 441, "lr": 1.6562133604442127e-05} +{"train_loss": 0.0006441228906624019, "global_step": 52482, "epoch": 441, "lr": 1.656048644849208e-05} +{"train_loss": 0.0014118795515969396, "global_step": 52483, "epoch": 441, "lr": 1.655883935819692e-05} +{"train_loss": 0.0006717385840602219, "global_step": 52484, "epoch": 441, "lr": 1.6557192333559927e-05} +{"train_loss": 0.0010180649114772677, "global_step": 52485, "epoch": 441, "lr": 1.655554537458432e-05} +{"train_loss": 0.0015277931233868003, "global_step": 52486, "epoch": 441, "lr": 1.6553898481273304e-05} +{"train_loss": 0.000996043556369841, "global_step": 52487, "epoch": 441, "lr": 1.655225165363015e-05} +{"train_loss": 0.0012139736209064722, "global_step": 52488, "epoch": 441, "lr": 1.6550604891658066e-05} +{"train_loss": 0.001127357012592256, "global_step": 52489, "epoch": 441, "lr": 1.6548958195360308e-05} +{"train_loss": 0.0007676499080844223, "global_step": 52490, "epoch": 441, "lr": 1.6547311564740102e-05} +{"train_loss": 0.0005030137253925204, "global_step": 52491, "epoch": 441, "lr": 1.6545664999800653e-05} +{"train_loss": 0.0007368395454250276, "global_step": 52492, "epoch": 441, "lr": 1.654401850054524e-05} +{"train_loss": 0.0009050483931787312, "global_step": 52493, "epoch": 441, "lr": 1.6542372066977046e-05} +{"train_loss": 0.0009337046649307013, "global_step": 52494, "epoch": 441, "lr": 1.654072569909936e-05} +{"train_loss": 0.0005898908129893243, "global_step": 52495, "epoch": 441, "lr": 1.6539079396915358e-05} +{"train_loss": 0.0005659305024892092, "global_step": 52496, "epoch": 441, "lr": 1.6537433160428317e-05} +{"train_loss": 0.001044481061398983, "global_step": 52497, "epoch": 441, "lr": 1.653578698964145e-05} +{"train_loss": 0.0006801241543143988, "global_step": 52498, "epoch": 441, "lr": 1.6534140884557975e-05} +{"train_loss": 0.0004679397970903665, "global_step": 52499, "epoch": 441, "lr": 1.6532494845181155e-05} +{"train_loss": 0.0006106994114816189, "global_step": 52500, "epoch": 441, "lr": 1.6530848871514194e-05} +{"train_loss": 0.0011730588739737868, "global_step": 52501, "epoch": 441, "lr": 1.6529202963560347e-05} +{"train_loss": 0.0008760893251746893, "global_step": 52502, "epoch": 441, "lr": 1.6527557121322816e-05} +{"train_loss": 0.0005226326175034046, "global_step": 52503, "epoch": 441, "lr": 1.6525911344804857e-05} +{"train_loss": 0.0005293766735121608, "global_step": 52504, "epoch": 441, "lr": 1.6524265634009705e-05} +{"train_loss": 0.0005307569517754018, "global_step": 52505, "epoch": 441, "lr": 1.652261998894057e-05} +{"train_loss": 0.0008634149562567472, "global_step": 52506, "epoch": 441, "lr": 1.652097440960071e-05} +{"train_loss": 0.0007852234994061291, "global_step": 52507, "epoch": 441, "lr": 1.6519328895993318e-05} +{"train_loss": 0.00046971309348009527, "global_step": 52508, "epoch": 441, "lr": 1.651768344812167e-05} +{"train_loss": 0.000735555135179311, "global_step": 52509, "epoch": 441, "lr": 1.651603806598897e-05} +{"train_loss": 0.001222781604155898, "global_step": 52510, "epoch": 441, "lr": 1.6514392749598433e-05} +{"train_loss": 0.0007472244906239212, "global_step": 52511, "epoch": 441, "lr": 1.651274749895333e-05} +{"train_loss": 0.0006457214476540685, "global_step": 52512, "epoch": 441, "lr": 1.6511102314056853e-05} +{"train_loss": 0.0010540522634983063, "global_step": 52513, "epoch": 441, "lr": 1.650945719491226e-05} +{"train_loss": 0.0008861160604283214, "global_step": 52514, "epoch": 441, "lr": 1.650781214152276e-05} +{"train_loss": 0.0008332296856679022, "global_step": 52515, "epoch": 441, "lr": 1.6506167153891607e-05} +{"train_loss": 0.0008954929653555155, "global_step": 52516, "epoch": 441, "lr": 1.6504522232022014e-05} +{"train_loss": 0.0007481413776986301, "global_step": 52517, "epoch": 441, "lr": 1.6502877375917198e-05} +{"train_loss": 0.0007104185642674565, "global_step": 52518, "epoch": 441, "lr": 1.6501232585580417e-05} +{"train_loss": 0.0006247890996746719, "global_step": 52519, "epoch": 441, "lr": 1.6499587861014874e-05} +{"train_loss": 0.0007192040211521089, "global_step": 52520, "epoch": 441, "lr": 1.6497943202223832e-05} +{"train_loss": 0.0005073723732493818, "global_step": 52521, "epoch": 441, "lr": 1.6496298609210474e-05} +{"train_loss": 0.00035532310721464455, "global_step": 52522, "epoch": 441, "lr": 1.649465408197808e-05} +{"train_loss": 0.000989022315479815, "global_step": 52523, "epoch": 441, "lr": 1.6493009620529846e-05} +{"train_loss": 0.0006901415181346238, "global_step": 52524, "epoch": 441, "lr": 1.6491365224868993e-05} +{"train_loss": 0.0008538622641935945, "global_step": 52525, "epoch": 441, "lr": 1.6489720894998784e-05} +{"train_loss": 0.0004972147289663553, "global_step": 52526, "epoch": 441, "lr": 1.648807663092241e-05} +{"train_loss": 0.000473374268040061, "global_step": 52527, "epoch": 441, "lr": 1.6486432432643134e-05} +{"train_loss": 0.000744709512218833, "global_step": 52528, "epoch": 441, "lr": 1.6484788300164166e-05} +{"train_loss": 0.0008541453280486166, "global_step": 52529, "epoch": 441, "lr": 1.6483144233488716e-05} +{"train_loss": 0.0005010296008549631, "global_step": 52530, "epoch": 441, "lr": 1.6481500232620057e-05} +{"train_loss": 0.0003613389271777123, "global_step": 52531, "epoch": 441, "lr": 1.6479856297561367e-05} +{"train_loss": 0.0006345766596496105, "global_step": 52532, "epoch": 441, "lr": 1.647821242831592e-05} +{"train_loss": 0.0005518467514775693, "global_step": 52533, "epoch": 441, "lr": 1.64765686248869e-05} +{"train_loss": 0.00055643729865551, "global_step": 52534, "epoch": 441, "lr": 1.6474924887277576e-05} +{"train_loss": 0.0005320145282894373, "global_step": 52535, "epoch": 441, "lr": 1.6473281215491136e-05} +{"train_loss": 0.0011043695267289877, "global_step": 52536, "epoch": 441, "lr": 1.6471637609530843e-05} +{"train_loss": 0.00044885854003950953, "global_step": 52537, "epoch": 441, "lr": 1.6469994069399896e-05} +{"train_loss": 0.0004975609481334686, "global_step": 52538, "epoch": 441, "lr": 1.646835059510153e-05} +{"train_loss": 0.0006936397985555232, "global_step": 52539, "epoch": 441, "lr": 1.6466707186638992e-05} +{"train_loss": 0.0006432136869989336, "global_step": 52540, "epoch": 441, "lr": 1.6465063844015492e-05} +{"train_loss": 0.0005359818460419774, "global_step": 52541, "epoch": 441, "lr": 1.6463420567234238e-05} +{"train_loss": 0.0005759954219684005, "global_step": 52542, "epoch": 441, "lr": 1.6461777356298496e-05} +{"train_loss": 0.00047013344010338187, "global_step": 52543, "epoch": 441, "lr": 1.646013421121145e-05} +{"train_loss": 0.0005190115189179778, "global_step": 52544, "epoch": 441, "lr": 1.6458491131976367e-05} +{"train_loss": 0.0005262731574475765, "global_step": 52545, "epoch": 441, "lr": 1.6456848118596437e-05} +{"train_loss": 0.000591874704696238, "global_step": 52546, "epoch": 441, "lr": 1.6455205171074917e-05} +{"train_loss": 0.0007536617922596633, "global_step": 52547, "epoch": 441, "lr": 1.645356228941502e-05} +{"train_loss": 0.000355890195351094, "global_step": 52548, "epoch": 441, "lr": 1.645191947361995e-05} +{"train_loss": 0.0006836785469204187, "global_step": 52549, "epoch": 441, "lr": 1.645027672369297e-05} +{"train_loss": 0.00023819663329049945, "global_step": 52550, "epoch": 441, "lr": 1.6448634039637273e-05} +{"train_loss": 0.0007715023821219802, "global_step": 52551, "epoch": 441, "lr": 1.644699142145611e-05} +{"train_loss": 0.0005843290127813816, "global_step": 52552, "epoch": 441, "lr": 1.6445348869152682e-05} +{"train_loss": 0.00042150524677708745, "global_step": 52553, "epoch": 441, "lr": 1.644370638273024e-05} +{"train_loss": 0.0005801012739539146, "global_step": 52554, "epoch": 441, "lr": 1.6442063962192e-05} +{"train_loss": 0.0007365660276263952, "global_step": 52555, "epoch": 441, "lr": 1.644042160754116e-05} +{"train_loss": 0.000643760256934911, "global_step": 52556, "epoch": 441, "lr": 1.643877931878099e-05} +{"train_loss": 0.0006622489308938384, "global_step": 52557, "epoch": 441, "lr": 1.6437137095914674e-05} +{"train_loss": 0.0005418499349616468, "global_step": 52558, "epoch": 441, "lr": 1.6435494938945467e-05} +{"train_loss": 0.0006974663119763136, "global_step": 52559, "epoch": 441, "lr": 1.643385284787658e-05} +{"train_loss": 0.0006382963038049638, "global_step": 52560, "epoch": 441, "lr": 1.643221082271122e-05} +{"train_loss": 0.0008344187517650425, "global_step": 52561, "epoch": 441, "lr": 1.6430568863452644e-05} +{"train_loss": 0.0008100341656245291, "global_step": 52562, "epoch": 441, "lr": 1.642892697010405e-05} +{"train_loss": 0.0004518501809798181, "global_step": 52563, "epoch": 441, "lr": 1.642728514266868e-05} +{"train_loss": 0.0006003526505082846, "global_step": 52564, "epoch": 441, "lr": 1.6425643381149737e-05} +{"train_loss": 0.0002848507429007441, "global_step": 52565, "epoch": 441, "lr": 1.6424001685550466e-05} +{"train_loss": 0.0009985436918213964, "global_step": 52566, "epoch": 441, "lr": 1.642236005587407e-05} +{"train_loss": 0.0005339065100997686, "global_step": 52567, "epoch": 441, "lr": 1.64207184921238e-05} +{"train_loss": 0.0005423202528618276, "global_step": 52568, "epoch": 441, "lr": 1.6419076994302847e-05} +{"train_loss": 0.0007331047672778368, "global_step": 52569, "epoch": 441, "lr": 1.6417435562414456e-05} +{"train_loss": 0.0005940115079283714, "global_step": 52570, "epoch": 441, "lr": 1.6415794196461838e-05} +{"train_loss": 0.0006532787811011076, "global_step": 52571, "epoch": 441, "lr": 1.6414152896448228e-05} +{"train_loss": 0.0006494754925370216, "global_step": 52572, "epoch": 441, "lr": 1.6412511662376823e-05} +{"train_loss": 0.0008201032178476453, "global_step": 52573, "epoch": 441, "lr": 1.6410870494250884e-05} +{"train_loss": 0.0004899183986708522, "global_step": 52574, "epoch": 441, "lr": 1.6409229392073596e-05} +{"train_loss": 0.0003332853375468403, "global_step": 52575, "epoch": 441, "lr": 1.6407588355848213e-05} +{"train_loss": 0.0004689745546784252, "global_step": 52576, "epoch": 441, "lr": 1.6405947385577926e-05} +{"train_loss": 0.0005488160531967878, "global_step": 52577, "epoch": 441, "lr": 1.6404306481265985e-05} +{"train_loss": 0.001284711412154138, "global_step": 52578, "epoch": 441, "lr": 1.6402665642915604e-05} +{"train_loss": 0.0008831820450723171, "global_step": 52579, "epoch": 441, "lr": 1.640102487052998e-05} +{"train_loss": 0.0004990968154743314, "global_step": 52580, "epoch": 441, "lr": 1.6399384164112373e-05} +{"train_loss": 0.0007040392374619842, "global_step": 52581, "epoch": 441, "lr": 1.6397743523665965e-05} +{"train_loss": 0.00046734040370211005, "global_step": 52582, "epoch": 441, "lr": 1.639610294919402e-05} +{"train_loss": 0.0013979129726067185, "global_step": 52583, "epoch": 441, "lr": 1.6394462440699716e-05} +{"train_loss": 0.0006674275500699878, "global_step": 52584, "epoch": 441, "lr": 1.6392821998186313e-05} +{"train_loss": 0.0007552013848908246, "global_step": 52585, "epoch": 441, "lr": 1.639118162165701e-05} +{"train_loss": 0.000499107816722244, "global_step": 52586, "epoch": 441, "lr": 1.638954131111502e-05} +{"train_loss": 0.0005604643374681473, "global_step": 52587, "epoch": 441, "lr": 1.6387901066563588e-05} +{"train_loss": 0.000827066891361028, "global_step": 52588, "epoch": 441, "lr": 1.6386260888005906e-05} +{"train_loss": 0.0004889839328825474, "global_step": 52589, "epoch": 441, "lr": 1.6384620775445226e-05} +{"train_loss": 0.0009617518517188728, "global_step": 52590, "epoch": 441, "lr": 1.6382980728884734e-05} +{"train_loss": 0.0007286526961252093, "global_step": 52591, "epoch": 441, "lr": 1.6381340748327688e-05} +{"train_loss": 0.0007777624996379018, "global_step": 52592, "epoch": 441, "lr": 1.6379700833777283e-05} +{"train_loss": 0.0008250068058259785, "global_step": 52593, "epoch": 441, "lr": 1.6378060985236732e-05} +{"train_loss": 0.0006949097150936723, "global_step": 52594, "epoch": 441, "lr": 1.637642120270928e-05} +{"train_loss": 0.0006746143335476518, "global_step": 52595, "epoch": 441, "lr": 1.6374781486198114e-05} +{"train_loss": 0.0009648786508478224, "global_step": 52596, "epoch": 441, "lr": 1.6373141835706497e-05} +{"train_loss": 0.0007081401982919916, "global_step": 52597, "epoch": 441, "lr": 1.637150225123762e-05, "val_loss": 0.02446499466896057} +{"train_loss": 0.0005530048510991037, "global_step": 52598, "epoch": 442, "lr": 1.6369862732794684e-05} +{"train_loss": 0.0006823324947617948, "global_step": 52599, "epoch": 442, "lr": 1.636822328038095e-05} +{"train_loss": 0.00047264856402762234, "global_step": 52600, "epoch": 442, "lr": 1.63665838939996e-05} +{"train_loss": 0.0005751405260525644, "global_step": 52601, "epoch": 442, "lr": 1.6364944573653867e-05} +{"train_loss": 0.0010562323732301593, "global_step": 52602, "epoch": 442, "lr": 1.636330531934699e-05} +{"train_loss": 0.0005545183084905148, "global_step": 52603, "epoch": 442, "lr": 1.6361666131082153e-05} +{"train_loss": 0.0004938601632602513, "global_step": 52604, "epoch": 442, "lr": 1.636002700886261e-05} +{"train_loss": 0.00046470476081594825, "global_step": 52605, "epoch": 442, "lr": 1.635838795269154e-05} +{"train_loss": 0.0010783668840304017, "global_step": 52606, "epoch": 442, "lr": 1.63567489625722e-05} +{"train_loss": 0.0008256450528278947, "global_step": 52607, "epoch": 442, "lr": 1.635511003850777e-05} +{"train_loss": 0.0006055172416381538, "global_step": 52608, "epoch": 442, "lr": 1.6353471180501507e-05} +{"train_loss": 0.0010858087334781885, "global_step": 52609, "epoch": 442, "lr": 1.6351832388556604e-05} +{"train_loss": 0.0002744954836089164, "global_step": 52610, "epoch": 442, "lr": 1.6350193662676273e-05} +{"train_loss": 0.0006707506836391985, "global_step": 52611, "epoch": 442, "lr": 1.6348555002863752e-05} +{"train_loss": 0.0007633930654264987, "global_step": 52612, "epoch": 442, "lr": 1.6346916409122238e-05} +{"train_loss": 0.0008619461441412568, "global_step": 52613, "epoch": 442, "lr": 1.6345277881454968e-05} +{"train_loss": 0.0004508057900238782, "global_step": 52614, "epoch": 442, "lr": 1.6343639419865135e-05} +{"train_loss": 0.00044789083767682314, "global_step": 52615, "epoch": 442, "lr": 1.6342001024355992e-05} +{"train_loss": 0.000668198976200074, "global_step": 52616, "epoch": 442, "lr": 1.634036269493073e-05} +{"train_loss": 0.0006975977448746562, "global_step": 52617, "epoch": 442, "lr": 1.633872443159255e-05} +{"train_loss": 0.00041115007479675114, "global_step": 52618, "epoch": 442, "lr": 1.633708623434471e-05} +{"train_loss": 0.0004150690801907331, "global_step": 52619, "epoch": 442, "lr": 1.6335448103190386e-05} +{"train_loss": 0.000919938669539988, "global_step": 52620, "epoch": 442, "lr": 1.633381003813283e-05} +{"train_loss": 0.0006696328055113554, "global_step": 52621, "epoch": 442, "lr": 1.6332172039175226e-05} +{"train_loss": 0.0006958945305086672, "global_step": 52622, "epoch": 442, "lr": 1.633053410632082e-05} +{"train_loss": 0.0008397414931096137, "global_step": 52623, "epoch": 442, "lr": 1.6328896239572815e-05} +{"train_loss": 0.00039156328421086073, "global_step": 52624, "epoch": 442, "lr": 1.6327258438934405e-05} +{"train_loss": 0.0004888302064500749, "global_step": 52625, "epoch": 442, "lr": 1.632562070440885e-05} +{"train_loss": 0.00032568204915151, "global_step": 52626, "epoch": 442, "lr": 1.632398303599932e-05} +{"train_loss": 0.0008683644118718803, "global_step": 52627, "epoch": 442, "lr": 1.6322345433709063e-05} +{"train_loss": 0.001103934715501964, "global_step": 52628, "epoch": 442, "lr": 1.632070789754129e-05} +{"train_loss": 0.0006843495648354292, "global_step": 52629, "epoch": 442, "lr": 1.6319070427499188e-05} +{"train_loss": 0.0006229127175174654, "global_step": 52630, "epoch": 442, "lr": 1.6317433023586016e-05} +{"train_loss": 0.0003627454279921949, "global_step": 52631, "epoch": 442, "lr": 1.6315795685804942e-05} +{"train_loss": 0.0008333121077157557, "global_step": 52632, "epoch": 442, "lr": 1.6314158414159225e-05} +{"train_loss": 0.0005107662873342633, "global_step": 52633, "epoch": 442, "lr": 1.6312521208652036e-05} +{"train_loss": 0.0006568269454874098, "global_step": 52634, "epoch": 442, "lr": 1.6310884069286637e-05} +{"train_loss": 0.0004067973350174725, "global_step": 52635, "epoch": 442, "lr": 1.63092469960662e-05} +{"train_loss": 0.0010098241036757827, "global_step": 52636, "epoch": 442, "lr": 1.6307609988993956e-05} +{"train_loss": 0.0004336317942943424, "global_step": 52637, "epoch": 442, "lr": 1.6305973048073137e-05} +{"train_loss": 0.0007787675713188946, "global_step": 52638, "epoch": 442, "lr": 1.6304336173306923e-05} +{"train_loss": 0.0007014014991000295, "global_step": 52639, "epoch": 442, "lr": 1.6302699364698566e-05} +{"train_loss": 0.0004066282126586884, "global_step": 52640, "epoch": 442, "lr": 1.6301062622251235e-05} +{"train_loss": 0.0007703126175329089, "global_step": 52641, "epoch": 442, "lr": 1.6299425945968188e-05} +{"train_loss": 0.0006091283867135644, "global_step": 52642, "epoch": 442, "lr": 1.6297789335852614e-05} +{"train_loss": 0.0008993677911348641, "global_step": 52643, "epoch": 442, "lr": 1.629615279190772e-05} +{"train_loss": 0.0013145541306585073, "global_step": 52644, "epoch": 442, "lr": 1.6294516314136743e-05} +{"train_loss": 0.0006020547589287162, "global_step": 52645, "epoch": 442, "lr": 1.6292879902542862e-05} +{"train_loss": 0.000453980261227116, "global_step": 52646, "epoch": 442, "lr": 1.6291243557129333e-05} +{"train_loss": 0.0007509716670028865, "global_step": 52647, "epoch": 442, "lr": 1.6289607277899343e-05} +{"train_loss": 0.0007016219897195697, "global_step": 52648, "epoch": 442, "lr": 1.6287971064856088e-05} +{"train_loss": 0.0006478481227532029, "global_step": 52649, "epoch": 442, "lr": 1.6286334918002822e-05} +{"train_loss": 0.0005023173871450126, "global_step": 52650, "epoch": 442, "lr": 1.6284698837342715e-05} +{"train_loss": 0.0006659863865934312, "global_step": 52651, "epoch": 442, "lr": 1.628306282287902e-05} +{"train_loss": 0.000476013810839504, "global_step": 52652, "epoch": 442, "lr": 1.6281426874614912e-05} +{"train_loss": 0.0005257812445051968, "global_step": 52653, "epoch": 442, "lr": 1.6279790992553633e-05} +{"train_loss": 0.0005805861437693238, "global_step": 52654, "epoch": 442, "lr": 1.6278155176698384e-05} +{"train_loss": 0.0006041087908670306, "global_step": 52655, "epoch": 442, "lr": 1.6276519427052363e-05} +{"train_loss": 0.0008312651189044118, "global_step": 52656, "epoch": 442, "lr": 1.6274883743618802e-05} +{"train_loss": 0.0005145948380231857, "global_step": 52657, "epoch": 442, "lr": 1.627324812640089e-05} +{"train_loss": 0.0004410134570207447, "global_step": 52658, "epoch": 442, "lr": 1.6271612575401873e-05} +{"train_loss": 0.0004686769098043442, "global_step": 52659, "epoch": 442, "lr": 1.6269977090624938e-05} +{"train_loss": 0.001129206153564155, "global_step": 52660, "epoch": 442, "lr": 1.6268341672073278e-05} +{"train_loss": 0.0007193015771917999, "global_step": 52661, "epoch": 442, "lr": 1.6266706319750148e-05} +{"train_loss": 0.0015215880703181028, "global_step": 52662, "epoch": 442, "lr": 1.626507103365872e-05} +{"train_loss": 0.0009394458611495793, "global_step": 52663, "epoch": 442, "lr": 1.6263435813802235e-05} +{"train_loss": 0.0008094767690636218, "global_step": 52664, "epoch": 442, "lr": 1.6261800660183873e-05} +{"train_loss": 0.00031583139207214117, "global_step": 52665, "epoch": 442, "lr": 1.626016557280688e-05} +{"train_loss": 0.0005916723166592419, "global_step": 52666, "epoch": 442, "lr": 1.6258530551674428e-05} +{"train_loss": 0.0012555144494399428, "global_step": 52667, "epoch": 442, "lr": 1.6256895596789768e-05} +{"train_loss": 0.0006321549299173057, "global_step": 52668, "epoch": 442, "lr": 1.625526070815607e-05} +{"train_loss": 0.0007821425097063184, "global_step": 52669, "epoch": 442, "lr": 1.6253625885776575e-05} +{"train_loss": 0.0006549165700562298, "global_step": 52670, "epoch": 442, "lr": 1.6251991129654464e-05} +{"train_loss": 0.0004269984201528132, "global_step": 52671, "epoch": 442, "lr": 1.6250356439792963e-05} +{"train_loss": 0.0004110246663913131, "global_step": 52672, "epoch": 442, "lr": 1.62487218161953e-05} +{"train_loss": 0.0005533558432944119, "global_step": 52673, "epoch": 442, "lr": 1.624708725886467e-05} +{"train_loss": 0.0005748901749029756, "global_step": 52674, "epoch": 442, "lr": 1.6245452767804254e-05} +{"train_loss": 0.0006833522929809988, "global_step": 52675, "epoch": 442, "lr": 1.624381834301731e-05} +{"train_loss": 0.0012948766816407442, "global_step": 52676, "epoch": 442, "lr": 1.6242183984506996e-05} +{"train_loss": 0.0012892833910882473, "global_step": 52677, "epoch": 442, "lr": 1.6240549692276567e-05} +{"train_loss": 0.0002973248774651438, "global_step": 52678, "epoch": 442, "lr": 1.6238915466329218e-05} +{"train_loss": 0.00048074667574837804, "global_step": 52679, "epoch": 442, "lr": 1.6237281306668135e-05} +{"train_loss": 0.0005644062766805291, "global_step": 52680, "epoch": 442, "lr": 1.623564721329655e-05} +{"train_loss": 0.0013097954215481877, "global_step": 52681, "epoch": 442, "lr": 1.6234013186217655e-05} +{"train_loss": 0.0005318383336998522, "global_step": 52682, "epoch": 442, "lr": 1.6232379225434685e-05} +{"train_loss": 0.0009625527891330421, "global_step": 52683, "epoch": 442, "lr": 1.6230745330950812e-05} +{"train_loss": 0.0005863648257218301, "global_step": 52684, "epoch": 442, "lr": 1.6229111502769278e-05} +{"train_loss": 0.0005983805167488754, "global_step": 52685, "epoch": 442, "lr": 1.6227477740893282e-05} +{"train_loss": 0.0006481072632595897, "global_step": 52686, "epoch": 442, "lr": 1.6225844045326e-05} +{"train_loss": 0.0006364264409057796, "global_step": 52687, "epoch": 442, "lr": 1.622421041607069e-05} +{"train_loss": 0.0009282513638027012, "global_step": 52688, "epoch": 442, "lr": 1.622257685313051e-05} +{"train_loss": 0.0008915672660805285, "global_step": 52689, "epoch": 442, "lr": 1.6220943356508717e-05} +{"train_loss": 0.0008514882065355778, "global_step": 52690, "epoch": 442, "lr": 1.621930992620847e-05} +{"train_loss": 0.0006987113738432527, "global_step": 52691, "epoch": 442, "lr": 1.6217676562233013e-05} +{"train_loss": 0.000798504741396755, "global_step": 52692, "epoch": 442, "lr": 1.6216043264585547e-05} +{"train_loss": 0.0005947448080405593, "global_step": 52693, "epoch": 442, "lr": 1.621441003326925e-05} +{"train_loss": 0.0004493660235311836, "global_step": 52694, "epoch": 442, "lr": 1.6212776868287365e-05} +{"train_loss": 0.0007597355870530009, "global_step": 52695, "epoch": 442, "lr": 1.6211143769643066e-05} +{"train_loss": 0.0011503658024594188, "global_step": 52696, "epoch": 442, "lr": 1.6209510737339594e-05} +{"train_loss": 0.0005614314577542245, "global_step": 52697, "epoch": 442, "lr": 1.6207877771380127e-05} +{"train_loss": 0.00040362487197853625, "global_step": 52698, "epoch": 442, "lr": 1.620624487176789e-05} +{"train_loss": 0.0004450808046385646, "global_step": 52699, "epoch": 442, "lr": 1.6204612038506067e-05} +{"train_loss": 0.0007817303412593901, "global_step": 52700, "epoch": 442, "lr": 1.6202979271597896e-05} +{"train_loss": 0.0004644958535209298, "global_step": 52701, "epoch": 442, "lr": 1.620134657104655e-05} +{"train_loss": 0.000825383176561445, "global_step": 52702, "epoch": 442, "lr": 1.619971393685526e-05} +{"train_loss": 0.0009943849872797728, "global_step": 52703, "epoch": 442, "lr": 1.6198081369027208e-05} +{"train_loss": 0.0007163283880800009, "global_step": 52704, "epoch": 442, "lr": 1.6196448867565627e-05} +{"train_loss": 0.0009172853897325695, "global_step": 52705, "epoch": 442, "lr": 1.619481643247369e-05} +{"train_loss": 0.000503736431710422, "global_step": 52706, "epoch": 442, "lr": 1.6193184063754634e-05} +{"train_loss": 0.0007608948508277535, "global_step": 52707, "epoch": 442, "lr": 1.619155176141164e-05} +{"train_loss": 0.0009587208041921258, "global_step": 52708, "epoch": 442, "lr": 1.618991952544793e-05} +{"train_loss": 0.0007514258031733334, "global_step": 52709, "epoch": 442, "lr": 1.6188287355866693e-05} +{"train_loss": 0.000668287044391036, "global_step": 52710, "epoch": 442, "lr": 1.618665525267115e-05} +{"train_loss": 0.0009539088932797313, "global_step": 52711, "epoch": 442, "lr": 1.6185023215864505e-05} +{"train_loss": 0.0008485628059133887, "global_step": 52712, "epoch": 442, "lr": 1.618339124544993e-05} +{"train_loss": 0.000657484692055732, "global_step": 52713, "epoch": 442, "lr": 1.6181759341430676e-05} +{"train_loss": 0.0009162218193523586, "global_step": 52714, "epoch": 442, "lr": 1.6180127503809906e-05} +{"train_loss": 0.0010828111553564668, "global_step": 52715, "epoch": 442, "lr": 1.617849573259086e-05} +{"train_loss": 0.000700195982246151, "global_step": 52716, "epoch": 442, "lr": 1.6176864027776723e-05, "val_loss": 0.014925917610526085} +{"train_loss": 0.0007042959914542735, "global_step": 52717, "epoch": 443, "lr": 1.6175232389370683e-05} +{"train_loss": 0.0002985231694765389, "global_step": 52718, "epoch": 443, "lr": 1.6173600817375976e-05} +{"train_loss": 0.000595349061768502, "global_step": 52719, "epoch": 443, "lr": 1.6171969311795774e-05} +{"train_loss": 0.0008845716365613043, "global_step": 52720, "epoch": 443, "lr": 1.6170337872633317e-05} +{"train_loss": 0.0007674975204281509, "global_step": 52721, "epoch": 443, "lr": 1.6168706499891767e-05} +{"train_loss": 0.000467153760837391, "global_step": 52722, "epoch": 443, "lr": 1.6167075193574365e-05} +{"train_loss": 0.0010373828699812293, "global_step": 52723, "epoch": 443, "lr": 1.6165443953684296e-05} +{"train_loss": 0.0005295331939123571, "global_step": 52724, "epoch": 443, "lr": 1.6163812780224747e-05} +{"train_loss": 0.0006752645131200552, "global_step": 52725, "epoch": 443, "lr": 1.616218167319895e-05} +{"train_loss": 0.0007582762045785785, "global_step": 52726, "epoch": 443, "lr": 1.6160550632610083e-05} +{"train_loss": 0.0008936720550991595, "global_step": 52727, "epoch": 443, "lr": 1.6158919658461374e-05} +{"train_loss": 0.0006340201362036169, "global_step": 52728, "epoch": 443, "lr": 1.615728875075601e-05} +{"train_loss": 0.0009111234685406089, "global_step": 52729, "epoch": 443, "lr": 1.615565790949718e-05} +{"train_loss": 0.0007089565042406321, "global_step": 52730, "epoch": 443, "lr": 1.6154027134688117e-05} +{"train_loss": 0.0011440996313467622, "global_step": 52731, "epoch": 443, "lr": 1.6152396426331984e-05} +{"train_loss": 0.0008854507468640804, "global_step": 52732, "epoch": 443, "lr": 1.615076578443202e-05} +{"train_loss": 0.00031558991759084165, "global_step": 52733, "epoch": 443, "lr": 1.61491352089914e-05} +{"train_loss": 0.0005374893080443144, "global_step": 52734, "epoch": 443, "lr": 1.614750470001334e-05} +{"train_loss": 0.0004873201542068273, "global_step": 52735, "epoch": 443, "lr": 1.6145874257501048e-05} +{"train_loss": 0.0007794966804794967, "global_step": 52736, "epoch": 443, "lr": 1.61442438814577e-05} +{"train_loss": 0.0006851053913123906, "global_step": 52737, "epoch": 443, "lr": 1.6142613571886528e-05} +{"train_loss": 0.0009671757579781115, "global_step": 52738, "epoch": 443, "lr": 1.6140983328790703e-05} +{"train_loss": 0.0015852914657443762, "global_step": 52739, "epoch": 443, "lr": 1.613935315217345e-05} +{"train_loss": 0.0009343880228698254, "global_step": 52740, "epoch": 443, "lr": 1.613772304203795e-05} +{"train_loss": 0.0005114690866321325, "global_step": 52741, "epoch": 443, "lr": 1.613609299838743e-05} +{"train_loss": 0.0007168874726630747, "global_step": 52742, "epoch": 443, "lr": 1.6134463021225072e-05} +{"train_loss": 0.0006907593342475593, "global_step": 52743, "epoch": 443, "lr": 1.613283311055406e-05} +{"train_loss": 0.0008024143753573298, "global_step": 52744, "epoch": 443, "lr": 1.6131203266377626e-05} +{"train_loss": 0.0010976014891639352, "global_step": 52745, "epoch": 443, "lr": 1.6129573488698947e-05} +{"train_loss": 0.0010621075052767992, "global_step": 52746, "epoch": 443, "lr": 1.6127943777521242e-05} +{"train_loss": 0.0008434073533862829, "global_step": 52747, "epoch": 443, "lr": 1.6126314132847702e-05} +{"train_loss": 0.000827755022328347, "global_step": 52748, "epoch": 443, "lr": 1.6124684554681512e-05} +{"train_loss": 0.0005072586936876178, "global_step": 52749, "epoch": 443, "lr": 1.6123055043025898e-05} +{"train_loss": 0.0004218991962261498, "global_step": 52750, "epoch": 443, "lr": 1.6121425597884033e-05} +{"train_loss": 0.000782450137194246, "global_step": 52751, "epoch": 443, "lr": 1.6119796219259144e-05} +{"train_loss": 0.000999211915768683, "global_step": 52752, "epoch": 443, "lr": 1.61181669071544e-05} +{"train_loss": 0.001208762638270855, "global_step": 52753, "epoch": 443, "lr": 1.611653766157303e-05} +{"train_loss": 0.0008079764083959162, "global_step": 52754, "epoch": 443, "lr": 1.6114908482518216e-05} +{"train_loss": 0.0009565487271174788, "global_step": 52755, "epoch": 443, "lr": 1.6113279369993146e-05} +{"train_loss": 0.0006407784530892968, "global_step": 52756, "epoch": 443, "lr": 1.611165032400105e-05} +{"train_loss": 0.0010222705313935876, "global_step": 52757, "epoch": 443, "lr": 1.611002134454509e-05} +{"train_loss": 0.001046834047883749, "global_step": 52758, "epoch": 443, "lr": 1.6108392431628492e-05} +{"train_loss": 0.0008917310042306781, "global_step": 52759, "epoch": 443, "lr": 1.6106763585254435e-05} +{"train_loss": 0.0008721633930690587, "global_step": 52760, "epoch": 443, "lr": 1.610513480542615e-05} +{"train_loss": 0.000405466795200482, "global_step": 52761, "epoch": 443, "lr": 1.6103506092146802e-05} +{"train_loss": 0.0005044848658144474, "global_step": 52762, "epoch": 443, "lr": 1.6101877445419583e-05} +{"train_loss": 0.00044748629443347454, "global_step": 52763, "epoch": 443, "lr": 1.6100248865247723e-05} +{"train_loss": 0.0006444754544645548, "global_step": 52764, "epoch": 443, "lr": 1.609862035163439e-05} +{"train_loss": 0.0006742209661751986, "global_step": 52765, "epoch": 443, "lr": 1.609699190458281e-05} +{"train_loss": 0.0005031191976740956, "global_step": 52766, "epoch": 443, "lr": 1.6095363524096148e-05} +{"train_loss": 0.0006238488713279366, "global_step": 52767, "epoch": 443, "lr": 1.609373521017763e-05} +{"train_loss": 0.001028240891173482, "global_step": 52768, "epoch": 443, "lr": 1.6092106962830423e-05} +{"train_loss": 0.0007471686112694442, "global_step": 52769, "epoch": 443, "lr": 1.6090478782057745e-05} +{"train_loss": 0.0013118713395670056, "global_step": 52770, "epoch": 443, "lr": 1.6088850667862803e-05} +{"train_loss": 0.0008159492863342166, "global_step": 52771, "epoch": 443, "lr": 1.608722262024877e-05} +{"train_loss": 0.0003663344541564584, "global_step": 52772, "epoch": 443, "lr": 1.6085594639218866e-05} +{"train_loss": 0.0007241361890919507, "global_step": 52773, "epoch": 443, "lr": 1.6083966724776268e-05} +{"train_loss": 0.0006196803878992796, "global_step": 52774, "epoch": 443, "lr": 1.6082338876924168e-05} +{"train_loss": 0.0006624155794270337, "global_step": 52775, "epoch": 443, "lr": 1.6080711095665785e-05} +{"train_loss": 0.0013543142704293132, "global_step": 52776, "epoch": 443, "lr": 1.607908338100429e-05} +{"train_loss": 0.0014550491468980908, "global_step": 52777, "epoch": 443, "lr": 1.60774557329429e-05} +{"train_loss": 0.0006895509432069957, "global_step": 52778, "epoch": 443, "lr": 1.607582815148479e-05} +{"train_loss": 0.0004775986890308559, "global_step": 52779, "epoch": 443, "lr": 1.6074200636633185e-05} +{"train_loss": 0.00039237053715623915, "global_step": 52780, "epoch": 443, "lr": 1.607257318839126e-05} +{"train_loss": 0.0007582996622659266, "global_step": 52781, "epoch": 443, "lr": 1.6070945806762194e-05} +{"train_loss": 0.0017269214149564505, "global_step": 52782, "epoch": 443, "lr": 1.6069318491749217e-05} +{"train_loss": 0.00047513487515971065, "global_step": 52783, "epoch": 443, "lr": 1.6067691243355497e-05} +{"train_loss": 0.0008442689431831241, "global_step": 52784, "epoch": 443, "lr": 1.6066064061584256e-05} +{"train_loss": 0.0007088337442837656, "global_step": 52785, "epoch": 443, "lr": 1.606443694643867e-05} +{"train_loss": 0.0006372923380695283, "global_step": 52786, "epoch": 443, "lr": 1.6062809897921927e-05} +{"train_loss": 0.0009770846227183938, "global_step": 52787, "epoch": 443, "lr": 1.6061182916037244e-05} +{"train_loss": 0.0007685186574235559, "global_step": 52788, "epoch": 443, "lr": 1.605955600078778e-05} +{"train_loss": 0.0010894231963902712, "global_step": 52789, "epoch": 443, "lr": 1.6057929152176777e-05} +{"train_loss": 0.0009379656985402107, "global_step": 52790, "epoch": 443, "lr": 1.6056302370207377e-05} +{"train_loss": 0.0008622735622338951, "global_step": 52791, "epoch": 443, "lr": 1.6054675654882827e-05} +{"train_loss": 0.0011361604556441307, "global_step": 52792, "epoch": 443, "lr": 1.605304900620629e-05} +{"train_loss": 0.0005154085229150951, "global_step": 52793, "epoch": 443, "lr": 1.605142242418095e-05} +{"train_loss": 0.0006465748301707208, "global_step": 52794, "epoch": 443, "lr": 1.6049795908810035e-05} +{"train_loss": 0.0008536952082067728, "global_step": 52795, "epoch": 443, "lr": 1.6048169460096694e-05} +{"train_loss": 0.0008024642011150718, "global_step": 52796, "epoch": 443, "lr": 1.604654307804417e-05} +{"train_loss": 0.0005207957583479583, "global_step": 52797, "epoch": 443, "lr": 1.6044916762655604e-05} +{"train_loss": 0.0011619508732110262, "global_step": 52798, "epoch": 443, "lr": 1.6043290513934244e-05} +{"train_loss": 0.0011136436369270086, "global_step": 52799, "epoch": 443, "lr": 1.6041664331883234e-05} +{"train_loss": 0.0006372648640535772, "global_step": 52800, "epoch": 443, "lr": 1.6040038216505805e-05} +{"train_loss": 0.0006318939849734306, "global_step": 52801, "epoch": 443, "lr": 1.6038412167805116e-05} +{"train_loss": 0.0008874779450707138, "global_step": 52802, "epoch": 443, "lr": 1.6036786185784392e-05} +{"train_loss": 0.0007277011754922569, "global_step": 52803, "epoch": 443, "lr": 1.6035160270446797e-05} +{"train_loss": 0.000773904612287879, "global_step": 52804, "epoch": 443, "lr": 1.6033534421795548e-05} +{"train_loss": 0.0008104354492388666, "global_step": 52805, "epoch": 443, "lr": 1.6031908639833814e-05} +{"train_loss": 0.0006837465916760266, "global_step": 52806, "epoch": 443, "lr": 1.603028292456481e-05} +{"train_loss": 0.0004733635578304529, "global_step": 52807, "epoch": 443, "lr": 1.6028657275991703e-05} +{"train_loss": 0.0007153174374252558, "global_step": 52808, "epoch": 443, "lr": 1.6027031694117712e-05} +{"train_loss": 0.000766336394008249, "global_step": 52809, "epoch": 443, "lr": 1.6025406178946e-05} +{"train_loss": 0.0012551527470350266, "global_step": 52810, "epoch": 443, "lr": 1.6023780730479793e-05} +{"train_loss": 0.000817330670543015, "global_step": 52811, "epoch": 443, "lr": 1.6022155348722256e-05} +{"train_loss": 0.0015254378085955977, "global_step": 52812, "epoch": 443, "lr": 1.6020530033676572e-05} +{"train_loss": 0.0005167446215637028, "global_step": 52813, "epoch": 443, "lr": 1.6018904785345968e-05} +{"train_loss": 0.00038871695869602263, "global_step": 52814, "epoch": 443, "lr": 1.6017279603733598e-05} +{"train_loss": 0.0007487331167794764, "global_step": 52815, "epoch": 443, "lr": 1.601565448884268e-05} +{"train_loss": 0.0011675427667796612, "global_step": 52816, "epoch": 443, "lr": 1.6014029440676398e-05} +{"train_loss": 0.0002843278634827584, "global_step": 52817, "epoch": 443, "lr": 1.6012404459237917e-05} +{"train_loss": 0.0005363944219425321, "global_step": 52818, "epoch": 443, "lr": 1.601077954453047e-05} +{"train_loss": 0.000725599704310298, "global_step": 52819, "epoch": 443, "lr": 1.600915469655721e-05} +{"train_loss": 0.0011460552923381329, "global_step": 52820, "epoch": 443, "lr": 1.6007529915321355e-05} +{"train_loss": 0.0005380264483392239, "global_step": 52821, "epoch": 443, "lr": 1.6005905200826073e-05} +{"train_loss": 0.001116305124014616, "global_step": 52822, "epoch": 443, "lr": 1.6004280553074578e-05} +{"train_loss": 0.0007121824310161173, "global_step": 52823, "epoch": 443, "lr": 1.6002655972070045e-05} +{"train_loss": 0.0007242587162181735, "global_step": 52824, "epoch": 443, "lr": 1.6001031457815653e-05} +{"train_loss": 0.0008704728097654879, "global_step": 52825, "epoch": 443, "lr": 1.5999407010314615e-05} +{"train_loss": 0.0005490368930622935, "global_step": 52826, "epoch": 443, "lr": 1.599778262957009e-05} +{"train_loss": 0.00039430256583727896, "global_step": 52827, "epoch": 443, "lr": 1.599615831558531e-05} +{"train_loss": 0.0004657251120079309, "global_step": 52828, "epoch": 443, "lr": 1.599453406836342e-05} +{"train_loss": 0.0007328878855332732, "global_step": 52829, "epoch": 443, "lr": 1.599290988790765e-05} +{"train_loss": 0.0006427185144275427, "global_step": 52830, "epoch": 443, "lr": 1.5991285774221144e-05} +{"train_loss": 0.0008408813737332821, "global_step": 52831, "epoch": 443, "lr": 1.5989661727307138e-05} +{"train_loss": 0.0006530194659717381, "global_step": 52832, "epoch": 443, "lr": 1.5988037747168777e-05} +{"train_loss": 0.0007335461559705436, "global_step": 52833, "epoch": 443, "lr": 1.5986413833809288e-05} +{"train_loss": 0.0006823235307820141, "global_step": 52834, "epoch": 443, "lr": 1.598478998723183e-05} +{"train_loss": 0.0007777141870347736, "global_step": 52835, "epoch": 443, "lr": 1.5983166207439616e-05, "val_loss": 0.018726006150245667} +{"train_loss": 0.0004793951811734587, "global_step": 52836, "epoch": 444, "lr": 1.5981542494435802e-05} +{"train_loss": 0.0009586584055796266, "global_step": 52837, "epoch": 444, "lr": 1.5979918848223613e-05} +{"train_loss": 0.0004792159888893366, "global_step": 52838, "epoch": 444, "lr": 1.5978295268806203e-05} +{"train_loss": 0.0007755195256322622, "global_step": 52839, "epoch": 444, "lr": 1.597667175618679e-05} +{"train_loss": 0.0007335859118029475, "global_step": 52840, "epoch": 444, "lr": 1.5975048310368535e-05} +{"train_loss": 0.0010004520881921053, "global_step": 52841, "epoch": 444, "lr": 1.5973424931354648e-05} +{"train_loss": 0.0009598550968803465, "global_step": 52842, "epoch": 444, "lr": 1.5971801619148312e-05} +{"train_loss": 0.0007158608641475439, "global_step": 52843, "epoch": 444, "lr": 1.5970178373752686e-05} +{"train_loss": 0.0006308780866675079, "global_step": 52844, "epoch": 444, "lr": 1.5968555195171e-05} +{"train_loss": 0.0006532941479235888, "global_step": 52845, "epoch": 444, "lr": 1.5966932083406405e-05} +{"train_loss": 0.0007902638171799481, "global_step": 52846, "epoch": 444, "lr": 1.596530903846212e-05} +{"train_loss": 0.0005342920776456594, "global_step": 52847, "epoch": 444, "lr": 1.5963686060341305e-05} +{"train_loss": 0.0005476073129102588, "global_step": 52848, "epoch": 444, "lr": 1.5962063149047146e-05} +{"train_loss": 0.0005411843885667622, "global_step": 52849, "epoch": 444, "lr": 1.5960440304582856e-05} +{"train_loss": 0.0005854766932316124, "global_step": 52850, "epoch": 444, "lr": 1.595881752695159e-05} +{"train_loss": 0.0004768511571455747, "global_step": 52851, "epoch": 444, "lr": 1.595719481615656e-05} +{"train_loss": 0.0009203423396684229, "global_step": 52852, "epoch": 444, "lr": 1.5955572172200934e-05} +{"train_loss": 0.00034099016920663416, "global_step": 52853, "epoch": 444, "lr": 1.5953949595087914e-05} +{"train_loss": 0.00041533788316883147, "global_step": 52854, "epoch": 444, "lr": 1.595232708482068e-05} +{"train_loss": 0.0005024036508984864, "global_step": 52855, "epoch": 444, "lr": 1.5950704641402398e-05} +{"train_loss": 0.0006523928022943437, "global_step": 52856, "epoch": 444, "lr": 1.5949082264836286e-05} +{"train_loss": 0.0007171853794716299, "global_step": 52857, "epoch": 444, "lr": 1.5947459955125492e-05} +{"train_loss": 0.0008604944450780749, "global_step": 52858, "epoch": 444, "lr": 1.594583771227324e-05} +{"train_loss": 0.0008200056036002934, "global_step": 52859, "epoch": 444, "lr": 1.5944215536282685e-05} +{"train_loss": 0.0008155937539413571, "global_step": 52860, "epoch": 444, "lr": 1.5942593427157045e-05} +{"train_loss": 0.00046944874338805676, "global_step": 52861, "epoch": 444, "lr": 1.5940971384899472e-05} +{"train_loss": 0.0006863370654173195, "global_step": 52862, "epoch": 444, "lr": 1.5939349409513155e-05} +{"train_loss": 0.0005915464134886861, "global_step": 52863, "epoch": 444, "lr": 1.5937727501001305e-05} +{"train_loss": 0.00110369804315269, "global_step": 52864, "epoch": 444, "lr": 1.5936105659367067e-05} +{"train_loss": 0.0005130036734044552, "global_step": 52865, "epoch": 444, "lr": 1.5934483884613642e-05} +{"train_loss": 0.0005604748730547726, "global_step": 52866, "epoch": 444, "lr": 1.5932862176744247e-05} +{"train_loss": 0.0009234409662894905, "global_step": 52867, "epoch": 444, "lr": 1.593124053576201e-05} +{"train_loss": 0.0010772438254207373, "global_step": 52868, "epoch": 444, "lr": 1.5929618961670166e-05} +{"train_loss": 0.0006498786387965083, "global_step": 52869, "epoch": 444, "lr": 1.5927997454471854e-05} +{"train_loss": 0.0008886712603271008, "global_step": 52870, "epoch": 444, "lr": 1.5926376014170297e-05} +{"train_loss": 0.0006519872113130987, "global_step": 52871, "epoch": 444, "lr": 1.5924754640768645e-05} +{"train_loss": 0.0004148534790147096, "global_step": 52872, "epoch": 444, "lr": 1.592313333427011e-05} +{"train_loss": 0.0009242958039976656, "global_step": 52873, "epoch": 444, "lr": 1.592151209467787e-05} +{"train_loss": 0.0008730401750653982, "global_step": 52874, "epoch": 444, "lr": 1.5919890921995078e-05} +{"train_loss": 0.0007751899538561702, "global_step": 52875, "epoch": 444, "lr": 1.5918269816224958e-05} +{"train_loss": 0.0005274356226436794, "global_step": 52876, "epoch": 444, "lr": 1.591664877737065e-05} +{"train_loss": 0.0005481865373440087, "global_step": 52877, "epoch": 444, "lr": 1.591502780543539e-05} +{"train_loss": 0.0008308664546348155, "global_step": 52878, "epoch": 444, "lr": 1.5913406900422307e-05} +{"train_loss": 0.0014525740407407284, "global_step": 52879, "epoch": 444, "lr": 1.5911786062334626e-05} +{"train_loss": 0.0012334348866716027, "global_step": 52880, "epoch": 444, "lr": 1.591016529117551e-05} +{"train_loss": 0.0007951615261845291, "global_step": 52881, "epoch": 444, "lr": 1.5908544586948125e-05} +{"train_loss": 0.0006427906337194145, "global_step": 52882, "epoch": 444, "lr": 1.5906923949655693e-05} +{"train_loss": 0.0010353425750508904, "global_step": 52883, "epoch": 444, "lr": 1.590530337930135e-05} +{"train_loss": 0.0004611514450516552, "global_step": 52884, "epoch": 444, "lr": 1.590368287588832e-05} +{"train_loss": 0.0002965278981719166, "global_step": 52885, "epoch": 444, "lr": 1.590206243941977e-05} +{"train_loss": 0.0004976720083504915, "global_step": 52886, "epoch": 444, "lr": 1.590044206989886e-05} +{"train_loss": 0.0013023634674027562, "global_step": 52887, "epoch": 444, "lr": 1.5898821767328802e-05} +{"train_loss": 0.0007729732897132635, "global_step": 52888, "epoch": 444, "lr": 1.5897201531712753e-05} +{"train_loss": 0.000468356825876981, "global_step": 52889, "epoch": 444, "lr": 1.5895581363053912e-05} +{"train_loss": 0.000513806298840791, "global_step": 52890, "epoch": 444, "lr": 1.5893961261355445e-05} +{"train_loss": 0.0006820606649853289, "global_step": 52891, "epoch": 444, "lr": 1.5892341226620554e-05} +{"train_loss": 0.0009198352927342057, "global_step": 52892, "epoch": 444, "lr": 1.5890721258852416e-05} +{"train_loss": 0.0005798644851893187, "global_step": 52893, "epoch": 444, "lr": 1.5889101358054175e-05} +{"train_loss": 0.0008446472347714007, "global_step": 52894, "epoch": 444, "lr": 1.5887481524229065e-05} +{"train_loss": 0.000934136682190001, "global_step": 52895, "epoch": 444, "lr": 1.5885861757380215e-05} +{"train_loss": 0.0008175108814612031, "global_step": 52896, "epoch": 444, "lr": 1.588424205751085e-05} +{"train_loss": 0.0007373310509137809, "global_step": 52897, "epoch": 444, "lr": 1.588262242462412e-05} +{"train_loss": 0.0005369083373807371, "global_step": 52898, "epoch": 444, "lr": 1.5881002858723226e-05} +{"train_loss": 0.0006020523142069578, "global_step": 52899, "epoch": 444, "lr": 1.5879383359811328e-05} +{"train_loss": 0.0003478732251096517, "global_step": 52900, "epoch": 444, "lr": 1.5877763927891608e-05} +{"train_loss": 0.00038214336382225156, "global_step": 52901, "epoch": 444, "lr": 1.5876144562967278e-05} +{"train_loss": 0.0006059015286155045, "global_step": 52902, "epoch": 444, "lr": 1.5874525265041468e-05} +{"train_loss": 0.0005325471865944564, "global_step": 52903, "epoch": 444, "lr": 1.58729060341174e-05} +{"train_loss": 0.0005998220294713974, "global_step": 52904, "epoch": 444, "lr": 1.5871286870198238e-05} +{"train_loss": 0.00045039449469186366, "global_step": 52905, "epoch": 444, "lr": 1.5869667773287143e-05} +{"train_loss": 0.0009731109021231532, "global_step": 52906, "epoch": 444, "lr": 1.5868048743387322e-05} +{"train_loss": 0.0005208190414123237, "global_step": 52907, "epoch": 444, "lr": 1.5866429780501925e-05} +{"train_loss": 0.00041171812335960567, "global_step": 52908, "epoch": 444, "lr": 1.586481088463416e-05} +{"train_loss": 0.0006558673339895904, "global_step": 52909, "epoch": 444, "lr": 1.5863192055787185e-05} +{"train_loss": 0.0006828084005974233, "global_step": 52910, "epoch": 444, "lr": 1.5861573293964194e-05} +{"train_loss": 0.0006207235273905098, "global_step": 52911, "epoch": 444, "lr": 1.5859954599168357e-05} +{"train_loss": 0.0004265850002411753, "global_step": 52912, "epoch": 444, "lr": 1.5858335971402838e-05} +{"train_loss": 0.0010789250954985619, "global_step": 52913, "epoch": 444, "lr": 1.585671741067084e-05} +{"train_loss": 0.00038338146987371147, "global_step": 52914, "epoch": 444, "lr": 1.585509891697552e-05} +{"train_loss": 0.0014680896420031786, "global_step": 52915, "epoch": 444, "lr": 1.5853480490320077e-05} +{"train_loss": 0.00039043588913045824, "global_step": 52916, "epoch": 444, "lr": 1.5851862130707683e-05} +{"train_loss": 0.0007405075011774898, "global_step": 52917, "epoch": 444, "lr": 1.5850243838141487e-05} +{"train_loss": 0.0006196398753672838, "global_step": 52918, "epoch": 444, "lr": 1.584862561262471e-05} +{"train_loss": 0.0002727996907196939, "global_step": 52919, "epoch": 444, "lr": 1.584700745416049e-05} +{"train_loss": 0.001366682117804885, "global_step": 52920, "epoch": 444, "lr": 1.5845389362752033e-05} +{"train_loss": 0.00093373580602929, "global_step": 52921, "epoch": 444, "lr": 1.5843771338402496e-05} +{"train_loss": 0.0011055750073865056, "global_step": 52922, "epoch": 444, "lr": 1.5842153381115075e-05} +{"train_loss": 0.0008168778149411082, "global_step": 52923, "epoch": 444, "lr": 1.5840535490892945e-05} +{"train_loss": 0.0006321118562482297, "global_step": 52924, "epoch": 444, "lr": 1.583891766773925e-05} +{"train_loss": 0.0004939239006489515, "global_step": 52925, "epoch": 444, "lr": 1.583729991165721e-05} +{"train_loss": 0.00044548933510668576, "global_step": 52926, "epoch": 444, "lr": 1.5835682222649968e-05} +{"train_loss": 0.00034583048545755446, "global_step": 52927, "epoch": 444, "lr": 1.5834064600720726e-05} +{"train_loss": 0.0004918621270917356, "global_step": 52928, "epoch": 444, "lr": 1.5832447045872634e-05} +{"train_loss": 0.0008005037670955062, "global_step": 52929, "epoch": 444, "lr": 1.58308295581089e-05} +{"train_loss": 0.0005847366410307586, "global_step": 52930, "epoch": 444, "lr": 1.5829212137432665e-05} +{"train_loss": 0.0004933930467814207, "global_step": 52931, "epoch": 444, "lr": 1.5827594783847133e-05} +{"train_loss": 0.0007489007548429072, "global_step": 52932, "epoch": 444, "lr": 1.5825977497355454e-05} +{"train_loss": 0.0006029818905517459, "global_step": 52933, "epoch": 444, "lr": 1.5824360277960835e-05} +{"train_loss": 0.000888102687895298, "global_step": 52934, "epoch": 444, "lr": 1.5822743125666416e-05} +{"train_loss": 0.0013655092334374785, "global_step": 52935, "epoch": 444, "lr": 1.582112604047541e-05} +{"train_loss": 0.00026530169998295605, "global_step": 52936, "epoch": 444, "lr": 1.5819509022390948e-05} +{"train_loss": 0.0007607318111695349, "global_step": 52937, "epoch": 444, "lr": 1.5817892071416253e-05} +{"train_loss": 0.0003484679327812046, "global_step": 52938, "epoch": 444, "lr": 1.581627518755445e-05} +{"train_loss": 0.00029456030461005867, "global_step": 52939, "epoch": 444, "lr": 1.581465837080876e-05} +{"train_loss": 0.0014890938764438033, "global_step": 52940, "epoch": 444, "lr": 1.5813041621182316e-05} +{"train_loss": 0.000518058892339468, "global_step": 52941, "epoch": 444, "lr": 1.5811424938678332e-05} +{"train_loss": 0.0011261840118095279, "global_step": 52942, "epoch": 444, "lr": 1.580980832329996e-05} +{"train_loss": 0.0006697220960631967, "global_step": 52943, "epoch": 444, "lr": 1.5808191775050367e-05} +{"train_loss": 0.0006156015442684293, "global_step": 52944, "epoch": 444, "lr": 1.5806575293932746e-05} +{"train_loss": 0.0010156657081097364, "global_step": 52945, "epoch": 444, "lr": 1.580495887995025e-05} +{"train_loss": 0.0007490419084206223, "global_step": 52946, "epoch": 444, "lr": 1.5803342533106074e-05} +{"train_loss": 0.0004374887212179601, "global_step": 52947, "epoch": 444, "lr": 1.580172625340337e-05} +{"train_loss": 0.001005459693260491, "global_step": 52948, "epoch": 444, "lr": 1.580011004084534e-05} +{"train_loss": 0.0007534566102549434, "global_step": 52949, "epoch": 444, "lr": 1.579849389543514e-05} +{"train_loss": 0.001068029785528779, "global_step": 52950, "epoch": 444, "lr": 1.5796877817175925e-05} +{"train_loss": 0.0008024550625123084, "global_step": 52951, "epoch": 444, "lr": 1.5795261806070906e-05} +{"train_loss": 0.0005074652726761997, "global_step": 52952, "epoch": 444, "lr": 1.5793645862123212e-05} +{"train_loss": 0.0005438349908217788, "global_step": 52953, "epoch": 444, "lr": 1.5792029985336067e-05} +{"train_loss": 0.0007037641517250572, "global_step": 52954, "epoch": 444, "lr": 1.579041417571261e-05, "val_loss": 0.01996692642569542} +{"train_loss": 0.0004667208413593471, "global_step": 52955, "epoch": 445, "lr": 1.5788798433256002e-05} +{"train_loss": 0.0005947331083007157, "global_step": 52956, "epoch": 445, "lr": 1.5787182757969453e-05} +{"train_loss": 0.0004905035020783544, "global_step": 52957, "epoch": 445, "lr": 1.5785567149856096e-05} +{"train_loss": 0.0005320768686942756, "global_step": 52958, "epoch": 445, "lr": 1.5783951608919144e-05} +{"train_loss": 0.0005532049690373242, "global_step": 52959, "epoch": 445, "lr": 1.578233613516173e-05} +{"train_loss": 0.00119543238542974, "global_step": 52960, "epoch": 445, "lr": 1.5780720728587056e-05} +{"train_loss": 0.0005072419880889356, "global_step": 52961, "epoch": 445, "lr": 1.5779105389198283e-05} +{"train_loss": 0.0003743792767636478, "global_step": 52962, "epoch": 445, "lr": 1.5777490116998566e-05} +{"train_loss": 0.0004669120826292783, "global_step": 52963, "epoch": 445, "lr": 1.577587491199109e-05} +{"train_loss": 0.000745507946703583, "global_step": 52964, "epoch": 445, "lr": 1.577425977417904e-05} +{"train_loss": 0.000591838441323489, "global_step": 52965, "epoch": 445, "lr": 1.5772644703565565e-05} +{"train_loss": 0.0006797534879297018, "global_step": 52966, "epoch": 445, "lr": 1.5771029700153854e-05} +{"train_loss": 0.0003441843728069216, "global_step": 52967, "epoch": 445, "lr": 1.576941476394706e-05} +{"train_loss": 0.0005981192225590348, "global_step": 52968, "epoch": 445, "lr": 1.5767799894948377e-05} +{"train_loss": 0.0010286574251949787, "global_step": 52969, "epoch": 445, "lr": 1.5766185093160946e-05} +{"train_loss": 0.0005612748791463673, "global_step": 52970, "epoch": 445, "lr": 1.5764570358587965e-05} +{"train_loss": 0.0005155201070010662, "global_step": 52971, "epoch": 445, "lr": 1.5762955691232585e-05} +{"train_loss": 0.001065816031768918, "global_step": 52972, "epoch": 445, "lr": 1.5761341091097994e-05} +{"train_loss": 0.000783545256126672, "global_step": 52973, "epoch": 445, "lr": 1.5759726558187355e-05} +{"train_loss": 0.0008142600418068469, "global_step": 52974, "epoch": 445, "lr": 1.575811209250381e-05} +{"train_loss": 0.00040698007796891034, "global_step": 52975, "epoch": 445, "lr": 1.575649769405058e-05} +{"train_loss": 0.0011250413954257965, "global_step": 52976, "epoch": 445, "lr": 1.5754883362830792e-05} +{"train_loss": 0.00036227505188435316, "global_step": 52977, "epoch": 445, "lr": 1.5753269098847646e-05} +{"train_loss": 0.0004227900644764304, "global_step": 52978, "epoch": 445, "lr": 1.5751654902104273e-05} +{"train_loss": 0.0005418456858024001, "global_step": 52979, "epoch": 445, "lr": 1.575004077260389e-05} +{"train_loss": 0.0006002180743962526, "global_step": 52980, "epoch": 445, "lr": 1.5748426710349644e-05} +{"train_loss": 0.0006937379366718233, "global_step": 52981, "epoch": 445, "lr": 1.574681271534469e-05} +{"train_loss": 0.0007019710028544068, "global_step": 52982, "epoch": 445, "lr": 1.5745198787592218e-05} +{"train_loss": 0.0005091429920867085, "global_step": 52983, "epoch": 445, "lr": 1.5743584927095378e-05} +{"train_loss": 0.0004561475943773985, "global_step": 52984, "epoch": 445, "lr": 1.5741971133857365e-05} +{"train_loss": 0.00043482775799930096, "global_step": 52985, "epoch": 445, "lr": 1.5740357407881328e-05} +{"train_loss": 0.0004046543617732823, "global_step": 52986, "epoch": 445, "lr": 1.5738743749170426e-05} +{"train_loss": 0.0007105247932486236, "global_step": 52987, "epoch": 445, "lr": 1.5737130157727853e-05} +{"train_loss": 0.0007903034565970302, "global_step": 52988, "epoch": 445, "lr": 1.573551663355675e-05} +{"train_loss": 0.0008465947466902435, "global_step": 52989, "epoch": 445, "lr": 1.573390317666032e-05} +{"train_loss": 0.0009607643587514758, "global_step": 52990, "epoch": 445, "lr": 1.573228978704169e-05} +{"train_loss": 0.00043901544995605946, "global_step": 52991, "epoch": 445, "lr": 1.5730676464704063e-05} +{"train_loss": 0.0005758061888627708, "global_step": 52992, "epoch": 445, "lr": 1.5729063209650596e-05} +{"train_loss": 0.0006020715227350593, "global_step": 52993, "epoch": 445, "lr": 1.5727450021884432e-05} +{"train_loss": 0.00043829972855746746, "global_step": 52994, "epoch": 445, "lr": 1.572583690140878e-05} +{"train_loss": 0.001239586970768869, "global_step": 52995, "epoch": 445, "lr": 1.5724223848226766e-05} +{"train_loss": 0.0010154535993933678, "global_step": 52996, "epoch": 445, "lr": 1.5722610862341592e-05} +{"train_loss": 0.0008743071812205017, "global_step": 52997, "epoch": 445, "lr": 1.5720997943756394e-05} +{"train_loss": 0.0005950452759861946, "global_step": 52998, "epoch": 445, "lr": 1.5719385092474354e-05} +{"train_loss": 0.0006702385726384819, "global_step": 52999, "epoch": 445, "lr": 1.5717772308498653e-05} +{"train_loss": 0.0005834948387928307, "global_step": 53000, "epoch": 445, "lr": 1.571615959183243e-05} +{"train_loss": 0.0007746714982204139, "global_step": 53001, "epoch": 445, "lr": 1.571454694247888e-05} +{"train_loss": 0.0004416374722495675, "global_step": 53002, "epoch": 445, "lr": 1.5712934360441138e-05} +{"train_loss": 0.0005078467656858265, "global_step": 53003, "epoch": 445, "lr": 1.5711321845722405e-05} +{"train_loss": 0.0008276141597889364, "global_step": 53004, "epoch": 445, "lr": 1.5709709398325827e-05} +{"train_loss": 0.0005949101177975535, "global_step": 53005, "epoch": 445, "lr": 1.5708097018254554e-05} +{"train_loss": 0.000475716486107558, "global_step": 53006, "epoch": 445, "lr": 1.5706484705511786e-05} +{"train_loss": 0.0006638249033130705, "global_step": 53007, "epoch": 445, "lr": 1.5704872460100656e-05} +{"train_loss": 0.000904892454855144, "global_step": 53008, "epoch": 445, "lr": 1.5703260282024363e-05} +{"train_loss": 0.0008941544219851494, "global_step": 53009, "epoch": 445, "lr": 1.570164817128603e-05} +{"train_loss": 0.0003343945718370378, "global_step": 53010, "epoch": 445, "lr": 1.5700036127888874e-05} +{"train_loss": 0.0009037909912876785, "global_step": 53011, "epoch": 445, "lr": 1.5698424151836024e-05} +{"train_loss": 0.0006865980685688555, "global_step": 53012, "epoch": 445, "lr": 1.5696812243130645e-05} +{"train_loss": 0.0002780206559691578, "global_step": 53013, "epoch": 445, "lr": 1.5695200401775918e-05} +{"train_loss": 0.0007934639579616487, "global_step": 53014, "epoch": 445, "lr": 1.5693588627774985e-05} +{"train_loss": 0.0005504695582203567, "global_step": 53015, "epoch": 445, "lr": 1.5691976921131046e-05} +{"train_loss": 0.0007336419657804072, "global_step": 53016, "epoch": 445, "lr": 1.569036528184723e-05} +{"train_loss": 0.0006685125408694148, "global_step": 53017, "epoch": 445, "lr": 1.568875370992673e-05} +{"train_loss": 0.0003772051422856748, "global_step": 53018, "epoch": 445, "lr": 1.5687142205372695e-05} +{"train_loss": 0.000726273050531745, "global_step": 53019, "epoch": 445, "lr": 1.5685530768188277e-05} +{"train_loss": 0.000573939410969615, "global_step": 53020, "epoch": 445, "lr": 1.5683919398376667e-05} +{"train_loss": 0.0005566815380007029, "global_step": 53021, "epoch": 445, "lr": 1.5682308095941002e-05} +{"train_loss": 0.0005779715138487518, "global_step": 53022, "epoch": 445, "lr": 1.5680696860884477e-05} +{"train_loss": 0.001059177448041737, "global_step": 53023, "epoch": 445, "lr": 1.5679085693210232e-05} +{"train_loss": 0.0002532453218009323, "global_step": 53024, "epoch": 445, "lr": 1.567747459292142e-05} +{"train_loss": 0.0005680097383446991, "global_step": 53025, "epoch": 445, "lr": 1.5675863560021236e-05} +{"train_loss": 0.000608311325777322, "global_step": 53026, "epoch": 445, "lr": 1.567425259451281e-05} +{"train_loss": 0.0008327521500177681, "global_step": 53027, "epoch": 445, "lr": 1.5672641696399344e-05} +{"train_loss": 0.0005393463070504367, "global_step": 53028, "epoch": 445, "lr": 1.5671030865683957e-05} +{"train_loss": 0.000387803214835003, "global_step": 53029, "epoch": 445, "lr": 1.5669420102369848e-05} +{"train_loss": 0.0005990316276438534, "global_step": 53030, "epoch": 445, "lr": 1.5667809406460155e-05} +{"train_loss": 0.0015191481215879321, "global_step": 53031, "epoch": 445, "lr": 1.5666198777958065e-05} +{"train_loss": 0.0011735204607248306, "global_step": 53032, "epoch": 445, "lr": 1.5664588216866706e-05} +{"train_loss": 0.0006001598085276783, "global_step": 53033, "epoch": 445, "lr": 1.566297772318926e-05} +{"train_loss": 0.00032380232005380094, "global_step": 53034, "epoch": 445, "lr": 1.566136729692891e-05} +{"train_loss": 0.0009383061551488936, "global_step": 53035, "epoch": 445, "lr": 1.5659756938088788e-05} +{"train_loss": 0.0006935361307114363, "global_step": 53036, "epoch": 445, "lr": 1.5658146646672055e-05} +{"train_loss": 0.001221193466335535, "global_step": 53037, "epoch": 445, "lr": 1.56565364226819e-05} +{"train_loss": 0.0009140947950072587, "global_step": 53038, "epoch": 445, "lr": 1.5654926266121444e-05} +{"train_loss": 0.000685619714204222, "global_step": 53039, "epoch": 445, "lr": 1.5653316176993892e-05} +{"train_loss": 0.0003664757532533258, "global_step": 53040, "epoch": 445, "lr": 1.5651706155302364e-05} +{"train_loss": 0.0009633508161641657, "global_step": 53041, "epoch": 445, "lr": 1.5650096201050063e-05} +{"train_loss": 0.0008834351901896298, "global_step": 53042, "epoch": 445, "lr": 1.5648486314240122e-05} +{"train_loss": 0.0005419981898739934, "global_step": 53043, "epoch": 445, "lr": 1.56468764948757e-05} +{"train_loss": 0.00044213366345502436, "global_step": 53044, "epoch": 445, "lr": 1.564526674295998e-05} +{"train_loss": 0.0006192155415192246, "global_step": 53045, "epoch": 445, "lr": 1.5643657058496085e-05} +{"train_loss": 0.0006716495263390243, "global_step": 53046, "epoch": 445, "lr": 1.5642047441487222e-05} +{"train_loss": 0.0005993666127324104, "global_step": 53047, "epoch": 445, "lr": 1.564043789193651e-05} +{"train_loss": 0.0008814072934910655, "global_step": 53048, "epoch": 445, "lr": 1.5638828409847144e-05} +{"train_loss": 0.0005327623803168535, "global_step": 53049, "epoch": 445, "lr": 1.563721899522227e-05} +{"train_loss": 0.0005346794496290386, "global_step": 53050, "epoch": 445, "lr": 1.5635609648065024e-05} +{"train_loss": 0.0005372862797230482, "global_step": 53051, "epoch": 445, "lr": 1.563400036837861e-05} +{"train_loss": 0.0007149107987061143, "global_step": 53052, "epoch": 445, "lr": 1.563239115616614e-05} +{"train_loss": 0.0003601299540605396, "global_step": 53053, "epoch": 445, "lr": 1.5630782011430822e-05} +{"train_loss": 0.0006636559846810997, "global_step": 53054, "epoch": 445, "lr": 1.562917293417579e-05} +{"train_loss": 0.0009705094853416085, "global_step": 53055, "epoch": 445, "lr": 1.5627563924404187e-05} +{"train_loss": 0.00117441825568676, "global_step": 53056, "epoch": 445, "lr": 1.5625954982119205e-05} +{"train_loss": 0.0006118364981375635, "global_step": 53057, "epoch": 445, "lr": 1.562434610732397e-05} +{"train_loss": 0.0006058758590370417, "global_step": 53058, "epoch": 445, "lr": 1.5622737300021682e-05} +{"train_loss": 0.0009122222545556724, "global_step": 53059, "epoch": 445, "lr": 1.562112856021546e-05} +{"train_loss": 0.0004221401468385011, "global_step": 53060, "epoch": 445, "lr": 1.561951988790849e-05} +{"train_loss": 0.0006758727831766009, "global_step": 53061, "epoch": 445, "lr": 1.561791128310391e-05} +{"train_loss": 0.0008348854025825858, "global_step": 53062, "epoch": 445, "lr": 1.56163027458049e-05} +{"train_loss": 0.0011678487062454224, "global_step": 53063, "epoch": 445, "lr": 1.561469427601459e-05} +{"train_loss": 0.0008527669706381857, "global_step": 53064, "epoch": 445, "lr": 1.5613085873736173e-05} +{"train_loss": 0.0006385965971276164, "global_step": 53065, "epoch": 445, "lr": 1.5611477538972768e-05} +{"train_loss": 0.0006581821362487972, "global_step": 53066, "epoch": 445, "lr": 1.5609869271727573e-05} +{"train_loss": 0.0006706286803819239, "global_step": 53067, "epoch": 445, "lr": 1.5608261072003704e-05} +{"train_loss": 0.0009263997199013829, "global_step": 53068, "epoch": 445, "lr": 1.5606652939804362e-05} +{"train_loss": 0.000452919804956764, "global_step": 53069, "epoch": 445, "lr": 1.5605044875132663e-05} +{"train_loss": 0.0010755178518593311, "global_step": 53070, "epoch": 445, "lr": 1.56034368779918e-05} +{"train_loss": 0.0007003283826634288, "global_step": 53071, "epoch": 445, "lr": 1.56018289483849e-05} +{"train_loss": 0.0010746606858447194, "global_step": 53072, "epoch": 445, "lr": 1.560022108631515e-05} +{"train_loss": 0.0006815170883416285, "global_step": 53073, "epoch": 445, "lr": 1.5598613291785692e-05, "val_loss": 0.03376256301999092, "train_action_mse_error": 9.46724321693182e-06} +{"train_loss": 0.0010780672309920192, "global_step": 53074, "epoch": 446, "lr": 1.5597005564799662e-05} +{"train_loss": 0.0007635167567059398, "global_step": 53075, "epoch": 446, "lr": 1.5595397905360254e-05} +{"train_loss": 0.0007972568855620921, "global_step": 53076, "epoch": 446, "lr": 1.5593790313470592e-05} +{"train_loss": 0.000745707715395838, "global_step": 53077, "epoch": 446, "lr": 1.5592182789133858e-05} +{"train_loss": 0.0004832927661482245, "global_step": 53078, "epoch": 446, "lr": 1.5590575332353185e-05} +{"train_loss": 0.0005136851104907691, "global_step": 53079, "epoch": 446, "lr": 1.5588967943131755e-05} +{"train_loss": 0.0007696609245613217, "global_step": 53080, "epoch": 446, "lr": 1.558736062147271e-05} +{"train_loss": 0.000887532252818346, "global_step": 53081, "epoch": 446, "lr": 1.5585753367379196e-05} +{"train_loss": 0.0007945235702209175, "global_step": 53082, "epoch": 446, "lr": 1.5584146180854393e-05} +{"train_loss": 0.0004516885383054614, "global_step": 53083, "epoch": 446, "lr": 1.558253906190142e-05} +{"train_loss": 0.0016706784954294562, "global_step": 53084, "epoch": 446, "lr": 1.5580932010523476e-05} +{"train_loss": 0.0006689613219350576, "global_step": 53085, "epoch": 446, "lr": 1.5579325026723673e-05} +{"train_loss": 0.0005257529555819929, "global_step": 53086, "epoch": 446, "lr": 1.5577718110505213e-05} +{"train_loss": 0.0004208937752991915, "global_step": 53087, "epoch": 446, "lr": 1.5576111261871218e-05} +{"train_loss": 0.00062628771411255, "global_step": 53088, "epoch": 446, "lr": 1.5574504480824838e-05} +{"train_loss": 0.0008708829991519451, "global_step": 53089, "epoch": 446, "lr": 1.557289776736926e-05} +{"train_loss": 0.00047837785677984357, "global_step": 53090, "epoch": 446, "lr": 1.5571291121507598e-05} +{"train_loss": 0.001038460759446025, "global_step": 53091, "epoch": 446, "lr": 1.5569684543243046e-05} +{"train_loss": 0.0005824655527248979, "global_step": 53092, "epoch": 446, "lr": 1.5568078032578738e-05} +{"train_loss": 0.0009283998515456915, "global_step": 53093, "epoch": 446, "lr": 1.5566471589517816e-05} +{"train_loss": 0.0007555215270258486, "global_step": 53094, "epoch": 446, "lr": 1.5564865214063462e-05} +{"train_loss": 0.0009688565041869879, "global_step": 53095, "epoch": 446, "lr": 1.5563258906218804e-05} +{"train_loss": 0.0005480860127136111, "global_step": 53096, "epoch": 446, "lr": 1.556165266598701e-05} +{"train_loss": 0.0011639170115813613, "global_step": 53097, "epoch": 446, "lr": 1.5560046493371243e-05} +{"train_loss": 0.000978548894636333, "global_step": 53098, "epoch": 446, "lr": 1.5558440388374628e-05} +{"train_loss": 0.0008878271328285336, "global_step": 53099, "epoch": 446, "lr": 1.5556834351000353e-05} +{"train_loss": 0.0004764724289998412, "global_step": 53100, "epoch": 446, "lr": 1.5555228381251542e-05} +{"train_loss": 0.0021275803446769714, "global_step": 53101, "epoch": 446, "lr": 1.5553622479131376e-05} +{"train_loss": 0.0006962568149901927, "global_step": 53102, "epoch": 446, "lr": 1.5552016644642976e-05} +{"train_loss": 0.0004022821376565844, "global_step": 53103, "epoch": 446, "lr": 1.5550410877789523e-05} +{"train_loss": 0.0005013640038669109, "global_step": 53104, "epoch": 446, "lr": 1.5548805178574162e-05} +{"train_loss": 0.0008604843751527369, "global_step": 53105, "epoch": 446, "lr": 1.554719954700002e-05} +{"train_loss": 0.0006107212393544614, "global_step": 53106, "epoch": 446, "lr": 1.5545593983070287e-05} +{"train_loss": 0.0008780453354120255, "global_step": 53107, "epoch": 446, "lr": 1.5543988486788093e-05} +{"train_loss": 0.000951985886786133, "global_step": 53108, "epoch": 446, "lr": 1.55423830581566e-05} +{"train_loss": 0.0008404368418268859, "global_step": 53109, "epoch": 446, "lr": 1.554077769717895e-05} +{"train_loss": 0.0011129600461572409, "global_step": 53110, "epoch": 446, "lr": 1.5539172403858315e-05} +{"train_loss": 0.000571967102587223, "global_step": 53111, "epoch": 446, "lr": 1.553756717819783e-05} +{"train_loss": 0.0008046541479416192, "global_step": 53112, "epoch": 446, "lr": 1.553596202020064e-05} +{"train_loss": 0.0009237277554348111, "global_step": 53113, "epoch": 446, "lr": 1.553435692986992e-05} +{"train_loss": 0.00047142666880972683, "global_step": 53114, "epoch": 446, "lr": 1.553275190720879e-05} +{"train_loss": 0.001026271260343492, "global_step": 53115, "epoch": 446, "lr": 1.5531146952220436e-05} +{"train_loss": 0.001182275707833469, "global_step": 53116, "epoch": 446, "lr": 1.5529542064907975e-05} +{"train_loss": 0.00039194137207232416, "global_step": 53117, "epoch": 446, "lr": 1.5527937245274597e-05} +{"train_loss": 0.0008188451756723225, "global_step": 53118, "epoch": 446, "lr": 1.5526332493323432e-05} +{"train_loss": 0.000973345770034939, "global_step": 53119, "epoch": 446, "lr": 1.5524727809057605e-05} +{"train_loss": 0.0010949939023703337, "global_step": 53120, "epoch": 446, "lr": 1.5523123192480316e-05} +{"train_loss": 0.0005593665991909802, "global_step": 53121, "epoch": 446, "lr": 1.5521518643594674e-05} +{"train_loss": 0.0009311562171205878, "global_step": 53122, "epoch": 446, "lr": 1.5519914162403858e-05} +{"train_loss": 0.0007088315906003118, "global_step": 53123, "epoch": 446, "lr": 1.5518309748911016e-05} +{"train_loss": 0.0008662492618896067, "global_step": 53124, "epoch": 446, "lr": 1.5516705403119263e-05} +{"train_loss": 0.0007411083788610995, "global_step": 53125, "epoch": 446, "lr": 1.5515101125031793e-05} +{"train_loss": 0.0006501547759398818, "global_step": 53126, "epoch": 446, "lr": 1.5513496914651725e-05} +{"train_loss": 0.0013637697556987405, "global_step": 53127, "epoch": 446, "lr": 1.5511892771982238e-05} +{"train_loss": 0.0006510746898129582, "global_step": 53128, "epoch": 446, "lr": 1.5510288697026448e-05} +{"train_loss": 0.0003234084288123995, "global_step": 53129, "epoch": 446, "lr": 1.5508684689787534e-05} +{"train_loss": 0.0006137368036434054, "global_step": 53130, "epoch": 446, "lr": 1.550708075026862e-05} +{"train_loss": 0.0011599495774134994, "global_step": 53131, "epoch": 446, "lr": 1.550547687847287e-05} +{"train_loss": 0.0017348334658890963, "global_step": 53132, "epoch": 446, "lr": 1.550387307440344e-05} +{"train_loss": 0.0011288679670542479, "global_step": 53133, "epoch": 446, "lr": 1.5502269338063464e-05} +{"train_loss": 0.0004346443456597626, "global_step": 53134, "epoch": 446, "lr": 1.5500665669456105e-05} +{"train_loss": 0.0006103574414737523, "global_step": 53135, "epoch": 446, "lr": 1.5499062068584486e-05} +{"train_loss": 0.00044183089630678296, "global_step": 53136, "epoch": 446, "lr": 1.5497458535451793e-05} +{"train_loss": 0.0010254334192723036, "global_step": 53137, "epoch": 446, "lr": 1.5495855070061153e-05} +{"train_loss": 0.0005128072807565331, "global_step": 53138, "epoch": 446, "lr": 1.54942516724157e-05} +{"train_loss": 0.0006931812968105078, "global_step": 53139, "epoch": 446, "lr": 1.5492648342518612e-05} +{"train_loss": 0.0006837011897005141, "global_step": 53140, "epoch": 446, "lr": 1.5491045080373006e-05} +{"train_loss": 0.0007290120120160282, "global_step": 53141, "epoch": 446, "lr": 1.5489441885982063e-05} +{"train_loss": 0.000543686852324754, "global_step": 53142, "epoch": 446, "lr": 1.5487838759348915e-05} +{"train_loss": 0.0004504996759351343, "global_step": 53143, "epoch": 446, "lr": 1.548623570047669e-05} +{"train_loss": 0.0009545019129291177, "global_step": 53144, "epoch": 446, "lr": 1.5484632709368574e-05} +{"train_loss": 0.001078885281458497, "global_step": 53145, "epoch": 446, "lr": 1.5483029786027676e-05} +{"train_loss": 0.0008176922565326095, "global_step": 53146, "epoch": 446, "lr": 1.5481426930457176e-05} +{"train_loss": 0.0005796261830255389, "global_step": 53147, "epoch": 446, "lr": 1.5479824142660192e-05} +{"train_loss": 0.0006344608846120536, "global_step": 53148, "epoch": 446, "lr": 1.5478221422639904e-05} +{"train_loss": 0.0002837388019543141, "global_step": 53149, "epoch": 446, "lr": 1.5476618770399436e-05} +{"train_loss": 0.0004965560510754585, "global_step": 53150, "epoch": 446, "lr": 1.5475016185941927e-05} +{"train_loss": 0.0009475712431594729, "global_step": 53151, "epoch": 446, "lr": 1.547341366927055e-05} +{"train_loss": 0.0006812008796259761, "global_step": 53152, "epoch": 446, "lr": 1.5471811220388415e-05} +{"train_loss": 0.0008029782329685986, "global_step": 53153, "epoch": 446, "lr": 1.547020883929871e-05} +{"train_loss": 0.0006723430124111474, "global_step": 53154, "epoch": 446, "lr": 1.5468606526004563e-05} +{"train_loss": 0.0006213079323060811, "global_step": 53155, "epoch": 446, "lr": 1.54670042805091e-05} +{"train_loss": 0.0010212995111942291, "global_step": 53156, "epoch": 446, "lr": 1.54654021028155e-05} +{"train_loss": 0.0005147659103386104, "global_step": 53157, "epoch": 446, "lr": 1.546379999292688e-05} +{"train_loss": 0.0008239771123044193, "global_step": 53158, "epoch": 446, "lr": 1.5462197950846414e-05} +{"train_loss": 0.0006159273907542229, "global_step": 53159, "epoch": 446, "lr": 1.5460595976577213e-05} +{"train_loss": 0.0003769409959204495, "global_step": 53160, "epoch": 446, "lr": 1.5458994070122462e-05} +{"train_loss": 0.0004844019131269306, "global_step": 53161, "epoch": 446, "lr": 1.545739223148527e-05} +{"train_loss": 0.000909432303160429, "global_step": 53162, "epoch": 446, "lr": 1.545579046066881e-05} +{"train_loss": 0.0006428632768802345, "global_step": 53163, "epoch": 446, "lr": 1.54541887576762e-05} +{"train_loss": 0.00037301151314750314, "global_step": 53164, "epoch": 446, "lr": 1.545258712251062e-05} +{"train_loss": 0.00030305288964882493, "global_step": 53165, "epoch": 446, "lr": 1.5450985555175173e-05} +{"train_loss": 0.0005432531470432878, "global_step": 53166, "epoch": 446, "lr": 1.5449384055673027e-05} +{"train_loss": 0.0007603758131153882, "global_step": 53167, "epoch": 446, "lr": 1.5447782624007345e-05} +{"train_loss": 0.000434320216299966, "global_step": 53168, "epoch": 446, "lr": 1.5446181260181243e-05} +{"train_loss": 0.0004454677109606564, "global_step": 53169, "epoch": 446, "lr": 1.544457996419786e-05} +{"train_loss": 0.0009537485893815756, "global_step": 53170, "epoch": 446, "lr": 1.544297873606037e-05} +{"train_loss": 0.0004358102451078594, "global_step": 53171, "epoch": 446, "lr": 1.544137757577188e-05} +{"train_loss": 0.00043728281161747873, "global_step": 53172, "epoch": 446, "lr": 1.5439776483335572e-05} +{"train_loss": 0.00044228523620404303, "global_step": 53173, "epoch": 446, "lr": 1.5438175458754568e-05} +{"train_loss": 0.0005606411141343415, "global_step": 53174, "epoch": 446, "lr": 1.5436574502032e-05} +{"train_loss": 0.0006279760273173451, "global_step": 53175, "epoch": 446, "lr": 1.543497361317104e-05} +{"train_loss": 0.00027782164397649467, "global_step": 53176, "epoch": 446, "lr": 1.5433372792174798e-05} +{"train_loss": 0.0007222139392979443, "global_step": 53177, "epoch": 446, "lr": 1.543177203904646e-05} +{"train_loss": 0.0009002366568893194, "global_step": 53178, "epoch": 446, "lr": 1.5430171353789125e-05} +{"train_loss": 0.0011061662808060646, "global_step": 53179, "epoch": 446, "lr": 1.5428570736405966e-05} +{"train_loss": 0.00038560840766876936, "global_step": 53180, "epoch": 446, "lr": 1.5426970186900118e-05} +{"train_loss": 0.000501863076351583, "global_step": 53181, "epoch": 446, "lr": 1.5425369705274707e-05} +{"train_loss": 0.0005950251943431795, "global_step": 53182, "epoch": 446, "lr": 1.5423769291532902e-05} +{"train_loss": 0.0007822092738933861, "global_step": 53183, "epoch": 446, "lr": 1.5422168945677817e-05} +{"train_loss": 0.0004901945940218866, "global_step": 53184, "epoch": 446, "lr": 1.5420568667712625e-05} +{"train_loss": 0.0008402024395763874, "global_step": 53185, "epoch": 446, "lr": 1.5418968457640438e-05} +{"train_loss": 0.000629113637842238, "global_step": 53186, "epoch": 446, "lr": 1.5417368315464426e-05} +{"train_loss": 0.0004113750474061817, "global_step": 53187, "epoch": 446, "lr": 1.5415768241187717e-05} +{"train_loss": 0.0008094815420918167, "global_step": 53188, "epoch": 446, "lr": 1.5414168234813435e-05} +{"train_loss": 0.0005628148792311549, "global_step": 53189, "epoch": 446, "lr": 1.541256829634476e-05} +{"train_loss": 0.0007191117038019001, "global_step": 53190, "epoch": 446, "lr": 1.541096842578479e-05} +{"train_loss": 0.0006616433965973556, "global_step": 53191, "epoch": 446, "lr": 1.5409368623136706e-05} +{"train_loss": 0.0007307278024161845, "global_step": 53192, "epoch": 446, "lr": 1.5407768888403633e-05, "val_loss": 0.02723338082432747} +{"train_loss": 0.00041095699998550117, "global_step": 53193, "epoch": 447, "lr": 1.5406169221588695e-05} +{"train_loss": 0.0006217507179826498, "global_step": 53194, "epoch": 447, "lr": 1.540456962269504e-05} +{"train_loss": 0.0006886811461299658, "global_step": 53195, "epoch": 447, "lr": 1.5402970091725844e-05} +{"train_loss": 0.0008202512399293482, "global_step": 53196, "epoch": 447, "lr": 1.5401370628684197e-05} +{"train_loss": 0.0011556553654372692, "global_step": 53197, "epoch": 447, "lr": 1.5399771233573277e-05} +{"train_loss": 0.0011050625471398234, "global_step": 53198, "epoch": 447, "lr": 1.5398171906396196e-05} +{"train_loss": 0.00047308774082921445, "global_step": 53199, "epoch": 447, "lr": 1.5396572647156127e-05} +{"train_loss": 0.0008028295123949647, "global_step": 53200, "epoch": 447, "lr": 1.539497345585617e-05} +{"train_loss": 0.0005058927345089614, "global_step": 53201, "epoch": 447, "lr": 1.5393374332499507e-05} +{"train_loss": 0.0004998877993784845, "global_step": 53202, "epoch": 447, "lr": 1.5391775277089236e-05} +{"train_loss": 0.0005536032258532941, "global_step": 53203, "epoch": 447, "lr": 1.5390176289628532e-05} +{"train_loss": 0.0004322536988183856, "global_step": 53204, "epoch": 447, "lr": 1.5388577370120503e-05} +{"train_loss": 0.0015663254307582974, "global_step": 53205, "epoch": 447, "lr": 1.538697851856833e-05} +{"train_loss": 0.0005562187288887799, "global_step": 53206, "epoch": 447, "lr": 1.538537973497512e-05} +{"train_loss": 0.001161961816251278, "global_step": 53207, "epoch": 447, "lr": 1.5383781019344e-05} +{"train_loss": 0.0003884432662744075, "global_step": 53208, "epoch": 447, "lr": 1.5382182371678146e-05} +{"train_loss": 0.0008756981114856899, "global_step": 53209, "epoch": 447, "lr": 1.5380583791980664e-05} +{"train_loss": 0.0017590807983651757, "global_step": 53210, "epoch": 447, "lr": 1.537898528025472e-05} +{"train_loss": 0.000650571018923074, "global_step": 53211, "epoch": 447, "lr": 1.5377386836503445e-05} +{"train_loss": 0.0004496289766393602, "global_step": 53212, "epoch": 447, "lr": 1.537578846072995e-05} +{"train_loss": 0.0008325286908075213, "global_step": 53213, "epoch": 447, "lr": 1.537419015293741e-05} +{"train_loss": 0.0005428332951851189, "global_step": 53214, "epoch": 447, "lr": 1.5372591913128942e-05} +{"train_loss": 0.000401535740820691, "global_step": 53215, "epoch": 447, "lr": 1.5370993741307697e-05} +{"train_loss": 0.00037470372626557946, "global_step": 53216, "epoch": 447, "lr": 1.5369395637476798e-05} +{"train_loss": 0.0007551590679213405, "global_step": 53217, "epoch": 447, "lr": 1.5367797601639405e-05} +{"train_loss": 0.0008149753557518125, "global_step": 53218, "epoch": 447, "lr": 1.536619963379864e-05} +{"train_loss": 0.0008078537066467106, "global_step": 53219, "epoch": 447, "lr": 1.5364601733957625e-05} +{"train_loss": 0.0006880367873236537, "global_step": 53220, "epoch": 447, "lr": 1.5363003902119528e-05} +{"train_loss": 0.00040161950164474547, "global_step": 53221, "epoch": 447, "lr": 1.536140613828746e-05} +{"train_loss": 0.0013047389220446348, "global_step": 53222, "epoch": 447, "lr": 1.5359808442464584e-05} +{"train_loss": 0.000468343059765175, "global_step": 53223, "epoch": 447, "lr": 1.5358210814654027e-05} +{"train_loss": 0.0005236288416199386, "global_step": 53224, "epoch": 447, "lr": 1.5356613254858902e-05} +{"train_loss": 0.0010866003576666117, "global_step": 53225, "epoch": 447, "lr": 1.5355015763082386e-05} +{"train_loss": 0.0015210218261927366, "global_step": 53226, "epoch": 447, "lr": 1.535341833932758e-05} +{"train_loss": 0.0006470010848715901, "global_step": 53227, "epoch": 447, "lr": 1.535182098359765e-05} +{"train_loss": 0.0008130564820021391, "global_step": 53228, "epoch": 447, "lr": 1.53502236958957e-05} +{"train_loss": 0.0010162778198719025, "global_step": 53229, "epoch": 447, "lr": 1.534862647622488e-05} +{"train_loss": 0.0015360401012003422, "global_step": 53230, "epoch": 447, "lr": 1.534702932458835e-05} +{"train_loss": 0.001222358550876379, "global_step": 53231, "epoch": 447, "lr": 1.534543224098921e-05} +{"train_loss": 0.0009863422019407153, "global_step": 53232, "epoch": 447, "lr": 1.5343835225430632e-05} +{"train_loss": 0.000890012364834547, "global_step": 53233, "epoch": 447, "lr": 1.534223827791571e-05} +{"train_loss": 0.0005835822666995227, "global_step": 53234, "epoch": 447, "lr": 1.5340641398447618e-05} +{"train_loss": 0.0005256371223367751, "global_step": 53235, "epoch": 447, "lr": 1.5339044587029456e-05} +{"train_loss": 0.000558426370844245, "global_step": 53236, "epoch": 447, "lr": 1.5337447843664394e-05} +{"train_loss": 0.0008711627451702952, "global_step": 53237, "epoch": 447, "lr": 1.5335851168355553e-05} +{"train_loss": 0.0005724571528844535, "global_step": 53238, "epoch": 447, "lr": 1.5334254561106043e-05} +{"train_loss": 0.0008334435406140983, "global_step": 53239, "epoch": 447, "lr": 1.5332658021919042e-05} +{"train_loss": 0.0015132918488234282, "global_step": 53240, "epoch": 447, "lr": 1.5331061550797644e-05} +{"train_loss": 0.0008614488760940731, "global_step": 53241, "epoch": 447, "lr": 1.532946514774502e-05} +{"train_loss": 0.0008925292640924454, "global_step": 53242, "epoch": 447, "lr": 1.532786881276429e-05} +{"train_loss": 0.0007019093027338386, "global_step": 53243, "epoch": 447, "lr": 1.5326272545858568e-05} +{"train_loss": 0.0004721822333522141, "global_step": 53244, "epoch": 447, "lr": 1.5324676347031018e-05} +{"train_loss": 0.00044388638343662024, "global_step": 53245, "epoch": 447, "lr": 1.5323080216284748e-05} +{"train_loss": 0.0006134702707640827, "global_step": 53246, "epoch": 447, "lr": 1.5321484153622922e-05} +{"train_loss": 0.0005223124171607196, "global_step": 53247, "epoch": 447, "lr": 1.531988815904864e-05} +{"train_loss": 0.0014893567422404885, "global_step": 53248, "epoch": 447, "lr": 1.531829223256507e-05} +{"train_loss": 0.0011332887224853039, "global_step": 53249, "epoch": 447, "lr": 1.5316696374175328e-05} +{"train_loss": 0.00038099035737104714, "global_step": 53250, "epoch": 447, "lr": 1.5315100583882523e-05} +{"train_loss": 0.0006593003054149449, "global_step": 53251, "epoch": 447, "lr": 1.5313504861689835e-05} +{"train_loss": 0.0011426450219005346, "global_step": 53252, "epoch": 447, "lr": 1.531190920760036e-05} +{"train_loss": 0.0005245816428214312, "global_step": 53253, "epoch": 447, "lr": 1.531031362161726e-05} +{"train_loss": 0.0005267883534543216, "global_step": 53254, "epoch": 447, "lr": 1.530871810374364e-05} +{"train_loss": 0.0008245874778367579, "global_step": 53255, "epoch": 447, "lr": 1.5307122653982658e-05} +{"train_loss": 0.0005988678312860429, "global_step": 53256, "epoch": 447, "lr": 1.530552727233744e-05} +{"train_loss": 0.0007969020516611636, "global_step": 53257, "epoch": 447, "lr": 1.530393195881109e-05} +{"train_loss": 0.0009325840510427952, "global_step": 53258, "epoch": 447, "lr": 1.5302336713406777e-05} +{"train_loss": 0.0007595191127620637, "global_step": 53259, "epoch": 447, "lr": 1.530074153612761e-05} +{"train_loss": 0.0008551279315724969, "global_step": 53260, "epoch": 447, "lr": 1.5299146426976742e-05} +{"train_loss": 0.0007121299859136343, "global_step": 53261, "epoch": 447, "lr": 1.5297551385957278e-05} +{"train_loss": 0.0006485729245468974, "global_step": 53262, "epoch": 447, "lr": 1.529595641307238e-05} +{"train_loss": 0.0007083993987180293, "global_step": 53263, "epoch": 447, "lr": 1.529436150832515e-05} +{"train_loss": 0.0006492844549939036, "global_step": 53264, "epoch": 447, "lr": 1.5292766671718727e-05} +{"train_loss": 0.0004209299513604492, "global_step": 53265, "epoch": 447, "lr": 1.5291171903256275e-05} +{"train_loss": 0.00045387272257357836, "global_step": 53266, "epoch": 447, "lr": 1.5289577202940875e-05} +{"train_loss": 0.0007042914512567222, "global_step": 53267, "epoch": 447, "lr": 1.52879825707757e-05} +{"train_loss": 0.0009357936796732247, "global_step": 53268, "epoch": 447, "lr": 1.5286388006763863e-05} +{"train_loss": 0.000608474831096828, "global_step": 53269, "epoch": 447, "lr": 1.528479351090848e-05} +{"train_loss": 0.0004821627517230809, "global_step": 53270, "epoch": 447, "lr": 1.5283199083212707e-05} +{"train_loss": 0.0006783002172596753, "global_step": 53271, "epoch": 447, "lr": 1.5281604723679655e-05} +{"train_loss": 0.0011191634694114327, "global_step": 53272, "epoch": 447, "lr": 1.5280010432312474e-05} +{"train_loss": 0.0007297003176063299, "global_step": 53273, "epoch": 447, "lr": 1.5278416209114267e-05} +{"train_loss": 0.0005372809246182442, "global_step": 53274, "epoch": 447, "lr": 1.5276822054088196e-05} +{"train_loss": 0.00043931626714766026, "global_step": 53275, "epoch": 447, "lr": 1.5275227967237378e-05} +{"train_loss": 0.0005765203386545181, "global_step": 53276, "epoch": 447, "lr": 1.5273633948564926e-05} +{"train_loss": 0.0004894050071015954, "global_step": 53277, "epoch": 447, "lr": 1.5272039998073994e-05} +{"train_loss": 0.000729088147636503, "global_step": 53278, "epoch": 447, "lr": 1.527044611576769e-05} +{"train_loss": 0.00060726806987077, "global_step": 53279, "epoch": 447, "lr": 1.5268852301649165e-05} +{"train_loss": 0.0007321491139009595, "global_step": 53280, "epoch": 447, "lr": 1.5267258555721546e-05} +{"train_loss": 0.00046741453115828335, "global_step": 53281, "epoch": 447, "lr": 1.5265664877987932e-05} +{"train_loss": 0.001056502922438085, "global_step": 53282, "epoch": 447, "lr": 1.526407126845149e-05} +{"train_loss": 0.0009103910997509956, "global_step": 53283, "epoch": 447, "lr": 1.526247772711532e-05} +{"train_loss": 0.0004905057139694691, "global_step": 53284, "epoch": 447, "lr": 1.5260884253982583e-05} +{"train_loss": 0.0006440565339289606, "global_step": 53285, "epoch": 447, "lr": 1.5259290849056367e-05} +{"train_loss": 0.0009566235239617527, "global_step": 53286, "epoch": 447, "lr": 1.5257697512339841e-05} +{"train_loss": 0.0010081217624247074, "global_step": 53287, "epoch": 447, "lr": 1.5256104243836112e-05} +{"train_loss": 0.0011370866559445858, "global_step": 53288, "epoch": 447, "lr": 1.5254511043548298e-05} +{"train_loss": 0.0008195961127057672, "global_step": 53289, "epoch": 447, "lr": 1.5252917911479553e-05} +{"train_loss": 0.0008006520802155137, "global_step": 53290, "epoch": 447, "lr": 1.5251324847632975e-05} +{"train_loss": 0.00040953545249067247, "global_step": 53291, "epoch": 447, "lr": 1.5249731852011723e-05} +{"train_loss": 0.00041954818880185485, "global_step": 53292, "epoch": 447, "lr": 1.5248138924618893e-05} +{"train_loss": 0.0004988493747077882, "global_step": 53293, "epoch": 447, "lr": 1.524654606545765e-05} +{"train_loss": 0.0008719634497538209, "global_step": 53294, "epoch": 447, "lr": 1.5244953274531081e-05} +{"train_loss": 0.0008056422811932862, "global_step": 53295, "epoch": 447, "lr": 1.5243360551842356e-05} +{"train_loss": 0.0005910786567255855, "global_step": 53296, "epoch": 447, "lr": 1.524176789739456e-05} +{"train_loss": 0.001085981959477067, "global_step": 53297, "epoch": 447, "lr": 1.5240175311190852e-05} +{"train_loss": 0.0006583461072295904, "global_step": 53298, "epoch": 447, "lr": 1.523858279323433e-05} +{"train_loss": 0.0006596557213924825, "global_step": 53299, "epoch": 447, "lr": 1.5236990343528157e-05} +{"train_loss": 0.0009603319922462106, "global_step": 53300, "epoch": 447, "lr": 1.523539796207542e-05} +{"train_loss": 0.0009910878725349903, "global_step": 53301, "epoch": 447, "lr": 1.5233805648879284e-05} +{"train_loss": 0.0009749765158630908, "global_step": 53302, "epoch": 447, "lr": 1.5232213403942842e-05} +{"train_loss": 0.0005066776066087186, "global_step": 53303, "epoch": 447, "lr": 1.5230621227269248e-05} +{"train_loss": 0.0005838919896632433, "global_step": 53304, "epoch": 447, "lr": 1.5229029118861598e-05} +{"train_loss": 0.00034027951187454164, "global_step": 53305, "epoch": 447, "lr": 1.522743707872305e-05} +{"train_loss": 0.000684060447383672, "global_step": 53306, "epoch": 447, "lr": 1.5225845106856717e-05} +{"train_loss": 0.0006643093074671924, "global_step": 53307, "epoch": 447, "lr": 1.5224253203265704e-05} +{"train_loss": 0.0009361275588162243, "global_step": 53308, "epoch": 447, "lr": 1.5222661367953173e-05} +{"train_loss": 0.00035701468004845083, "global_step": 53309, "epoch": 447, "lr": 1.5221069600922211e-05} +{"train_loss": 0.0004851415869779885, "global_step": 53310, "epoch": 447, "lr": 1.5219477902175982e-05} +{"train_loss": 0.000748451436701536, "global_step": 53311, "epoch": 447, "lr": 1.521788627171759e-05, "val_loss": 0.01838890090584755} +{"train_loss": 0.0006131169502623379, "global_step": 53312, "epoch": 448, "lr": 1.521629470955015e-05} +{"train_loss": 0.0006799301481805742, "global_step": 53313, "epoch": 448, "lr": 1.5214703215676813e-05} +{"train_loss": 0.0006542517221532762, "global_step": 53314, "epoch": 448, "lr": 1.5213111790100677e-05} +{"train_loss": 0.0007531630690209568, "global_step": 53315, "epoch": 448, "lr": 1.5211520432824888e-05} +{"train_loss": 0.0003910162777174264, "global_step": 53316, "epoch": 448, "lr": 1.5209929143852553e-05} +{"train_loss": 0.0007552626193501055, "global_step": 53317, "epoch": 448, "lr": 1.5208337923186821e-05} +{"train_loss": 0.0004859084729105234, "global_step": 53318, "epoch": 448, "lr": 1.52067467708308e-05} +{"train_loss": 0.0007035475573502481, "global_step": 53319, "epoch": 448, "lr": 1.5205155686787598e-05} +{"train_loss": 0.0004612568882293999, "global_step": 53320, "epoch": 448, "lr": 1.5203564671060371e-05} +{"train_loss": 0.0008202344761230052, "global_step": 53321, "epoch": 448, "lr": 1.5201973723652208e-05} +{"train_loss": 0.00031961483182385564, "global_step": 53322, "epoch": 448, "lr": 1.5200382844566274e-05} +{"train_loss": 0.0007148789591155946, "global_step": 53323, "epoch": 448, "lr": 1.5198792033805653e-05} +{"train_loss": 0.0011395660694688559, "global_step": 53324, "epoch": 448, "lr": 1.5197201291373498e-05} +{"train_loss": 0.0008690652903169394, "global_step": 53325, "epoch": 448, "lr": 1.519561061727291e-05} +{"train_loss": 0.0006407870096154511, "global_step": 53326, "epoch": 448, "lr": 1.5194020011507033e-05} +{"train_loss": 0.0005234450218267739, "global_step": 53327, "epoch": 448, "lr": 1.5192429474078967e-05} +{"train_loss": 0.0008061568369157612, "global_step": 53328, "epoch": 448, "lr": 1.5190839004991859e-05} +{"train_loss": 0.0006376053206622601, "global_step": 53329, "epoch": 448, "lr": 1.5189248604248807e-05} +{"train_loss": 0.0006238868809305131, "global_step": 53330, "epoch": 448, "lr": 1.5187658271852962e-05} +{"train_loss": 0.0005210090312175453, "global_step": 53331, "epoch": 448, "lr": 1.5186068007807414e-05} +{"train_loss": 0.0011844565160572529, "global_step": 53332, "epoch": 448, "lr": 1.5184477812115322e-05} +{"train_loss": 0.0005228568334132433, "global_step": 53333, "epoch": 448, "lr": 1.5182887684779767e-05} +{"train_loss": 0.0005288699176162481, "global_step": 53334, "epoch": 448, "lr": 1.5181297625803908e-05} +{"train_loss": 0.0007116468041203916, "global_step": 53335, "epoch": 448, "lr": 1.5179707635190838e-05} +{"train_loss": 0.0009982474148273468, "global_step": 53336, "epoch": 448, "lr": 1.5178117712943708e-05} +{"train_loss": 0.0006093939882703125, "global_step": 53337, "epoch": 448, "lr": 1.5176527859065626e-05} +{"train_loss": 0.0006136941956356168, "global_step": 53338, "epoch": 448, "lr": 1.5174938073559692e-05} +{"train_loss": 0.0006986383232288063, "global_step": 53339, "epoch": 448, "lr": 1.5173348356429063e-05} +{"train_loss": 0.0005783235537819564, "global_step": 53340, "epoch": 448, "lr": 1.5171758707676825e-05} +{"train_loss": 0.0004918054910376668, "global_step": 53341, "epoch": 448, "lr": 1.517016912730614e-05} +{"train_loss": 0.0006409102934412658, "global_step": 53342, "epoch": 448, "lr": 1.5168579615320105e-05} +{"train_loss": 0.0007173207122832537, "global_step": 53343, "epoch": 448, "lr": 1.5166990171721824e-05} +{"train_loss": 0.0014119840925559402, "global_step": 53344, "epoch": 448, "lr": 1.5165400796514456e-05} +{"train_loss": 0.0010646155569702387, "global_step": 53345, "epoch": 448, "lr": 1.5163811489701079e-05} +{"train_loss": 0.0007660280098207295, "global_step": 53346, "epoch": 448, "lr": 1.5162222251284857e-05} +{"train_loss": 0.00040671142050996423, "global_step": 53347, "epoch": 448, "lr": 1.5160633081268876e-05} +{"train_loss": 0.0008990753558464348, "global_step": 53348, "epoch": 448, "lr": 1.5159043979656285e-05} +{"train_loss": 0.0008209215011447668, "global_step": 53349, "epoch": 448, "lr": 1.515745494645019e-05} +{"train_loss": 0.0007446530507877469, "global_step": 53350, "epoch": 448, "lr": 1.5155865981653689e-05} +{"train_loss": 0.0009894834365695715, "global_step": 53351, "epoch": 448, "lr": 1.5154277085269941e-05} +{"train_loss": 0.00045879543176852167, "global_step": 53352, "epoch": 448, "lr": 1.5152688257302033e-05} +{"train_loss": 0.000557485967874527, "global_step": 53353, "epoch": 448, "lr": 1.5151099497753113e-05} +{"train_loss": 0.0005289061809889972, "global_step": 53354, "epoch": 448, "lr": 1.514951080662627e-05} +{"train_loss": 0.00043536711018532515, "global_step": 53355, "epoch": 448, "lr": 1.5147922183924656e-05} +{"train_loss": 0.0013123711105436087, "global_step": 53356, "epoch": 448, "lr": 1.5146333629651377e-05} +{"train_loss": 0.0005470299511216581, "global_step": 53357, "epoch": 448, "lr": 1.5144745143809524e-05} +{"train_loss": 0.0006834025261923671, "global_step": 53358, "epoch": 448, "lr": 1.5143156726402263e-05} +{"train_loss": 0.0006771094631403685, "global_step": 53359, "epoch": 448, "lr": 1.5141568377432674e-05} +{"train_loss": 0.0011242952896282077, "global_step": 53360, "epoch": 448, "lr": 1.5139980096903906e-05} +{"train_loss": 0.00048580075963400304, "global_step": 53361, "epoch": 448, "lr": 1.5138391884819042e-05} +{"train_loss": 0.0007399704190902412, "global_step": 53362, "epoch": 448, "lr": 1.5136803741181227e-05} +{"train_loss": 0.0004786117933690548, "global_step": 53363, "epoch": 448, "lr": 1.5135215665993585e-05} +{"train_loss": 0.001000870019197464, "global_step": 53364, "epoch": 448, "lr": 1.5133627659259208e-05} +{"train_loss": 0.0012968762312084436, "global_step": 53365, "epoch": 448, "lr": 1.5132039720981245e-05} +{"train_loss": 0.0004502043593674898, "global_step": 53366, "epoch": 448, "lr": 1.513045185116278e-05} +{"train_loss": 0.0005659007583744824, "global_step": 53367, "epoch": 448, "lr": 1.5128864049806967e-05} +{"train_loss": 0.000865697511471808, "global_step": 53368, "epoch": 448, "lr": 1.5127276316916899e-05} +{"train_loss": 0.0003385149466339499, "global_step": 53369, "epoch": 448, "lr": 1.5125688652495683e-05} +{"train_loss": 0.0005685816868208349, "global_step": 53370, "epoch": 448, "lr": 1.5124101056546469e-05} +{"train_loss": 0.000687865715008229, "global_step": 53371, "epoch": 448, "lr": 1.512251352907234e-05} +{"train_loss": 0.0005178095889277756, "global_step": 53372, "epoch": 448, "lr": 1.5120926070076453e-05} +{"train_loss": 0.0017872886965051293, "global_step": 53373, "epoch": 448, "lr": 1.5119338679561874e-05} +{"train_loss": 0.0005358509952202439, "global_step": 53374, "epoch": 448, "lr": 1.5117751357531767e-05} +{"train_loss": 0.0006350071053020656, "global_step": 53375, "epoch": 448, "lr": 1.5116164103989233e-05} +{"train_loss": 0.0008313119760714471, "global_step": 53376, "epoch": 448, "lr": 1.5114576918937363e-05} +{"train_loss": 0.0007782951579429209, "global_step": 53377, "epoch": 448, "lr": 1.5112989802379312e-05} +{"train_loss": 0.0009125490323640406, "global_step": 53378, "epoch": 448, "lr": 1.511140275431816e-05} +{"train_loss": 0.0011213172692805529, "global_step": 53379, "epoch": 448, "lr": 1.5109815774757057e-05} +{"train_loss": 0.0011317397002130747, "global_step": 53380, "epoch": 448, "lr": 1.5108228863699109e-05} +{"train_loss": 0.0007422162452712655, "global_step": 53381, "epoch": 448, "lr": 1.5106642021147404e-05} +{"train_loss": 0.0006941342144273221, "global_step": 53382, "epoch": 448, "lr": 1.5105055247105099e-05} +{"train_loss": 0.0007731911609880626, "global_step": 53383, "epoch": 448, "lr": 1.5103468541575278e-05} +{"train_loss": 0.0008359166677109897, "global_step": 53384, "epoch": 448, "lr": 1.5101881904561077e-05} +{"train_loss": 0.001214297371916473, "global_step": 53385, "epoch": 448, "lr": 1.510029533606559e-05} +{"train_loss": 0.00028911317349411547, "global_step": 53386, "epoch": 448, "lr": 1.5098708836091957e-05} +{"train_loss": 0.0004115882911719382, "global_step": 53387, "epoch": 448, "lr": 1.5097122404643282e-05} +{"train_loss": 0.0009740363457240164, "global_step": 53388, "epoch": 448, "lr": 1.509553604172267e-05} +{"train_loss": 0.0006402003928087652, "global_step": 53389, "epoch": 448, "lr": 1.5093949747333253e-05} +{"train_loss": 0.0009002434671856463, "global_step": 53390, "epoch": 448, "lr": 1.509236352147812e-05} +{"train_loss": 0.0005559687851928174, "global_step": 53391, "epoch": 448, "lr": 1.509077736416042e-05} +{"train_loss": 0.0007729546632617712, "global_step": 53392, "epoch": 448, "lr": 1.508919127538323e-05} +{"train_loss": 0.0007714001694694161, "global_step": 53393, "epoch": 448, "lr": 1.50876052551497e-05} +{"train_loss": 0.0006760565447621047, "global_step": 53394, "epoch": 448, "lr": 1.5086019303462912e-05} +{"train_loss": 0.00045356739428825676, "global_step": 53395, "epoch": 448, "lr": 1.5084433420326017e-05} +{"train_loss": 0.001451542368158698, "global_step": 53396, "epoch": 448, "lr": 1.5082847605742084e-05} +{"train_loss": 0.0003834033268503845, "global_step": 53397, "epoch": 448, "lr": 1.5081261859714253e-05} +{"train_loss": 0.0005637665744870901, "global_step": 53398, "epoch": 448, "lr": 1.5079676182245644e-05} +{"train_loss": 0.0015421294374391437, "global_step": 53399, "epoch": 448, "lr": 1.5078090573339365e-05} +{"train_loss": 0.0004846326482947916, "global_step": 53400, "epoch": 448, "lr": 1.5076505032998505e-05} +{"train_loss": 0.0008048680028878152, "global_step": 53401, "epoch": 448, "lr": 1.5074919561226213e-05} +{"train_loss": 0.0005178247229196131, "global_step": 53402, "epoch": 448, "lr": 1.5073334158025577e-05} +{"train_loss": 0.0005630272207781672, "global_step": 53403, "epoch": 448, "lr": 1.5071748823399723e-05} +{"train_loss": 0.0017075606156140566, "global_step": 53404, "epoch": 448, "lr": 1.5070163557351746e-05} +{"train_loss": 0.0005007474101148546, "global_step": 53405, "epoch": 448, "lr": 1.5068578359884794e-05} +{"train_loss": 0.0011695486027747393, "global_step": 53406, "epoch": 448, "lr": 1.5066993231001947e-05} +{"train_loss": 0.0006434138049371541, "global_step": 53407, "epoch": 448, "lr": 1.506540817070632e-05} +{"train_loss": 0.0009838807163760066, "global_step": 53408, "epoch": 448, "lr": 1.5063823179001041e-05} +{"train_loss": 0.0004878499894402921, "global_step": 53409, "epoch": 448, "lr": 1.5062238255889199e-05} +{"train_loss": 0.0007768249488435686, "global_step": 53410, "epoch": 448, "lr": 1.506065340137393e-05} +{"train_loss": 0.0006521655595861375, "global_step": 53411, "epoch": 448, "lr": 1.5059068615458344e-05} +{"train_loss": 0.0010356182465329766, "global_step": 53412, "epoch": 448, "lr": 1.5057483898145525e-05} +{"train_loss": 0.0005568900378420949, "global_step": 53413, "epoch": 448, "lr": 1.5055899249438616e-05} +{"train_loss": 0.0011130644707009196, "global_step": 53414, "epoch": 448, "lr": 1.5054314669340703e-05} +{"train_loss": 0.0008281327318400145, "global_step": 53415, "epoch": 448, "lr": 1.5052730157854928e-05} +{"train_loss": 0.0005922515410929918, "global_step": 53416, "epoch": 448, "lr": 1.505114571498436e-05} +{"train_loss": 0.0011363080702722073, "global_step": 53417, "epoch": 448, "lr": 1.504956134073216e-05} +{"train_loss": 0.0010316881816834211, "global_step": 53418, "epoch": 448, "lr": 1.5047977035101407e-05} +{"train_loss": 0.0017114505171775818, "global_step": 53419, "epoch": 448, "lr": 1.5046392798095199e-05} +{"train_loss": 0.0004997664946131408, "global_step": 53420, "epoch": 448, "lr": 1.5044808629716684e-05} +{"train_loss": 0.0006681960658170283, "global_step": 53421, "epoch": 448, "lr": 1.5043224529968936e-05} +{"train_loss": 0.0012721249368041754, "global_step": 53422, "epoch": 448, "lr": 1.5041640498855092e-05} +{"train_loss": 0.0010021100752055645, "global_step": 53423, "epoch": 448, "lr": 1.5040056536378244e-05} +{"train_loss": 0.0010344667825847864, "global_step": 53424, "epoch": 448, "lr": 1.5038472642541523e-05} +{"train_loss": 0.000818368629552424, "global_step": 53425, "epoch": 448, "lr": 1.503688881734801e-05} +{"train_loss": 0.0009482720051892102, "global_step": 53426, "epoch": 448, "lr": 1.5035305060800847e-05} +{"train_loss": 0.0006852674414403737, "global_step": 53427, "epoch": 448, "lr": 1.503372137290311e-05} +{"train_loss": 0.0013771435478702188, "global_step": 53428, "epoch": 448, "lr": 1.5032137753657944e-05} +{"train_loss": 0.0004457921313587576, "global_step": 53429, "epoch": 448, "lr": 1.503055420306842e-05} +{"train_loss": 0.0007740691589864613, "global_step": 53430, "epoch": 448, "lr": 1.5028970721137686e-05, "val_loss": 0.015416905283927917} +{"train_loss": 0.0010049125412479043, "global_step": 53431, "epoch": 449, "lr": 1.5027387307868818e-05} +{"train_loss": 0.0011375363683328032, "global_step": 53432, "epoch": 449, "lr": 1.502580396326495e-05} +{"train_loss": 0.0005853432230651379, "global_step": 53433, "epoch": 449, "lr": 1.5024220687329167e-05} +{"train_loss": 0.0010191785404458642, "global_step": 53434, "epoch": 449, "lr": 1.5022637480064605e-05} +{"train_loss": 0.001193283125758171, "global_step": 53435, "epoch": 449, "lr": 1.5021054341474338e-05} +{"train_loss": 0.0006386255845427513, "global_step": 53436, "epoch": 449, "lr": 1.5019471271561514e-05} +{"train_loss": 0.0008684261702001095, "global_step": 53437, "epoch": 449, "lr": 1.5017888270329216e-05} +{"train_loss": 0.001512498245574534, "global_step": 53438, "epoch": 449, "lr": 1.501630533778055e-05} +{"train_loss": 0.0008526325691491365, "global_step": 53439, "epoch": 449, "lr": 1.5014722473918641e-05} +{"train_loss": 0.0007576256757602096, "global_step": 53440, "epoch": 449, "lr": 1.5013139678746568e-05} +{"train_loss": 0.0012611707206815481, "global_step": 53441, "epoch": 449, "lr": 1.501155695226748e-05} +{"train_loss": 0.0004935312317684293, "global_step": 53442, "epoch": 449, "lr": 1.500997429448444e-05} +{"train_loss": 0.0003789433103520423, "global_step": 53443, "epoch": 449, "lr": 1.50083917054006e-05} +{"train_loss": 0.0007916989852674305, "global_step": 53444, "epoch": 449, "lr": 1.5006809185019038e-05} +{"train_loss": 0.0006564200157299638, "global_step": 53445, "epoch": 449, "lr": 1.5005226733342858e-05} +{"train_loss": 0.0011828674469143152, "global_step": 53446, "epoch": 449, "lr": 1.500364435037519e-05} +{"train_loss": 0.0008504324359819293, "global_step": 53447, "epoch": 449, "lr": 1.5002062036119107e-05} +{"train_loss": 0.0010894967708736658, "global_step": 53448, "epoch": 449, "lr": 1.500047979057776e-05} +{"train_loss": 0.0003356003144290298, "global_step": 53449, "epoch": 449, "lr": 1.4998897613754225e-05} +{"train_loss": 0.000979722710326314, "global_step": 53450, "epoch": 449, "lr": 1.4997315505651604e-05} +{"train_loss": 0.0008821883820928633, "global_step": 53451, "epoch": 449, "lr": 1.4995733466273026e-05} +{"train_loss": 0.0016030208207666874, "global_step": 53452, "epoch": 449, "lr": 1.4994151495621572e-05} +{"train_loss": 0.0005956126260571182, "global_step": 53453, "epoch": 449, "lr": 1.4992569593700378e-05} +{"train_loss": 0.0006674452451989055, "global_step": 53454, "epoch": 449, "lr": 1.499098776051252e-05} +{"train_loss": 0.000982698518782854, "global_step": 53455, "epoch": 449, "lr": 1.4989405996061128e-05} +{"train_loss": 0.0007495406898669899, "global_step": 53456, "epoch": 449, "lr": 1.49878243003493e-05} +{"train_loss": 0.001180600025691092, "global_step": 53457, "epoch": 449, "lr": 1.4986242673380125e-05} +{"train_loss": 0.000634814496152103, "global_step": 53458, "epoch": 449, "lr": 1.4984661115156717e-05} +{"train_loss": 0.0011009675217792392, "global_step": 53459, "epoch": 449, "lr": 1.4983079625682206e-05} +{"train_loss": 0.0005838030483573675, "global_step": 53460, "epoch": 449, "lr": 1.4981498204959659e-05} +{"train_loss": 0.0006922514294274151, "global_step": 53461, "epoch": 449, "lr": 1.4979916852992214e-05} +{"train_loss": 0.0004681749560404569, "global_step": 53462, "epoch": 449, "lr": 1.4978335569782947e-05} +{"train_loss": 0.0008764783851802349, "global_step": 53463, "epoch": 449, "lr": 1.4976754355334993e-05} +{"train_loss": 0.000737539550755173, "global_step": 53464, "epoch": 449, "lr": 1.4975173209651422e-05} +{"train_loss": 0.0006390207563526928, "global_step": 53465, "epoch": 449, "lr": 1.4973592132735375e-05} +{"train_loss": 0.0005385263357311487, "global_step": 53466, "epoch": 449, "lr": 1.4972011124589924e-05} +{"train_loss": 0.0012486096238717437, "global_step": 53467, "epoch": 449, "lr": 1.4970430185218198e-05} +{"train_loss": 0.0005721282213926315, "global_step": 53468, "epoch": 449, "lr": 1.496884931462329e-05} +{"train_loss": 0.0008760495111346245, "global_step": 53469, "epoch": 449, "lr": 1.496726851280829e-05} +{"train_loss": 0.000793808838352561, "global_step": 53470, "epoch": 449, "lr": 1.4965687779776333e-05} +{"train_loss": 0.000583478482440114, "global_step": 53471, "epoch": 449, "lr": 1.4964107115530485e-05} +{"train_loss": 0.0005130788777023554, "global_step": 53472, "epoch": 449, "lr": 1.4962526520073888e-05} +{"train_loss": 0.0005847676657140255, "global_step": 53473, "epoch": 449, "lr": 1.4960945993409608e-05} +{"train_loss": 0.0013223006390035152, "global_step": 53474, "epoch": 449, "lr": 1.4959365535540788e-05} +{"train_loss": 0.0007695247186347842, "global_step": 53475, "epoch": 449, "lr": 1.495778514647051e-05} +{"train_loss": 0.000582134525757283, "global_step": 53476, "epoch": 449, "lr": 1.4956204826201858e-05} +{"train_loss": 0.001202934654429555, "global_step": 53477, "epoch": 449, "lr": 1.4954624574737974e-05} +{"train_loss": 0.0008603986934758723, "global_step": 53478, "epoch": 449, "lr": 1.4953044392081922e-05} +{"train_loss": 0.0008253486012108624, "global_step": 53479, "epoch": 449, "lr": 1.4951464278236837e-05} +{"train_loss": 0.001191925024613738, "global_step": 53480, "epoch": 449, "lr": 1.4949884233205807e-05} +{"train_loss": 0.0011583182495087385, "global_step": 53481, "epoch": 449, "lr": 1.4948304256991924e-05} +{"train_loss": 0.001358876354061067, "global_step": 53482, "epoch": 449, "lr": 1.4946724349598312e-05} +{"train_loss": 0.0014051343314349651, "global_step": 53483, "epoch": 449, "lr": 1.4945144511028047e-05} +{"train_loss": 0.00030503905145451427, "global_step": 53484, "epoch": 449, "lr": 1.4943564741284265e-05} +{"train_loss": 0.0004242743889335543, "global_step": 53485, "epoch": 449, "lr": 1.4941985040370032e-05} +{"train_loss": 0.0004460244963411242, "global_step": 53486, "epoch": 449, "lr": 1.4940405408288477e-05} +{"train_loss": 0.00089146668324247, "global_step": 53487, "epoch": 449, "lr": 1.4938825845042693e-05} +{"train_loss": 0.003044516546651721, "global_step": 53488, "epoch": 449, "lr": 1.4937246350635764e-05} +{"train_loss": 0.0005815819022245705, "global_step": 53489, "epoch": 449, "lr": 1.4935666925070823e-05} +{"train_loss": 0.0008994000963866711, "global_step": 53490, "epoch": 449, "lr": 1.4934087568350935e-05} +{"train_loss": 0.0010484238155186176, "global_step": 53491, "epoch": 449, "lr": 1.4932508280479234e-05} +{"train_loss": 0.0011809910647571087, "global_step": 53492, "epoch": 449, "lr": 1.4930929061458799e-05} +{"train_loss": 0.0009561550104990602, "global_step": 53493, "epoch": 449, "lr": 1.4929349911292728e-05} +{"train_loss": 0.0011055542854592204, "global_step": 53494, "epoch": 449, "lr": 1.4927770829984155e-05} +{"train_loss": 0.0017371615394949913, "global_step": 53495, "epoch": 449, "lr": 1.492619181753614e-05} +{"train_loss": 0.0011396448826417327, "global_step": 53496, "epoch": 449, "lr": 1.4924612873951809e-05} +{"train_loss": 0.0014716117875650525, "global_step": 53497, "epoch": 449, "lr": 1.4923033999234249e-05} +{"train_loss": 0.0006491701351478696, "global_step": 53498, "epoch": 449, "lr": 1.4921455193386575e-05} +{"train_loss": 0.0012393889483064413, "global_step": 53499, "epoch": 449, "lr": 1.4919876456411874e-05} +{"train_loss": 0.0009474347461946309, "global_step": 53500, "epoch": 449, "lr": 1.491829778831323e-05} +{"train_loss": 0.001536182826384902, "global_step": 53501, "epoch": 449, "lr": 1.491671918909378e-05} +{"train_loss": 0.0011186983902007341, "global_step": 53502, "epoch": 449, "lr": 1.4915140658756588e-05} +{"train_loss": 0.0015494691906496882, "global_step": 53503, "epoch": 449, "lr": 1.4913562197304787e-05} +{"train_loss": 0.0007058827904984355, "global_step": 53504, "epoch": 449, "lr": 1.4911983804741437e-05} +{"train_loss": 0.0006592057179659605, "global_step": 53505, "epoch": 449, "lr": 1.4910405481069678e-05} +{"train_loss": 0.0007961969240568578, "global_step": 53506, "epoch": 449, "lr": 1.4908827226292588e-05} +{"train_loss": 0.0010779611766338348, "global_step": 53507, "epoch": 449, "lr": 1.490724904041325e-05} +{"train_loss": 0.0017228180076926947, "global_step": 53508, "epoch": 449, "lr": 1.4905670923434794e-05} +{"train_loss": 0.001401362707838416, "global_step": 53509, "epoch": 449, "lr": 1.4904092875360292e-05} +{"train_loss": 0.000678405340295285, "global_step": 53510, "epoch": 449, "lr": 1.4902514896192871e-05} +{"train_loss": 0.0005790205905213952, "global_step": 53511, "epoch": 449, "lr": 1.4900936985935593e-05} +{"train_loss": 0.0008161811856552958, "global_step": 53512, "epoch": 449, "lr": 1.489935914459159e-05} +{"train_loss": 0.0005808912101201713, "global_step": 53513, "epoch": 449, "lr": 1.4897781372163949e-05} +{"train_loss": 0.0009882076410576701, "global_step": 53514, "epoch": 449, "lr": 1.4896203668655745e-05} +{"train_loss": 0.0008129379129968584, "global_step": 53515, "epoch": 449, "lr": 1.4894626034070114e-05} +{"train_loss": 0.001205569482408464, "global_step": 53516, "epoch": 449, "lr": 1.4893048468410115e-05} +{"train_loss": 0.0013429910177364945, "global_step": 53517, "epoch": 449, "lr": 1.4891470971678883e-05} +{"train_loss": 0.001076219603419304, "global_step": 53518, "epoch": 449, "lr": 1.4889893543879497e-05} +{"train_loss": 0.0010066945105791092, "global_step": 53519, "epoch": 449, "lr": 1.4888316185015038e-05} +{"train_loss": 0.00039965208270587027, "global_step": 53520, "epoch": 449, "lr": 1.4886738895088631e-05} +{"train_loss": 0.0006519368616864085, "global_step": 53521, "epoch": 449, "lr": 1.4885161674103349e-05} +{"train_loss": 0.0015511104138568044, "global_step": 53522, "epoch": 449, "lr": 1.4883584522062317e-05} +{"train_loss": 0.0006984049105085433, "global_step": 53523, "epoch": 449, "lr": 1.4882007438968597e-05} +{"train_loss": 0.0011128414189442992, "global_step": 53524, "epoch": 449, "lr": 1.488043042482532e-05} +{"train_loss": 0.0006721543031744659, "global_step": 53525, "epoch": 449, "lr": 1.4878853479635551e-05} +{"train_loss": 0.0006757404189556837, "global_step": 53526, "epoch": 449, "lr": 1.4877276603402418e-05} +{"train_loss": 0.0011070627951994538, "global_step": 53527, "epoch": 449, "lr": 1.4875699796128984e-05} +{"train_loss": 0.0009010889334604144, "global_step": 53528, "epoch": 449, "lr": 1.4874123057818357e-05} +{"train_loss": 0.0006670673610642552, "global_step": 53529, "epoch": 449, "lr": 1.4872546388473658e-05} +{"train_loss": 0.000643657345790416, "global_step": 53530, "epoch": 449, "lr": 1.4870969788097956e-05} +{"train_loss": 0.0020423149690032005, "global_step": 53531, "epoch": 449, "lr": 1.4869393256694342e-05} +{"train_loss": 0.0009644792880862951, "global_step": 53532, "epoch": 449, "lr": 1.4867816794265933e-05} +{"train_loss": 0.0010427485685795546, "global_step": 53533, "epoch": 449, "lr": 1.4866240400815795e-05} +{"train_loss": 0.0008508797036483884, "global_step": 53534, "epoch": 449, "lr": 1.4864664076347062e-05} +{"train_loss": 0.0005419586668722332, "global_step": 53535, "epoch": 449, "lr": 1.4863087820862786e-05} +{"train_loss": 0.0005168195348232985, "global_step": 53536, "epoch": 449, "lr": 1.4861511634366098e-05} +{"train_loss": 0.0007840332109481096, "global_step": 53537, "epoch": 449, "lr": 1.4859935516860084e-05} +{"train_loss": 0.0004421257181093097, "global_step": 53538, "epoch": 449, "lr": 1.4858359468347816e-05} +{"train_loss": 0.0005033693159930408, "global_step": 53539, "epoch": 449, "lr": 1.4856783488832416e-05} +{"train_loss": 0.00043435703264549375, "global_step": 53540, "epoch": 449, "lr": 1.4855207578316954e-05} +{"train_loss": 0.0006222333176992834, "global_step": 53541, "epoch": 449, "lr": 1.4853631736804551e-05} +{"train_loss": 0.0005353640881367028, "global_step": 53542, "epoch": 449, "lr": 1.4852055964298272e-05} +{"train_loss": 0.0011492243502289057, "global_step": 53543, "epoch": 449, "lr": 1.4850480260801248e-05} +{"train_loss": 0.0010168757289648056, "global_step": 53544, "epoch": 449, "lr": 1.4848904626316546e-05} +{"train_loss": 0.0010543818352743983, "global_step": 53545, "epoch": 449, "lr": 1.4847329060847247e-05} +{"train_loss": 0.0005716950399801135, "global_step": 53546, "epoch": 449, "lr": 1.484575356439648e-05} +{"train_loss": 0.000658373930491507, "global_step": 53547, "epoch": 449, "lr": 1.4844178136967302e-05} +{"train_loss": 0.0005176677950657904, "global_step": 53548, "epoch": 449, "lr": 1.4842602778562842e-05} +{"train_loss": 0.000910215125763554, "global_step": 53549, "epoch": 449, "lr": 1.4841027489186177e-05, "val_loss": 0.013923853635787964} +{"train_loss": 0.0008477152441628277, "global_step": 53550, "epoch": 450, "lr": 1.4839452268840381e-05} +{"train_loss": 0.0010456274030730128, "global_step": 53551, "epoch": 450, "lr": 1.4837877117528582e-05} +{"train_loss": 0.001744543667882681, "global_step": 53552, "epoch": 450, "lr": 1.4836302035253836e-05} +{"train_loss": 0.0008361563668586314, "global_step": 53553, "epoch": 450, "lr": 1.4834727022019268e-05} +{"train_loss": 0.0007259760750457644, "global_step": 53554, "epoch": 450, "lr": 1.4833152077827944e-05} +{"train_loss": 0.0006004403112456203, "global_step": 53555, "epoch": 450, "lr": 1.4831577202682984e-05} +{"train_loss": 0.001077207736670971, "global_step": 53556, "epoch": 450, "lr": 1.483000239658745e-05} +{"train_loss": 0.001099410466849804, "global_step": 53557, "epoch": 450, "lr": 1.4828427659544463e-05} +{"train_loss": 0.0008215793059207499, "global_step": 53558, "epoch": 450, "lr": 1.4826852991557089e-05} +{"train_loss": 0.0005360310315154493, "global_step": 53559, "epoch": 450, "lr": 1.4825278392628445e-05} +{"train_loss": 0.0006474010879173875, "global_step": 53560, "epoch": 450, "lr": 1.482370386276159e-05} +{"train_loss": 0.0003726813883986324, "global_step": 53561, "epoch": 450, "lr": 1.4822129401959655e-05} +{"train_loss": 0.0005716175655834377, "global_step": 53562, "epoch": 450, "lr": 1.482055501022569e-05} +{"train_loss": 0.0008794044842943549, "global_step": 53563, "epoch": 450, "lr": 1.4818980687562829e-05} +{"train_loss": 0.0006534263375215232, "global_step": 53564, "epoch": 450, "lr": 1.4817406433974118e-05} +{"train_loss": 0.0004083583189640194, "global_step": 53565, "epoch": 450, "lr": 1.4815832249462691e-05} +{"train_loss": 0.0009160689660347998, "global_step": 53566, "epoch": 450, "lr": 1.48142581340316e-05} +{"train_loss": 0.0005955124506726861, "global_step": 53567, "epoch": 450, "lr": 1.4812684087683976e-05} +{"train_loss": 0.0006342744454741478, "global_step": 53568, "epoch": 450, "lr": 1.4811110110422883e-05} +{"train_loss": 0.0005485844449140131, "global_step": 53569, "epoch": 450, "lr": 1.4809536202251401e-05} +{"train_loss": 0.001030314015224576, "global_step": 53570, "epoch": 450, "lr": 1.4807962363172651e-05} +{"train_loss": 0.0005386138800531626, "global_step": 53571, "epoch": 450, "lr": 1.4806388593189685e-05} +{"train_loss": 0.0006171334534883499, "global_step": 53572, "epoch": 450, "lr": 1.4804814892305641e-05} +{"train_loss": 0.0009891754016280174, "global_step": 53573, "epoch": 450, "lr": 1.480324126052356e-05} +{"train_loss": 0.0007627761224284768, "global_step": 53574, "epoch": 450, "lr": 1.4801667697846571e-05} +{"train_loss": 0.000937274016905576, "global_step": 53575, "epoch": 450, "lr": 1.4800094204277753e-05} +{"train_loss": 0.0012738098157569766, "global_step": 53576, "epoch": 450, "lr": 1.4798520779820168e-05} +{"train_loss": 0.0007663483265787363, "global_step": 53577, "epoch": 450, "lr": 1.4796947424476947e-05} +{"train_loss": 0.0008458927040919662, "global_step": 53578, "epoch": 450, "lr": 1.4795374138251138e-05} +{"train_loss": 0.0004911273717880249, "global_step": 53579, "epoch": 450, "lr": 1.4793800921145873e-05} +{"train_loss": 0.0010421602055430412, "global_step": 53580, "epoch": 450, "lr": 1.4792227773164196e-05} +{"train_loss": 0.0010137378703802824, "global_step": 53581, "epoch": 450, "lr": 1.4790654694309236e-05} +{"train_loss": 0.0006547041120938957, "global_step": 53582, "epoch": 450, "lr": 1.4789081684584066e-05} +{"train_loss": 0.0009612634312361479, "global_step": 53583, "epoch": 450, "lr": 1.4787508743991757e-05} +{"train_loss": 0.0005282366182655096, "global_step": 53584, "epoch": 450, "lr": 1.4785935872535428e-05} +{"train_loss": 0.000559357285965234, "global_step": 53585, "epoch": 450, "lr": 1.4784363070218133e-05} +{"train_loss": 0.0003511536051519215, "global_step": 53586, "epoch": 450, "lr": 1.4782790337042995e-05} +{"train_loss": 0.00048598169814795256, "global_step": 53587, "epoch": 450, "lr": 1.4781217673013088e-05} +{"train_loss": 0.0009064523037523031, "global_step": 53588, "epoch": 450, "lr": 1.4779645078131483e-05} +{"train_loss": 0.0007122609531506896, "global_step": 53589, "epoch": 450, "lr": 1.4778072552401295e-05} +{"train_loss": 0.0006010631332173944, "global_step": 53590, "epoch": 450, "lr": 1.4776500095825584e-05} +{"train_loss": 0.00042218973976559937, "global_step": 53591, "epoch": 450, "lr": 1.4774927708407454e-05} +{"train_loss": 0.0008426003041677177, "global_step": 53592, "epoch": 450, "lr": 1.4773355390150001e-05} +{"train_loss": 0.0004939982900395989, "global_step": 53593, "epoch": 450, "lr": 1.4771783141056288e-05} +{"train_loss": 0.0008027006988413632, "global_step": 53594, "epoch": 450, "lr": 1.4770210961129432e-05} +{"train_loss": 0.0005178798455744982, "global_step": 53595, "epoch": 450, "lr": 1.476863885037249e-05} +{"train_loss": 0.0007286404725164175, "global_step": 53596, "epoch": 450, "lr": 1.4767066808788571e-05} +{"train_loss": 0.0008572107180953026, "global_step": 53597, "epoch": 450, "lr": 1.4765494836380744e-05} +{"train_loss": 0.0008884764392860234, "global_step": 53598, "epoch": 450, "lr": 1.4763922933152113e-05} +{"train_loss": 0.00044382180203683674, "global_step": 53599, "epoch": 450, "lr": 1.4762351099105759e-05} +{"train_loss": 0.0009413147927261889, "global_step": 53600, "epoch": 450, "lr": 1.4760779334244746e-05} +{"train_loss": 0.0006873949896544218, "global_step": 53601, "epoch": 450, "lr": 1.4759207638572193e-05} +{"train_loss": 0.000302102038403973, "global_step": 53602, "epoch": 450, "lr": 1.4757636012091159e-05} +{"train_loss": 0.0008167812484316528, "global_step": 53603, "epoch": 450, "lr": 1.4756064454804752e-05} +{"train_loss": 0.0007271863869391382, "global_step": 53604, "epoch": 450, "lr": 1.4754492966716032e-05} +{"train_loss": 0.0005481543485075235, "global_step": 53605, "epoch": 450, "lr": 1.475292154782812e-05} +{"train_loss": 0.00037599907955154777, "global_step": 53606, "epoch": 450, "lr": 1.4751350198144077e-05} +{"train_loss": 0.00032525009009987116, "global_step": 53607, "epoch": 450, "lr": 1.474977891766698e-05} +{"train_loss": 0.0005314440932124853, "global_step": 53608, "epoch": 450, "lr": 1.4748207706399936e-05} +{"train_loss": 0.0012354586506262422, "global_step": 53609, "epoch": 450, "lr": 1.4746636564346012e-05} +{"train_loss": 0.0007979622459970415, "global_step": 53610, "epoch": 450, "lr": 1.4745065491508308e-05} +{"train_loss": 0.0010891365818679333, "global_step": 53611, "epoch": 450, "lr": 1.4743494487889892e-05} +{"train_loss": 0.0009616395109333098, "global_step": 53612, "epoch": 450, "lr": 1.4741923553493876e-05} +{"train_loss": 0.0005906512960791588, "global_step": 53613, "epoch": 450, "lr": 1.4740352688323317e-05} +{"train_loss": 0.00046364287845790386, "global_step": 53614, "epoch": 450, "lr": 1.4738781892381299e-05} +{"train_loss": 0.0014751643175259233, "global_step": 53615, "epoch": 450, "lr": 1.4737211165670934e-05} +{"train_loss": 0.0007363276090472937, "global_step": 53616, "epoch": 450, "lr": 1.4735640508195265e-05} +{"train_loss": 0.0010382449254393578, "global_step": 53617, "epoch": 450, "lr": 1.4734069919957422e-05} +{"train_loss": 0.0002956506214104593, "global_step": 53618, "epoch": 450, "lr": 1.473249940096046e-05} +{"train_loss": 0.0003885911137331277, "global_step": 53619, "epoch": 450, "lr": 1.473092895120745e-05} +{"train_loss": 0.0010797367431223392, "global_step": 53620, "epoch": 450, "lr": 1.4729358570701513e-05} +{"train_loss": 0.0006909706280566752, "global_step": 53621, "epoch": 450, "lr": 1.4727788259445696e-05} +{"train_loss": 0.0009076038259081542, "global_step": 53622, "epoch": 450, "lr": 1.4726218017443111e-05} +{"train_loss": 0.0006751182372681797, "global_step": 53623, "epoch": 450, "lr": 1.4724647844696815e-05} +{"train_loss": 0.0015392019413411617, "global_step": 53624, "epoch": 450, "lr": 1.4723077741209918e-05} +{"train_loss": 0.0010811961255967617, "global_step": 53625, "epoch": 450, "lr": 1.4721507706985477e-05} +{"train_loss": 0.0004169646999798715, "global_step": 53626, "epoch": 450, "lr": 1.4719937742026585e-05} +{"train_loss": 0.0010761095909401774, "global_step": 53627, "epoch": 450, "lr": 1.471836784633634e-05} +{"train_loss": 0.0008957265526987612, "global_step": 53628, "epoch": 450, "lr": 1.4716798019917799e-05} +{"train_loss": 0.0007423394126817584, "global_step": 53629, "epoch": 450, "lr": 1.4715228262774067e-05} +{"train_loss": 0.000758053211029619, "global_step": 53630, "epoch": 450, "lr": 1.4713658574908202e-05} +{"train_loss": 0.001228890847414732, "global_step": 53631, "epoch": 450, "lr": 1.4712088956323311e-05} +{"train_loss": 0.0010325232287868857, "global_step": 53632, "epoch": 450, "lr": 1.4710519407022466e-05} +{"train_loss": 0.0008945863228291273, "global_step": 53633, "epoch": 450, "lr": 1.470894992700873e-05} +{"train_loss": 0.0011334390146657825, "global_step": 53634, "epoch": 450, "lr": 1.4707380516285219e-05} +{"train_loss": 0.0010167123982682824, "global_step": 53635, "epoch": 450, "lr": 1.4705811174854977e-05} +{"train_loss": 0.000618457212112844, "global_step": 53636, "epoch": 450, "lr": 1.4704241902721116e-05} +{"train_loss": 0.0005437282379716635, "global_step": 53637, "epoch": 450, "lr": 1.470267269988671e-05} +{"train_loss": 0.0006752173649147153, "global_step": 53638, "epoch": 450, "lr": 1.4701103566354823e-05} +{"train_loss": 0.0006254788604564965, "global_step": 53639, "epoch": 450, "lr": 1.469953450212856e-05} +{"train_loss": 0.000632061914075166, "global_step": 53640, "epoch": 450, "lr": 1.469796550721097e-05} +{"train_loss": 0.0008684960776008666, "global_step": 53641, "epoch": 450, "lr": 1.4696396581605176e-05} +{"train_loss": 0.0006547392113134265, "global_step": 53642, "epoch": 450, "lr": 1.4694827725314214e-05} +{"train_loss": 0.0007733350503258407, "global_step": 53643, "epoch": 450, "lr": 1.4693258938341204e-05} +{"train_loss": 0.00034129375126212835, "global_step": 53644, "epoch": 450, "lr": 1.4691690220689208e-05} +{"train_loss": 0.0007979012443684042, "global_step": 53645, "epoch": 450, "lr": 1.4690121572361294e-05} +{"train_loss": 0.0005510495393536985, "global_step": 53646, "epoch": 450, "lr": 1.4688552993360566e-05} +{"train_loss": 0.0009939257288351655, "global_step": 53647, "epoch": 450, "lr": 1.4686984483690075e-05} +{"train_loss": 0.0009016628609970212, "global_step": 53648, "epoch": 450, "lr": 1.4685416043352934e-05} +{"train_loss": 0.0007842483464628458, "global_step": 53649, "epoch": 450, "lr": 1.4683847672352207e-05} +{"train_loss": 0.0008680476457811892, "global_step": 53650, "epoch": 450, "lr": 1.4682279370690955e-05} +{"train_loss": 0.0007629018509760499, "global_step": 53651, "epoch": 450, "lr": 1.4680711138372288e-05} +{"train_loss": 0.0004500426584854722, "global_step": 53652, "epoch": 450, "lr": 1.4679142975399262e-05} +{"train_loss": 0.0007412899867631495, "global_step": 53653, "epoch": 450, "lr": 1.4677574881774975e-05} +{"train_loss": 0.0009606528910808265, "global_step": 53654, "epoch": 450, "lr": 1.4676006857502484e-05} +{"train_loss": 0.0005696530570276082, "global_step": 53655, "epoch": 450, "lr": 1.4674438902584892e-05} +{"train_loss": 0.000607042049523443, "global_step": 53656, "epoch": 450, "lr": 1.4672871017025253e-05} +{"train_loss": 0.0006804551812820137, "global_step": 53657, "epoch": 450, "lr": 1.4671303200826675e-05} +{"train_loss": 0.0012198236072435975, "global_step": 53658, "epoch": 450, "lr": 1.4669735453992194e-05} +{"train_loss": 0.0005857966607436538, "global_step": 53659, "epoch": 450, "lr": 1.4668167776524938e-05} +{"train_loss": 0.000640530081000179, "global_step": 53660, "epoch": 450, "lr": 1.466660016842794e-05} +{"train_loss": 0.0004617126251105219, "global_step": 53661, "epoch": 450, "lr": 1.46650326297043e-05} +{"train_loss": 0.0005047285230830312, "global_step": 53662, "epoch": 450, "lr": 1.466346516035711e-05} +{"train_loss": 0.0004960171063430607, "global_step": 53663, "epoch": 450, "lr": 1.4661897760389426e-05} +{"train_loss": 0.0012503163889050484, "global_step": 53664, "epoch": 450, "lr": 1.4660330429804319e-05} +{"train_loss": 0.0008856149506755173, "global_step": 53665, "epoch": 450, "lr": 1.465876316860489e-05} +{"train_loss": 0.0003806185268331319, "global_step": 53666, "epoch": 450, "lr": 1.465719597679419e-05} +{"train_loss": 0.000817479332908988, "global_step": 53667, "epoch": 450, "lr": 1.4655628854375324e-05} +{"train_loss": 0.0007591283153312109, "global_step": 53668, "epoch": 450, "lr": 1.465406180135136e-05, "val_loss": 0.013083764351904392, "train_action_mse_error": 9.835525816015434e-06} +{"train_loss": 0.0008707201341167092, "global_step": 53669, "epoch": 451, "lr": 1.4652494817725349e-05} +{"train_loss": 0.00047384490608237684, "global_step": 53670, "epoch": 451, "lr": 1.4650927903500405e-05} +{"train_loss": 0.0006517249858006835, "global_step": 53671, "epoch": 451, "lr": 1.4649361058679572e-05} +{"train_loss": 0.0006530415848828852, "global_step": 53672, "epoch": 451, "lr": 1.4647794283265958e-05} +{"train_loss": 0.000553065852727741, "global_step": 53673, "epoch": 451, "lr": 1.4646227577262606e-05} +{"train_loss": 0.0007134692277759314, "global_step": 53674, "epoch": 451, "lr": 1.4644660940672627e-05} +{"train_loss": 0.00044880094355903566, "global_step": 53675, "epoch": 451, "lr": 1.4643094373499077e-05} +{"train_loss": 0.0004814224666915834, "global_step": 53676, "epoch": 451, "lr": 1.464152787574502e-05} +{"train_loss": 0.0004202983109280467, "global_step": 53677, "epoch": 451, "lr": 1.4639961447413564e-05} +{"train_loss": 0.0007599375676363707, "global_step": 53678, "epoch": 451, "lr": 1.4638395088507745e-05} +{"train_loss": 0.0006283792899921536, "global_step": 53679, "epoch": 451, "lr": 1.4636828799030677e-05} +{"train_loss": 0.0007805067580193281, "global_step": 53680, "epoch": 451, "lr": 1.4635262578985398e-05} +{"train_loss": 0.0009692451567389071, "global_step": 53681, "epoch": 451, "lr": 1.4633696428375027e-05} +{"train_loss": 0.000978761469013989, "global_step": 53682, "epoch": 451, "lr": 1.4632130347202605e-05} +{"train_loss": 0.00039573790854774415, "global_step": 53683, "epoch": 451, "lr": 1.4630564335471209e-05} +{"train_loss": 0.001126875402405858, "global_step": 53684, "epoch": 451, "lr": 1.4628998393183935e-05} +{"train_loss": 0.0007945576217025518, "global_step": 53685, "epoch": 451, "lr": 1.4627432520343826e-05} +{"train_loss": 0.0010371020762249827, "global_step": 53686, "epoch": 451, "lr": 1.462586671695399e-05} +{"train_loss": 0.0006339189712889493, "global_step": 53687, "epoch": 451, "lr": 1.4624300983017487e-05} +{"train_loss": 0.0005647393991239369, "global_step": 53688, "epoch": 451, "lr": 1.4622735318537372e-05} +{"train_loss": 0.0006107985973358154, "global_step": 53689, "epoch": 451, "lr": 1.4621169723516736e-05} +{"train_loss": 0.0013108589919283986, "global_step": 53690, "epoch": 451, "lr": 1.4619604197958675e-05} +{"train_loss": 0.00040668059955351055, "global_step": 53691, "epoch": 451, "lr": 1.461803874186622e-05} +{"train_loss": 0.00047474089660681784, "global_step": 53692, "epoch": 451, "lr": 1.4616473355242483e-05} +{"train_loss": 0.0005745639209635556, "global_step": 53693, "epoch": 451, "lr": 1.4614908038090507e-05} +{"train_loss": 0.0007486778777092695, "global_step": 53694, "epoch": 451, "lr": 1.4613342790413392e-05} +{"train_loss": 0.0016059972112998366, "global_step": 53695, "epoch": 451, "lr": 1.4611777612214184e-05} +{"train_loss": 0.001033195061609149, "global_step": 53696, "epoch": 451, "lr": 1.4610212503495985e-05} +{"train_loss": 0.00032149432809092104, "global_step": 53697, "epoch": 451, "lr": 1.4608647464261833e-05} +{"train_loss": 0.0009115117136389017, "global_step": 53698, "epoch": 451, "lr": 1.460708249451484e-05} +{"train_loss": 0.0007921013166196644, "global_step": 53699, "epoch": 451, "lr": 1.4605517594258045e-05} +{"train_loss": 0.0004742532328236848, "global_step": 53700, "epoch": 451, "lr": 1.460395276349455e-05} +{"train_loss": 0.0007442939677275717, "global_step": 53701, "epoch": 451, "lr": 1.4602388002227414e-05} +{"train_loss": 0.000845964124891907, "global_step": 53702, "epoch": 451, "lr": 1.4600823310459688e-05} +{"train_loss": 0.0005189091898500919, "global_step": 53703, "epoch": 451, "lr": 1.4599258688194479e-05} +{"train_loss": 0.0008363963570445776, "global_step": 53704, "epoch": 451, "lr": 1.459769413543483e-05} +{"train_loss": 0.000979105243459344, "global_step": 53705, "epoch": 451, "lr": 1.4596129652183843e-05} +{"train_loss": 0.0009614732698537409, "global_step": 53706, "epoch": 451, "lr": 1.4594565238444569e-05} +{"train_loss": 0.0005208002403378487, "global_step": 53707, "epoch": 451, "lr": 1.4593000894220071e-05} +{"train_loss": 0.0004846074734814465, "global_step": 53708, "epoch": 451, "lr": 1.4591436619513449e-05} +{"train_loss": 0.0007636501686647534, "global_step": 53709, "epoch": 451, "lr": 1.4589872414327742e-05} +{"train_loss": 0.0009940018644556403, "global_step": 53710, "epoch": 451, "lr": 1.4588308278666051e-05} +{"train_loss": 0.0010033852886408567, "global_step": 53711, "epoch": 451, "lr": 1.4586744212531423e-05} +{"train_loss": 0.0009071030654013157, "global_step": 53712, "epoch": 451, "lr": 1.4585180215926953e-05} +{"train_loss": 0.000600133091211319, "global_step": 53713, "epoch": 451, "lr": 1.4583616288855695e-05} +{"train_loss": 0.0016229667235165834, "global_step": 53714, "epoch": 451, "lr": 1.458205243132071e-05} +{"train_loss": 0.0006796338129788637, "global_step": 53715, "epoch": 451, "lr": 1.4580488643325097e-05} +{"train_loss": 0.0004077928315382451, "global_step": 53716, "epoch": 451, "lr": 1.4578924924871895e-05} +{"train_loss": 0.0007026066887192428, "global_step": 53717, "epoch": 451, "lr": 1.4577361275964202e-05} +{"train_loss": 0.0005880079115740955, "global_step": 53718, "epoch": 451, "lr": 1.4575797696605082e-05} +{"train_loss": 0.0013902600621804595, "global_step": 53719, "epoch": 451, "lr": 1.4574234186797575e-05} +{"train_loss": 0.0007139918161556125, "global_step": 53720, "epoch": 451, "lr": 1.4572670746544797e-05} +{"train_loss": 0.0006657529156655073, "global_step": 53721, "epoch": 451, "lr": 1.4571107375849773e-05} +{"train_loss": 0.0006496495916508138, "global_step": 53722, "epoch": 451, "lr": 1.4569544074715618e-05} +{"train_loss": 0.0010125203989446163, "global_step": 53723, "epoch": 451, "lr": 1.4567980843145356e-05} +{"train_loss": 0.001370736281387508, "global_step": 53724, "epoch": 451, "lr": 1.456641768114208e-05} +{"train_loss": 0.002114759525284171, "global_step": 53725, "epoch": 451, "lr": 1.4564854588708877e-05} +{"train_loss": 0.0005590232904069126, "global_step": 53726, "epoch": 451, "lr": 1.4563291565848775e-05} +{"train_loss": 0.0005363772506825626, "global_step": 53727, "epoch": 451, "lr": 1.4561728612564884e-05} +{"train_loss": 0.0008361871005035937, "global_step": 53728, "epoch": 451, "lr": 1.4560165728860237e-05} +{"train_loss": 0.0004618213861249387, "global_step": 53729, "epoch": 451, "lr": 1.4558602914737934e-05} +{"train_loss": 0.0004567222495097667, "global_step": 53730, "epoch": 451, "lr": 1.4557040170201009e-05} +{"train_loss": 0.000642994069494307, "global_step": 53731, "epoch": 451, "lr": 1.4555477495252567e-05} +{"train_loss": 0.0015573239652439952, "global_step": 53732, "epoch": 451, "lr": 1.4553914889895658e-05} +{"train_loss": 0.0007047333056107163, "global_step": 53733, "epoch": 451, "lr": 1.455235235413333e-05} +{"train_loss": 0.00034942812635563314, "global_step": 53734, "epoch": 451, "lr": 1.4550789887968697e-05} +{"train_loss": 0.0012083331821486354, "global_step": 53735, "epoch": 451, "lr": 1.4549227491404777e-05} +{"train_loss": 0.0010083119850605726, "global_step": 53736, "epoch": 451, "lr": 1.454766516444468e-05} +{"train_loss": 0.0013012962881475687, "global_step": 53737, "epoch": 451, "lr": 1.4546102907091452e-05} +{"train_loss": 0.0010445751249790192, "global_step": 53738, "epoch": 451, "lr": 1.4544540719348154e-05} +{"train_loss": 0.001345417695119977, "global_step": 53739, "epoch": 451, "lr": 1.4542978601217871e-05} +{"train_loss": 0.00070849439362064, "global_step": 53740, "epoch": 451, "lr": 1.4541416552703652e-05} +{"train_loss": 0.0004579750238917768, "global_step": 53741, "epoch": 451, "lr": 1.453985457380858e-05} +{"train_loss": 0.0005313029978424311, "global_step": 53742, "epoch": 451, "lr": 1.4538292664535708e-05} +{"train_loss": 0.001161785563454032, "global_step": 53743, "epoch": 451, "lr": 1.4536730824888123e-05} +{"train_loss": 0.0007273054798133671, "global_step": 53744, "epoch": 451, "lr": 1.453516905486888e-05} +{"train_loss": 0.001148063107393682, "global_step": 53745, "epoch": 451, "lr": 1.4533607354481027e-05} +{"train_loss": 0.0008040334796532989, "global_step": 53746, "epoch": 451, "lr": 1.4532045723727661e-05} +{"train_loss": 0.0004926862311549485, "global_step": 53747, "epoch": 451, "lr": 1.4530484162611819e-05} +{"train_loss": 0.0008254441781900823, "global_step": 53748, "epoch": 451, "lr": 1.4528922671136597e-05} +{"train_loss": 0.0007454144069924951, "global_step": 53749, "epoch": 451, "lr": 1.4527361249305033e-05} +{"train_loss": 0.0006239588838070631, "global_step": 53750, "epoch": 451, "lr": 1.4525799897120218e-05} +{"train_loss": 0.0007279565325006843, "global_step": 53751, "epoch": 451, "lr": 1.4524238614585207e-05} +{"train_loss": 0.0008577478001825511, "global_step": 53752, "epoch": 451, "lr": 1.4522677401703044e-05} +{"train_loss": 0.0010744845494627953, "global_step": 53753, "epoch": 451, "lr": 1.4521116258476836e-05} +{"train_loss": 0.0005258998135104775, "global_step": 53754, "epoch": 451, "lr": 1.4519555184909606e-05} +{"train_loss": 0.0007987146964296699, "global_step": 53755, "epoch": 451, "lr": 1.4517994181004457e-05} +{"train_loss": 0.000895465025678277, "global_step": 53756, "epoch": 451, "lr": 1.4516433246764415e-05} +{"train_loss": 0.000653413706459105, "global_step": 53757, "epoch": 451, "lr": 1.4514872382192584e-05} +{"train_loss": 0.0009612857247702777, "global_step": 53758, "epoch": 451, "lr": 1.4513311587291994e-05} +{"train_loss": 0.00039663061033934355, "global_step": 53759, "epoch": 451, "lr": 1.4511750862065731e-05} +{"train_loss": 0.000861896201968193, "global_step": 53760, "epoch": 451, "lr": 1.4510190206516866e-05} +{"train_loss": 0.0009061822202056646, "global_step": 53761, "epoch": 451, "lr": 1.4508629620648435e-05} +{"train_loss": 0.000746141595300287, "global_step": 53762, "epoch": 451, "lr": 1.4507069104463527e-05} +{"train_loss": 0.0005508074536919594, "global_step": 53763, "epoch": 451, "lr": 1.4505508657965206e-05} +{"train_loss": 0.000796991924289614, "global_step": 53764, "epoch": 451, "lr": 1.450394828115651e-05} +{"train_loss": 0.00045829996815882623, "global_step": 53765, "epoch": 451, "lr": 1.4502387974040531e-05} +{"train_loss": 0.0006427038460969925, "global_step": 53766, "epoch": 451, "lr": 1.4500827736620304e-05} +{"train_loss": 0.0016521846409887075, "global_step": 53767, "epoch": 451, "lr": 1.4499267568898928e-05} +{"train_loss": 0.00045766396215185523, "global_step": 53768, "epoch": 451, "lr": 1.4497707470879452e-05} +{"train_loss": 0.0011099940165877342, "global_step": 53769, "epoch": 451, "lr": 1.4496147442564912e-05} +{"train_loss": 0.0004605390422511846, "global_step": 53770, "epoch": 451, "lr": 1.449458748395841e-05} +{"train_loss": 0.0016784195322543383, "global_step": 53771, "epoch": 451, "lr": 1.449302759506298e-05} +{"train_loss": 0.00031778865377418697, "global_step": 53772, "epoch": 451, "lr": 1.4491467775881712e-05} +{"train_loss": 0.000958765740506351, "global_step": 53773, "epoch": 451, "lr": 1.4489908026417636e-05} +{"train_loss": 0.0005181516171433032, "global_step": 53774, "epoch": 451, "lr": 1.4488348346673847e-05} +{"train_loss": 0.0007386275101453066, "global_step": 53775, "epoch": 451, "lr": 1.4486788736653389e-05} +{"train_loss": 0.0007736681145615876, "global_step": 53776, "epoch": 451, "lr": 1.4485229196359318e-05} +{"train_loss": 0.00028825667686760426, "global_step": 53777, "epoch": 451, "lr": 1.4483669725794718e-05} +{"train_loss": 0.0011699720053002238, "global_step": 53778, "epoch": 451, "lr": 1.4482110324962622e-05} +{"train_loss": 0.000913234893232584, "global_step": 53779, "epoch": 451, "lr": 1.4480550993866127e-05} +{"train_loss": 0.0009984864154830575, "global_step": 53780, "epoch": 451, "lr": 1.4478991732508257e-05} +{"train_loss": 0.0007539776270277798, "global_step": 53781, "epoch": 451, "lr": 1.4477432540892112e-05} +{"train_loss": 0.00046699069207534194, "global_step": 53782, "epoch": 451, "lr": 1.4475873419020725e-05} +{"train_loss": 0.0007186076254583895, "global_step": 53783, "epoch": 451, "lr": 1.4474314366897157e-05} +{"train_loss": 0.0005300758639350533, "global_step": 53784, "epoch": 451, "lr": 1.447275538452449e-05} +{"train_loss": 0.00113865255843848, "global_step": 53785, "epoch": 451, "lr": 1.4471196471905757e-05} +{"train_loss": 0.0005152171943336725, "global_step": 53786, "epoch": 451, "lr": 1.4469637629044047e-05} +{"train_loss": 0.0007913740918709419, "global_step": 53787, "epoch": 451, "lr": 1.4468078855942397e-05, "val_loss": 0.01974138244986534} +{"train_loss": 0.0005665378412231803, "global_step": 53788, "epoch": 452, "lr": 1.4466520152603891e-05} +{"train_loss": 0.0009576701559126377, "global_step": 53789, "epoch": 452, "lr": 1.4464961519031556e-05} +{"train_loss": 0.000653115741442889, "global_step": 53790, "epoch": 452, "lr": 1.4463402955228494e-05} +{"train_loss": 0.0007902031065896153, "global_step": 53791, "epoch": 452, "lr": 1.4461844461197727e-05} +{"train_loss": 0.0004972508177161217, "global_step": 53792, "epoch": 452, "lr": 1.446028603694235e-05} +{"train_loss": 0.000409342726925388, "global_step": 53793, "epoch": 452, "lr": 1.4458727682465384e-05} +{"train_loss": 0.0008876913925632834, "global_step": 53794, "epoch": 452, "lr": 1.4457169397769931e-05} +{"train_loss": 0.0005065202130936086, "global_step": 53795, "epoch": 452, "lr": 1.4455611182859009e-05} +{"train_loss": 0.0004845350922551006, "global_step": 53796, "epoch": 452, "lr": 1.445405303773571e-05} +{"train_loss": 0.0003388242912478745, "global_step": 53797, "epoch": 452, "lr": 1.4452494962403068e-05} +{"train_loss": 0.0005271524423733354, "global_step": 53798, "epoch": 452, "lr": 1.445093695686417e-05} +{"train_loss": 0.001171212992630899, "global_step": 53799, "epoch": 452, "lr": 1.4449379021122044e-05} +{"train_loss": 0.00035677902633324265, "global_step": 53800, "epoch": 452, "lr": 1.444782115517978e-05} +{"train_loss": 0.0004585333517752588, "global_step": 53801, "epoch": 452, "lr": 1.4446263359040424e-05} +{"train_loss": 0.0008287976961582899, "global_step": 53802, "epoch": 452, "lr": 1.4444705632707013e-05} +{"train_loss": 0.0006654109456576407, "global_step": 53803, "epoch": 452, "lr": 1.4443147976182637e-05} +{"train_loss": 0.0005901743425056338, "global_step": 53804, "epoch": 452, "lr": 1.4441590389470328e-05} +{"train_loss": 0.000615133554674685, "global_step": 53805, "epoch": 452, "lr": 1.4440032872573172e-05} +{"train_loss": 0.0008588638156652451, "global_step": 53806, "epoch": 452, "lr": 1.4438475425494213e-05} +{"train_loss": 0.0006972571718506515, "global_step": 53807, "epoch": 452, "lr": 1.4436918048236492e-05} +{"train_loss": 0.0007457308820448816, "global_step": 53808, "epoch": 452, "lr": 1.44353607408031e-05} +{"train_loss": 0.0005178085411898792, "global_step": 53809, "epoch": 452, "lr": 1.4433803503197063e-05} +{"train_loss": 0.0009021477308124304, "global_step": 53810, "epoch": 452, "lr": 1.4432246335421467e-05} +{"train_loss": 0.00031605176627635956, "global_step": 53811, "epoch": 452, "lr": 1.443068923747934e-05} +{"train_loss": 0.0005823969258926809, "global_step": 53812, "epoch": 452, "lr": 1.442913220937377e-05} +{"train_loss": 0.000561270397156477, "global_step": 53813, "epoch": 452, "lr": 1.44275752511078e-05} +{"train_loss": 0.0005784431705251336, "global_step": 53814, "epoch": 452, "lr": 1.4426018362684468e-05} +{"train_loss": 0.001379877096042037, "global_step": 53815, "epoch": 452, "lr": 1.4424461544106866e-05} +{"train_loss": 0.00030925063765607774, "global_step": 53816, "epoch": 452, "lr": 1.4422904795378017e-05} +{"train_loss": 0.0007094956818036735, "global_step": 53817, "epoch": 452, "lr": 1.442134811650101e-05} +{"train_loss": 0.0006232389714568853, "global_step": 53818, "epoch": 452, "lr": 1.441979150747887e-05} +{"train_loss": 0.0005583706079050899, "global_step": 53819, "epoch": 452, "lr": 1.441823496831468e-05} +{"train_loss": 0.000614009506534785, "global_step": 53820, "epoch": 452, "lr": 1.4416678499011487e-05} +{"train_loss": 0.0010914020240306854, "global_step": 53821, "epoch": 452, "lr": 1.4415122099572325e-05} +{"train_loss": 0.0007718607666902244, "global_step": 53822, "epoch": 452, "lr": 1.4413565770000276e-05} +{"train_loss": 0.0006490742671303451, "global_step": 53823, "epoch": 452, "lr": 1.4412009510298397e-05} +{"train_loss": 0.001284255413338542, "global_step": 53824, "epoch": 452, "lr": 1.4410453320469725e-05} +{"train_loss": 0.00102109310682863, "global_step": 53825, "epoch": 452, "lr": 1.4408897200517341e-05} +{"train_loss": 0.0007881947094574571, "global_step": 53826, "epoch": 452, "lr": 1.4407341150444265e-05} +{"train_loss": 0.0002207718207500875, "global_step": 53827, "epoch": 452, "lr": 1.4405785170253588e-05} +{"train_loss": 0.0006830185884609818, "global_step": 53828, "epoch": 452, "lr": 1.4404229259948338e-05} +{"train_loss": 0.0010923995869234204, "global_step": 53829, "epoch": 452, "lr": 1.4402673419531598e-05} +{"train_loss": 0.0005176328122615814, "global_step": 53830, "epoch": 452, "lr": 1.4401117649006385e-05} +{"train_loss": 0.0004942609230056405, "global_step": 53831, "epoch": 452, "lr": 1.439956194837579e-05} +{"train_loss": 0.001119733089581132, "global_step": 53832, "epoch": 452, "lr": 1.4398006317642854e-05} +{"train_loss": 0.0009988443925976753, "global_step": 53833, "epoch": 452, "lr": 1.4396450756810615e-05} +{"train_loss": 0.00033399139647372067, "global_step": 53834, "epoch": 452, "lr": 1.4394895265882153e-05} +{"train_loss": 0.0006492006359621882, "global_step": 53835, "epoch": 452, "lr": 1.4393339844860499e-05} +{"train_loss": 0.0005913096247240901, "global_step": 53836, "epoch": 452, "lr": 1.4391784493748728e-05} +{"train_loss": 0.0005989586934447289, "global_step": 53837, "epoch": 452, "lr": 1.4390229212549888e-05} +{"train_loss": 0.0003955702995881438, "global_step": 53838, "epoch": 452, "lr": 1.4388674001267011e-05} +{"train_loss": 0.0006260315421968699, "global_step": 53839, "epoch": 452, "lr": 1.4387118859903187e-05} +{"train_loss": 0.0009750360623002052, "global_step": 53840, "epoch": 452, "lr": 1.438556378846143e-05} +{"train_loss": 0.0009838698897510767, "global_step": 53841, "epoch": 452, "lr": 1.4384008786944837e-05} +{"train_loss": 0.0010066841496154666, "global_step": 53842, "epoch": 452, "lr": 1.4382453855356414e-05} +{"train_loss": 0.0011899903183802962, "global_step": 53843, "epoch": 452, "lr": 1.438089899369926e-05} +{"train_loss": 0.00046226015547290444, "global_step": 53844, "epoch": 452, "lr": 1.4379344201976402e-05} +{"train_loss": 0.000519131135661155, "global_step": 53845, "epoch": 452, "lr": 1.4377789480190879e-05} +{"train_loss": 0.0006608479307033122, "global_step": 53846, "epoch": 452, "lr": 1.437623482834578e-05} +{"train_loss": 0.0006365312729030848, "global_step": 53847, "epoch": 452, "lr": 1.4374680246444116e-05} +{"train_loss": 0.0009505907073616982, "global_step": 53848, "epoch": 452, "lr": 1.4373125734488985e-05} +{"train_loss": 0.00043850281508639455, "global_step": 53849, "epoch": 452, "lr": 1.4371571292483393e-05} +{"train_loss": 0.00029770174296572804, "global_step": 53850, "epoch": 452, "lr": 1.4370016920430434e-05} +{"train_loss": 0.0007495667668990791, "global_step": 53851, "epoch": 452, "lr": 1.436846261833314e-05} +{"train_loss": 0.0008670877432450652, "global_step": 53852, "epoch": 452, "lr": 1.436690838619455e-05} +{"train_loss": 0.0008817875641398132, "global_step": 53853, "epoch": 452, "lr": 1.436535422401774e-05} +{"train_loss": 0.0010116465855389833, "global_step": 53854, "epoch": 452, "lr": 1.4363800131805733e-05} +{"train_loss": 0.0006219224305823445, "global_step": 53855, "epoch": 452, "lr": 1.4362246109561616e-05} +{"train_loss": 0.0007620666874572635, "global_step": 53856, "epoch": 452, "lr": 1.4360692157288402e-05} +{"train_loss": 0.000575177138671279, "global_step": 53857, "epoch": 452, "lr": 1.435913827498917e-05} +{"train_loss": 0.0007173530175350606, "global_step": 53858, "epoch": 452, "lr": 1.4357584462666967e-05} +{"train_loss": 0.00046693396870978177, "global_step": 53859, "epoch": 452, "lr": 1.4356030720324831e-05} +{"train_loss": 0.0006628844421356916, "global_step": 53860, "epoch": 452, "lr": 1.4354477047965836e-05} +{"train_loss": 0.0005741671193391085, "global_step": 53861, "epoch": 452, "lr": 1.4352923445592997e-05} +{"train_loss": 0.0011319800978526473, "global_step": 53862, "epoch": 452, "lr": 1.4351369913209405e-05} +{"train_loss": 0.0004949893918819726, "global_step": 53863, "epoch": 452, "lr": 1.4349816450818087e-05} +{"train_loss": 0.0003540822071954608, "global_step": 53864, "epoch": 452, "lr": 1.4348263058422078e-05} +{"train_loss": 0.0008575695683248341, "global_step": 53865, "epoch": 452, "lr": 1.4346709736024466e-05} +{"train_loss": 0.0006208631093613803, "global_step": 53866, "epoch": 452, "lr": 1.4345156483628263e-05} +{"train_loss": 0.000637371267657727, "global_step": 53867, "epoch": 452, "lr": 1.4343603301236552e-05} +{"train_loss": 0.0006524465861730278, "global_step": 53868, "epoch": 452, "lr": 1.4342050188852351e-05} +{"train_loss": 0.0006281720707193017, "global_step": 53869, "epoch": 452, "lr": 1.4340497146478737e-05} +{"train_loss": 0.0008930080221034586, "global_step": 53870, "epoch": 452, "lr": 1.4338944174118752e-05} +{"train_loss": 0.0013029605615884066, "global_step": 53871, "epoch": 452, "lr": 1.4337391271775425e-05} +{"train_loss": 0.0005487948074005544, "global_step": 53872, "epoch": 452, "lr": 1.4335838439451831e-05} +{"train_loss": 0.000498482899274677, "global_step": 53873, "epoch": 452, "lr": 1.4334285677151e-05} +{"train_loss": 0.00046132667921483517, "global_step": 53874, "epoch": 452, "lr": 1.4332732984875996e-05} +{"train_loss": 0.0006086558569222689, "global_step": 53875, "epoch": 452, "lr": 1.4331180362629865e-05} +{"train_loss": 0.0008174472604878247, "global_step": 53876, "epoch": 452, "lr": 1.4329627810415636e-05} +{"train_loss": 0.0007850736728869379, "global_step": 53877, "epoch": 452, "lr": 1.4328075328236384e-05} +{"train_loss": 0.0006382734281942248, "global_step": 53878, "epoch": 452, "lr": 1.432652291609513e-05} +{"train_loss": 0.0003464959154371172, "global_step": 53879, "epoch": 452, "lr": 1.4324970573994955e-05} +{"train_loss": 0.001116169965825975, "global_step": 53880, "epoch": 452, "lr": 1.4323418301938868e-05} +{"train_loss": 0.0005308707477524877, "global_step": 53881, "epoch": 452, "lr": 1.432186609992996e-05} +{"train_loss": 0.0008122349390760064, "global_step": 53882, "epoch": 452, "lr": 1.4320313967971256e-05} +{"train_loss": 0.0011479289969429374, "global_step": 53883, "epoch": 452, "lr": 1.4318761906065781e-05} +{"train_loss": 0.00044825777877122164, "global_step": 53884, "epoch": 452, "lr": 1.4317209914216628e-05} +{"train_loss": 0.0009374495130032301, "global_step": 53885, "epoch": 452, "lr": 1.4315657992426801e-05} +{"train_loss": 0.0009555734577588737, "global_step": 53886, "epoch": 452, "lr": 1.4314106140699385e-05} +{"train_loss": 0.0012883751187473536, "global_step": 53887, "epoch": 452, "lr": 1.4312554359037395e-05} +{"train_loss": 0.0005885413265787065, "global_step": 53888, "epoch": 452, "lr": 1.4311002647443905e-05} +{"train_loss": 0.0008434786577709019, "global_step": 53889, "epoch": 452, "lr": 1.4309451005921936e-05} +{"train_loss": 0.0006465146434493363, "global_step": 53890, "epoch": 452, "lr": 1.4307899434474559e-05} +{"train_loss": 0.0010282628936693072, "global_step": 53891, "epoch": 452, "lr": 1.430634793310479e-05} +{"train_loss": 0.0009485679329372942, "global_step": 53892, "epoch": 452, "lr": 1.4304796501815704e-05} +{"train_loss": 0.0010489661945030093, "global_step": 53893, "epoch": 452, "lr": 1.4303245140610344e-05} +{"train_loss": 0.0007438517641276121, "global_step": 53894, "epoch": 452, "lr": 1.4301693849491748e-05} +{"train_loss": 0.0010361982276663184, "global_step": 53895, "epoch": 452, "lr": 1.4300142628462948e-05} +{"train_loss": 0.0011793447192758322, "global_step": 53896, "epoch": 452, "lr": 1.4298591477527024e-05} +{"train_loss": 0.0007578382501378655, "global_step": 53897, "epoch": 452, "lr": 1.4297040396686984e-05} +{"train_loss": 0.0009588172542862594, "global_step": 53898, "epoch": 452, "lr": 1.4295489385945904e-05} +{"train_loss": 0.0008648085640743375, "global_step": 53899, "epoch": 452, "lr": 1.4293938445306799e-05} +{"train_loss": 0.0011805910617113113, "global_step": 53900, "epoch": 452, "lr": 1.4292387574772748e-05} +{"train_loss": 0.0006406756001524627, "global_step": 53901, "epoch": 452, "lr": 1.4290836774346782e-05} +{"train_loss": 0.00047812898992560804, "global_step": 53902, "epoch": 452, "lr": 1.4289286044031924e-05} +{"train_loss": 0.0004944900865666568, "global_step": 53903, "epoch": 452, "lr": 1.4287735383831258e-05} +{"train_loss": 0.000643216073513031, "global_step": 53904, "epoch": 452, "lr": 1.4286184793747792e-05} +{"train_loss": 0.0017431547166779637, "global_step": 53905, "epoch": 452, "lr": 1.4284634273784598e-05} +{"train_loss": 0.0007324534350470052, "global_step": 53906, "epoch": 452, "lr": 1.428308382394471e-05, "val_loss": 0.029059261083602905} +{"train_loss": 0.0006215713801793754, "global_step": 53907, "epoch": 453, "lr": 1.428153344423116e-05} +{"train_loss": 0.0006708736182190478, "global_step": 53908, "epoch": 453, "lr": 1.4279983134647013e-05} +{"train_loss": 0.0009041543235071003, "global_step": 53909, "epoch": 453, "lr": 1.4278432895195288e-05} +{"train_loss": 0.0006952327094040811, "global_step": 53910, "epoch": 453, "lr": 1.4276882725879065e-05} +{"train_loss": 0.0013493142323568463, "global_step": 53911, "epoch": 453, "lr": 1.4275332626701344e-05} +{"train_loss": 0.0015666655963286757, "global_step": 53912, "epoch": 453, "lr": 1.4273782597665209e-05} +{"train_loss": 0.000601967447437346, "global_step": 53913, "epoch": 453, "lr": 1.4272232638773686e-05} +{"train_loss": 0.0008673535194247961, "global_step": 53914, "epoch": 453, "lr": 1.4270682750029802e-05} +{"train_loss": 0.0008376300102099776, "global_step": 53915, "epoch": 453, "lr": 1.4269132931436629e-05} +{"train_loss": 0.0004461012140382081, "global_step": 53916, "epoch": 453, "lr": 1.426758318299718e-05} +{"train_loss": 0.0007659115944989026, "global_step": 53917, "epoch": 453, "lr": 1.4266033504714531e-05} +{"train_loss": 0.0008655411074869335, "global_step": 53918, "epoch": 453, "lr": 1.4264483896591695e-05} +{"train_loss": 0.0004275900428183377, "global_step": 53919, "epoch": 453, "lr": 1.426293435863174e-05} +{"train_loss": 0.0011651916429400444, "global_step": 53920, "epoch": 453, "lr": 1.4261384890837681e-05} +{"train_loss": 0.0004416482988744974, "global_step": 53921, "epoch": 453, "lr": 1.4259835493212587e-05} +{"train_loss": 0.0004969205474480987, "global_step": 53922, "epoch": 453, "lr": 1.4258286165759471e-05} +{"train_loss": 0.00034907477675005794, "global_step": 53923, "epoch": 453, "lr": 1.425673690848141e-05} +{"train_loss": 0.0005069156177341938, "global_step": 53924, "epoch": 453, "lr": 1.4255187721381413e-05} +{"train_loss": 0.0005727765965275466, "global_step": 53925, "epoch": 453, "lr": 1.4253638604462555e-05} +{"train_loss": 0.0004699229612015188, "global_step": 53926, "epoch": 453, "lr": 1.4252089557727838e-05} +{"train_loss": 0.0004003598296549171, "global_step": 53927, "epoch": 453, "lr": 1.4250540581180338e-05} +{"train_loss": 0.0004532875900622457, "global_step": 53928, "epoch": 453, "lr": 1.424899167482307e-05} +{"train_loss": 0.0007368689985014498, "global_step": 53929, "epoch": 453, "lr": 1.4247442838659103e-05} +{"train_loss": 0.0007265629828907549, "global_step": 53930, "epoch": 453, "lr": 1.4245894072691446e-05} +{"train_loss": 0.0005398054490797222, "global_step": 53931, "epoch": 453, "lr": 1.4244345376923173e-05} +{"train_loss": 0.0006244826363399625, "global_step": 53932, "epoch": 453, "lr": 1.4242796751357307e-05} +{"train_loss": 0.000782054616138339, "global_step": 53933, "epoch": 453, "lr": 1.4241248195996876e-05} +{"train_loss": 0.0004583208938129246, "global_step": 53934, "epoch": 453, "lr": 1.4239699710844944e-05} +{"train_loss": 0.0016251259949058294, "global_step": 53935, "epoch": 453, "lr": 1.4238151295904529e-05} +{"train_loss": 0.00042689815745688975, "global_step": 53936, "epoch": 453, "lr": 1.4236602951178702e-05} +{"train_loss": 0.0008506702724844217, "global_step": 53937, "epoch": 453, "lr": 1.4235054676670462e-05} +{"train_loss": 0.001120297471061349, "global_step": 53938, "epoch": 453, "lr": 1.423350647238289e-05} +{"train_loss": 0.0008276774315163493, "global_step": 53939, "epoch": 453, "lr": 1.4231958338319007e-05} +{"train_loss": 0.0009812824428081512, "global_step": 53940, "epoch": 453, "lr": 1.4230410274481837e-05} +{"train_loss": 0.000816136656794697, "global_step": 53941, "epoch": 453, "lr": 1.422886228087445e-05} +{"train_loss": 0.00043217831989750266, "global_step": 53942, "epoch": 453, "lr": 1.422731435749986e-05} +{"train_loss": 0.0007181629189290106, "global_step": 53943, "epoch": 453, "lr": 1.4225766504361127e-05} +{"train_loss": 0.0008709166431799531, "global_step": 53944, "epoch": 453, "lr": 1.422421872146128e-05} +{"train_loss": 0.0006588847027160227, "global_step": 53945, "epoch": 453, "lr": 1.422267100880334e-05} +{"train_loss": 0.0006184233352541924, "global_step": 53946, "epoch": 453, "lr": 1.4221123366390383e-05} +{"train_loss": 0.0006314092315733433, "global_step": 53947, "epoch": 453, "lr": 1.421957579422541e-05} +{"train_loss": 0.000681210367474705, "global_step": 53948, "epoch": 453, "lr": 1.4218028292311492e-05} +{"train_loss": 0.00042967480840161443, "global_step": 53949, "epoch": 453, "lr": 1.4216480860651638e-05} +{"train_loss": 0.0008262852788902819, "global_step": 53950, "epoch": 453, "lr": 1.4214933499248917e-05} +{"train_loss": 0.0004492161388043314, "global_step": 53951, "epoch": 453, "lr": 1.421338620810635e-05} +{"train_loss": 0.000552049488760531, "global_step": 53952, "epoch": 453, "lr": 1.421183898722696e-05} +{"train_loss": 0.0004969676374457777, "global_step": 53953, "epoch": 453, "lr": 1.4210291836613804e-05} +{"train_loss": 0.0006674451287835836, "global_step": 53954, "epoch": 453, "lr": 1.4208744756269932e-05} +{"train_loss": 0.0007088443962857127, "global_step": 53955, "epoch": 453, "lr": 1.4207197746198347e-05} +{"train_loss": 0.0005345390527509153, "global_step": 53956, "epoch": 453, "lr": 1.420565080640212e-05} +{"train_loss": 0.0005907173617742956, "global_step": 53957, "epoch": 453, "lr": 1.4204103936884261e-05} +{"train_loss": 0.0005127770709805191, "global_step": 53958, "epoch": 453, "lr": 1.4202557137647837e-05} +{"train_loss": 0.0008082503918558359, "global_step": 53959, "epoch": 453, "lr": 1.4201010408695847e-05} +{"train_loss": 0.00047002354403957725, "global_step": 53960, "epoch": 453, "lr": 1.4199463750031367e-05} +{"train_loss": 0.0009917542338371277, "global_step": 53961, "epoch": 453, "lr": 1.4197917161657398e-05} +{"train_loss": 0.0003982059715781361, "global_step": 53962, "epoch": 453, "lr": 1.4196370643577012e-05} +{"train_loss": 0.0007293234812095761, "global_step": 53963, "epoch": 453, "lr": 1.4194824195793227e-05} +{"train_loss": 0.0016149795847013593, "global_step": 53964, "epoch": 453, "lr": 1.4193277818309064e-05} +{"train_loss": 0.000519180262926966, "global_step": 53965, "epoch": 453, "lr": 1.4191731511127587e-05} +{"train_loss": 0.0006341629778034985, "global_step": 53966, "epoch": 453, "lr": 1.4190185274251805e-05} +{"train_loss": 0.0005941552808508277, "global_step": 53967, "epoch": 453, "lr": 1.4188639107684788e-05} +{"train_loss": 0.00047214291407726705, "global_step": 53968, "epoch": 453, "lr": 1.4187093011429532e-05} +{"train_loss": 0.0005652370164170861, "global_step": 53969, "epoch": 453, "lr": 1.4185546985489113e-05} +{"train_loss": 0.0004497867194004357, "global_step": 53970, "epoch": 453, "lr": 1.4184001029866539e-05} +{"train_loss": 0.0007610396714881063, "global_step": 53971, "epoch": 453, "lr": 1.4182455144564843e-05} +{"train_loss": 0.000816437357570976, "global_step": 53972, "epoch": 453, "lr": 1.4180909329587084e-05} +{"train_loss": 0.0006066404166631401, "global_step": 53973, "epoch": 453, "lr": 1.4179363584936266e-05} +{"train_loss": 0.0009664690005593002, "global_step": 53974, "epoch": 453, "lr": 1.417781791061546e-05} +{"train_loss": 0.0006249487632885575, "global_step": 53975, "epoch": 453, "lr": 1.4176272306627675e-05} +{"train_loss": 0.0005009061424061656, "global_step": 53976, "epoch": 453, "lr": 1.4174726772975943e-05} +{"train_loss": 0.0011990442872047424, "global_step": 53977, "epoch": 453, "lr": 1.4173181309663319e-05} +{"train_loss": 0.000896202283911407, "global_step": 53978, "epoch": 453, "lr": 1.417163591669281e-05} +{"train_loss": 0.0004542046517599374, "global_step": 53979, "epoch": 453, "lr": 1.4170090594067487e-05} +{"train_loss": 0.0006480051088146865, "global_step": 53980, "epoch": 453, "lr": 1.4168545341790345e-05} +{"train_loss": 0.0012750630266964436, "global_step": 53981, "epoch": 453, "lr": 1.4167000159864452e-05} +{"train_loss": 0.0005767152761109173, "global_step": 53982, "epoch": 453, "lr": 1.4165455048292825e-05} +{"train_loss": 0.0013457414461299777, "global_step": 53983, "epoch": 453, "lr": 1.4163910007078479e-05} +{"train_loss": 0.0007532131276093423, "global_step": 53984, "epoch": 453, "lr": 1.416236503622449e-05} +{"train_loss": 0.0010985026601701975, "global_step": 53985, "epoch": 453, "lr": 1.4160820135733848e-05} +{"train_loss": 0.0006063728360459208, "global_step": 53986, "epoch": 453, "lr": 1.4159275305609626e-05} +{"train_loss": 0.0010818823939189315, "global_step": 53987, "epoch": 453, "lr": 1.415773054585482e-05} +{"train_loss": 0.0009514619596302509, "global_step": 53988, "epoch": 453, "lr": 1.4156185856472481e-05} +{"train_loss": 0.0005358312046155334, "global_step": 53989, "epoch": 453, "lr": 1.415464123746566e-05} +{"train_loss": 0.0004506102704908699, "global_step": 53990, "epoch": 453, "lr": 1.4153096688837353e-05} +{"train_loss": 0.000812467304058373, "global_step": 53991, "epoch": 453, "lr": 1.4151552210590624e-05} +{"train_loss": 0.0007055344758555293, "global_step": 53992, "epoch": 453, "lr": 1.4150007802728482e-05} +{"train_loss": 0.0007124149706214666, "global_step": 53993, "epoch": 453, "lr": 1.4148463465253985e-05} +{"train_loss": 0.0006933559780009091, "global_step": 53994, "epoch": 453, "lr": 1.4146919198170145e-05} +{"train_loss": 0.0011504758149385452, "global_step": 53995, "epoch": 453, "lr": 1.4145375001479989e-05} +{"train_loss": 0.0003086129727307707, "global_step": 53996, "epoch": 453, "lr": 1.414383087518657e-05} +{"train_loss": 0.000903970212675631, "global_step": 53997, "epoch": 453, "lr": 1.4142286819292895e-05} +{"train_loss": 0.0007737796404398978, "global_step": 53998, "epoch": 453, "lr": 1.4140742833802023e-05} +{"train_loss": 0.0004786121426150203, "global_step": 53999, "epoch": 453, "lr": 1.4139198918716956e-05} +{"train_loss": 0.000754311855416745, "global_step": 54000, "epoch": 453, "lr": 1.4137655074040756e-05} +{"train_loss": 0.0007822116604074836, "global_step": 54001, "epoch": 453, "lr": 1.4136111299776444e-05} +{"train_loss": 0.000677425239700824, "global_step": 54002, "epoch": 453, "lr": 1.4134567595927028e-05} +{"train_loss": 0.000771653198171407, "global_step": 54003, "epoch": 453, "lr": 1.4133023962495567e-05} +{"train_loss": 0.0002692092675715685, "global_step": 54004, "epoch": 453, "lr": 1.413148039948507e-05} +{"train_loss": 0.0008606709307059646, "global_step": 54005, "epoch": 453, "lr": 1.4129936906898595e-05} +{"train_loss": 0.000559780397452414, "global_step": 54006, "epoch": 453, "lr": 1.4128393484739144e-05} +{"train_loss": 0.000918770267162472, "global_step": 54007, "epoch": 453, "lr": 1.4126850133009772e-05} +{"train_loss": 0.0008596476400271058, "global_step": 54008, "epoch": 453, "lr": 1.4125306851713499e-05} +{"train_loss": 0.0004083366075064987, "global_step": 54009, "epoch": 453, "lr": 1.4123763640853333e-05} +{"train_loss": 0.0006874130922369659, "global_step": 54010, "epoch": 453, "lr": 1.4122220500432349e-05} +{"train_loss": 0.0007023841026239097, "global_step": 54011, "epoch": 453, "lr": 1.4120677430453527e-05} +{"train_loss": 0.00045279698679223657, "global_step": 54012, "epoch": 453, "lr": 1.4119134430919944e-05} +{"train_loss": 0.0008465886348858476, "global_step": 54013, "epoch": 453, "lr": 1.4117591501834604e-05} +{"train_loss": 0.000471874896902591, "global_step": 54014, "epoch": 453, "lr": 1.4116048643200524e-05} +{"train_loss": 0.0014542663702741265, "global_step": 54015, "epoch": 453, "lr": 1.4114505855020765e-05} +{"train_loss": 0.0008296745363622904, "global_step": 54016, "epoch": 453, "lr": 1.4112963137298324e-05} +{"train_loss": 0.0007139419321902096, "global_step": 54017, "epoch": 453, "lr": 1.4111420490036265e-05} +{"train_loss": 0.0007199302199296653, "global_step": 54018, "epoch": 453, "lr": 1.4109877913237578e-05} +{"train_loss": 0.0006246902048587799, "global_step": 54019, "epoch": 453, "lr": 1.4108335406905327e-05} +{"train_loss": 0.0005241609760560095, "global_step": 54020, "epoch": 453, "lr": 1.410679297104251e-05} +{"train_loss": 0.0006617239560000598, "global_step": 54021, "epoch": 453, "lr": 1.4105250605652186e-05} +{"train_loss": 0.001011520391330123, "global_step": 54022, "epoch": 453, "lr": 1.410370831073735e-05} +{"train_loss": 0.0017942480044439435, "global_step": 54023, "epoch": 453, "lr": 1.4102166086301072e-05} +{"train_loss": 0.0003547371888998896, "global_step": 54024, "epoch": 453, "lr": 1.4100623932346329e-05} +{"train_loss": 0.0007281375827831255, "global_step": 54025, "epoch": 453, "lr": 1.40990818488762e-05, "val_loss": 0.015916218981146812} +{"train_loss": 0.001463365158997476, "global_step": 54026, "epoch": 454, "lr": 1.409753983589367e-05} +{"train_loss": 0.0004274901293683797, "global_step": 54027, "epoch": 454, "lr": 1.4095997893401796e-05} +{"train_loss": 0.0009746291325427592, "global_step": 54028, "epoch": 454, "lr": 1.4094456021403584e-05} +{"train_loss": 0.0010341847082599998, "global_step": 54029, "epoch": 454, "lr": 1.4092914219902088e-05} +{"train_loss": 0.0011067435843870044, "global_step": 54030, "epoch": 454, "lr": 1.40913724889003e-05} +{"train_loss": 0.0006349216564558446, "global_step": 54031, "epoch": 454, "lr": 1.4089830828401279e-05} +{"train_loss": 0.000556476297788322, "global_step": 54032, "epoch": 454, "lr": 1.4088289238408042e-05} +{"train_loss": 0.0005604766192846, "global_step": 54033, "epoch": 454, "lr": 1.4086747718923599e-05} +{"train_loss": 0.00037124607479199767, "global_step": 54034, "epoch": 454, "lr": 1.4085206269951001e-05} +{"train_loss": 0.0013304221211001277, "global_step": 54035, "epoch": 454, "lr": 1.4083664891493253e-05} +{"train_loss": 0.0007749164942651987, "global_step": 54036, "epoch": 454, "lr": 1.4082123583553403e-05} +{"train_loss": 0.0003554545110091567, "global_step": 54037, "epoch": 454, "lr": 1.4080582346134452e-05} +{"train_loss": 0.0004874177393503487, "global_step": 54038, "epoch": 454, "lr": 1.407904117923946e-05} +{"train_loss": 0.0008192432578653097, "global_step": 54039, "epoch": 454, "lr": 1.4077500082871425e-05} +{"train_loss": 0.0004871478595305234, "global_step": 54040, "epoch": 454, "lr": 1.4075959057033373e-05} +{"train_loss": 0.0010393905686214566, "global_step": 54041, "epoch": 454, "lr": 1.4074418101728348e-05} +{"train_loss": 0.0006094392156228423, "global_step": 54042, "epoch": 454, "lr": 1.4072877216959352e-05} +{"train_loss": 0.0004972367314621806, "global_step": 54043, "epoch": 454, "lr": 1.4071336402729435e-05} +{"train_loss": 0.0009143829811364412, "global_step": 54044, "epoch": 454, "lr": 1.4069795659041618e-05} +{"train_loss": 0.00048371858429163694, "global_step": 54045, "epoch": 454, "lr": 1.40682549858989e-05} +{"train_loss": 0.0008176766568794847, "global_step": 54046, "epoch": 454, "lr": 1.4066714383304335e-05} +{"train_loss": 0.000617635203525424, "global_step": 54047, "epoch": 454, "lr": 1.4065173851260927e-05} +{"train_loss": 0.0014166528126224875, "global_step": 54048, "epoch": 454, "lr": 1.4063633389771723e-05} +{"train_loss": 0.0007029747939668596, "global_step": 54049, "epoch": 454, "lr": 1.406209299883972e-05} +{"train_loss": 0.00043252873001620173, "global_step": 54050, "epoch": 454, "lr": 1.406055267846798e-05} +{"train_loss": 0.0009162530186586082, "global_step": 54051, "epoch": 454, "lr": 1.4059012428659485e-05} +{"train_loss": 0.001002746052108705, "global_step": 54052, "epoch": 454, "lr": 1.4057472249417297e-05} +{"train_loss": 0.00053345353808254, "global_step": 54053, "epoch": 454, "lr": 1.4055932140744405e-05} +{"train_loss": 0.000624793057795614, "global_step": 54054, "epoch": 454, "lr": 1.4054392102643864e-05} +{"train_loss": 0.0008694386342540383, "global_step": 54055, "epoch": 454, "lr": 1.4052852135118671e-05} +{"train_loss": 0.0006466165068559349, "global_step": 54056, "epoch": 454, "lr": 1.4051312238171877e-05} +{"train_loss": 0.000466352968942374, "global_step": 54057, "epoch": 454, "lr": 1.4049772411806472e-05} +{"train_loss": 0.0006888920324854553, "global_step": 54058, "epoch": 454, "lr": 1.4048232656025523e-05} +{"train_loss": 0.00030280451755970716, "global_step": 54059, "epoch": 454, "lr": 1.4046692970832003e-05} +{"train_loss": 0.0011676964350044727, "global_step": 54060, "epoch": 454, "lr": 1.404515335622898e-05} +{"train_loss": 0.00047894706949591637, "global_step": 54061, "epoch": 454, "lr": 1.4043613812219442e-05} +{"train_loss": 0.0007487248512916267, "global_step": 54062, "epoch": 454, "lr": 1.4042074338806443e-05} +{"train_loss": 0.0005893956986255944, "global_step": 54063, "epoch": 454, "lr": 1.4040534935992988e-05} +{"train_loss": 0.0008484955760650337, "global_step": 54064, "epoch": 454, "lr": 1.4038995603782085e-05} +{"train_loss": 0.0006755890790373087, "global_step": 54065, "epoch": 454, "lr": 1.4037456342176791e-05} +{"train_loss": 0.001296213478781283, "global_step": 54066, "epoch": 454, "lr": 1.403591715118009e-05} +{"train_loss": 0.0010012160055339336, "global_step": 54067, "epoch": 454, "lr": 1.4034378030795042e-05} +{"train_loss": 0.0007346671191044152, "global_step": 54068, "epoch": 454, "lr": 1.4032838981024631e-05} +{"train_loss": 0.0006039844010956585, "global_step": 54069, "epoch": 454, "lr": 1.4031300001871916e-05} +{"train_loss": 0.0007296128896996379, "global_step": 54070, "epoch": 454, "lr": 1.40297610933399e-05} +{"train_loss": 0.0010292490478605032, "global_step": 54071, "epoch": 454, "lr": 1.4028222255431595e-05} +{"train_loss": 0.0005041942349635065, "global_step": 54072, "epoch": 454, "lr": 1.4026683488150038e-05} +{"train_loss": 0.0011198536958545446, "global_step": 54073, "epoch": 454, "lr": 1.4025144791498241e-05} +{"train_loss": 0.0006279979133978486, "global_step": 54074, "epoch": 454, "lr": 1.4023606165479237e-05} +{"train_loss": 0.0006018232088536024, "global_step": 54075, "epoch": 454, "lr": 1.402206761009604e-05} +{"train_loss": 0.0009772985940799117, "global_step": 54076, "epoch": 454, "lr": 1.402052912535165e-05} +{"train_loss": 0.001355704735033214, "global_step": 54077, "epoch": 454, "lr": 1.401899071124913e-05} +{"train_loss": 0.00047822025953792036, "global_step": 54078, "epoch": 454, "lr": 1.4017452367791461e-05} +{"train_loss": 0.0013739070855081081, "global_step": 54079, "epoch": 454, "lr": 1.4015914094981691e-05} +{"train_loss": 0.0004572265315800905, "global_step": 54080, "epoch": 454, "lr": 1.4014375892822817e-05} +{"train_loss": 0.0007060409989207983, "global_step": 54081, "epoch": 454, "lr": 1.4012837761317887e-05} +{"train_loss": 0.0009488825453445315, "global_step": 54082, "epoch": 454, "lr": 1.4011299700469904e-05} +{"train_loss": 0.0006326966104097664, "global_step": 54083, "epoch": 454, "lr": 1.4009761710281876e-05} +{"train_loss": 0.0006441822624765337, "global_step": 54084, "epoch": 454, "lr": 1.4008223790756848e-05} +{"train_loss": 0.00031471758848056197, "global_step": 54085, "epoch": 454, "lr": 1.4006685941897813e-05} +{"train_loss": 0.0009064581827260554, "global_step": 54086, "epoch": 454, "lr": 1.400514816370781e-05} +{"train_loss": 0.0009940857999026775, "global_step": 54087, "epoch": 454, "lr": 1.4003610456189865e-05} +{"train_loss": 0.0006499385344795883, "global_step": 54088, "epoch": 454, "lr": 1.4002072819346967e-05} +{"train_loss": 0.0008413844043388963, "global_step": 54089, "epoch": 454, "lr": 1.4000535253182168e-05} +{"train_loss": 0.00045674986904487014, "global_step": 54090, "epoch": 454, "lr": 1.3998997757698462e-05} +{"train_loss": 0.0010320879518985748, "global_step": 54091, "epoch": 454, "lr": 1.3997460332898887e-05} +{"train_loss": 0.0003947509976569563, "global_step": 54092, "epoch": 454, "lr": 1.3995922978786442e-05} +{"train_loss": 0.0006510738166980445, "global_step": 54093, "epoch": 454, "lr": 1.3994385695364171e-05} +{"train_loss": 0.0006000309367664158, "global_step": 54094, "epoch": 454, "lr": 1.3992848482635074e-05} +{"train_loss": 0.0007021165220066905, "global_step": 54095, "epoch": 454, "lr": 1.399131134060216e-05} +{"train_loss": 0.00048586755292490125, "global_step": 54096, "epoch": 454, "lr": 1.3989774269268474e-05} +{"train_loss": 0.0009005173342302442, "global_step": 54097, "epoch": 454, "lr": 1.3988237268637e-05} +{"train_loss": 0.0013940335484221578, "global_step": 54098, "epoch": 454, "lr": 1.3986700338710796e-05} +{"train_loss": 0.0004942045779898763, "global_step": 54099, "epoch": 454, "lr": 1.398516347949284e-05} +{"train_loss": 0.0004929651040583849, "global_step": 54100, "epoch": 454, "lr": 1.3983626690986184e-05} +{"train_loss": 0.00048582421732135117, "global_step": 54101, "epoch": 454, "lr": 1.3982089973193829e-05} +{"train_loss": 0.0006648203125223517, "global_step": 54102, "epoch": 454, "lr": 1.3980553326118773e-05} +{"train_loss": 0.0007402045885100961, "global_step": 54103, "epoch": 454, "lr": 1.3979016749764073e-05} +{"train_loss": 0.00145234155934304, "global_step": 54104, "epoch": 454, "lr": 1.3977480244132707e-05} +{"train_loss": 0.0009339642710983753, "global_step": 54105, "epoch": 454, "lr": 1.3975943809227726e-05} +{"train_loss": 0.00047439616173505783, "global_step": 54106, "epoch": 454, "lr": 1.3974407445052117e-05} +{"train_loss": 0.0008200497832149267, "global_step": 54107, "epoch": 454, "lr": 1.3972871151608923e-05} +{"train_loss": 0.0005309752887114882, "global_step": 54108, "epoch": 454, "lr": 1.3971334928901152e-05} +{"train_loss": 0.0007468634867109358, "global_step": 54109, "epoch": 454, "lr": 1.3969798776931797e-05} +{"train_loss": 0.0012459778226912022, "global_step": 54110, "epoch": 454, "lr": 1.396826269570391e-05} +{"train_loss": 0.0006639197235926986, "global_step": 54111, "epoch": 454, "lr": 1.3966726685220471e-05} +{"train_loss": 0.0006878779386170208, "global_step": 54112, "epoch": 454, "lr": 1.3965190745484536e-05} +{"train_loss": 0.0003666038392111659, "global_step": 54113, "epoch": 454, "lr": 1.3963654876499093e-05} +{"train_loss": 0.000463915872387588, "global_step": 54114, "epoch": 454, "lr": 1.3962119078267156e-05} +{"train_loss": 0.0005315395537763834, "global_step": 54115, "epoch": 454, "lr": 1.3960583350791756e-05} +{"train_loss": 0.0005511023919098079, "global_step": 54116, "epoch": 454, "lr": 1.3959047694075888e-05} +{"train_loss": 0.0010774469701573253, "global_step": 54117, "epoch": 454, "lr": 1.3957512108122595e-05} +{"train_loss": 0.00034226581919938326, "global_step": 54118, "epoch": 454, "lr": 1.3955976592934855e-05} +{"train_loss": 0.0008759216871112585, "global_step": 54119, "epoch": 454, "lr": 1.3954441148515728e-05} +{"train_loss": 0.0006639138446189463, "global_step": 54120, "epoch": 454, "lr": 1.3952905774868185e-05} +{"train_loss": 0.000913610216230154, "global_step": 54121, "epoch": 454, "lr": 1.3951370471995262e-05} +{"train_loss": 0.0007041041390039027, "global_step": 54122, "epoch": 454, "lr": 1.3949835239899989e-05} +{"train_loss": 0.0006030413787811995, "global_step": 54123, "epoch": 454, "lr": 1.3948300078585347e-05} +{"train_loss": 0.0007547007990069687, "global_step": 54124, "epoch": 454, "lr": 1.3946764988054378e-05} +{"train_loss": 0.0007011554553173482, "global_step": 54125, "epoch": 454, "lr": 1.394522996831007e-05} +{"train_loss": 0.0007386354263871908, "global_step": 54126, "epoch": 454, "lr": 1.3943695019355468e-05} +{"train_loss": 0.0009793591452762485, "global_step": 54127, "epoch": 454, "lr": 1.3942160141193566e-05} +{"train_loss": 0.0010530551662668586, "global_step": 54128, "epoch": 454, "lr": 1.3940625333827374e-05} +{"train_loss": 0.0004431555571500212, "global_step": 54129, "epoch": 454, "lr": 1.3939090597259919e-05} +{"train_loss": 0.0006645818357355893, "global_step": 54130, "epoch": 454, "lr": 1.393755593149419e-05} +{"train_loss": 0.0007288525230251253, "global_step": 54131, "epoch": 454, "lr": 1.393602133653324e-05} +{"train_loss": 0.0006427133339457214, "global_step": 54132, "epoch": 454, "lr": 1.3934486812380054e-05} +{"train_loss": 0.0008873705519363284, "global_step": 54133, "epoch": 454, "lr": 1.3932952359037633e-05} +{"train_loss": 0.0005078040412627161, "global_step": 54134, "epoch": 454, "lr": 1.3931417976509026e-05} +{"train_loss": 0.0005169252981431782, "global_step": 54135, "epoch": 454, "lr": 1.392988366479721e-05} +{"train_loss": 0.0015089948428794742, "global_step": 54136, "epoch": 454, "lr": 1.3928349423905229e-05} +{"train_loss": 0.0009703434188850224, "global_step": 54137, "epoch": 454, "lr": 1.3926815253836067e-05} +{"train_loss": 0.0003603029763326049, "global_step": 54138, "epoch": 454, "lr": 1.3925281154592762e-05} +{"train_loss": 0.0004931291914545, "global_step": 54139, "epoch": 454, "lr": 1.3923747126178316e-05} +{"train_loss": 0.0004339225706644356, "global_step": 54140, "epoch": 454, "lr": 1.392221316859572e-05} +{"train_loss": 0.0008267281809821725, "global_step": 54141, "epoch": 454, "lr": 1.392067928184802e-05} +{"train_loss": 0.000505726202391088, "global_step": 54142, "epoch": 454, "lr": 1.39191454659382e-05} +{"train_loss": 0.0008968388428911567, "global_step": 54143, "epoch": 454, "lr": 1.3917611720869294e-05} +{"train_loss": 0.0007431613121909567, "global_step": 54144, "epoch": 454, "lr": 1.3916078046644304e-05, "val_loss": 0.007715191226452589} +{"train_loss": 0.00028249132446944714, "global_step": 54145, "epoch": 455, "lr": 1.3914544443266225e-05} +{"train_loss": 0.0016195940552279353, "global_step": 54146, "epoch": 455, "lr": 1.3913010910738095e-05} +{"train_loss": 0.0006357773672789335, "global_step": 54147, "epoch": 455, "lr": 1.3911477449062904e-05} +{"train_loss": 0.0006166626117192209, "global_step": 54148, "epoch": 455, "lr": 1.3909944058243679e-05} +{"train_loss": 0.0006756361108273268, "global_step": 54149, "epoch": 455, "lr": 1.3908410738283417e-05} +{"train_loss": 0.0006813128129579127, "global_step": 54150, "epoch": 455, "lr": 1.3906877489185143e-05} +{"train_loss": 0.00041561960824765265, "global_step": 54151, "epoch": 455, "lr": 1.3905344310951845e-05} +{"train_loss": 0.000389505730709061, "global_step": 54152, "epoch": 455, "lr": 1.3903811203586563e-05} +{"train_loss": 0.001043691299855709, "global_step": 54153, "epoch": 455, "lr": 1.3902278167092276e-05} +{"train_loss": 0.0005347445257939398, "global_step": 54154, "epoch": 455, "lr": 1.3900745201472027e-05} +{"train_loss": 0.0005295425071381032, "global_step": 54155, "epoch": 455, "lr": 1.3899212306728792e-05} +{"train_loss": 0.0007541437516920269, "global_step": 54156, "epoch": 455, "lr": 1.3897679482865594e-05} +{"train_loss": 0.0005421110545285046, "global_step": 54157, "epoch": 455, "lr": 1.3896146729885461e-05} +{"train_loss": 0.0010177443036809564, "global_step": 54158, "epoch": 455, "lr": 1.3894614047791394e-05} +{"train_loss": 0.00157906801905483, "global_step": 54159, "epoch": 455, "lr": 1.3893081436586369e-05} +{"train_loss": 0.0005504043656401336, "global_step": 54160, "epoch": 455, "lr": 1.3891548896273443e-05} +{"train_loss": 0.0006778900278732181, "global_step": 54161, "epoch": 455, "lr": 1.3890016426855584e-05} +{"train_loss": 0.0004924151580780745, "global_step": 54162, "epoch": 455, "lr": 1.3888484028335841e-05} +{"train_loss": 0.0007591057801619172, "global_step": 54163, "epoch": 455, "lr": 1.38869517007172e-05} +{"train_loss": 0.0013717132387682796, "global_step": 54164, "epoch": 455, "lr": 1.3885419444002651e-05} +{"train_loss": 0.00048407548456452787, "global_step": 54165, "epoch": 455, "lr": 1.3883887258195243e-05} +{"train_loss": 0.0009698792127892375, "global_step": 54166, "epoch": 455, "lr": 1.3882355143297942e-05} +{"train_loss": 0.0004787874349858612, "global_step": 54167, "epoch": 455, "lr": 1.38808230993138e-05} +{"train_loss": 0.0006272608297877014, "global_step": 54168, "epoch": 455, "lr": 1.3879291126245787e-05} +{"train_loss": 0.0009326295694336295, "global_step": 54169, "epoch": 455, "lr": 1.3877759224096943e-05} +{"train_loss": 0.0004926006076857448, "global_step": 54170, "epoch": 455, "lr": 1.3876227392870256e-05} +{"train_loss": 0.0006477273418568075, "global_step": 54171, "epoch": 455, "lr": 1.3874695632568724e-05} +{"train_loss": 0.0006451013032346964, "global_step": 54172, "epoch": 455, "lr": 1.3873163943195383e-05} +{"train_loss": 0.0011448418954387307, "global_step": 54173, "epoch": 455, "lr": 1.3871632324753208e-05} +{"train_loss": 0.0007348659564740956, "global_step": 54174, "epoch": 455, "lr": 1.3870100777245243e-05} +{"train_loss": 0.0007730727666057646, "global_step": 54175, "epoch": 455, "lr": 1.3868569300674455e-05} +{"train_loss": 0.0007471187855117023, "global_step": 54176, "epoch": 455, "lr": 1.3867037895043888e-05} +{"train_loss": 0.0008916734368540347, "global_step": 54177, "epoch": 455, "lr": 1.3865506560356535e-05} +{"train_loss": 0.0005175386322662234, "global_step": 54178, "epoch": 455, "lr": 1.3863975296615378e-05} +{"train_loss": 0.0005457550287246704, "global_step": 54179, "epoch": 455, "lr": 1.3862444103823463e-05} +{"train_loss": 0.0004499554925132543, "global_step": 54180, "epoch": 455, "lr": 1.3860912981983765e-05} +{"train_loss": 0.00040429786895401776, "global_step": 54181, "epoch": 455, "lr": 1.3859381931099318e-05} +{"train_loss": 0.001151909469626844, "global_step": 54182, "epoch": 455, "lr": 1.3857850951173112e-05} +{"train_loss": 0.0010993247851729393, "global_step": 54183, "epoch": 455, "lr": 1.3856320042208137e-05} +{"train_loss": 0.0005432231700979173, "global_step": 54184, "epoch": 455, "lr": 1.3854789204207419e-05} +{"train_loss": 0.0007250083144754171, "global_step": 54185, "epoch": 455, "lr": 1.3853258437173977e-05} +{"train_loss": 0.0008350912830792367, "global_step": 54186, "epoch": 455, "lr": 1.3851727741110786e-05} +{"train_loss": 0.0007512380834668875, "global_step": 54187, "epoch": 455, "lr": 1.385019711602088e-05} +{"train_loss": 0.0006744791171513498, "global_step": 54188, "epoch": 455, "lr": 1.3848666561907231e-05} +{"train_loss": 0.0009537390433251858, "global_step": 54189, "epoch": 455, "lr": 1.3847136078772882e-05} +{"train_loss": 0.0014511424815282226, "global_step": 54190, "epoch": 455, "lr": 1.3845605666620803e-05} +{"train_loss": 0.0007152956677600741, "global_step": 54191, "epoch": 455, "lr": 1.3844075325454031e-05} +{"train_loss": 0.0004718347336165607, "global_step": 54192, "epoch": 455, "lr": 1.384254505527554e-05} +{"train_loss": 0.001129071693867445, "global_step": 54193, "epoch": 455, "lr": 1.3841014856088363e-05} +{"train_loss": 0.0014334855368360877, "global_step": 54194, "epoch": 455, "lr": 1.3839484727895474e-05} +{"train_loss": 0.00030228550895117223, "global_step": 54195, "epoch": 455, "lr": 1.383795467069991e-05} +{"train_loss": 0.0004130971210543066, "global_step": 54196, "epoch": 455, "lr": 1.3836424684504656e-05} +{"train_loss": 0.0003437992709223181, "global_step": 54197, "epoch": 455, "lr": 1.3834894769312706e-05} +{"train_loss": 0.0009560828912071884, "global_step": 54198, "epoch": 455, "lr": 1.383336492512709e-05} +{"train_loss": 0.00048472717753611505, "global_step": 54199, "epoch": 455, "lr": 1.3831835151950783e-05} +{"train_loss": 0.0006737628136761487, "global_step": 54200, "epoch": 455, "lr": 1.3830305449786818e-05} +{"train_loss": 0.0007534957258030772, "global_step": 54201, "epoch": 455, "lr": 1.3828775818638189e-05} +{"train_loss": 0.0009209763957187533, "global_step": 54202, "epoch": 455, "lr": 1.3827246258507875e-05} +{"train_loss": 0.000547041418030858, "global_step": 54203, "epoch": 455, "lr": 1.3825716769398916e-05} +{"train_loss": 0.0005745463422499597, "global_step": 54204, "epoch": 455, "lr": 1.3824187351314277e-05} +{"train_loss": 0.00041475307079963386, "global_step": 54205, "epoch": 455, "lr": 1.3822658004257e-05} +{"train_loss": 0.0015799986431375146, "global_step": 54206, "epoch": 455, "lr": 1.3821128728230055e-05} +{"train_loss": 0.0008101685089059174, "global_step": 54207, "epoch": 455, "lr": 1.3819599523236476e-05} +{"train_loss": 0.0009039962315000594, "global_step": 54208, "epoch": 455, "lr": 1.3818070389279241e-05} +{"train_loss": 0.0010591349564492702, "global_step": 54209, "epoch": 455, "lr": 1.3816541326361348e-05} +{"train_loss": 0.0011106887832283974, "global_step": 54210, "epoch": 455, "lr": 1.3815012334485827e-05} +{"train_loss": 0.00046530639519914985, "global_step": 54211, "epoch": 455, "lr": 1.3813483413655647e-05} +{"train_loss": 0.0009853971423581243, "global_step": 54212, "epoch": 455, "lr": 1.3811954563873841e-05} +{"train_loss": 0.0009754233178682625, "global_step": 54213, "epoch": 455, "lr": 1.38104257851434e-05} +{"train_loss": 0.0006323012057691813, "global_step": 54214, "epoch": 455, "lr": 1.3808897077467303e-05} +{"train_loss": 0.0005800409126095474, "global_step": 54215, "epoch": 455, "lr": 1.3807368440848584e-05} +{"train_loss": 0.0005338985356502235, "global_step": 54216, "epoch": 455, "lr": 1.3805839875290216e-05} +{"train_loss": 0.0006581340567208827, "global_step": 54217, "epoch": 455, "lr": 1.3804311380795231e-05} +{"train_loss": 0.0005691109108738601, "global_step": 54218, "epoch": 455, "lr": 1.38027829573666e-05} +{"train_loss": 0.0011089133331552148, "global_step": 54219, "epoch": 455, "lr": 1.3801254605007335e-05} +{"train_loss": 0.0007552095339633524, "global_step": 54220, "epoch": 455, "lr": 1.3799726323720458e-05} +{"train_loss": 0.000442928314441815, "global_step": 54221, "epoch": 455, "lr": 1.3798198113508931e-05} +{"train_loss": 0.0006687364657409489, "global_step": 54222, "epoch": 455, "lr": 1.3796669974375792e-05} +{"train_loss": 0.0009271247545257211, "global_step": 54223, "epoch": 455, "lr": 1.3795141906324005e-05} +{"train_loss": 0.0008023568661883473, "global_step": 54224, "epoch": 455, "lr": 1.3793613909356612e-05} +{"train_loss": 0.0003981417394243181, "global_step": 54225, "epoch": 455, "lr": 1.3792085983476565e-05} +{"train_loss": 0.0006792262429371476, "global_step": 54226, "epoch": 455, "lr": 1.3790558128686915e-05} +{"train_loss": 0.00045409699669107795, "global_step": 54227, "epoch": 455, "lr": 1.3789030344990627e-05} +{"train_loss": 0.00039922495489008725, "global_step": 54228, "epoch": 455, "lr": 1.3787502632390697e-05} +{"train_loss": 0.00046573090367019176, "global_step": 54229, "epoch": 455, "lr": 1.3785974990890149e-05} +{"train_loss": 0.00047156697837635875, "global_step": 54230, "epoch": 455, "lr": 1.3784447420491958e-05} +{"train_loss": 0.0006431762012653053, "global_step": 54231, "epoch": 455, "lr": 1.3782919921199156e-05} +{"train_loss": 0.0008857494103722274, "global_step": 54232, "epoch": 455, "lr": 1.3781392493014717e-05} +{"train_loss": 0.0008393923053517938, "global_step": 54233, "epoch": 455, "lr": 1.3779865135941628e-05} +{"train_loss": 0.0010264570591971278, "global_step": 54234, "epoch": 455, "lr": 1.377833784998292e-05} +{"train_loss": 0.00047963872202672064, "global_step": 54235, "epoch": 455, "lr": 1.3776810635141558e-05} +{"train_loss": 0.0011400511721149087, "global_step": 54236, "epoch": 455, "lr": 1.3775283491420576e-05} +{"train_loss": 0.0005037901573814452, "global_step": 54237, "epoch": 455, "lr": 1.3773756418822942e-05} +{"train_loss": 0.00034648695145733654, "global_step": 54238, "epoch": 455, "lr": 1.3772229417351679e-05} +{"train_loss": 0.000464671291410923, "global_step": 54239, "epoch": 455, "lr": 1.3770702487009773e-05} +{"train_loss": 0.0006357302772812545, "global_step": 54240, "epoch": 455, "lr": 1.3769175627800207e-05} +{"train_loss": 0.0006051618838682771, "global_step": 54241, "epoch": 455, "lr": 1.376764883972601e-05} +{"train_loss": 0.0010654415236786008, "global_step": 54242, "epoch": 455, "lr": 1.3766122122790154e-05} +{"train_loss": 0.0008694702992215753, "global_step": 54243, "epoch": 455, "lr": 1.3764595476995657e-05} +{"train_loss": 0.0005553208175115287, "global_step": 54244, "epoch": 455, "lr": 1.3763068902345489e-05} +{"train_loss": 0.0002671167894732207, "global_step": 54245, "epoch": 455, "lr": 1.3761542398842675e-05} +{"train_loss": 0.0003321791591588408, "global_step": 54246, "epoch": 455, "lr": 1.3760015966490209e-05} +{"train_loss": 0.0008357776096090674, "global_step": 54247, "epoch": 455, "lr": 1.3758489605291059e-05} +{"train_loss": 0.0013737407280132174, "global_step": 54248, "epoch": 455, "lr": 1.3756963315248261e-05} +{"train_loss": 0.0009495282429270446, "global_step": 54249, "epoch": 455, "lr": 1.3755437096364782e-05} +{"train_loss": 0.0005659986054524779, "global_step": 54250, "epoch": 455, "lr": 1.375391094864364e-05} +{"train_loss": 0.0008494887733832002, "global_step": 54251, "epoch": 455, "lr": 1.3752384872087804e-05} +{"train_loss": 0.0006657556514255702, "global_step": 54252, "epoch": 455, "lr": 1.3750858866700306e-05} +{"train_loss": 0.00072111637564376, "global_step": 54253, "epoch": 455, "lr": 1.3749332932484111e-05} +{"train_loss": 0.0013286679750308394, "global_step": 54254, "epoch": 455, "lr": 1.3747807069442226e-05} +{"train_loss": 0.0005539439735002816, "global_step": 54255, "epoch": 455, "lr": 1.3746281277577666e-05} +{"train_loss": 0.0005147659685462713, "global_step": 54256, "epoch": 455, "lr": 1.3744755556893391e-05} +{"train_loss": 0.0006630753050558269, "global_step": 54257, "epoch": 455, "lr": 1.3743229907392436e-05} +{"train_loss": 0.0005214127013459802, "global_step": 54258, "epoch": 455, "lr": 1.374170432907777e-05} +{"train_loss": 0.0011468777665868402, "global_step": 54259, "epoch": 455, "lr": 1.3740178821952377e-05} +{"train_loss": 0.0003912505053449422, "global_step": 54260, "epoch": 455, "lr": 1.373865338601929e-05} +{"train_loss": 0.0013067189138382673, "global_step": 54261, "epoch": 455, "lr": 1.3737128021281465e-05} +{"train_loss": 0.0007437068852595985, "global_step": 54262, "epoch": 455, "lr": 1.3735602727741931e-05} +{"train_loss": 0.0007364653792435757, "global_step": 54263, "epoch": 455, "lr": 1.3734077505403665e-05, "val_loss": 0.01987832598388195, "train_action_mse_error": 1.0177321200899314e-05} +{"train_loss": 0.0006734660128131509, "global_step": 54264, "epoch": 456, "lr": 1.3732552354269651e-05} +{"train_loss": 0.0009650347637943923, "global_step": 54265, "epoch": 456, "lr": 1.3731027274342911e-05} +{"train_loss": 0.0005538278492167592, "global_step": 54266, "epoch": 456, "lr": 1.372950226562641e-05} +{"train_loss": 0.00035370702971704304, "global_step": 54267, "epoch": 456, "lr": 1.3727977328123164e-05} +{"train_loss": 0.0008269330719485879, "global_step": 54268, "epoch": 456, "lr": 1.3726452461836153e-05} +{"train_loss": 0.0007258565747179091, "global_step": 54269, "epoch": 456, "lr": 1.3724927666768388e-05} +{"train_loss": 0.0012208111584186554, "global_step": 54270, "epoch": 456, "lr": 1.3723402942922852e-05} +{"train_loss": 0.0010271139908581972, "global_step": 54271, "epoch": 456, "lr": 1.3721878290302526e-05} +{"train_loss": 0.0005642853211611509, "global_step": 54272, "epoch": 456, "lr": 1.3720353708910427e-05} +{"train_loss": 0.00041654074448160827, "global_step": 54273, "epoch": 456, "lr": 1.3718829198749528e-05} +{"train_loss": 0.0006276196800172329, "global_step": 54274, "epoch": 456, "lr": 1.3717304759822846e-05} +{"train_loss": 0.0006554808933287859, "global_step": 54275, "epoch": 456, "lr": 1.3715780392133343e-05} +{"train_loss": 0.0009617495816200972, "global_step": 54276, "epoch": 456, "lr": 1.3714256095684042e-05} +{"train_loss": 0.0009689846774563193, "global_step": 54277, "epoch": 456, "lr": 1.3712731870477925e-05} +{"train_loss": 0.0007988567231222987, "global_step": 54278, "epoch": 456, "lr": 1.3711207716517965e-05} +{"train_loss": 0.0007563236285932362, "global_step": 54279, "epoch": 456, "lr": 1.370968363380719e-05} +{"train_loss": 0.0010281556751579046, "global_step": 54280, "epoch": 456, "lr": 1.370815962234856e-05} +{"train_loss": 0.0008772430010139942, "global_step": 54281, "epoch": 456, "lr": 1.3706635682145091e-05} +{"train_loss": 0.0004580568347591907, "global_step": 54282, "epoch": 456, "lr": 1.3705111813199756e-05} +{"train_loss": 0.0003138897882308811, "global_step": 54283, "epoch": 456, "lr": 1.3703588015515568e-05} +{"train_loss": 0.0007083687814883888, "global_step": 54284, "epoch": 456, "lr": 1.3702064289095495e-05} +{"train_loss": 0.0006630339776165783, "global_step": 54285, "epoch": 456, "lr": 1.3700540633942554e-05} +{"train_loss": 0.0009084410266950727, "global_step": 54286, "epoch": 456, "lr": 1.3699017050059708e-05} +{"train_loss": 0.0007924575475044549, "global_step": 54287, "epoch": 456, "lr": 1.3697493537449979e-05} +{"train_loss": 0.00045336520997807384, "global_step": 54288, "epoch": 456, "lr": 1.3695970096116329e-05} +{"train_loss": 0.0009469881770201027, "global_step": 54289, "epoch": 456, "lr": 1.3694446726061777e-05} +{"train_loss": 0.000978322932496667, "global_step": 54290, "epoch": 456, "lr": 1.3692923427289289e-05} +{"train_loss": 0.0006884839967824519, "global_step": 54291, "epoch": 456, "lr": 1.369140019980188e-05} +{"train_loss": 0.001431065145879984, "global_step": 54292, "epoch": 456, "lr": 1.3689877043602511e-05} +{"train_loss": 0.0006053290562704206, "global_step": 54293, "epoch": 456, "lr": 1.3688353958694206e-05} +{"train_loss": 0.0009520332096144557, "global_step": 54294, "epoch": 456, "lr": 1.368683094507992e-05} +{"train_loss": 0.0003597618779167533, "global_step": 54295, "epoch": 456, "lr": 1.368530800276268e-05} +{"train_loss": 0.0005498293321579695, "global_step": 54296, "epoch": 456, "lr": 1.3683785131745458e-05} +{"train_loss": 0.0003799942205660045, "global_step": 54297, "epoch": 456, "lr": 1.3682262332031225e-05} +{"train_loss": 0.0005536370445042849, "global_step": 54298, "epoch": 456, "lr": 1.3680739603623011e-05} +{"train_loss": 0.0005901765543967485, "global_step": 54299, "epoch": 456, "lr": 1.367921694652377e-05} +{"train_loss": 0.0006398988771252334, "global_step": 54300, "epoch": 456, "lr": 1.3677694360736516e-05} +{"train_loss": 0.001294253976084292, "global_step": 54301, "epoch": 456, "lr": 1.367617184626423e-05} +{"train_loss": 0.0003292365581728518, "global_step": 54302, "epoch": 456, "lr": 1.367464940310989e-05} +{"train_loss": 0.0007952290470711887, "global_step": 54303, "epoch": 456, "lr": 1.3673127031276505e-05} +{"train_loss": 0.00044624213478527963, "global_step": 54304, "epoch": 456, "lr": 1.367160473076704e-05} +{"train_loss": 0.0011458880035206676, "global_step": 54305, "epoch": 456, "lr": 1.3670082501584514e-05} +{"train_loss": 0.00048485497245565057, "global_step": 54306, "epoch": 456, "lr": 1.3668560343731884e-05} +{"train_loss": 0.0007463691290467978, "global_step": 54307, "epoch": 456, "lr": 1.3667038257212166e-05} +{"train_loss": 0.0007622534758411348, "global_step": 54308, "epoch": 456, "lr": 1.3665516242028342e-05} +{"train_loss": 0.0006560933543369174, "global_step": 54309, "epoch": 456, "lr": 1.366399429818338e-05} +{"train_loss": 0.0008013269980438054, "global_step": 54310, "epoch": 456, "lr": 1.3662472425680296e-05} +{"train_loss": 0.0005914654466323555, "global_step": 54311, "epoch": 456, "lr": 1.366095062452205e-05} +{"train_loss": 0.0007126195705495775, "global_step": 54312, "epoch": 456, "lr": 1.3659428894711663e-05} +{"train_loss": 0.0008557710680179298, "global_step": 54313, "epoch": 456, "lr": 1.3657907236252088e-05} +{"train_loss": 0.00042971718357875943, "global_step": 54314, "epoch": 456, "lr": 1.3656385649146341e-05} +{"train_loss": 0.0007880889461375773, "global_step": 54315, "epoch": 456, "lr": 1.3654864133397405e-05} +{"train_loss": 0.0005681493203155696, "global_step": 54316, "epoch": 456, "lr": 1.3653342689008241e-05} +{"train_loss": 0.0010169545421376824, "global_step": 54317, "epoch": 456, "lr": 1.3651821315981856e-05} +{"train_loss": 0.00032064103288576007, "global_step": 54318, "epoch": 456, "lr": 1.3650300014321254e-05} +{"train_loss": 0.0006836937973275781, "global_step": 54319, "epoch": 456, "lr": 1.3648778784029387e-05} +{"train_loss": 0.0007112880703061819, "global_step": 54320, "epoch": 456, "lr": 1.3647257625109273e-05} +{"train_loss": 0.00038115138886496425, "global_step": 54321, "epoch": 456, "lr": 1.3645736537563875e-05} +{"train_loss": 0.0004035990568809211, "global_step": 54322, "epoch": 456, "lr": 1.3644215521396198e-05} +{"train_loss": 0.0005381318042054772, "global_step": 54323, "epoch": 456, "lr": 1.3642694576609211e-05} +{"train_loss": 0.0006247048731893301, "global_step": 54324, "epoch": 456, "lr": 1.3641173703205918e-05} +{"train_loss": 0.0004287716292310506, "global_step": 54325, "epoch": 456, "lr": 1.3639652901189287e-05} +{"train_loss": 0.0008931902702897787, "global_step": 54326, "epoch": 456, "lr": 1.3638132170562324e-05} +{"train_loss": 0.0005180223961360753, "global_step": 54327, "epoch": 456, "lr": 1.3636611511328008e-05} +{"train_loss": 0.0003914161934517324, "global_step": 54328, "epoch": 456, "lr": 1.3635090923489302e-05} +{"train_loss": 0.0010589027078822255, "global_step": 54329, "epoch": 456, "lr": 1.3633570407049224e-05} +{"train_loss": 0.00037331038038246334, "global_step": 54330, "epoch": 456, "lr": 1.363204996201073e-05} +{"train_loss": 0.0005128610646352172, "global_step": 54331, "epoch": 456, "lr": 1.363052958837684e-05} +{"train_loss": 0.00035394870792515576, "global_step": 54332, "epoch": 456, "lr": 1.3629009286150512e-05} +{"train_loss": 0.0008506706217303872, "global_step": 54333, "epoch": 456, "lr": 1.362748905533473e-05} +{"train_loss": 0.0006347004673443735, "global_step": 54334, "epoch": 456, "lr": 1.36259688959325e-05} +{"train_loss": 0.00041966798016801476, "global_step": 54335, "epoch": 456, "lr": 1.3624448807946782e-05} +{"train_loss": 0.0008829290745779872, "global_step": 54336, "epoch": 456, "lr": 1.3622928791380585e-05} +{"train_loss": 0.0005975340609438717, "global_step": 54337, "epoch": 456, "lr": 1.3621408846236867e-05} +{"train_loss": 0.0004475089081097394, "global_step": 54338, "epoch": 456, "lr": 1.3619888972518641e-05} +{"train_loss": 0.0003613361914176494, "global_step": 54339, "epoch": 456, "lr": 1.3618369170228879e-05} +{"train_loss": 0.0006837710388936102, "global_step": 54340, "epoch": 456, "lr": 1.3616849439370544e-05} +{"train_loss": 0.0008081624400801957, "global_step": 54341, "epoch": 456, "lr": 1.3615329779946651e-05} +{"train_loss": 0.000829036463983357, "global_step": 54342, "epoch": 456, "lr": 1.3613810191960159e-05} +{"train_loss": 0.00044014546438120306, "global_step": 54343, "epoch": 456, "lr": 1.361229067541408e-05} +{"train_loss": 0.0006701109814457595, "global_step": 54344, "epoch": 456, "lr": 1.3610771230311364e-05} +{"train_loss": 0.00035867124097421765, "global_step": 54345, "epoch": 456, "lr": 1.3609251856655026e-05} +{"train_loss": 0.0004672673821914941, "global_step": 54346, "epoch": 456, "lr": 1.3607732554448032e-05} +{"train_loss": 0.000520497327670455, "global_step": 54347, "epoch": 456, "lr": 1.3606213323693357e-05} +{"train_loss": 0.0005747013492509723, "global_step": 54348, "epoch": 456, "lr": 1.3604694164394005e-05} +{"train_loss": 0.0007304797763936222, "global_step": 54349, "epoch": 456, "lr": 1.3603175076552932e-05} +{"train_loss": 0.0004648693429771811, "global_step": 54350, "epoch": 456, "lr": 1.3601656060173151e-05} +{"train_loss": 0.0012820940464735031, "global_step": 54351, "epoch": 456, "lr": 1.3600137115257621e-05} +{"train_loss": 0.0005080176633782685, "global_step": 54352, "epoch": 456, "lr": 1.359861824180933e-05} +{"train_loss": 0.0005111994105391204, "global_step": 54353, "epoch": 456, "lr": 1.3597099439831273e-05} +{"train_loss": 0.0006234198808670044, "global_step": 54354, "epoch": 456, "lr": 1.3595580709326411e-05} +{"train_loss": 0.00032627477776259184, "global_step": 54355, "epoch": 456, "lr": 1.3594062050297757e-05} +{"train_loss": 0.0009852558141574264, "global_step": 54356, "epoch": 456, "lr": 1.3592543462748253e-05} +{"train_loss": 0.0008022249094210565, "global_step": 54357, "epoch": 456, "lr": 1.3591024946680913e-05} +{"train_loss": 0.0006239816430024803, "global_step": 54358, "epoch": 456, "lr": 1.3589506502098709e-05} +{"train_loss": 0.0005014569032937288, "global_step": 54359, "epoch": 456, "lr": 1.3587988129004603e-05} +{"train_loss": 0.0003795266093220562, "global_step": 54360, "epoch": 456, "lr": 1.358646982740161e-05} +{"train_loss": 0.0006193075678311288, "global_step": 54361, "epoch": 456, "lr": 1.3584951597292673e-05} +{"train_loss": 0.00032337542506866157, "global_step": 54362, "epoch": 456, "lr": 1.358343343868081e-05} +{"train_loss": 0.001128846313804388, "global_step": 54363, "epoch": 456, "lr": 1.3581915351568974e-05} +{"train_loss": 0.0014774680603295565, "global_step": 54364, "epoch": 456, "lr": 1.3580397335960165e-05} +{"train_loss": 0.0008087134337984025, "global_step": 54365, "epoch": 456, "lr": 1.3578879391857363e-05} +{"train_loss": 0.0004959514481015503, "global_step": 54366, "epoch": 456, "lr": 1.3577361519263521e-05} +{"train_loss": 0.0006302446126937866, "global_step": 54367, "epoch": 456, "lr": 1.3575843718181652e-05} +{"train_loss": 0.0003916282730642706, "global_step": 54368, "epoch": 456, "lr": 1.3574325988614706e-05} +{"train_loss": 0.0007509759743697941, "global_step": 54369, "epoch": 456, "lr": 1.35728083305657e-05} +{"train_loss": 0.0006967567605897784, "global_step": 54370, "epoch": 456, "lr": 1.357129074403759e-05} +{"train_loss": 0.0013847654918208718, "global_step": 54371, "epoch": 456, "lr": 1.3569773229033345e-05} +{"train_loss": 0.0004346697241999209, "global_step": 54372, "epoch": 456, "lr": 1.3568255785555972e-05} +{"train_loss": 0.0010179094970226288, "global_step": 54373, "epoch": 456, "lr": 1.3566738413608422e-05} +{"train_loss": 0.00035898861824534833, "global_step": 54374, "epoch": 456, "lr": 1.3565221113193705e-05} +{"train_loss": 0.0004113739123567939, "global_step": 54375, "epoch": 456, "lr": 1.3563703884314765e-05} +{"train_loss": 0.0007365343626588583, "global_step": 54376, "epoch": 456, "lr": 1.3562186726974618e-05} +{"train_loss": 0.001098613953217864, "global_step": 54377, "epoch": 456, "lr": 1.3560669641176227e-05} +{"train_loss": 0.0005496072699315846, "global_step": 54378, "epoch": 456, "lr": 1.355915262692255e-05} +{"train_loss": 0.0004738723218906671, "global_step": 54379, "epoch": 456, "lr": 1.3557635684216597e-05} +{"train_loss": 0.0010900439228862524, "global_step": 54380, "epoch": 456, "lr": 1.3556118813061318e-05} +{"train_loss": 0.0008296133601106703, "global_step": 54381, "epoch": 456, "lr": 1.3554602013459722e-05} +{"train_loss": 0.000680637887058811, "global_step": 54382, "epoch": 456, "lr": 1.3553085285414758e-05, "val_loss": 0.026579199358820915} +{"train_loss": 0.0006651682197116315, "global_step": 54383, "epoch": 457, "lr": 1.3551568628929434e-05} +{"train_loss": 0.0006312195328064263, "global_step": 54384, "epoch": 457, "lr": 1.3550052044006695e-05} +{"train_loss": 0.000670993176754564, "global_step": 54385, "epoch": 457, "lr": 1.3548535530649548e-05} +{"train_loss": 0.0007768968353047967, "global_step": 54386, "epoch": 457, "lr": 1.354701908886094e-05} +{"train_loss": 0.0006911210948601365, "global_step": 54387, "epoch": 457, "lr": 1.354550271864387e-05} +{"train_loss": 0.0005661762552335858, "global_step": 54388, "epoch": 457, "lr": 1.3543986420001325e-05} +{"train_loss": 0.00048740010242909193, "global_step": 54389, "epoch": 457, "lr": 1.3542470192936268e-05} +{"train_loss": 0.0010111972223967314, "global_step": 54390, "epoch": 457, "lr": 1.3540954037451659e-05} +{"train_loss": 0.0005050417967140675, "global_step": 54391, "epoch": 457, "lr": 1.3539437953550504e-05} +{"train_loss": 0.0005700767505913973, "global_step": 54392, "epoch": 457, "lr": 1.353792194123576e-05} +{"train_loss": 0.00040457857539877295, "global_step": 54393, "epoch": 457, "lr": 1.3536406000510421e-05} +{"train_loss": 0.0010748648783192039, "global_step": 54394, "epoch": 457, "lr": 1.3534890131377437e-05} +{"train_loss": 0.0008065013098530471, "global_step": 54395, "epoch": 457, "lr": 1.353337433383982e-05} +{"train_loss": 0.0005866146530024707, "global_step": 54396, "epoch": 457, "lr": 1.3531858607900522e-05} +{"train_loss": 0.0005597343551926315, "global_step": 54397, "epoch": 457, "lr": 1.3530342953562514e-05} +{"train_loss": 0.0008056434453465044, "global_step": 54398, "epoch": 457, "lr": 1.3528827370828789e-05} +{"train_loss": 0.00028934955480508506, "global_step": 54399, "epoch": 457, "lr": 1.3527311859702307e-05} +{"train_loss": 0.0005600868607871234, "global_step": 54400, "epoch": 457, "lr": 1.3525796420186065e-05} +{"train_loss": 0.0008257839363068342, "global_step": 54401, "epoch": 457, "lr": 1.3524281052283022e-05} +{"train_loss": 0.0008786025573499501, "global_step": 54402, "epoch": 457, "lr": 1.3522765755996141e-05} +{"train_loss": 0.0004852843994740397, "global_step": 54403, "epoch": 457, "lr": 1.3521250531328433e-05} +{"train_loss": 0.0004193595377728343, "global_step": 54404, "epoch": 457, "lr": 1.3519735378282833e-05} +{"train_loss": 0.0006585209048353136, "global_step": 54405, "epoch": 457, "lr": 1.3518220296862354e-05} +{"train_loss": 0.0006461568409577012, "global_step": 54406, "epoch": 457, "lr": 1.3516705287069931e-05} +{"train_loss": 0.0007885916857048869, "global_step": 54407, "epoch": 457, "lr": 1.351519034890858e-05} +{"train_loss": 0.00024408998433500528, "global_step": 54408, "epoch": 457, "lr": 1.3513675482381254e-05} +{"train_loss": 0.00047273398377001286, "global_step": 54409, "epoch": 457, "lr": 1.351216068749091e-05} +{"train_loss": 0.00033945744507946074, "global_step": 54410, "epoch": 457, "lr": 1.351064596424056e-05} +{"train_loss": 0.0011593354865908623, "global_step": 54411, "epoch": 457, "lr": 1.350913131263314e-05} +{"train_loss": 0.0004446940147317946, "global_step": 54412, "epoch": 457, "lr": 1.3507616732671658e-05} +{"train_loss": 0.0007472601137124002, "global_step": 54413, "epoch": 457, "lr": 1.3506102224359051e-05} +{"train_loss": 0.0005142877344042063, "global_step": 54414, "epoch": 457, "lr": 1.3504587787698336e-05} +{"train_loss": 0.0007526876288466156, "global_step": 54415, "epoch": 457, "lr": 1.3503073422692447e-05} +{"train_loss": 0.0005462479311972857, "global_step": 54416, "epoch": 457, "lr": 1.3501559129344393e-05} +{"train_loss": 0.00035109109012410045, "global_step": 54417, "epoch": 457, "lr": 1.3500044907657106e-05} +{"train_loss": 0.00035914155887439847, "global_step": 54418, "epoch": 457, "lr": 1.3498530757633604e-05} +{"train_loss": 0.000559890759177506, "global_step": 54419, "epoch": 457, "lr": 1.3497016679276813e-05} +{"train_loss": 0.0004692410584539175, "global_step": 54420, "epoch": 457, "lr": 1.3495502672589754e-05} +{"train_loss": 0.00037776713725179434, "global_step": 54421, "epoch": 457, "lr": 1.3493988737575359e-05} +{"train_loss": 0.00036740556242875755, "global_step": 54422, "epoch": 457, "lr": 1.3492474874236627e-05} +{"train_loss": 0.000535996921826154, "global_step": 54423, "epoch": 457, "lr": 1.3490961082576509e-05} +{"train_loss": 0.000384878454497084, "global_step": 54424, "epoch": 457, "lr": 1.3489447362598001e-05} +{"train_loss": 0.00039555973489768803, "global_step": 54425, "epoch": 457, "lr": 1.3487933714304052e-05} +{"train_loss": 0.0007470994023606181, "global_step": 54426, "epoch": 457, "lr": 1.3486420137697653e-05} +{"train_loss": 0.0006148163229227066, "global_step": 54427, "epoch": 457, "lr": 1.3484906632781774e-05} +{"train_loss": 0.0006576154846698046, "global_step": 54428, "epoch": 457, "lr": 1.3483393199559358e-05} +{"train_loss": 0.0007107849814929068, "global_step": 54429, "epoch": 457, "lr": 1.3481879838033418e-05} +{"train_loss": 0.0004329567891545594, "global_step": 54430, "epoch": 457, "lr": 1.348036654820689e-05} +{"train_loss": 0.0006894420948810875, "global_step": 54431, "epoch": 457, "lr": 1.3478853330082775e-05} +{"train_loss": 0.00022148214338812977, "global_step": 54432, "epoch": 457, "lr": 1.3477340183664017e-05} +{"train_loss": 0.0004467374237719923, "global_step": 54433, "epoch": 457, "lr": 1.3475827108953609e-05} +{"train_loss": 0.0010250166524201632, "global_step": 54434, "epoch": 457, "lr": 1.3474314105954517e-05} +{"train_loss": 0.00055337930098176, "global_step": 54435, "epoch": 457, "lr": 1.3472801174669692e-05} +{"train_loss": 0.0007219096878543496, "global_step": 54436, "epoch": 457, "lr": 1.3471288315102131e-05} +{"train_loss": 0.000403253041440621, "global_step": 54437, "epoch": 457, "lr": 1.346977552725478e-05} +{"train_loss": 0.0008089237962849438, "global_step": 54438, "epoch": 457, "lr": 1.3468262811130638e-05} +{"train_loss": 0.0005361278308555484, "global_step": 54439, "epoch": 457, "lr": 1.3466750166732662e-05} +{"train_loss": 0.0008782881777733564, "global_step": 54440, "epoch": 457, "lr": 1.34652375940638e-05} +{"train_loss": 0.0006707023130729795, "global_step": 54441, "epoch": 457, "lr": 1.3463725093127056e-05} +{"train_loss": 0.000913866562768817, "global_step": 54442, "epoch": 457, "lr": 1.3462212663925367e-05} +{"train_loss": 0.0005213170661590993, "global_step": 54443, "epoch": 457, "lr": 1.3460700306461738e-05} +{"train_loss": 0.000517072738148272, "global_step": 54444, "epoch": 457, "lr": 1.3459188020739106e-05} +{"train_loss": 0.00043757547973655164, "global_step": 54445, "epoch": 457, "lr": 1.3457675806760473e-05} +{"train_loss": 0.00036735981120727956, "global_step": 54446, "epoch": 457, "lr": 1.3456163664528781e-05} +{"train_loss": 0.0004861914785578847, "global_step": 54447, "epoch": 457, "lr": 1.3454651594046996e-05} +{"train_loss": 0.0008751916466280818, "global_step": 54448, "epoch": 457, "lr": 1.3453139595318115e-05} +{"train_loss": 0.0005585221806541085, "global_step": 54449, "epoch": 457, "lr": 1.3451627668345075e-05} +{"train_loss": 0.00041483843233436346, "global_step": 54450, "epoch": 457, "lr": 1.345011581313086e-05} +{"train_loss": 0.0007456954917870462, "global_step": 54451, "epoch": 457, "lr": 1.3448604029678452e-05} +{"train_loss": 0.0006460573640652001, "global_step": 54452, "epoch": 457, "lr": 1.344709231799079e-05} +{"train_loss": 0.0005839446093887091, "global_step": 54453, "epoch": 457, "lr": 1.3445580678070868e-05} +{"train_loss": 0.000558971194550395, "global_step": 54454, "epoch": 457, "lr": 1.3444069109921631e-05} +{"train_loss": 0.00037741666892543435, "global_step": 54455, "epoch": 457, "lr": 1.3442557613546076e-05} +{"train_loss": 0.0003994568542111665, "global_step": 54456, "epoch": 457, "lr": 1.3441046188947138e-05} +{"train_loss": 0.0007767463685013354, "global_step": 54457, "epoch": 457, "lr": 1.3439534836127815e-05} +{"train_loss": 0.0003992592392023653, "global_step": 54458, "epoch": 457, "lr": 1.3438023555091057e-05} +{"train_loss": 0.0005363473319448531, "global_step": 54459, "epoch": 457, "lr": 1.3436512345839819e-05} +{"train_loss": 0.0007072820444591343, "global_step": 54460, "epoch": 457, "lr": 1.3435001208377102e-05} +{"train_loss": 0.0006486679194495082, "global_step": 54461, "epoch": 457, "lr": 1.3433490142705834e-05} +{"train_loss": 0.000296011712634936, "global_step": 54462, "epoch": 457, "lr": 1.3431979148829015e-05} +{"train_loss": 0.0006560522015206516, "global_step": 54463, "epoch": 457, "lr": 1.3430468226749587e-05} +{"train_loss": 0.00044961809180676937, "global_step": 54464, "epoch": 457, "lr": 1.3428957376470541e-05} +{"train_loss": 0.0004113117465749383, "global_step": 54465, "epoch": 457, "lr": 1.3427446597994836e-05} +{"train_loss": 0.0005645898054353893, "global_step": 54466, "epoch": 457, "lr": 1.3425935891325408e-05} +{"train_loss": 0.0009294215124100447, "global_step": 54467, "epoch": 457, "lr": 1.3424425256465273e-05} +{"train_loss": 0.0008572997176088393, "global_step": 54468, "epoch": 457, "lr": 1.3422914693417349e-05} +{"train_loss": 0.00039666524389758706, "global_step": 54469, "epoch": 457, "lr": 1.342140420218464e-05} +{"train_loss": 0.0005250662798061967, "global_step": 54470, "epoch": 457, "lr": 1.3419893782770098e-05} +{"train_loss": 0.0007253616349771619, "global_step": 54471, "epoch": 457, "lr": 1.3418383435176668e-05} +{"train_loss": 0.0004086029657628387, "global_step": 54472, "epoch": 457, "lr": 1.341687315940735e-05} +{"train_loss": 0.0009555207216180861, "global_step": 54473, "epoch": 457, "lr": 1.3415362955465082e-05} +{"train_loss": 0.00045142616727389395, "global_step": 54474, "epoch": 457, "lr": 1.3413852823352851e-05} +{"train_loss": 0.0011291240807622671, "global_step": 54475, "epoch": 457, "lr": 1.3412342763073598e-05} +{"train_loss": 0.0003049715596716851, "global_step": 54476, "epoch": 457, "lr": 1.3410832774630322e-05} +{"train_loss": 0.0003581777273211628, "global_step": 54477, "epoch": 457, "lr": 1.3409322858025958e-05} +{"train_loss": 0.0006053319084458053, "global_step": 54478, "epoch": 457, "lr": 1.340781301326347e-05} +{"train_loss": 0.0002949977933894843, "global_step": 54479, "epoch": 457, "lr": 1.3406303240345847e-05} +{"train_loss": 0.0006715251947753131, "global_step": 54480, "epoch": 457, "lr": 1.3404793539276018e-05} +{"train_loss": 0.0006849094061180949, "global_step": 54481, "epoch": 457, "lr": 1.3403283910056985e-05} +{"train_loss": 0.0002568028576206416, "global_step": 54482, "epoch": 457, "lr": 1.3401774352691681e-05} +{"train_loss": 0.0005511788185685873, "global_step": 54483, "epoch": 457, "lr": 1.3400264867183093e-05} +{"train_loss": 0.0005390658625401556, "global_step": 54484, "epoch": 457, "lr": 1.3398755453534167e-05} +{"train_loss": 0.0003122803755104542, "global_step": 54485, "epoch": 457, "lr": 1.339724611174787e-05} +{"train_loss": 0.000701993063557893, "global_step": 54486, "epoch": 457, "lr": 1.3395736841827184e-05} +{"train_loss": 0.0008911735494621098, "global_step": 54487, "epoch": 457, "lr": 1.3394227643775049e-05} +{"train_loss": 0.0003530376998241991, "global_step": 54488, "epoch": 457, "lr": 1.3392718517594443e-05} +{"train_loss": 0.0008230310049839318, "global_step": 54489, "epoch": 457, "lr": 1.3391209463288329e-05} +{"train_loss": 0.0012439752463251352, "global_step": 54490, "epoch": 457, "lr": 1.3389700480859652e-05} +{"train_loss": 0.0008232063846662641, "global_step": 54491, "epoch": 457, "lr": 1.3388191570311399e-05} +{"train_loss": 0.0005145625327713788, "global_step": 54492, "epoch": 457, "lr": 1.33866827316465e-05} +{"train_loss": 0.00040639055077917874, "global_step": 54493, "epoch": 457, "lr": 1.3385173964867959e-05} +{"train_loss": 0.0006811293424107134, "global_step": 54494, "epoch": 457, "lr": 1.3383665269978702e-05} +{"train_loss": 0.0009992956183850765, "global_step": 54495, "epoch": 457, "lr": 1.3382156646981719e-05} +{"train_loss": 0.0007459495100192726, "global_step": 54496, "epoch": 457, "lr": 1.338064809587996e-05} +{"train_loss": 0.0005623667384497821, "global_step": 54497, "epoch": 457, "lr": 1.3379139616676373e-05} +{"train_loss": 0.0009405412711203098, "global_step": 54498, "epoch": 457, "lr": 1.3377631209373948e-05} +{"train_loss": 0.000577141938265413, "global_step": 54499, "epoch": 457, "lr": 1.3376122873975616e-05} +{"train_loss": 0.0005298047326505184, "global_step": 54500, "epoch": 457, "lr": 1.3374614610484366e-05} +{"train_loss": 0.0006053952093993337, "global_step": 54501, "epoch": 457, "lr": 1.3373106418903136e-05, "val_loss": 0.030528753995895386} +{"train_loss": 0.0005269594839774072, "global_step": 54502, "epoch": 458, "lr": 1.3371598299234911e-05} +{"train_loss": 0.0005537302349694073, "global_step": 54503, "epoch": 458, "lr": 1.3370090251482642e-05} +{"train_loss": 0.0009994048159569502, "global_step": 54504, "epoch": 458, "lr": 1.3368582275649271e-05} +{"train_loss": 0.0005281012272462249, "global_step": 54505, "epoch": 458, "lr": 1.3367074371737792e-05} +{"train_loss": 0.0004325355985201895, "global_step": 54506, "epoch": 458, "lr": 1.3365566539751129e-05} +{"train_loss": 0.0009359571267850697, "global_step": 54507, "epoch": 458, "lr": 1.3364058779692284e-05} +{"train_loss": 0.0007043845253065228, "global_step": 54508, "epoch": 458, "lr": 1.3362551091564191e-05} +{"train_loss": 0.0005491662304848433, "global_step": 54509, "epoch": 458, "lr": 1.33610434753698e-05} +{"train_loss": 0.0004071524308528751, "global_step": 54510, "epoch": 458, "lr": 1.3359535931112105e-05} +{"train_loss": 0.0005080900155007839, "global_step": 54511, "epoch": 458, "lr": 1.3358028458794025e-05} +{"train_loss": 0.0009851520881056786, "global_step": 54512, "epoch": 458, "lr": 1.3356521058418564e-05} +{"train_loss": 0.00033373531186953187, "global_step": 54513, "epoch": 458, "lr": 1.3355013729988641e-05} +{"train_loss": 0.0011138980044052005, "global_step": 54514, "epoch": 458, "lr": 1.3353506473507243e-05} +{"train_loss": 0.0005842829123139381, "global_step": 54515, "epoch": 458, "lr": 1.3351999288977312e-05} +{"train_loss": 0.0005884167621843517, "global_step": 54516, "epoch": 458, "lr": 1.335049217640183e-05} +{"train_loss": 0.0009289843146689236, "global_step": 54517, "epoch": 458, "lr": 1.3348985135783721e-05} +{"train_loss": 0.00036644883221015334, "global_step": 54518, "epoch": 458, "lr": 1.3347478167125982e-05} +{"train_loss": 0.0009651309810578823, "global_step": 54519, "epoch": 458, "lr": 1.334597127043154e-05} +{"train_loss": 0.0005535106756724417, "global_step": 54520, "epoch": 458, "lr": 1.334446444570338e-05} +{"train_loss": 0.0004149916931055486, "global_step": 54521, "epoch": 458, "lr": 1.3342957692944435e-05} +{"train_loss": 0.000497573462780565, "global_step": 54522, "epoch": 458, "lr": 1.3341451012157696e-05} +{"train_loss": 0.0003693728649523109, "global_step": 54523, "epoch": 458, "lr": 1.3339944403346078e-05} +{"train_loss": 0.0009336855146102607, "global_step": 54524, "epoch": 458, "lr": 1.3338437866512583e-05} +{"train_loss": 0.0007605512510053813, "global_step": 54525, "epoch": 458, "lr": 1.333693140166013e-05} +{"train_loss": 0.0005249198293313384, "global_step": 54526, "epoch": 458, "lr": 1.3335425008791714e-05} +{"train_loss": 0.0002925940207205713, "global_step": 54527, "epoch": 458, "lr": 1.3333918687910273e-05} +{"train_loss": 0.00037481298204511404, "global_step": 54528, "epoch": 458, "lr": 1.333241243901875e-05} +{"train_loss": 0.0009418496047146618, "global_step": 54529, "epoch": 458, "lr": 1.333090626212013e-05} +{"train_loss": 0.0009068017825484276, "global_step": 54530, "epoch": 458, "lr": 1.3329400157217348e-05} +{"train_loss": 0.0003831434587482363, "global_step": 54531, "epoch": 458, "lr": 1.3327894124313383e-05} +{"train_loss": 0.0005739324260503054, "global_step": 54532, "epoch": 458, "lr": 1.3326388163411164e-05} +{"train_loss": 0.0006170269334688783, "global_step": 54533, "epoch": 458, "lr": 1.3324882274513679e-05} +{"train_loss": 0.00037422924651764333, "global_step": 54534, "epoch": 458, "lr": 1.3323376457623871e-05} +{"train_loss": 0.0006408262997865677, "global_step": 54535, "epoch": 458, "lr": 1.3321870712744683e-05} +{"train_loss": 0.001203124993480742, "global_step": 54536, "epoch": 458, "lr": 1.3320365039879095e-05} +{"train_loss": 0.0005699226167052984, "global_step": 54537, "epoch": 458, "lr": 1.3318859439030035e-05} +{"train_loss": 0.0008121232385747135, "global_step": 54538, "epoch": 458, "lr": 1.3317353910200492e-05} +{"train_loss": 0.0004111156740691513, "global_step": 54539, "epoch": 458, "lr": 1.331584845339341e-05} +{"train_loss": 0.0009330013417638838, "global_step": 54540, "epoch": 458, "lr": 1.3314343068611718e-05} +{"train_loss": 0.0015086965868249536, "global_step": 54541, "epoch": 458, "lr": 1.3312837755858414e-05} +{"train_loss": 0.0006848369375802577, "global_step": 54542, "epoch": 458, "lr": 1.3311332515136416e-05} +{"train_loss": 0.0006601976929232478, "global_step": 54543, "epoch": 458, "lr": 1.3309827346448716e-05} +{"train_loss": 0.0004884726367890835, "global_step": 54544, "epoch": 458, "lr": 1.3308322249798234e-05} +{"train_loss": 0.0006154505535960197, "global_step": 54545, "epoch": 458, "lr": 1.330681722518795e-05} +{"train_loss": 0.00044158162199892104, "global_step": 54546, "epoch": 458, "lr": 1.33053122726208e-05} +{"train_loss": 0.0007082390366122127, "global_step": 54547, "epoch": 458, "lr": 1.3303807392099765e-05} +{"train_loss": 0.0009668932179920375, "global_step": 54548, "epoch": 458, "lr": 1.3302302583627768e-05} +{"train_loss": 0.0004363335610833019, "global_step": 54549, "epoch": 458, "lr": 1.3300797847207797e-05} +{"train_loss": 0.00036676652962341905, "global_step": 54550, "epoch": 458, "lr": 1.329929318284277e-05} +{"train_loss": 0.0006713987095281482, "global_step": 54551, "epoch": 458, "lr": 1.3297788590535676e-05} +{"train_loss": 0.000313394091790542, "global_step": 54552, "epoch": 458, "lr": 1.3296284070289438e-05} +{"train_loss": 0.0005158031126484275, "global_step": 54553, "epoch": 458, "lr": 1.329477962210704e-05} +{"train_loss": 0.0006113540148362517, "global_step": 54554, "epoch": 458, "lr": 1.3293275245991404e-05} +{"train_loss": 0.000858236919157207, "global_step": 54555, "epoch": 458, "lr": 1.329177094194552e-05} +{"train_loss": 0.0004378891026135534, "global_step": 54556, "epoch": 458, "lr": 1.3290266709972304e-05} +{"train_loss": 0.00046469984226860106, "global_step": 54557, "epoch": 458, "lr": 1.3288762550074741e-05} +{"train_loss": 0.0007003164500929415, "global_step": 54558, "epoch": 458, "lr": 1.3287258462255775e-05} +{"train_loss": 0.0003348102036397904, "global_step": 54559, "epoch": 458, "lr": 1.3285754446518334e-05} +{"train_loss": 0.0009285407140851021, "global_step": 54560, "epoch": 458, "lr": 1.3284250502865415e-05} +{"train_loss": 0.0006626852555200458, "global_step": 54561, "epoch": 458, "lr": 1.3282746631299925e-05} +{"train_loss": 0.0006278370274230838, "global_step": 54562, "epoch": 458, "lr": 1.3281242831824858e-05} +{"train_loss": 0.001205758540891111, "global_step": 54563, "epoch": 458, "lr": 1.3279739104443134e-05} +{"train_loss": 0.0007056106114760041, "global_step": 54564, "epoch": 458, "lr": 1.3278235449157733e-05} +{"train_loss": 0.00046095464495010674, "global_step": 54565, "epoch": 458, "lr": 1.3276731865971592e-05} +{"train_loss": 0.0006196428439579904, "global_step": 54566, "epoch": 458, "lr": 1.3275228354887648e-05} +{"train_loss": 0.0008252856787294149, "global_step": 54567, "epoch": 458, "lr": 1.3273724915908886e-05} +{"train_loss": 0.00026397581677883863, "global_step": 54568, "epoch": 458, "lr": 1.3272221549038232e-05} +{"train_loss": 0.0009650701540522277, "global_step": 54569, "epoch": 458, "lr": 1.3270718254278658e-05} +{"train_loss": 0.0005283068749122322, "global_step": 54570, "epoch": 458, "lr": 1.3269215031633104e-05} +{"train_loss": 0.00046210107393562794, "global_step": 54571, "epoch": 458, "lr": 1.3267711881104505e-05} +{"train_loss": 0.0006493085529655218, "global_step": 54572, "epoch": 458, "lr": 1.3266208802695852e-05} +{"train_loss": 0.0008186815539374948, "global_step": 54573, "epoch": 458, "lr": 1.3264705796410054e-05} +{"train_loss": 0.0004828444798476994, "global_step": 54574, "epoch": 458, "lr": 1.3263202862250097e-05} +{"train_loss": 0.0006466301274485886, "global_step": 54575, "epoch": 458, "lr": 1.3261700000218896e-05} +{"train_loss": 0.0004369882808532566, "global_step": 54576, "epoch": 458, "lr": 1.3260197210319442e-05} +{"train_loss": 0.0005785347311757505, "global_step": 54577, "epoch": 458, "lr": 1.3258694492554669e-05} +{"train_loss": 0.0005095972446724772, "global_step": 54578, "epoch": 458, "lr": 1.3257191846927503e-05} +{"train_loss": 0.0006437850533984601, "global_step": 54579, "epoch": 458, "lr": 1.3255689273440935e-05} +{"train_loss": 0.000894614146091044, "global_step": 54580, "epoch": 458, "lr": 1.3254186772097881e-05} +{"train_loss": 0.00043154743616469204, "global_step": 54581, "epoch": 458, "lr": 1.3252684342901301e-05} +{"train_loss": 0.0013344238977879286, "global_step": 54582, "epoch": 458, "lr": 1.3251181985854167e-05} +{"train_loss": 0.0005862325779162347, "global_step": 54583, "epoch": 458, "lr": 1.32496797009594e-05} +{"train_loss": 0.0005541995051316917, "global_step": 54584, "epoch": 458, "lr": 1.324817748821997e-05} +{"train_loss": 0.00034520935150794685, "global_step": 54585, "epoch": 458, "lr": 1.3246675347638804e-05} +{"train_loss": 0.0006930602248758078, "global_step": 54586, "epoch": 458, "lr": 1.3245173279218881e-05} +{"train_loss": 0.000719957344699651, "global_step": 54587, "epoch": 458, "lr": 1.3243671282963115e-05} +{"train_loss": 0.00040594564052298665, "global_step": 54588, "epoch": 458, "lr": 1.324216935887449e-05} +{"train_loss": 0.00030987299396656454, "global_step": 54589, "epoch": 458, "lr": 1.3240667506955939e-05} +{"train_loss": 0.0006345950532704592, "global_step": 54590, "epoch": 458, "lr": 1.3239165727210395e-05} +{"train_loss": 0.0018116742139682174, "global_step": 54591, "epoch": 458, "lr": 1.323766401964084e-05} +{"train_loss": 0.0017139958217740059, "global_step": 54592, "epoch": 458, "lr": 1.3236162384250184e-05} +{"train_loss": 0.00032811073469929397, "global_step": 54593, "epoch": 458, "lr": 1.3234660821041412e-05} +{"train_loss": 0.0019730008207261562, "global_step": 54594, "epoch": 458, "lr": 1.3233159330017442e-05} +{"train_loss": 0.001088438555598259, "global_step": 54595, "epoch": 458, "lr": 1.323165791118125e-05} +{"train_loss": 0.0006785045843571424, "global_step": 54596, "epoch": 458, "lr": 1.3230156564535767e-05} +{"train_loss": 0.0012559585738927126, "global_step": 54597, "epoch": 458, "lr": 1.3228655290083935e-05} +{"train_loss": 0.00036160938907414675, "global_step": 54598, "epoch": 458, "lr": 1.322715408782872e-05} +{"train_loss": 0.0006907034548930824, "global_step": 54599, "epoch": 458, "lr": 1.3225652957773044e-05} +{"train_loss": 0.0003164584923069924, "global_step": 54600, "epoch": 458, "lr": 1.3224151899919884e-05} +{"train_loss": 0.0006054078694432974, "global_step": 54601, "epoch": 458, "lr": 1.322265091427216e-05} +{"train_loss": 0.0004119937657378614, "global_step": 54602, "epoch": 458, "lr": 1.322115000083285e-05} +{"train_loss": 0.0009518891456536949, "global_step": 54603, "epoch": 458, "lr": 1.321964915960488e-05} +{"train_loss": 0.0006740696262568235, "global_step": 54604, "epoch": 458, "lr": 1.3218148390591184e-05} +{"train_loss": 0.0006974368006922305, "global_step": 54605, "epoch": 458, "lr": 1.3216647693794736e-05} +{"train_loss": 0.0004630176699720323, "global_step": 54606, "epoch": 458, "lr": 1.3215147069218459e-05} +{"train_loss": 0.0006506236968562007, "global_step": 54607, "epoch": 458, "lr": 1.3213646516865324e-05} +{"train_loss": 0.0005996383260935545, "global_step": 54608, "epoch": 458, "lr": 1.3212146036738266e-05} +{"train_loss": 0.001012118300423026, "global_step": 54609, "epoch": 458, "lr": 1.3210645628840213e-05} +{"train_loss": 0.0005410187877714634, "global_step": 54610, "epoch": 458, "lr": 1.3209145293174146e-05} +{"train_loss": 0.0013259521219879389, "global_step": 54611, "epoch": 458, "lr": 1.3207645029742971e-05} +{"train_loss": 0.0007263143197633326, "global_step": 54612, "epoch": 458, "lr": 1.3206144838549673e-05} +{"train_loss": 0.0006638506893068552, "global_step": 54613, "epoch": 458, "lr": 1.320464471959716e-05} +{"train_loss": 0.0006788069731555879, "global_step": 54614, "epoch": 458, "lr": 1.3203144672888412e-05} +{"train_loss": 0.0004928784328512847, "global_step": 54615, "epoch": 458, "lr": 1.3201644698426346e-05} +{"train_loss": 0.0008522329153493047, "global_step": 54616, "epoch": 458, "lr": 1.320014479621392e-05} +{"train_loss": 0.0008460713434033096, "global_step": 54617, "epoch": 458, "lr": 1.3198644966254086e-05} +{"train_loss": 0.0003858345444314182, "global_step": 54618, "epoch": 458, "lr": 1.3197145208549772e-05} +{"train_loss": 0.0005377766210585833, "global_step": 54619, "epoch": 458, "lr": 1.3195645523103944e-05} +{"train_loss": 0.0006793352135480577, "global_step": 54620, "epoch": 458, "lr": 1.3194145909919525e-05, "val_loss": 0.014813977293670177} +{"train_loss": 0.000608024129178375, "global_step": 54621, "epoch": 459, "lr": 1.3192646368999479e-05} +{"train_loss": 0.00042661678162403405, "global_step": 54622, "epoch": 459, "lr": 1.319114690034674e-05} +{"train_loss": 0.00038134714122861624, "global_step": 54623, "epoch": 459, "lr": 1.3189647503964236e-05} +{"train_loss": 0.00040457447175867856, "global_step": 54624, "epoch": 459, "lr": 1.3188148179854937e-05} +{"train_loss": 0.0005470163305290043, "global_step": 54625, "epoch": 459, "lr": 1.3186648928021767e-05} +{"train_loss": 0.0005071173654869199, "global_step": 54626, "epoch": 459, "lr": 1.3185149748467695e-05} +{"train_loss": 0.0003672722668852657, "global_step": 54627, "epoch": 459, "lr": 1.3183650641195644e-05} +{"train_loss": 0.00048686820082366467, "global_step": 54628, "epoch": 459, "lr": 1.3182151606208548e-05} +{"train_loss": 0.0009154939907602966, "global_step": 54629, "epoch": 459, "lr": 1.3180652643509383e-05} +{"train_loss": 0.00035567799932323396, "global_step": 54630, "epoch": 459, "lr": 1.3179153753101053e-05} +{"train_loss": 0.0008832829189486802, "global_step": 54631, "epoch": 459, "lr": 1.3177654934986538e-05} +{"train_loss": 0.0006704042316414416, "global_step": 54632, "epoch": 459, "lr": 1.3176156189168748e-05} +{"train_loss": 0.0005380503134801984, "global_step": 54633, "epoch": 459, "lr": 1.3174657515650656e-05} +{"train_loss": 0.0006424360326491296, "global_step": 54634, "epoch": 459, "lr": 1.317315891443519e-05} +{"train_loss": 0.0010740128345787525, "global_step": 54635, "epoch": 459, "lr": 1.3171660385525281e-05} +{"train_loss": 0.0005957221728749573, "global_step": 54636, "epoch": 459, "lr": 1.317016192892389e-05} +{"train_loss": 0.0005204170010983944, "global_step": 54637, "epoch": 459, "lr": 1.3168663544633942e-05} +{"train_loss": 0.00045330155990086496, "global_step": 54638, "epoch": 459, "lr": 1.3167165232658401e-05} +{"train_loss": 0.0007212034543044865, "global_step": 54639, "epoch": 459, "lr": 1.3165666993000197e-05} +{"train_loss": 0.0006276134517975152, "global_step": 54640, "epoch": 459, "lr": 1.3164168825662254e-05} +{"train_loss": 0.00027505139587447047, "global_step": 54641, "epoch": 459, "lr": 1.3162670730647547e-05} +{"train_loss": 0.0004073528980370611, "global_step": 54642, "epoch": 459, "lr": 1.3161172707958986e-05} +{"train_loss": 0.0006196976755745709, "global_step": 54643, "epoch": 459, "lr": 1.3159674757599539e-05} +{"train_loss": 0.0010188331361860037, "global_step": 54644, "epoch": 459, "lr": 1.3158176879572121e-05} +{"train_loss": 0.0003766404988709837, "global_step": 54645, "epoch": 459, "lr": 1.3156679073879703e-05} +{"train_loss": 0.0007162948022596538, "global_step": 54646, "epoch": 459, "lr": 1.315518134052519e-05} +{"train_loss": 0.0008408667636103928, "global_step": 54647, "epoch": 459, "lr": 1.3153683679511564e-05} +{"train_loss": 0.00038942231913097203, "global_step": 54648, "epoch": 459, "lr": 1.3152186090841728e-05} +{"train_loss": 0.0004616244987118989, "global_step": 54649, "epoch": 459, "lr": 1.315068857451865e-05} +{"train_loss": 0.0007897365721873939, "global_step": 54650, "epoch": 459, "lr": 1.3149191130545241e-05} +{"train_loss": 0.00035580541589297354, "global_step": 54651, "epoch": 459, "lr": 1.3147693758924479e-05} +{"train_loss": 0.0005696313455700874, "global_step": 54652, "epoch": 459, "lr": 1.314619645965926e-05} +{"train_loss": 0.0006512610125355422, "global_step": 54653, "epoch": 459, "lr": 1.3144699232752572e-05} +{"train_loss": 0.0014629936777055264, "global_step": 54654, "epoch": 459, "lr": 1.3143202078207306e-05} +{"train_loss": 0.00041202930151484907, "global_step": 54655, "epoch": 459, "lr": 1.3141704996026443e-05} +{"train_loss": 0.0006270101293921471, "global_step": 54656, "epoch": 459, "lr": 1.3140207986212894e-05} +{"train_loss": 0.0008695899159647524, "global_step": 54657, "epoch": 459, "lr": 1.313871104876962e-05} +{"train_loss": 0.000512919679749757, "global_step": 54658, "epoch": 459, "lr": 1.3137214183699547e-05} +{"train_loss": 0.0009307850850746036, "global_step": 54659, "epoch": 459, "lr": 1.3135717391005603e-05} +{"train_loss": 0.0010364813497290015, "global_step": 54660, "epoch": 459, "lr": 1.3134220670690756e-05} +{"train_loss": 0.00027394876815378666, "global_step": 54661, "epoch": 459, "lr": 1.3132724022757908e-05} +{"train_loss": 0.00045093963854014874, "global_step": 54662, "epoch": 459, "lr": 1.3131227447210038e-05} +{"train_loss": 0.0004908867995254695, "global_step": 54663, "epoch": 459, "lr": 1.312973094405005e-05} +{"train_loss": 0.0004427239764481783, "global_step": 54664, "epoch": 459, "lr": 1.3128234513280908e-05} +{"train_loss": 0.0011379601201042533, "global_step": 54665, "epoch": 459, "lr": 1.3126738154905538e-05} +{"train_loss": 0.0005758193437941372, "global_step": 54666, "epoch": 459, "lr": 1.3125241868926863e-05} +{"train_loss": 0.000303382461424917, "global_step": 54667, "epoch": 459, "lr": 1.3123745655347852e-05} +{"train_loss": 0.0005230908282101154, "global_step": 54668, "epoch": 459, "lr": 1.3122249514171413e-05} +{"train_loss": 0.0008570771897211671, "global_step": 54669, "epoch": 459, "lr": 1.3120753445400513e-05} +{"train_loss": 0.0006347703747451305, "global_step": 54670, "epoch": 459, "lr": 1.3119257449038053e-05} +{"train_loss": 0.00047190397162921727, "global_step": 54671, "epoch": 459, "lr": 1.3117761525087013e-05} +{"train_loss": 0.0006267944700084627, "global_step": 54672, "epoch": 459, "lr": 1.3116265673550304e-05} +{"train_loss": 0.0002894028148148209, "global_step": 54673, "epoch": 459, "lr": 1.3114769894430851e-05} +{"train_loss": 0.0006164831575006247, "global_step": 54674, "epoch": 459, "lr": 1.3113274187731623e-05} +{"train_loss": 0.00043186399852856994, "global_step": 54675, "epoch": 459, "lr": 1.3111778553455528e-05} +{"train_loss": 0.0004633984644897282, "global_step": 54676, "epoch": 459, "lr": 1.3110282991605526e-05} +{"train_loss": 0.000990058295428753, "global_step": 54677, "epoch": 459, "lr": 1.3108787502184543e-05} +{"train_loss": 0.0006446431507356465, "global_step": 54678, "epoch": 459, "lr": 1.31072920851955e-05} +{"train_loss": 0.0006412618677131832, "global_step": 54679, "epoch": 459, "lr": 1.3105796740641352e-05} +{"train_loss": 0.0007127749267965555, "global_step": 54680, "epoch": 459, "lr": 1.3104301468525038e-05} +{"train_loss": 0.0005900378455407917, "global_step": 54681, "epoch": 459, "lr": 1.3102806268849476e-05} +{"train_loss": 0.0005079558468423784, "global_step": 54682, "epoch": 459, "lr": 1.3101311141617628e-05} +{"train_loss": 0.000824267219286412, "global_step": 54683, "epoch": 459, "lr": 1.3099816086832395e-05} +{"train_loss": 0.0007301493315026164, "global_step": 54684, "epoch": 459, "lr": 1.3098321104496747e-05} +{"train_loss": 0.0002926248707808554, "global_step": 54685, "epoch": 459, "lr": 1.3096826194613588e-05} +{"train_loss": 0.0009229081333614886, "global_step": 54686, "epoch": 459, "lr": 1.3095331357185886e-05} +{"train_loss": 0.000564897432923317, "global_step": 54687, "epoch": 459, "lr": 1.3093836592216541e-05} +{"train_loss": 0.000703725847415626, "global_step": 54688, "epoch": 459, "lr": 1.3092341899708516e-05} +{"train_loss": 0.0004672994837164879, "global_step": 54689, "epoch": 459, "lr": 1.3090847279664725e-05} +{"train_loss": 0.0008638517465442419, "global_step": 54690, "epoch": 459, "lr": 1.3089352732088127e-05} +{"train_loss": 0.0006355723598971963, "global_step": 54691, "epoch": 459, "lr": 1.3087858256981638e-05} +{"train_loss": 0.0004387946391943842, "global_step": 54692, "epoch": 459, "lr": 1.3086363854348182e-05} +{"train_loss": 0.00036914701922796667, "global_step": 54693, "epoch": 459, "lr": 1.3084869524190725e-05} +{"train_loss": 0.0005711790290661156, "global_step": 54694, "epoch": 459, "lr": 1.3083375266512165e-05} +{"train_loss": 0.00043357780668884516, "global_step": 54695, "epoch": 459, "lr": 1.3081881081315472e-05} +{"train_loss": 0.000854291080031544, "global_step": 54696, "epoch": 459, "lr": 1.3080386968603559e-05} +{"train_loss": 0.0005727738607674837, "global_step": 54697, "epoch": 459, "lr": 1.3078892928379345e-05} +{"train_loss": 0.0004904746892862022, "global_step": 54698, "epoch": 459, "lr": 1.3077398960645797e-05} +{"train_loss": 0.0005723165231756866, "global_step": 54699, "epoch": 459, "lr": 1.3075905065405819e-05} +{"train_loss": 0.0006980391917750239, "global_step": 54700, "epoch": 459, "lr": 1.3074411242662371e-05} +{"train_loss": 0.0003192186704836786, "global_step": 54701, "epoch": 459, "lr": 1.3072917492418351e-05} +{"train_loss": 0.0003822042199317366, "global_step": 54702, "epoch": 459, "lr": 1.307142381467673e-05} +{"train_loss": 0.0005970306810922921, "global_step": 54703, "epoch": 459, "lr": 1.3069930209440428e-05} +{"train_loss": 0.0008158207638189197, "global_step": 54704, "epoch": 459, "lr": 1.3068436676712354e-05} +{"train_loss": 0.0004042834334541112, "global_step": 54705, "epoch": 459, "lr": 1.3066943216495475e-05} +{"train_loss": 0.0004722274316009134, "global_step": 54706, "epoch": 459, "lr": 1.3065449828792692e-05} +{"train_loss": 0.0005930086481384933, "global_step": 54707, "epoch": 459, "lr": 1.3063956513606968e-05} +{"train_loss": 0.000976895447820425, "global_step": 54708, "epoch": 459, "lr": 1.3062463270941216e-05} +{"train_loss": 0.0008171474910341203, "global_step": 54709, "epoch": 459, "lr": 1.306097010079836e-05} +{"train_loss": 0.0003700885863509029, "global_step": 54710, "epoch": 459, "lr": 1.3059477003181354e-05} +{"train_loss": 0.0016712831566110253, "global_step": 54711, "epoch": 459, "lr": 1.3057983978093108e-05} +{"train_loss": 0.0006169046391732991, "global_step": 54712, "epoch": 459, "lr": 1.3056491025536576e-05} +{"train_loss": 0.0006568953976966441, "global_step": 54713, "epoch": 459, "lr": 1.3054998145514664e-05} +{"train_loss": 0.0005456790095195174, "global_step": 54714, "epoch": 459, "lr": 1.3053505338030314e-05} +{"train_loss": 0.0007501298096030951, "global_step": 54715, "epoch": 459, "lr": 1.3052012603086472e-05} +{"train_loss": 0.0004512774175964296, "global_step": 54716, "epoch": 459, "lr": 1.3050519940686046e-05} +{"train_loss": 0.0005104205920360982, "global_step": 54717, "epoch": 459, "lr": 1.3049027350831989e-05} +{"train_loss": 0.000895868637599051, "global_step": 54718, "epoch": 459, "lr": 1.3047534833527203e-05} +{"train_loss": 0.0004762502503581345, "global_step": 54719, "epoch": 459, "lr": 1.3046042388774655e-05} +{"train_loss": 0.0006082478212192655, "global_step": 54720, "epoch": 459, "lr": 1.3044550016577235e-05} +{"train_loss": 0.0005951996427029371, "global_step": 54721, "epoch": 459, "lr": 1.3043057716937907e-05} +{"train_loss": 0.0004490006831474602, "global_step": 54722, "epoch": 459, "lr": 1.3041565489859587e-05} +{"train_loss": 0.00048017012886703014, "global_step": 54723, "epoch": 459, "lr": 1.3040073335345192e-05} +{"train_loss": 0.000388011074392125, "global_step": 54724, "epoch": 459, "lr": 1.303858125339768e-05} +{"train_loss": 0.0007028093677945435, "global_step": 54725, "epoch": 459, "lr": 1.303708924401995e-05} +{"train_loss": 0.0008848131401464343, "global_step": 54726, "epoch": 459, "lr": 1.3035597307214958e-05} +{"train_loss": 0.0005200886516831815, "global_step": 54727, "epoch": 459, "lr": 1.3034105442985622e-05} +{"train_loss": 0.0004905101959593594, "global_step": 54728, "epoch": 459, "lr": 1.3032613651334863e-05} +{"train_loss": 0.0004250550991855562, "global_step": 54729, "epoch": 459, "lr": 1.3031121932265628e-05} +{"train_loss": 0.0006261563976295292, "global_step": 54730, "epoch": 459, "lr": 1.3029630285780819e-05} +{"train_loss": 0.0003561240737326443, "global_step": 54731, "epoch": 459, "lr": 1.3028138711883398e-05} +{"train_loss": 0.0006771091721020639, "global_step": 54732, "epoch": 459, "lr": 1.302664721057626e-05} +{"train_loss": 0.0004945439286530018, "global_step": 54733, "epoch": 459, "lr": 1.3025155781862363e-05} +{"train_loss": 0.0006959690363146365, "global_step": 54734, "epoch": 459, "lr": 1.3023664425744624e-05} +{"train_loss": 0.0006359051913022995, "global_step": 54735, "epoch": 459, "lr": 1.3022173142225958e-05} +{"train_loss": 0.0005463858833536506, "global_step": 54736, "epoch": 459, "lr": 1.3020681931309319e-05} +{"train_loss": 0.0003749267489183694, "global_step": 54737, "epoch": 459, "lr": 1.3019190792997603e-05} +{"train_loss": 0.0004889862611889839, "global_step": 54738, "epoch": 459, "lr": 1.3017699727293769e-05} +{"train_loss": 0.0006094722117849101, "global_step": 54739, "epoch": 459, "lr": 1.301620873420072e-05, "val_loss": 0.018433688208460808} +{"train_loss": 0.000507422664668411, "global_step": 54740, "epoch": 460, "lr": 1.3014717813721405e-05} +{"train_loss": 0.00045923294965177774, "global_step": 54741, "epoch": 460, "lr": 1.3013226965858743e-05} +{"train_loss": 0.0004549412406049669, "global_step": 54742, "epoch": 460, "lr": 1.3011736190615642e-05} +{"train_loss": 0.00031749665504321456, "global_step": 54743, "epoch": 460, "lr": 1.301024548799506e-05} +{"train_loss": 0.0003310654719825834, "global_step": 54744, "epoch": 460, "lr": 1.3008754857999893e-05} +{"train_loss": 0.0004019859479740262, "global_step": 54745, "epoch": 460, "lr": 1.3007264300633104e-05} +{"train_loss": 0.0006582131027244031, "global_step": 54746, "epoch": 460, "lr": 1.3005773815897581e-05} +{"train_loss": 0.000420442724134773, "global_step": 54747, "epoch": 460, "lr": 1.3004283403796287e-05} +{"train_loss": 0.0006464244797825813, "global_step": 54748, "epoch": 460, "lr": 1.3002793064332108e-05} +{"train_loss": 0.0008958741091191769, "global_step": 54749, "epoch": 460, "lr": 1.3001302797507997e-05} +{"train_loss": 0.0004170729371253401, "global_step": 54750, "epoch": 460, "lr": 1.299981260332689e-05} +{"train_loss": 0.0006047969800420105, "global_step": 54751, "epoch": 460, "lr": 1.2998322481791686e-05} +{"train_loss": 0.000662927282974124, "global_step": 54752, "epoch": 460, "lr": 1.2996832432905332e-05} +{"train_loss": 0.0004762104945257306, "global_step": 54753, "epoch": 460, "lr": 1.2995342456670745e-05} +{"train_loss": 0.0011964634759351611, "global_step": 54754, "epoch": 460, "lr": 1.299385255309084e-05} +{"train_loss": 0.0006212286534719169, "global_step": 54755, "epoch": 460, "lr": 1.299236272216856e-05} +{"train_loss": 0.0005807342240586877, "global_step": 54756, "epoch": 460, "lr": 1.2990872963906814e-05} +{"train_loss": 0.0009473899262957275, "global_step": 54757, "epoch": 460, "lr": 1.2989383278308548e-05} +{"train_loss": 0.00022105967218521982, "global_step": 54758, "epoch": 460, "lr": 1.2987893665376671e-05} +{"train_loss": 0.0003611230058595538, "global_step": 54759, "epoch": 460, "lr": 1.2986404125114099e-05} +{"train_loss": 0.0006116908043622971, "global_step": 54760, "epoch": 460, "lr": 1.2984914657523777e-05} +{"train_loss": 0.0005898098461329937, "global_step": 54761, "epoch": 460, "lr": 1.2983425262608611e-05} +{"train_loss": 0.0002794946194626391, "global_step": 54762, "epoch": 460, "lr": 1.2981935940371547e-05} +{"train_loss": 0.0010737464763224125, "global_step": 54763, "epoch": 460, "lr": 1.298044669081549e-05} +{"train_loss": 0.00047387537779286504, "global_step": 54764, "epoch": 460, "lr": 1.297895751394338e-05} +{"train_loss": 0.0006895386031828821, "global_step": 54765, "epoch": 460, "lr": 1.297746840975813e-05} +{"train_loss": 0.0005953003419563174, "global_step": 54766, "epoch": 460, "lr": 1.2975979378262647e-05} +{"train_loss": 0.0006707553402520716, "global_step": 54767, "epoch": 460, "lr": 1.2974490419459894e-05} +{"train_loss": 0.0006324663991108537, "global_step": 54768, "epoch": 460, "lr": 1.2973001533352763e-05} +{"train_loss": 0.0007306252373382449, "global_step": 54769, "epoch": 460, "lr": 1.2971512719944196e-05} +{"train_loss": 0.0013171148020774126, "global_step": 54770, "epoch": 460, "lr": 1.2970023979237095e-05} +{"train_loss": 0.00035106379073113203, "global_step": 54771, "epoch": 460, "lr": 1.2968535311234408e-05} +{"train_loss": 0.00035213734372518957, "global_step": 54772, "epoch": 460, "lr": 1.2967046715939046e-05} +{"train_loss": 0.0006819567061029375, "global_step": 54773, "epoch": 460, "lr": 1.2965558193353922e-05} +{"train_loss": 0.0007449901895597577, "global_step": 54774, "epoch": 460, "lr": 1.2964069743481977e-05} +{"train_loss": 0.0006853772792965174, "global_step": 54775, "epoch": 460, "lr": 1.2962581366326115e-05} +{"train_loss": 0.0011665329802781343, "global_step": 54776, "epoch": 460, "lr": 1.2961093061889278e-05} +{"train_loss": 0.0007832207484170794, "global_step": 54777, "epoch": 460, "lr": 1.2959604830174365e-05} +{"train_loss": 0.0005016307695768774, "global_step": 54778, "epoch": 460, "lr": 1.2958116671184323e-05} +{"train_loss": 0.0003969724930357188, "global_step": 54779, "epoch": 460, "lr": 1.2956628584922048e-05} +{"train_loss": 0.000994933652691543, "global_step": 54780, "epoch": 460, "lr": 1.295514057139049e-05} +{"train_loss": 0.00021423575526569039, "global_step": 54781, "epoch": 460, "lr": 1.2953652630592544e-05} +{"train_loss": 0.0007756194681860507, "global_step": 54782, "epoch": 460, "lr": 1.2952164762531154e-05} +{"train_loss": 0.0007417066371999681, "global_step": 54783, "epoch": 460, "lr": 1.2950676967209218e-05} +{"train_loss": 0.000373703456716612, "global_step": 54784, "epoch": 460, "lr": 1.2949189244629684e-05} +{"train_loss": 0.00035981120890937746, "global_step": 54785, "epoch": 460, "lr": 1.2947701594795442e-05} +{"train_loss": 0.0006302252295427024, "global_step": 54786, "epoch": 460, "lr": 1.2946214017709446e-05} +{"train_loss": 0.0006719705415889621, "global_step": 54787, "epoch": 460, "lr": 1.2944726513374583e-05} +{"train_loss": 0.000522062589880079, "global_step": 54788, "epoch": 460, "lr": 1.2943239081793806e-05} +{"train_loss": 0.00031559274066239595, "global_step": 54789, "epoch": 460, "lr": 1.2941751722970008e-05} +{"train_loss": 0.0011716792359948158, "global_step": 54790, "epoch": 460, "lr": 1.2940264436906135e-05} +{"train_loss": 0.0012289329897612333, "global_step": 54791, "epoch": 460, "lr": 1.2938777223605098e-05} +{"train_loss": 0.0008367293048650026, "global_step": 54792, "epoch": 460, "lr": 1.2937290083069792e-05} +{"train_loss": 0.00048129470087587833, "global_step": 54793, "epoch": 460, "lr": 1.2935803015303172e-05} +{"train_loss": 0.0006266249110922217, "global_step": 54794, "epoch": 460, "lr": 1.293431602030813e-05} +{"train_loss": 0.0007174381171353161, "global_step": 54795, "epoch": 460, "lr": 1.2932829098087612e-05} +{"train_loss": 0.00038932691677473485, "global_step": 54796, "epoch": 460, "lr": 1.2931342248644529e-05} +{"train_loss": 0.0005102194845676422, "global_step": 54797, "epoch": 460, "lr": 1.2929855471981773e-05} +{"train_loss": 0.000732363376300782, "global_step": 54798, "epoch": 460, "lr": 1.2928368768102306e-05} +{"train_loss": 0.0004978556535206735, "global_step": 54799, "epoch": 460, "lr": 1.2926882137009011e-05} +{"train_loss": 0.001354220206849277, "global_step": 54800, "epoch": 460, "lr": 1.2925395578704835e-05} +{"train_loss": 0.00047998930676840246, "global_step": 54801, "epoch": 460, "lr": 1.292390909319267e-05} +{"train_loss": 0.0007851971895433962, "global_step": 54802, "epoch": 460, "lr": 1.292242268047546e-05} +{"train_loss": 0.0008331831195391715, "global_step": 54803, "epoch": 460, "lr": 1.2920936340556117e-05} +{"train_loss": 0.000702905235812068, "global_step": 54804, "epoch": 460, "lr": 1.2919450073437538e-05} +{"train_loss": 0.0006709833396598697, "global_step": 54805, "epoch": 460, "lr": 1.2917963879122668e-05} +{"train_loss": 0.00043541414197534323, "global_step": 54806, "epoch": 460, "lr": 1.2916477757614404e-05} +{"train_loss": 0.0008130847127176821, "global_step": 54807, "epoch": 460, "lr": 1.2914991708915692e-05} +{"train_loss": 0.00045538967242464423, "global_step": 54808, "epoch": 460, "lr": 1.2913505733029407e-05} +{"train_loss": 0.0006918294238857925, "global_step": 54809, "epoch": 460, "lr": 1.2912019829958516e-05} +{"train_loss": 0.0007949289283715189, "global_step": 54810, "epoch": 460, "lr": 1.2910533999705904e-05} +{"train_loss": 0.0005299928016029298, "global_step": 54811, "epoch": 460, "lr": 1.2909048242274485e-05} +{"train_loss": 0.0007773961988277733, "global_step": 54812, "epoch": 460, "lr": 1.2907562557667191e-05} +{"train_loss": 0.0010124471737071872, "global_step": 54813, "epoch": 460, "lr": 1.2906076945886947e-05} +{"train_loss": 0.0007293956005014479, "global_step": 54814, "epoch": 460, "lr": 1.290459140693664e-05} +{"train_loss": 0.0004964609397575259, "global_step": 54815, "epoch": 460, "lr": 1.290310594081922e-05} +{"train_loss": 0.000700032920576632, "global_step": 54816, "epoch": 460, "lr": 1.290162054753758e-05} +{"train_loss": 0.000633508141618222, "global_step": 54817, "epoch": 460, "lr": 1.290013522709465e-05} +{"train_loss": 0.0004313124227337539, "global_step": 54818, "epoch": 460, "lr": 1.2898649979493333e-05} +{"train_loss": 0.0003687710268422961, "global_step": 54819, "epoch": 460, "lr": 1.2897164804736566e-05} +{"train_loss": 0.0007827368681319058, "global_step": 54820, "epoch": 460, "lr": 1.289567970282724e-05} +{"train_loss": 0.0004047460970468819, "global_step": 54821, "epoch": 460, "lr": 1.2894194673768295e-05} +{"train_loss": 0.0003785084991250187, "global_step": 54822, "epoch": 460, "lr": 1.2892709717562634e-05} +{"train_loss": 0.0006249628495424986, "global_step": 54823, "epoch": 460, "lr": 1.2891224834213156e-05} +{"train_loss": 0.0005489745526574552, "global_step": 54824, "epoch": 460, "lr": 1.2889740023722813e-05} +{"train_loss": 0.00043795857345685363, "global_step": 54825, "epoch": 460, "lr": 1.2888255286094485e-05} +{"train_loss": 0.0009649755666032434, "global_step": 54826, "epoch": 460, "lr": 1.2886770621331118e-05} +{"train_loss": 0.0009112409316003323, "global_step": 54827, "epoch": 460, "lr": 1.2885286029435611e-05} +{"train_loss": 0.0005235761636868119, "global_step": 54828, "epoch": 460, "lr": 1.2883801510410864e-05} +{"train_loss": 0.0005798523779958487, "global_step": 54829, "epoch": 460, "lr": 1.2882317064259824e-05} +{"train_loss": 0.0008137065451592207, "global_step": 54830, "epoch": 460, "lr": 1.2880832690985373e-05} +{"train_loss": 0.0008197430288419127, "global_step": 54831, "epoch": 460, "lr": 1.2879348390590457e-05} +{"train_loss": 0.00045457930536940694, "global_step": 54832, "epoch": 460, "lr": 1.2877864163077958e-05} +{"train_loss": 0.0012534402776509523, "global_step": 54833, "epoch": 460, "lr": 1.2876380008450822e-05} +{"train_loss": 0.0012323845876380801, "global_step": 54834, "epoch": 460, "lr": 1.287489592671195e-05} +{"train_loss": 0.0005024982965551317, "global_step": 54835, "epoch": 460, "lr": 1.2873411917864237e-05} +{"train_loss": 0.000700640375725925, "global_step": 54836, "epoch": 460, "lr": 1.2871927981910625e-05} +{"train_loss": 0.0005696110310964286, "global_step": 54837, "epoch": 460, "lr": 1.2870444118854008e-05} +{"train_loss": 0.0005684391944669187, "global_step": 54838, "epoch": 460, "lr": 1.2868960328697316e-05} +{"train_loss": 0.0008233741391450167, "global_step": 54839, "epoch": 460, "lr": 1.2867476611443446e-05} +{"train_loss": 0.00077382120070979, "global_step": 54840, "epoch": 460, "lr": 1.2865992967095326e-05} +{"train_loss": 0.0004917849437333643, "global_step": 54841, "epoch": 460, "lr": 1.2864509395655866e-05} +{"train_loss": 0.0004465144593268633, "global_step": 54842, "epoch": 460, "lr": 1.2863025897127957e-05} +{"train_loss": 0.0007987924036569893, "global_step": 54843, "epoch": 460, "lr": 1.2861542471514548e-05} +{"train_loss": 0.0004400633042678237, "global_step": 54844, "epoch": 460, "lr": 1.2860059118818513e-05} +{"train_loss": 0.0009256011107936502, "global_step": 54845, "epoch": 460, "lr": 1.2858575839042802e-05} +{"train_loss": 0.0008425615960732102, "global_step": 54846, "epoch": 460, "lr": 1.2857092632190293e-05} +{"train_loss": 0.0003378985566087067, "global_step": 54847, "epoch": 460, "lr": 1.2855609498263915e-05} +{"train_loss": 0.0006688885041512549, "global_step": 54848, "epoch": 460, "lr": 1.2854126437266596e-05} +{"train_loss": 0.0008207217906601727, "global_step": 54849, "epoch": 460, "lr": 1.2852643449201213e-05} +{"train_loss": 0.0004306038317736238, "global_step": 54850, "epoch": 460, "lr": 1.2851160534070711e-05} +{"train_loss": 0.0005696648731827736, "global_step": 54851, "epoch": 460, "lr": 1.2849677691877976e-05} +{"train_loss": 0.0008095527882687747, "global_step": 54852, "epoch": 460, "lr": 1.2848194922625939e-05} +{"train_loss": 0.0010826699435710907, "global_step": 54853, "epoch": 460, "lr": 1.2846712226317508e-05} +{"train_loss": 0.0006367817404679954, "global_step": 54854, "epoch": 460, "lr": 1.2845229602955572e-05} +{"train_loss": 0.001091467565856874, "global_step": 54855, "epoch": 460, "lr": 1.284374705254307e-05} +{"train_loss": 0.00034548513940535486, "global_step": 54856, "epoch": 460, "lr": 1.2842264575082884e-05} +{"train_loss": 0.0005541669088415802, "global_step": 54857, "epoch": 460, "lr": 1.2840782170577965e-05} +{"train_loss": 0.0006522760563138716, "global_step": 54858, "epoch": 460, "lr": 1.2839299839031183e-05, "val_loss": 0.022612711414694786, "train_action_mse_error": 8.75501791597344e-06} +{"train_loss": 0.00025373679818585515, "global_step": 54859, "epoch": 461, "lr": 1.2837817580445477e-05} +{"train_loss": 0.0008202370954677463, "global_step": 54860, "epoch": 461, "lr": 1.2836335394823746e-05} +{"train_loss": 0.0012406137539073825, "global_step": 54861, "epoch": 461, "lr": 1.283485328216889e-05} +{"train_loss": 0.0005120944115333259, "global_step": 54862, "epoch": 461, "lr": 1.2833371242483837e-05} +{"train_loss": 0.000374122173525393, "global_step": 54863, "epoch": 461, "lr": 1.2831889275771481e-05} +{"train_loss": 0.0009171905694529414, "global_step": 54864, "epoch": 461, "lr": 1.2830407382034749e-05} +{"train_loss": 0.000806096417363733, "global_step": 54865, "epoch": 461, "lr": 1.2828925561276545e-05} +{"train_loss": 0.0005806767148897052, "global_step": 54866, "epoch": 461, "lr": 1.2827443813499756e-05} +{"train_loss": 0.0008149799541570246, "global_step": 54867, "epoch": 461, "lr": 1.2825962138707325e-05} +{"train_loss": 0.0008229133090935647, "global_step": 54868, "epoch": 461, "lr": 1.2824480536902134e-05} +{"train_loss": 0.0009701692615635693, "global_step": 54869, "epoch": 461, "lr": 1.2822999008087121e-05} +{"train_loss": 0.0009104736382141709, "global_step": 54870, "epoch": 461, "lr": 1.282151755226516e-05} +{"train_loss": 0.0006531386752612889, "global_step": 54871, "epoch": 461, "lr": 1.2820036169439193e-05} +{"train_loss": 0.00037288208841346204, "global_step": 54872, "epoch": 461, "lr": 1.2818554859612109e-05} +{"train_loss": 0.0002960556885227561, "global_step": 54873, "epoch": 461, "lr": 1.2817073622786808e-05} +{"train_loss": 0.0005362597294151783, "global_step": 54874, "epoch": 461, "lr": 1.2815592458966225e-05} +{"train_loss": 0.0006150317494757473, "global_step": 54875, "epoch": 461, "lr": 1.2814111368153236e-05} +{"train_loss": 0.0006718332297168672, "global_step": 54876, "epoch": 461, "lr": 1.2812630350350784e-05} +{"train_loss": 0.0004203700227662921, "global_step": 54877, "epoch": 461, "lr": 1.2811149405561746e-05} +{"train_loss": 0.0005370903527364135, "global_step": 54878, "epoch": 461, "lr": 1.280966853378906e-05} +{"train_loss": 0.0004632483178284019, "global_step": 54879, "epoch": 461, "lr": 1.2808187735035598e-05} +{"train_loss": 0.0004376443976070732, "global_step": 54880, "epoch": 461, "lr": 1.2806707009304303e-05} +{"train_loss": 0.00040511900442652404, "global_step": 54881, "epoch": 461, "lr": 1.2805226356598049e-05} +{"train_loss": 0.0009992264676839113, "global_step": 54882, "epoch": 461, "lr": 1.2803745776919757e-05} +{"train_loss": 0.0010737647535279393, "global_step": 54883, "epoch": 461, "lr": 1.2802265270272357e-05} +{"train_loss": 0.00087068259017542, "global_step": 54884, "epoch": 461, "lr": 1.280078483665873e-05} +{"train_loss": 0.0006322112749330699, "global_step": 54885, "epoch": 461, "lr": 1.2799304476081775e-05} +{"train_loss": 0.00044576864456757903, "global_step": 54886, "epoch": 461, "lr": 1.2797824188544427e-05} +{"train_loss": 0.0004588668525684625, "global_step": 54887, "epoch": 461, "lr": 1.2796343974049557e-05} +{"train_loss": 0.0007222328567877412, "global_step": 54888, "epoch": 461, "lr": 1.2794863832600113e-05} +{"train_loss": 0.00042320217471569777, "global_step": 54889, "epoch": 461, "lr": 1.2793383764198958e-05} +{"train_loss": 0.00037861012970097363, "global_step": 54890, "epoch": 461, "lr": 1.279190376884904e-05} +{"train_loss": 0.0010591073660179973, "global_step": 54891, "epoch": 461, "lr": 1.279042384655324e-05} +{"train_loss": 0.0005641381139867008, "global_step": 54892, "epoch": 461, "lr": 1.278894399731445e-05} +{"train_loss": 0.00041409145342186093, "global_step": 54893, "epoch": 461, "lr": 1.2787464221135614e-05} +{"train_loss": 0.0007804379565641284, "global_step": 54894, "epoch": 461, "lr": 1.27859845180196e-05} +{"train_loss": 0.00041301449527963996, "global_step": 54895, "epoch": 461, "lr": 1.278450488796934e-05} +{"train_loss": 0.00036156928399577737, "global_step": 54896, "epoch": 461, "lr": 1.2783025330987736e-05} +{"train_loss": 0.0003596168535295874, "global_step": 54897, "epoch": 461, "lr": 1.2781545847077663e-05} +{"train_loss": 0.0007225173176266253, "global_step": 54898, "epoch": 461, "lr": 1.2780066436242066e-05} +{"train_loss": 0.0006377982208505273, "global_step": 54899, "epoch": 461, "lr": 1.2778587098483819e-05} +{"train_loss": 0.0011736395535990596, "global_step": 54900, "epoch": 461, "lr": 1.2777107833805858e-05} +{"train_loss": 0.0008311083074659109, "global_step": 54901, "epoch": 461, "lr": 1.2775628642211046e-05} +{"train_loss": 0.00041399465408176184, "global_step": 54902, "epoch": 461, "lr": 1.2774149523702334e-05} +{"train_loss": 0.0004738015413749963, "global_step": 54903, "epoch": 461, "lr": 1.2772670478282595e-05} +{"train_loss": 0.0006906710914336145, "global_step": 54904, "epoch": 461, "lr": 1.2771191505954727e-05} +{"train_loss": 0.0013318882556632161, "global_step": 54905, "epoch": 461, "lr": 1.2769712606721667e-05} +{"train_loss": 0.00037604811950586736, "global_step": 54906, "epoch": 461, "lr": 1.276823378058628e-05} +{"train_loss": 0.0008533785585314035, "global_step": 54907, "epoch": 461, "lr": 1.2766755027551503e-05} +{"train_loss": 0.0006495280540548265, "global_step": 54908, "epoch": 461, "lr": 1.2765276347620208e-05} +{"train_loss": 0.0005849045119248331, "global_step": 54909, "epoch": 461, "lr": 1.2763797740795335e-05} +{"train_loss": 0.0005133358063176274, "global_step": 54910, "epoch": 461, "lr": 1.2762319207079749e-05} +{"train_loss": 0.0006295031635090709, "global_step": 54911, "epoch": 461, "lr": 1.2760840746476388e-05} +{"train_loss": 0.0009183645015582442, "global_step": 54912, "epoch": 461, "lr": 1.275936235898812e-05} +{"train_loss": 0.0003700827364809811, "global_step": 54913, "epoch": 461, "lr": 1.2757884044617886e-05} +{"train_loss": 0.000504440104123205, "global_step": 54914, "epoch": 461, "lr": 1.2756405803368544e-05} +{"train_loss": 0.0008851580205373466, "global_step": 54915, "epoch": 461, "lr": 1.2754927635243041e-05} +{"train_loss": 0.0009370847255922854, "global_step": 54916, "epoch": 461, "lr": 1.2753449540244244e-05} +{"train_loss": 0.0004771743551827967, "global_step": 54917, "epoch": 461, "lr": 1.2751971518375083e-05} +{"train_loss": 0.0008012218750081956, "global_step": 54918, "epoch": 461, "lr": 1.2750493569638432e-05} +{"train_loss": 0.00062552560120821, "global_step": 54919, "epoch": 461, "lr": 1.274901569403722e-05} +{"train_loss": 0.0008175260736607015, "global_step": 54920, "epoch": 461, "lr": 1.2747537891574325e-05} +{"train_loss": 0.0006222932715900242, "global_step": 54921, "epoch": 461, "lr": 1.2746060162252672e-05} +{"train_loss": 0.0003627886180765927, "global_step": 54922, "epoch": 461, "lr": 1.2744582506075148e-05} +{"train_loss": 0.00041902236989699304, "global_step": 54923, "epoch": 461, "lr": 1.2743104923044646e-05} +{"train_loss": 0.0007007102249190211, "global_step": 54924, "epoch": 461, "lr": 1.2741627413164087e-05} +{"train_loss": 0.0005777782062068582, "global_step": 54925, "epoch": 461, "lr": 1.274014997643635e-05} +{"train_loss": 0.0005177846178412437, "global_step": 54926, "epoch": 461, "lr": 1.2738672612864366e-05} +{"train_loss": 0.0004399700555950403, "global_step": 54927, "epoch": 461, "lr": 1.2737195322450995e-05} +{"train_loss": 0.0005329290288500488, "global_step": 54928, "epoch": 461, "lr": 1.273571810519918e-05} +{"train_loss": 0.0004601146501954645, "global_step": 54929, "epoch": 461, "lr": 1.2734240961111804e-05} +{"train_loss": 0.0006197215407155454, "global_step": 54930, "epoch": 461, "lr": 1.2732763890191746e-05} +{"train_loss": 0.0006603439105674624, "global_step": 54931, "epoch": 461, "lr": 1.2731286892441941e-05} +{"train_loss": 0.0012432519579306245, "global_step": 54932, "epoch": 461, "lr": 1.2729809967865253e-05} +{"train_loss": 0.000870223215315491, "global_step": 54933, "epoch": 461, "lr": 1.272833311646462e-05} +{"train_loss": 0.0006164995720610023, "global_step": 54934, "epoch": 461, "lr": 1.272685633824292e-05} +{"train_loss": 0.00045575512922368944, "global_step": 54935, "epoch": 461, "lr": 1.272537963320305e-05} +{"train_loss": 0.00038046418922021985, "global_step": 54936, "epoch": 461, "lr": 1.272390300134792e-05} +{"train_loss": 0.000696711940690875, "global_step": 54937, "epoch": 461, "lr": 1.2722426442680413e-05} +{"train_loss": 0.0004179058887530118, "global_step": 54938, "epoch": 461, "lr": 1.2720949957203454e-05} +{"train_loss": 0.0006644439417868853, "global_step": 54939, "epoch": 461, "lr": 1.2719473544919914e-05} +{"train_loss": 0.0008096667588688433, "global_step": 54940, "epoch": 461, "lr": 1.2717997205832716e-05} +{"train_loss": 0.0007836416480131447, "global_step": 54941, "epoch": 461, "lr": 1.2716520939944747e-05} +{"train_loss": 0.00040045767673291266, "global_step": 54942, "epoch": 461, "lr": 1.2715044747258891e-05} +{"train_loss": 0.0005599263240583241, "global_step": 54943, "epoch": 461, "lr": 1.2713568627778083e-05} +{"train_loss": 0.0004985148552805185, "global_step": 54944, "epoch": 461, "lr": 1.271209258150518e-05} +{"train_loss": 0.0005668262019753456, "global_step": 54945, "epoch": 461, "lr": 1.2710616608443099e-05} +{"train_loss": 0.0007345345220528543, "global_step": 54946, "epoch": 461, "lr": 1.2709140708594753e-05} +{"train_loss": 0.0006819890695624053, "global_step": 54947, "epoch": 461, "lr": 1.270766488196301e-05} +{"train_loss": 0.0005392396124079823, "global_step": 54948, "epoch": 461, "lr": 1.27061891285508e-05} +{"train_loss": 0.0011905946303158998, "global_step": 54949, "epoch": 461, "lr": 1.2704713448360988e-05} +{"train_loss": 0.0009248062269762158, "global_step": 54950, "epoch": 461, "lr": 1.2703237841396499e-05} +{"train_loss": 0.0008153110975399613, "global_step": 54951, "epoch": 461, "lr": 1.2701762307660209e-05} +{"train_loss": 0.0005857289070263505, "global_step": 54952, "epoch": 461, "lr": 1.2700286847155035e-05} +{"train_loss": 0.0005305713275447488, "global_step": 54953, "epoch": 461, "lr": 1.2698811459883863e-05} +{"train_loss": 0.001066997880116105, "global_step": 54954, "epoch": 461, "lr": 1.2697336145849576e-05} +{"train_loss": 0.000663171405903995, "global_step": 54955, "epoch": 461, "lr": 1.2695860905055096e-05} +{"train_loss": 0.0007398332236334682, "global_step": 54956, "epoch": 461, "lr": 1.2694385737503295e-05} +{"train_loss": 0.0007609713356941938, "global_step": 54957, "epoch": 461, "lr": 1.2692910643197098e-05} +{"train_loss": 0.0010269181802868843, "global_step": 54958, "epoch": 461, "lr": 1.269143562213937e-05} +{"train_loss": 0.0006692314054816961, "global_step": 54959, "epoch": 461, "lr": 1.2689960674333034e-05} +{"train_loss": 0.0005479761166498065, "global_step": 54960, "epoch": 461, "lr": 1.2688485799780975e-05} +{"train_loss": 0.0009011540678329766, "global_step": 54961, "epoch": 461, "lr": 1.2687010998486077e-05} +{"train_loss": 0.0006311949109658599, "global_step": 54962, "epoch": 461, "lr": 1.268553627045126e-05} +{"train_loss": 0.0003269625303801149, "global_step": 54963, "epoch": 461, "lr": 1.2684061615679389e-05} +{"train_loss": 0.0007650331826880574, "global_step": 54964, "epoch": 461, "lr": 1.2682587034173392e-05} +{"train_loss": 0.00038519149529747665, "global_step": 54965, "epoch": 461, "lr": 1.2681112525936151e-05} +{"train_loss": 0.0008558278204873204, "global_step": 54966, "epoch": 461, "lr": 1.2679638090970541e-05} +{"train_loss": 0.0005329938721843064, "global_step": 54967, "epoch": 461, "lr": 1.2678163729279491e-05} +{"train_loss": 0.0008291733101941645, "global_step": 54968, "epoch": 461, "lr": 1.2676689440865863e-05} +{"train_loss": 0.0006245955009944737, "global_step": 54969, "epoch": 461, "lr": 1.2675215225732584e-05} +{"train_loss": 0.0007377236033789814, "global_step": 54970, "epoch": 461, "lr": 1.2673741083882517e-05} +{"train_loss": 0.000490895239636302, "global_step": 54971, "epoch": 461, "lr": 1.2672267015318584e-05} +{"train_loss": 0.0007134483312256634, "global_step": 54972, "epoch": 461, "lr": 1.267079302004367e-05} +{"train_loss": 0.0003606292011681944, "global_step": 54973, "epoch": 461, "lr": 1.266931909806065e-05} +{"train_loss": 0.0005105603486299515, "global_step": 54974, "epoch": 461, "lr": 1.2667845249372452e-05} +{"train_loss": 0.00046031014062464237, "global_step": 54975, "epoch": 461, "lr": 1.2666371473981931e-05} +{"train_loss": 0.0006015088292770088, "global_step": 54976, "epoch": 461, "lr": 1.266489777189202e-05} +{"train_loss": 0.0006515963798870152, "global_step": 54977, "epoch": 461, "lr": 1.2663424143105578e-05, "val_loss": 0.03461939096450806} +{"train_loss": 0.0008901740075089037, "global_step": 54978, "epoch": 462, "lr": 1.2661950587625526e-05} +{"train_loss": 0.0005397552740760148, "global_step": 54979, "epoch": 462, "lr": 1.2660477105454732e-05} +{"train_loss": 0.0006542688934132457, "global_step": 54980, "epoch": 462, "lr": 1.2659003696596106e-05} +{"train_loss": 0.00047720459406264126, "global_step": 54981, "epoch": 462, "lr": 1.2657530361052545e-05} +{"train_loss": 0.00041555208736099303, "global_step": 54982, "epoch": 462, "lr": 1.2656057098826923e-05} +{"train_loss": 0.00036279685446061194, "global_step": 54983, "epoch": 462, "lr": 1.2654583909922158e-05} +{"train_loss": 0.0014239033916965127, "global_step": 54984, "epoch": 462, "lr": 1.2653110794341121e-05} +{"train_loss": 0.0005901602562516928, "global_step": 54985, "epoch": 462, "lr": 1.2651637752086704e-05} +{"train_loss": 0.0006916812271811068, "global_step": 54986, "epoch": 462, "lr": 1.2650164783161823e-05} +{"train_loss": 0.0010949599090963602, "global_step": 54987, "epoch": 462, "lr": 1.264869188756933e-05} +{"train_loss": 0.0003236319753341377, "global_step": 54988, "epoch": 462, "lr": 1.2647219065312161e-05} +{"train_loss": 0.0009488206123933196, "global_step": 54989, "epoch": 462, "lr": 1.264574631639317e-05} +{"train_loss": 0.0005855266354046762, "global_step": 54990, "epoch": 462, "lr": 1.264427364081528e-05} +{"train_loss": 0.00048091603093780577, "global_step": 54991, "epoch": 462, "lr": 1.264280103858137e-05} +{"train_loss": 0.0006199228810146451, "global_step": 54992, "epoch": 462, "lr": 1.264132850969431e-05} +{"train_loss": 0.0014882032992318273, "global_step": 54993, "epoch": 462, "lr": 1.2639856054157029e-05} +{"train_loss": 0.000674135226290673, "global_step": 54994, "epoch": 462, "lr": 1.2638383671972382e-05} +{"train_loss": 0.0009258872596547008, "global_step": 54995, "epoch": 462, "lr": 1.2636911363143295e-05} +{"train_loss": 0.0005732154822908342, "global_step": 54996, "epoch": 462, "lr": 1.2635439127672622e-05} +{"train_loss": 0.0008010698365978897, "global_step": 54997, "epoch": 462, "lr": 1.2633966965563294e-05} +{"train_loss": 0.0010767460335046053, "global_step": 54998, "epoch": 462, "lr": 1.2632494876818173e-05} +{"train_loss": 0.0008429354638792574, "global_step": 54999, "epoch": 462, "lr": 1.2631022861440144e-05} +{"train_loss": 0.0006652696174569428, "global_step": 55000, "epoch": 462, "lr": 1.2629550919432121e-05} +{"train_loss": 0.0007675616652704775, "global_step": 55001, "epoch": 462, "lr": 1.262807905079697e-05} +{"train_loss": 0.00042370043229311705, "global_step": 55002, "epoch": 462, "lr": 1.2626607255537609e-05} +{"train_loss": 0.00063051882898435, "global_step": 55003, "epoch": 462, "lr": 1.2625135533656913e-05} +{"train_loss": 0.0003522060578688979, "global_step": 55004, "epoch": 462, "lr": 1.2623663885157754e-05} +{"train_loss": 0.0005377990310080349, "global_step": 55005, "epoch": 462, "lr": 1.2622192310043052e-05} +{"train_loss": 0.0010204201098531485, "global_step": 55006, "epoch": 462, "lr": 1.2620720808315667e-05} +{"train_loss": 0.0005925307050347328, "global_step": 55007, "epoch": 462, "lr": 1.2619249379978521e-05} +{"train_loss": 0.0006283366237767041, "global_step": 55008, "epoch": 462, "lr": 1.2617778025034467e-05} +{"train_loss": 0.0007874006987549365, "global_step": 55009, "epoch": 462, "lr": 1.2616306743486428e-05} +{"train_loss": 0.0008519294788129628, "global_step": 55010, "epoch": 462, "lr": 1.2614835535337266e-05} +{"train_loss": 0.0012228889390826225, "global_step": 55011, "epoch": 462, "lr": 1.2613364400589889e-05} +{"train_loss": 0.0005270610563457012, "global_step": 55012, "epoch": 462, "lr": 1.2611893339247166e-05} +{"train_loss": 0.0008897908264771104, "global_step": 55013, "epoch": 462, "lr": 1.2610422351312006e-05} +{"train_loss": 0.0006995184230618179, "global_step": 55014, "epoch": 462, "lr": 1.2608951436787281e-05} +{"train_loss": 0.0004246832395438105, "global_step": 55015, "epoch": 462, "lr": 1.260748059567589e-05} +{"train_loss": 0.001009600586257875, "global_step": 55016, "epoch": 462, "lr": 1.2606009827980709e-05} +{"train_loss": 0.0005740824271924794, "global_step": 55017, "epoch": 462, "lr": 1.2604539133704646e-05} +{"train_loss": 0.0007884246879257262, "global_step": 55018, "epoch": 462, "lr": 1.2603068512850557e-05} +{"train_loss": 0.0007066554971970618, "global_step": 55019, "epoch": 462, "lr": 1.2601597965421368e-05} +{"train_loss": 0.0005875296192243695, "global_step": 55020, "epoch": 462, "lr": 1.2600127491419927e-05} +{"train_loss": 0.000666371954139322, "global_step": 55021, "epoch": 462, "lr": 1.2598657090849158e-05} +{"train_loss": 0.0006680323276668787, "global_step": 55022, "epoch": 462, "lr": 1.2597186763711926e-05} +{"train_loss": 0.0003771573246922344, "global_step": 55023, "epoch": 462, "lr": 1.2595716510011107e-05} +{"train_loss": 0.0009779002284631133, "global_step": 55024, "epoch": 462, "lr": 1.2594246329749621e-05} +{"train_loss": 0.0006018524873070419, "global_step": 55025, "epoch": 462, "lr": 1.2592776222930319e-05} +{"train_loss": 0.0006730893510393798, "global_step": 55026, "epoch": 462, "lr": 1.2591306189556123e-05} +{"train_loss": 0.00034025500644929707, "global_step": 55027, "epoch": 462, "lr": 1.2589836229629881e-05} +{"train_loss": 0.0010210846085101366, "global_step": 55028, "epoch": 462, "lr": 1.2588366343154517e-05} +{"train_loss": 0.000892774376552552, "global_step": 55029, "epoch": 462, "lr": 1.2586896530132897e-05} +{"train_loss": 0.0007181776454672217, "global_step": 55030, "epoch": 462, "lr": 1.2585426790567894e-05} +{"train_loss": 0.0008004371193237603, "global_step": 55031, "epoch": 462, "lr": 1.2583957124462426e-05} +{"train_loss": 0.0006175985909067094, "global_step": 55032, "epoch": 462, "lr": 1.2582487531819343e-05} +{"train_loss": 0.0007645134464837611, "global_step": 55033, "epoch": 462, "lr": 1.2581018012641565e-05} +{"train_loss": 0.00039756917976774275, "global_step": 55034, "epoch": 462, "lr": 1.2579548566931959e-05} +{"train_loss": 0.0006825218442827463, "global_step": 55035, "epoch": 462, "lr": 1.2578079194693393e-05} +{"train_loss": 0.0011191179510205984, "global_step": 55036, "epoch": 462, "lr": 1.2576609895928792e-05} +{"train_loss": 0.000572088873013854, "global_step": 55037, "epoch": 462, "lr": 1.2575140670641e-05} +{"train_loss": 0.00042369100265204906, "global_step": 55038, "epoch": 462, "lr": 1.257367151883294e-05} +{"train_loss": 0.00036304965033195913, "global_step": 55039, "epoch": 462, "lr": 1.2572202440507458e-05} +{"train_loss": 0.0004114499606657773, "global_step": 55040, "epoch": 462, "lr": 1.2570733435667475e-05} +{"train_loss": 0.0005375588079914451, "global_step": 55041, "epoch": 462, "lr": 1.2569264504315848e-05} +{"train_loss": 0.0007266760221682489, "global_step": 55042, "epoch": 462, "lr": 1.2567795646455477e-05} +{"train_loss": 0.001679635839536786, "global_step": 55043, "epoch": 462, "lr": 1.2566326862089234e-05} +{"train_loss": 0.000843032612465322, "global_step": 55044, "epoch": 462, "lr": 1.2564858151220022e-05} +{"train_loss": 0.0005329477717168629, "global_step": 55045, "epoch": 462, "lr": 1.2563389513850693e-05} +{"train_loss": 0.0006211054278537631, "global_step": 55046, "epoch": 462, "lr": 1.2561920949984163e-05} +{"train_loss": 0.0006293233018368483, "global_step": 55047, "epoch": 462, "lr": 1.2560452459623289e-05} +{"train_loss": 0.0009915931150317192, "global_step": 55048, "epoch": 462, "lr": 1.2558984042770982e-05} +{"train_loss": 0.00045959933777339756, "global_step": 55049, "epoch": 462, "lr": 1.2557515699430094e-05} +{"train_loss": 0.000704614503774792, "global_step": 55050, "epoch": 462, "lr": 1.255604742960354e-05} +{"train_loss": 0.0006174944574013352, "global_step": 55051, "epoch": 462, "lr": 1.2554579233294172e-05} +{"train_loss": 0.0008438204531557858, "global_step": 55052, "epoch": 462, "lr": 1.2553111110504906e-05} +{"train_loss": 0.00033178922603838146, "global_step": 55053, "epoch": 462, "lr": 1.25516430612386e-05} +{"train_loss": 0.00030244735535234213, "global_step": 55054, "epoch": 462, "lr": 1.2550175085498129e-05} +{"train_loss": 0.00039844942511990666, "global_step": 55055, "epoch": 462, "lr": 1.2548707183286401e-05} +{"train_loss": 0.0010531505104154348, "global_step": 55056, "epoch": 462, "lr": 1.2547239354606272e-05} +{"train_loss": 0.0005111396312713623, "global_step": 55057, "epoch": 462, "lr": 1.2545771599460653e-05} +{"train_loss": 0.0004309095675125718, "global_step": 55058, "epoch": 462, "lr": 1.2544303917852396e-05} +{"train_loss": 0.0006339817773550749, "global_step": 55059, "epoch": 462, "lr": 1.2542836309784406e-05} +{"train_loss": 0.0006822884315624833, "global_step": 55060, "epoch": 462, "lr": 1.254136877525956e-05} +{"train_loss": 0.0003272920148447156, "global_step": 55061, "epoch": 462, "lr": 1.2539901314280722e-05} +{"train_loss": 0.0004011036944575608, "global_step": 55062, "epoch": 462, "lr": 1.2538433926850795e-05} +{"train_loss": 0.0005294773145578802, "global_step": 55063, "epoch": 462, "lr": 1.2536966612972639e-05} +{"train_loss": 0.0006861022557131946, "global_step": 55064, "epoch": 462, "lr": 1.2535499372649161e-05} +{"train_loss": 0.000613780808635056, "global_step": 55065, "epoch": 462, "lr": 1.2534032205883228e-05} +{"train_loss": 0.0005245836800895631, "global_step": 55066, "epoch": 462, "lr": 1.2532565112677708e-05} +{"train_loss": 0.0010922981891781092, "global_step": 55067, "epoch": 462, "lr": 1.2531098093035504e-05} +{"train_loss": 0.00048488948959857225, "global_step": 55068, "epoch": 462, "lr": 1.252963114695947e-05} +{"train_loss": 0.0006599638145416975, "global_step": 55069, "epoch": 462, "lr": 1.252816427445252e-05} +{"train_loss": 0.0007197290542535484, "global_step": 55070, "epoch": 462, "lr": 1.2526697475517502e-05} +{"train_loss": 0.0008714062860235572, "global_step": 55071, "epoch": 462, "lr": 1.2525230750157324e-05} +{"train_loss": 0.0003989745455328375, "global_step": 55072, "epoch": 462, "lr": 1.2523764098374852e-05} +{"train_loss": 0.00047756280400790274, "global_step": 55073, "epoch": 462, "lr": 1.2522297520172949e-05} +{"train_loss": 0.0010097816120833158, "global_step": 55074, "epoch": 462, "lr": 1.2520831015554524e-05} +{"train_loss": 0.0013154129264876246, "global_step": 55075, "epoch": 462, "lr": 1.251936458452243e-05} +{"train_loss": 0.0008231188985519111, "global_step": 55076, "epoch": 462, "lr": 1.251789822707956e-05} +{"train_loss": 0.0008470299653708935, "global_step": 55077, "epoch": 462, "lr": 1.2516431943228813e-05} +{"train_loss": 0.00038495362969115376, "global_step": 55078, "epoch": 462, "lr": 1.2514965732973028e-05} +{"train_loss": 0.0012226239778101444, "global_step": 55079, "epoch": 462, "lr": 1.2513499596315115e-05} +{"train_loss": 0.0004916815087199211, "global_step": 55080, "epoch": 462, "lr": 1.2512033533257927e-05} +{"train_loss": 0.0006506197387352586, "global_step": 55081, "epoch": 462, "lr": 1.2510567543804374e-05} +{"train_loss": 0.0006403941661119461, "global_step": 55082, "epoch": 462, "lr": 1.2509101627957297e-05} +{"train_loss": 0.00040044207707978785, "global_step": 55083, "epoch": 462, "lr": 1.2507635785719613e-05} +{"train_loss": 0.0004030705022159964, "global_step": 55084, "epoch": 462, "lr": 1.2506170017094182e-05} +{"train_loss": 0.0003814414085354656, "global_step": 55085, "epoch": 462, "lr": 1.250470432208386e-05} +{"train_loss": 0.0008369753486476839, "global_step": 55086, "epoch": 462, "lr": 1.2503238700691561e-05} +{"train_loss": 0.0008143617887981236, "global_step": 55087, "epoch": 462, "lr": 1.2501773152920137e-05} +{"train_loss": 0.0006099700112827122, "global_step": 55088, "epoch": 462, "lr": 1.2500307678772489e-05} +{"train_loss": 0.0008034442435018718, "global_step": 55089, "epoch": 462, "lr": 1.249884227825146e-05} +{"train_loss": 0.0008655375568196177, "global_step": 55090, "epoch": 462, "lr": 1.2497376951359969e-05} +{"train_loss": 0.0005014673224650323, "global_step": 55091, "epoch": 462, "lr": 1.2495911698100865e-05} +{"train_loss": 0.0011093317298218608, "global_step": 55092, "epoch": 462, "lr": 1.2494446518477022e-05} +{"train_loss": 0.0009855072712525725, "global_step": 55093, "epoch": 462, "lr": 1.2492981412491339e-05} +{"train_loss": 0.00045609197695739567, "global_step": 55094, "epoch": 462, "lr": 1.2491516380146667e-05} +{"train_loss": 0.0008464890415780246, "global_step": 55095, "epoch": 462, "lr": 1.2490051421445914e-05} +{"train_loss": 0.0006944842767674758, "global_step": 55096, "epoch": 462, "lr": 1.2488586536391916e-05, "val_loss": 0.020092694088816643} +{"train_loss": 0.0008438389631919563, "global_step": 55097, "epoch": 463, "lr": 1.2487121724987589e-05} +{"train_loss": 0.00061599857872352, "global_step": 55098, "epoch": 463, "lr": 1.2485656987235788e-05} +{"train_loss": 0.0008081142441369593, "global_step": 55099, "epoch": 463, "lr": 1.2484192323139383e-05} +{"train_loss": 0.0002077047829516232, "global_step": 55100, "epoch": 463, "lr": 1.2482727732701266e-05} +{"train_loss": 0.00028661402757279575, "global_step": 55101, "epoch": 463, "lr": 1.2481263215924295e-05} +{"train_loss": 0.0003777056117542088, "global_step": 55102, "epoch": 463, "lr": 1.2479798772811368e-05} +{"train_loss": 0.00023983490245882422, "global_step": 55103, "epoch": 463, "lr": 1.247833440336535e-05} +{"train_loss": 0.0003535746945999563, "global_step": 55104, "epoch": 463, "lr": 1.2476870107589095e-05} +{"train_loss": 0.0005733277066610754, "global_step": 55105, "epoch": 463, "lr": 1.2475405885485513e-05} +{"train_loss": 0.0005040827090851963, "global_step": 55106, "epoch": 463, "lr": 1.2473941737057449e-05} +{"train_loss": 0.0005758134066127241, "global_step": 55107, "epoch": 463, "lr": 1.2472477662307803e-05} +{"train_loss": 0.0004925731918774545, "global_step": 55108, "epoch": 463, "lr": 1.2471013661239428e-05} +{"train_loss": 0.000742701580747962, "global_step": 55109, "epoch": 463, "lr": 1.2469549733855217e-05} +{"train_loss": 0.0003381444257684052, "global_step": 55110, "epoch": 463, "lr": 1.2468085880158026e-05} +{"train_loss": 0.0006708184373565018, "global_step": 55111, "epoch": 463, "lr": 1.2466622100150754e-05} +{"train_loss": 0.0005959978443570435, "global_step": 55112, "epoch": 463, "lr": 1.246515839383624e-05} +{"train_loss": 0.0003302975674159825, "global_step": 55113, "epoch": 463, "lr": 1.2463694761217382e-05} +{"train_loss": 0.000465345976408571, "global_step": 55114, "epoch": 463, "lr": 1.2462231202297064e-05} +{"train_loss": 0.0006537929875776172, "global_step": 55115, "epoch": 463, "lr": 1.2460767717078126e-05} +{"train_loss": 0.0005690022371709347, "global_step": 55116, "epoch": 463, "lr": 1.245930430556348e-05} +{"train_loss": 0.0007979266811162233, "global_step": 55117, "epoch": 463, "lr": 1.2457840967755973e-05} +{"train_loss": 0.00027670300914905965, "global_step": 55118, "epoch": 463, "lr": 1.2456377703658472e-05} +{"train_loss": 0.0012419788399711251, "global_step": 55119, "epoch": 463, "lr": 1.245491451327388e-05} +{"train_loss": 0.0008389109279960394, "global_step": 55120, "epoch": 463, "lr": 1.2453451396605037e-05} +{"train_loss": 0.0007098853820934892, "global_step": 55121, "epoch": 463, "lr": 1.2451988353654847e-05} +{"train_loss": 0.0008711927221156657, "global_step": 55122, "epoch": 463, "lr": 1.2450525384426165e-05} +{"train_loss": 0.0016273356741294265, "global_step": 55123, "epoch": 463, "lr": 1.2449062488921847e-05} +{"train_loss": 0.0007170048193074763, "global_step": 55124, "epoch": 463, "lr": 1.24475996671448e-05} +{"train_loss": 0.000623529776930809, "global_step": 55125, "epoch": 463, "lr": 1.2446136919097861e-05} +{"train_loss": 0.0007227173773571849, "global_step": 55126, "epoch": 463, "lr": 1.2444674244783943e-05} +{"train_loss": 0.0004942514933645725, "global_step": 55127, "epoch": 463, "lr": 1.2443211644205871e-05} +{"train_loss": 0.0007335103582590818, "global_step": 55128, "epoch": 463, "lr": 1.2441749117366563e-05} +{"train_loss": 0.00039812418981455266, "global_step": 55129, "epoch": 463, "lr": 1.2440286664268864e-05} +{"train_loss": 0.000490809790790081, "global_step": 55130, "epoch": 463, "lr": 1.2438824284915635e-05} +{"train_loss": 0.0003321728727314621, "global_step": 55131, "epoch": 463, "lr": 1.2437361979309775e-05} +{"train_loss": 0.0006145989755168557, "global_step": 55132, "epoch": 463, "lr": 1.2435899747454132e-05} +{"train_loss": 0.0002560111170168966, "global_step": 55133, "epoch": 463, "lr": 1.24344375893516e-05} +{"train_loss": 0.0011387111153453588, "global_step": 55134, "epoch": 463, "lr": 1.2432975505005034e-05} +{"train_loss": 0.0005949285114184022, "global_step": 55135, "epoch": 463, "lr": 1.243151349441729e-05} +{"train_loss": 0.0007083823438733816, "global_step": 55136, "epoch": 463, "lr": 1.2430051557591277e-05} +{"train_loss": 0.0004452312714420259, "global_step": 55137, "epoch": 463, "lr": 1.2428589694529823e-05} +{"train_loss": 0.0005390789592638612, "global_step": 55138, "epoch": 463, "lr": 1.2427127905235841e-05} +{"train_loss": 0.0005486503941938281, "global_step": 55139, "epoch": 463, "lr": 1.242566618971216e-05} +{"train_loss": 0.0010064819362014532, "global_step": 55140, "epoch": 463, "lr": 1.2424204547961681e-05} +{"train_loss": 0.0006554658175446093, "global_step": 55141, "epoch": 463, "lr": 1.242274297998725e-05} +{"train_loss": 0.0007503714296035469, "global_step": 55142, "epoch": 463, "lr": 1.242128148579177e-05} +{"train_loss": 0.0005113533698022366, "global_step": 55143, "epoch": 463, "lr": 1.2419820065378068e-05} +{"train_loss": 0.0009713442996144295, "global_step": 55144, "epoch": 463, "lr": 1.2418358718749046e-05} +{"train_loss": 0.00037169252755120397, "global_step": 55145, "epoch": 463, "lr": 1.2416897445907556e-05} +{"train_loss": 0.0006011656951159239, "global_step": 55146, "epoch": 463, "lr": 1.2415436246856477e-05} +{"train_loss": 0.0008930970216169953, "global_step": 55147, "epoch": 463, "lr": 1.2413975121598664e-05} +{"train_loss": 0.0005977901164442301, "global_step": 55148, "epoch": 463, "lr": 1.241251407013701e-05} +{"train_loss": 0.0007331851520575583, "global_step": 55149, "epoch": 463, "lr": 1.2411053092474356e-05} +{"train_loss": 0.0004442640929482877, "global_step": 55150, "epoch": 463, "lr": 1.2409592188613594e-05} +{"train_loss": 0.0004802214971277863, "global_step": 55151, "epoch": 463, "lr": 1.2408131358557573e-05} +{"train_loss": 0.0005381320370361209, "global_step": 55152, "epoch": 463, "lr": 1.2406670602309178e-05} +{"train_loss": 0.0007159813540056348, "global_step": 55153, "epoch": 463, "lr": 1.2405209919871275e-05} +{"train_loss": 0.00047181820264086127, "global_step": 55154, "epoch": 463, "lr": 1.240374931124671e-05} +{"train_loss": 0.0008228984079323709, "global_step": 55155, "epoch": 463, "lr": 1.2402288776438376e-05} +{"train_loss": 0.0005827561835758388, "global_step": 55156, "epoch": 463, "lr": 1.240082831544912e-05} +{"train_loss": 0.0005992839578539133, "global_step": 55157, "epoch": 463, "lr": 1.2399367928281835e-05} +{"train_loss": 0.0003785118751693517, "global_step": 55158, "epoch": 463, "lr": 1.2397907614939363e-05} +{"train_loss": 0.0006715370691381395, "global_step": 55159, "epoch": 463, "lr": 1.2396447375424596e-05} +{"train_loss": 0.000924419320654124, "global_step": 55160, "epoch": 463, "lr": 1.2394987209740383e-05} +{"train_loss": 0.0007222880376502872, "global_step": 55161, "epoch": 463, "lr": 1.2393527117889581e-05} +{"train_loss": 0.0006992642884142697, "global_step": 55162, "epoch": 463, "lr": 1.2392067099875087e-05} +{"train_loss": 0.00036773583269678056, "global_step": 55163, "epoch": 463, "lr": 1.239060715569974e-05} +{"train_loss": 0.0003822487487923354, "global_step": 55164, "epoch": 463, "lr": 1.2389147285366432e-05} +{"train_loss": 0.0005871657049283385, "global_step": 55165, "epoch": 463, "lr": 1.2387687488877997e-05} +{"train_loss": 0.0006549332174472511, "global_step": 55166, "epoch": 463, "lr": 1.2386227766237335e-05} +{"train_loss": 0.00046005495823919773, "global_step": 55167, "epoch": 463, "lr": 1.2384768117447293e-05} +{"train_loss": 0.0002789174614008516, "global_step": 55168, "epoch": 463, "lr": 1.2383308542510729e-05} +{"train_loss": 0.0006498121074400842, "global_step": 55169, "epoch": 463, "lr": 1.2381849041430538e-05} +{"train_loss": 0.00040797344991005957, "global_step": 55170, "epoch": 463, "lr": 1.2380389614209547e-05} +{"train_loss": 0.0006367854657582939, "global_step": 55171, "epoch": 463, "lr": 1.2378930260850657e-05} +{"train_loss": 0.0009264727123081684, "global_step": 55172, "epoch": 463, "lr": 1.237747098135672e-05} +{"train_loss": 0.0005878139636479318, "global_step": 55173, "epoch": 463, "lr": 1.237601177573059e-05} +{"train_loss": 0.000422340672230348, "global_step": 55174, "epoch": 463, "lr": 1.2374552643975135e-05} +{"train_loss": 0.00102178193628788, "global_step": 55175, "epoch": 463, "lr": 1.2373093586093243e-05} +{"train_loss": 0.0007430291152559221, "global_step": 55176, "epoch": 463, "lr": 1.2371634602087744e-05} +{"train_loss": 0.0004208338796161115, "global_step": 55177, "epoch": 463, "lr": 1.2370175691961539e-05} +{"train_loss": 0.0005566402105614543, "global_step": 55178, "epoch": 463, "lr": 1.2368716855717455e-05} +{"train_loss": 0.00045181886525824666, "global_step": 55179, "epoch": 463, "lr": 1.2367258093358392e-05} +{"train_loss": 0.0005148373893462121, "global_step": 55180, "epoch": 463, "lr": 1.2365799404887185e-05} +{"train_loss": 0.0007990846643224359, "global_step": 55181, "epoch": 463, "lr": 1.2364340790306723e-05} +{"train_loss": 0.0006611933349631727, "global_step": 55182, "epoch": 463, "lr": 1.236288224961984e-05} +{"train_loss": 0.0005464305286295712, "global_step": 55183, "epoch": 463, "lr": 1.2361423782829435e-05} +{"train_loss": 0.0006271544261835515, "global_step": 55184, "epoch": 463, "lr": 1.2359965389938356e-05} +{"train_loss": 0.0005122317816130817, "global_step": 55185, "epoch": 463, "lr": 1.2358507070949443e-05} +{"train_loss": 0.0010158016812056303, "global_step": 55186, "epoch": 463, "lr": 1.2357048825865597e-05} +{"train_loss": 0.0005659200251102448, "global_step": 55187, "epoch": 463, "lr": 1.2355590654689648e-05} +{"train_loss": 0.0005212125252000988, "global_step": 55188, "epoch": 463, "lr": 1.2354132557424492e-05} +{"train_loss": 0.0011595353716984391, "global_step": 55189, "epoch": 463, "lr": 1.2352674534072955e-05} +{"train_loss": 0.0005094542284496129, "global_step": 55190, "epoch": 463, "lr": 1.2351216584637942e-05} +{"train_loss": 0.0004303878522478044, "global_step": 55191, "epoch": 463, "lr": 1.2349758709122289e-05} +{"train_loss": 0.0006078049773350358, "global_step": 55192, "epoch": 463, "lr": 1.2348300907528848e-05} +{"train_loss": 0.0005720360204577446, "global_step": 55193, "epoch": 463, "lr": 1.2346843179860512e-05} +{"train_loss": 0.0004996227216906846, "global_step": 55194, "epoch": 463, "lr": 1.2345385526120107e-05} +{"train_loss": 0.0008903020061552525, "global_step": 55195, "epoch": 463, "lr": 1.2343927946310536e-05} +{"train_loss": 0.00042874342761933804, "global_step": 55196, "epoch": 463, "lr": 1.2342470440434622e-05} +{"train_loss": 0.0004512899904511869, "global_step": 55197, "epoch": 463, "lr": 1.2341013008495256e-05} +{"train_loss": 0.0008168587228283286, "global_step": 55198, "epoch": 463, "lr": 1.2339555650495294e-05} +{"train_loss": 0.00048350373981520534, "global_step": 55199, "epoch": 463, "lr": 1.2338098366437572e-05} +{"train_loss": 0.0009988583624362946, "global_step": 55200, "epoch": 463, "lr": 1.2336641156324986e-05} +{"train_loss": 0.001203277031891048, "global_step": 55201, "epoch": 463, "lr": 1.2335184020160361e-05} +{"train_loss": 0.0006823741132393479, "global_step": 55202, "epoch": 463, "lr": 1.23337269579466e-05} +{"train_loss": 0.00040282824193127453, "global_step": 55203, "epoch": 463, "lr": 1.2332269969686544e-05} +{"train_loss": 0.0009297940414398909, "global_step": 55204, "epoch": 463, "lr": 1.2330813055383034e-05} +{"train_loss": 0.0003372404898982495, "global_step": 55205, "epoch": 463, "lr": 1.2329356215038962e-05} +{"train_loss": 0.0006279100780375302, "global_step": 55206, "epoch": 463, "lr": 1.232789944865716e-05} +{"train_loss": 0.0005470148753374815, "global_step": 55207, "epoch": 463, "lr": 1.2326442756240513e-05} +{"train_loss": 0.00032075284980237484, "global_step": 55208, "epoch": 463, "lr": 1.232498613779186e-05} +{"train_loss": 0.0008389619179069996, "global_step": 55209, "epoch": 463, "lr": 1.2323529593314076e-05} +{"train_loss": 0.0004965969128534198, "global_step": 55210, "epoch": 463, "lr": 1.232207312281003e-05} +{"train_loss": 0.00047133187763392925, "global_step": 55211, "epoch": 463, "lr": 1.2320616726282547e-05} +{"train_loss": 0.0009248250280506909, "global_step": 55212, "epoch": 463, "lr": 1.2319160403734525e-05} +{"train_loss": 0.00048724882071837783, "global_step": 55213, "epoch": 463, "lr": 1.2317704155168797e-05} +{"train_loss": 0.0009826334426179528, "global_step": 55214, "epoch": 463, "lr": 1.2316247980588241e-05} +{"train_loss": 0.0006232487871517044, "global_step": 55215, "epoch": 463, "lr": 1.2314791879995692e-05, "val_loss": 0.032396551221609116} +{"train_loss": 0.0006309194723144174, "global_step": 55216, "epoch": 464, "lr": 1.2313335853394036e-05} +{"train_loss": 0.0006756698130629957, "global_step": 55217, "epoch": 464, "lr": 1.2311879900786121e-05} +{"train_loss": 0.00037470398820005357, "global_step": 55218, "epoch": 464, "lr": 1.2310424022174788e-05} +{"train_loss": 0.00048714346485212445, "global_step": 55219, "epoch": 464, "lr": 1.2308968217562928e-05} +{"train_loss": 0.0006529030506499112, "global_step": 55220, "epoch": 464, "lr": 1.2307512486953366e-05} +{"train_loss": 0.00032352469861507416, "global_step": 55221, "epoch": 464, "lr": 1.2306056830348989e-05} +{"train_loss": 0.001463338267058134, "global_step": 55222, "epoch": 464, "lr": 1.2304601247752645e-05} +{"train_loss": 0.0004864002694375813, "global_step": 55223, "epoch": 464, "lr": 1.2303145739167171e-05} +{"train_loss": 0.0003950487880501896, "global_step": 55224, "epoch": 464, "lr": 1.2301690304595459e-05} +{"train_loss": 0.00025579691282473505, "global_step": 55225, "epoch": 464, "lr": 1.230023494404034e-05} +{"train_loss": 0.0004911745199933648, "global_step": 55226, "epoch": 464, "lr": 1.2298779657504695e-05} +{"train_loss": 0.0007902101497165859, "global_step": 55227, "epoch": 464, "lr": 1.2297324444991348e-05} +{"train_loss": 0.0005899102543480694, "global_step": 55228, "epoch": 464, "lr": 1.2295869306503199e-05} +{"train_loss": 0.0003606109821703285, "global_step": 55229, "epoch": 464, "lr": 1.2294414242043079e-05} +{"train_loss": 0.0006590156117454171, "global_step": 55230, "epoch": 464, "lr": 1.2292959251613834e-05} +{"train_loss": 0.0004695348907262087, "global_step": 55231, "epoch": 464, "lr": 1.229150433521835e-05} +{"train_loss": 0.0008311441051773727, "global_step": 55232, "epoch": 464, "lr": 1.2290049492859451e-05} +{"train_loss": 0.00046351904165931046, "global_step": 55233, "epoch": 464, "lr": 1.2288594724540031e-05} +{"train_loss": 0.0002514500811230391, "global_step": 55234, "epoch": 464, "lr": 1.228714003026291e-05} +{"train_loss": 0.0007312115631066263, "global_step": 55235, "epoch": 464, "lr": 1.2285685410030973e-05} +{"train_loss": 0.00062145123956725, "global_step": 55236, "epoch": 464, "lr": 1.2284230863847068e-05} +{"train_loss": 0.00048036419320851564, "global_step": 55237, "epoch": 464, "lr": 1.2282776391714023e-05} +{"train_loss": 0.0008908568415790796, "global_step": 55238, "epoch": 464, "lr": 1.2281321993634743e-05} +{"train_loss": 0.0007548722205683589, "global_step": 55239, "epoch": 464, "lr": 1.2279867669612032e-05} +{"train_loss": 0.00076779950177297, "global_step": 55240, "epoch": 464, "lr": 1.2278413419648794e-05} +{"train_loss": 0.0006599266198463738, "global_step": 55241, "epoch": 464, "lr": 1.2276959243747843e-05} +{"train_loss": 0.00045086053432896733, "global_step": 55242, "epoch": 464, "lr": 1.227550514191207e-05} +{"train_loss": 0.0005058249807916582, "global_step": 55243, "epoch": 464, "lr": 1.2274051114144292e-05} +{"train_loss": 0.0008689342066645622, "global_step": 55244, "epoch": 464, "lr": 1.2272597160447392e-05} +{"train_loss": 0.0004554797487799078, "global_step": 55245, "epoch": 464, "lr": 1.2271143280824227e-05} +{"train_loss": 0.0005318325711414218, "global_step": 55246, "epoch": 464, "lr": 1.2269689475277624e-05} +{"train_loss": 0.00040934726712293923, "global_step": 55247, "epoch": 464, "lr": 1.2268235743810474e-05} +{"train_loss": 0.0008174677495844662, "global_step": 55248, "epoch": 464, "lr": 1.226678208642561e-05} +{"train_loss": 0.0006495294510386884, "global_step": 55249, "epoch": 464, "lr": 1.2265328503125872e-05} +{"train_loss": 0.00048814876936376095, "global_step": 55250, "epoch": 464, "lr": 1.2263874993914149e-05} +{"train_loss": 0.00047216800157912076, "global_step": 55251, "epoch": 464, "lr": 1.2262421558793258e-05} +{"train_loss": 0.00040392871596850455, "global_step": 55252, "epoch": 464, "lr": 1.2260968197766087e-05} +{"train_loss": 0.000368524226360023, "global_step": 55253, "epoch": 464, "lr": 1.2259514910835474e-05} +{"train_loss": 0.0004492333682719618, "global_step": 55254, "epoch": 464, "lr": 1.2258061698004253e-05} +{"train_loss": 0.0005042788106948137, "global_step": 55255, "epoch": 464, "lr": 1.2256608559275312e-05} +{"train_loss": 0.0011194146936759353, "global_step": 55256, "epoch": 464, "lr": 1.2255155494651477e-05} +{"train_loss": 0.0016591945895925164, "global_step": 55257, "epoch": 464, "lr": 1.2253702504135623e-05} +{"train_loss": 0.0010124186519533396, "global_step": 55258, "epoch": 464, "lr": 1.225224958773058e-05} +{"train_loss": 0.0005208277143537998, "global_step": 55259, "epoch": 464, "lr": 1.225079674543922e-05} +{"train_loss": 0.0005970356869511306, "global_step": 55260, "epoch": 464, "lr": 1.2249343977264394e-05} +{"train_loss": 0.00064380670664832, "global_step": 55261, "epoch": 464, "lr": 1.2247891283208929e-05} +{"train_loss": 0.0004812416445929557, "global_step": 55262, "epoch": 464, "lr": 1.2246438663275716e-05} +{"train_loss": 0.0007453558500856161, "global_step": 55263, "epoch": 464, "lr": 1.2244986117467566e-05} +{"train_loss": 0.00032907308195717633, "global_step": 55264, "epoch": 464, "lr": 1.224353364578737e-05} +{"train_loss": 0.00041678064735606313, "global_step": 55265, "epoch": 464, "lr": 1.2242081248237953e-05} +{"train_loss": 0.0003584801161196083, "global_step": 55266, "epoch": 464, "lr": 1.2240628924822184e-05} +{"train_loss": 0.0006011611549183726, "global_step": 55267, "epoch": 464, "lr": 1.2239176675542906e-05} +{"train_loss": 0.000563531182706356, "global_step": 55268, "epoch": 464, "lr": 1.2237724500402959e-05} +{"train_loss": 0.0003621108189690858, "global_step": 55269, "epoch": 464, "lr": 1.2236272399405218e-05} +{"train_loss": 0.00047103952965699136, "global_step": 55270, "epoch": 464, "lr": 1.2234820372552509e-05} +{"train_loss": 0.0005188525537960231, "global_step": 55271, "epoch": 464, "lr": 1.2233368419847708e-05} +{"train_loss": 0.0006220901268534362, "global_step": 55272, "epoch": 464, "lr": 1.2231916541293636e-05} +{"train_loss": 0.00035050956648774445, "global_step": 55273, "epoch": 464, "lr": 1.2230464736893178e-05} +{"train_loss": 0.0003789384791161865, "global_step": 55274, "epoch": 464, "lr": 1.2229013006649154e-05} +{"train_loss": 0.0008416992495767772, "global_step": 55275, "epoch": 464, "lr": 1.2227561350564443e-05} +{"train_loss": 0.0008469375898130238, "global_step": 55276, "epoch": 464, "lr": 1.2226109768641863e-05} +{"train_loss": 0.000305016030324623, "global_step": 55277, "epoch": 464, "lr": 1.2224658260884298e-05} +{"train_loss": 0.00107747339643538, "global_step": 55278, "epoch": 464, "lr": 1.2223206827294564e-05} +{"train_loss": 0.000443772180005908, "global_step": 55279, "epoch": 464, "lr": 1.2221755467875546e-05} +{"train_loss": 0.0011380478972569108, "global_step": 55280, "epoch": 464, "lr": 1.2220304182630054e-05} +{"train_loss": 0.0005875344504602253, "global_step": 55281, "epoch": 464, "lr": 1.221885297156098e-05} +{"train_loss": 0.0006423405720852315, "global_step": 55282, "epoch": 464, "lr": 1.2217401834671132e-05} +{"train_loss": 0.0005485517322085798, "global_step": 55283, "epoch": 464, "lr": 1.2215950771963396e-05} +{"train_loss": 0.0004318878927733749, "global_step": 55284, "epoch": 464, "lr": 1.2214499783440592e-05} +{"train_loss": 0.0004922595690004528, "global_step": 55285, "epoch": 464, "lr": 1.2213048869105592e-05} +{"train_loss": 0.0007634835201315582, "global_step": 55286, "epoch": 464, "lr": 1.2211598028961235e-05} +{"train_loss": 0.000508543336763978, "global_step": 55287, "epoch": 464, "lr": 1.2210147263010353e-05} +{"train_loss": 0.0008403763058595359, "global_step": 55288, "epoch": 464, "lr": 1.2208696571255823e-05} +{"train_loss": 0.0002420196105958894, "global_step": 55289, "epoch": 464, "lr": 1.2207245953700464e-05} +{"train_loss": 0.000488812627736479, "global_step": 55290, "epoch": 464, "lr": 1.220579541034716e-05} +{"train_loss": 0.000710161286406219, "global_step": 55291, "epoch": 464, "lr": 1.2204344941198736e-05} +{"train_loss": 0.001140405423939228, "global_step": 55292, "epoch": 464, "lr": 1.2202894546258026e-05} +{"train_loss": 0.00037472372059710324, "global_step": 55293, "epoch": 464, "lr": 1.2201444225527915e-05} +{"train_loss": 0.0007153222686611116, "global_step": 55294, "epoch": 464, "lr": 1.219999397901121e-05} +{"train_loss": 0.0003588202816899866, "global_step": 55295, "epoch": 464, "lr": 1.2198543806710794e-05} +{"train_loss": 0.0005651224637404084, "global_step": 55296, "epoch": 464, "lr": 1.2197093708629486e-05} +{"train_loss": 0.0004713029193226248, "global_step": 55297, "epoch": 464, "lr": 1.2195643684770159e-05} +{"train_loss": 0.0006858182605355978, "global_step": 55298, "epoch": 464, "lr": 1.2194193735135645e-05} +{"train_loss": 0.00029160440317355096, "global_step": 55299, "epoch": 464, "lr": 1.2192743859728784e-05} +{"train_loss": 0.000550820492208004, "global_step": 55300, "epoch": 464, "lr": 1.2191294058552438e-05} +{"train_loss": 0.0006217684713192284, "global_step": 55301, "epoch": 464, "lr": 1.218984433160944e-05} +{"train_loss": 0.0007493874873034656, "global_step": 55302, "epoch": 464, "lr": 1.2188394678902654e-05} +{"train_loss": 0.0005179829895496368, "global_step": 55303, "epoch": 464, "lr": 1.2186945100434899e-05} +{"train_loss": 0.000292188924504444, "global_step": 55304, "epoch": 464, "lr": 1.2185495596209056e-05} +{"train_loss": 0.0006800888222642243, "global_step": 55305, "epoch": 464, "lr": 1.2184046166227952e-05} +{"train_loss": 0.0006253320025280118, "global_step": 55306, "epoch": 464, "lr": 1.2182596810494417e-05} +{"train_loss": 0.0003547079104464501, "global_step": 55307, "epoch": 464, "lr": 1.2181147529011311e-05} +{"train_loss": 0.0006259782239794731, "global_step": 55308, "epoch": 464, "lr": 1.2179698321781502e-05} +{"train_loss": 0.00029225563048385084, "global_step": 55309, "epoch": 464, "lr": 1.2178249188807795e-05} +{"train_loss": 0.00022246409207582474, "global_step": 55310, "epoch": 464, "lr": 1.2176800130093075e-05} +{"train_loss": 0.0010413709096610546, "global_step": 55311, "epoch": 464, "lr": 1.2175351145640146e-05} +{"train_loss": 0.00045029952889308333, "global_step": 55312, "epoch": 464, "lr": 1.2173902235451896e-05} +{"train_loss": 0.0007015750161372125, "global_step": 55313, "epoch": 464, "lr": 1.2172453399531125e-05} +{"train_loss": 0.0004894024459645152, "global_step": 55314, "epoch": 464, "lr": 1.2171004637880718e-05} +{"train_loss": 0.000404978432925418, "global_step": 55315, "epoch": 464, "lr": 1.2169555950503492e-05} +{"train_loss": 0.0002411862078588456, "global_step": 55316, "epoch": 464, "lr": 1.2168107337402312e-05} +{"train_loss": 0.0009877263801172376, "global_step": 55317, "epoch": 464, "lr": 1.2166658798580011e-05} +{"train_loss": 0.0004061466024722904, "global_step": 55318, "epoch": 464, "lr": 1.2165210334039417e-05} +{"train_loss": 0.0004586309951264411, "global_step": 55319, "epoch": 464, "lr": 1.2163761943783409e-05} +{"train_loss": 0.00038569109165109694, "global_step": 55320, "epoch": 464, "lr": 1.2162313627814797e-05} +{"train_loss": 0.0004810279351659119, "global_step": 55321, "epoch": 464, "lr": 1.2160865386136456e-05} +{"train_loss": 0.0007382704643532634, "global_step": 55322, "epoch": 464, "lr": 1.2159417218751206e-05} +{"train_loss": 0.0005190082010813057, "global_step": 55323, "epoch": 464, "lr": 1.2157969125661894e-05} +{"train_loss": 0.0006548952660523355, "global_step": 55324, "epoch": 464, "lr": 1.2156521106871372e-05} +{"train_loss": 0.0004867224779445678, "global_step": 55325, "epoch": 464, "lr": 1.2155073162382468e-05} +{"train_loss": 0.0005275940056890249, "global_step": 55326, "epoch": 464, "lr": 1.215362529219805e-05} +{"train_loss": 0.00042321375804021955, "global_step": 55327, "epoch": 464, "lr": 1.2152177496320926e-05} +{"train_loss": 0.0006219085771590471, "global_step": 55328, "epoch": 464, "lr": 1.2150729774753977e-05} +{"train_loss": 0.0004989160806871951, "global_step": 55329, "epoch": 464, "lr": 1.2149282127500027e-05} +{"train_loss": 0.0004945393884554505, "global_step": 55330, "epoch": 464, "lr": 1.2147834554561899e-05} +{"train_loss": 0.0004477940092328936, "global_step": 55331, "epoch": 464, "lr": 1.2146387055942471e-05} +{"train_loss": 0.0003252810565754771, "global_step": 55332, "epoch": 464, "lr": 1.2144939631644554e-05} +{"train_loss": 0.0002556360559538007, "global_step": 55333, "epoch": 464, "lr": 1.2143492281671015e-05} +{"train_loss": 0.0005774250961576017, "global_step": 55334, "epoch": 464, "lr": 1.2142045006024677e-05, "val_loss": 0.015217987820506096} +{"train_loss": 0.0005086039891466498, "global_step": 55335, "epoch": 465, "lr": 1.2140597804708399e-05} +{"train_loss": 0.0004358197911642492, "global_step": 55336, "epoch": 465, "lr": 1.2139150677725009e-05} +{"train_loss": 0.0005505123408511281, "global_step": 55337, "epoch": 465, "lr": 1.2137703625077346e-05} +{"train_loss": 0.0005391443846747279, "global_step": 55338, "epoch": 465, "lr": 1.2136256646768262e-05} +{"train_loss": 0.00047757563879713416, "global_step": 55339, "epoch": 465, "lr": 1.2134809742800585e-05} +{"train_loss": 0.0005431966856122017, "global_step": 55340, "epoch": 465, "lr": 1.2133362913177177e-05} +{"train_loss": 0.001044774311594665, "global_step": 55341, "epoch": 465, "lr": 1.2131916157900847e-05} +{"train_loss": 0.0003201120998710394, "global_step": 55342, "epoch": 465, "lr": 1.213046947697446e-05} +{"train_loss": 0.0005290949484333396, "global_step": 55343, "epoch": 465, "lr": 1.2129022870400864e-05} +{"train_loss": 0.0008758270996622741, "global_step": 55344, "epoch": 465, "lr": 1.2127576338182866e-05} +{"train_loss": 0.0005642706528306007, "global_step": 55345, "epoch": 465, "lr": 1.2126129880323344e-05} +{"train_loss": 0.000788967648986727, "global_step": 55346, "epoch": 465, "lr": 1.2124683496825106e-05} +{"train_loss": 0.000538261083420366, "global_step": 55347, "epoch": 465, "lr": 1.2123237187691016e-05} +{"train_loss": 0.000424354278948158, "global_step": 55348, "epoch": 465, "lr": 1.2121790952923906e-05} +{"train_loss": 0.0005355298053473234, "global_step": 55349, "epoch": 465, "lr": 1.21203447925266e-05} +{"train_loss": 0.0008852921309880912, "global_step": 55350, "epoch": 465, "lr": 1.2118898706501963e-05} +{"train_loss": 0.00036874765646643937, "global_step": 55351, "epoch": 465, "lr": 1.211745269485281e-05} +{"train_loss": 0.0005831087473779917, "global_step": 55352, "epoch": 465, "lr": 1.2116006757582e-05} +{"train_loss": 0.0007574291084893048, "global_step": 55353, "epoch": 465, "lr": 1.211456089469235e-05} +{"train_loss": 0.0003858716518152505, "global_step": 55354, "epoch": 465, "lr": 1.2113115106186729e-05} +{"train_loss": 0.0003302678233012557, "global_step": 55355, "epoch": 465, "lr": 1.211166939206796e-05} +{"train_loss": 0.0012069190852344036, "global_step": 55356, "epoch": 465, "lr": 1.2110223752338868e-05} +{"train_loss": 0.0004238551773596555, "global_step": 55357, "epoch": 465, "lr": 1.2108778187002311e-05} +{"train_loss": 0.00038794855936430395, "global_step": 55358, "epoch": 465, "lr": 1.2107332696061108e-05} +{"train_loss": 0.0006542779738083482, "global_step": 55359, "epoch": 465, "lr": 1.2105887279518125e-05} +{"train_loss": 0.0006454097456298769, "global_step": 55360, "epoch": 465, "lr": 1.2104441937376181e-05} +{"train_loss": 0.0003882781893480569, "global_step": 55361, "epoch": 465, "lr": 1.2102996669638105e-05} +{"train_loss": 0.0003214710741303861, "global_step": 55362, "epoch": 465, "lr": 1.2101551476306766e-05} +{"train_loss": 0.0009052374516613781, "global_step": 55363, "epoch": 465, "lr": 1.210010635738496e-05} +{"train_loss": 0.0011864498956128955, "global_step": 55364, "epoch": 465, "lr": 1.2098661312875565e-05} +{"train_loss": 0.00035881431540474296, "global_step": 55365, "epoch": 465, "lr": 1.2097216342781381e-05} +{"train_loss": 0.0005928927566856146, "global_step": 55366, "epoch": 465, "lr": 1.2095771447105275e-05} +{"train_loss": 0.00039684181683696806, "global_step": 55367, "epoch": 465, "lr": 1.2094326625850078e-05} +{"train_loss": 0.00042355002369731665, "global_step": 55368, "epoch": 465, "lr": 1.2092881879018608e-05} +{"train_loss": 0.00040035921847447753, "global_step": 55369, "epoch": 465, "lr": 1.2091437206613727e-05} +{"train_loss": 0.0003133909194730222, "global_step": 55370, "epoch": 465, "lr": 1.2089992608638239e-05} +{"train_loss": 0.000297699763905257, "global_step": 55371, "epoch": 465, "lr": 1.2088548085095025e-05} +{"train_loss": 0.00047229189658537507, "global_step": 55372, "epoch": 465, "lr": 1.2087103635986873e-05} +{"train_loss": 0.00033584790071472526, "global_step": 55373, "epoch": 465, "lr": 1.2085659261316662e-05} +{"train_loss": 0.00043665445991791785, "global_step": 55374, "epoch": 465, "lr": 1.2084214961087193e-05} +{"train_loss": 0.000702905876096338, "global_step": 55375, "epoch": 465, "lr": 1.208277073530133e-05} +{"train_loss": 0.001462467829696834, "global_step": 55376, "epoch": 465, "lr": 1.2081326583961883e-05} +{"train_loss": 0.0005001778481528163, "global_step": 55377, "epoch": 465, "lr": 1.2079882507071705e-05} +{"train_loss": 0.0005016207578592002, "global_step": 55378, "epoch": 465, "lr": 1.2078438504633632e-05} +{"train_loss": 0.00033299686037935317, "global_step": 55379, "epoch": 465, "lr": 1.2076994576650501e-05} +{"train_loss": 0.0008155876421369612, "global_step": 55380, "epoch": 465, "lr": 1.2075550723125124e-05} +{"train_loss": 0.0004948670975863934, "global_step": 55381, "epoch": 465, "lr": 1.207410694406036e-05} +{"train_loss": 0.0007712481310591102, "global_step": 55382, "epoch": 465, "lr": 1.2072663239459026e-05} +{"train_loss": 0.00129587366245687, "global_step": 55383, "epoch": 465, "lr": 1.207121960932398e-05} +{"train_loss": 0.00205865316092968, "global_step": 55384, "epoch": 465, "lr": 1.2069776053658028e-05} +{"train_loss": 0.0005847906577400863, "global_step": 55385, "epoch": 465, "lr": 1.2068332572464031e-05} +{"train_loss": 0.00032448224374093115, "global_step": 55386, "epoch": 465, "lr": 1.206688916574481e-05} +{"train_loss": 0.00043703033588826656, "global_step": 55387, "epoch": 465, "lr": 1.2065445833503186e-05} +{"train_loss": 0.0007017473108135164, "global_step": 55388, "epoch": 465, "lr": 1.2064002575742023e-05} +{"train_loss": 0.001207986380904913, "global_step": 55389, "epoch": 465, "lr": 1.2062559392464124e-05} +{"train_loss": 0.000528056756593287, "global_step": 55390, "epoch": 465, "lr": 1.2061116283672346e-05} +{"train_loss": 0.0005377152701839805, "global_step": 55391, "epoch": 465, "lr": 1.2059673249369519e-05} +{"train_loss": 0.0005483782151713967, "global_step": 55392, "epoch": 465, "lr": 1.2058230289558448e-05} +{"train_loss": 0.0004947790876030922, "global_step": 55393, "epoch": 465, "lr": 1.2056787404242009e-05} +{"train_loss": 0.0006657993071712554, "global_step": 55394, "epoch": 465, "lr": 1.2055344593423002e-05} +{"train_loss": 0.0006622167420573533, "global_step": 55395, "epoch": 465, "lr": 1.2053901857104283e-05} +{"train_loss": 0.0007766162161715329, "global_step": 55396, "epoch": 465, "lr": 1.2052459195288657e-05} +{"train_loss": 0.0005015574279241264, "global_step": 55397, "epoch": 465, "lr": 1.2051016607978988e-05} +{"train_loss": 0.0004049773560836911, "global_step": 55398, "epoch": 465, "lr": 1.2049574095178095e-05} +{"train_loss": 0.00038835752638988197, "global_step": 55399, "epoch": 465, "lr": 1.20481316568888e-05} +{"train_loss": 0.0011073891073465347, "global_step": 55400, "epoch": 465, "lr": 1.204668929311395e-05} +{"train_loss": 0.00033907507895492017, "global_step": 55401, "epoch": 465, "lr": 1.2045247003856363e-05} +{"train_loss": 0.0006061376770958304, "global_step": 55402, "epoch": 465, "lr": 1.204380478911889e-05} +{"train_loss": 0.001228410517796874, "global_step": 55403, "epoch": 465, "lr": 1.2042362648904337e-05} +{"train_loss": 0.0006031037773936987, "global_step": 55404, "epoch": 465, "lr": 1.2040920583215564e-05} +{"train_loss": 0.0008762174402363598, "global_step": 55405, "epoch": 465, "lr": 1.203947859205537e-05} +{"train_loss": 0.0008371879812330008, "global_step": 55406, "epoch": 465, "lr": 1.2038036675426622e-05} +{"train_loss": 0.0009569721296429634, "global_step": 55407, "epoch": 465, "lr": 1.2036594833332121e-05} +{"train_loss": 0.000787793134804815, "global_step": 55408, "epoch": 465, "lr": 1.2035153065774723e-05} +{"train_loss": 0.0004794402339030057, "global_step": 55409, "epoch": 465, "lr": 1.2033711372757233e-05} +{"train_loss": 0.0009007591288536787, "global_step": 55410, "epoch": 465, "lr": 1.2032269754282504e-05} +{"train_loss": 0.0007097919587977231, "global_step": 55411, "epoch": 465, "lr": 1.2030828210353351e-05} +{"train_loss": 0.0006082020699977875, "global_step": 55412, "epoch": 465, "lr": 1.202938674097262e-05} +{"train_loss": 0.0005593563546426594, "global_step": 55413, "epoch": 465, "lr": 1.2027945346143116e-05} +{"train_loss": 0.00034467646037228405, "global_step": 55414, "epoch": 465, "lr": 1.2026504025867702e-05} +{"train_loss": 0.0003470006922725588, "global_step": 55415, "epoch": 465, "lr": 1.2025062780149171e-05} +{"train_loss": 0.0007569849258288741, "global_step": 55416, "epoch": 465, "lr": 1.2023621608990392e-05} +{"train_loss": 0.0009529133094474673, "global_step": 55417, "epoch": 465, "lr": 1.202218051239417e-05} +{"train_loss": 0.0009266561828553677, "global_step": 55418, "epoch": 465, "lr": 1.2020739490363331e-05} +{"train_loss": 0.0003581598575692624, "global_step": 55419, "epoch": 465, "lr": 1.2019298542900726e-05} +{"train_loss": 0.0005266305524855852, "global_step": 55420, "epoch": 465, "lr": 1.2017857670009153e-05} +{"train_loss": 0.0006053014076314867, "global_step": 55421, "epoch": 465, "lr": 1.2016416871691472e-05} +{"train_loss": 0.00044373556738719344, "global_step": 55422, "epoch": 465, "lr": 1.2014976147950485e-05} +{"train_loss": 0.000692597939632833, "global_step": 55423, "epoch": 465, "lr": 1.2013535498789053e-05} +{"train_loss": 0.00035935037885792553, "global_step": 55424, "epoch": 465, "lr": 1.2012094924209982e-05} +{"train_loss": 0.0007435203297063708, "global_step": 55425, "epoch": 465, "lr": 1.2010654424216088e-05} +{"train_loss": 0.0005793358432129025, "global_step": 55426, "epoch": 465, "lr": 1.2009213998810232e-05} +{"train_loss": 0.000755356450099498, "global_step": 55427, "epoch": 465, "lr": 1.2007773647995212e-05} +{"train_loss": 0.00042725709499791265, "global_step": 55428, "epoch": 465, "lr": 1.2006333371773881e-05} +{"train_loss": 0.0006617822800762951, "global_step": 55429, "epoch": 465, "lr": 1.2004893170149061e-05} +{"train_loss": 0.0008997971890494227, "global_step": 55430, "epoch": 465, "lr": 1.2003453043123553e-05} +{"train_loss": 0.0005749872652813792, "global_step": 55431, "epoch": 465, "lr": 1.2002012990700224e-05} +{"train_loss": 0.0008486027945764363, "global_step": 55432, "epoch": 465, "lr": 1.2000573012881871e-05} +{"train_loss": 0.0005834529874846339, "global_step": 55433, "epoch": 465, "lr": 1.1999133109671346e-05} +{"train_loss": 0.00043693510815501213, "global_step": 55434, "epoch": 465, "lr": 1.1997693281071442e-05} +{"train_loss": 0.000527873809915036, "global_step": 55435, "epoch": 465, "lr": 1.1996253527085027e-05} +{"train_loss": 0.0005453918129205704, "global_step": 55436, "epoch": 465, "lr": 1.1994813847714908e-05} +{"train_loss": 0.0008701332844793797, "global_step": 55437, "epoch": 465, "lr": 1.1993374242963901e-05} +{"train_loss": 0.000475425214972347, "global_step": 55438, "epoch": 465, "lr": 1.1991934712834857e-05} +{"train_loss": 0.0004880105552729219, "global_step": 55439, "epoch": 465, "lr": 1.1990495257330569e-05} +{"train_loss": 0.0006194797460921109, "global_step": 55440, "epoch": 465, "lr": 1.1989055876453887e-05} +{"train_loss": 0.0012045276816934347, "global_step": 55441, "epoch": 465, "lr": 1.1987616570207644e-05} +{"train_loss": 0.0008433227194473147, "global_step": 55442, "epoch": 465, "lr": 1.1986177338594645e-05} +{"train_loss": 0.0005054984940215945, "global_step": 55443, "epoch": 465, "lr": 1.1984738181617733e-05} +{"train_loss": 0.0007459759945049882, "global_step": 55444, "epoch": 465, "lr": 1.1983299099279715e-05} +{"train_loss": 0.000611792434938252, "global_step": 55445, "epoch": 465, "lr": 1.1981860091583447e-05} +{"train_loss": 0.00045548967318609357, "global_step": 55446, "epoch": 465, "lr": 1.1980421158531719e-05} +{"train_loss": 0.0010272283107042313, "global_step": 55447, "epoch": 465, "lr": 1.1978982300127384e-05} +{"train_loss": 0.0007134969928301871, "global_step": 55448, "epoch": 465, "lr": 1.1977543516373253e-05} +{"train_loss": 0.0011643574107438326, "global_step": 55449, "epoch": 465, "lr": 1.1976104807272143e-05} +{"train_loss": 0.0009677804773673415, "global_step": 55450, "epoch": 465, "lr": 1.1974666172826904e-05} +{"train_loss": 0.0003531394468154758, "global_step": 55451, "epoch": 465, "lr": 1.1973227613040327e-05} +{"train_loss": 0.0006680421647615731, "global_step": 55452, "epoch": 465, "lr": 1.1971789127915273e-05} +{"train_loss": 0.0006453666088617399, "global_step": 55453, "epoch": 465, "lr": 1.1970350717454531e-05, "val_loss": 0.04728960990905762, "train_action_mse_error": 8.701469596417155e-06} +{"train_loss": 0.0005199004663154483, "global_step": 55454, "epoch": 466, "lr": 1.1968912381660957e-05} +{"train_loss": 0.0009986483491957188, "global_step": 55455, "epoch": 466, "lr": 1.1967474120537365e-05} +{"train_loss": 0.0007264810265041888, "global_step": 55456, "epoch": 466, "lr": 1.1966035934086556e-05} +{"train_loss": 0.0006317552179098129, "global_step": 55457, "epoch": 466, "lr": 1.1964597822311385e-05} +{"train_loss": 0.0007617689552716911, "global_step": 55458, "epoch": 466, "lr": 1.196315978521465e-05} +{"train_loss": 0.0005712872371077538, "global_step": 55459, "epoch": 466, "lr": 1.1961721822799204e-05} +{"train_loss": 0.0006516611902043223, "global_step": 55460, "epoch": 466, "lr": 1.1960283935067851e-05} +{"train_loss": 0.00032453698804602027, "global_step": 55461, "epoch": 466, "lr": 1.1958846122023404e-05} +{"train_loss": 0.0006909970543347299, "global_step": 55462, "epoch": 466, "lr": 1.1957408383668712e-05} +{"train_loss": 0.0008201918099075556, "global_step": 55463, "epoch": 466, "lr": 1.195597072000657e-05} +{"train_loss": 0.0007271887152455747, "global_step": 55464, "epoch": 466, "lr": 1.195453313103983e-05} +{"train_loss": 0.00031691239564679563, "global_step": 55465, "epoch": 466, "lr": 1.1953095616771281e-05} +{"train_loss": 0.0004146347346249968, "global_step": 55466, "epoch": 466, "lr": 1.1951658177203783e-05} +{"train_loss": 0.000629484944511205, "global_step": 55467, "epoch": 466, "lr": 1.195022081234014e-05} +{"train_loss": 0.0006462195888161659, "global_step": 55468, "epoch": 466, "lr": 1.1948783522183154e-05} +{"train_loss": 0.000521570909768343, "global_step": 55469, "epoch": 466, "lr": 1.1947346306735685e-05} +{"train_loss": 0.0008023303817026317, "global_step": 55470, "epoch": 466, "lr": 1.1945909166000524e-05} +{"train_loss": 0.0004799176240339875, "global_step": 55471, "epoch": 466, "lr": 1.1944472099980514e-05} +{"train_loss": 0.0002879152016248554, "global_step": 55472, "epoch": 466, "lr": 1.1943035108678457e-05} +{"train_loss": 0.0005270866677165031, "global_step": 55473, "epoch": 466, "lr": 1.1941598192097198e-05} +{"train_loss": 0.0006263913819566369, "global_step": 55474, "epoch": 466, "lr": 1.1940161350239526e-05} +{"train_loss": 0.0007378619047813118, "global_step": 55475, "epoch": 466, "lr": 1.1938724583108284e-05} +{"train_loss": 0.00042091807699762285, "global_step": 55476, "epoch": 466, "lr": 1.1937287890706306e-05} +{"train_loss": 0.0013328386703506112, "global_step": 55477, "epoch": 466, "lr": 1.1935851273036386e-05} +{"train_loss": 0.0004096590855624527, "global_step": 55478, "epoch": 466, "lr": 1.1934414730101362e-05} +{"train_loss": 0.000702675140928477, "global_step": 55479, "epoch": 466, "lr": 1.1932978261904055e-05} +{"train_loss": 0.0006757654482498765, "global_step": 55480, "epoch": 466, "lr": 1.193154186844726e-05} +{"train_loss": 0.000430617161327973, "global_step": 55481, "epoch": 466, "lr": 1.1930105549733827e-05} +{"train_loss": 0.0005046401056461036, "global_step": 55482, "epoch": 466, "lr": 1.1928669305766554e-05} +{"train_loss": 0.0010629338212311268, "global_step": 55483, "epoch": 466, "lr": 1.1927233136548288e-05} +{"train_loss": 0.000891741132363677, "global_step": 55484, "epoch": 466, "lr": 1.1925797042081815e-05} +{"train_loss": 0.0009973193518817425, "global_step": 55485, "epoch": 466, "lr": 1.192436102236999e-05} +{"train_loss": 0.0007284415187314153, "global_step": 55486, "epoch": 466, "lr": 1.1922925077415609e-05} +{"train_loss": 0.000844550842884928, "global_step": 55487, "epoch": 466, "lr": 1.1921489207221482e-05} +{"train_loss": 0.0009098022128455341, "global_step": 55488, "epoch": 466, "lr": 1.192005341179046e-05} +{"train_loss": 0.0003794255608227104, "global_step": 55489, "epoch": 466, "lr": 1.1918617691125333e-05} +{"train_loss": 0.0005151383811607957, "global_step": 55490, "epoch": 466, "lr": 1.1917182045228941e-05} +{"train_loss": 0.0004745165933854878, "global_step": 55491, "epoch": 466, "lr": 1.1915746474104094e-05} +{"train_loss": 0.0005465353024192154, "global_step": 55492, "epoch": 466, "lr": 1.1914310977753602e-05} +{"train_loss": 0.00044602929847314954, "global_step": 55493, "epoch": 466, "lr": 1.1912875556180297e-05} +{"train_loss": 0.0007133635226637125, "global_step": 55494, "epoch": 466, "lr": 1.1911440209386982e-05} +{"train_loss": 0.00045530468923971057, "global_step": 55495, "epoch": 466, "lr": 1.1910004937376501e-05} +{"train_loss": 0.00038319124723784626, "global_step": 55496, "epoch": 466, "lr": 1.1908569740151643e-05} +{"train_loss": 0.0008180485456250608, "global_step": 55497, "epoch": 466, "lr": 1.190713461771525e-05} +{"train_loss": 0.0004713048692792654, "global_step": 55498, "epoch": 466, "lr": 1.1905699570070129e-05} +{"train_loss": 0.000717817572876811, "global_step": 55499, "epoch": 466, "lr": 1.1904264597219077e-05} +{"train_loss": 0.0014135640813037753, "global_step": 55500, "epoch": 466, "lr": 1.1902829699164952e-05} +{"train_loss": 0.0006254135514609516, "global_step": 55501, "epoch": 466, "lr": 1.1901394875910538e-05} +{"train_loss": 0.0007982169045135379, "global_step": 55502, "epoch": 466, "lr": 1.1899960127458675e-05} +{"train_loss": 0.00039622464100830257, "global_step": 55503, "epoch": 466, "lr": 1.189852545381216e-05} +{"train_loss": 0.00048611368401907384, "global_step": 55504, "epoch": 466, "lr": 1.189709085497383e-05} +{"train_loss": 0.0005005000857636333, "global_step": 55505, "epoch": 466, "lr": 1.189565633094648e-05} +{"train_loss": 0.0006157137686386704, "global_step": 55506, "epoch": 466, "lr": 1.1894221881732947e-05} +{"train_loss": 0.0003990247205365449, "global_step": 55507, "epoch": 466, "lr": 1.1892787507336029e-05} +{"train_loss": 0.0011223102919757366, "global_step": 55508, "epoch": 466, "lr": 1.1891353207758565e-05} +{"train_loss": 0.00043331694905646145, "global_step": 55509, "epoch": 466, "lr": 1.1889918983003345e-05} +{"train_loss": 0.0005239085876382887, "global_step": 55510, "epoch": 466, "lr": 1.188848483307321e-05} +{"train_loss": 0.0005346282850950956, "global_step": 55511, "epoch": 466, "lr": 1.1887050757970946e-05} +{"train_loss": 0.0012567363446578383, "global_step": 55512, "epoch": 466, "lr": 1.1885616757699409e-05} +{"train_loss": 0.00037680257810279727, "global_step": 55513, "epoch": 466, "lr": 1.188418283226137e-05} +{"train_loss": 0.00048593204701319337, "global_step": 55514, "epoch": 466, "lr": 1.188274898165968e-05} +{"train_loss": 0.0003456652339082211, "global_step": 55515, "epoch": 466, "lr": 1.1881315205897132e-05} +{"train_loss": 0.0005541244754567742, "global_step": 55516, "epoch": 466, "lr": 1.1879881504976558e-05} +{"train_loss": 0.00044556555803865194, "global_step": 55517, "epoch": 466, "lr": 1.1878447878900768e-05} +{"train_loss": 0.0005331677384674549, "global_step": 55518, "epoch": 466, "lr": 1.1877014327672553e-05} +{"train_loss": 0.0007108661811798811, "global_step": 55519, "epoch": 466, "lr": 1.1875580851294765e-05} +{"train_loss": 0.00036817521322518587, "global_step": 55520, "epoch": 466, "lr": 1.1874147449770184e-05} +{"train_loss": 0.00031726888846606016, "global_step": 55521, "epoch": 466, "lr": 1.1872714123101664e-05} +{"train_loss": 0.0008213215623982251, "global_step": 55522, "epoch": 466, "lr": 1.1871280871291974e-05} +{"train_loss": 0.00035318286973051727, "global_step": 55523, "epoch": 466, "lr": 1.1869847694343966e-05} +{"train_loss": 0.0008037422085180879, "global_step": 55524, "epoch": 466, "lr": 1.186841459226044e-05} +{"train_loss": 0.0004233205982018262, "global_step": 55525, "epoch": 466, "lr": 1.1866981565044195e-05} +{"train_loss": 0.0003176909522153437, "global_step": 55526, "epoch": 466, "lr": 1.1865548612698069e-05} +{"train_loss": 0.0003659907670225948, "global_step": 55527, "epoch": 466, "lr": 1.186411573522485e-05} +{"train_loss": 0.0005058844108134508, "global_step": 55528, "epoch": 466, "lr": 1.1862682932627383e-05} +{"train_loss": 0.0004766868078149855, "global_step": 55529, "epoch": 466, "lr": 1.1861250204908464e-05} +{"train_loss": 0.0005302262143231928, "global_step": 55530, "epoch": 466, "lr": 1.185981755207089e-05} +{"train_loss": 0.0007402024930343032, "global_step": 55531, "epoch": 466, "lr": 1.1858384974117503e-05} +{"train_loss": 0.0010069099953398108, "global_step": 55532, "epoch": 466, "lr": 1.185695247105109e-05} +{"train_loss": 0.0005996107938699424, "global_step": 55533, "epoch": 466, "lr": 1.1855520042874485e-05} +{"train_loss": 0.0007811798132024705, "global_step": 55534, "epoch": 466, "lr": 1.1854087689590481e-05} +{"train_loss": 0.0005171613302081823, "global_step": 55535, "epoch": 466, "lr": 1.1852655411201918e-05} +{"train_loss": 0.0004254644736647606, "global_step": 55536, "epoch": 466, "lr": 1.1851223207711587e-05} +{"train_loss": 0.00024550739908590913, "global_step": 55537, "epoch": 466, "lr": 1.1849791079122291e-05} +{"train_loss": 0.000636009790468961, "global_step": 55538, "epoch": 466, "lr": 1.1848359025436851e-05} +{"train_loss": 0.0005066092126071453, "global_step": 55539, "epoch": 466, "lr": 1.1846927046658096e-05} +{"train_loss": 0.00044532748870551586, "global_step": 55540, "epoch": 466, "lr": 1.1845495142788815e-05} +{"train_loss": 0.0005408627912402153, "global_step": 55541, "epoch": 466, "lr": 1.1844063313831837e-05} +{"train_loss": 0.0007985056145116687, "global_step": 55542, "epoch": 466, "lr": 1.1842631559789952e-05} +{"train_loss": 0.0006354371435008943, "global_step": 55543, "epoch": 466, "lr": 1.1841199880665998e-05} +{"train_loss": 0.0006054245168343186, "global_step": 55544, "epoch": 466, "lr": 1.1839768276462759e-05} +{"train_loss": 0.00036796816857531667, "global_step": 55545, "epoch": 466, "lr": 1.183833674718307e-05} +{"train_loss": 0.0005350431310944259, "global_step": 55546, "epoch": 466, "lr": 1.1836905292829714e-05} +{"train_loss": 0.0009641815559007227, "global_step": 55547, "epoch": 466, "lr": 1.1835473913405537e-05} +{"train_loss": 0.0009123529307544231, "global_step": 55548, "epoch": 466, "lr": 1.1834042608913326e-05} +{"train_loss": 0.00086883275071159, "global_step": 55549, "epoch": 466, "lr": 1.1832611379355878e-05} +{"train_loss": 0.0003217036428395659, "global_step": 55550, "epoch": 466, "lr": 1.1831180224736038e-05} +{"train_loss": 0.00042090879287570715, "global_step": 55551, "epoch": 466, "lr": 1.1829749145056585e-05} +{"train_loss": 0.0005208791117183864, "global_step": 55552, "epoch": 466, "lr": 1.182831814032035e-05} +{"train_loss": 0.000763595278840512, "global_step": 55553, "epoch": 466, "lr": 1.1826887210530125e-05} +{"train_loss": 0.0007072360021993518, "global_step": 55554, "epoch": 466, "lr": 1.1825456355688742e-05} +{"train_loss": 0.0003915185807272792, "global_step": 55555, "epoch": 466, "lr": 1.1824025575798997e-05} +{"train_loss": 0.0004278320702724159, "global_step": 55556, "epoch": 466, "lr": 1.1822594870863685e-05} +{"train_loss": 0.00046225442201830447, "global_step": 55557, "epoch": 466, "lr": 1.1821164240885641e-05} +{"train_loss": 0.0007792190299369395, "global_step": 55558, "epoch": 466, "lr": 1.1819733685867651e-05} +{"train_loss": 0.0002963926235679537, "global_step": 55559, "epoch": 466, "lr": 1.1818303205812548e-05} +{"train_loss": 0.0006963826017454267, "global_step": 55560, "epoch": 466, "lr": 1.1816872800723127e-05} +{"train_loss": 0.0007135138148441911, "global_step": 55561, "epoch": 466, "lr": 1.181544247060219e-05} +{"train_loss": 0.0011481385445222259, "global_step": 55562, "epoch": 466, "lr": 1.1814012215452558e-05} +{"train_loss": 0.0007109740399755538, "global_step": 55563, "epoch": 466, "lr": 1.181258203527702e-05} +{"train_loss": 0.0006967256194911897, "global_step": 55564, "epoch": 466, "lr": 1.1811151930078413e-05} +{"train_loss": 0.000503474147990346, "global_step": 55565, "epoch": 466, "lr": 1.1809721899859516e-05} +{"train_loss": 0.000619534810539335, "global_step": 55566, "epoch": 466, "lr": 1.1808291944623163e-05} +{"train_loss": 0.000258926535025239, "global_step": 55567, "epoch": 466, "lr": 1.1806862064372149e-05} +{"train_loss": 0.0009681422961875796, "global_step": 55568, "epoch": 466, "lr": 1.1805432259109267e-05} +{"train_loss": 0.0013943483354523778, "global_step": 55569, "epoch": 466, "lr": 1.1804002528837355e-05} +{"train_loss": 0.0004896405152976513, "global_step": 55570, "epoch": 466, "lr": 1.1802572873559186e-05} +{"train_loss": 0.0004706206964328885, "global_step": 55571, "epoch": 466, "lr": 1.18011432932776e-05} +{"train_loss": 0.0006173119467914011, "global_step": 55572, "epoch": 466, "lr": 1.179971378799537e-05, "val_loss": 0.012434217147529125} +{"train_loss": 0.0003710396704263985, "global_step": 55573, "epoch": 467, "lr": 1.1798284357715329e-05} +{"train_loss": 0.0006710300804115832, "global_step": 55574, "epoch": 467, "lr": 1.1796855002440282e-05} +{"train_loss": 0.0005432770703919232, "global_step": 55575, "epoch": 467, "lr": 1.1795425722173015e-05} +{"train_loss": 0.000779596739448607, "global_step": 55576, "epoch": 467, "lr": 1.1793996516916367e-05} +{"train_loss": 0.0006334198405966163, "global_step": 55577, "epoch": 467, "lr": 1.179256738667311e-05} +{"train_loss": 0.001057676738128066, "global_step": 55578, "epoch": 467, "lr": 1.1791138331446078e-05} +{"train_loss": 0.0002418646472506225, "global_step": 55579, "epoch": 467, "lr": 1.1789709351238059e-05} +{"train_loss": 0.00042430427856743336, "global_step": 55580, "epoch": 467, "lr": 1.1788280446051859e-05} +{"train_loss": 0.00043232442112639546, "global_step": 55581, "epoch": 467, "lr": 1.1786851615890294e-05} +{"train_loss": 0.00041508872527629137, "global_step": 55582, "epoch": 467, "lr": 1.178542286075615e-05} +{"train_loss": 0.00036751042352989316, "global_step": 55583, "epoch": 467, "lr": 1.1783994180652264e-05} +{"train_loss": 0.0008220912422984838, "global_step": 55584, "epoch": 467, "lr": 1.1782565575581406e-05} +{"train_loss": 0.0005144541501067579, "global_step": 55585, "epoch": 467, "lr": 1.1781137045546414e-05} +{"train_loss": 0.0008070120820775628, "global_step": 55586, "epoch": 467, "lr": 1.1779708590550075e-05} +{"train_loss": 0.0004769936786033213, "global_step": 55587, "epoch": 467, "lr": 1.1778280210595183e-05} +{"train_loss": 0.00038510773447342217, "global_step": 55588, "epoch": 467, "lr": 1.1776851905684561e-05} +{"train_loss": 0.0005859829834662378, "global_step": 55589, "epoch": 467, "lr": 1.1775423675821e-05} +{"train_loss": 0.0006199749186635017, "global_step": 55590, "epoch": 467, "lr": 1.1773995521007326e-05} +{"train_loss": 0.000318010279443115, "global_step": 55591, "epoch": 467, "lr": 1.1772567441246308e-05} +{"train_loss": 0.0009963042102754116, "global_step": 55592, "epoch": 467, "lr": 1.1771139436540784e-05} +{"train_loss": 0.0003718645602930337, "global_step": 55593, "epoch": 467, "lr": 1.1769711506893549e-05} +{"train_loss": 0.0007941583753563464, "global_step": 55594, "epoch": 467, "lr": 1.1768283652307383e-05} +{"train_loss": 0.0004455512680578977, "global_step": 55595, "epoch": 467, "lr": 1.1766855872785122e-05} +{"train_loss": 0.0005620047450065613, "global_step": 55596, "epoch": 467, "lr": 1.176542816832954e-05} +{"train_loss": 0.00032745019416324794, "global_step": 55597, "epoch": 467, "lr": 1.176400053894347e-05} +{"train_loss": 0.0012464436003938317, "global_step": 55598, "epoch": 467, "lr": 1.1762572984629706e-05} +{"train_loss": 0.0006001900183036923, "global_step": 55599, "epoch": 467, "lr": 1.1761145505391025e-05} +{"train_loss": 0.0002758502378128469, "global_step": 55600, "epoch": 467, "lr": 1.175971810123026e-05} +{"train_loss": 0.0007214791257865727, "global_step": 55601, "epoch": 467, "lr": 1.1758290772150193e-05} +{"train_loss": 0.0005154585815034807, "global_step": 55602, "epoch": 467, "lr": 1.1756863518153655e-05} +{"train_loss": 0.0004423288628458977, "global_step": 55603, "epoch": 467, "lr": 1.1755436339243408e-05} +{"train_loss": 0.0004280101275071502, "global_step": 55604, "epoch": 467, "lr": 1.1754009235422292e-05} +{"train_loss": 0.0002481465635355562, "global_step": 55605, "epoch": 467, "lr": 1.175258220669308e-05} +{"train_loss": 0.00017691389075480402, "global_step": 55606, "epoch": 467, "lr": 1.1751155253058605e-05} +{"train_loss": 0.0004915180034004152, "global_step": 55607, "epoch": 467, "lr": 1.1749728374521628e-05} +{"train_loss": 0.0010362450266256928, "global_step": 55608, "epoch": 467, "lr": 1.174830157108498e-05} +{"train_loss": 0.00037168528069742024, "global_step": 55609, "epoch": 467, "lr": 1.1746874842751465e-05} +{"train_loss": 0.0004371749528218061, "global_step": 55610, "epoch": 467, "lr": 1.1745448189523867e-05} +{"train_loss": 0.00047048815758898854, "global_step": 55611, "epoch": 467, "lr": 1.1744021611404999e-05} +{"train_loss": 0.0003864330647047609, "global_step": 55612, "epoch": 467, "lr": 1.1742595108397664e-05} +{"train_loss": 0.00043397166882641613, "global_step": 55613, "epoch": 467, "lr": 1.1741168680504638e-05} +{"train_loss": 0.000362832477549091, "global_step": 55614, "epoch": 467, "lr": 1.1739742327728759e-05} +{"train_loss": 0.0005530150956474245, "global_step": 55615, "epoch": 467, "lr": 1.173831605007279e-05} +{"train_loss": 0.0003297443618066609, "global_step": 55616, "epoch": 467, "lr": 1.1736889847539567e-05} +{"train_loss": 0.0004336109268479049, "global_step": 55617, "epoch": 467, "lr": 1.1735463720131872e-05} +{"train_loss": 0.0005273799179121852, "global_step": 55618, "epoch": 467, "lr": 1.1734037667852493e-05} +{"train_loss": 0.0005392925231717527, "global_step": 55619, "epoch": 467, "lr": 1.1732611690704254e-05} +{"train_loss": 0.00046447658678516746, "global_step": 55620, "epoch": 467, "lr": 1.173118578868993e-05} +{"train_loss": 0.0003605936944950372, "global_step": 55621, "epoch": 467, "lr": 1.1729759961812353e-05} +{"train_loss": 0.0004660885315388441, "global_step": 55622, "epoch": 467, "lr": 1.1728334210074282e-05} +{"train_loss": 0.0007297027623280883, "global_step": 55623, "epoch": 467, "lr": 1.1726908533478558e-05} +{"train_loss": 0.0006640105857513845, "global_step": 55624, "epoch": 467, "lr": 1.1725482932027959e-05} +{"train_loss": 0.00030888625769875944, "global_step": 55625, "epoch": 467, "lr": 1.1724057405725269e-05} +{"train_loss": 0.0003431388468015939, "global_step": 55626, "epoch": 467, "lr": 1.1722631954573321e-05} +{"train_loss": 0.0008340857457369566, "global_step": 55627, "epoch": 467, "lr": 1.1721206578574877e-05} +{"train_loss": 0.0007303786114789546, "global_step": 55628, "epoch": 467, "lr": 1.1719781277732771e-05} +{"train_loss": 0.000448758655693382, "global_step": 55629, "epoch": 467, "lr": 1.171835605204979e-05} +{"train_loss": 0.0007464622613042593, "global_step": 55630, "epoch": 467, "lr": 1.1716930901528706e-05} +{"train_loss": 0.0006418746779672801, "global_step": 55631, "epoch": 467, "lr": 1.1715505826172357e-05} +{"train_loss": 0.0008032133337110281, "global_step": 55632, "epoch": 467, "lr": 1.1714080825983503e-05} +{"train_loss": 0.00035837001632899046, "global_step": 55633, "epoch": 467, "lr": 1.1712655900964976e-05} +{"train_loss": 0.0005373748717829585, "global_step": 55634, "epoch": 467, "lr": 1.1711231051119548e-05} +{"train_loss": 0.000556584564037621, "global_step": 55635, "epoch": 467, "lr": 1.1709806276450042e-05} +{"train_loss": 0.0010639118263497949, "global_step": 55636, "epoch": 467, "lr": 1.170838157695922e-05} +{"train_loss": 0.00042120422585867345, "global_step": 55637, "epoch": 467, "lr": 1.1706956952649922e-05} +{"train_loss": 0.0007188374293036759, "global_step": 55638, "epoch": 467, "lr": 1.1705532403524905e-05} +{"train_loss": 0.0007049816194921732, "global_step": 55639, "epoch": 467, "lr": 1.1704107929586994e-05} +{"train_loss": 0.00035750248935073614, "global_step": 55640, "epoch": 467, "lr": 1.1702683530838971e-05} +{"train_loss": 0.0005496413796208799, "global_step": 55641, "epoch": 467, "lr": 1.1701259207283643e-05} +{"train_loss": 0.000529723591171205, "global_step": 55642, "epoch": 467, "lr": 1.169983495892379e-05} +{"train_loss": 0.0006755393696948886, "global_step": 55643, "epoch": 467, "lr": 1.1698410785762232e-05} +{"train_loss": 0.00024895317619666457, "global_step": 55644, "epoch": 467, "lr": 1.1696986687801743e-05} +{"train_loss": 0.00042143400060012937, "global_step": 55645, "epoch": 467, "lr": 1.169556266504514e-05} +{"train_loss": 0.0003301430551800877, "global_step": 55646, "epoch": 467, "lr": 1.169413871749519e-05} +{"train_loss": 0.00045540998689830303, "global_step": 55647, "epoch": 467, "lr": 1.1692714845154724e-05} +{"train_loss": 0.0004551281745079905, "global_step": 55648, "epoch": 467, "lr": 1.169129104802652e-05} +{"train_loss": 0.0007615044596605003, "global_step": 55649, "epoch": 467, "lr": 1.1689867326113358e-05} +{"train_loss": 0.0003352672210894525, "global_step": 55650, "epoch": 467, "lr": 1.1688443679418065e-05} +{"train_loss": 0.0004562308022286743, "global_step": 55651, "epoch": 467, "lr": 1.1687020107943404e-05} +{"train_loss": 0.00044256928958930075, "global_step": 55652, "epoch": 467, "lr": 1.1685596611692201e-05} +{"train_loss": 0.0004012048593722284, "global_step": 55653, "epoch": 467, "lr": 1.168417319066722e-05} +{"train_loss": 0.0004883570363745093, "global_step": 55654, "epoch": 467, "lr": 1.1682749844871282e-05} +{"train_loss": 0.0006063366308808327, "global_step": 55655, "epoch": 467, "lr": 1.1681326574307177e-05} +{"train_loss": 0.0005263143684715033, "global_step": 55656, "epoch": 467, "lr": 1.167990337897768e-05} +{"train_loss": 0.0009055084665305912, "global_step": 55657, "epoch": 467, "lr": 1.167848025888561e-05} +{"train_loss": 0.00025560084031894803, "global_step": 55658, "epoch": 467, "lr": 1.1677057214033738e-05} +{"train_loss": 0.00043733659549616277, "global_step": 55659, "epoch": 467, "lr": 1.1675634244424883e-05} +{"train_loss": 0.00028951867716386914, "global_step": 55660, "epoch": 467, "lr": 1.167421135006181e-05} +{"train_loss": 0.0004881563363596797, "global_step": 55661, "epoch": 467, "lr": 1.1672788530947343e-05} +{"train_loss": 0.0005167051567696035, "global_step": 55662, "epoch": 467, "lr": 1.1671365787084259e-05} +{"train_loss": 0.00072333007119596, "global_step": 55663, "epoch": 467, "lr": 1.1669943118475346e-05} +{"train_loss": 0.0004977092030458152, "global_step": 55664, "epoch": 467, "lr": 1.1668520525123417e-05} +{"train_loss": 0.00044630205957219005, "global_step": 55665, "epoch": 467, "lr": 1.1667098007031236e-05} +{"train_loss": 0.0005767059046775103, "global_step": 55666, "epoch": 467, "lr": 1.1665675564201628e-05} +{"train_loss": 0.0007985076517798007, "global_step": 55667, "epoch": 467, "lr": 1.166425319663737e-05} +{"train_loss": 0.0003603236109483987, "global_step": 55668, "epoch": 467, "lr": 1.1662830904341238e-05} +{"train_loss": 0.0006318496307358146, "global_step": 55669, "epoch": 467, "lr": 1.166140868731605e-05} +{"train_loss": 0.0009318264201283455, "global_step": 55670, "epoch": 467, "lr": 1.1659986545564599e-05} +{"train_loss": 0.0002972920483443886, "global_step": 55671, "epoch": 467, "lr": 1.165856447908965e-05} +{"train_loss": 0.0004988976870663464, "global_step": 55672, "epoch": 467, "lr": 1.1657142487894034e-05} +{"train_loss": 0.0004045398673042655, "global_step": 55673, "epoch": 467, "lr": 1.1655720571980511e-05} +{"train_loss": 0.0004940045764669776, "global_step": 55674, "epoch": 467, "lr": 1.1654298731351893e-05} +{"train_loss": 0.00039891726919449866, "global_step": 55675, "epoch": 467, "lr": 1.165287696601095e-05} +{"train_loss": 0.00055606325622648, "global_step": 55676, "epoch": 467, "lr": 1.1651455275960499e-05} +{"train_loss": 0.0009450963698327541, "global_step": 55677, "epoch": 467, "lr": 1.1650033661203303e-05} +{"train_loss": 0.00031877803849056363, "global_step": 55678, "epoch": 467, "lr": 1.1648612121742185e-05} +{"train_loss": 0.0006067563081160188, "global_step": 55679, "epoch": 467, "lr": 1.164719065757992e-05} +{"train_loss": 0.00027884438168257475, "global_step": 55680, "epoch": 467, "lr": 1.1645769268719286e-05} +{"train_loss": 0.0005675964057445526, "global_step": 55681, "epoch": 467, "lr": 1.1644347955163105e-05} +{"train_loss": 0.0005654619890265167, "global_step": 55682, "epoch": 467, "lr": 1.1642926716914127e-05} +{"train_loss": 0.0002891837211791426, "global_step": 55683, "epoch": 467, "lr": 1.164150555397518e-05} +{"train_loss": 0.0004732568340841681, "global_step": 55684, "epoch": 467, "lr": 1.1640084466349027e-05} +{"train_loss": 0.0007022489444352686, "global_step": 55685, "epoch": 467, "lr": 1.1638663454038484e-05} +{"train_loss": 0.0006585527444258332, "global_step": 55686, "epoch": 467, "lr": 1.1637242517046327e-05} +{"train_loss": 0.0005455926875583827, "global_step": 55687, "epoch": 467, "lr": 1.1635821655375328e-05} +{"train_loss": 0.0005025847349315882, "global_step": 55688, "epoch": 467, "lr": 1.163440086902831e-05} +{"train_loss": 0.0007997037027962506, "global_step": 55689, "epoch": 467, "lr": 1.1632980158008039e-05} +{"train_loss": 0.0007058818009682, "global_step": 55690, "epoch": 467, "lr": 1.163155952231732e-05} +{"train_loss": 0.0005387592483057539, "global_step": 55691, "epoch": 467, "lr": 1.1630138961958924e-05, "val_loss": 0.031776197254657745} +{"train_loss": 0.0004226278106216341, "global_step": 55692, "epoch": 468, "lr": 1.1628718476935662e-05} +{"train_loss": 0.000250433076871559, "global_step": 55693, "epoch": 468, "lr": 1.1627298067250314e-05} +{"train_loss": 0.00030384131241589785, "global_step": 55694, "epoch": 468, "lr": 1.1625877732905654e-05} +{"train_loss": 0.000433935783803463, "global_step": 55695, "epoch": 468, "lr": 1.16244574739045e-05} +{"train_loss": 0.0009046174818649888, "global_step": 55696, "epoch": 468, "lr": 1.16230372902496e-05} +{"train_loss": 0.0004171424370724708, "global_step": 55697, "epoch": 468, "lr": 1.1621617181943789e-05} +{"train_loss": 0.00048041652189567685, "global_step": 55698, "epoch": 468, "lr": 1.162019714898983e-05} +{"train_loss": 0.0003120526671409607, "global_step": 55699, "epoch": 468, "lr": 1.1618777191390501e-05} +{"train_loss": 0.000517804641276598, "global_step": 55700, "epoch": 468, "lr": 1.1617357309148614e-05} +{"train_loss": 0.000509349221829325, "global_step": 55701, "epoch": 468, "lr": 1.1615937502266932e-05} +{"train_loss": 0.0007029002881608903, "global_step": 55702, "epoch": 468, "lr": 1.1614517770748267e-05} +{"train_loss": 0.0005897096707485616, "global_step": 55703, "epoch": 468, "lr": 1.161309811459539e-05} +{"train_loss": 0.0003554682189133018, "global_step": 55704, "epoch": 468, "lr": 1.1611678533811088e-05} +{"train_loss": 0.0005042945267632604, "global_step": 55705, "epoch": 468, "lr": 1.1610259028398168e-05} +{"train_loss": 0.0009498398285359144, "global_step": 55706, "epoch": 468, "lr": 1.160883959835939e-05} +{"train_loss": 0.0005637688445858657, "global_step": 55707, "epoch": 468, "lr": 1.1607420243697564e-05} +{"train_loss": 0.0012999020982533693, "global_step": 55708, "epoch": 468, "lr": 1.160600096441546e-05} +{"train_loss": 0.0008464050479233265, "global_step": 55709, "epoch": 468, "lr": 1.1604581760515881e-05} +{"train_loss": 0.0009870033245533705, "global_step": 55710, "epoch": 468, "lr": 1.160316263200159e-05} +{"train_loss": 0.0002800535876303911, "global_step": 55711, "epoch": 468, "lr": 1.1601743578875401e-05} +{"train_loss": 0.00037703730049543083, "global_step": 55712, "epoch": 468, "lr": 1.1600324601140083e-05} +{"train_loss": 0.0008215041598305106, "global_step": 55713, "epoch": 468, "lr": 1.1598905698798418e-05} +{"train_loss": 0.0006076435674913228, "global_step": 55714, "epoch": 468, "lr": 1.1597486871853209e-05} +{"train_loss": 0.0005407478893175721, "global_step": 55715, "epoch": 468, "lr": 1.1596068120307218e-05} +{"train_loss": 0.0008060216787271202, "global_step": 55716, "epoch": 468, "lr": 1.1594649444163257e-05} +{"train_loss": 0.0006401711143553257, "global_step": 55717, "epoch": 468, "lr": 1.1593230843424107e-05} +{"train_loss": 0.0003370494523551315, "global_step": 55718, "epoch": 468, "lr": 1.1591812318092521e-05} +{"train_loss": 0.0004666729364544153, "global_step": 55719, "epoch": 468, "lr": 1.1590393868171328e-05} +{"train_loss": 0.001025659847073257, "global_step": 55720, "epoch": 468, "lr": 1.1588975493663279e-05} +{"train_loss": 0.0006686464766971767, "global_step": 55721, "epoch": 468, "lr": 1.1587557194571186e-05} +{"train_loss": 0.0014339827466756105, "global_step": 55722, "epoch": 468, "lr": 1.1586138970897804e-05} +{"train_loss": 0.001434151898138225, "global_step": 55723, "epoch": 468, "lr": 1.158472082264595e-05} +{"train_loss": 0.0003919605223927647, "global_step": 55724, "epoch": 468, "lr": 1.1583302749818392e-05} +{"train_loss": 0.0006416715914383531, "global_step": 55725, "epoch": 468, "lr": 1.1581884752417905e-05} +{"train_loss": 0.0005995055544190109, "global_step": 55726, "epoch": 468, "lr": 1.1580466830447296e-05} +{"train_loss": 0.0003357231034897268, "global_step": 55727, "epoch": 468, "lr": 1.1579048983909318e-05} +{"train_loss": 0.0004807936493307352, "global_step": 55728, "epoch": 468, "lr": 1.1577631212806788e-05} +{"train_loss": 0.0005610089865513146, "global_step": 55729, "epoch": 468, "lr": 1.1576213517142459e-05} +{"train_loss": 0.0004843217320740223, "global_step": 55730, "epoch": 468, "lr": 1.1574795896919143e-05} +{"train_loss": 0.0004335849662311375, "global_step": 55731, "epoch": 468, "lr": 1.1573378352139612e-05} +{"train_loss": 0.0004906815593130887, "global_step": 55732, "epoch": 468, "lr": 1.1571960882806638e-05} +{"train_loss": 0.0008189525105990469, "global_step": 55733, "epoch": 468, "lr": 1.1570543488923024e-05} +{"train_loss": 0.0007345475605688989, "global_step": 55734, "epoch": 468, "lr": 1.1569126170491524e-05} +{"train_loss": 0.0003994835424236953, "global_step": 55735, "epoch": 468, "lr": 1.1567708927514958e-05} +{"train_loss": 0.0005976481479592621, "global_step": 55736, "epoch": 468, "lr": 1.1566291759996073e-05} +{"train_loss": 0.0005731245037168264, "global_step": 55737, "epoch": 468, "lr": 1.1564874667937686e-05} +{"train_loss": 0.0006690858281217515, "global_step": 55738, "epoch": 468, "lr": 1.156345765134254e-05} +{"train_loss": 0.0004352513060439378, "global_step": 55739, "epoch": 468, "lr": 1.1562040710213462e-05} +{"train_loss": 0.0005220952443778515, "global_step": 55740, "epoch": 468, "lr": 1.1560623844553193e-05} +{"train_loss": 0.0004469678387977183, "global_step": 55741, "epoch": 468, "lr": 1.155920705436453e-05} +{"train_loss": 0.0004065499815624207, "global_step": 55742, "epoch": 468, "lr": 1.155779033965027e-05} +{"train_loss": 0.00034230778692290187, "global_step": 55743, "epoch": 468, "lr": 1.1556373700413187e-05} +{"train_loss": 0.0006962406914681196, "global_step": 55744, "epoch": 468, "lr": 1.1554957136656036e-05} +{"train_loss": 0.0008539679110981524, "global_step": 55745, "epoch": 468, "lr": 1.1553540648381639e-05} +{"train_loss": 0.0010924394009634852, "global_step": 55746, "epoch": 468, "lr": 1.1552124235592742e-05} +{"train_loss": 0.000621497631072998, "global_step": 55747, "epoch": 468, "lr": 1.1550707898292158e-05} +{"train_loss": 0.0007823493797332048, "global_step": 55748, "epoch": 468, "lr": 1.1549291636482646e-05} +{"train_loss": 0.0005741714267060161, "global_step": 55749, "epoch": 468, "lr": 1.1547875450166985e-05} +{"train_loss": 0.0006609433912672102, "global_step": 55750, "epoch": 468, "lr": 1.154645933934797e-05} +{"train_loss": 0.0004794331325683743, "global_step": 55751, "epoch": 468, "lr": 1.1545043304028363e-05} +{"train_loss": 0.0005958499386906624, "global_step": 55752, "epoch": 468, "lr": 1.1543627344210967e-05} +{"train_loss": 0.0009986150544136763, "global_step": 55753, "epoch": 468, "lr": 1.1542211459898539e-05} +{"train_loss": 0.0004635156656149775, "global_step": 55754, "epoch": 468, "lr": 1.1540795651093884e-05} +{"train_loss": 0.0005797219928354025, "global_step": 55755, "epoch": 468, "lr": 1.1539379917799764e-05} +{"train_loss": 0.00047193196951411664, "global_step": 55756, "epoch": 468, "lr": 1.1537964260018952e-05} +{"train_loss": 0.0005617848364636302, "global_step": 55757, "epoch": 468, "lr": 1.1536548677754255e-05} +{"train_loss": 0.000853542354889214, "global_step": 55758, "epoch": 468, "lr": 1.1535133171008416e-05} +{"train_loss": 0.0011096865637227893, "global_step": 55759, "epoch": 468, "lr": 1.153371773978425e-05} +{"train_loss": 0.0006565932417288423, "global_step": 55760, "epoch": 468, "lr": 1.1532302384084508e-05} +{"train_loss": 0.00039160874439403415, "global_step": 55761, "epoch": 468, "lr": 1.1530887103911992e-05} +{"train_loss": 0.0009569914545863867, "global_step": 55762, "epoch": 468, "lr": 1.1529471899269467e-05} +{"train_loss": 0.0006586253875866532, "global_step": 55763, "epoch": 468, "lr": 1.1528056770159707e-05} +{"train_loss": 0.0004777390859089792, "global_step": 55764, "epoch": 468, "lr": 1.1526641716585507e-05} +{"train_loss": 0.0007725846371613443, "global_step": 55765, "epoch": 468, "lr": 1.1525226738549621e-05} +{"train_loss": 0.00047291492228396237, "global_step": 55766, "epoch": 468, "lr": 1.1523811836054855e-05} +{"train_loss": 0.0004525397380348295, "global_step": 55767, "epoch": 468, "lr": 1.1522397009103963e-05} +{"train_loss": 0.000487999408505857, "global_step": 55768, "epoch": 468, "lr": 1.1520982257699741e-05} +{"train_loss": 0.0007078257040120661, "global_step": 55769, "epoch": 468, "lr": 1.1519567581844953e-05} +{"train_loss": 0.0009437148692086339, "global_step": 55770, "epoch": 468, "lr": 1.1518152981542396e-05} +{"train_loss": 0.0004062577208969742, "global_step": 55771, "epoch": 468, "lr": 1.1516738456794818e-05} +{"train_loss": 0.0006303766858763993, "global_step": 55772, "epoch": 468, "lr": 1.1515324007605028e-05} +{"train_loss": 0.000435724388808012, "global_step": 55773, "epoch": 468, "lr": 1.1513909633975773e-05} +{"train_loss": 0.0006831994978711009, "global_step": 55774, "epoch": 468, "lr": 1.1512495335909862e-05} +{"train_loss": 0.0010277311084792018, "global_step": 55775, "epoch": 468, "lr": 1.1511081113410038e-05} +{"train_loss": 0.0012771410401910543, "global_step": 55776, "epoch": 468, "lr": 1.1509666966479104e-05} +{"train_loss": 0.0006335091893561184, "global_step": 55777, "epoch": 468, "lr": 1.1508252895119819e-05} +{"train_loss": 0.0007148130098357797, "global_step": 55778, "epoch": 468, "lr": 1.1506838899334982e-05} +{"train_loss": 0.0007367822690866888, "global_step": 55779, "epoch": 468, "lr": 1.1505424979127338e-05} +{"train_loss": 0.0010472427820786834, "global_step": 55780, "epoch": 468, "lr": 1.1504011134499693e-05} +{"train_loss": 0.0009227215778082609, "global_step": 55781, "epoch": 468, "lr": 1.1502597365454809e-05} +{"train_loss": 0.0006722529069520533, "global_step": 55782, "epoch": 468, "lr": 1.1501183671995447e-05} +{"train_loss": 0.00029959622770547867, "global_step": 55783, "epoch": 468, "lr": 1.1499770054124415e-05} +{"train_loss": 0.0008674085256643593, "global_step": 55784, "epoch": 468, "lr": 1.1498356511844454e-05} +{"train_loss": 0.0004266090109013021, "global_step": 55785, "epoch": 468, "lr": 1.1496943045158377e-05} +{"train_loss": 0.000526461168192327, "global_step": 55786, "epoch": 468, "lr": 1.1495529654068931e-05} +{"train_loss": 0.0015021906001493335, "global_step": 55787, "epoch": 468, "lr": 1.1494116338578892e-05} +{"train_loss": 0.00045199182932265103, "global_step": 55788, "epoch": 468, "lr": 1.1492703098691054e-05} +{"train_loss": 0.00028914352878928185, "global_step": 55789, "epoch": 468, "lr": 1.1491289934408161e-05} +{"train_loss": 0.00039751516305841506, "global_step": 55790, "epoch": 468, "lr": 1.1489876845733022e-05} +{"train_loss": 0.0005490041803568602, "global_step": 55791, "epoch": 468, "lr": 1.1488463832668384e-05} +{"train_loss": 0.00040313194040209055, "global_step": 55792, "epoch": 468, "lr": 1.148705089521705e-05} +{"train_loss": 0.000560532440431416, "global_step": 55793, "epoch": 468, "lr": 1.1485638033381768e-05} +{"train_loss": 0.0005222954787313938, "global_step": 55794, "epoch": 468, "lr": 1.1484225247165314e-05} +{"train_loss": 0.0007687992183491588, "global_step": 55795, "epoch": 468, "lr": 1.148281253657048e-05} +{"train_loss": 0.00056030647829175, "global_step": 55796, "epoch": 468, "lr": 1.1481399901600015e-05} +{"train_loss": 0.0007605577120557427, "global_step": 55797, "epoch": 468, "lr": 1.147998734225672e-05} +{"train_loss": 0.000687716412357986, "global_step": 55798, "epoch": 468, "lr": 1.1478574858543355e-05} +{"train_loss": 0.00032900081714615226, "global_step": 55799, "epoch": 468, "lr": 1.147716245046268e-05} +{"train_loss": 0.0006589968106709421, "global_step": 55800, "epoch": 468, "lr": 1.1475750118017498e-05} +{"train_loss": 0.0004319726431276649, "global_step": 55801, "epoch": 468, "lr": 1.1474337861210543e-05} +{"train_loss": 0.0005405903793871403, "global_step": 55802, "epoch": 468, "lr": 1.1472925680044616e-05} +{"train_loss": 0.00074560142820701, "global_step": 55803, "epoch": 468, "lr": 1.1471513574522496e-05} +{"train_loss": 0.0003972310514654964, "global_step": 55804, "epoch": 468, "lr": 1.1470101544646927e-05} +{"train_loss": 0.0005059994873590767, "global_step": 55805, "epoch": 468, "lr": 1.1468689590420712e-05} +{"train_loss": 0.0005090130143798888, "global_step": 55806, "epoch": 468, "lr": 1.1467277711846597e-05} +{"train_loss": 0.0011391168227419257, "global_step": 55807, "epoch": 468, "lr": 1.1465865908927375e-05} +{"train_loss": 0.0013100046198815107, "global_step": 55808, "epoch": 468, "lr": 1.1464454181665796e-05} +{"train_loss": 0.0005906687583774328, "global_step": 55809, "epoch": 468, "lr": 1.146304253006466e-05} +{"train_loss": 0.0006375396174198689, "global_step": 55810, "epoch": 468, "lr": 1.1461630954126712e-05, "val_loss": 0.0369415208697319} +{"train_loss": 0.000766037730500102, "global_step": 55811, "epoch": 469, "lr": 1.1460219453854742e-05} +{"train_loss": 0.0008770027197897434, "global_step": 55812, "epoch": 469, "lr": 1.1458808029251517e-05} +{"train_loss": 0.0004614246136043221, "global_step": 55813, "epoch": 469, "lr": 1.1457396680319793e-05} +{"train_loss": 0.0003326814330648631, "global_step": 55814, "epoch": 469, "lr": 1.1455985407062365e-05} +{"train_loss": 0.0006874137907288969, "global_step": 55815, "epoch": 469, "lr": 1.1454574209481972e-05} +{"train_loss": 0.001705200644209981, "global_step": 55816, "epoch": 469, "lr": 1.1453163087581426e-05} +{"train_loss": 0.0008634214755147696, "global_step": 55817, "epoch": 469, "lr": 1.1451752041363473e-05} +{"train_loss": 0.0004949390422552824, "global_step": 55818, "epoch": 469, "lr": 1.1450341070830872e-05} +{"train_loss": 0.0012350408360362053, "global_step": 55819, "epoch": 469, "lr": 1.1448930175986428e-05} +{"train_loss": 0.0011956735979765654, "global_step": 55820, "epoch": 469, "lr": 1.144751935683287e-05} +{"train_loss": 0.0006053866818547249, "global_step": 55821, "epoch": 469, "lr": 1.1446108613373007e-05} +{"train_loss": 0.0007363083423115313, "global_step": 55822, "epoch": 469, "lr": 1.1444697945609572e-05} +{"train_loss": 0.0007709137280471623, "global_step": 55823, "epoch": 469, "lr": 1.1443287353545373e-05} +{"train_loss": 0.000620093138422817, "global_step": 55824, "epoch": 469, "lr": 1.1441876837183158e-05} +{"train_loss": 0.0008593818638473749, "global_step": 55825, "epoch": 469, "lr": 1.1440466396525684e-05} +{"train_loss": 0.0004973872564733028, "global_step": 55826, "epoch": 469, "lr": 1.1439056031575752e-05} +{"train_loss": 0.0002803804527502507, "global_step": 55827, "epoch": 469, "lr": 1.1437645742336096e-05} +{"train_loss": 0.0004095598997082561, "global_step": 55828, "epoch": 469, "lr": 1.1436235528809513e-05} +{"train_loss": 0.0006395240779966116, "global_step": 55829, "epoch": 469, "lr": 1.1434825390998755e-05} +{"train_loss": 0.00038335361750796437, "global_step": 55830, "epoch": 469, "lr": 1.1433415328906611e-05} +{"train_loss": 0.00044607551535591483, "global_step": 55831, "epoch": 469, "lr": 1.1432005342535835e-05} +{"train_loss": 0.0008034651982598007, "global_step": 55832, "epoch": 469, "lr": 1.1430595431889179e-05} +{"train_loss": 0.0012078844010829926, "global_step": 55833, "epoch": 469, "lr": 1.1429185596969444e-05} +{"train_loss": 0.0006387963076122105, "global_step": 55834, "epoch": 469, "lr": 1.1427775837779364e-05} +{"train_loss": 0.0010974763426929712, "global_step": 55835, "epoch": 469, "lr": 1.1426366154321744e-05} +{"train_loss": 0.0005025851423852146, "global_step": 55836, "epoch": 469, "lr": 1.1424956546599319e-05} +{"train_loss": 0.00040390962385572493, "global_step": 55837, "epoch": 469, "lr": 1.1423547014614871e-05} +{"train_loss": 0.00038602377753704786, "global_step": 55838, "epoch": 469, "lr": 1.1422137558371181e-05} +{"train_loss": 0.0003578441101126373, "global_step": 55839, "epoch": 469, "lr": 1.1420728177870987e-05} +{"train_loss": 0.00036710838321596384, "global_step": 55840, "epoch": 469, "lr": 1.1419318873117092e-05} +{"train_loss": 0.000741681840736419, "global_step": 55841, "epoch": 469, "lr": 1.1417909644112218e-05} +{"train_loss": 0.00037796649849042296, "global_step": 55842, "epoch": 469, "lr": 1.1416500490859177e-05} +{"train_loss": 0.0005553907249122858, "global_step": 55843, "epoch": 469, "lr": 1.1415091413360712e-05} +{"train_loss": 0.00040159988566301763, "global_step": 55844, "epoch": 469, "lr": 1.1413682411619585e-05} +{"train_loss": 0.0005751432036049664, "global_step": 55845, "epoch": 469, "lr": 1.141227348563858e-05} +{"train_loss": 0.00042822540854103863, "global_step": 55846, "epoch": 469, "lr": 1.1410864635420437e-05} +{"train_loss": 0.0005436469218693674, "global_step": 55847, "epoch": 469, "lr": 1.1409455860967956e-05} +{"train_loss": 0.0006685670814476907, "global_step": 55848, "epoch": 469, "lr": 1.140804716228387e-05} +{"train_loss": 0.0008067329181358218, "global_step": 55849, "epoch": 469, "lr": 1.1406638539370978e-05} +{"train_loss": 0.0009436678956262767, "global_step": 55850, "epoch": 469, "lr": 1.1405229992232024e-05} +{"train_loss": 0.0006530404789373279, "global_step": 55851, "epoch": 469, "lr": 1.1403821520869767e-05} +{"train_loss": 0.0004068621201440692, "global_step": 55852, "epoch": 469, "lr": 1.1402413125286993e-05} +{"train_loss": 0.0006355105433613062, "global_step": 55853, "epoch": 469, "lr": 1.1401004805486448e-05} +{"train_loss": 0.0005221899482421577, "global_step": 55854, "epoch": 469, "lr": 1.1399596561470916e-05} +{"train_loss": 0.0003896342241205275, "global_step": 55855, "epoch": 469, "lr": 1.1398188393243153e-05} +{"train_loss": 0.0003511038958095014, "global_step": 55856, "epoch": 469, "lr": 1.1396780300805909e-05} +{"train_loss": 0.00037864939076825976, "global_step": 55857, "epoch": 469, "lr": 1.139537228416198e-05} +{"train_loss": 0.00044979085214436054, "global_step": 55858, "epoch": 469, "lr": 1.1393964343314101e-05} +{"train_loss": 0.00043757841922342777, "global_step": 55859, "epoch": 469, "lr": 1.1392556478265054e-05} +{"train_loss": 0.00044669516501016915, "global_step": 55860, "epoch": 469, "lr": 1.1391148689017589e-05} +{"train_loss": 0.00046387716429308057, "global_step": 55861, "epoch": 469, "lr": 1.1389740975574493e-05} +{"train_loss": 0.00045318162301555276, "global_step": 55862, "epoch": 469, "lr": 1.1388333337938517e-05} +{"train_loss": 0.00039370727608911693, "global_step": 55863, "epoch": 469, "lr": 1.1386925776112406e-05} +{"train_loss": 0.0002599355357233435, "global_step": 55864, "epoch": 469, "lr": 1.1385518290098956e-05} +{"train_loss": 0.0004751943633891642, "global_step": 55865, "epoch": 469, "lr": 1.1384110879900906e-05} +{"train_loss": 0.0005248798406682909, "global_step": 55866, "epoch": 469, "lr": 1.1382703545521034e-05} +{"train_loss": 0.0005500289262272418, "global_step": 55867, "epoch": 469, "lr": 1.138129628696209e-05} +{"train_loss": 0.000638491241261363, "global_step": 55868, "epoch": 469, "lr": 1.137988910422686e-05} +{"train_loss": 0.0003228781861253083, "global_step": 55869, "epoch": 469, "lr": 1.1378481997318074e-05} +{"train_loss": 0.00023060053354129195, "global_step": 55870, "epoch": 469, "lr": 1.1377074966238527e-05} +{"train_loss": 0.0004166285216342658, "global_step": 55871, "epoch": 469, "lr": 1.1375668010990953e-05} +{"train_loss": 0.0004463456862140447, "global_step": 55872, "epoch": 469, "lr": 1.1374261131578129e-05} +{"train_loss": 0.0002843858674168587, "global_step": 55873, "epoch": 469, "lr": 1.1372854328002836e-05} +{"train_loss": 0.0005882723489776254, "global_step": 55874, "epoch": 469, "lr": 1.1371447600267809e-05} +{"train_loss": 0.0003636907204054296, "global_step": 55875, "epoch": 469, "lr": 1.137004094837581e-05} +{"train_loss": 0.00046903538168407977, "global_step": 55876, "epoch": 469, "lr": 1.1368634372329617e-05} +{"train_loss": 0.0005168062634766102, "global_step": 55877, "epoch": 469, "lr": 1.1367227872131969e-05} +{"train_loss": 0.00039280913188122213, "global_step": 55878, "epoch": 469, "lr": 1.1365821447785663e-05} +{"train_loss": 0.0004800694587174803, "global_step": 55879, "epoch": 469, "lr": 1.1364415099293419e-05} +{"train_loss": 0.0003851883811876178, "global_step": 55880, "epoch": 469, "lr": 1.1363008826658034e-05} +{"train_loss": 0.0003702476678881794, "global_step": 55881, "epoch": 469, "lr": 1.1361602629882252e-05} +{"train_loss": 0.0004783623153343797, "global_step": 55882, "epoch": 469, "lr": 1.1360196508968824e-05} +{"train_loss": 0.0007151856552809477, "global_step": 55883, "epoch": 469, "lr": 1.1358790463920533e-05} +{"train_loss": 0.0003031957894563675, "global_step": 55884, "epoch": 469, "lr": 1.135738449474012e-05} +{"train_loss": 0.0003041221643798053, "global_step": 55885, "epoch": 469, "lr": 1.1355978601430361e-05} +{"train_loss": 0.0004426386731211096, "global_step": 55886, "epoch": 469, "lr": 1.1354572783994016e-05} +{"train_loss": 0.00031759976991452277, "global_step": 55887, "epoch": 469, "lr": 1.1353167042433821e-05} +{"train_loss": 0.0008123478619381785, "global_step": 55888, "epoch": 469, "lr": 1.1351761376752568e-05} +{"train_loss": 0.00020744206267409027, "global_step": 55889, "epoch": 469, "lr": 1.1350355786952988e-05} +{"train_loss": 0.0005791636649519205, "global_step": 55890, "epoch": 469, "lr": 1.1348950273037873e-05} +{"train_loss": 0.00039925274904817343, "global_step": 55891, "epoch": 469, "lr": 1.134754483500995e-05} +{"train_loss": 0.00030086710467003286, "global_step": 55892, "epoch": 469, "lr": 1.1346139472872002e-05} +{"train_loss": 0.0004618136736098677, "global_step": 55893, "epoch": 469, "lr": 1.1344734186626782e-05} +{"train_loss": 0.0003273813345003873, "global_step": 55894, "epoch": 469, "lr": 1.1343328976277034e-05} +{"train_loss": 0.000598584592808038, "global_step": 55895, "epoch": 469, "lr": 1.1341923841825546e-05} +{"train_loss": 0.0007410245598293841, "global_step": 55896, "epoch": 469, "lr": 1.1340518783275044e-05} +{"train_loss": 0.00033409675233997405, "global_step": 55897, "epoch": 469, "lr": 1.133911380062832e-05} +{"train_loss": 0.00030972808599472046, "global_step": 55898, "epoch": 469, "lr": 1.13377088938881e-05} +{"train_loss": 0.000771238817833364, "global_step": 55899, "epoch": 469, "lr": 1.1336304063057169e-05} +{"train_loss": 0.0005945524899289012, "global_step": 55900, "epoch": 469, "lr": 1.1334899308138263e-05} +{"train_loss": 0.0007226077723316848, "global_step": 55901, "epoch": 469, "lr": 1.1333494629134161e-05} +{"train_loss": 0.00023858010536059737, "global_step": 55902, "epoch": 469, "lr": 1.1332090026047604e-05} +{"train_loss": 0.0005118490080349147, "global_step": 55903, "epoch": 469, "lr": 1.1330685498881371e-05} +{"train_loss": 0.00046026078052818775, "global_step": 55904, "epoch": 469, "lr": 1.1329281047638185e-05} +{"train_loss": 0.00037953906576149166, "global_step": 55905, "epoch": 469, "lr": 1.1327876672320848e-05} +{"train_loss": 0.0005286688101477921, "global_step": 55906, "epoch": 469, "lr": 1.1326472372932073e-05} +{"train_loss": 0.0007244647713378072, "global_step": 55907, "epoch": 469, "lr": 1.1325068149474654e-05} +{"train_loss": 0.0006583411013707519, "global_step": 55908, "epoch": 469, "lr": 1.1323664001951318e-05} +{"train_loss": 0.00046905677299946547, "global_step": 55909, "epoch": 469, "lr": 1.1322259930364848e-05} +{"train_loss": 0.0007600625394843519, "global_step": 55910, "epoch": 469, "lr": 1.1320855934717971e-05} +{"train_loss": 0.0005216789431869984, "global_step": 55911, "epoch": 469, "lr": 1.1319452015013482e-05} +{"train_loss": 0.0004544400726445019, "global_step": 55912, "epoch": 469, "lr": 1.1318048171254114e-05} +{"train_loss": 0.0006295191124081612, "global_step": 55913, "epoch": 469, "lr": 1.131664440344261e-05} +{"train_loss": 0.0007778897997923195, "global_step": 55914, "epoch": 469, "lr": 1.131524071158176e-05} +{"train_loss": 0.00046804375597275794, "global_step": 55915, "epoch": 469, "lr": 1.1313837095674285e-05} +{"train_loss": 0.00038827277603559196, "global_step": 55916, "epoch": 469, "lr": 1.1312433555722972e-05} +{"train_loss": 0.0006125839427113533, "global_step": 55917, "epoch": 469, "lr": 1.131103009173055e-05} +{"train_loss": 0.0008895935025066137, "global_step": 55918, "epoch": 469, "lr": 1.13096267036998e-05} +{"train_loss": 0.0005207951180636883, "global_step": 55919, "epoch": 469, "lr": 1.1308223391633465e-05} +{"train_loss": 0.000359058118192479, "global_step": 55920, "epoch": 469, "lr": 1.1306820155534287e-05} +{"train_loss": 0.0005169863579794765, "global_step": 55921, "epoch": 469, "lr": 1.130541699540505e-05} +{"train_loss": 0.0006599854095838964, "global_step": 55922, "epoch": 469, "lr": 1.1304013911248473e-05} +{"train_loss": 0.0005475453799590468, "global_step": 55923, "epoch": 469, "lr": 1.1302610903067346e-05} +{"train_loss": 0.0006363762659020722, "global_step": 55924, "epoch": 469, "lr": 1.1301207970864408e-05} +{"train_loss": 0.0004818984598387033, "global_step": 55925, "epoch": 469, "lr": 1.1299805114642403e-05} +{"train_loss": 0.000962402846198529, "global_step": 55926, "epoch": 469, "lr": 1.1298402334404107e-05} +{"train_loss": 0.0005262796767055988, "global_step": 55927, "epoch": 469, "lr": 1.1296999630152254e-05} +{"train_loss": 0.0002552922233007848, "global_step": 55928, "epoch": 469, "lr": 1.1295597001889618e-05} +{"train_loss": 0.0005514475520888046, "global_step": 55929, "epoch": 469, "lr": 1.1294194449618929e-05, "val_loss": 0.01139818038791418} +{"train_loss": 0.0006474687834270298, "global_step": 55930, "epoch": 470, "lr": 1.1292791973342965e-05} +{"train_loss": 0.00037194843753241, "global_step": 55931, "epoch": 470, "lr": 1.129138957306447e-05} +{"train_loss": 0.0004797737638000399, "global_step": 55932, "epoch": 470, "lr": 1.1289987248786189e-05} +{"train_loss": 0.000404714432079345, "global_step": 55933, "epoch": 470, "lr": 1.1288585000510888e-05} +{"train_loss": 0.0003283583791926503, "global_step": 55934, "epoch": 470, "lr": 1.1287182828241305e-05} +{"train_loss": 0.000871694297529757, "global_step": 55935, "epoch": 470, "lr": 1.12857807319802e-05} +{"train_loss": 0.0005623172037303448, "global_step": 55936, "epoch": 470, "lr": 1.1284378711730342e-05} +{"train_loss": 0.0006594781880266964, "global_step": 55937, "epoch": 470, "lr": 1.1282976767494458e-05} +{"train_loss": 0.0004601793480105698, "global_step": 55938, "epoch": 470, "lr": 1.1281574899275327e-05} +{"train_loss": 0.0005239378078840673, "global_step": 55939, "epoch": 470, "lr": 1.1280173107075675e-05} +{"train_loss": 0.00046982179628685117, "global_step": 55940, "epoch": 470, "lr": 1.127877139089828e-05} +{"train_loss": 0.0008011789177544415, "global_step": 55941, "epoch": 470, "lr": 1.1277369750745864e-05} +{"train_loss": 0.00075347232632339, "global_step": 55942, "epoch": 470, "lr": 1.127596818662121e-05} +{"train_loss": 0.0005406266427598894, "global_step": 55943, "epoch": 470, "lr": 1.1274566698527056e-05} +{"train_loss": 0.0006572107085958123, "global_step": 55944, "epoch": 470, "lr": 1.1273165286466136e-05} +{"train_loss": 0.0006011463119648397, "global_step": 55945, "epoch": 470, "lr": 1.1271763950441238e-05} +{"train_loss": 0.0006012304220348597, "global_step": 55946, "epoch": 470, "lr": 1.1270362690455077e-05} +{"train_loss": 0.00030562310712412, "global_step": 55947, "epoch": 470, "lr": 1.1268961506510439e-05} +{"train_loss": 0.00047765945782884955, "global_step": 55948, "epoch": 470, "lr": 1.1267560398610038e-05} +{"train_loss": 0.0006355469231493771, "global_step": 55949, "epoch": 470, "lr": 1.1266159366756662e-05} +{"train_loss": 0.0003644716343842447, "global_step": 55950, "epoch": 470, "lr": 1.1264758410953041e-05} +{"train_loss": 0.0005194366676732898, "global_step": 55951, "epoch": 470, "lr": 1.1263357531201917e-05} +{"train_loss": 0.0006538181914947927, "global_step": 55952, "epoch": 470, "lr": 1.1261956727506063e-05} +{"train_loss": 0.0006935955607332289, "global_step": 55953, "epoch": 470, "lr": 1.1260555999868205e-05} +{"train_loss": 0.0004095552139915526, "global_step": 55954, "epoch": 470, "lr": 1.1259155348291123e-05} +{"train_loss": 0.0005683238850906491, "global_step": 55955, "epoch": 470, "lr": 1.1257754772777552e-05} +{"train_loss": 0.000496076769195497, "global_step": 55956, "epoch": 470, "lr": 1.1256354273330223e-05} +{"train_loss": 0.0006480826414190233, "global_step": 55957, "epoch": 470, "lr": 1.125495384995192e-05} +{"train_loss": 0.00043325257138349116, "global_step": 55958, "epoch": 470, "lr": 1.1253553502645358e-05} +{"train_loss": 0.00030644223443232477, "global_step": 55959, "epoch": 470, "lr": 1.125215323141332e-05} +{"train_loss": 0.0005161167355254292, "global_step": 55960, "epoch": 470, "lr": 1.1250753036258527e-05} +{"train_loss": 0.0007421693298965693, "global_step": 55961, "epoch": 470, "lr": 1.1249352917183753e-05} +{"train_loss": 0.0005005257553420961, "global_step": 55962, "epoch": 470, "lr": 1.1247952874191736e-05} +{"train_loss": 0.00037374987732619047, "global_step": 55963, "epoch": 470, "lr": 1.1246552907285213e-05} +{"train_loss": 0.0006403094157576561, "global_step": 55964, "epoch": 470, "lr": 1.1245153016466952e-05} +{"train_loss": 0.0003747545706573874, "global_step": 55965, "epoch": 470, "lr": 1.1243753201739676e-05} +{"train_loss": 0.0003080843889620155, "global_step": 55966, "epoch": 470, "lr": 1.124235346310617e-05} +{"train_loss": 0.0005253356066532433, "global_step": 55967, "epoch": 470, "lr": 1.1240953800569149e-05} +{"train_loss": 0.00043125133379362524, "global_step": 55968, "epoch": 470, "lr": 1.1239554214131382e-05} +{"train_loss": 0.0009897506097331643, "global_step": 55969, "epoch": 470, "lr": 1.1238154703795601e-05} +{"train_loss": 0.0003897754068020731, "global_step": 55970, "epoch": 470, "lr": 1.1236755269564558e-05} +{"train_loss": 0.0005000131204724312, "global_step": 55971, "epoch": 470, "lr": 1.1235355911441025e-05} +{"train_loss": 0.0009461418376304209, "global_step": 55972, "epoch": 470, "lr": 1.123395662942771e-05} +{"train_loss": 0.0002581623266451061, "global_step": 55973, "epoch": 470, "lr": 1.1232557423527396e-05} +{"train_loss": 0.00040235131746158004, "global_step": 55974, "epoch": 470, "lr": 1.123115829374281e-05} +{"train_loss": 0.0006239134818315506, "global_step": 55975, "epoch": 470, "lr": 1.1229759240076693e-05} +{"train_loss": 0.000297531922115013, "global_step": 55976, "epoch": 470, "lr": 1.1228360262531812e-05} +{"train_loss": 0.00033331342274323106, "global_step": 55977, "epoch": 470, "lr": 1.1226961361110894e-05} +{"train_loss": 0.0006690324516966939, "global_step": 55978, "epoch": 470, "lr": 1.1225562535816709e-05} +{"train_loss": 0.00024851495982147753, "global_step": 55979, "epoch": 470, "lr": 1.122416378665197e-05} +{"train_loss": 0.0008514855289831758, "global_step": 55980, "epoch": 470, "lr": 1.122276511361946e-05} +{"train_loss": 0.0003315226931590587, "global_step": 55981, "epoch": 470, "lr": 1.122136651672191e-05} +{"train_loss": 0.0004979390650987625, "global_step": 55982, "epoch": 470, "lr": 1.1219967995962043e-05} +{"train_loss": 0.0008085703593678772, "global_step": 55983, "epoch": 470, "lr": 1.1218569551342651e-05} +{"train_loss": 0.0011435856577008963, "global_step": 55984, "epoch": 470, "lr": 1.1217171182866431e-05} +{"train_loss": 0.0006110180402174592, "global_step": 55985, "epoch": 470, "lr": 1.1215772890536168e-05} +{"train_loss": 0.0005790999275632203, "global_step": 55986, "epoch": 470, "lr": 1.1214374674354594e-05} +{"train_loss": 0.00042354330071248114, "global_step": 55987, "epoch": 470, "lr": 1.1212976534324438e-05} +{"train_loss": 0.00045237585436552763, "global_step": 55988, "epoch": 470, "lr": 1.121157847044847e-05} +{"train_loss": 0.0009548335219733417, "global_step": 55989, "epoch": 470, "lr": 1.121018048272941e-05} +{"train_loss": 0.0005458341911435127, "global_step": 55990, "epoch": 470, "lr": 1.1208782571170035e-05} +{"train_loss": 0.00037172561860643327, "global_step": 55991, "epoch": 470, "lr": 1.1207384735773052e-05} +{"train_loss": 0.00035329617094248533, "global_step": 55992, "epoch": 470, "lr": 1.1205986976541243e-05} +{"train_loss": 0.0004385636711958796, "global_step": 55993, "epoch": 470, "lr": 1.120458929347733e-05} +{"train_loss": 0.000576688558794558, "global_step": 55994, "epoch": 470, "lr": 1.1203191686584046e-05} +{"train_loss": 0.0007830366957932711, "global_step": 55995, "epoch": 470, "lr": 1.1201794155864171e-05} +{"train_loss": 0.00048819457879289985, "global_step": 55996, "epoch": 470, "lr": 1.120039670132041e-05} +{"train_loss": 0.00027949531795457006, "global_step": 55997, "epoch": 470, "lr": 1.119899932295554e-05} +{"train_loss": 0.00039125015609897673, "global_step": 55998, "epoch": 470, "lr": 1.1197602020772275e-05} +{"train_loss": 0.0003241121012251824, "global_step": 55999, "epoch": 470, "lr": 1.1196204794773385e-05} +{"train_loss": 0.000590253621339798, "global_step": 56000, "epoch": 470, "lr": 1.1194807644961592e-05} +{"train_loss": 0.00040828969213180244, "global_step": 56001, "epoch": 470, "lr": 1.1193410571339658e-05} +{"train_loss": 0.0006342852720990777, "global_step": 56002, "epoch": 470, "lr": 1.1192013573910304e-05} +{"train_loss": 0.0002687558881007135, "global_step": 56003, "epoch": 470, "lr": 1.11906166526763e-05} +{"train_loss": 0.0005356761976145208, "global_step": 56004, "epoch": 470, "lr": 1.1189219807640355e-05} +{"train_loss": 0.000563230540137738, "global_step": 56005, "epoch": 470, "lr": 1.118782303880525e-05} +{"train_loss": 0.000285670772427693, "global_step": 56006, "epoch": 470, "lr": 1.1186426346173695e-05} +{"train_loss": 0.0007746001938357949, "global_step": 56007, "epoch": 470, "lr": 1.1185029729748459e-05} +{"train_loss": 0.0003753804776351899, "global_step": 56008, "epoch": 470, "lr": 1.118363318953225e-05} +{"train_loss": 0.00046246228157542646, "global_step": 56009, "epoch": 470, "lr": 1.1182236725527851e-05} +{"train_loss": 0.00028867615037597716, "global_step": 56010, "epoch": 470, "lr": 1.118084033773797e-05} +{"train_loss": 0.00039157530409283936, "global_step": 56011, "epoch": 470, "lr": 1.117944402616537e-05} +{"train_loss": 0.00100566481705755, "global_step": 56012, "epoch": 470, "lr": 1.1178047790812784e-05} +{"train_loss": 0.0006165386294014752, "global_step": 56013, "epoch": 470, "lr": 1.1176651631682944e-05} +{"train_loss": 0.0005006230785511434, "global_step": 56014, "epoch": 470, "lr": 1.1175255548778618e-05} +{"train_loss": 0.0010691634379327297, "global_step": 56015, "epoch": 470, "lr": 1.117385954210251e-05} +{"train_loss": 0.0002779065107461065, "global_step": 56016, "epoch": 470, "lr": 1.1172463611657396e-05} +{"train_loss": 0.0004270711506251246, "global_step": 56017, "epoch": 470, "lr": 1.1171067757445986e-05} +{"train_loss": 0.0009181591449305415, "global_step": 56018, "epoch": 470, "lr": 1.1169671979471053e-05} +{"train_loss": 0.000588668161071837, "global_step": 56019, "epoch": 470, "lr": 1.1168276277735317e-05} +{"train_loss": 0.00025117784389294684, "global_step": 56020, "epoch": 470, "lr": 1.1166880652241512e-05} +{"train_loss": 0.0005561276338994503, "global_step": 56021, "epoch": 470, "lr": 1.1165485102992402e-05} +{"train_loss": 0.00028919728356413543, "global_step": 56022, "epoch": 470, "lr": 1.1164089629990699e-05} +{"train_loss": 0.0006777981761842966, "global_step": 56023, "epoch": 470, "lr": 1.1162694233239168e-05} +{"train_loss": 0.0009275235934183002, "global_step": 56024, "epoch": 470, "lr": 1.1161298912740543e-05} +{"train_loss": 0.0004773941182065755, "global_step": 56025, "epoch": 470, "lr": 1.115990366849754e-05} +{"train_loss": 0.0004411576665006578, "global_step": 56026, "epoch": 470, "lr": 1.1158508500512933e-05} +{"train_loss": 0.0002924261789303273, "global_step": 56027, "epoch": 470, "lr": 1.1157113408789428e-05} +{"train_loss": 0.00033536911359988153, "global_step": 56028, "epoch": 470, "lr": 1.1155718393329795e-05} +{"train_loss": 0.0005061863921582699, "global_step": 56029, "epoch": 470, "lr": 1.115432345413675e-05} +{"train_loss": 0.0005670083919540048, "global_step": 56030, "epoch": 470, "lr": 1.1152928591213052e-05} +{"train_loss": 0.00036048880429007113, "global_step": 56031, "epoch": 470, "lr": 1.1151533804561426e-05} +{"train_loss": 0.0007147657452151179, "global_step": 56032, "epoch": 470, "lr": 1.1150139094184602e-05} +{"train_loss": 0.0007723344024270773, "global_step": 56033, "epoch": 470, "lr": 1.1148744460085331e-05} +{"train_loss": 0.00025396861019544303, "global_step": 56034, "epoch": 470, "lr": 1.1147349902266358e-05} +{"train_loss": 0.00026624463498592377, "global_step": 56035, "epoch": 470, "lr": 1.1145955420730403e-05} +{"train_loss": 0.00038894775207154453, "global_step": 56036, "epoch": 470, "lr": 1.1144561015480227e-05} +{"train_loss": 0.0007544702966697514, "global_step": 56037, "epoch": 470, "lr": 1.114316668651854e-05} +{"train_loss": 0.0002818315988406539, "global_step": 56038, "epoch": 470, "lr": 1.1141772433848108e-05} +{"train_loss": 0.0006967496010474861, "global_step": 56039, "epoch": 470, "lr": 1.114037825747164e-05} +{"train_loss": 0.0003900873998645693, "global_step": 56040, "epoch": 470, "lr": 1.1138984157391902e-05} +{"train_loss": 0.0004943354870192707, "global_step": 56041, "epoch": 470, "lr": 1.1137590133611603e-05} +{"train_loss": 0.0005865306011401117, "global_step": 56042, "epoch": 470, "lr": 1.1136196186133507e-05} +{"train_loss": 0.0007507847039960325, "global_step": 56043, "epoch": 470, "lr": 1.1134802314960336e-05} +{"train_loss": 0.0006112980772741139, "global_step": 56044, "epoch": 470, "lr": 1.1133408520094817e-05} +{"train_loss": 0.00047827360685914755, "global_step": 56045, "epoch": 470, "lr": 1.1132014801539713e-05} +{"train_loss": 0.0004660043923649937, "global_step": 56046, "epoch": 470, "lr": 1.1130621159297733e-05} +{"train_loss": 0.0005893061170354486, "global_step": 56047, "epoch": 470, "lr": 1.1129227593371639e-05} +{"train_loss": 0.000529517315204858, "global_step": 56048, "epoch": 470, "lr": 1.1127834103764135e-05, "val_loss": 0.01574552245438099, "train_action_mse_error": 6.50737229079823e-06} +{"train_loss": 0.0006329030729830265, "global_step": 56049, "epoch": 471, "lr": 1.1126440690477996e-05} +{"train_loss": 0.0004088779678568244, "global_step": 56050, "epoch": 471, "lr": 1.1125047353515932e-05} +{"train_loss": 0.0006734143826179206, "global_step": 56051, "epoch": 471, "lr": 1.1123654092880675e-05} +{"train_loss": 0.00045209581730887294, "global_step": 56052, "epoch": 471, "lr": 1.1122260908574982e-05} +{"train_loss": 0.0009254384785890579, "global_step": 56053, "epoch": 471, "lr": 1.1120867800601564e-05} +{"train_loss": 0.0005831901216879487, "global_step": 56054, "epoch": 471, "lr": 1.1119474768963179e-05} +{"train_loss": 0.0007808393565937877, "global_step": 56055, "epoch": 471, "lr": 1.111808181366255e-05} +{"train_loss": 0.0004756913986057043, "global_step": 56056, "epoch": 471, "lr": 1.1116688934702408e-05} +{"train_loss": 0.0008337738690897822, "global_step": 56057, "epoch": 471, "lr": 1.11152961320855e-05} +{"train_loss": 0.0006569967372342944, "global_step": 56058, "epoch": 471, "lr": 1.111390340581454e-05} +{"train_loss": 0.00042184186168015003, "global_step": 56059, "epoch": 471, "lr": 1.1112510755892292e-05} +{"train_loss": 0.0009115857537835836, "global_step": 56060, "epoch": 471, "lr": 1.1111118182321462e-05} +{"train_loss": 0.0003682711103465408, "global_step": 56061, "epoch": 471, "lr": 1.110972568510481e-05} +{"train_loss": 0.00043677425128407776, "global_step": 56062, "epoch": 471, "lr": 1.1108333264245057e-05} +{"train_loss": 0.0005218465230427682, "global_step": 56063, "epoch": 471, "lr": 1.1106940919744923e-05} +{"train_loss": 0.00034350508940406144, "global_step": 56064, "epoch": 471, "lr": 1.1105548651607168e-05} +{"train_loss": 0.0005435086786746979, "global_step": 56065, "epoch": 471, "lr": 1.1104156459834498e-05} +{"train_loss": 0.0005007414729334414, "global_step": 56066, "epoch": 471, "lr": 1.1102764344429678e-05} +{"train_loss": 0.0006452741217799485, "global_step": 56067, "epoch": 471, "lr": 1.1101372305395408e-05} +{"train_loss": 0.00043665821431204677, "global_step": 56068, "epoch": 471, "lr": 1.1099980342734439e-05} +{"train_loss": 0.0008030454046092927, "global_step": 56069, "epoch": 471, "lr": 1.1098588456449516e-05} +{"train_loss": 0.0008452600450254977, "global_step": 56070, "epoch": 471, "lr": 1.1097196646543346e-05} +{"train_loss": 0.0007846697699278593, "global_step": 56071, "epoch": 471, "lr": 1.1095804913018686e-05} +{"train_loss": 0.0012488471111282706, "global_step": 56072, "epoch": 471, "lr": 1.1094413255878244e-05} +{"train_loss": 0.0003724370035342872, "global_step": 56073, "epoch": 471, "lr": 1.1093021675124781e-05} +{"train_loss": 0.0006422981969080865, "global_step": 56074, "epoch": 471, "lr": 1.1091630170761013e-05} +{"train_loss": 0.0005782541120424867, "global_step": 56075, "epoch": 471, "lr": 1.1090238742789661e-05} +{"train_loss": 0.00046778202522546053, "global_step": 56076, "epoch": 471, "lr": 1.1088847391213474e-05} +{"train_loss": 0.0005533808725886047, "global_step": 56077, "epoch": 471, "lr": 1.1087456116035172e-05} +{"train_loss": 0.00048289564438164234, "global_step": 56078, "epoch": 471, "lr": 1.10860649172575e-05} +{"train_loss": 0.0006823851144872606, "global_step": 56079, "epoch": 471, "lr": 1.1084673794883172e-05} +{"train_loss": 0.0005401296657510102, "global_step": 56080, "epoch": 471, "lr": 1.1083282748914941e-05} +{"train_loss": 0.0003879879950545728, "global_step": 56081, "epoch": 471, "lr": 1.108189177935553e-05} +{"train_loss": 0.0005823945975862443, "global_step": 56082, "epoch": 471, "lr": 1.1080500886207657e-05} +{"train_loss": 0.0006183145451359451, "global_step": 56083, "epoch": 471, "lr": 1.1079110069474069e-05} +{"train_loss": 0.0006216070614755154, "global_step": 56084, "epoch": 471, "lr": 1.1077719329157477e-05} +{"train_loss": 0.0004840961191803217, "global_step": 56085, "epoch": 471, "lr": 1.1076328665260638e-05} +{"train_loss": 0.000837086932733655, "global_step": 56086, "epoch": 471, "lr": 1.1074938077786261e-05} +{"train_loss": 0.0005661837058141828, "global_step": 56087, "epoch": 471, "lr": 1.1073547566737097e-05} +{"train_loss": 0.0005492310156114399, "global_step": 56088, "epoch": 471, "lr": 1.1072157132115857e-05} +{"train_loss": 0.00046857225243002176, "global_step": 56089, "epoch": 471, "lr": 1.1070766773925272e-05} +{"train_loss": 0.0005280579789541662, "global_step": 56090, "epoch": 471, "lr": 1.1069376492168088e-05} +{"train_loss": 0.0007429441320709884, "global_step": 56091, "epoch": 471, "lr": 1.106798628684701e-05} +{"train_loss": 0.0005919241812080145, "global_step": 56092, "epoch": 471, "lr": 1.1066596157964793e-05} +{"train_loss": 0.0004819671157747507, "global_step": 56093, "epoch": 471, "lr": 1.1065206105524156e-05} +{"train_loss": 0.0003695386985782534, "global_step": 56094, "epoch": 471, "lr": 1.1063816129527815e-05} +{"train_loss": 0.00038812137790955603, "global_step": 56095, "epoch": 471, "lr": 1.106242622997853e-05} +{"train_loss": 0.0003990864206571132, "global_step": 56096, "epoch": 471, "lr": 1.1061036406878988e-05} +{"train_loss": 0.000507719349116087, "global_step": 56097, "epoch": 471, "lr": 1.1059646660231964e-05} +{"train_loss": 0.00037025322671979666, "global_step": 56098, "epoch": 471, "lr": 1.1058256990040144e-05} +{"train_loss": 0.000445356999989599, "global_step": 56099, "epoch": 471, "lr": 1.1056867396306291e-05} +{"train_loss": 0.0005796936457045376, "global_step": 56100, "epoch": 471, "lr": 1.1055477879033105e-05} +{"train_loss": 0.0005510190967470407, "global_step": 56101, "epoch": 471, "lr": 1.1054088438223343e-05} +{"train_loss": 0.0007625968428328633, "global_step": 56102, "epoch": 471, "lr": 1.1052699073879702e-05} +{"train_loss": 0.0001898219488793984, "global_step": 56103, "epoch": 471, "lr": 1.1051309786004921e-05} +{"train_loss": 0.0004916961188428104, "global_step": 56104, "epoch": 471, "lr": 1.1049920574601753e-05} +{"train_loss": 0.001103671151213348, "global_step": 56105, "epoch": 471, "lr": 1.1048531439672888e-05} +{"train_loss": 0.0004213231150060892, "global_step": 56106, "epoch": 471, "lr": 1.1047142381221082e-05} +{"train_loss": 0.0005111484206281602, "global_step": 56107, "epoch": 471, "lr": 1.1045753399249054e-05} +{"train_loss": 0.0007209268514998257, "global_step": 56108, "epoch": 471, "lr": 1.1044364493759512e-05} +{"train_loss": 0.0005338735645636916, "global_step": 56109, "epoch": 471, "lr": 1.1042975664755212e-05} +{"train_loss": 0.00028749709599651396, "global_step": 56110, "epoch": 471, "lr": 1.1041586912238854e-05} +{"train_loss": 0.0006547675584442914, "global_step": 56111, "epoch": 471, "lr": 1.1040198236213195e-05} +{"train_loss": 0.0003929081140086055, "global_step": 56112, "epoch": 471, "lr": 1.103880963668094e-05} +{"train_loss": 0.0008672899566590786, "global_step": 56113, "epoch": 471, "lr": 1.1037421113644807e-05} +{"train_loss": 0.0006215487373992801, "global_step": 56114, "epoch": 471, "lr": 1.1036032667107549e-05} +{"train_loss": 0.0005721624474972486, "global_step": 56115, "epoch": 471, "lr": 1.1034644297071866e-05} +{"train_loss": 0.000674526032526046, "global_step": 56116, "epoch": 471, "lr": 1.1033256003540509e-05} +{"train_loss": 0.0003679118526633829, "global_step": 56117, "epoch": 471, "lr": 1.1031867786516175e-05} +{"train_loss": 0.00047445838572457433, "global_step": 56118, "epoch": 471, "lr": 1.1030479646001624e-05} +{"train_loss": 0.0004399731697048992, "global_step": 56119, "epoch": 471, "lr": 1.1029091581999561e-05} +{"train_loss": 0.00047709682257846, "global_step": 56120, "epoch": 471, "lr": 1.1027703594512694e-05} +{"train_loss": 0.0005022344412282109, "global_step": 56121, "epoch": 471, "lr": 1.1026315683543792e-05} +{"train_loss": 0.00047807107330299914, "global_step": 56122, "epoch": 471, "lr": 1.1024927849095534e-05} +{"train_loss": 0.00043033622205257416, "global_step": 56123, "epoch": 471, "lr": 1.102354009117068e-05} +{"train_loss": 0.00031001653405837715, "global_step": 56124, "epoch": 471, "lr": 1.102215240977194e-05} +{"train_loss": 0.0009796214289963245, "global_step": 56125, "epoch": 471, "lr": 1.1020764804902034e-05} +{"train_loss": 0.00043670099694281816, "global_step": 56126, "epoch": 471, "lr": 1.1019377276563698e-05} +{"train_loss": 0.0006974057760089636, "global_step": 56127, "epoch": 471, "lr": 1.1017989824759638e-05} +{"train_loss": 0.0010645868023857474, "global_step": 56128, "epoch": 471, "lr": 1.1016602449492602e-05} +{"train_loss": 0.0004345631168689579, "global_step": 56129, "epoch": 471, "lr": 1.1015215150765295e-05} +{"train_loss": 0.0007009078399278224, "global_step": 56130, "epoch": 471, "lr": 1.1013827928580456e-05} +{"train_loss": 0.0004988962318748236, "global_step": 56131, "epoch": 471, "lr": 1.1012440782940792e-05} +{"train_loss": 0.0003170706331729889, "global_step": 56132, "epoch": 471, "lr": 1.1011053713849046e-05} +{"train_loss": 0.0003826880711130798, "global_step": 56133, "epoch": 471, "lr": 1.1009666721307916e-05} +{"train_loss": 0.0004108759167138487, "global_step": 56134, "epoch": 471, "lr": 1.1008279805320154e-05} +{"train_loss": 0.000526446383446455, "global_step": 56135, "epoch": 471, "lr": 1.1006892965888454e-05} +{"train_loss": 0.0006083279731683433, "global_step": 56136, "epoch": 471, "lr": 1.1005506203015569e-05} +{"train_loss": 0.00036192400148138404, "global_step": 56137, "epoch": 471, "lr": 1.1004119516704198e-05} +{"train_loss": 0.0004050099814776331, "global_step": 56138, "epoch": 471, "lr": 1.100273290695708e-05} +{"train_loss": 0.0006624733796343207, "global_step": 56139, "epoch": 471, "lr": 1.1001346373776917e-05} +{"train_loss": 0.0004857430176343769, "global_step": 56140, "epoch": 471, "lr": 1.0999959917166458e-05} +{"train_loss": 0.0005024158162996173, "global_step": 56141, "epoch": 471, "lr": 1.0998573537128398e-05} +{"train_loss": 0.0007217045640572906, "global_step": 56142, "epoch": 471, "lr": 1.0997187233665485e-05} +{"train_loss": 0.000278701598290354, "global_step": 56143, "epoch": 471, "lr": 1.0995801006780431e-05} +{"train_loss": 0.0006816365057602525, "global_step": 56144, "epoch": 471, "lr": 1.0994414856475937e-05} +{"train_loss": 0.0008311906130984426, "global_step": 56145, "epoch": 471, "lr": 1.099302878275476e-05} +{"train_loss": 0.0004798051086254418, "global_step": 56146, "epoch": 471, "lr": 1.0991642785619587e-05} +{"train_loss": 0.0002638925507199019, "global_step": 56147, "epoch": 471, "lr": 1.0990256865073167e-05} +{"train_loss": 0.0002976176328957081, "global_step": 56148, "epoch": 471, "lr": 1.0988871021118201e-05} +{"train_loss": 0.0004581448738463223, "global_step": 56149, "epoch": 471, "lr": 1.0987485253757434e-05} +{"train_loss": 0.00024851562920957804, "global_step": 56150, "epoch": 471, "lr": 1.0986099562993568e-05} +{"train_loss": 0.00029390479903668165, "global_step": 56151, "epoch": 471, "lr": 1.0984713948829312e-05} +{"train_loss": 0.0005116197280585766, "global_step": 56152, "epoch": 471, "lr": 1.0983328411267419e-05} +{"train_loss": 0.000715268834028393, "global_step": 56153, "epoch": 471, "lr": 1.098194295031058e-05} +{"train_loss": 0.0005609630607068539, "global_step": 56154, "epoch": 471, "lr": 1.098055756596154e-05} +{"train_loss": 0.0004573616315610707, "global_step": 56155, "epoch": 471, "lr": 1.0979172258222991e-05} +{"train_loss": 0.00037211953895166516, "global_step": 56156, "epoch": 471, "lr": 1.0977787027097686e-05} +{"train_loss": 0.000586429494433105, "global_step": 56157, "epoch": 471, "lr": 1.0976401872588326e-05} +{"train_loss": 0.0003526451764628291, "global_step": 56158, "epoch": 471, "lr": 1.0975016794697612e-05} +{"train_loss": 0.0007491519791074097, "global_step": 56159, "epoch": 471, "lr": 1.0973631793428307e-05} +{"train_loss": 0.00045634349226020277, "global_step": 56160, "epoch": 471, "lr": 1.0972246868783087e-05} +{"train_loss": 0.000988179468549788, "global_step": 56161, "epoch": 471, "lr": 1.0970862020764706e-05} +{"train_loss": 0.0003566398227121681, "global_step": 56162, "epoch": 471, "lr": 1.0969477249375864e-05} +{"train_loss": 0.0004830769612453878, "global_step": 56163, "epoch": 471, "lr": 1.0968092554619275e-05} +{"train_loss": 0.0005497948150150478, "global_step": 56164, "epoch": 471, "lr": 1.0966707936497667e-05} +{"train_loss": 0.0005086506716907024, "global_step": 56165, "epoch": 471, "lr": 1.0965323395013765e-05} +{"train_loss": 0.000529762648511678, "global_step": 56166, "epoch": 471, "lr": 1.096393893017027e-05} +{"train_loss": 0.0005511279796796045, "global_step": 56167, "epoch": 471, "lr": 1.0962554541969926e-05, "val_loss": 0.014223428443074226} +{"train_loss": 0.00033040737616829574, "global_step": 56168, "epoch": 472, "lr": 1.0961170230415424e-05} +{"train_loss": 0.00040344189619645476, "global_step": 56169, "epoch": 472, "lr": 1.0959785995509502e-05} +{"train_loss": 0.0005679462337866426, "global_step": 56170, "epoch": 472, "lr": 1.0958401837254856e-05} +{"train_loss": 0.00035084414412267506, "global_step": 56171, "epoch": 472, "lr": 1.0957017755654237e-05} +{"train_loss": 0.0006516650901176035, "global_step": 56172, "epoch": 472, "lr": 1.095563375071032e-05} +{"train_loss": 0.00040048747905530035, "global_step": 56173, "epoch": 472, "lr": 1.0954249822425866e-05} +{"train_loss": 0.00033162516774609685, "global_step": 56174, "epoch": 472, "lr": 1.0952865970803566e-05} +{"train_loss": 0.0010791325476020575, "global_step": 56175, "epoch": 472, "lr": 1.095148219584613e-05} +{"train_loss": 0.000753720523789525, "global_step": 56176, "epoch": 472, "lr": 1.0950098497556304e-05} +{"train_loss": 0.0003697829379234463, "global_step": 56177, "epoch": 472, "lr": 1.0948714875936767e-05} +{"train_loss": 0.000726120313629508, "global_step": 56178, "epoch": 472, "lr": 1.0947331330990273e-05} +{"train_loss": 0.00030208611860871315, "global_step": 56179, "epoch": 472, "lr": 1.0945947862719513e-05} +{"train_loss": 0.0011057534720748663, "global_step": 56180, "epoch": 472, "lr": 1.0944564471127222e-05} +{"train_loss": 0.00047863091458566487, "global_step": 56181, "epoch": 472, "lr": 1.0943181156216103e-05} +{"train_loss": 0.0003168783150613308, "global_step": 56182, "epoch": 472, "lr": 1.0941797917988866e-05} +{"train_loss": 0.0006224788958206773, "global_step": 56183, "epoch": 472, "lr": 1.0940414756448247e-05} +{"train_loss": 0.0004222621500957757, "global_step": 56184, "epoch": 472, "lr": 1.0939031671596938e-05} +{"train_loss": 0.0007366338977590203, "global_step": 56185, "epoch": 472, "lr": 1.0937648663437683e-05} +{"train_loss": 0.0005054975626990199, "global_step": 56186, "epoch": 472, "lr": 1.0936265731973167e-05} +{"train_loss": 0.0004036584577988833, "global_step": 56187, "epoch": 472, "lr": 1.0934882877206131e-05} +{"train_loss": 0.00030148494988679886, "global_step": 56188, "epoch": 472, "lr": 1.0933500099139282e-05} +{"train_loss": 0.0003855035756714642, "global_step": 56189, "epoch": 472, "lr": 1.0932117397775315e-05} +{"train_loss": 0.00047081545926630497, "global_step": 56190, "epoch": 472, "lr": 1.093073477311698e-05} +{"train_loss": 0.0005323258228600025, "global_step": 56191, "epoch": 472, "lr": 1.0929352225166956e-05} +{"train_loss": 0.00042511551873758435, "global_step": 56192, "epoch": 472, "lr": 1.0927969753927992e-05} +{"train_loss": 0.0005064783617854118, "global_step": 56193, "epoch": 472, "lr": 1.0926587359402779e-05} +{"train_loss": 0.0006415066309273243, "global_step": 56194, "epoch": 472, "lr": 1.0925205041594028e-05} +{"train_loss": 0.0007690985803492367, "global_step": 56195, "epoch": 472, "lr": 1.092382280050448e-05} +{"train_loss": 0.0006437062402255833, "global_step": 56196, "epoch": 472, "lr": 1.092244063613681e-05} +{"train_loss": 0.0011291385162621737, "global_step": 56197, "epoch": 472, "lr": 1.0921058548493767e-05} +{"train_loss": 0.00037291826447471976, "global_step": 56198, "epoch": 472, "lr": 1.0919676537578045e-05} +{"train_loss": 0.00024066267360467464, "global_step": 56199, "epoch": 472, "lr": 1.091829460339237e-05} +{"train_loss": 0.00031729962211102247, "global_step": 56200, "epoch": 472, "lr": 1.0916912745939434e-05} +{"train_loss": 0.0003484200278762728, "global_step": 56201, "epoch": 472, "lr": 1.0915530965221964e-05} +{"train_loss": 0.0007741085137240589, "global_step": 56202, "epoch": 472, "lr": 1.091414926124269e-05} +{"train_loss": 0.00033299095230177045, "global_step": 56203, "epoch": 472, "lr": 1.0912767634004295e-05} +{"train_loss": 0.00034195181797258556, "global_step": 56204, "epoch": 472, "lr": 1.0911386083509517e-05} +{"train_loss": 0.0004838001332245767, "global_step": 56205, "epoch": 472, "lr": 1.0910004609761043e-05} +{"train_loss": 0.0006974946591071784, "global_step": 56206, "epoch": 472, "lr": 1.0908623212761616e-05} +{"train_loss": 0.000846287002786994, "global_step": 56207, "epoch": 472, "lr": 1.0907241892513926e-05} +{"train_loss": 0.00038850033888593316, "global_step": 56208, "epoch": 472, "lr": 1.0905860649020677e-05} +{"train_loss": 0.0009833858348429203, "global_step": 56209, "epoch": 472, "lr": 1.0904479482284607e-05} +{"train_loss": 0.0006199629860930145, "global_step": 56210, "epoch": 472, "lr": 1.0903098392308402e-05} +{"train_loss": 0.000686005805619061, "global_step": 56211, "epoch": 472, "lr": 1.0901717379094806e-05} +{"train_loss": 0.0006257460336200893, "global_step": 56212, "epoch": 472, "lr": 1.0900336442646502e-05} +{"train_loss": 0.0005192077369429171, "global_step": 56213, "epoch": 472, "lr": 1.0898955582966203e-05} +{"train_loss": 0.000911132781766355, "global_step": 56214, "epoch": 472, "lr": 1.0897574800056637e-05} +{"train_loss": 0.00046389721683226526, "global_step": 56215, "epoch": 472, "lr": 1.0896194093920491e-05} +{"train_loss": 0.00025127670960500836, "global_step": 56216, "epoch": 472, "lr": 1.089481346456051e-05} +{"train_loss": 0.0007040700293146074, "global_step": 56217, "epoch": 472, "lr": 1.0893432911979367e-05} +{"train_loss": 0.0003551252302713692, "global_step": 56218, "epoch": 472, "lr": 1.0892052436179807e-05} +{"train_loss": 0.0004930610884912312, "global_step": 56219, "epoch": 472, "lr": 1.0890672037164518e-05} +{"train_loss": 0.000578461040277034, "global_step": 56220, "epoch": 472, "lr": 1.0889291714936205e-05} +{"train_loss": 0.002345526125282049, "global_step": 56221, "epoch": 472, "lr": 1.0887911469497608e-05} +{"train_loss": 0.00026759441243484616, "global_step": 56222, "epoch": 472, "lr": 1.08865313008514e-05} +{"train_loss": 0.0005747979739680886, "global_step": 56223, "epoch": 472, "lr": 1.0885151209000321e-05} +{"train_loss": 0.00046188320266082883, "global_step": 56224, "epoch": 472, "lr": 1.0883771193947061e-05} +{"train_loss": 0.0006996000302024186, "global_step": 56225, "epoch": 472, "lr": 1.0882391255694347e-05} +{"train_loss": 0.0010882248170673847, "global_step": 56226, "epoch": 472, "lr": 1.0881011394244878e-05} +{"train_loss": 0.00034958592732436955, "global_step": 56227, "epoch": 472, "lr": 1.0879631609601353e-05} +{"train_loss": 0.0008625421905890107, "global_step": 56228, "epoch": 472, "lr": 1.0878251901766507e-05} +{"train_loss": 0.0003892173117492348, "global_step": 56229, "epoch": 472, "lr": 1.0876872270743015e-05} +{"train_loss": 0.0008105285814963281, "global_step": 56230, "epoch": 472, "lr": 1.087549271653362e-05} +{"train_loss": 0.0007738632848486304, "global_step": 56231, "epoch": 472, "lr": 1.0874113239141003e-05} +{"train_loss": 0.0005740480846725404, "global_step": 56232, "epoch": 472, "lr": 1.08727338385679e-05} +{"train_loss": 0.0005308444378897548, "global_step": 56233, "epoch": 472, "lr": 1.087135451481699e-05} +{"train_loss": 0.0005049222963862121, "global_step": 56234, "epoch": 472, "lr": 1.0869975267891003e-05} +{"train_loss": 0.0004024775407742709, "global_step": 56235, "epoch": 472, "lr": 1.0868596097792627e-05} +{"train_loss": 0.0005592738161794841, "global_step": 56236, "epoch": 472, "lr": 1.0867217004524589e-05} +{"train_loss": 0.0003385331074241549, "global_step": 56237, "epoch": 472, "lr": 1.0865837988089594e-05} +{"train_loss": 0.0005734341102652252, "global_step": 56238, "epoch": 472, "lr": 1.086445904849035e-05} +{"train_loss": 0.00044525362318381667, "global_step": 56239, "epoch": 472, "lr": 1.0863080185729546e-05} +{"train_loss": 0.0003212289302609861, "global_step": 56240, "epoch": 472, "lr": 1.086170139980992e-05} +{"train_loss": 0.0008417500066570938, "global_step": 56241, "epoch": 472, "lr": 1.0860322690734142e-05} +{"train_loss": 0.000677828153129667, "global_step": 56242, "epoch": 472, "lr": 1.0858944058504954e-05} +{"train_loss": 0.00047938668285496533, "global_step": 56243, "epoch": 472, "lr": 1.085756550312505e-05} +{"train_loss": 0.00026082407566718757, "global_step": 56244, "epoch": 472, "lr": 1.0856187024597119e-05} +{"train_loss": 0.000487014971440658, "global_step": 56245, "epoch": 472, "lr": 1.0854808622923901e-05} +{"train_loss": 0.0005758226034231484, "global_step": 56246, "epoch": 472, "lr": 1.0853430298108064e-05} +{"train_loss": 0.0006562705966643989, "global_step": 56247, "epoch": 472, "lr": 1.0852052050152351e-05} +{"train_loss": 0.0003873234672937542, "global_step": 56248, "epoch": 472, "lr": 1.0850673879059436e-05} +{"train_loss": 0.0008463398553431034, "global_step": 56249, "epoch": 472, "lr": 1.0849295784832058e-05} +{"train_loss": 0.0004169480234850198, "global_step": 56250, "epoch": 472, "lr": 1.0847917767472904e-05} +{"train_loss": 0.0006105939974077046, "global_step": 56251, "epoch": 472, "lr": 1.0846539826984664e-05} +{"train_loss": 0.0007006924133747816, "global_step": 56252, "epoch": 472, "lr": 1.0845161963370076e-05} +{"train_loss": 0.000469917751615867, "global_step": 56253, "epoch": 472, "lr": 1.0843784176631817e-05} +{"train_loss": 0.0005441762041300535, "global_step": 56254, "epoch": 472, "lr": 1.0842406466772614e-05} +{"train_loss": 0.000594630662817508, "global_step": 56255, "epoch": 472, "lr": 1.0841028833795152e-05} +{"train_loss": 0.0004990879679098725, "global_step": 56256, "epoch": 472, "lr": 1.0839651277702162e-05} +{"train_loss": 0.0005820455844514072, "global_step": 56257, "epoch": 472, "lr": 1.0838273798496328e-05} +{"train_loss": 0.0005221200990490615, "global_step": 56258, "epoch": 472, "lr": 1.0836896396180352e-05} +{"train_loss": 0.00043658973299898207, "global_step": 56259, "epoch": 472, "lr": 1.0835519070756955e-05} +{"train_loss": 0.000386598811019212, "global_step": 56260, "epoch": 472, "lr": 1.0834141822228816e-05} +{"train_loss": 0.0011088282335549593, "global_step": 56261, "epoch": 472, "lr": 1.0832764650598675e-05} +{"train_loss": 0.00046846899203956127, "global_step": 56262, "epoch": 472, "lr": 1.0831387555869199e-05} +{"train_loss": 0.0006719474913552403, "global_step": 56263, "epoch": 472, "lr": 1.0830010538043123e-05} +{"train_loss": 0.0005514426156878471, "global_step": 56264, "epoch": 472, "lr": 1.0828633597123129e-05} +{"train_loss": 0.0006584235816262662, "global_step": 56265, "epoch": 472, "lr": 1.0827256733111934e-05} +{"train_loss": 0.00018568956875242293, "global_step": 56266, "epoch": 472, "lr": 1.0825879946012223e-05} +{"train_loss": 0.000523855909705162, "global_step": 56267, "epoch": 472, "lr": 1.0824503235826728e-05} +{"train_loss": 0.00076087232446298, "global_step": 56268, "epoch": 472, "lr": 1.082312660255812e-05} +{"train_loss": 0.0011862004175782204, "global_step": 56269, "epoch": 472, "lr": 1.0821750046209129e-05} +{"train_loss": 0.0004781438910868019, "global_step": 56270, "epoch": 472, "lr": 1.0820373566782437e-05} +{"train_loss": 0.0003012816596310586, "global_step": 56271, "epoch": 472, "lr": 1.0818997164280764e-05} +{"train_loss": 0.0005242625484243035, "global_step": 56272, "epoch": 472, "lr": 1.0817620838706799e-05} +{"train_loss": 0.0007597070070914924, "global_step": 56273, "epoch": 472, "lr": 1.0816244590063256e-05} +{"train_loss": 0.0002750447019934654, "global_step": 56274, "epoch": 472, "lr": 1.081486841835282e-05} +{"train_loss": 0.00048162657185457647, "global_step": 56275, "epoch": 472, "lr": 1.0813492323578218e-05} +{"train_loss": 0.0007232975913211703, "global_step": 56276, "epoch": 472, "lr": 1.081211630574213e-05} +{"train_loss": 0.0007096192566677928, "global_step": 56277, "epoch": 472, "lr": 1.081074036484726e-05} +{"train_loss": 0.0003336141526233405, "global_step": 56278, "epoch": 472, "lr": 1.0809364500896323e-05} +{"train_loss": 0.0004427307576406747, "global_step": 56279, "epoch": 472, "lr": 1.0807988713892003e-05} +{"train_loss": 0.0002778292109724134, "global_step": 56280, "epoch": 472, "lr": 1.0806613003837018e-05} +{"train_loss": 0.00039291588473133743, "global_step": 56281, "epoch": 472, "lr": 1.0805237370734067e-05} +{"train_loss": 0.0004405112413223833, "global_step": 56282, "epoch": 472, "lr": 1.080386181458583e-05} +{"train_loss": 0.0009571004775352776, "global_step": 56283, "epoch": 472, "lr": 1.0802486335395034e-05} +{"train_loss": 0.0005438584485091269, "global_step": 56284, "epoch": 472, "lr": 1.0801110933164354e-05} +{"train_loss": 0.0007347735809162259, "global_step": 56285, "epoch": 472, "lr": 1.0799735607896522e-05} +{"train_loss": 0.0005722813404354995, "global_step": 56286, "epoch": 472, "lr": 1.0798360359594206e-05, "val_loss": 0.014803363010287285} +{"train_loss": 0.0008517933893017471, "global_step": 56287, "epoch": 473, "lr": 1.0796985188260134e-05} +{"train_loss": 0.000469610677100718, "global_step": 56288, "epoch": 473, "lr": 1.0795610093896997e-05} +{"train_loss": 0.0005104432348161936, "global_step": 56289, "epoch": 473, "lr": 1.0794235076507475e-05} +{"train_loss": 0.0009110535611398518, "global_step": 56290, "epoch": 473, "lr": 1.0792860136094297e-05} +{"train_loss": 0.00029392726719379425, "global_step": 56291, "epoch": 473, "lr": 1.0791485272660135e-05} +{"train_loss": 0.0005860186647623777, "global_step": 56292, "epoch": 473, "lr": 1.0790110486207723e-05} +{"train_loss": 0.00044929844443686306, "global_step": 56293, "epoch": 473, "lr": 1.0788735776739734e-05} +{"train_loss": 0.00043780499254353344, "global_step": 56294, "epoch": 473, "lr": 1.0787361144258857e-05} +{"train_loss": 0.0003590706910472363, "global_step": 56295, "epoch": 473, "lr": 1.0785986588767828e-05} +{"train_loss": 0.0005756523460149765, "global_step": 56296, "epoch": 473, "lr": 1.0784612110269305e-05} +{"train_loss": 0.0003294298949185759, "global_step": 56297, "epoch": 473, "lr": 1.0783237708766008e-05} +{"train_loss": 0.00041518156649544835, "global_step": 56298, "epoch": 473, "lr": 1.0781863384260648e-05} +{"train_loss": 0.0004942028317600489, "global_step": 56299, "epoch": 473, "lr": 1.07804891367559e-05} +{"train_loss": 0.0004784560587722808, "global_step": 56300, "epoch": 473, "lr": 1.0779114966254483e-05} +{"train_loss": 0.0005987938493490219, "global_step": 56301, "epoch": 473, "lr": 1.0777740872759067e-05} +{"train_loss": 0.00044448947301134467, "global_step": 56302, "epoch": 473, "lr": 1.0776366856272385e-05} +{"train_loss": 0.0005195540143176913, "global_step": 56303, "epoch": 473, "lr": 1.0774992916797099e-05} +{"train_loss": 0.00042086909525096416, "global_step": 56304, "epoch": 473, "lr": 1.0773619054335937e-05} +{"train_loss": 0.00031913857674226165, "global_step": 56305, "epoch": 473, "lr": 1.0772245268891568e-05} +{"train_loss": 0.0009290285524912179, "global_step": 56306, "epoch": 473, "lr": 1.0770871560466722e-05} +{"train_loss": 0.00021724423277191818, "global_step": 56307, "epoch": 473, "lr": 1.0769497929064083e-05} +{"train_loss": 0.0003993007121607661, "global_step": 56308, "epoch": 473, "lr": 1.0768124374686322e-05} +{"train_loss": 0.0009107744554057717, "global_step": 56309, "epoch": 473, "lr": 1.0766750897336176e-05} +{"train_loss": 0.0002991580404341221, "global_step": 56310, "epoch": 473, "lr": 1.0765377497016305e-05} +{"train_loss": 0.00032327297958545387, "global_step": 56311, "epoch": 473, "lr": 1.0764004173729436e-05} +{"train_loss": 0.0006251814775168896, "global_step": 56312, "epoch": 473, "lr": 1.0762630927478256e-05} +{"train_loss": 0.0001671978534432128, "global_step": 56313, "epoch": 473, "lr": 1.0761257758265447e-05} +{"train_loss": 0.0004303922178223729, "global_step": 56314, "epoch": 473, "lr": 1.0759884666093728e-05} +{"train_loss": 0.0009338559466414154, "global_step": 56315, "epoch": 473, "lr": 1.0758511650965774e-05} +{"train_loss": 0.0009733128827065229, "global_step": 56316, "epoch": 473, "lr": 1.0757138712884295e-05} +{"train_loss": 0.0005432709003798664, "global_step": 56317, "epoch": 473, "lr": 1.0755765851851974e-05} +{"train_loss": 0.00040039795567281544, "global_step": 56318, "epoch": 473, "lr": 1.0754393067871526e-05} +{"train_loss": 0.0004383190826047212, "global_step": 56319, "epoch": 473, "lr": 1.0753020360945636e-05} +{"train_loss": 0.0003150511474814266, "global_step": 56320, "epoch": 473, "lr": 1.0751647731076985e-05} +{"train_loss": 0.00042217253940179944, "global_step": 56321, "epoch": 473, "lr": 1.0750275178268293e-05} +{"train_loss": 0.0009135880973190069, "global_step": 56322, "epoch": 473, "lr": 1.0748902702522223e-05} +{"train_loss": 0.0007062951335683465, "global_step": 56323, "epoch": 473, "lr": 1.0747530303841508e-05} +{"train_loss": 0.0006421388243325055, "global_step": 56324, "epoch": 473, "lr": 1.074615798222881e-05} +{"train_loss": 0.0005169968353584409, "global_step": 56325, "epoch": 473, "lr": 1.0744785737686852e-05} +{"train_loss": 0.0006453496171161532, "global_step": 56326, "epoch": 473, "lr": 1.0743413570218313e-05} +{"train_loss": 0.00032662751618772745, "global_step": 56327, "epoch": 473, "lr": 1.074204147982587e-05} +{"train_loss": 0.000553568359464407, "global_step": 56328, "epoch": 473, "lr": 1.0740669466512255e-05} +{"train_loss": 0.0005279528559185565, "global_step": 56329, "epoch": 473, "lr": 1.0739297530280124e-05} +{"train_loss": 0.0009193624136969447, "global_step": 56330, "epoch": 473, "lr": 1.0737925671132198e-05} +{"train_loss": 0.00037542072823271155, "global_step": 56331, "epoch": 473, "lr": 1.073655388907115e-05} +{"train_loss": 0.0006741790566593409, "global_step": 56332, "epoch": 473, "lr": 1.0735182184099685e-05} +{"train_loss": 0.0006817009998485446, "global_step": 56333, "epoch": 473, "lr": 1.0733810556220508e-05} +{"train_loss": 0.000514747342094779, "global_step": 56334, "epoch": 473, "lr": 1.0732439005436284e-05} +{"train_loss": 0.0009326605941168964, "global_step": 56335, "epoch": 473, "lr": 1.0731067531749733e-05} +{"train_loss": 0.0007798040169291198, "global_step": 56336, "epoch": 473, "lr": 1.0729696135163525e-05} +{"train_loss": 0.0006615036982111633, "global_step": 56337, "epoch": 473, "lr": 1.072832481568038e-05} +{"train_loss": 0.0005045164143666625, "global_step": 56338, "epoch": 473, "lr": 1.0726953573302967e-05} +{"train_loss": 0.00080535386223346, "global_step": 56339, "epoch": 473, "lr": 1.0725582408033974e-05} +{"train_loss": 0.00040140055352821946, "global_step": 56340, "epoch": 473, "lr": 1.0724211319876116e-05} +{"train_loss": 0.0006031793891452253, "global_step": 56341, "epoch": 473, "lr": 1.0722840308832061e-05} +{"train_loss": 0.0004484368837438524, "global_step": 56342, "epoch": 473, "lr": 1.072146937490453e-05} +{"train_loss": 0.0006834278465248644, "global_step": 56343, "epoch": 473, "lr": 1.0720098518096178e-05} +{"train_loss": 0.0006458120769821107, "global_step": 56344, "epoch": 473, "lr": 1.0718727738409734e-05} +{"train_loss": 0.00038577604573220015, "global_step": 56345, "epoch": 473, "lr": 1.071735703584787e-05} +{"train_loss": 0.0005596153205260634, "global_step": 56346, "epoch": 473, "lr": 1.0715986410413264e-05} +{"train_loss": 0.0008018076769076288, "global_step": 56347, "epoch": 473, "lr": 1.0714615862108635e-05} +{"train_loss": 0.0004651793569792062, "global_step": 56348, "epoch": 473, "lr": 1.071324539093665e-05} +{"train_loss": 0.0006929121445864439, "global_step": 56349, "epoch": 473, "lr": 1.0711874996900024e-05} +{"train_loss": 0.0013760861475020647, "global_step": 56350, "epoch": 473, "lr": 1.0710504680001433e-05} +{"train_loss": 0.0003369374026078731, "global_step": 56351, "epoch": 473, "lr": 1.0709134440243557e-05} +{"train_loss": 0.0006961325416341424, "global_step": 56352, "epoch": 473, "lr": 1.0707764277629107e-05} +{"train_loss": 0.0005176585400477052, "global_step": 56353, "epoch": 473, "lr": 1.070639419216075e-05} +{"train_loss": 0.0007245684391818941, "global_step": 56354, "epoch": 473, "lr": 1.070502418384121e-05} +{"train_loss": 0.0005133769591338933, "global_step": 56355, "epoch": 473, "lr": 1.070365425267314e-05} +{"train_loss": 0.000626254070084542, "global_step": 56356, "epoch": 473, "lr": 1.0702284398659257e-05} +{"train_loss": 0.0006468199426308274, "global_step": 56357, "epoch": 473, "lr": 1.0700914621802244e-05} +{"train_loss": 0.00043568044202402234, "global_step": 56358, "epoch": 473, "lr": 1.0699544922104776e-05} +{"train_loss": 0.000424367404775694, "global_step": 56359, "epoch": 473, "lr": 1.0698175299569563e-05} +{"train_loss": 0.0006016449187882245, "global_step": 56360, "epoch": 473, "lr": 1.0696805754199269e-05} +{"train_loss": 0.0004411684349179268, "global_step": 56361, "epoch": 473, "lr": 1.0695436285996613e-05} +{"train_loss": 0.0008486479055136442, "global_step": 56362, "epoch": 473, "lr": 1.0694066894964255e-05} +{"train_loss": 0.0004366788489278406, "global_step": 56363, "epoch": 473, "lr": 1.069269758110491e-05} +{"train_loss": 0.0007847599918022752, "global_step": 56364, "epoch": 473, "lr": 1.0691328344421242e-05} +{"train_loss": 0.00041760929161682725, "global_step": 56365, "epoch": 473, "lr": 1.0689959184915965e-05} +{"train_loss": 0.0008346464019268751, "global_step": 56366, "epoch": 473, "lr": 1.0688590102591738e-05} +{"train_loss": 0.000924510124605149, "global_step": 56367, "epoch": 473, "lr": 1.0687221097451267e-05} +{"train_loss": 0.0008996197138912976, "global_step": 56368, "epoch": 473, "lr": 1.0685852169497252e-05} +{"train_loss": 0.0006031615776009858, "global_step": 56369, "epoch": 473, "lr": 1.0684483318732363e-05} +{"train_loss": 0.00032539787935093045, "global_step": 56370, "epoch": 473, "lr": 1.0683114545159278e-05} +{"train_loss": 0.0008499702671542764, "global_step": 56371, "epoch": 473, "lr": 1.0681745848780711e-05} +{"train_loss": 0.0007174730417318642, "global_step": 56372, "epoch": 473, "lr": 1.068037722959932e-05} +{"train_loss": 0.0010894228471443057, "global_step": 56373, "epoch": 473, "lr": 1.0679008687617825e-05} +{"train_loss": 0.0003696736239362508, "global_step": 56374, "epoch": 473, "lr": 1.0677640222838875e-05} +{"train_loss": 0.0015154548455029726, "global_step": 56375, "epoch": 473, "lr": 1.06762718352652e-05} +{"train_loss": 0.00035553460475057364, "global_step": 56376, "epoch": 473, "lr": 1.067490352489946e-05} +{"train_loss": 0.0013964633690193295, "global_step": 56377, "epoch": 473, "lr": 1.067353529174433e-05} +{"train_loss": 0.0004911663709208369, "global_step": 56378, "epoch": 473, "lr": 1.067216713580253e-05} +{"train_loss": 0.0005298100295476615, "global_step": 56379, "epoch": 473, "lr": 1.0670799057076714e-05} +{"train_loss": 0.0010751407826319337, "global_step": 56380, "epoch": 473, "lr": 1.066943105556959e-05} +{"train_loss": 0.000364469742635265, "global_step": 56381, "epoch": 473, "lr": 1.0668063131283845e-05} +{"train_loss": 0.0006479599978774786, "global_step": 56382, "epoch": 473, "lr": 1.066669528422214e-05} +{"train_loss": 0.0007442424539476633, "global_step": 56383, "epoch": 473, "lr": 1.0665327514387186e-05} +{"train_loss": 0.0004957881756126881, "global_step": 56384, "epoch": 473, "lr": 1.066395982178165e-05} +{"train_loss": 0.0008292814018204808, "global_step": 56385, "epoch": 473, "lr": 1.0662592206408234e-05} +{"train_loss": 0.0002574085083324462, "global_step": 56386, "epoch": 473, "lr": 1.066122466826961e-05} +{"train_loss": 0.00044212426291778684, "global_step": 56387, "epoch": 473, "lr": 1.0659857207368473e-05} +{"train_loss": 0.000708282517734915, "global_step": 56388, "epoch": 473, "lr": 1.0658489823707513e-05} +{"train_loss": 0.00045204465277493, "global_step": 56389, "epoch": 473, "lr": 1.0657122517289386e-05} +{"train_loss": 0.0010668080067262053, "global_step": 56390, "epoch": 473, "lr": 1.065575528811681e-05} +{"train_loss": 0.0005356292240321636, "global_step": 56391, "epoch": 473, "lr": 1.0654388136192445e-05} +{"train_loss": 0.000742954493034631, "global_step": 56392, "epoch": 473, "lr": 1.0653021061518997e-05} +{"train_loss": 0.0007582263788208365, "global_step": 56393, "epoch": 473, "lr": 1.0651654064099121e-05} +{"train_loss": 0.0004698095144703984, "global_step": 56394, "epoch": 473, "lr": 1.065028714393554e-05} +{"train_loss": 0.0003279810189269483, "global_step": 56395, "epoch": 473, "lr": 1.0648920301030895e-05} +{"train_loss": 0.00029744900530204177, "global_step": 56396, "epoch": 473, "lr": 1.0647553535387906e-05} +{"train_loss": 0.0006220837240107358, "global_step": 56397, "epoch": 473, "lr": 1.0646186847009232e-05} +{"train_loss": 0.0009059850708581507, "global_step": 56398, "epoch": 473, "lr": 1.0644820235897573e-05} +{"train_loss": 0.0007466612732969224, "global_step": 56399, "epoch": 473, "lr": 1.06434537020556e-05} +{"train_loss": 0.0005560555146075785, "global_step": 56400, "epoch": 473, "lr": 1.064208724548601e-05} +{"train_loss": 0.000329971662722528, "global_step": 56401, "epoch": 473, "lr": 1.0640720866191461e-05} +{"train_loss": 0.000947978813201189, "global_step": 56402, "epoch": 473, "lr": 1.063935456417467e-05} +{"train_loss": 0.0004358768055681139, "global_step": 56403, "epoch": 473, "lr": 1.0637988339438282e-05} +{"train_loss": 0.0005319967167451978, "global_step": 56404, "epoch": 473, "lr": 1.0636622191985018e-05} +{"train_loss": 0.0006045598656324545, "global_step": 56405, "epoch": 473, "lr": 1.0635256121817521e-05, "val_loss": 0.03673617169260979} +{"train_loss": 0.0004677026881836355, "global_step": 56406, "epoch": 474, "lr": 1.0633890128938512e-05} +{"train_loss": 0.0007033927249722183, "global_step": 56407, "epoch": 474, "lr": 1.0632524213350653e-05} +{"train_loss": 0.0006665100809186697, "global_step": 56408, "epoch": 474, "lr": 1.0631158375056615e-05} +{"train_loss": 0.0005106834578327835, "global_step": 56409, "epoch": 474, "lr": 1.0629792614059103e-05} +{"train_loss": 0.0009645443642511964, "global_step": 56410, "epoch": 474, "lr": 1.0628426930360775e-05} +{"train_loss": 0.00026925737620331347, "global_step": 56411, "epoch": 474, "lr": 1.0627061323964332e-05} +{"train_loss": 0.0007033789879642427, "global_step": 56412, "epoch": 474, "lr": 1.0625695794872442e-05} +{"train_loss": 0.0005968619370833039, "global_step": 56413, "epoch": 474, "lr": 1.0624330343087801e-05} +{"train_loss": 0.0012379416730254889, "global_step": 56414, "epoch": 474, "lr": 1.0622964968613081e-05} +{"train_loss": 0.0006367524620145559, "global_step": 56415, "epoch": 474, "lr": 1.062159967145095e-05} +{"train_loss": 0.0003473558172117919, "global_step": 56416, "epoch": 474, "lr": 1.0620234451604117e-05} +{"train_loss": 0.00042928734910674393, "global_step": 56417, "epoch": 474, "lr": 1.061886930907523e-05} +{"train_loss": 0.0003695514751598239, "global_step": 56418, "epoch": 474, "lr": 1.0617504243867e-05} +{"train_loss": 0.0006363571737892926, "global_step": 56419, "epoch": 474, "lr": 1.0616139255982095e-05} +{"train_loss": 0.0002436634968034923, "global_step": 56420, "epoch": 474, "lr": 1.0614774345423173e-05} +{"train_loss": 0.0009306062711402774, "global_step": 56421, "epoch": 474, "lr": 1.0613409512192951e-05} +{"train_loss": 0.0006025602924637496, "global_step": 56422, "epoch": 474, "lr": 1.0612044756294082e-05} +{"train_loss": 0.0003877606359310448, "global_step": 56423, "epoch": 474, "lr": 1.0610680077729263e-05} +{"train_loss": 0.0003672807360999286, "global_step": 56424, "epoch": 474, "lr": 1.0609315476501159e-05} +{"train_loss": 0.00040228452417068183, "global_step": 56425, "epoch": 474, "lr": 1.060795095261246e-05} +{"train_loss": 0.0010522697120904922, "global_step": 56426, "epoch": 474, "lr": 1.0606586506065846e-05} +{"train_loss": 0.0004215714579913765, "global_step": 56427, "epoch": 474, "lr": 1.060522213686398e-05} +{"train_loss": 0.0007515012403018773, "global_step": 56428, "epoch": 474, "lr": 1.0603857845009563e-05} +{"train_loss": 0.0005917580565437675, "global_step": 56429, "epoch": 474, "lr": 1.0602493630505246e-05} +{"train_loss": 0.0003997329040430486, "global_step": 56430, "epoch": 474, "lr": 1.0601129493353724e-05} +{"train_loss": 0.000584480119869113, "global_step": 56431, "epoch": 474, "lr": 1.059976543355769e-05} +{"train_loss": 0.0005510060000233352, "global_step": 56432, "epoch": 474, "lr": 1.0598401451119794e-05} +{"train_loss": 0.0005799802020192146, "global_step": 56433, "epoch": 474, "lr": 1.0597037546042742e-05} +{"train_loss": 0.0012283101677894592, "global_step": 56434, "epoch": 474, "lr": 1.0595673718329185e-05} +{"train_loss": 0.00035369457327760756, "global_step": 56435, "epoch": 474, "lr": 1.0594309967981824e-05} +{"train_loss": 0.00040821224683895707, "global_step": 56436, "epoch": 474, "lr": 1.0592946295003309e-05} +{"train_loss": 0.0006538087036460638, "global_step": 56437, "epoch": 474, "lr": 1.0591582699396353e-05} +{"train_loss": 0.000610081129707396, "global_step": 56438, "epoch": 474, "lr": 1.0590219181163613e-05} +{"train_loss": 0.0004641075211111456, "global_step": 56439, "epoch": 474, "lr": 1.0588855740307751e-05} +{"train_loss": 0.0004282099544070661, "global_step": 56440, "epoch": 474, "lr": 1.0587492376831476e-05} +{"train_loss": 0.0005115896929055452, "global_step": 56441, "epoch": 474, "lr": 1.0586129090737435e-05} +{"train_loss": 0.0006620836793445051, "global_step": 56442, "epoch": 474, "lr": 1.058476588202833e-05} +{"train_loss": 0.0008950658375397325, "global_step": 56443, "epoch": 474, "lr": 1.0583402750706817e-05} +{"train_loss": 0.0004928300040774047, "global_step": 56444, "epoch": 474, "lr": 1.0582039696775592e-05} +{"train_loss": 0.0006804174627177417, "global_step": 56445, "epoch": 474, "lr": 1.058067672023732e-05} +{"train_loss": 0.0003219587670173496, "global_step": 56446, "epoch": 474, "lr": 1.0579313821094667e-05} +{"train_loss": 0.0006347480230033398, "global_step": 56447, "epoch": 474, "lr": 1.0577950999350333e-05} +{"train_loss": 0.0006153749418444932, "global_step": 56448, "epoch": 474, "lr": 1.057658825500697e-05} +{"train_loss": 0.0004156038339715451, "global_step": 56449, "epoch": 474, "lr": 1.0575225588067272e-05} +{"train_loss": 0.0008050542091950774, "global_step": 56450, "epoch": 474, "lr": 1.0573862998533907e-05} +{"train_loss": 0.0005036320653744042, "global_step": 56451, "epoch": 474, "lr": 1.0572500486409542e-05} +{"train_loss": 0.0004466223472263664, "global_step": 56452, "epoch": 474, "lr": 1.0571138051696865e-05} +{"train_loss": 0.000588916998822242, "global_step": 56453, "epoch": 474, "lr": 1.0569775694398542e-05} +{"train_loss": 0.000580282649025321, "global_step": 56454, "epoch": 474, "lr": 1.056841341451726e-05} +{"train_loss": 0.0006726637366227806, "global_step": 56455, "epoch": 474, "lr": 1.0567051212055673e-05} +{"train_loss": 0.0006381996208801866, "global_step": 56456, "epoch": 474, "lr": 1.0565689087016483e-05} +{"train_loss": 0.00041835816227830946, "global_step": 56457, "epoch": 474, "lr": 1.056432703940235e-05} +{"train_loss": 0.00023366724781226367, "global_step": 56458, "epoch": 474, "lr": 1.056296506921593e-05} +{"train_loss": 0.0005129650235176086, "global_step": 56459, "epoch": 474, "lr": 1.0561603176459933e-05} +{"train_loss": 0.0005214791744947433, "global_step": 56460, "epoch": 474, "lr": 1.0560241361136996e-05} +{"train_loss": 0.000654732168186456, "global_step": 56461, "epoch": 474, "lr": 1.0558879623249828e-05} +{"train_loss": 0.000631147064268589, "global_step": 56462, "epoch": 474, "lr": 1.0557517962801077e-05} +{"train_loss": 0.0005560917779803276, "global_step": 56463, "epoch": 474, "lr": 1.0556156379793436e-05} +{"train_loss": 0.0003836142423097044, "global_step": 56464, "epoch": 474, "lr": 1.0554794874229552e-05} +{"train_loss": 0.00040114487637765706, "global_step": 56465, "epoch": 474, "lr": 1.0553433446112116e-05} +{"train_loss": 0.00044148790766485035, "global_step": 56466, "epoch": 474, "lr": 1.055207209544381e-05} +{"train_loss": 0.0007454825681634247, "global_step": 56467, "epoch": 474, "lr": 1.0550710822227289e-05} +{"train_loss": 0.00044857527245767415, "global_step": 56468, "epoch": 474, "lr": 1.0549349626465237e-05} +{"train_loss": 0.0006623878725804389, "global_step": 56469, "epoch": 474, "lr": 1.0547988508160334e-05} +{"train_loss": 0.0005073340144008398, "global_step": 56470, "epoch": 474, "lr": 1.0546627467315218e-05} +{"train_loss": 0.0004562200920190662, "global_step": 56471, "epoch": 474, "lr": 1.05452665039326e-05} +{"train_loss": 0.0005465777940116823, "global_step": 56472, "epoch": 474, "lr": 1.0543905618015126e-05} +{"train_loss": 0.00039728492265567183, "global_step": 56473, "epoch": 474, "lr": 1.0542544809565485e-05} +{"train_loss": 0.0006014889222569764, "global_step": 56474, "epoch": 474, "lr": 1.0541184078586336e-05} +{"train_loss": 0.00044242350850254297, "global_step": 56475, "epoch": 474, "lr": 1.0539823425080364e-05} +{"train_loss": 0.0005792411393485963, "global_step": 56476, "epoch": 474, "lr": 1.0538462849050234e-05} +{"train_loss": 0.0004516859771683812, "global_step": 56477, "epoch": 474, "lr": 1.0537102350498607e-05} +{"train_loss": 0.0005568518536165357, "global_step": 56478, "epoch": 474, "lr": 1.0535741929428172e-05} +{"train_loss": 0.00032192078651860356, "global_step": 56479, "epoch": 474, "lr": 1.053438158584158e-05} +{"train_loss": 0.000383384816814214, "global_step": 56480, "epoch": 474, "lr": 1.0533021319741525e-05} +{"train_loss": 0.00037385051837190986, "global_step": 56481, "epoch": 474, "lr": 1.0531661131130671e-05} +{"train_loss": 0.000324650522088632, "global_step": 56482, "epoch": 474, "lr": 1.0530301020011668e-05} +{"train_loss": 0.0007428458775393665, "global_step": 56483, "epoch": 474, "lr": 1.0528940986387214e-05} +{"train_loss": 0.0006012049270793796, "global_step": 56484, "epoch": 474, "lr": 1.0527581030259953e-05} +{"train_loss": 0.00034397694980725646, "global_step": 56485, "epoch": 474, "lr": 1.0526221151632587e-05} +{"train_loss": 0.0010748447384685278, "global_step": 56486, "epoch": 474, "lr": 1.0524861350507753e-05} +{"train_loss": 0.0003199067141395062, "global_step": 56487, "epoch": 474, "lr": 1.0523501626888155e-05} +{"train_loss": 0.0007671479252167046, "global_step": 56488, "epoch": 474, "lr": 1.0522141980776435e-05} +{"train_loss": 0.0003199927741661668, "global_step": 56489, "epoch": 474, "lr": 1.0520782412175262e-05} +{"train_loss": 0.0005333420122042298, "global_step": 56490, "epoch": 474, "lr": 1.051942292108733e-05} +{"train_loss": 0.0006263386458158493, "global_step": 56491, "epoch": 474, "lr": 1.051806350751528e-05} +{"train_loss": 0.0006162681384012103, "global_step": 56492, "epoch": 474, "lr": 1.0516704171461805e-05} +{"train_loss": 0.0006271389429457486, "global_step": 56493, "epoch": 474, "lr": 1.0515344912929554e-05} +{"train_loss": 0.0004961668164469302, "global_step": 56494, "epoch": 474, "lr": 1.0513985731921216e-05} +{"train_loss": 0.0007474200101569295, "global_step": 56495, "epoch": 474, "lr": 1.0512626628439437e-05} +{"train_loss": 0.0003678312641568482, "global_step": 56496, "epoch": 474, "lr": 1.0511267602486907e-05} +{"train_loss": 0.0006722723483107984, "global_step": 56497, "epoch": 474, "lr": 1.050990865406627e-05} +{"train_loss": 0.0003501267347019166, "global_step": 56498, "epoch": 474, "lr": 1.0508549783180228e-05} +{"train_loss": 0.0009801925625652075, "global_step": 56499, "epoch": 474, "lr": 1.0507190989831412e-05} +{"train_loss": 0.000484776304801926, "global_step": 56500, "epoch": 474, "lr": 1.050583227402252e-05} +{"train_loss": 0.0005393269238993526, "global_step": 56501, "epoch": 474, "lr": 1.0504473635756196e-05} +{"train_loss": 0.0006720008095726371, "global_step": 56502, "epoch": 474, "lr": 1.0503115075035126e-05} +{"train_loss": 0.0008002385729923844, "global_step": 56503, "epoch": 474, "lr": 1.050175659186196e-05} +{"train_loss": 0.0007913581794127822, "global_step": 56504, "epoch": 474, "lr": 1.050039818623939e-05} +{"train_loss": 0.0007677205721847713, "global_step": 56505, "epoch": 474, "lr": 1.0499039858170057e-05} +{"train_loss": 0.0004731918452307582, "global_step": 56506, "epoch": 474, "lr": 1.0497681607656651e-05} +{"train_loss": 0.0007920539355836809, "global_step": 56507, "epoch": 474, "lr": 1.0496323434701828e-05} +{"train_loss": 0.000822409288957715, "global_step": 56508, "epoch": 474, "lr": 1.0494965339308232e-05} +{"train_loss": 0.00047272670781239867, "global_step": 56509, "epoch": 474, "lr": 1.0493607321478571e-05} +{"train_loss": 0.00018516906129661947, "global_step": 56510, "epoch": 474, "lr": 1.049224938121548e-05} +{"train_loss": 0.00038277439307421446, "global_step": 56511, "epoch": 474, "lr": 1.0490891518521646e-05} +{"train_loss": 0.00019342204905115068, "global_step": 56512, "epoch": 474, "lr": 1.0489533733399715e-05} +{"train_loss": 0.001030188286677003, "global_step": 56513, "epoch": 474, "lr": 1.0488176025852376e-05} +{"train_loss": 0.00037636884371750057, "global_step": 56514, "epoch": 474, "lr": 1.0486818395882281e-05} +{"train_loss": 0.00043061524047516286, "global_step": 56515, "epoch": 474, "lr": 1.0485460843492084e-05} +{"train_loss": 0.00023844072711654007, "global_step": 56516, "epoch": 474, "lr": 1.0484103368684478e-05} +{"train_loss": 0.0005528362817130983, "global_step": 56517, "epoch": 474, "lr": 1.04827459714621e-05} +{"train_loss": 0.0005835443735122681, "global_step": 56518, "epoch": 474, "lr": 1.048138865182764e-05} +{"train_loss": 0.0003949847596231848, "global_step": 56519, "epoch": 474, "lr": 1.0480031409783753e-05} +{"train_loss": 0.0003396261599846184, "global_step": 56520, "epoch": 474, "lr": 1.0478674245333087e-05} +{"train_loss": 0.0004666645545512438, "global_step": 56521, "epoch": 474, "lr": 1.0477317158478333e-05} +{"train_loss": 0.0005512459902092814, "global_step": 56522, "epoch": 474, "lr": 1.0475960149222136e-05} +{"train_loss": 0.00045630105887539685, "global_step": 56523, "epoch": 474, "lr": 1.047460321756718e-05} +{"train_loss": 0.0005529164407547063, "global_step": 56524, "epoch": 474, "lr": 1.0473246363516104e-05, "val_loss": 0.05006113648414612} +{"train_loss": 0.0002814861945807934, "global_step": 56525, "epoch": 475, "lr": 1.0471889587071599e-05} +{"train_loss": 0.0016624252311885357, "global_step": 56526, "epoch": 475, "lr": 1.0470532888236318e-05} +{"train_loss": 0.000645943742711097, "global_step": 56527, "epoch": 475, "lr": 1.0469176267012909e-05} +{"train_loss": 0.0005251215188764036, "global_step": 56528, "epoch": 475, "lr": 1.0467819723404049e-05} +{"train_loss": 0.0008145582396537066, "global_step": 56529, "epoch": 475, "lr": 1.0466463257412412e-05} +{"train_loss": 0.0006288180593401194, "global_step": 56530, "epoch": 475, "lr": 1.0465106869040643e-05} +{"train_loss": 0.0010728191118687391, "global_step": 56531, "epoch": 475, "lr": 1.046375055829142e-05} +{"train_loss": 0.0004611806070897728, "global_step": 56532, "epoch": 475, "lr": 1.046239432516739e-05} +{"train_loss": 0.0005507580353878438, "global_step": 56533, "epoch": 475, "lr": 1.0461038169671234e-05} +{"train_loss": 0.00029815445304848254, "global_step": 56534, "epoch": 475, "lr": 1.0459682091805595e-05} +{"train_loss": 0.0005481585976667702, "global_step": 56535, "epoch": 475, "lr": 1.0458326091573161e-05} +{"train_loss": 0.000719861825928092, "global_step": 56536, "epoch": 475, "lr": 1.045697016897656e-05} +{"train_loss": 0.0005757392500527203, "global_step": 56537, "epoch": 475, "lr": 1.0455614324018492e-05} +{"train_loss": 0.0006087142392061651, "global_step": 56538, "epoch": 475, "lr": 1.04542585567016e-05} +{"train_loss": 0.0006854484090581536, "global_step": 56539, "epoch": 475, "lr": 1.0452902867028536e-05} +{"train_loss": 0.00038430781569331884, "global_step": 56540, "epoch": 475, "lr": 1.0451547255001981e-05} +{"train_loss": 0.000305097084492445, "global_step": 56541, "epoch": 475, "lr": 1.0450191720624575e-05} +{"train_loss": 0.0007347280043177307, "global_step": 56542, "epoch": 475, "lr": 1.0448836263899004e-05} +{"train_loss": 0.0002653949777595699, "global_step": 56543, "epoch": 475, "lr": 1.044748088482791e-05} +{"train_loss": 0.0010892743011936545, "global_step": 56544, "epoch": 475, "lr": 1.0446125583413968e-05} +{"train_loss": 0.0006983591010794044, "global_step": 56545, "epoch": 475, "lr": 1.0444770359659839e-05} +{"train_loss": 0.0003607468097470701, "global_step": 56546, "epoch": 475, "lr": 1.0443415213568158e-05} +{"train_loss": 0.00023644563043490052, "global_step": 56547, "epoch": 475, "lr": 1.0442060145141625e-05} +{"train_loss": 0.0006830848287791014, "global_step": 56548, "epoch": 475, "lr": 1.0440705154382863e-05} +{"train_loss": 0.0003467493806965649, "global_step": 56549, "epoch": 475, "lr": 1.0439350241294566e-05} +{"train_loss": 0.00042888132156804204, "global_step": 56550, "epoch": 475, "lr": 1.0437995405879381e-05} +{"train_loss": 0.0009059805306605995, "global_step": 56551, "epoch": 475, "lr": 1.0436640648139945e-05} +{"train_loss": 0.0009787773014977574, "global_step": 56552, "epoch": 475, "lr": 1.0435285968078957e-05} +{"train_loss": 0.0005079519469290972, "global_step": 56553, "epoch": 475, "lr": 1.043393136569904e-05} +{"train_loss": 0.00038879673229530454, "global_step": 56554, "epoch": 475, "lr": 1.043257684100289e-05} +{"train_loss": 0.0011150726350024343, "global_step": 56555, "epoch": 475, "lr": 1.0431222393993135e-05} +{"train_loss": 0.0005773885059170425, "global_step": 56556, "epoch": 475, "lr": 1.0429868024672456e-05} +{"train_loss": 0.0007477455073967576, "global_step": 56557, "epoch": 475, "lr": 1.042851373304351e-05} +{"train_loss": 0.0003923451295122504, "global_step": 56558, "epoch": 475, "lr": 1.0427159519108931e-05} +{"train_loss": 0.0004661153943743557, "global_step": 56559, "epoch": 475, "lr": 1.0425805382871413e-05} +{"train_loss": 0.000519205757882446, "global_step": 56560, "epoch": 475, "lr": 1.0424451324333584e-05} +{"train_loss": 0.0009264443069696426, "global_step": 56561, "epoch": 475, "lr": 1.0423097343498129e-05} +{"train_loss": 0.00038417577161453664, "global_step": 56562, "epoch": 475, "lr": 1.0421743440367682e-05} +{"train_loss": 0.0002351428265683353, "global_step": 56563, "epoch": 475, "lr": 1.042038961494491e-05} +{"train_loss": 0.0006280555389821529, "global_step": 56564, "epoch": 475, "lr": 1.0419035867232491e-05} +{"train_loss": 0.0006751053733751178, "global_step": 56565, "epoch": 475, "lr": 1.0417682197233053e-05} +{"train_loss": 0.0008590749930590391, "global_step": 56566, "epoch": 475, "lr": 1.0416328604949283e-05} +{"train_loss": 0.00078103959094733, "global_step": 56567, "epoch": 475, "lr": 1.0414975090383805e-05} +{"train_loss": 0.0003806694585364312, "global_step": 56568, "epoch": 475, "lr": 1.0413621653539313e-05} +{"train_loss": 0.0002777127083390951, "global_step": 56569, "epoch": 475, "lr": 1.0412268294418442e-05} +{"train_loss": 0.0007896181778050959, "global_step": 56570, "epoch": 475, "lr": 1.0410915013023836e-05} +{"train_loss": 0.0005753544974140823, "global_step": 56571, "epoch": 475, "lr": 1.0409561809358187e-05} +{"train_loss": 0.0007981545059010386, "global_step": 56572, "epoch": 475, "lr": 1.040820868342412e-05} +{"train_loss": 0.0005098224501125515, "global_step": 56573, "epoch": 475, "lr": 1.0406855635224323e-05} +{"train_loss": 0.0008076553349383175, "global_step": 56574, "epoch": 475, "lr": 1.0405502664761412e-05} +{"train_loss": 0.00029240717412903905, "global_step": 56575, "epoch": 475, "lr": 1.0404149772038092e-05} +{"train_loss": 0.0005031234468333423, "global_step": 56576, "epoch": 475, "lr": 1.0402796957056981e-05} +{"train_loss": 0.0006332145421765745, "global_step": 56577, "epoch": 475, "lr": 1.0401444219820744e-05} +{"train_loss": 0.0003056942077819258, "global_step": 56578, "epoch": 475, "lr": 1.0400091560332048e-05} +{"train_loss": 0.0005560130812227726, "global_step": 56579, "epoch": 475, "lr": 1.039873897859353e-05} +{"train_loss": 0.0005549155175685883, "global_step": 56580, "epoch": 475, "lr": 1.0397386474607873e-05} +{"train_loss": 0.000788299657870084, "global_step": 56581, "epoch": 475, "lr": 1.03960340483777e-05} +{"train_loss": 0.00029439895297400653, "global_step": 56582, "epoch": 475, "lr": 1.0394681699905701e-05} +{"train_loss": 0.0004043826775159687, "global_step": 56583, "epoch": 475, "lr": 1.039332942919451e-05} +{"train_loss": 0.0007837593439035118, "global_step": 56584, "epoch": 475, "lr": 1.0391977236246774e-05} +{"train_loss": 0.0002881049585994333, "global_step": 56585, "epoch": 475, "lr": 1.0390625121065172e-05} +{"train_loss": 0.000641393184196204, "global_step": 56586, "epoch": 475, "lr": 1.0389273083652329e-05} +{"train_loss": 0.00037779429112561047, "global_step": 56587, "epoch": 475, "lr": 1.0387921124010936e-05} +{"train_loss": 0.0007215074729174376, "global_step": 56588, "epoch": 475, "lr": 1.0386569242143623e-05} +{"train_loss": 0.0005990369245409966, "global_step": 56589, "epoch": 475, "lr": 1.0385217438053036e-05} +{"train_loss": 0.0010688325855880976, "global_step": 56590, "epoch": 475, "lr": 1.0383865711741858e-05} +{"train_loss": 0.0007539618527516723, "global_step": 56591, "epoch": 475, "lr": 1.0382514063212711e-05} +{"train_loss": 0.00038277116254903376, "global_step": 56592, "epoch": 475, "lr": 1.0381162492468282e-05} +{"train_loss": 0.0008024020353332162, "global_step": 56593, "epoch": 475, "lr": 1.0379810999511191e-05} +{"train_loss": 0.0005649416125379503, "global_step": 56594, "epoch": 475, "lr": 1.0378459584344124e-05} +{"train_loss": 0.0005130594945512712, "global_step": 56595, "epoch": 475, "lr": 1.0377108246969708e-05} +{"train_loss": 0.0004069137794431299, "global_step": 56596, "epoch": 475, "lr": 1.0375756987390617e-05} +{"train_loss": 0.0006273415056057274, "global_step": 56597, "epoch": 475, "lr": 1.0374405805609477e-05} +{"train_loss": 0.0007730922079645097, "global_step": 56598, "epoch": 475, "lr": 1.0373054701628964e-05} +{"train_loss": 0.000723749166354537, "global_step": 56599, "epoch": 475, "lr": 1.0371703675451732e-05} +{"train_loss": 0.0006925324560143054, "global_step": 56600, "epoch": 475, "lr": 1.0370352727080434e-05} +{"train_loss": 0.00041568410233594477, "global_step": 56601, "epoch": 475, "lr": 1.0369001856517696e-05} +{"train_loss": 0.0007157378131523728, "global_step": 56602, "epoch": 475, "lr": 1.0367651063766204e-05} +{"train_loss": 0.00029437843477353454, "global_step": 56603, "epoch": 475, "lr": 1.0366300348828579e-05} +{"train_loss": 0.0003622794756665826, "global_step": 56604, "epoch": 475, "lr": 1.0364949711707506e-05} +{"train_loss": 0.0007537962519563735, "global_step": 56605, "epoch": 475, "lr": 1.03635991524056e-05} +{"train_loss": 0.0007252229261212051, "global_step": 56606, "epoch": 475, "lr": 1.0362248670925557e-05} +{"train_loss": 0.0003514671407174319, "global_step": 56607, "epoch": 475, "lr": 1.0360898267269997e-05} +{"train_loss": 0.0008748031686991453, "global_step": 56608, "epoch": 475, "lr": 1.035954794144156e-05} +{"train_loss": 0.0003254394105169922, "global_step": 56609, "epoch": 475, "lr": 1.035819769344294e-05} +{"train_loss": 0.00026060378877446055, "global_step": 56610, "epoch": 475, "lr": 1.0356847523276742e-05} +{"train_loss": 0.0003716830105986446, "global_step": 56611, "epoch": 475, "lr": 1.0355497430945655e-05} +{"train_loss": 0.0011035955976694822, "global_step": 56612, "epoch": 475, "lr": 1.0354147416452303e-05} +{"train_loss": 0.00035105098504573107, "global_step": 56613, "epoch": 475, "lr": 1.0352797479799359e-05} +{"train_loss": 0.0006254108739085495, "global_step": 56614, "epoch": 475, "lr": 1.0351447620989457e-05} +{"train_loss": 0.0002664215280674398, "global_step": 56615, "epoch": 475, "lr": 1.0350097840025242e-05} +{"train_loss": 0.0004336319980211556, "global_step": 56616, "epoch": 475, "lr": 1.0348748136909387e-05} +{"train_loss": 0.0009195363381877542, "global_step": 56617, "epoch": 475, "lr": 1.0347398511644512e-05} +{"train_loss": 0.0004709100176114589, "global_step": 56618, "epoch": 475, "lr": 1.0346048964233302e-05} +{"train_loss": 0.0009170456323772669, "global_step": 56619, "epoch": 475, "lr": 1.034469949467839e-05} +{"train_loss": 0.0006091766408644617, "global_step": 56620, "epoch": 475, "lr": 1.0343350102982408e-05} +{"train_loss": 0.00048226251965388656, "global_step": 56621, "epoch": 475, "lr": 1.0342000789148032e-05} +{"train_loss": 0.0006878840504214168, "global_step": 56622, "epoch": 475, "lr": 1.0340651553177889e-05} +{"train_loss": 0.0006302515394054353, "global_step": 56623, "epoch": 475, "lr": 1.0339302395074657e-05} +{"train_loss": 0.0006606876268051565, "global_step": 56624, "epoch": 475, "lr": 1.0337953314840949e-05} +{"train_loss": 0.00037375924875959754, "global_step": 56625, "epoch": 475, "lr": 1.0336604312479448e-05} +{"train_loss": 0.0005991043872199953, "global_step": 56626, "epoch": 475, "lr": 1.033525538799277e-05} +{"train_loss": 0.0005564757739193738, "global_step": 56627, "epoch": 475, "lr": 1.0333906541383598e-05} +{"train_loss": 0.0004705274768639356, "global_step": 56628, "epoch": 475, "lr": 1.033255777265455e-05} +{"train_loss": 0.0006300535169430077, "global_step": 56629, "epoch": 475, "lr": 1.0331209081808297e-05} +{"train_loss": 0.00043969188118353486, "global_step": 56630, "epoch": 475, "lr": 1.032986046884747e-05} +{"train_loss": 0.0002715604496188462, "global_step": 56631, "epoch": 475, "lr": 1.0328511933774731e-05} +{"train_loss": 0.0005557741969823837, "global_step": 56632, "epoch": 475, "lr": 1.0327163476592705e-05} +{"train_loss": 0.00036644662031903863, "global_step": 56633, "epoch": 475, "lr": 1.0325815097304075e-05} +{"train_loss": 0.0003359171678312123, "global_step": 56634, "epoch": 475, "lr": 1.0324466795911452e-05} +{"train_loss": 0.0009520347812213004, "global_step": 56635, "epoch": 475, "lr": 1.0323118572417512e-05} +{"train_loss": 0.0006476239068433642, "global_step": 56636, "epoch": 475, "lr": 1.0321770426824879e-05} +{"train_loss": 0.0006916241836734116, "global_step": 56637, "epoch": 475, "lr": 1.0320422359136222e-05} +{"train_loss": 0.0003757906670216471, "global_step": 56638, "epoch": 475, "lr": 1.0319074369354181e-05} +{"train_loss": 0.0008442307589575648, "global_step": 56639, "epoch": 475, "lr": 1.031772645748138e-05} +{"train_loss": 0.0005857300711795688, "global_step": 56640, "epoch": 475, "lr": 1.03163786235205e-05} +{"train_loss": 0.0004853010759688914, "global_step": 56641, "epoch": 475, "lr": 1.0315030867474157e-05} +{"train_loss": 0.00047709757927805185, "global_step": 56642, "epoch": 475, "lr": 1.0313683189345024e-05} +{"train_loss": 0.0005872411530625325, "global_step": 56643, "epoch": 475, "lr": 1.0312335589135718e-05, "val_loss": 0.05219980329275131, "train_action_mse_error": 7.049079158605309e-06} +{"train_loss": 0.000493582512717694, "global_step": 56644, "epoch": 476, "lr": 1.031098806684892e-05} +{"train_loss": 0.00042257181485183537, "global_step": 56645, "epoch": 476, "lr": 1.0309640622487254e-05} +{"train_loss": 0.0007186761358752847, "global_step": 56646, "epoch": 476, "lr": 1.0308293256053352e-05} +{"train_loss": 0.0003887892817147076, "global_step": 56647, "epoch": 476, "lr": 1.0306945967549892e-05} +{"train_loss": 0.000623773958068341, "global_step": 56648, "epoch": 476, "lr": 1.030559875697949e-05} +{"train_loss": 0.00034570222487673163, "global_step": 56649, "epoch": 476, "lr": 1.0304251624344819e-05} +{"train_loss": 0.0003881874436046928, "global_step": 56650, "epoch": 476, "lr": 1.0302904569648492e-05} +{"train_loss": 0.0005017658695578575, "global_step": 56651, "epoch": 476, "lr": 1.0301557592893185e-05} +{"train_loss": 0.0003328727907501161, "global_step": 56652, "epoch": 476, "lr": 1.030021069408153e-05} +{"train_loss": 0.0004617598606273532, "global_step": 56653, "epoch": 476, "lr": 1.0298863873216158e-05} +{"train_loss": 0.0004650760965887457, "global_step": 56654, "epoch": 476, "lr": 1.0297517130299738e-05} +{"train_loss": 0.00039161398308351636, "global_step": 56655, "epoch": 476, "lr": 1.0296170465334886e-05} +{"train_loss": 0.0004579864034894854, "global_step": 56656, "epoch": 476, "lr": 1.0294823878324279e-05} +{"train_loss": 0.0005552152870222926, "global_step": 56657, "epoch": 476, "lr": 1.0293477369270538e-05} +{"train_loss": 0.0002446139114908874, "global_step": 56658, "epoch": 476, "lr": 1.0292130938176298e-05} +{"train_loss": 0.0005165457259863615, "global_step": 56659, "epoch": 476, "lr": 1.0290784585044233e-05} +{"train_loss": 0.0004973022150807083, "global_step": 56660, "epoch": 476, "lr": 1.0289438309876959e-05} +{"train_loss": 0.0005245556822046638, "global_step": 56661, "epoch": 476, "lr": 1.0288092112677127e-05} +{"train_loss": 0.0004894195008091629, "global_step": 56662, "epoch": 476, "lr": 1.0286745993447399e-05} +{"train_loss": 0.00036131872911937535, "global_step": 56663, "epoch": 476, "lr": 1.0285399952190389e-05} +{"train_loss": 0.0004371480317786336, "global_step": 56664, "epoch": 476, "lr": 1.0284053988908765e-05} +{"train_loss": 0.0006186279933899641, "global_step": 56665, "epoch": 476, "lr": 1.028270810360515e-05} +{"train_loss": 0.0003353798820171505, "global_step": 56666, "epoch": 476, "lr": 1.0281362296282205e-05} +{"train_loss": 0.0004648129397537559, "global_step": 56667, "epoch": 476, "lr": 1.0280016566942547e-05} +{"train_loss": 0.0006690224981866777, "global_step": 56668, "epoch": 476, "lr": 1.0278670915588845e-05} +{"train_loss": 0.0008893747581169009, "global_step": 56669, "epoch": 476, "lr": 1.027732534222373e-05} +{"train_loss": 0.00034553679870441556, "global_step": 56670, "epoch": 476, "lr": 1.0275979846849831e-05} +{"train_loss": 0.0004443706711754203, "global_step": 56671, "epoch": 476, "lr": 1.0274634429469815e-05} +{"train_loss": 0.0004517846100497991, "global_step": 56672, "epoch": 476, "lr": 1.0273289090086296e-05} +{"train_loss": 0.00037505957880057395, "global_step": 56673, "epoch": 476, "lr": 1.0271943828701941e-05} +{"train_loss": 0.0003869466600008309, "global_step": 56674, "epoch": 476, "lr": 1.0270598645319368e-05} +{"train_loss": 0.0003540078760124743, "global_step": 56675, "epoch": 476, "lr": 1.0269253539941249e-05} +{"train_loss": 0.0005784581298939884, "global_step": 56676, "epoch": 476, "lr": 1.0267908512570196e-05} +{"train_loss": 0.0005868137232027948, "global_step": 56677, "epoch": 476, "lr": 1.0266563563208852e-05} +{"train_loss": 0.0002064760192297399, "global_step": 56678, "epoch": 476, "lr": 1.026521869185988e-05} +{"train_loss": 0.0009450936922803521, "global_step": 56679, "epoch": 476, "lr": 1.0263873898525894e-05} +{"train_loss": 0.000692126399371773, "global_step": 56680, "epoch": 476, "lr": 1.0262529183209557e-05} +{"train_loss": 0.00033738286583684385, "global_step": 56681, "epoch": 476, "lr": 1.0261184545913482e-05} +{"train_loss": 0.0004787769285030663, "global_step": 56682, "epoch": 476, "lr": 1.0259839986640346e-05} +{"train_loss": 0.00029262813040986657, "global_step": 56683, "epoch": 476, "lr": 1.0258495505392762e-05} +{"train_loss": 0.0008918055100366473, "global_step": 56684, "epoch": 476, "lr": 1.0257151102173368e-05} +{"train_loss": 0.0007147949654608965, "global_step": 56685, "epoch": 476, "lr": 1.0255806776984822e-05} +{"train_loss": 0.0007013269932940602, "global_step": 56686, "epoch": 476, "lr": 1.0254462529829745e-05} +{"train_loss": 0.00041102172690443695, "global_step": 56687, "epoch": 476, "lr": 1.0253118360710794e-05} +{"train_loss": 0.0003946351062040776, "global_step": 56688, "epoch": 476, "lr": 1.0251774269630599e-05} +{"train_loss": 0.0008285053190775216, "global_step": 56689, "epoch": 476, "lr": 1.0250430256591787e-05} +{"train_loss": 0.00048284747754223645, "global_step": 56690, "epoch": 476, "lr": 1.0249086321597017e-05} +{"train_loss": 0.0012412319192662835, "global_step": 56691, "epoch": 476, "lr": 1.0247742464648914e-05} +{"train_loss": 0.00029196630930528045, "global_step": 56692, "epoch": 476, "lr": 1.0246398685750126e-05} +{"train_loss": 0.0005011918256059289, "global_step": 56693, "epoch": 476, "lr": 1.0245054984903279e-05} +{"train_loss": 0.0007385704084299505, "global_step": 56694, "epoch": 476, "lr": 1.024371136211103e-05} +{"train_loss": 0.00036748897400684655, "global_step": 56695, "epoch": 476, "lr": 1.0242367817375998e-05} +{"train_loss": 0.000476075685583055, "global_step": 56696, "epoch": 476, "lr": 1.0241024350700824e-05} +{"train_loss": 0.00037676270585507154, "global_step": 56697, "epoch": 476, "lr": 1.0239680962088167e-05} +{"train_loss": 0.00031134230084717274, "global_step": 56698, "epoch": 476, "lr": 1.0238337651540636e-05} +{"train_loss": 0.0005025523132644594, "global_step": 56699, "epoch": 476, "lr": 1.0236994419060891e-05} +{"train_loss": 0.0012799849500879645, "global_step": 56700, "epoch": 476, "lr": 1.0235651264651552e-05} +{"train_loss": 0.0005001688259653747, "global_step": 56701, "epoch": 476, "lr": 1.0234308188315273e-05} +{"train_loss": 0.00039206971996463835, "global_step": 56702, "epoch": 476, "lr": 1.0232965190054684e-05} +{"train_loss": 0.0009521885658614337, "global_step": 56703, "epoch": 476, "lr": 1.0231622269872404e-05} +{"train_loss": 0.00035346864024177194, "global_step": 56704, "epoch": 476, "lr": 1.0230279427771095e-05} +{"train_loss": 0.0007198947132565081, "global_step": 56705, "epoch": 476, "lr": 1.0228936663753374e-05} +{"train_loss": 0.0003341698320582509, "global_step": 56706, "epoch": 476, "lr": 1.0227593977821903e-05} +{"train_loss": 0.0005633430555462837, "global_step": 56707, "epoch": 476, "lr": 1.0226251369979295e-05} +{"train_loss": 0.000312275456963107, "global_step": 56708, "epoch": 476, "lr": 1.0224908840228187e-05} +{"train_loss": 0.0004881945496890694, "global_step": 56709, "epoch": 476, "lr": 1.0223566388571232e-05} +{"train_loss": 0.0004504747921600938, "global_step": 56710, "epoch": 476, "lr": 1.0222224015011039e-05} +{"train_loss": 0.0005028444575145841, "global_step": 56711, "epoch": 476, "lr": 1.0220881719550274e-05} +{"train_loss": 0.00033098782296292484, "global_step": 56712, "epoch": 476, "lr": 1.021953950219155e-05} +{"train_loss": 0.000442977761849761, "global_step": 56713, "epoch": 476, "lr": 1.0218197362937516e-05} +{"train_loss": 0.00027164415223523974, "global_step": 56714, "epoch": 476, "lr": 1.0216855301790806e-05} +{"train_loss": 0.0007732965750619769, "global_step": 56715, "epoch": 476, "lr": 1.0215513318754032e-05} +{"train_loss": 0.0003110128454864025, "global_step": 56716, "epoch": 476, "lr": 1.0214171413829864e-05} +{"train_loss": 0.0005760371568612754, "global_step": 56717, "epoch": 476, "lr": 1.0212829587020911e-05} +{"train_loss": 0.0002458168310113251, "global_step": 56718, "epoch": 476, "lr": 1.0211487838329826e-05} +{"train_loss": 0.0004230478371027857, "global_step": 56719, "epoch": 476, "lr": 1.0210146167759222e-05} +{"train_loss": 0.00083479646127671, "global_step": 56720, "epoch": 476, "lr": 1.0208804575311753e-05} +{"train_loss": 0.0006440022843889892, "global_step": 56721, "epoch": 476, "lr": 1.0207463060990052e-05} +{"train_loss": 0.0003227164561394602, "global_step": 56722, "epoch": 476, "lr": 1.0206121624796728e-05} +{"train_loss": 0.0003830358327832073, "global_step": 56723, "epoch": 476, "lr": 1.0204780266734449e-05} +{"train_loss": 0.00034471676917746663, "global_step": 56724, "epoch": 476, "lr": 1.0203438986805813e-05} +{"train_loss": 0.0006381314597092569, "global_step": 56725, "epoch": 476, "lr": 1.0202097785013493e-05} +{"train_loss": 0.0005614325636997819, "global_step": 56726, "epoch": 476, "lr": 1.020075666136009e-05} +{"train_loss": 0.0008509317995049059, "global_step": 56727, "epoch": 476, "lr": 1.0199415615848257e-05} +{"train_loss": 0.0005748471012338996, "global_step": 56728, "epoch": 476, "lr": 1.019807464848061e-05} +{"train_loss": 0.0004680659912992269, "global_step": 56729, "epoch": 476, "lr": 1.0196733759259802e-05} +{"train_loss": 0.0010110437870025635, "global_step": 56730, "epoch": 476, "lr": 1.0195392948188443e-05} +{"train_loss": 0.0007468347903341055, "global_step": 56731, "epoch": 476, "lr": 1.0194052215269178e-05} +{"train_loss": 0.000725410645827651, "global_step": 56732, "epoch": 476, "lr": 1.0192711560504652e-05} +{"train_loss": 0.0006503965705633163, "global_step": 56733, "epoch": 476, "lr": 1.019137098389748e-05} +{"train_loss": 0.0006419465062208474, "global_step": 56734, "epoch": 476, "lr": 1.0190030485450292e-05} +{"train_loss": 0.0002967288892250508, "global_step": 56735, "epoch": 476, "lr": 1.0188690065165735e-05} +{"train_loss": 0.00019222985429223627, "global_step": 56736, "epoch": 476, "lr": 1.0187349723046418e-05} +{"train_loss": 0.00040053672273643315, "global_step": 56737, "epoch": 476, "lr": 1.0186009459095003e-05} +{"train_loss": 0.000481403578305617, "global_step": 56738, "epoch": 476, "lr": 1.0184669273314101e-05} +{"train_loss": 0.0003470770607236773, "global_step": 56739, "epoch": 476, "lr": 1.0183329165706335e-05} +{"train_loss": 0.0006666737026534975, "global_step": 56740, "epoch": 476, "lr": 1.0181989136274367e-05} +{"train_loss": 0.0009438140550628304, "global_step": 56741, "epoch": 476, "lr": 1.018064918502079e-05} +{"train_loss": 0.00039657545858062804, "global_step": 56742, "epoch": 476, "lr": 1.0179309311948271e-05} +{"train_loss": 0.0009496461134403944, "global_step": 56743, "epoch": 476, "lr": 1.0177969517059404e-05} +{"train_loss": 0.00040195960900746286, "global_step": 56744, "epoch": 476, "lr": 1.0176629800356857e-05} +{"train_loss": 0.0007323820027522743, "global_step": 56745, "epoch": 476, "lr": 1.0175290161843248e-05} +{"train_loss": 0.0005066827870905399, "global_step": 56746, "epoch": 476, "lr": 1.0173950601521182e-05} +{"train_loss": 0.0003375645028427243, "global_step": 56747, "epoch": 476, "lr": 1.0172611119393327e-05} +{"train_loss": 0.0006845451425760984, "global_step": 56748, "epoch": 476, "lr": 1.0171271715462277e-05} +{"train_loss": 0.0006096361903473735, "global_step": 56749, "epoch": 476, "lr": 1.0169932389730696e-05} +{"train_loss": 0.0003920257731806487, "global_step": 56750, "epoch": 476, "lr": 1.0168593142201188e-05} +{"train_loss": 0.00039973502862267196, "global_step": 56751, "epoch": 476, "lr": 1.01672539728764e-05} +{"train_loss": 0.0006683162646368146, "global_step": 56752, "epoch": 476, "lr": 1.0165914881758954e-05} +{"train_loss": 0.0006761910626664758, "global_step": 56753, "epoch": 476, "lr": 1.0164575868851467e-05} +{"train_loss": 0.0005253596464172006, "global_step": 56754, "epoch": 476, "lr": 1.016323693415659e-05} +{"train_loss": 0.0003833644441328943, "global_step": 56755, "epoch": 476, "lr": 1.0161898077676929e-05} +{"train_loss": 0.0006810601335018873, "global_step": 56756, "epoch": 476, "lr": 1.016055929941514e-05} +{"train_loss": 0.00046298987581394613, "global_step": 56757, "epoch": 476, "lr": 1.0159220599373826e-05} +{"train_loss": 0.0006459069554693997, "global_step": 56758, "epoch": 476, "lr": 1.0157881977555633e-05} +{"train_loss": 0.0007528074202127755, "global_step": 56759, "epoch": 476, "lr": 1.0156543433963173e-05} +{"train_loss": 0.0004692215006798506, "global_step": 56760, "epoch": 476, "lr": 1.0155204968599097e-05} +{"train_loss": 0.000339613325195387, "global_step": 56761, "epoch": 476, "lr": 1.0153866581466004e-05} +{"train_loss": 0.0005286710385473821, "global_step": 56762, "epoch": 476, "lr": 1.0152528272566547e-05, "val_loss": 0.031259991228580475} +{"train_loss": 0.00042848786688409746, "global_step": 56763, "epoch": 477, "lr": 1.0151190041903336e-05} +{"train_loss": 0.0003887093917001039, "global_step": 56764, "epoch": 477, "lr": 1.0149851889479017e-05} +{"train_loss": 0.0012357259402051568, "global_step": 56765, "epoch": 477, "lr": 1.0148513815296195e-05} +{"train_loss": 0.00044141546823084354, "global_step": 56766, "epoch": 477, "lr": 1.0147175819357518e-05} +{"train_loss": 0.0003486265195533633, "global_step": 56767, "epoch": 477, "lr": 1.0145837901665595e-05} +{"train_loss": 0.0007893253350630403, "global_step": 56768, "epoch": 477, "lr": 1.0144500062223072e-05} +{"train_loss": 0.00030097199487499893, "global_step": 56769, "epoch": 477, "lr": 1.0143162301032549e-05} +{"train_loss": 0.0003547963860910386, "global_step": 56770, "epoch": 477, "lr": 1.014182461809669e-05} +{"train_loss": 0.00028156369808129966, "global_step": 56771, "epoch": 477, "lr": 1.0140487013418093e-05} +{"train_loss": 0.0007260701386258006, "global_step": 56772, "epoch": 477, "lr": 1.0139149486999384e-05} +{"train_loss": 0.0007173640187829733, "global_step": 56773, "epoch": 477, "lr": 1.0137812038843202e-05} +{"train_loss": 0.0008460684330202639, "global_step": 56774, "epoch": 477, "lr": 1.0136474668952162e-05} +{"train_loss": 0.0006479554576799273, "global_step": 56775, "epoch": 477, "lr": 1.0135137377328907e-05} +{"train_loss": 0.0006085900822654366, "global_step": 56776, "epoch": 477, "lr": 1.0133800163976049e-05} +{"train_loss": 0.0004497369227465242, "global_step": 56777, "epoch": 477, "lr": 1.0132463028896199e-05} +{"train_loss": 0.000526653602719307, "global_step": 56778, "epoch": 477, "lr": 1.0131125972092014e-05} +{"train_loss": 0.0008305874071083963, "global_step": 56779, "epoch": 477, "lr": 1.0129788993566091e-05} +{"train_loss": 0.0010195837821811438, "global_step": 56780, "epoch": 477, "lr": 1.0128452093321084e-05} +{"train_loss": 0.0004909863346256316, "global_step": 56781, "epoch": 477, "lr": 1.0127115271359582e-05} +{"train_loss": 0.00042607716750353575, "global_step": 56782, "epoch": 477, "lr": 1.0125778527684249e-05} +{"train_loss": 0.000681402743794024, "global_step": 56783, "epoch": 477, "lr": 1.012444186229769e-05} +{"train_loss": 0.0003817747056018561, "global_step": 56784, "epoch": 477, "lr": 1.012310527520251e-05} +{"train_loss": 0.0005216951831243932, "global_step": 56785, "epoch": 477, "lr": 1.0121768766401373e-05} +{"train_loss": 0.001966268289834261, "global_step": 56786, "epoch": 477, "lr": 1.0120432335896863e-05} +{"train_loss": 0.0005498264217749238, "global_step": 56787, "epoch": 477, "lr": 1.011909598369164e-05} +{"train_loss": 0.0007216977537609637, "global_step": 56788, "epoch": 477, "lr": 1.011775970978831e-05} +{"train_loss": 0.0007076709298416972, "global_step": 56789, "epoch": 477, "lr": 1.0116423514189489e-05} +{"train_loss": 0.00031821458833292127, "global_step": 56790, "epoch": 477, "lr": 1.0115087396897821e-05} +{"train_loss": 0.0003824031155090779, "global_step": 56791, "epoch": 477, "lr": 1.0113751357915902e-05} +{"train_loss": 0.0007796502322889864, "global_step": 56792, "epoch": 477, "lr": 1.0112415397246371e-05} +{"train_loss": 0.000609850452747196, "global_step": 56793, "epoch": 477, "lr": 1.0111079514891864e-05} +{"train_loss": 0.0009380367700941861, "global_step": 56794, "epoch": 477, "lr": 1.010974371085498e-05} +{"train_loss": 0.0006954579730518162, "global_step": 56795, "epoch": 477, "lr": 1.0108407985138363e-05} +{"train_loss": 0.0004713282687589526, "global_step": 56796, "epoch": 477, "lr": 1.0107072337744617e-05} +{"train_loss": 0.00046216495684348047, "global_step": 56797, "epoch": 477, "lr": 1.0105736768676383e-05} +{"train_loss": 0.00046982005005702376, "global_step": 56798, "epoch": 477, "lr": 1.0104401277936259e-05} +{"train_loss": 0.0005765177775174379, "global_step": 56799, "epoch": 477, "lr": 1.0103065865526894e-05} +{"train_loss": 0.0007741537992842495, "global_step": 56800, "epoch": 477, "lr": 1.010173053145088e-05} +{"train_loss": 0.000615257304161787, "global_step": 56801, "epoch": 477, "lr": 1.0100395275710871e-05} +{"train_loss": 0.00025845051277428865, "global_step": 56802, "epoch": 477, "lr": 1.0099060098309477e-05} +{"train_loss": 0.00041984510608017445, "global_step": 56803, "epoch": 477, "lr": 1.0097724999249303e-05} +{"train_loss": 0.00033211393747478724, "global_step": 56804, "epoch": 477, "lr": 1.0096389978532993e-05} +{"train_loss": 0.0005727720563299954, "global_step": 56805, "epoch": 477, "lr": 1.0095055036163143e-05} +{"train_loss": 0.0005586055922321975, "global_step": 56806, "epoch": 477, "lr": 1.0093720172142407e-05} +{"train_loss": 0.0005912960041314363, "global_step": 56807, "epoch": 477, "lr": 1.0092385386473386e-05} +{"train_loss": 0.0005375905311666429, "global_step": 56808, "epoch": 477, "lr": 1.0091050679158692e-05} +{"train_loss": 0.0005212050746195018, "global_step": 56809, "epoch": 477, "lr": 1.0089716050200964e-05} +{"train_loss": 0.0003111384576186538, "global_step": 56810, "epoch": 477, "lr": 1.0088381499602805e-05} +{"train_loss": 0.00031420643790625036, "global_step": 56811, "epoch": 477, "lr": 1.0087047027366859e-05} +{"train_loss": 0.0008390030125156045, "global_step": 56812, "epoch": 477, "lr": 1.008571263349572e-05} +{"train_loss": 0.0005576414405368268, "global_step": 56813, "epoch": 477, "lr": 1.0084378317992028e-05} +{"train_loss": 0.0009511602111160755, "global_step": 56814, "epoch": 477, "lr": 1.00830440808584e-05} +{"train_loss": 0.000388767832191661, "global_step": 56815, "epoch": 477, "lr": 1.0081709922097432e-05} +{"train_loss": 0.0002530500350985676, "global_step": 56816, "epoch": 477, "lr": 1.008037584171178e-05} +{"train_loss": 0.00037845285260118544, "global_step": 56817, "epoch": 477, "lr": 1.0079041839704029e-05} +{"train_loss": 0.0007466904353350401, "global_step": 56818, "epoch": 477, "lr": 1.0077707916076828e-05} +{"train_loss": 0.00043691624887287617, "global_step": 56819, "epoch": 477, "lr": 1.0076374070832772e-05} +{"train_loss": 0.0005132604273967445, "global_step": 56820, "epoch": 477, "lr": 1.0075040303974504e-05} +{"train_loss": 0.0007549503934569657, "global_step": 56821, "epoch": 477, "lr": 1.0073706615504624e-05} +{"train_loss": 0.0007106909761205316, "global_step": 56822, "epoch": 477, "lr": 1.0072373005425746e-05} +{"train_loss": 0.00022644796990789473, "global_step": 56823, "epoch": 477, "lr": 1.0071039473740512e-05} +{"train_loss": 0.0005082290153950453, "global_step": 56824, "epoch": 477, "lr": 1.0069706020451508e-05} +{"train_loss": 0.0005920938565395772, "global_step": 56825, "epoch": 477, "lr": 1.0068372645561385e-05} +{"train_loss": 0.0003320380055811256, "global_step": 56826, "epoch": 477, "lr": 1.0067039349072737e-05} +{"train_loss": 0.0008844073745422065, "global_step": 56827, "epoch": 477, "lr": 1.0065706130988201e-05} +{"train_loss": 0.0003856804396491498, "global_step": 56828, "epoch": 477, "lr": 1.0064372991310373e-05} +{"train_loss": 0.0005608565988950431, "global_step": 56829, "epoch": 477, "lr": 1.0063039930041885e-05} +{"train_loss": 0.00047687068581581116, "global_step": 56830, "epoch": 477, "lr": 1.0061706947185356e-05} +{"train_loss": 0.0006314011407084763, "global_step": 56831, "epoch": 477, "lr": 1.0060374042743392e-05} +{"train_loss": 0.0009894159156829119, "global_step": 56832, "epoch": 477, "lr": 1.0059041216718628e-05} +{"train_loss": 0.00032085541170090437, "global_step": 56833, "epoch": 477, "lr": 1.0057708469113669e-05} +{"train_loss": 0.000670421461109072, "global_step": 56834, "epoch": 477, "lr": 1.0056375799931123e-05} +{"train_loss": 0.000634233292657882, "global_step": 56835, "epoch": 477, "lr": 1.0055043209173626e-05} +{"train_loss": 0.0004804267955478281, "global_step": 56836, "epoch": 477, "lr": 1.005371069684377e-05} +{"train_loss": 0.0006581510533578694, "global_step": 56837, "epoch": 477, "lr": 1.0052378262944201e-05} +{"train_loss": 0.000538730644620955, "global_step": 56838, "epoch": 477, "lr": 1.0051045907477502e-05} +{"train_loss": 0.000962850812356919, "global_step": 56839, "epoch": 477, "lr": 1.0049713630446323e-05} +{"train_loss": 0.0003068372025154531, "global_step": 56840, "epoch": 477, "lr": 1.0048381431853265e-05} +{"train_loss": 0.0005754337762482464, "global_step": 56841, "epoch": 477, "lr": 1.0047049311700923e-05} +{"train_loss": 0.0007217318052425981, "global_step": 56842, "epoch": 477, "lr": 1.004571726999195e-05} +{"train_loss": 0.0005806481349281967, "global_step": 56843, "epoch": 477, "lr": 1.0044385306728927e-05} +{"train_loss": 0.0003705502604134381, "global_step": 56844, "epoch": 477, "lr": 1.00430534219145e-05} +{"train_loss": 0.0006228066049516201, "global_step": 56845, "epoch": 477, "lr": 1.0041721615551269e-05} +{"train_loss": 0.0006245177937671542, "global_step": 56846, "epoch": 477, "lr": 1.0040389887641832e-05} +{"train_loss": 0.0006539582973346114, "global_step": 56847, "epoch": 477, "lr": 1.0039058238188836e-05} +{"train_loss": 0.0003604060329962522, "global_step": 56848, "epoch": 477, "lr": 1.0037726667194864e-05} +{"train_loss": 0.0008759645279496908, "global_step": 56849, "epoch": 477, "lr": 1.003639517466256e-05} +{"train_loss": 0.0006137219606898725, "global_step": 56850, "epoch": 477, "lr": 1.0035063760594516e-05} +{"train_loss": 0.00037485218490473926, "global_step": 56851, "epoch": 477, "lr": 1.0033732424993365e-05} +{"train_loss": 0.0002905764849856496, "global_step": 56852, "epoch": 477, "lr": 1.003240116786171e-05} +{"train_loss": 0.000277172977803275, "global_step": 56853, "epoch": 477, "lr": 1.0031069989202152e-05} +{"train_loss": 0.0004547877178993076, "global_step": 56854, "epoch": 477, "lr": 1.0029738889017332e-05} +{"train_loss": 0.0007274656090885401, "global_step": 56855, "epoch": 477, "lr": 1.0028407867309836e-05} +{"train_loss": 0.0005387409473769367, "global_step": 56856, "epoch": 477, "lr": 1.0027076924082307e-05} +{"train_loss": 0.0005597192794084549, "global_step": 56857, "epoch": 477, "lr": 1.0025746059337327e-05} +{"train_loss": 0.00043706264114007354, "global_step": 56858, "epoch": 477, "lr": 1.0024415273077536e-05} +{"train_loss": 0.0008079815306700766, "global_step": 56859, "epoch": 477, "lr": 1.0023084565305518e-05} +{"train_loss": 0.0003194482997059822, "global_step": 56860, "epoch": 477, "lr": 1.002175393602392e-05} +{"train_loss": 0.00040270548197440803, "global_step": 56861, "epoch": 477, "lr": 1.0020423385235327e-05} +{"train_loss": 0.0005580500583164394, "global_step": 56862, "epoch": 477, "lr": 1.0019092912942368e-05} +{"train_loss": 0.00032957803341560066, "global_step": 56863, "epoch": 477, "lr": 1.0017762519147639e-05} +{"train_loss": 0.0004422547353897244, "global_step": 56864, "epoch": 477, "lr": 1.0016432203853777e-05} +{"train_loss": 0.0003899125149473548, "global_step": 56865, "epoch": 477, "lr": 1.0015101967063362e-05} +{"train_loss": 0.0002996300463564694, "global_step": 56866, "epoch": 477, "lr": 1.0013771808779038e-05} +{"train_loss": 0.000495403481181711, "global_step": 56867, "epoch": 477, "lr": 1.0012441729003385e-05} +{"train_loss": 0.0006113259587436914, "global_step": 56868, "epoch": 477, "lr": 1.0011111727739048e-05} +{"train_loss": 0.00023038436484057456, "global_step": 56869, "epoch": 477, "lr": 1.0009781804988605e-05} +{"train_loss": 0.00038423744263127446, "global_step": 56870, "epoch": 477, "lr": 1.00084519607547e-05} +{"train_loss": 0.00042046967428177595, "global_step": 56871, "epoch": 477, "lr": 1.000712219503992e-05} +{"train_loss": 0.00050687650218606, "global_step": 56872, "epoch": 477, "lr": 1.0005792507846879e-05} +{"train_loss": 0.0004381098260637373, "global_step": 56873, "epoch": 477, "lr": 1.0004462899178196e-05} +{"train_loss": 0.0009349273750558496, "global_step": 56874, "epoch": 477, "lr": 1.0003133369036466e-05} +{"train_loss": 0.00027471809880807996, "global_step": 56875, "epoch": 477, "lr": 1.0001803917424329e-05} +{"train_loss": 0.0005030327010899782, "global_step": 56876, "epoch": 477, "lr": 1.0000474544344374e-05} +{"train_loss": 0.000483470328617841, "global_step": 56877, "epoch": 477, "lr": 9.999145249799197e-06} +{"train_loss": 0.0005670858081430197, "global_step": 56878, "epoch": 477, "lr": 9.99781603379144e-06} +{"train_loss": 0.000567585346288979, "global_step": 56879, "epoch": 477, "lr": 9.996486896323687e-06} +{"train_loss": 0.0007076163892634213, "global_step": 56880, "epoch": 477, "lr": 9.995157837398572e-06} +{"train_loss": 0.0005572669127586243, "global_step": 56881, "epoch": 477, "lr": 9.993828857018672e-06, "val_loss": 0.01618644781410694} +{"train_loss": 0.00037075646105222404, "global_step": 56882, "epoch": 478, "lr": 9.992499955186636e-06} +{"train_loss": 0.0011412248713895679, "global_step": 56883, "epoch": 478, "lr": 9.991171131905047e-06} +{"train_loss": 0.0008498768438585103, "global_step": 56884, "epoch": 478, "lr": 9.989842387176507e-06} +{"train_loss": 0.0007270060013979673, "global_step": 56885, "epoch": 478, "lr": 9.988513721003645e-06} +{"train_loss": 0.0005588345229625702, "global_step": 56886, "epoch": 478, "lr": 9.987185133389055e-06} +{"train_loss": 0.00016774098912719637, "global_step": 56887, "epoch": 478, "lr": 9.985856624335366e-06} +{"train_loss": 0.0006630434072576463, "global_step": 56888, "epoch": 478, "lr": 9.984528193845156e-06} +{"train_loss": 0.0006272291648201644, "global_step": 56889, "epoch": 478, "lr": 9.983199841921065e-06} +{"train_loss": 0.00037539785262197256, "global_step": 56890, "epoch": 478, "lr": 9.981871568565671e-06} +{"train_loss": 0.0007668201578781009, "global_step": 56891, "epoch": 478, "lr": 9.980543373781614e-06} +{"train_loss": 0.0002513081708457321, "global_step": 56892, "epoch": 478, "lr": 9.979215257571468e-06} +{"train_loss": 0.0009410206112079322, "global_step": 56893, "epoch": 478, "lr": 9.97788721993787e-06} +{"train_loss": 0.000693423964548856, "global_step": 56894, "epoch": 478, "lr": 9.9765592608834e-06} +{"train_loss": 0.00044738565338775516, "global_step": 56895, "epoch": 478, "lr": 9.9752313804107e-06} +{"train_loss": 0.0008361039217561483, "global_step": 56896, "epoch": 478, "lr": 9.973903578522337e-06} +{"train_loss": 0.0006277244538068771, "global_step": 56897, "epoch": 478, "lr": 9.972575855220956e-06} +{"train_loss": 0.0004405257641337812, "global_step": 56898, "epoch": 478, "lr": 9.971248210509133e-06} +{"train_loss": 0.000716430542524904, "global_step": 56899, "epoch": 478, "lr": 9.969920644389497e-06} +{"train_loss": 0.0007126082200556993, "global_step": 56900, "epoch": 478, "lr": 9.96859315686463e-06} +{"train_loss": 0.0005559634882956743, "global_step": 56901, "epoch": 478, "lr": 9.967265747937177e-06} +{"train_loss": 0.0004642971616704017, "global_step": 56902, "epoch": 478, "lr": 9.965938417609711e-06} +{"train_loss": 0.00036594938137568533, "global_step": 56903, "epoch": 478, "lr": 9.964611165884841e-06} +{"train_loss": 0.00032723572803661227, "global_step": 56904, "epoch": 478, "lr": 9.963283992765188e-06} +{"train_loss": 0.0007969907019287348, "global_step": 56905, "epoch": 478, "lr": 9.961956898253338e-06} +{"train_loss": 0.0007584994891658425, "global_step": 56906, "epoch": 478, "lr": 9.960629882351924e-06} +{"train_loss": 0.0003917139256373048, "global_step": 56907, "epoch": 478, "lr": 9.959302945063531e-06} +{"train_loss": 0.001355356420390308, "global_step": 56908, "epoch": 478, "lr": 9.957976086390758e-06} +{"train_loss": 0.0009582873317413032, "global_step": 56909, "epoch": 478, "lr": 9.956649306336236e-06} +{"train_loss": 0.0005729782860726118, "global_step": 56910, "epoch": 478, "lr": 9.95532260490254e-06} +{"train_loss": 0.0005440882523544133, "global_step": 56911, "epoch": 478, "lr": 9.953995982092306e-06} +{"train_loss": 0.0004650282207876444, "global_step": 56912, "epoch": 478, "lr": 9.952669437908108e-06} +{"train_loss": 0.0004159755480941385, "global_step": 56913, "epoch": 478, "lr": 9.951342972352579e-06} +{"train_loss": 0.0009344783611595631, "global_step": 56914, "epoch": 478, "lr": 9.950016585428307e-06} +{"train_loss": 0.0005076350062154233, "global_step": 56915, "epoch": 478, "lr": 9.948690277137884e-06} +{"train_loss": 0.0005751065909862518, "global_step": 56916, "epoch": 478, "lr": 9.947364047483948e-06} +{"train_loss": 0.0006503689219243824, "global_step": 56917, "epoch": 478, "lr": 9.946037896469062e-06} +{"train_loss": 0.0003368847246747464, "global_step": 56918, "epoch": 478, "lr": 9.944711824095871e-06} +{"train_loss": 0.0004301336011849344, "global_step": 56919, "epoch": 478, "lr": 9.943385830366947e-06} +{"train_loss": 0.00042225548531860113, "global_step": 56920, "epoch": 478, "lr": 9.942059915284913e-06} +{"train_loss": 0.0005908499588258564, "global_step": 56921, "epoch": 478, "lr": 9.94073407885237e-06} +{"train_loss": 0.00041442058864049613, "global_step": 56922, "epoch": 478, "lr": 9.939408321071903e-06} +{"train_loss": 0.00039450672920793295, "global_step": 56923, "epoch": 478, "lr": 9.93808264194614e-06} +{"train_loss": 0.000546815455891192, "global_step": 56924, "epoch": 478, "lr": 9.936757041477652e-06} +{"train_loss": 0.0002830812882166356, "global_step": 56925, "epoch": 478, "lr": 9.93543151966907e-06} +{"train_loss": 0.0002765928511507809, "global_step": 56926, "epoch": 478, "lr": 9.934106076522998e-06} +{"train_loss": 0.0007731033256277442, "global_step": 56927, "epoch": 478, "lr": 9.93278071204201e-06} +{"train_loss": 0.0006324000423774123, "global_step": 56928, "epoch": 478, "lr": 9.931455426228748e-06} +{"train_loss": 0.0004698416742030531, "global_step": 56929, "epoch": 478, "lr": 9.930130219085775e-06} +{"train_loss": 0.000563048233743757, "global_step": 56930, "epoch": 478, "lr": 9.928805090615728e-06} +{"train_loss": 0.0004944037646055222, "global_step": 56931, "epoch": 478, "lr": 9.927480040821174e-06} +{"train_loss": 0.0005075672524981201, "global_step": 56932, "epoch": 478, "lr": 9.926155069704745e-06} +{"train_loss": 0.000661177618894726, "global_step": 56933, "epoch": 478, "lr": 9.92483017726903e-06} +{"train_loss": 0.0005181204760447145, "global_step": 56934, "epoch": 478, "lr": 9.923505363516616e-06} +{"train_loss": 0.0005689554964192212, "global_step": 56935, "epoch": 478, "lr": 9.922180628450134e-06} +{"train_loss": 0.00034914276329800487, "global_step": 56936, "epoch": 478, "lr": 9.920855972072151e-06} +{"train_loss": 0.00040288889431394637, "global_step": 56937, "epoch": 478, "lr": 9.919531394385302e-06} +{"train_loss": 0.0008816242916509509, "global_step": 56938, "epoch": 478, "lr": 9.918206895392156e-06} +{"train_loss": 0.00031080347253009677, "global_step": 56939, "epoch": 478, "lr": 9.916882475095341e-06} +{"train_loss": 0.00042560987640172243, "global_step": 56940, "epoch": 478, "lr": 9.91555813349745e-06} +{"train_loss": 0.00026909084408544004, "global_step": 56941, "epoch": 478, "lr": 9.914233870601059e-06} +{"train_loss": 0.00029286995413713157, "global_step": 56942, "epoch": 478, "lr": 9.9129096864088e-06} +{"train_loss": 0.0006383912404999137, "global_step": 56943, "epoch": 478, "lr": 9.911585580923255e-06} +{"train_loss": 0.0004036248428747058, "global_step": 56944, "epoch": 478, "lr": 9.910261554147032e-06} +{"train_loss": 0.0006663384265266359, "global_step": 56945, "epoch": 478, "lr": 9.908937606082735e-06} +{"train_loss": 0.000672915717586875, "global_step": 56946, "epoch": 478, "lr": 9.90761373673294e-06} +{"train_loss": 0.0003425191098358482, "global_step": 56947, "epoch": 478, "lr": 9.906289946100278e-06} +{"train_loss": 0.00046409829519689083, "global_step": 56948, "epoch": 478, "lr": 9.904966234187313e-06} +{"train_loss": 0.0003594245936255902, "global_step": 56949, "epoch": 478, "lr": 9.903642600996682e-06} +{"train_loss": 0.0002802034141495824, "global_step": 56950, "epoch": 478, "lr": 9.90231904653095e-06} +{"train_loss": 0.0006171952118165791, "global_step": 56951, "epoch": 478, "lr": 9.900995570792742e-06} +{"train_loss": 0.00043844516039825976, "global_step": 56952, "epoch": 478, "lr": 9.899672173784646e-06} +{"train_loss": 0.0007404087227769196, "global_step": 56953, "epoch": 478, "lr": 9.898348855509248e-06} +{"train_loss": 0.0006513757980428636, "global_step": 56954, "epoch": 478, "lr": 9.897025615969175e-06} +{"train_loss": 0.000342189974617213, "global_step": 56955, "epoch": 478, "lr": 9.89570245516699e-06} +{"train_loss": 0.00037221357342787087, "global_step": 56956, "epoch": 478, "lr": 9.894379373105317e-06} +{"train_loss": 0.000407300831284374, "global_step": 56957, "epoch": 478, "lr": 9.893056369786741e-06} +{"train_loss": 0.0004684594750870019, "global_step": 56958, "epoch": 478, "lr": 9.891733445213874e-06} +{"train_loss": 0.0009827760513871908, "global_step": 56959, "epoch": 478, "lr": 9.890410599389289e-06} +{"train_loss": 0.0003438585845287889, "global_step": 56960, "epoch": 478, "lr": 9.889087832315597e-06} +{"train_loss": 0.0010492530418559909, "global_step": 56961, "epoch": 478, "lr": 9.88776514399541e-06} +{"train_loss": 0.0005648318910971284, "global_step": 56962, "epoch": 478, "lr": 9.8864425344313e-06} +{"train_loss": 0.00027507165214046836, "global_step": 56963, "epoch": 478, "lr": 9.885120003625886e-06} +{"train_loss": 0.00029556872323155403, "global_step": 56964, "epoch": 478, "lr": 9.883797551581753e-06} +{"train_loss": 0.0005443861591629684, "global_step": 56965, "epoch": 478, "lr": 9.882475178301481e-06} +{"train_loss": 0.0005654792184941471, "global_step": 56966, "epoch": 478, "lr": 9.881152883787704e-06} +{"train_loss": 0.0006229912396520376, "global_step": 56967, "epoch": 478, "lr": 9.879830668042978e-06} +{"train_loss": 0.00043761549750342965, "global_step": 56968, "epoch": 478, "lr": 9.878508531069936e-06} +{"train_loss": 0.00039363859104923904, "global_step": 56969, "epoch": 478, "lr": 9.877186472871136e-06} +{"train_loss": 0.000474334170576185, "global_step": 56970, "epoch": 478, "lr": 9.875864493449216e-06} +{"train_loss": 0.0004786559729836881, "global_step": 56971, "epoch": 478, "lr": 9.87454259280674e-06} +{"train_loss": 0.000571949640288949, "global_step": 56972, "epoch": 478, "lr": 9.873220770946307e-06} +{"train_loss": 0.0005946190212853253, "global_step": 56973, "epoch": 478, "lr": 9.87189902787053e-06} +{"train_loss": 0.0005006244755350053, "global_step": 56974, "epoch": 478, "lr": 9.87057736358198e-06} +{"train_loss": 0.0004960153019055724, "global_step": 56975, "epoch": 478, "lr": 9.86925577808327e-06} +{"train_loss": 0.0005923874559812248, "global_step": 56976, "epoch": 478, "lr": 9.867934271376994e-06} +{"train_loss": 0.0003825763997156173, "global_step": 56977, "epoch": 478, "lr": 9.866612843465728e-06} +{"train_loss": 0.00024700548965483904, "global_step": 56978, "epoch": 478, "lr": 9.865291494352096e-06} +{"train_loss": 0.00036015876685269177, "global_step": 56979, "epoch": 478, "lr": 9.86397022403866e-06} +{"train_loss": 0.0004943994572386146, "global_step": 56980, "epoch": 478, "lr": 9.862649032528042e-06} +{"train_loss": 0.0009022847516462207, "global_step": 56981, "epoch": 478, "lr": 9.861327919822816e-06} +{"train_loss": 0.0002228566590929404, "global_step": 56982, "epoch": 478, "lr": 9.860006885925599e-06} +{"train_loss": 0.0010417512385174632, "global_step": 56983, "epoch": 478, "lr": 9.858685930838968e-06} +{"train_loss": 0.0005503171123564243, "global_step": 56984, "epoch": 478, "lr": 9.857365054565504e-06} +{"train_loss": 0.0004308999050408602, "global_step": 56985, "epoch": 478, "lr": 9.856044257107827e-06} +{"train_loss": 0.0003928490332327783, "global_step": 56986, "epoch": 478, "lr": 9.854723538468508e-06} +{"train_loss": 0.00045077840331941843, "global_step": 56987, "epoch": 478, "lr": 9.853402898650161e-06} +{"train_loss": 0.00038375388248823583, "global_step": 56988, "epoch": 478, "lr": 9.852082337655355e-06} +{"train_loss": 0.00044964629341848195, "global_step": 56989, "epoch": 478, "lr": 9.850761855486713e-06} +{"train_loss": 0.0003596596943680197, "global_step": 56990, "epoch": 478, "lr": 9.849441452146795e-06} +{"train_loss": 0.0005300898919813335, "global_step": 56991, "epoch": 478, "lr": 9.848121127638221e-06} +{"train_loss": 0.0005864972481504083, "global_step": 56992, "epoch": 478, "lr": 9.846800881963563e-06} +{"train_loss": 0.0003298580995760858, "global_step": 56993, "epoch": 478, "lr": 9.845480715125432e-06} +{"train_loss": 0.0002808288554660976, "global_step": 56994, "epoch": 478, "lr": 9.844160627126398e-06} +{"train_loss": 0.0006115546566434205, "global_step": 56995, "epoch": 478, "lr": 9.842840617969073e-06} +{"train_loss": 0.0004034149751532823, "global_step": 56996, "epoch": 478, "lr": 9.841520687656031e-06} +{"train_loss": 0.0002536158135626465, "global_step": 56997, "epoch": 478, "lr": 9.840200836189888e-06} +{"train_loss": 0.00030987325590103865, "global_step": 56998, "epoch": 478, "lr": 9.838881063573202e-06} +{"train_loss": 0.0005081351264379919, "global_step": 56999, "epoch": 478, "lr": 9.837561369808602e-06} +{"train_loss": 0.0005292441691526314, "global_step": 57000, "epoch": 478, "lr": 9.836241754898639e-06, "val_loss": 0.02465732768177986} +{"train_loss": 0.0006736991344951093, "global_step": 57001, "epoch": 479, "lr": 9.834922218845944e-06} +{"train_loss": 0.0005508554168045521, "global_step": 57002, "epoch": 479, "lr": 9.833602761653087e-06} +{"train_loss": 0.00027954220422543585, "global_step": 57003, "epoch": 479, "lr": 9.832283383322644e-06} +{"train_loss": 0.0002992384252138436, "global_step": 57004, "epoch": 479, "lr": 9.830964083857235e-06} +{"train_loss": 0.00040952657582238317, "global_step": 57005, "epoch": 479, "lr": 9.829644863259424e-06} +{"train_loss": 0.0008076448575593531, "global_step": 57006, "epoch": 479, "lr": 9.828325721531828e-06} +{"train_loss": 0.000538171676453203, "global_step": 57007, "epoch": 479, "lr": 9.827006658677007e-06} +{"train_loss": 0.0006680219667032361, "global_step": 57008, "epoch": 479, "lr": 9.825687674697581e-06} +{"train_loss": 0.0006712124450132251, "global_step": 57009, "epoch": 479, "lr": 9.824368769596126e-06} +{"train_loss": 0.0005361546645872295, "global_step": 57010, "epoch": 479, "lr": 9.823049943375218e-06} +{"train_loss": 0.0004440564080141485, "global_step": 57011, "epoch": 479, "lr": 9.82173119603747e-06} +{"train_loss": 0.0004465660604182631, "global_step": 57012, "epoch": 479, "lr": 9.820412527585453e-06} +{"train_loss": 0.000696406583301723, "global_step": 57013, "epoch": 479, "lr": 9.819093938021773e-06} +{"train_loss": 0.0004319361178204417, "global_step": 57014, "epoch": 479, "lr": 9.817775427349007e-06} +{"train_loss": 0.0004462430952116847, "global_step": 57015, "epoch": 479, "lr": 9.816456995569734e-06} +{"train_loss": 0.0006081581814214587, "global_step": 57016, "epoch": 479, "lr": 9.815138642686566e-06} +{"train_loss": 0.0002848055155482143, "global_step": 57017, "epoch": 479, "lr": 9.81382036870207e-06} +{"train_loss": 0.0004038831393700093, "global_step": 57018, "epoch": 479, "lr": 9.812502173618859e-06} +{"train_loss": 0.0005223266780376434, "global_step": 57019, "epoch": 479, "lr": 9.811184057439493e-06} +{"train_loss": 0.0005831748712807894, "global_step": 57020, "epoch": 479, "lr": 9.809866020166587e-06} +{"train_loss": 0.0004972016904503107, "global_step": 57021, "epoch": 479, "lr": 9.808548061802714e-06} +{"train_loss": 0.00033265698584727943, "global_step": 57022, "epoch": 479, "lr": 9.807230182350446e-06} +{"train_loss": 0.00037566007813438773, "global_step": 57023, "epoch": 479, "lr": 9.805912381812393e-06} +{"train_loss": 0.0005211298703216016, "global_step": 57024, "epoch": 479, "lr": 9.804594660191146e-06} +{"train_loss": 0.00046777218813076615, "global_step": 57025, "epoch": 479, "lr": 9.803277017489276e-06} +{"train_loss": 0.0005299607291817665, "global_step": 57026, "epoch": 479, "lr": 9.801959453709386e-06} +{"train_loss": 0.00028325276798568666, "global_step": 57027, "epoch": 479, "lr": 9.80064196885404e-06} +{"train_loss": 0.0005279335891827941, "global_step": 57028, "epoch": 479, "lr": 9.799324562925854e-06} +{"train_loss": 0.0003197844489477575, "global_step": 57029, "epoch": 479, "lr": 9.798007235927386e-06} +{"train_loss": 0.000690082844812423, "global_step": 57030, "epoch": 479, "lr": 9.796689987861247e-06} +{"train_loss": 0.0005363459931686521, "global_step": 57031, "epoch": 479, "lr": 9.795372818730003e-06} +{"train_loss": 0.0004899886553175747, "global_step": 57032, "epoch": 479, "lr": 9.79405572853626e-06} +{"train_loss": 0.0005747146205976605, "global_step": 57033, "epoch": 479, "lr": 9.79273871728259e-06} +{"train_loss": 0.00032954729977063835, "global_step": 57034, "epoch": 479, "lr": 9.791421784971572e-06} +{"train_loss": 0.0006940494058653712, "global_step": 57035, "epoch": 479, "lr": 9.79010493160582e-06} +{"train_loss": 0.0006072550895623863, "global_step": 57036, "epoch": 479, "lr": 9.788788157187877e-06} +{"train_loss": 0.0003320489777252078, "global_step": 57037, "epoch": 479, "lr": 9.787471461720377e-06} +{"train_loss": 0.0006212063017301261, "global_step": 57038, "epoch": 479, "lr": 9.786154845205859e-06} +{"train_loss": 0.00041039075586013496, "global_step": 57039, "epoch": 479, "lr": 9.784838307646948e-06} +{"train_loss": 0.0004913104930892587, "global_step": 57040, "epoch": 479, "lr": 9.783521849046207e-06} +{"train_loss": 0.0005106226890347898, "global_step": 57041, "epoch": 479, "lr": 9.782205469406215e-06} +{"train_loss": 0.00030949228676036, "global_step": 57042, "epoch": 479, "lr": 9.78088916872958e-06} +{"train_loss": 0.0007294302922673523, "global_step": 57043, "epoch": 479, "lr": 9.77957294701885e-06} +{"train_loss": 0.0004356690915301442, "global_step": 57044, "epoch": 479, "lr": 9.778256804276652e-06} +{"train_loss": 0.0003982357739005238, "global_step": 57045, "epoch": 479, "lr": 9.776940740505553e-06} +{"train_loss": 0.0003741273540072143, "global_step": 57046, "epoch": 479, "lr": 9.775624755708112e-06} +{"train_loss": 0.0005611898377537727, "global_step": 57047, "epoch": 479, "lr": 9.774308849886954e-06} +{"train_loss": 0.0007708797929808497, "global_step": 57048, "epoch": 479, "lr": 9.77299302304463e-06} +{"train_loss": 0.0004182485572528094, "global_step": 57049, "epoch": 479, "lr": 9.771677275183744e-06} +{"train_loss": 0.00044906733091920614, "global_step": 57050, "epoch": 479, "lr": 9.77036160630686e-06} +{"train_loss": 0.000497741624712944, "global_step": 57051, "epoch": 479, "lr": 9.76904601641659e-06} +{"train_loss": 0.0005462962435558438, "global_step": 57052, "epoch": 479, "lr": 9.767730505515499e-06} +{"train_loss": 0.0005981511203572154, "global_step": 57053, "epoch": 479, "lr": 9.766415073606161e-06} +{"train_loss": 0.0005770025309175253, "global_step": 57054, "epoch": 479, "lr": 9.765099720691173e-06} +{"train_loss": 0.0006130588008090854, "global_step": 57055, "epoch": 479, "lr": 9.763784446773106e-06} +{"train_loss": 0.00041301167220808566, "global_step": 57056, "epoch": 479, "lr": 9.762469251854561e-06} +{"train_loss": 0.0005238254088908434, "global_step": 57057, "epoch": 479, "lr": 9.7611541359381e-06} +{"train_loss": 0.0006836333777755499, "global_step": 57058, "epoch": 479, "lr": 9.759839099026308e-06} +{"train_loss": 0.000454712106147781, "global_step": 57059, "epoch": 479, "lr": 9.758524141121788e-06} +{"train_loss": 0.000649690511636436, "global_step": 57060, "epoch": 479, "lr": 9.757209262227096e-06} +{"train_loss": 0.00034347682958468795, "global_step": 57061, "epoch": 479, "lr": 9.75589446234484e-06} +{"train_loss": 0.0005449722521007061, "global_step": 57062, "epoch": 479, "lr": 9.754579741477565e-06} +{"train_loss": 0.000524811097420752, "global_step": 57063, "epoch": 479, "lr": 9.75326509962789e-06} +{"train_loss": 0.0003960927715525031, "global_step": 57064, "epoch": 479, "lr": 9.751950536798383e-06} +{"train_loss": 0.0005739592015743256, "global_step": 57065, "epoch": 479, "lr": 9.750636052991602e-06} +{"train_loss": 0.000520679634064436, "global_step": 57066, "epoch": 479, "lr": 9.749321648210163e-06} +{"train_loss": 0.00045936371316201985, "global_step": 57067, "epoch": 479, "lr": 9.748007322456615e-06} +{"train_loss": 0.0004501918738242239, "global_step": 57068, "epoch": 479, "lr": 9.74669307573357e-06} +{"train_loss": 0.0005693744169548154, "global_step": 57069, "epoch": 479, "lr": 9.745378908043578e-06} +{"train_loss": 0.0004812681581825018, "global_step": 57070, "epoch": 479, "lr": 9.744064819389248e-06} +{"train_loss": 0.0003522272745613009, "global_step": 57071, "epoch": 479, "lr": 9.742750809773143e-06} +{"train_loss": 0.00024804589338600636, "global_step": 57072, "epoch": 479, "lr": 9.74143687919784e-06} +{"train_loss": 0.0003914740227628499, "global_step": 57073, "epoch": 479, "lr": 9.740123027665932e-06} +{"train_loss": 0.0003974387072958052, "global_step": 57074, "epoch": 479, "lr": 9.738809255179982e-06} +{"train_loss": 0.00045168347423896194, "global_step": 57075, "epoch": 479, "lr": 9.737495561742589e-06} +{"train_loss": 0.0006258719367906451, "global_step": 57076, "epoch": 479, "lr": 9.73618194735631e-06} +{"train_loss": 0.0005045735160820186, "global_step": 57077, "epoch": 479, "lr": 9.734868412023746e-06} +{"train_loss": 0.00037573656300082803, "global_step": 57078, "epoch": 479, "lr": 9.73355495574747e-06} +{"train_loss": 0.0005738910404033959, "global_step": 57079, "epoch": 479, "lr": 9.732241578530044e-06} +{"train_loss": 0.00040898198494687676, "global_step": 57080, "epoch": 479, "lr": 9.730928280374074e-06} +{"train_loss": 0.0006063723121769726, "global_step": 57081, "epoch": 479, "lr": 9.729615061282105e-06} +{"train_loss": 0.00026200865977443755, "global_step": 57082, "epoch": 479, "lr": 9.728301921256755e-06} +{"train_loss": 0.0006977816228754818, "global_step": 57083, "epoch": 479, "lr": 9.726988860300579e-06} +{"train_loss": 0.00021960202138870955, "global_step": 57084, "epoch": 479, "lr": 9.72567587841614e-06} +{"train_loss": 0.0005961408605799079, "global_step": 57085, "epoch": 479, "lr": 9.724362975606054e-06} +{"train_loss": 0.0005436569335870445, "global_step": 57086, "epoch": 479, "lr": 9.723050151872858e-06} +{"train_loss": 0.0005779938073828816, "global_step": 57087, "epoch": 479, "lr": 9.721737407219172e-06} +{"train_loss": 0.0004056187462992966, "global_step": 57088, "epoch": 479, "lr": 9.720424741647532e-06} +{"train_loss": 0.0006707451539114118, "global_step": 57089, "epoch": 479, "lr": 9.719112155160548e-06} +{"train_loss": 0.0007225120207294822, "global_step": 57090, "epoch": 479, "lr": 9.717799647760773e-06} +{"train_loss": 0.0003382705326657742, "global_step": 57091, "epoch": 479, "lr": 9.716487219450809e-06} +{"train_loss": 0.0004308231291361153, "global_step": 57092, "epoch": 479, "lr": 9.715174870233207e-06} +{"train_loss": 0.00045292507275007665, "global_step": 57093, "epoch": 479, "lr": 9.71386260011055e-06} +{"train_loss": 0.00023619089915882796, "global_step": 57094, "epoch": 479, "lr": 9.712550409085435e-06} +{"train_loss": 0.0007970258011482656, "global_step": 57095, "epoch": 479, "lr": 9.711238297160424e-06} +{"train_loss": 0.0007292666123248637, "global_step": 57096, "epoch": 479, "lr": 9.709926264338081e-06} +{"train_loss": 0.0011884350096806884, "global_step": 57097, "epoch": 479, "lr": 9.708614310621e-06} +{"train_loss": 0.0004940934013575315, "global_step": 57098, "epoch": 479, "lr": 9.707302436011744e-06} +{"train_loss": 0.0005616539274342358, "global_step": 57099, "epoch": 479, "lr": 9.705990640512907e-06} +{"train_loss": 0.0007068944396451116, "global_step": 57100, "epoch": 479, "lr": 9.704678924127037e-06} +{"train_loss": 0.00038189676706679165, "global_step": 57101, "epoch": 479, "lr": 9.703367286856741e-06} +{"train_loss": 0.00032586028100922704, "global_step": 57102, "epoch": 479, "lr": 9.702055728704574e-06} +{"train_loss": 0.000693905574735254, "global_step": 57103, "epoch": 479, "lr": 9.700744249673104e-06} +{"train_loss": 0.000849726318847388, "global_step": 57104, "epoch": 479, "lr": 9.699432849764933e-06} +{"train_loss": 0.0004069102287758142, "global_step": 57105, "epoch": 479, "lr": 9.698121528982606e-06} +{"train_loss": 0.0005849329754710197, "global_step": 57106, "epoch": 479, "lr": 9.696810287328723e-06} +{"train_loss": 0.0002960154670290649, "global_step": 57107, "epoch": 479, "lr": 9.695499124805835e-06} +{"train_loss": 0.00041801712359301746, "global_step": 57108, "epoch": 479, "lr": 9.694188041416542e-06} +{"train_loss": 0.00029484429978765547, "global_step": 57109, "epoch": 479, "lr": 9.692877037163407e-06} +{"train_loss": 0.0006408208864741027, "global_step": 57110, "epoch": 479, "lr": 9.691566112048983e-06} +{"train_loss": 0.0004625410365406424, "global_step": 57111, "epoch": 479, "lr": 9.690255266075881e-06} +{"train_loss": 0.0008368065464310348, "global_step": 57112, "epoch": 479, "lr": 9.688944499246644e-06} +{"train_loss": 0.00088496197713539, "global_step": 57113, "epoch": 479, "lr": 9.687633811563868e-06} +{"train_loss": 0.0010834229178726673, "global_step": 57114, "epoch": 479, "lr": 9.686323203030118e-06} +{"train_loss": 0.0003790644695982337, "global_step": 57115, "epoch": 479, "lr": 9.685012673647948e-06} +{"train_loss": 0.00036277336766943336, "global_step": 57116, "epoch": 479, "lr": 9.683702223419965e-06} +{"train_loss": 0.000432081229519099, "global_step": 57117, "epoch": 479, "lr": 9.68239185234871e-06} +{"train_loss": 0.0003696479252539575, "global_step": 57118, "epoch": 479, "lr": 9.681081560436789e-06} +{"train_loss": 0.0005113204943354657, "global_step": 57119, "epoch": 479, "lr": 9.679771347686739e-06, "val_loss": 0.024378132075071335} +{"train_loss": 0.00042111839866265655, "global_step": 57120, "epoch": 480, "lr": 9.67846121410117e-06} +{"train_loss": 0.00047020683996379375, "global_step": 57121, "epoch": 480, "lr": 9.677151159682613e-06} +{"train_loss": 0.000414414273109287, "global_step": 57122, "epoch": 480, "lr": 9.675841184433681e-06} +{"train_loss": 0.0006906816270202398, "global_step": 57123, "epoch": 480, "lr": 9.674531288356914e-06} +{"train_loss": 0.0004333121469244361, "global_step": 57124, "epoch": 480, "lr": 9.673221471454908e-06} +{"train_loss": 0.0004652921052183956, "global_step": 57125, "epoch": 480, "lr": 9.67191173373021e-06} +{"train_loss": 0.0004183529526926577, "global_step": 57126, "epoch": 480, "lr": 9.670602075185415e-06} +{"train_loss": 0.0006468332139775157, "global_step": 57127, "epoch": 480, "lr": 9.669292495823074e-06} +{"train_loss": 0.0002843309775926173, "global_step": 57128, "epoch": 480, "lr": 9.667982995645786e-06} +{"train_loss": 0.0003801066195592284, "global_step": 57129, "epoch": 480, "lr": 9.666673574656087e-06} +{"train_loss": 0.000335104443365708, "global_step": 57130, "epoch": 480, "lr": 9.665364232856578e-06} +{"train_loss": 0.0005282722413539886, "global_step": 57131, "epoch": 480, "lr": 9.664054970249802e-06} +{"train_loss": 0.0006654286989942193, "global_step": 57132, "epoch": 480, "lr": 9.662745786838362e-06} +{"train_loss": 0.0003854941460303962, "global_step": 57133, "epoch": 480, "lr": 9.661436682624808e-06} +{"train_loss": 0.0007089798455126584, "global_step": 57134, "epoch": 480, "lr": 9.660127657611706e-06} +{"train_loss": 0.0006764949066564441, "global_step": 57135, "epoch": 480, "lr": 9.658818711801643e-06} +{"train_loss": 0.00041031811269931495, "global_step": 57136, "epoch": 480, "lr": 9.657509845197166e-06} +{"train_loss": 0.0007681756396777928, "global_step": 57137, "epoch": 480, "lr": 9.656201057800873e-06} +{"train_loss": 0.00036638096207752824, "global_step": 57138, "epoch": 480, "lr": 9.654892349615308e-06} +{"train_loss": 0.0009812259813770652, "global_step": 57139, "epoch": 480, "lr": 9.653583720643062e-06} +{"train_loss": 0.00043513980926945806, "global_step": 57140, "epoch": 480, "lr": 9.652275170886694e-06} +{"train_loss": 0.0005111228092573583, "global_step": 57141, "epoch": 480, "lr": 9.650966700348757e-06} +{"train_loss": 0.0006264802068471909, "global_step": 57142, "epoch": 480, "lr": 9.64965830903185e-06} +{"train_loss": 0.0001990870659938082, "global_step": 57143, "epoch": 480, "lr": 9.648349996938522e-06} +{"train_loss": 0.0007214686484076083, "global_step": 57144, "epoch": 480, "lr": 9.647041764071357e-06} +{"train_loss": 0.0005153054953552783, "global_step": 57145, "epoch": 480, "lr": 9.6457336104329e-06} +{"train_loss": 0.0006405373569577932, "global_step": 57146, "epoch": 480, "lr": 9.644425536025748e-06} +{"train_loss": 0.0003531999245751649, "global_step": 57147, "epoch": 480, "lr": 9.643117540852454e-06} +{"train_loss": 0.000619619560893625, "global_step": 57148, "epoch": 480, "lr": 9.641809624915576e-06} +{"train_loss": 0.0003333606873638928, "global_step": 57149, "epoch": 480, "lr": 9.640501788217705e-06} +{"train_loss": 0.000971394416410476, "global_step": 57150, "epoch": 480, "lr": 9.639194030761383e-06} +{"train_loss": 0.00042313538142479956, "global_step": 57151, "epoch": 480, "lr": 9.637886352549209e-06} +{"train_loss": 0.000485581491375342, "global_step": 57152, "epoch": 480, "lr": 9.636578753583726e-06} +{"train_loss": 0.000745568482670933, "global_step": 57153, "epoch": 480, "lr": 9.635271233867499e-06} +{"train_loss": 0.0004017552128061652, "global_step": 57154, "epoch": 480, "lr": 9.633963793403117e-06} +{"train_loss": 0.0005275423754937947, "global_step": 57155, "epoch": 480, "lr": 9.632656432193127e-06} +{"train_loss": 0.0003044149780180305, "global_step": 57156, "epoch": 480, "lr": 9.631349150240098e-06} +{"train_loss": 0.00038605890586040914, "global_step": 57157, "epoch": 480, "lr": 9.630041947546615e-06} +{"train_loss": 0.000658918812405318, "global_step": 57158, "epoch": 480, "lr": 9.62873482411522e-06} +{"train_loss": 0.00035138995735906065, "global_step": 57159, "epoch": 480, "lr": 9.627427779948506e-06} +{"train_loss": 0.0007434796425513923, "global_step": 57160, "epoch": 480, "lr": 9.626120815049006e-06} +{"train_loss": 0.000576270860619843, "global_step": 57161, "epoch": 480, "lr": 9.624813929419324e-06} +{"train_loss": 0.0003228119167033583, "global_step": 57162, "epoch": 480, "lr": 9.623507123061986e-06} +{"train_loss": 0.0003428116033319384, "global_step": 57163, "epoch": 480, "lr": 9.622200395979598e-06} +{"train_loss": 0.00034900620812550187, "global_step": 57164, "epoch": 480, "lr": 9.620893748174703e-06} +{"train_loss": 0.001213966403156519, "global_step": 57165, "epoch": 480, "lr": 9.619587179649858e-06} +{"train_loss": 0.0005579515709541738, "global_step": 57166, "epoch": 480, "lr": 9.618280690407649e-06} +{"train_loss": 0.00045197445433586836, "global_step": 57167, "epoch": 480, "lr": 9.616974280450618e-06} +{"train_loss": 0.0004386055807117373, "global_step": 57168, "epoch": 480, "lr": 9.615667949781359e-06} +{"train_loss": 0.00030109004001133144, "global_step": 57169, "epoch": 480, "lr": 9.614361698402413e-06} +{"train_loss": 0.000526545918546617, "global_step": 57170, "epoch": 480, "lr": 9.613055526316361e-06} +{"train_loss": 0.0005065227160230279, "global_step": 57171, "epoch": 480, "lr": 9.611749433525763e-06} +{"train_loss": 0.00038747492362745106, "global_step": 57172, "epoch": 480, "lr": 9.610443420033165e-06} +{"train_loss": 0.0003468259528744966, "global_step": 57173, "epoch": 480, "lr": 9.609137485841158e-06} +{"train_loss": 0.0004103646788280457, "global_step": 57174, "epoch": 480, "lr": 9.607831630952286e-06} +{"train_loss": 0.00044096403871662915, "global_step": 57175, "epoch": 480, "lr": 9.60652585536913e-06} +{"train_loss": 0.00042102360748685896, "global_step": 57176, "epoch": 480, "lr": 9.60522015909423e-06} +{"train_loss": 0.0003586271486710757, "global_step": 57177, "epoch": 480, "lr": 9.603914542130183e-06} +{"train_loss": 0.0008226626086980104, "global_step": 57178, "epoch": 480, "lr": 9.602609004479528e-06} +{"train_loss": 0.0003457522252574563, "global_step": 57179, "epoch": 480, "lr": 9.601303546144829e-06} +{"train_loss": 0.0009636491304263473, "global_step": 57180, "epoch": 480, "lr": 9.599998167128666e-06} +{"train_loss": 0.000697030161973089, "global_step": 57181, "epoch": 480, "lr": 9.598692867433573e-06} +{"train_loss": 0.0003109307726845145, "global_step": 57182, "epoch": 480, "lr": 9.597387647062145e-06} +{"train_loss": 0.0004658888792619109, "global_step": 57183, "epoch": 480, "lr": 9.596082506016934e-06} +{"train_loss": 0.0005148735363036394, "global_step": 57184, "epoch": 480, "lr": 9.594777444300479e-06} +{"train_loss": 0.00032479444053024054, "global_step": 57185, "epoch": 480, "lr": 9.593472461915381e-06} +{"train_loss": 0.0005551128415390849, "global_step": 57186, "epoch": 480, "lr": 9.592167558864167e-06} +{"train_loss": 0.0006735672359354794, "global_step": 57187, "epoch": 480, "lr": 9.590862735149425e-06} +{"train_loss": 0.00041666076867841184, "global_step": 57188, "epoch": 480, "lr": 9.589557990773701e-06} +{"train_loss": 0.00041922988020814955, "global_step": 57189, "epoch": 480, "lr": 9.588253325739572e-06} +{"train_loss": 0.0005175921251066029, "global_step": 57190, "epoch": 480, "lr": 9.586948740049573e-06} +{"train_loss": 0.0005943858413957059, "global_step": 57191, "epoch": 480, "lr": 9.585644233706287e-06} +{"train_loss": 0.0005110291531309485, "global_step": 57192, "epoch": 480, "lr": 9.584339806712284e-06} +{"train_loss": 0.0003651058941613883, "global_step": 57193, "epoch": 480, "lr": 9.583035459070099e-06} +{"train_loss": 0.0006651094881817698, "global_step": 57194, "epoch": 480, "lr": 9.581731190782318e-06} +{"train_loss": 0.0005685670766979456, "global_step": 57195, "epoch": 480, "lr": 9.580427001851478e-06} +{"train_loss": 0.00036566852941177785, "global_step": 57196, "epoch": 480, "lr": 9.579122892280163e-06} +{"train_loss": 0.0004491505678743124, "global_step": 57197, "epoch": 480, "lr": 9.577818862070925e-06} +{"train_loss": 0.00023041876556817442, "global_step": 57198, "epoch": 480, "lr": 9.576514911226304e-06} +{"train_loss": 0.00044386935769580305, "global_step": 57199, "epoch": 480, "lr": 9.575211039748894e-06} +{"train_loss": 0.00039515120442956686, "global_step": 57200, "epoch": 480, "lr": 9.573907247641223e-06} +{"train_loss": 0.00042394164483994246, "global_step": 57201, "epoch": 480, "lr": 9.572603534905877e-06} +{"train_loss": 0.0004025367379654199, "global_step": 57202, "epoch": 480, "lr": 9.571299901545411e-06} +{"train_loss": 0.0004173202032689005, "global_step": 57203, "epoch": 480, "lr": 9.56999634756236e-06} +{"train_loss": 0.0003578411997295916, "global_step": 57204, "epoch": 480, "lr": 9.568692872959316e-06} +{"train_loss": 0.0005840828525833786, "global_step": 57205, "epoch": 480, "lr": 9.567389477738814e-06} +{"train_loss": 0.0005433691549114883, "global_step": 57206, "epoch": 480, "lr": 9.56608616190343e-06} +{"train_loss": 0.0004773861146531999, "global_step": 57207, "epoch": 480, "lr": 9.564782925455712e-06} +{"train_loss": 0.0004433457797858864, "global_step": 57208, "epoch": 480, "lr": 9.563479768398232e-06} +{"train_loss": 0.0002914991637226194, "global_step": 57209, "epoch": 480, "lr": 9.562176690733538e-06} +{"train_loss": 0.00038186428719200194, "global_step": 57210, "epoch": 480, "lr": 9.56087369246418e-06} +{"train_loss": 0.0004735655675176531, "global_step": 57211, "epoch": 480, "lr": 9.559570773592735e-06} +{"train_loss": 0.00022848049411550164, "global_step": 57212, "epoch": 480, "lr": 9.55826793412174e-06} +{"train_loss": 0.001275310292840004, "global_step": 57213, "epoch": 480, "lr": 9.556965174053778e-06} +{"train_loss": 0.0004014746518805623, "global_step": 57214, "epoch": 480, "lr": 9.555662493391398e-06} +{"train_loss": 0.00038382105412892997, "global_step": 57215, "epoch": 480, "lr": 9.554359892137137e-06} +{"train_loss": 0.0005142972804605961, "global_step": 57216, "epoch": 480, "lr": 9.553057370293583e-06} +{"train_loss": 0.0007563857943750918, "global_step": 57217, "epoch": 480, "lr": 9.551754927863272e-06} +{"train_loss": 0.00047540906234644353, "global_step": 57218, "epoch": 480, "lr": 9.550452564848772e-06} +{"train_loss": 0.0008281894261017442, "global_step": 57219, "epoch": 480, "lr": 9.549150281252633e-06} +{"train_loss": 0.0008595052058808506, "global_step": 57220, "epoch": 480, "lr": 9.547848077077427e-06} +{"train_loss": 0.0003139651380479336, "global_step": 57221, "epoch": 480, "lr": 9.54654595232568e-06} +{"train_loss": 0.00033926303149200976, "global_step": 57222, "epoch": 480, "lr": 9.54524390699999e-06} +{"train_loss": 0.0006007274496369064, "global_step": 57223, "epoch": 480, "lr": 9.543941941102874e-06} +{"train_loss": 0.0007387922960333526, "global_step": 57224, "epoch": 480, "lr": 9.54264005463692e-06} +{"train_loss": 0.0008823963580653071, "global_step": 57225, "epoch": 480, "lr": 9.54133824760466e-06} +{"train_loss": 0.0005872529000043869, "global_step": 57226, "epoch": 480, "lr": 9.540036520008655e-06} +{"train_loss": 0.0004175057983957231, "global_step": 57227, "epoch": 480, "lr": 9.538734871851479e-06} +{"train_loss": 0.000636559387203306, "global_step": 57228, "epoch": 480, "lr": 9.537433303135678e-06} +{"train_loss": 0.0005053045460954309, "global_step": 57229, "epoch": 480, "lr": 9.536131813863786e-06} +{"train_loss": 0.0005428699660114944, "global_step": 57230, "epoch": 480, "lr": 9.534830404038391e-06} +{"train_loss": 0.0004366838838905096, "global_step": 57231, "epoch": 480, "lr": 9.533529073662023e-06} +{"train_loss": 0.00020555620722007006, "global_step": 57232, "epoch": 480, "lr": 9.532227822737261e-06} +{"train_loss": 0.0005355808534659445, "global_step": 57233, "epoch": 480, "lr": 9.530926651266642e-06} +{"train_loss": 0.0007694789674133062, "global_step": 57234, "epoch": 480, "lr": 9.529625559252713e-06} +{"train_loss": 0.0006368769682012498, "global_step": 57235, "epoch": 480, "lr": 9.528324546698058e-06} +{"train_loss": 0.0007092223968356848, "global_step": 57236, "epoch": 480, "lr": 9.527023613605195e-06} +{"train_loss": 0.000382934114895761, "global_step": 57237, "epoch": 480, "lr": 9.525722759976718e-06} +{"train_loss": 0.0005151099524658345, "global_step": 57238, "epoch": 480, "lr": 9.52442198581514e-06, "val_loss": 0.019154109060764313, "train_action_mse_error": 6.930170002306113e-06} +{"train_loss": 0.0003773197822738439, "global_step": 57239, "epoch": 481, "lr": 9.52312129112305e-06} +{"train_loss": 0.0005554814706556499, "global_step": 57240, "epoch": 481, "lr": 9.521820675902992e-06} +{"train_loss": 0.0004410476831253618, "global_step": 57241, "epoch": 481, "lr": 9.520520140157496e-06} +{"train_loss": 0.0005961722927168012, "global_step": 57242, "epoch": 481, "lr": 9.519219683889147e-06} +{"train_loss": 0.0003413888916838914, "global_step": 57243, "epoch": 481, "lr": 9.517919307100477e-06} +{"train_loss": 0.0006718513905070722, "global_step": 57244, "epoch": 481, "lr": 9.516619009794054e-06} +{"train_loss": 0.0002931845374405384, "global_step": 57245, "epoch": 481, "lr": 9.515318791972417e-06} +{"train_loss": 0.0002997317351400852, "global_step": 57246, "epoch": 481, "lr": 9.51401865363814e-06} +{"train_loss": 0.0005369935533963144, "global_step": 57247, "epoch": 481, "lr": 9.512718594793756e-06} +{"train_loss": 0.000416573544498533, "global_step": 57248, "epoch": 481, "lr": 9.511418615441814e-06} +{"train_loss": 0.00034077742020599544, "global_step": 57249, "epoch": 481, "lr": 9.510118715584892e-06} +{"train_loss": 0.0004272845108062029, "global_step": 57250, "epoch": 481, "lr": 9.508818895225507e-06} +{"train_loss": 0.0004334850236773491, "global_step": 57251, "epoch": 481, "lr": 9.507519154366251e-06} +{"train_loss": 0.00032052575261332095, "global_step": 57252, "epoch": 481, "lr": 9.50621949300965e-06} +{"train_loss": 0.0003925933560822159, "global_step": 57253, "epoch": 481, "lr": 9.50491991115825e-06} +{"train_loss": 0.0004994962364435196, "global_step": 57254, "epoch": 481, "lr": 9.503620408814612e-06} +{"train_loss": 0.0008559431880712509, "global_step": 57255, "epoch": 481, "lr": 9.5023209859813e-06} +{"train_loss": 0.0003804322623182088, "global_step": 57256, "epoch": 481, "lr": 9.501021642660846e-06} +{"train_loss": 0.0002793815510813147, "global_step": 57257, "epoch": 481, "lr": 9.499722378855818e-06} +{"train_loss": 0.0007010929984971881, "global_step": 57258, "epoch": 481, "lr": 9.498423194568745e-06} +{"train_loss": 0.00046538602327927947, "global_step": 57259, "epoch": 481, "lr": 9.497124089802206e-06} +{"train_loss": 0.00034542815410532057, "global_step": 57260, "epoch": 481, "lr": 9.495825064558728e-06} +{"train_loss": 0.0006163587677292526, "global_step": 57261, "epoch": 481, "lr": 9.494526118840879e-06} +{"train_loss": 0.0005207801586948335, "global_step": 57262, "epoch": 481, "lr": 9.493227252651188e-06} +{"train_loss": 0.0006081637693569064, "global_step": 57263, "epoch": 481, "lr": 9.491928465992228e-06} +{"train_loss": 0.0005569793283939362, "global_step": 57264, "epoch": 481, "lr": 9.490629758866526e-06} +{"train_loss": 0.0005935713415965438, "global_step": 57265, "epoch": 481, "lr": 9.489331131276663e-06} +{"train_loss": 0.000630618364084512, "global_step": 57266, "epoch": 481, "lr": 9.488032583225165e-06} +{"train_loss": 0.0006318653468042612, "global_step": 57267, "epoch": 481, "lr": 9.48673411471458e-06} +{"train_loss": 0.0004143413680139929, "global_step": 57268, "epoch": 481, "lr": 9.485435725747472e-06} +{"train_loss": 0.00039238977478817105, "global_step": 57269, "epoch": 481, "lr": 9.484137416326373e-06} +{"train_loss": 0.00042882829438894987, "global_step": 57270, "epoch": 481, "lr": 9.482839186453851e-06} +{"train_loss": 0.0002550658246036619, "global_step": 57271, "epoch": 481, "lr": 9.481541036132446e-06} +{"train_loss": 0.0003425139293540269, "global_step": 57272, "epoch": 481, "lr": 9.4802429653647e-06} +{"train_loss": 0.0004046827380079776, "global_step": 57273, "epoch": 481, "lr": 9.478944974153176e-06} +{"train_loss": 0.00035566918086260557, "global_step": 57274, "epoch": 481, "lr": 9.4776470625004e-06} +{"train_loss": 0.0003012942033819854, "global_step": 57275, "epoch": 481, "lr": 9.476349230408949e-06} +{"train_loss": 0.0004236130334902555, "global_step": 57276, "epoch": 481, "lr": 9.475051477881341e-06} +{"train_loss": 0.00031117405160330236, "global_step": 57277, "epoch": 481, "lr": 9.47375380492016e-06} +{"train_loss": 0.00038152895285747945, "global_step": 57278, "epoch": 481, "lr": 9.472456211527931e-06} +{"train_loss": 0.0004743478784803301, "global_step": 57279, "epoch": 481, "lr": 9.471158697707188e-06} +{"train_loss": 0.000792402948718518, "global_step": 57280, "epoch": 481, "lr": 9.469861263460512e-06} +{"train_loss": 0.0005664842901751399, "global_step": 57281, "epoch": 481, "lr": 9.468563908790417e-06} +{"train_loss": 0.0006125136278569698, "global_step": 57282, "epoch": 481, "lr": 9.467266633699484e-06} +{"train_loss": 0.0006087303045205772, "global_step": 57283, "epoch": 481, "lr": 9.465969438190243e-06} +{"train_loss": 0.0007085009128786623, "global_step": 57284, "epoch": 481, "lr": 9.464672322265222e-06} +{"train_loss": 0.0003648421843536198, "global_step": 57285, "epoch": 481, "lr": 9.463375285927001e-06} +{"train_loss": 0.0005376619519665837, "global_step": 57286, "epoch": 481, "lr": 9.462078329178103e-06} +{"train_loss": 0.0006480067386291921, "global_step": 57287, "epoch": 481, "lr": 9.460781452021095e-06} +{"train_loss": 0.0005356947076506913, "global_step": 57288, "epoch": 481, "lr": 9.459484654458495e-06} +{"train_loss": 0.0004750617372337729, "global_step": 57289, "epoch": 481, "lr": 9.458187936492869e-06} +{"train_loss": 0.0004128843720536679, "global_step": 57290, "epoch": 481, "lr": 9.456891298126769e-06} +{"train_loss": 0.0006618381012231112, "global_step": 57291, "epoch": 481, "lr": 9.455594739362722e-06} +{"train_loss": 0.0006195526802912354, "global_step": 57292, "epoch": 481, "lr": 9.454298260203298e-06} +{"train_loss": 0.0005683504277840257, "global_step": 57293, "epoch": 481, "lr": 9.453001860651011e-06} +{"train_loss": 0.00043242835090495646, "global_step": 57294, "epoch": 481, "lr": 9.451705540708439e-06} +{"train_loss": 0.0003764789435081184, "global_step": 57295, "epoch": 481, "lr": 9.450409300378093e-06} +{"train_loss": 0.00042498306720517576, "global_step": 57296, "epoch": 481, "lr": 9.449113139662553e-06} +{"train_loss": 0.0002473018248565495, "global_step": 57297, "epoch": 481, "lr": 9.447817058564345e-06} +{"train_loss": 0.0002681565238162875, "global_step": 57298, "epoch": 481, "lr": 9.446521057086005e-06} +{"train_loss": 0.00032412211294285953, "global_step": 57299, "epoch": 481, "lr": 9.445225135230102e-06} +{"train_loss": 0.0005167926428839564, "global_step": 57300, "epoch": 481, "lr": 9.443929292999154e-06} +{"train_loss": 0.00027081547887064517, "global_step": 57301, "epoch": 481, "lr": 9.442633530395728e-06} +{"train_loss": 0.000348607572959736, "global_step": 57302, "epoch": 481, "lr": 9.44133784742236e-06} +{"train_loss": 0.00032431352883577347, "global_step": 57303, "epoch": 481, "lr": 9.440042244081581e-06} +{"train_loss": 0.0006291603785939515, "global_step": 57304, "epoch": 481, "lr": 9.438746720375957e-06} +{"train_loss": 0.0003635975590441376, "global_step": 57305, "epoch": 481, "lr": 9.437451276308007e-06} +{"train_loss": 0.0004525664262473583, "global_step": 57306, "epoch": 481, "lr": 9.4361559118803e-06} +{"train_loss": 0.00039389304583892226, "global_step": 57307, "epoch": 481, "lr": 9.43486062709536e-06} +{"train_loss": 0.0003316550573799759, "global_step": 57308, "epoch": 481, "lr": 9.433565421955742e-06} +{"train_loss": 0.0005695590516552329, "global_step": 57309, "epoch": 481, "lr": 9.43227029646399e-06} +{"train_loss": 0.0004302093293517828, "global_step": 57310, "epoch": 481, "lr": 9.430975250622626e-06} +{"train_loss": 0.0006339777610264719, "global_step": 57311, "epoch": 481, "lr": 9.429680284434222e-06} +{"train_loss": 0.0004646042361855507, "global_step": 57312, "epoch": 481, "lr": 9.428385397901296e-06} +{"train_loss": 0.0005318733747117221, "global_step": 57313, "epoch": 481, "lr": 9.42709059102641e-06} +{"train_loss": 0.0011177690466865897, "global_step": 57314, "epoch": 481, "lr": 9.425795863812087e-06} +{"train_loss": 0.0005266538937576115, "global_step": 57315, "epoch": 481, "lr": 9.42450121626089e-06} +{"train_loss": 0.0003276902425568551, "global_step": 57316, "epoch": 481, "lr": 9.423206648375348e-06} +{"train_loss": 0.0003698397777043283, "global_step": 57317, "epoch": 481, "lr": 9.421912160157992e-06} +{"train_loss": 0.00023045987472869456, "global_step": 57318, "epoch": 481, "lr": 9.420617751611393e-06} +{"train_loss": 0.0004899504128843546, "global_step": 57319, "epoch": 481, "lr": 9.419323422738063e-06} +{"train_loss": 0.00040668874862603843, "global_step": 57320, "epoch": 481, "lr": 9.418029173540566e-06} +{"train_loss": 0.000409064901759848, "global_step": 57321, "epoch": 481, "lr": 9.416735004021421e-06} +{"train_loss": 0.0003791440976783633, "global_step": 57322, "epoch": 481, "lr": 9.415440914183194e-06} +{"train_loss": 0.0005762490327470005, "global_step": 57323, "epoch": 481, "lr": 9.414146904028403e-06} +{"train_loss": 0.00037029519444331527, "global_step": 57324, "epoch": 481, "lr": 9.412852973559595e-06} +{"train_loss": 0.0010374091798439622, "global_step": 57325, "epoch": 481, "lr": 9.411559122779329e-06} +{"train_loss": 0.0006166951498016715, "global_step": 57326, "epoch": 481, "lr": 9.410265351690112e-06} +{"train_loss": 0.000541853136382997, "global_step": 57327, "epoch": 481, "lr": 9.408971660294524e-06} +{"train_loss": 0.00039391504833474755, "global_step": 57328, "epoch": 481, "lr": 9.407678048595081e-06} +{"train_loss": 0.00030049768975004554, "global_step": 57329, "epoch": 481, "lr": 9.406384516594308e-06} +{"train_loss": 0.0005006805877201259, "global_step": 57330, "epoch": 481, "lr": 9.405091064294779e-06} +{"train_loss": 0.0005505764274857938, "global_step": 57331, "epoch": 481, "lr": 9.403797691699002e-06} +{"train_loss": 0.0005075444933027029, "global_step": 57332, "epoch": 481, "lr": 9.402504398809547e-06} +{"train_loss": 0.000627720495685935, "global_step": 57333, "epoch": 481, "lr": 9.401211185628921e-06} +{"train_loss": 0.0008606819319538772, "global_step": 57334, "epoch": 481, "lr": 9.399918052159695e-06} +{"train_loss": 0.0002252540143672377, "global_step": 57335, "epoch": 481, "lr": 9.398624998404393e-06} +{"train_loss": 0.0004545265401247889, "global_step": 57336, "epoch": 481, "lr": 9.397332024365541e-06} +{"train_loss": 0.0005739133339375257, "global_step": 57337, "epoch": 481, "lr": 9.396039130045698e-06} +{"train_loss": 0.0004543120739981532, "global_step": 57338, "epoch": 481, "lr": 9.394746315447383e-06} +{"train_loss": 0.00041737619903869927, "global_step": 57339, "epoch": 481, "lr": 9.393453580573159e-06} +{"train_loss": 0.0004171815817244351, "global_step": 57340, "epoch": 481, "lr": 9.392160925425552e-06} +{"train_loss": 0.0003882895107381046, "global_step": 57341, "epoch": 481, "lr": 9.390868350007088e-06} +{"train_loss": 0.0005208213697187603, "global_step": 57342, "epoch": 481, "lr": 9.389575854320326e-06} +{"train_loss": 0.00038856148603372276, "global_step": 57343, "epoch": 481, "lr": 9.388283438367778e-06} +{"train_loss": 0.00034935673465952277, "global_step": 57344, "epoch": 481, "lr": 9.38699110215201e-06} +{"train_loss": 0.000269865122390911, "global_step": 57345, "epoch": 481, "lr": 9.385698845675533e-06} +{"train_loss": 0.00041292159585282207, "global_step": 57346, "epoch": 481, "lr": 9.384406668940915e-06} +{"train_loss": 0.0008057245868258178, "global_step": 57347, "epoch": 481, "lr": 9.383114571950675e-06} +{"train_loss": 0.0005332354339770973, "global_step": 57348, "epoch": 481, "lr": 9.381822554707331e-06} +{"train_loss": 0.0004897227045148611, "global_step": 57349, "epoch": 481, "lr": 9.380530617213457e-06} +{"train_loss": 0.0005025776918046176, "global_step": 57350, "epoch": 481, "lr": 9.379238759471554e-06} +{"train_loss": 0.0005456796498037875, "global_step": 57351, "epoch": 481, "lr": 9.377946981484193e-06} +{"train_loss": 0.0003669647267088294, "global_step": 57352, "epoch": 481, "lr": 9.376655283253882e-06} +{"train_loss": 0.0005883093690499663, "global_step": 57353, "epoch": 481, "lr": 9.375363664783177e-06} +{"train_loss": 0.0006212507141754031, "global_step": 57354, "epoch": 481, "lr": 9.374072126074595e-06} +{"train_loss": 0.0003806080494541675, "global_step": 57355, "epoch": 481, "lr": 9.372780667130693e-06} +{"train_loss": 0.0004225319717079401, "global_step": 57356, "epoch": 481, "lr": 9.371489287953983e-06} +{"train_loss": 0.0004772857976627356, "global_step": 57357, "epoch": 481, "lr": 9.37019798854703e-06, "val_loss": 0.02899014577269554} +{"train_loss": 0.0006370932096615434, "global_step": 57358, "epoch": 482, "lr": 9.36890676891234e-06} +{"train_loss": 0.0004987223073840141, "global_step": 57359, "epoch": 482, "lr": 9.367615629052467e-06} +{"train_loss": 0.0004381965263746679, "global_step": 57360, "epoch": 482, "lr": 9.366324568969931e-06} +{"train_loss": 0.0002235219581052661, "global_step": 57361, "epoch": 482, "lr": 9.365033588667288e-06} +{"train_loss": 0.00026175292441621423, "global_step": 57362, "epoch": 482, "lr": 9.363742688147049e-06} +{"train_loss": 0.0007179409731179476, "global_step": 57363, "epoch": 482, "lr": 9.36245186741177e-06} +{"train_loss": 0.00045694739674218, "global_step": 57364, "epoch": 482, "lr": 9.361161126463963e-06} +{"train_loss": 0.0004238798574078828, "global_step": 57365, "epoch": 482, "lr": 9.359870465306187e-06} +{"train_loss": 0.0005782891530543566, "global_step": 57366, "epoch": 482, "lr": 9.358579883940966e-06} +{"train_loss": 0.0006289005395956337, "global_step": 57367, "epoch": 482, "lr": 9.357289382370816e-06} +{"train_loss": 0.0007473548757843673, "global_step": 57368, "epoch": 482, "lr": 9.3559989605983e-06} +{"train_loss": 0.0006278331857174635, "global_step": 57369, "epoch": 482, "lr": 9.35470861862593e-06} +{"train_loss": 0.00070038071135059, "global_step": 57370, "epoch": 482, "lr": 9.35341835645625e-06} +{"train_loss": 0.00019723955483641475, "global_step": 57371, "epoch": 482, "lr": 9.352128174091801e-06} +{"train_loss": 0.00043962185736745596, "global_step": 57372, "epoch": 482, "lr": 9.350838071535084e-06} +{"train_loss": 0.00041950575541704893, "global_step": 57373, "epoch": 482, "lr": 9.349548048788675e-06} +{"train_loss": 0.00041233343654312193, "global_step": 57374, "epoch": 482, "lr": 9.348258105855068e-06} +{"train_loss": 0.0004850111436098814, "global_step": 57375, "epoch": 482, "lr": 9.346968242736825e-06} +{"train_loss": 0.00041732299723662436, "global_step": 57376, "epoch": 482, "lr": 9.345678459436458e-06} +{"train_loss": 0.000355610711267218, "global_step": 57377, "epoch": 482, "lr": 9.344388755956518e-06} +{"train_loss": 0.0007680390845052898, "global_step": 57378, "epoch": 482, "lr": 9.343099132299527e-06} +{"train_loss": 0.0003654526371974498, "global_step": 57379, "epoch": 482, "lr": 9.341809588468004e-06} +{"train_loss": 0.0006023214082233608, "global_step": 57380, "epoch": 482, "lr": 9.340520124464508e-06} +{"train_loss": 0.0007437182939611375, "global_step": 57381, "epoch": 482, "lr": 9.339230740291543e-06} +{"train_loss": 0.0008397464407607913, "global_step": 57382, "epoch": 482, "lr": 9.337941435951669e-06} +{"train_loss": 0.00030653891735710204, "global_step": 57383, "epoch": 482, "lr": 9.336652211447388e-06} +{"train_loss": 0.0004601121472660452, "global_step": 57384, "epoch": 482, "lr": 9.335363066781261e-06} +{"train_loss": 0.0004268148331902921, "global_step": 57385, "epoch": 482, "lr": 9.334074001955789e-06} +{"train_loss": 0.0003876730042975396, "global_step": 57386, "epoch": 482, "lr": 9.332785016973533e-06} +{"train_loss": 0.00032470928272232413, "global_step": 57387, "epoch": 482, "lr": 9.331496111836995e-06} +{"train_loss": 0.0003195581375621259, "global_step": 57388, "epoch": 482, "lr": 9.330207286548737e-06} +{"train_loss": 0.0005140213761478662, "global_step": 57389, "epoch": 482, "lr": 9.328918541111253e-06} +{"train_loss": 0.0003358715621288866, "global_step": 57390, "epoch": 482, "lr": 9.327629875527111e-06} +{"train_loss": 0.0004352937685325742, "global_step": 57391, "epoch": 482, "lr": 9.326341289798807e-06} +{"train_loss": 0.00030957284616306424, "global_step": 57392, "epoch": 482, "lr": 9.3250527839289e-06} +{"train_loss": 0.000761806673835963, "global_step": 57393, "epoch": 482, "lr": 9.32376435791989e-06} +{"train_loss": 0.0006579330074600875, "global_step": 57394, "epoch": 482, "lr": 9.32247601177434e-06} +{"train_loss": 0.0002906519512180239, "global_step": 57395, "epoch": 482, "lr": 9.321187745494747e-06} +{"train_loss": 0.00025349503266625106, "global_step": 57396, "epoch": 482, "lr": 9.319899559083673e-06} +{"train_loss": 0.0007439234177581966, "global_step": 57397, "epoch": 482, "lr": 9.318611452543625e-06} +{"train_loss": 0.000726357800886035, "global_step": 57398, "epoch": 482, "lr": 9.317323425877128e-06} +{"train_loss": 0.0005450727185234427, "global_step": 57399, "epoch": 482, "lr": 9.316035479086727e-06} +{"train_loss": 0.0002223494666395709, "global_step": 57400, "epoch": 482, "lr": 9.31474761217494e-06} +{"train_loss": 0.000690374756231904, "global_step": 57401, "epoch": 482, "lr": 9.313459825144306e-06} +{"train_loss": 0.0005386840784922242, "global_step": 57402, "epoch": 482, "lr": 9.312172117997348e-06} +{"train_loss": 0.00027984040207229555, "global_step": 57403, "epoch": 482, "lr": 9.310884490736582e-06} +{"train_loss": 0.0003991304256487638, "global_step": 57404, "epoch": 482, "lr": 9.309596943364556e-06} +{"train_loss": 0.0004569122102111578, "global_step": 57405, "epoch": 482, "lr": 9.30830947588378e-06} +{"train_loss": 0.0004317990969866514, "global_step": 57406, "epoch": 482, "lr": 9.307022088296808e-06} +{"train_loss": 0.000485244148876518, "global_step": 57407, "epoch": 482, "lr": 9.30573478060613e-06} +{"train_loss": 0.00043194074532948434, "global_step": 57408, "epoch": 482, "lr": 9.30444755281431e-06} +{"train_loss": 0.0007083017844706774, "global_step": 57409, "epoch": 482, "lr": 9.303160404923861e-06} +{"train_loss": 0.00041881093056872487, "global_step": 57410, "epoch": 482, "lr": 9.301873336937295e-06} +{"train_loss": 0.00045401687384583056, "global_step": 57411, "epoch": 482, "lr": 9.300586348857166e-06} +{"train_loss": 0.0003813808725681156, "global_step": 57412, "epoch": 482, "lr": 9.299299440685977e-06} +{"train_loss": 0.0002045890287263319, "global_step": 57413, "epoch": 482, "lr": 9.298012612426277e-06} +{"train_loss": 0.000390147470170632, "global_step": 57414, "epoch": 482, "lr": 9.296725864080563e-06} +{"train_loss": 0.000535551633220166, "global_step": 57415, "epoch": 482, "lr": 9.295439195651395e-06} +{"train_loss": 0.0005900964024476707, "global_step": 57416, "epoch": 482, "lr": 9.294152607141287e-06} +{"train_loss": 0.0008501646225340664, "global_step": 57417, "epoch": 482, "lr": 9.292866098552743e-06} +{"train_loss": 0.0002906404552049935, "global_step": 57418, "epoch": 482, "lr": 9.291579669888322e-06} +{"train_loss": 0.0002845684939529747, "global_step": 57419, "epoch": 482, "lr": 9.290293321150528e-06} +{"train_loss": 0.0005553277442231774, "global_step": 57420, "epoch": 482, "lr": 9.289007052341885e-06} +{"train_loss": 0.0005317957838997245, "global_step": 57421, "epoch": 482, "lr": 9.28772086346495e-06} +{"train_loss": 0.0003913329273927957, "global_step": 57422, "epoch": 482, "lr": 9.286434754522205e-06} +{"train_loss": 0.00031114049488678575, "global_step": 57423, "epoch": 482, "lr": 9.285148725516213e-06} +{"train_loss": 0.00046626158291473985, "global_step": 57424, "epoch": 482, "lr": 9.283862776449465e-06} +{"train_loss": 0.0007641452248208225, "global_step": 57425, "epoch": 482, "lr": 9.28257690732452e-06} +{"train_loss": 0.0003208983689546585, "global_step": 57426, "epoch": 482, "lr": 9.28129111814387e-06} +{"train_loss": 0.0007195843500085175, "global_step": 57427, "epoch": 482, "lr": 9.280005408910064e-06} +{"train_loss": 0.0002613325195852667, "global_step": 57428, "epoch": 482, "lr": 9.278719779625622e-06} +{"train_loss": 0.00036874410579912364, "global_step": 57429, "epoch": 482, "lr": 9.277434230293047e-06} +{"train_loss": 0.0005028079031035304, "global_step": 57430, "epoch": 482, "lr": 9.276148760914893e-06} +{"train_loss": 0.0006681039812974632, "global_step": 57431, "epoch": 482, "lr": 9.274863371493664e-06} +{"train_loss": 0.0005609166692011058, "global_step": 57432, "epoch": 482, "lr": 9.273578062031896e-06} +{"train_loss": 0.0004285933682695031, "global_step": 57433, "epoch": 482, "lr": 9.272292832532093e-06} +{"train_loss": 0.0004368973895907402, "global_step": 57434, "epoch": 482, "lr": 9.271007682996807e-06} +{"train_loss": 0.0005820962833240628, "global_step": 57435, "epoch": 482, "lr": 9.269722613428544e-06} +{"train_loss": 0.0003357859677635133, "global_step": 57436, "epoch": 482, "lr": 9.268437623829817e-06} +{"train_loss": 0.0006216457113623619, "global_step": 57437, "epoch": 482, "lr": 9.26715271420318e-06} +{"train_loss": 0.00035978941014036536, "global_step": 57438, "epoch": 482, "lr": 9.265867884551117e-06} +{"train_loss": 0.0006442572921514511, "global_step": 57439, "epoch": 482, "lr": 9.264583134876186e-06} +{"train_loss": 0.0003663520619738847, "global_step": 57440, "epoch": 482, "lr": 9.263298465180897e-06} +{"train_loss": 0.0003595686866901815, "global_step": 57441, "epoch": 482, "lr": 9.262013875467751e-06} +{"train_loss": 0.00027691811555996537, "global_step": 57442, "epoch": 482, "lr": 9.260729365739301e-06} +{"train_loss": 0.0004591663309838623, "global_step": 57443, "epoch": 482, "lr": 9.259444935998051e-06} +{"train_loss": 0.0005430539604276419, "global_step": 57444, "epoch": 482, "lr": 9.258160586246534e-06} +{"train_loss": 0.00043849137728102505, "global_step": 57445, "epoch": 482, "lr": 9.256876316487256e-06} +{"train_loss": 0.00045151603990234435, "global_step": 57446, "epoch": 482, "lr": 9.255592126722763e-06} +{"train_loss": 0.0005773333832621574, "global_step": 57447, "epoch": 482, "lr": 9.254308016955559e-06} +{"train_loss": 0.0003361638227943331, "global_step": 57448, "epoch": 482, "lr": 9.253023987188159e-06} +{"train_loss": 0.0006575653096660972, "global_step": 57449, "epoch": 482, "lr": 9.2517400374231e-06} +{"train_loss": 0.00032971863402053714, "global_step": 57450, "epoch": 482, "lr": 9.250456167662891e-06} +{"train_loss": 0.00038761747418902814, "global_step": 57451, "epoch": 482, "lr": 9.249172377910064e-06} +{"train_loss": 0.0002865776768885553, "global_step": 57452, "epoch": 482, "lr": 9.247888668167126e-06} +{"train_loss": 0.0003828675835393369, "global_step": 57453, "epoch": 482, "lr": 9.246605038436613e-06} +{"train_loss": 0.0004314850957598537, "global_step": 57454, "epoch": 482, "lr": 9.245321488721026e-06} +{"train_loss": 0.0005913938512094319, "global_step": 57455, "epoch": 482, "lr": 9.24403801902291e-06} +{"train_loss": 0.0005996363470330834, "global_step": 57456, "epoch": 482, "lr": 9.242754629344758e-06} +{"train_loss": 0.0006475191912613809, "global_step": 57457, "epoch": 482, "lr": 9.241471319689105e-06} +{"train_loss": 0.0008048362215049565, "global_step": 57458, "epoch": 482, "lr": 9.240188090058476e-06} +{"train_loss": 0.0008416532655246556, "global_step": 57459, "epoch": 482, "lr": 9.238904940455389e-06} +{"train_loss": 0.00042565009789541364, "global_step": 57460, "epoch": 482, "lr": 9.237621870882341e-06} +{"train_loss": 0.0009200595086440444, "global_step": 57461, "epoch": 482, "lr": 9.236338881341884e-06} +{"train_loss": 0.00041078764479607344, "global_step": 57462, "epoch": 482, "lr": 9.235055971836504e-06} +{"train_loss": 0.0002264558570459485, "global_step": 57463, "epoch": 482, "lr": 9.233773142368751e-06} +{"train_loss": 0.00033835263457149267, "global_step": 57464, "epoch": 482, "lr": 9.232490392941118e-06} +{"train_loss": 0.0005332370637916028, "global_step": 57465, "epoch": 482, "lr": 9.231207723556145e-06} +{"train_loss": 0.0005715269944630563, "global_step": 57466, "epoch": 482, "lr": 9.22992513421634e-06} +{"train_loss": 0.0007816166034899652, "global_step": 57467, "epoch": 482, "lr": 9.22864262492421e-06} +{"train_loss": 0.0003403999435249716, "global_step": 57468, "epoch": 482, "lr": 9.227360195682295e-06} +{"train_loss": 0.0003666933916974813, "global_step": 57469, "epoch": 482, "lr": 9.226077846493093e-06} +{"train_loss": 0.0003925051132682711, "global_step": 57470, "epoch": 482, "lr": 9.22479557735914e-06} +{"train_loss": 0.00031889602541923523, "global_step": 57471, "epoch": 482, "lr": 9.22351338828295e-06} +{"train_loss": 0.0004823764902539551, "global_step": 57472, "epoch": 482, "lr": 9.222231279267018e-06} +{"train_loss": 0.0008362123626284301, "global_step": 57473, "epoch": 482, "lr": 9.220949250313893e-06} +{"train_loss": 0.00044290447840467095, "global_step": 57474, "epoch": 482, "lr": 9.21966730142606e-06} +{"train_loss": 0.00041679159039631486, "global_step": 57475, "epoch": 482, "lr": 9.218385432606074e-06} +{"train_loss": 0.0004833754145456165, "global_step": 57476, "epoch": 482, "lr": 9.217103643856411e-06, "val_loss": 0.03781473636627197} +{"train_loss": 0.00034128656261600554, "global_step": 57477, "epoch": 483, "lr": 9.215821935179626e-06} +{"train_loss": 0.0006362991407513618, "global_step": 57478, "epoch": 483, "lr": 9.214540306578218e-06} +{"train_loss": 0.0005097308312542737, "global_step": 57479, "epoch": 483, "lr": 9.213258758054688e-06} +{"train_loss": 0.00029649605858139694, "global_step": 57480, "epoch": 483, "lr": 9.211977289611579e-06} +{"train_loss": 0.00038854972808621824, "global_step": 57481, "epoch": 483, "lr": 9.210695901251382e-06} +{"train_loss": 0.0003456020203884691, "global_step": 57482, "epoch": 483, "lr": 9.20941459297664e-06} +{"train_loss": 0.000339699414325878, "global_step": 57483, "epoch": 483, "lr": 9.208133364789844e-06} +{"train_loss": 0.00023765300284139812, "global_step": 57484, "epoch": 483, "lr": 9.206852216693529e-06} +{"train_loss": 0.0004926346591673791, "global_step": 57485, "epoch": 483, "lr": 9.205571148690189e-06} +{"train_loss": 0.00030110101215541363, "global_step": 57486, "epoch": 483, "lr": 9.20429016078237e-06} +{"train_loss": 0.00035511591704562306, "global_step": 57487, "epoch": 483, "lr": 9.20300925297255e-06} +{"train_loss": 0.0004277352709323168, "global_step": 57488, "epoch": 483, "lr": 9.201728425263278e-06} +{"train_loss": 0.0005547793116420507, "global_step": 57489, "epoch": 483, "lr": 9.200447677657042e-06} +{"train_loss": 0.00043490901589393616, "global_step": 57490, "epoch": 483, "lr": 9.199167010156379e-06} +{"train_loss": 0.00035677323467098176, "global_step": 57491, "epoch": 483, "lr": 9.19788642276378e-06} +{"train_loss": 0.0005133582162670791, "global_step": 57492, "epoch": 483, "lr": 9.196605915481788e-06} +{"train_loss": 0.0005817361525259912, "global_step": 57493, "epoch": 483, "lr": 9.195325488312883e-06} +{"train_loss": 0.00033860004623420537, "global_step": 57494, "epoch": 483, "lr": 9.19404514125961e-06} +{"train_loss": 0.00039215025026351213, "global_step": 57495, "epoch": 483, "lr": 9.192764874324462e-06} +{"train_loss": 0.00020582732395268977, "global_step": 57496, "epoch": 483, "lr": 9.191484687509971e-06} +{"train_loss": 0.000268837611656636, "global_step": 57497, "epoch": 483, "lr": 9.19020458081864e-06} +{"train_loss": 0.0005321358912624419, "global_step": 57498, "epoch": 483, "lr": 9.18892455425297e-06} +{"train_loss": 0.00042823576950468123, "global_step": 57499, "epoch": 483, "lr": 9.187644607815498e-06} +{"train_loss": 0.0004949712892994285, "global_step": 57500, "epoch": 483, "lr": 9.186364741508712e-06} +{"train_loss": 0.0004844997893087566, "global_step": 57501, "epoch": 483, "lr": 9.185084955335155e-06} +{"train_loss": 0.0002883604320231825, "global_step": 57502, "epoch": 483, "lr": 9.183805249297311e-06} +{"train_loss": 0.0007547971908934414, "global_step": 57503, "epoch": 483, "lr": 9.182525623397713e-06} +{"train_loss": 0.0003047253703698516, "global_step": 57504, "epoch": 483, "lr": 9.181246077638866e-06} +{"train_loss": 0.0004001849447377026, "global_step": 57505, "epoch": 483, "lr": 9.179966612023272e-06} +{"train_loss": 0.00037063800846226513, "global_step": 57506, "epoch": 483, "lr": 9.178687226553461e-06} +{"train_loss": 0.0004926068941131234, "global_step": 57507, "epoch": 483, "lr": 9.17740792123193e-06} +{"train_loss": 0.0007027633837424219, "global_step": 57508, "epoch": 483, "lr": 9.176128696061203e-06} +{"train_loss": 0.0003018455463461578, "global_step": 57509, "epoch": 483, "lr": 9.17484955104379e-06} +{"train_loss": 0.0011270151007920504, "global_step": 57510, "epoch": 483, "lr": 9.173570486182186e-06} +{"train_loss": 0.0004017990722786635, "global_step": 57511, "epoch": 483, "lr": 9.172291501478925e-06} +{"train_loss": 0.00036236984306015074, "global_step": 57512, "epoch": 483, "lr": 9.171012596936495e-06} +{"train_loss": 0.00023801841598469764, "global_step": 57513, "epoch": 483, "lr": 9.169733772557438e-06} +{"train_loss": 0.00041220258572138846, "global_step": 57514, "epoch": 483, "lr": 9.16845502834423e-06} +{"train_loss": 0.0004548098659142852, "global_step": 57515, "epoch": 483, "lr": 9.167176364299406e-06} +{"train_loss": 0.0005110815982334316, "global_step": 57516, "epoch": 483, "lr": 9.165897780425475e-06} +{"train_loss": 0.0003547859669197351, "global_step": 57517, "epoch": 483, "lr": 9.164619276724928e-06} +{"train_loss": 0.0010201670229434967, "global_step": 57518, "epoch": 483, "lr": 9.163340853200291e-06} +{"train_loss": 0.001067489036358893, "global_step": 57519, "epoch": 483, "lr": 9.16206250985408e-06} +{"train_loss": 0.00020552474597934633, "global_step": 57520, "epoch": 483, "lr": 9.160784246688786e-06} +{"train_loss": 0.00041081514791585505, "global_step": 57521, "epoch": 483, "lr": 9.159506063706941e-06} +{"train_loss": 0.0004944735555909574, "global_step": 57522, "epoch": 483, "lr": 9.158227960911025e-06} +{"train_loss": 0.0003472281387075782, "global_step": 57523, "epoch": 483, "lr": 9.156949938303583e-06} +{"train_loss": 0.0004257787368260324, "global_step": 57524, "epoch": 483, "lr": 9.155671995887094e-06} +{"train_loss": 0.00045535634853877127, "global_step": 57525, "epoch": 483, "lr": 9.15439413366409e-06} +{"train_loss": 0.0005748054245486856, "global_step": 57526, "epoch": 483, "lr": 9.153116351637059e-06} +{"train_loss": 0.00023532647173851728, "global_step": 57527, "epoch": 483, "lr": 9.15183864980853e-06} +{"train_loss": 0.0010229671606794, "global_step": 57528, "epoch": 483, "lr": 9.150561028181003e-06} +{"train_loss": 0.0006075061392039061, "global_step": 57529, "epoch": 483, "lr": 9.149283486756976e-06} +{"train_loss": 0.0002759929047897458, "global_step": 57530, "epoch": 483, "lr": 9.148006025538974e-06} +{"train_loss": 0.0006417802651412785, "global_step": 57531, "epoch": 483, "lr": 9.146728644529489e-06} +{"train_loss": 0.00076081114821136, "global_step": 57532, "epoch": 483, "lr": 9.145451343731049e-06} +{"train_loss": 0.0006637432961724699, "global_step": 57533, "epoch": 483, "lr": 9.144174123146138e-06} +{"train_loss": 0.0004430703411344439, "global_step": 57534, "epoch": 483, "lr": 9.142896982777288e-06} +{"train_loss": 0.0006077256402932107, "global_step": 57535, "epoch": 483, "lr": 9.141619922626998e-06} +{"train_loss": 0.00034367720945738256, "global_step": 57536, "epoch": 483, "lr": 9.140342942697756e-06} +{"train_loss": 0.00028295937227085233, "global_step": 57537, "epoch": 483, "lr": 9.1390660429921e-06} +{"train_loss": 0.0002669437089934945, "global_step": 57538, "epoch": 483, "lr": 9.137789223512505e-06} +{"train_loss": 0.00039610793464817107, "global_step": 57539, "epoch": 483, "lr": 9.136512484261517e-06} +{"train_loss": 0.0003057442663703114, "global_step": 57540, "epoch": 483, "lr": 9.135235825241611e-06} +{"train_loss": 0.00037350665661506355, "global_step": 57541, "epoch": 483, "lr": 9.133959246455299e-06} +{"train_loss": 0.00023082082043401897, "global_step": 57542, "epoch": 483, "lr": 9.132682747905102e-06} +{"train_loss": 0.0005945379962213337, "global_step": 57543, "epoch": 483, "lr": 9.131406329593507e-06} +{"train_loss": 0.0004803900374099612, "global_step": 57544, "epoch": 483, "lr": 9.130129991523034e-06} +{"train_loss": 0.0005457635270431638, "global_step": 57545, "epoch": 483, "lr": 9.12885373369618e-06} +{"train_loss": 0.00030828698072582483, "global_step": 57546, "epoch": 483, "lr": 9.127577556115462e-06} +{"train_loss": 0.0003721626417245716, "global_step": 57547, "epoch": 483, "lr": 9.126301458783382e-06} +{"train_loss": 0.00025453249691054225, "global_step": 57548, "epoch": 483, "lr": 9.125025441702428e-06} +{"train_loss": 0.0006006380426697433, "global_step": 57549, "epoch": 483, "lr": 9.123749504875135e-06} +{"train_loss": 0.00020116227096877992, "global_step": 57550, "epoch": 483, "lr": 9.12247364830398e-06} +{"train_loss": 0.00040141723002307117, "global_step": 57551, "epoch": 483, "lr": 9.121197871991493e-06} +{"train_loss": 0.0004651578492484987, "global_step": 57552, "epoch": 483, "lr": 9.119922175940155e-06} +{"train_loss": 0.0003999803739134222, "global_step": 57553, "epoch": 483, "lr": 9.118646560152477e-06} +{"train_loss": 0.0006427834159694612, "global_step": 57554, "epoch": 483, "lr": 9.117371024630989e-06} +{"train_loss": 0.0004338064172770828, "global_step": 57555, "epoch": 483, "lr": 9.116095569378158e-06} +{"train_loss": 0.0003628430131357163, "global_step": 57556, "epoch": 483, "lr": 9.114820194396517e-06} +{"train_loss": 0.0005114279920235276, "global_step": 57557, "epoch": 483, "lr": 9.113544899688548e-06} +{"train_loss": 0.0004509383288677782, "global_step": 57558, "epoch": 483, "lr": 9.11226968525678e-06} +{"train_loss": 0.00045316832256503403, "global_step": 57559, "epoch": 483, "lr": 9.110994551103701e-06} +{"train_loss": 0.0006218038615770638, "global_step": 57560, "epoch": 483, "lr": 9.109719497231805e-06} +{"train_loss": 0.0007329407380893826, "global_step": 57561, "epoch": 483, "lr": 9.108444523643616e-06} +{"train_loss": 0.00023023087123874575, "global_step": 57562, "epoch": 483, "lr": 9.107169630341616e-06} +{"train_loss": 0.0004280016291886568, "global_step": 57563, "epoch": 483, "lr": 9.10589481732833e-06} +{"train_loss": 0.00046783953439444304, "global_step": 57564, "epoch": 483, "lr": 9.10462008460624e-06} +{"train_loss": 0.00034805835457518697, "global_step": 57565, "epoch": 483, "lr": 9.103345432177873e-06} +{"train_loss": 0.0005786541732959449, "global_step": 57566, "epoch": 483, "lr": 9.10207086004572e-06} +{"train_loss": 0.00023266032803803682, "global_step": 57567, "epoch": 483, "lr": 9.100796368212261e-06} +{"train_loss": 0.0008796281181275845, "global_step": 57568, "epoch": 483, "lr": 9.09952195668004e-06} +{"train_loss": 0.00036472149076871574, "global_step": 57569, "epoch": 483, "lr": 9.098247625451523e-06} +{"train_loss": 0.0005828881985507905, "global_step": 57570, "epoch": 483, "lr": 9.096973374529239e-06} +{"train_loss": 0.0002781373041216284, "global_step": 57571, "epoch": 483, "lr": 9.095699203915664e-06} +{"train_loss": 0.0004709650238510221, "global_step": 57572, "epoch": 483, "lr": 9.094425113613324e-06} +{"train_loss": 0.0007186633301898837, "global_step": 57573, "epoch": 483, "lr": 9.093151103624714e-06} +{"train_loss": 0.00039585927152074873, "global_step": 57574, "epoch": 483, "lr": 9.091877173952323e-06} +{"train_loss": 0.0010244515724480152, "global_step": 57575, "epoch": 483, "lr": 9.090603324598667e-06} +{"train_loss": 0.0004460984782781452, "global_step": 57576, "epoch": 483, "lr": 9.089329555566229e-06} +{"train_loss": 0.0004380034515634179, "global_step": 57577, "epoch": 483, "lr": 9.088055866857537e-06} +{"train_loss": 0.0002400618977844715, "global_step": 57578, "epoch": 483, "lr": 9.086782258475073e-06} +{"train_loss": 0.0004106908745598048, "global_step": 57579, "epoch": 483, "lr": 9.085508730421333e-06} +{"train_loss": 0.0008096082019619644, "global_step": 57580, "epoch": 483, "lr": 9.084235282698833e-06} +{"train_loss": 0.00037675266503356397, "global_step": 57581, "epoch": 483, "lr": 9.082961915310057e-06} +{"train_loss": 0.0008910565520636737, "global_step": 57582, "epoch": 483, "lr": 9.081688628257529e-06} +{"train_loss": 0.0002272500714752823, "global_step": 57583, "epoch": 483, "lr": 9.080415421543715e-06} +{"train_loss": 0.0003372797218617052, "global_step": 57584, "epoch": 483, "lr": 9.07914229517115e-06} +{"train_loss": 0.000794108142144978, "global_step": 57585, "epoch": 483, "lr": 9.0778692491423e-06} +{"train_loss": 0.0006412189686670899, "global_step": 57586, "epoch": 483, "lr": 9.076596283459704e-06} +{"train_loss": 0.0005955485394224524, "global_step": 57587, "epoch": 483, "lr": 9.075323398125818e-06} +{"train_loss": 0.0002672169357538223, "global_step": 57588, "epoch": 483, "lr": 9.074050593143163e-06} +{"train_loss": 0.0008252226398326457, "global_step": 57589, "epoch": 483, "lr": 9.072777868514254e-06} +{"train_loss": 0.0004713989910669625, "global_step": 57590, "epoch": 483, "lr": 9.071505224241573e-06} +{"train_loss": 0.00040349329356104136, "global_step": 57591, "epoch": 483, "lr": 9.070232660327605e-06} +{"train_loss": 0.0006075724959373474, "global_step": 57592, "epoch": 483, "lr": 9.068960176774871e-06} +{"train_loss": 0.0005958109977655113, "global_step": 57593, "epoch": 483, "lr": 9.067687773585854e-06} +{"train_loss": 0.00044572207843884826, "global_step": 57594, "epoch": 483, "lr": 9.066415450763072e-06} +{"train_loss": 0.0004739610698639548, "global_step": 57595, "epoch": 483, "lr": 9.06514320830899e-06, "val_loss": 0.018519559875130653} +{"train_loss": 0.0004450996348168701, "global_step": 57596, "epoch": 484, "lr": 9.063871046226146e-06} +{"train_loss": 0.0007016200688667595, "global_step": 57597, "epoch": 484, "lr": 9.062598964517017e-06} +{"train_loss": 0.0004086758417543024, "global_step": 57598, "epoch": 484, "lr": 9.061326963184085e-06} +{"train_loss": 0.0005783174419775605, "global_step": 57599, "epoch": 484, "lr": 9.060055042229881e-06} +{"train_loss": 0.00039745037793181837, "global_step": 57600, "epoch": 484, "lr": 9.058783201656873e-06} +{"train_loss": 0.00029540908872149885, "global_step": 57601, "epoch": 484, "lr": 9.057511441467581e-06} +{"train_loss": 0.0007953896420076489, "global_step": 57602, "epoch": 484, "lr": 9.056239761664476e-06} +{"train_loss": 0.0005348990089260042, "global_step": 57603, "epoch": 484, "lr": 9.054968162250082e-06} +{"train_loss": 0.0003574876463972032, "global_step": 57604, "epoch": 484, "lr": 9.05369664322689e-06} +{"train_loss": 0.0004666498280130327, "global_step": 57605, "epoch": 484, "lr": 9.05242520459737e-06} +{"train_loss": 0.0004004721122328192, "global_step": 57606, "epoch": 484, "lr": 9.051153846364058e-06} +{"train_loss": 0.0005148111376911402, "global_step": 57607, "epoch": 484, "lr": 9.049882568529416e-06} +{"train_loss": 0.0008755067246966064, "global_step": 57608, "epoch": 484, "lr": 9.048611371095966e-06} +{"train_loss": 0.00046154731535352767, "global_step": 57609, "epoch": 484, "lr": 9.047340254066194e-06} +{"train_loss": 0.000497846573125571, "global_step": 57610, "epoch": 484, "lr": 9.046069217442577e-06} +{"train_loss": 0.00040325423469766974, "global_step": 57611, "epoch": 484, "lr": 9.044798261227644e-06} +{"train_loss": 0.00041130505269393325, "global_step": 57612, "epoch": 484, "lr": 9.043527385423862e-06} +{"train_loss": 0.000662001664750278, "global_step": 57613, "epoch": 484, "lr": 9.042256590033754e-06} +{"train_loss": 0.00026626038015820086, "global_step": 57614, "epoch": 484, "lr": 9.040985875059783e-06} +{"train_loss": 0.0009040838340297341, "global_step": 57615, "epoch": 484, "lr": 9.03971524050447e-06} +{"train_loss": 0.00038921364466659725, "global_step": 57616, "epoch": 484, "lr": 9.038444686370296e-06} +{"train_loss": 0.0006464699981734157, "global_step": 57617, "epoch": 484, "lr": 9.037174212659766e-06} +{"train_loss": 0.00028892786940559745, "global_step": 57618, "epoch": 484, "lr": 9.035903819375357e-06} +{"train_loss": 0.00039903627475723624, "global_step": 57619, "epoch": 484, "lr": 9.034633506519585e-06} +{"train_loss": 0.0008462921250611544, "global_step": 57620, "epoch": 484, "lr": 9.033363274094925e-06} +{"train_loss": 0.0006639274070039392, "global_step": 57621, "epoch": 484, "lr": 9.03209312210389e-06} +{"train_loss": 0.0003685964038595557, "global_step": 57622, "epoch": 484, "lr": 9.030823050548947e-06} +{"train_loss": 0.0010176347568631172, "global_step": 57623, "epoch": 484, "lr": 9.029553059432628e-06} +{"train_loss": 0.0008152375230565667, "global_step": 57624, "epoch": 484, "lr": 9.028283148757383e-06} +{"train_loss": 0.0005453500198200345, "global_step": 57625, "epoch": 484, "lr": 9.027013318525746e-06} +{"train_loss": 0.0005906902952119708, "global_step": 57626, "epoch": 484, "lr": 9.025743568740174e-06} +{"train_loss": 0.0005312210414558649, "global_step": 57627, "epoch": 484, "lr": 9.024473899403191e-06} +{"train_loss": 0.0003405249153729528, "global_step": 57628, "epoch": 484, "lr": 9.023204310517275e-06} +{"train_loss": 0.0005586858023889363, "global_step": 57629, "epoch": 484, "lr": 9.021934802084909e-06} +{"train_loss": 0.0004737712733913213, "global_step": 57630, "epoch": 484, "lr": 9.02066537410861e-06} +{"train_loss": 0.0005233082920312881, "global_step": 57631, "epoch": 484, "lr": 9.019396026590842e-06} +{"train_loss": 0.0008398783393204212, "global_step": 57632, "epoch": 484, "lr": 9.018126759534124e-06} +{"train_loss": 0.0005434876657091081, "global_step": 57633, "epoch": 484, "lr": 9.016857572940923e-06} +{"train_loss": 0.00043481471948325634, "global_step": 57634, "epoch": 484, "lr": 9.015588466813756e-06} +{"train_loss": 0.0004622634151019156, "global_step": 57635, "epoch": 484, "lr": 9.014319441155106e-06} +{"train_loss": 0.0004786798672284931, "global_step": 57636, "epoch": 484, "lr": 9.013050495967445e-06} +{"train_loss": 0.0004459730116650462, "global_step": 57637, "epoch": 484, "lr": 9.011781631253291e-06} +{"train_loss": 0.0005490678595378995, "global_step": 57638, "epoch": 484, "lr": 9.010512847015118e-06} +{"train_loss": 0.00034842308377847075, "global_step": 57639, "epoch": 484, "lr": 9.00924414325543e-06} +{"train_loss": 0.0007356210262514651, "global_step": 57640, "epoch": 484, "lr": 9.007975519976702e-06} +{"train_loss": 0.0006322546978481114, "global_step": 57641, "epoch": 484, "lr": 9.006706977181451e-06} +{"train_loss": 0.0004982802201993763, "global_step": 57642, "epoch": 484, "lr": 9.005438514872149e-06} +{"train_loss": 0.000431197346188128, "global_step": 57643, "epoch": 484, "lr": 9.004170133051277e-06} +{"train_loss": 0.0003520062891766429, "global_step": 57644, "epoch": 484, "lr": 9.00290183172135e-06} +{"train_loss": 0.00048428206355310977, "global_step": 57645, "epoch": 484, "lr": 9.00163361088483e-06} +{"train_loss": 0.0002725061494857073, "global_step": 57646, "epoch": 484, "lr": 9.000365470544236e-06} +{"train_loss": 0.00043411582009866834, "global_step": 57647, "epoch": 484, "lr": 8.999097410702046e-06} +{"train_loss": 0.0004779956361744553, "global_step": 57648, "epoch": 484, "lr": 8.997829431360732e-06} +{"train_loss": 0.00025814276887103915, "global_step": 57649, "epoch": 484, "lr": 8.996561532522812e-06} +{"train_loss": 0.0004644495784305036, "global_step": 57650, "epoch": 484, "lr": 8.995293714190755e-06} +{"train_loss": 0.0004347127687651664, "global_step": 57651, "epoch": 484, "lr": 8.994025976367054e-06} +{"train_loss": 0.000508780125528574, "global_step": 57652, "epoch": 484, "lr": 8.992758319054218e-06} +{"train_loss": 0.000877290207426995, "global_step": 57653, "epoch": 484, "lr": 8.991490742254705e-06} +{"train_loss": 0.000713520566932857, "global_step": 57654, "epoch": 484, "lr": 8.99022324597103e-06} +{"train_loss": 0.00043194126919843256, "global_step": 57655, "epoch": 484, "lr": 8.988955830205664e-06} +{"train_loss": 0.00031449180096387863, "global_step": 57656, "epoch": 484, "lr": 8.98768849496111e-06} +{"train_loss": 0.0003805742890108377, "global_step": 57657, "epoch": 484, "lr": 8.986421240239833e-06} +{"train_loss": 0.0003428064228501171, "global_step": 57658, "epoch": 484, "lr": 8.985154066044354e-06} +{"train_loss": 0.0005151215009391308, "global_step": 57659, "epoch": 484, "lr": 8.983886972377137e-06} +{"train_loss": 0.0006499402225017548, "global_step": 57660, "epoch": 484, "lr": 8.982619959240669e-06} +{"train_loss": 0.00032079979428090155, "global_step": 57661, "epoch": 484, "lr": 8.981353026637456e-06} +{"train_loss": 0.0014305947115644813, "global_step": 57662, "epoch": 484, "lr": 8.980086174569962e-06} +{"train_loss": 0.0004120453668292612, "global_step": 57663, "epoch": 484, "lr": 8.978819403040695e-06} +{"train_loss": 0.00042289565317332745, "global_step": 57664, "epoch": 484, "lr": 8.977552712052129e-06} +{"train_loss": 0.0004886477254331112, "global_step": 57665, "epoch": 484, "lr": 8.976286101606763e-06} +{"train_loss": 0.0002787269768305123, "global_step": 57666, "epoch": 484, "lr": 8.975019571707078e-06} +{"train_loss": 0.00034416973358020186, "global_step": 57667, "epoch": 484, "lr": 8.973753122355544e-06} +{"train_loss": 0.000407739426009357, "global_step": 57668, "epoch": 484, "lr": 8.972486753554677e-06} +{"train_loss": 0.0002872960758395493, "global_step": 57669, "epoch": 484, "lr": 8.971220465306934e-06} +{"train_loss": 0.000670749053824693, "global_step": 57670, "epoch": 484, "lr": 8.969954257614832e-06} +{"train_loss": 0.0003799235273618251, "global_step": 57671, "epoch": 484, "lr": 8.96868813048083e-06} +{"train_loss": 0.000297351652989164, "global_step": 57672, "epoch": 484, "lr": 8.967422083907435e-06} +{"train_loss": 0.00033625177456997335, "global_step": 57673, "epoch": 484, "lr": 8.966156117897124e-06} +{"train_loss": 0.0002785239485092461, "global_step": 57674, "epoch": 484, "lr": 8.964890232452367e-06} +{"train_loss": 0.00039522902807220817, "global_step": 57675, "epoch": 484, "lr": 8.963624427575678e-06} +{"train_loss": 0.0006737186340615153, "global_step": 57676, "epoch": 484, "lr": 8.962358703269519e-06} +{"train_loss": 0.0004555996274575591, "global_step": 57677, "epoch": 484, "lr": 8.961093059536396e-06} +{"train_loss": 0.00044922702363692224, "global_step": 57678, "epoch": 484, "lr": 8.95982749637878e-06} +{"train_loss": 0.0002749414124991745, "global_step": 57679, "epoch": 484, "lr": 8.958562013799143e-06} +{"train_loss": 0.0005596688133664429, "global_step": 57680, "epoch": 484, "lr": 8.957296611800004e-06} +{"train_loss": 0.0010591786121949553, "global_step": 57681, "epoch": 484, "lr": 8.95603129038381e-06} +{"train_loss": 0.000556700921151787, "global_step": 57682, "epoch": 484, "lr": 8.954766049553082e-06} +{"train_loss": 0.0005697509623132646, "global_step": 57683, "epoch": 484, "lr": 8.953500889310267e-06} +{"train_loss": 0.0006024066242389381, "global_step": 57684, "epoch": 484, "lr": 8.952235809657889e-06} +{"train_loss": 0.00047341681784018874, "global_step": 57685, "epoch": 484, "lr": 8.950970810598392e-06} +{"train_loss": 0.0009371653432026505, "global_step": 57686, "epoch": 484, "lr": 8.949705892134274e-06} +{"train_loss": 0.0004845595976803452, "global_step": 57687, "epoch": 484, "lr": 8.948441054268042e-06} +{"train_loss": 0.00023661159502808005, "global_step": 57688, "epoch": 484, "lr": 8.947176297002146e-06} +{"train_loss": 0.000415780144976452, "global_step": 57689, "epoch": 484, "lr": 8.945911620339097e-06} +{"train_loss": 0.00043005062616430223, "global_step": 57690, "epoch": 484, "lr": 8.944647024281356e-06} +{"train_loss": 0.0007540460792370141, "global_step": 57691, "epoch": 484, "lr": 8.943382508831422e-06} +{"train_loss": 0.0007748595671728253, "global_step": 57692, "epoch": 484, "lr": 8.942118073991768e-06} +{"train_loss": 0.00041762381442822516, "global_step": 57693, "epoch": 484, "lr": 8.940853719764869e-06} +{"train_loss": 0.00022183467808645219, "global_step": 57694, "epoch": 484, "lr": 8.939589446153229e-06} +{"train_loss": 0.0003386464377399534, "global_step": 57695, "epoch": 484, "lr": 8.938325253159307e-06} +{"train_loss": 0.00048322451766580343, "global_step": 57696, "epoch": 484, "lr": 8.937061140785608e-06} +{"train_loss": 0.0006716798525303602, "global_step": 57697, "epoch": 484, "lr": 8.935797109034604e-06} +{"train_loss": 0.00029635123792104423, "global_step": 57698, "epoch": 484, "lr": 8.934533157908758e-06} +{"train_loss": 0.0009466413175687194, "global_step": 57699, "epoch": 484, "lr": 8.93326928741059e-06} +{"train_loss": 0.0003410336503293365, "global_step": 57700, "epoch": 484, "lr": 8.932005497542544e-06} +{"train_loss": 0.0004745829210150987, "global_step": 57701, "epoch": 484, "lr": 8.93074178830713e-06} +{"train_loss": 0.000901295687071979, "global_step": 57702, "epoch": 484, "lr": 8.9294781597068e-06} +{"train_loss": 0.00041747366776689887, "global_step": 57703, "epoch": 484, "lr": 8.928214611744068e-06} +{"train_loss": 0.0005532904760912061, "global_step": 57704, "epoch": 484, "lr": 8.926951144421403e-06} +{"train_loss": 0.0005597383715212345, "global_step": 57705, "epoch": 484, "lr": 8.925687757741264e-06} +{"train_loss": 0.00028691531042568386, "global_step": 57706, "epoch": 484, "lr": 8.92442445170616e-06} +{"train_loss": 0.00047844910295680165, "global_step": 57707, "epoch": 484, "lr": 8.92316122631855e-06} +{"train_loss": 0.00033847932354547083, "global_step": 57708, "epoch": 484, "lr": 8.921898081580938e-06} +{"train_loss": 0.00036835193168371916, "global_step": 57709, "epoch": 484, "lr": 8.920635017495794e-06} +{"train_loss": 0.0011259722523391247, "global_step": 57710, "epoch": 484, "lr": 8.919372034065576e-06} +{"train_loss": 0.00037449348019436, "global_step": 57711, "epoch": 484, "lr": 8.918109131292795e-06} +{"train_loss": 0.0005259708850644529, "global_step": 57712, "epoch": 484, "lr": 8.916846309179906e-06} +{"train_loss": 0.0003560926124919206, "global_step": 57713, "epoch": 484, "lr": 8.915583567729413e-06} +{"train_loss": 0.0005122134002207333, "global_step": 57714, "epoch": 484, "lr": 8.914320906943774e-06, "val_loss": 0.025125376880168915} +{"train_loss": 0.0003749565512407571, "global_step": 57715, "epoch": 485, "lr": 8.913058326825485e-06} +{"train_loss": 0.0005088431644253433, "global_step": 57716, "epoch": 485, "lr": 8.911795827377e-06} +{"train_loss": 0.0006376272067427635, "global_step": 57717, "epoch": 485, "lr": 8.910533408600836e-06} +{"train_loss": 0.0003225409600418061, "global_step": 57718, "epoch": 485, "lr": 8.909271070499432e-06} +{"train_loss": 0.0006080102175474167, "global_step": 57719, "epoch": 485, "lr": 8.908008813075297e-06} +{"train_loss": 0.0004474442976061255, "global_step": 57720, "epoch": 485, "lr": 8.906746636330882e-06} +{"train_loss": 0.0003425177128519863, "global_step": 57721, "epoch": 485, "lr": 8.905484540268682e-06} +{"train_loss": 0.0005016475333832204, "global_step": 57722, "epoch": 485, "lr": 8.904222524891186e-06} +{"train_loss": 0.0004949567373842001, "global_step": 57723, "epoch": 485, "lr": 8.90296059020086e-06} +{"train_loss": 0.00045590338413603604, "global_step": 57724, "epoch": 485, "lr": 8.901698736200164e-06} +{"train_loss": 0.0003138516622129828, "global_step": 57725, "epoch": 485, "lr": 8.900436962891607e-06} +{"train_loss": 0.0006924247718416154, "global_step": 57726, "epoch": 485, "lr": 8.899175270277638e-06} +{"train_loss": 0.0007886204402893782, "global_step": 57727, "epoch": 485, "lr": 8.897913658360762e-06} +{"train_loss": 0.0006167295505292714, "global_step": 57728, "epoch": 485, "lr": 8.89665212714344e-06} +{"train_loss": 0.0004244336159899831, "global_step": 57729, "epoch": 485, "lr": 8.895390676628135e-06} +{"train_loss": 0.0004270171339157969, "global_step": 57730, "epoch": 485, "lr": 8.894129306817356e-06} +{"train_loss": 0.00043251243187114596, "global_step": 57731, "epoch": 485, "lr": 8.892868017713546e-06} +{"train_loss": 0.0004217851674184203, "global_step": 57732, "epoch": 485, "lr": 8.891606809319215e-06} +{"train_loss": 0.0006412353250198066, "global_step": 57733, "epoch": 485, "lr": 8.890345681636803e-06} +{"train_loss": 0.00026128615718334913, "global_step": 57734, "epoch": 485, "lr": 8.88908463466882e-06} +{"train_loss": 0.0003500291786622256, "global_step": 57735, "epoch": 485, "lr": 8.887823668417734e-06} +{"train_loss": 0.0006909255753271282, "global_step": 57736, "epoch": 485, "lr": 8.886562782885994e-06} +{"train_loss": 0.0005159003776498139, "global_step": 57737, "epoch": 485, "lr": 8.88530197807611e-06} +{"train_loss": 0.0004052065487485379, "global_step": 57738, "epoch": 485, "lr": 8.884041253990533e-06} +{"train_loss": 0.0003760145336855203, "global_step": 57739, "epoch": 485, "lr": 8.882780610631758e-06} +{"train_loss": 0.0003844971943181008, "global_step": 57740, "epoch": 485, "lr": 8.881520048002239e-06} +{"train_loss": 0.00041818461613729596, "global_step": 57741, "epoch": 485, "lr": 8.880259566104477e-06} +{"train_loss": 0.0004812888219021261, "global_step": 57742, "epoch": 485, "lr": 8.878999164940932e-06} +{"train_loss": 0.000406987383030355, "global_step": 57743, "epoch": 485, "lr": 8.877738844514066e-06} +{"train_loss": 0.0004637653473764658, "global_step": 57744, "epoch": 485, "lr": 8.876478604826377e-06} +{"train_loss": 0.00037063437048345804, "global_step": 57745, "epoch": 485, "lr": 8.875218445880317e-06} +{"train_loss": 0.0005424162372946739, "global_step": 57746, "epoch": 485, "lr": 8.873958367678387e-06} +{"train_loss": 0.000460150302387774, "global_step": 57747, "epoch": 485, "lr": 8.872698370223043e-06} +{"train_loss": 0.0005316004971973598, "global_step": 57748, "epoch": 485, "lr": 8.871438453516751e-06} +{"train_loss": 0.0011900616809725761, "global_step": 57749, "epoch": 485, "lr": 8.870178617561998e-06} +{"train_loss": 0.00048326863907277584, "global_step": 57750, "epoch": 485, "lr": 8.868918862361264e-06} +{"train_loss": 0.0006161638884805143, "global_step": 57751, "epoch": 485, "lr": 8.867659187917e-06} +{"train_loss": 0.00041924690594896674, "global_step": 57752, "epoch": 485, "lr": 8.866399594231706e-06} +{"train_loss": 0.00021546987409237772, "global_step": 57753, "epoch": 485, "lr": 8.865140081307833e-06} +{"train_loss": 0.000548051786608994, "global_step": 57754, "epoch": 485, "lr": 8.86388064914787e-06} +{"train_loss": 0.0005574572714976966, "global_step": 57755, "epoch": 485, "lr": 8.862621297754276e-06} +{"train_loss": 0.0004422795318532735, "global_step": 57756, "epoch": 485, "lr": 8.861362027129538e-06} +{"train_loss": 0.0008117436082102358, "global_step": 57757, "epoch": 485, "lr": 8.860102837276113e-06} +{"train_loss": 0.00032772330450825393, "global_step": 57758, "epoch": 485, "lr": 8.858843728196491e-06} +{"train_loss": 0.0006850793724879622, "global_step": 57759, "epoch": 485, "lr": 8.857584699893124e-06} +{"train_loss": 0.0007400562753900886, "global_step": 57760, "epoch": 485, "lr": 8.8563257523685e-06} +{"train_loss": 0.000557424034923315, "global_step": 57761, "epoch": 485, "lr": 8.855066885625091e-06} +{"train_loss": 0.0003467178321443498, "global_step": 57762, "epoch": 485, "lr": 8.853808099665346e-06} +{"train_loss": 0.00020195437537040561, "global_step": 57763, "epoch": 485, "lr": 8.852549394491766e-06} +{"train_loss": 0.0003665295953396708, "global_step": 57764, "epoch": 485, "lr": 8.851290770106801e-06} +{"train_loss": 0.00028368658968247473, "global_step": 57765, "epoch": 485, "lr": 8.850032226512938e-06} +{"train_loss": 0.0002585492911748588, "global_step": 57766, "epoch": 485, "lr": 8.848773763712642e-06} +{"train_loss": 0.0003618876216933131, "global_step": 57767, "epoch": 485, "lr": 8.847515381708371e-06} +{"train_loss": 0.00042172748362645507, "global_step": 57768, "epoch": 485, "lr": 8.846257080502617e-06} +{"train_loss": 0.00032467147684656084, "global_step": 57769, "epoch": 485, "lr": 8.844998860097831e-06} +{"train_loss": 0.0005883562844246626, "global_step": 57770, "epoch": 485, "lr": 8.843740720496502e-06} +{"train_loss": 0.0004709968634415418, "global_step": 57771, "epoch": 485, "lr": 8.842482661701084e-06} +{"train_loss": 0.00039654402644373477, "global_step": 57772, "epoch": 485, "lr": 8.841224683714061e-06} +{"train_loss": 0.0006009309436194599, "global_step": 57773, "epoch": 485, "lr": 8.8399667865379e-06} +{"train_loss": 0.0010271831415593624, "global_step": 57774, "epoch": 485, "lr": 8.838708970175052e-06} +{"train_loss": 0.0002989756176248193, "global_step": 57775, "epoch": 485, "lr": 8.837451234628019e-06} +{"train_loss": 0.0007016507443040609, "global_step": 57776, "epoch": 485, "lr": 8.836193579899238e-06} +{"train_loss": 0.001329867634922266, "global_step": 57777, "epoch": 485, "lr": 8.8349360059912e-06} +{"train_loss": 0.00033925820025615394, "global_step": 57778, "epoch": 485, "lr": 8.833678512906374e-06} +{"train_loss": 0.0009492845274507999, "global_step": 57779, "epoch": 485, "lr": 8.832421100647209e-06} +{"train_loss": 0.0003062281757593155, "global_step": 57780, "epoch": 485, "lr": 8.831163769216195e-06} +{"train_loss": 0.000334220560034737, "global_step": 57781, "epoch": 485, "lr": 8.829906518615783e-06} +{"train_loss": 0.00040425066254101694, "global_step": 57782, "epoch": 485, "lr": 8.828649348848467e-06} +{"train_loss": 0.00035722082247957587, "global_step": 57783, "epoch": 485, "lr": 8.827392259916684e-06} +{"train_loss": 0.0003334405191708356, "global_step": 57784, "epoch": 485, "lr": 8.826135251822915e-06} +{"train_loss": 0.000983458012342453, "global_step": 57785, "epoch": 485, "lr": 8.824878324569646e-06} +{"train_loss": 0.00047102279495447874, "global_step": 57786, "epoch": 485, "lr": 8.823621478159317e-06} +{"train_loss": 0.0003426101466175169, "global_step": 57787, "epoch": 485, "lr": 8.822364712594423e-06} +{"train_loss": 0.0009585791267454624, "global_step": 57788, "epoch": 485, "lr": 8.8211080278774e-06} +{"train_loss": 0.00029372976860031486, "global_step": 57789, "epoch": 485, "lr": 8.819851424010744e-06} +{"train_loss": 0.0004132512549404055, "global_step": 57790, "epoch": 485, "lr": 8.818594900996902e-06} +{"train_loss": 0.0007319713477045298, "global_step": 57791, "epoch": 485, "lr": 8.817338458838359e-06} +{"train_loss": 0.000708524021320045, "global_step": 57792, "epoch": 485, "lr": 8.816082097537576e-06} +{"train_loss": 0.0004885338712483644, "global_step": 57793, "epoch": 485, "lr": 8.814825817097e-06} +{"train_loss": 0.0005200454033911228, "global_step": 57794, "epoch": 485, "lr": 8.813569617519124e-06} +{"train_loss": 0.0005489333416335285, "global_step": 57795, "epoch": 485, "lr": 8.812313498806396e-06} +{"train_loss": 0.000821959984023124, "global_step": 57796, "epoch": 485, "lr": 8.811057460961296e-06} +{"train_loss": 0.0004926974652335048, "global_step": 57797, "epoch": 485, "lr": 8.809801503986292e-06} +{"train_loss": 0.00048157613491639495, "global_step": 57798, "epoch": 485, "lr": 8.80854562788383e-06} +{"train_loss": 0.00034692336339503527, "global_step": 57799, "epoch": 485, "lr": 8.807289832656395e-06} +{"train_loss": 0.0004988983855582774, "global_step": 57800, "epoch": 485, "lr": 8.806034118306433e-06} +{"train_loss": 0.00039100166759453714, "global_step": 57801, "epoch": 485, "lr": 8.80477848483644e-06} +{"train_loss": 0.00023492047330364585, "global_step": 57802, "epoch": 485, "lr": 8.803522932248848e-06} +{"train_loss": 0.0007058547344058752, "global_step": 57803, "epoch": 485, "lr": 8.802267460546149e-06} +{"train_loss": 0.00026297057047486305, "global_step": 57804, "epoch": 485, "lr": 8.801012069730797e-06} +{"train_loss": 0.0002650032693054527, "global_step": 57805, "epoch": 485, "lr": 8.799756759805245e-06} +{"train_loss": 0.0004846762167289853, "global_step": 57806, "epoch": 485, "lr": 8.79850153077198e-06} +{"train_loss": 0.000708986131940037, "global_step": 57807, "epoch": 485, "lr": 8.797246382633444e-06} +{"train_loss": 0.0002912335330620408, "global_step": 57808, "epoch": 485, "lr": 8.795991315392122e-06} +{"train_loss": 0.0004566333082038909, "global_step": 57809, "epoch": 485, "lr": 8.794736329050463e-06} +{"train_loss": 0.0004517720080912113, "global_step": 57810, "epoch": 485, "lr": 8.793481423610944e-06} +{"train_loss": 0.0003233289753552526, "global_step": 57811, "epoch": 485, "lr": 8.792226599076025e-06} +{"train_loss": 0.0007811186951585114, "global_step": 57812, "epoch": 485, "lr": 8.790971855448155e-06} +{"train_loss": 0.0005371170700527728, "global_step": 57813, "epoch": 485, "lr": 8.789717192729818e-06} +{"train_loss": 0.00045694963773712516, "global_step": 57814, "epoch": 485, "lr": 8.788462610923459e-06} +{"train_loss": 0.0005914781359024346, "global_step": 57815, "epoch": 485, "lr": 8.787208110031563e-06} +{"train_loss": 0.000543986214324832, "global_step": 57816, "epoch": 485, "lr": 8.785953690056565e-06} +{"train_loss": 0.0004377235018182546, "global_step": 57817, "epoch": 485, "lr": 8.784699351000958e-06} +{"train_loss": 0.0005320449126884341, "global_step": 57818, "epoch": 485, "lr": 8.783445092867182e-06} +{"train_loss": 0.00043522592750377953, "global_step": 57819, "epoch": 485, "lr": 8.782190915657706e-06} +{"train_loss": 0.0005413126200437546, "global_step": 57820, "epoch": 485, "lr": 8.780936819375007e-06} +{"train_loss": 0.00039793158066459, "global_step": 57821, "epoch": 485, "lr": 8.779682804021521e-06} +{"train_loss": 0.0002672804403118789, "global_step": 57822, "epoch": 485, "lr": 8.778428869599737e-06} +{"train_loss": 0.0003608319675549865, "global_step": 57823, "epoch": 485, "lr": 8.777175016112104e-06} +{"train_loss": 0.00025008851662278175, "global_step": 57824, "epoch": 485, "lr": 8.775921243561076e-06} +{"train_loss": 0.0007520558428950608, "global_step": 57825, "epoch": 485, "lr": 8.774667551949129e-06} +{"train_loss": 0.0003080522292293608, "global_step": 57826, "epoch": 485, "lr": 8.773413941278707e-06} +{"train_loss": 0.0002985669707413763, "global_step": 57827, "epoch": 485, "lr": 8.772160411552294e-06} +{"train_loss": 0.0005238670855760574, "global_step": 57828, "epoch": 485, "lr": 8.77090696277233e-06} +{"train_loss": 0.0005163405439816415, "global_step": 57829, "epoch": 485, "lr": 8.769653594941297e-06} +{"train_loss": 0.0011289415415376425, "global_step": 57830, "epoch": 485, "lr": 8.768400308061642e-06} +{"train_loss": 0.000619945814833045, "global_step": 57831, "epoch": 485, "lr": 8.76714710213582e-06} +{"train_loss": 0.00046550185652449727, "global_step": 57832, "epoch": 485, "lr": 8.765893977166306e-06} +{"train_loss": 0.0005032289890619386, "global_step": 57833, "epoch": 485, "lr": 8.76464093315555e-06, "val_loss": 0.007029838860034943, "train_action_mse_error": 5.914005669183098e-06} +{"train_loss": 0.0002981780271511525, "global_step": 57834, "epoch": 486, "lr": 8.763387970106024e-06} +{"train_loss": 0.0004938115598633885, "global_step": 57835, "epoch": 486, "lr": 8.762135088020179e-06} +{"train_loss": 0.00034748826874420047, "global_step": 57836, "epoch": 486, "lr": 8.760882286900463e-06} +{"train_loss": 0.0003897598653566092, "global_step": 57837, "epoch": 486, "lr": 8.759629566749361e-06} +{"train_loss": 0.000489911762997508, "global_step": 57838, "epoch": 486, "lr": 8.758376927569311e-06} +{"train_loss": 0.0007216262747533619, "global_step": 57839, "epoch": 486, "lr": 8.757124369362796e-06} +{"train_loss": 0.0012967034708708525, "global_step": 57840, "epoch": 486, "lr": 8.755871892132245e-06} +{"train_loss": 0.000255712540820241, "global_step": 57841, "epoch": 486, "lr": 8.754619495880146e-06} +{"train_loss": 0.00041003021760843694, "global_step": 57842, "epoch": 486, "lr": 8.753367180608945e-06} +{"train_loss": 0.00025392655516043305, "global_step": 57843, "epoch": 486, "lr": 8.752114946321088e-06} +{"train_loss": 0.00033055964740924537, "global_step": 57844, "epoch": 486, "lr": 8.75086279301906e-06} +{"train_loss": 0.00038884402601979673, "global_step": 57845, "epoch": 486, "lr": 8.749610720705292e-06} +{"train_loss": 0.0004851545672863722, "global_step": 57846, "epoch": 486, "lr": 8.748358729382272e-06} +{"train_loss": 0.0006712297326885164, "global_step": 57847, "epoch": 486, "lr": 8.747106819052431e-06} +{"train_loss": 0.00046162959188222885, "global_step": 57848, "epoch": 486, "lr": 8.745854989718249e-06} +{"train_loss": 0.000326193607179448, "global_step": 57849, "epoch": 486, "lr": 8.74460324138216e-06} +{"train_loss": 0.0002553655649535358, "global_step": 57850, "epoch": 486, "lr": 8.743351574046649e-06} +{"train_loss": 0.000514896004460752, "global_step": 57851, "epoch": 486, "lr": 8.742099987714147e-06} +{"train_loss": 0.00034994425368495286, "global_step": 57852, "epoch": 486, "lr": 8.740848482387138e-06} +{"train_loss": 0.00048203003825619817, "global_step": 57853, "epoch": 486, "lr": 8.73959705806805e-06} +{"train_loss": 0.0005413830513134599, "global_step": 57854, "epoch": 486, "lr": 8.738345714759366e-06} +{"train_loss": 0.0008561548311263323, "global_step": 57855, "epoch": 486, "lr": 8.737094452463523e-06} +{"train_loss": 0.0005505329463630915, "global_step": 57856, "epoch": 486, "lr": 8.735843271182997e-06} +{"train_loss": 0.0005878818337805569, "global_step": 57857, "epoch": 486, "lr": 8.73459217092022e-06} +{"train_loss": 0.00019955036987084895, "global_step": 57858, "epoch": 486, "lr": 8.733341151677682e-06} +{"train_loss": 0.0008541157003492117, "global_step": 57859, "epoch": 486, "lr": 8.7320902134578e-06} +{"train_loss": 0.0009163081413134933, "global_step": 57860, "epoch": 486, "lr": 8.730839356263065e-06} +{"train_loss": 0.0004141411918681115, "global_step": 57861, "epoch": 486, "lr": 8.72958858009592e-06} +{"train_loss": 0.0009915519040077925, "global_step": 57862, "epoch": 486, "lr": 8.728337884958804e-06} +{"train_loss": 0.0010294815292581916, "global_step": 57863, "epoch": 486, "lr": 8.7270872708542e-06} +{"train_loss": 0.00028367681079544127, "global_step": 57864, "epoch": 486, "lr": 8.725836737784542e-06} +{"train_loss": 0.0003003857273142785, "global_step": 57865, "epoch": 486, "lr": 8.724586285752307e-06} +{"train_loss": 0.0006156614981591702, "global_step": 57866, "epoch": 486, "lr": 8.723335914759934e-06} +{"train_loss": 0.0005082923453301191, "global_step": 57867, "epoch": 486, "lr": 8.722085624809867e-06} +{"train_loss": 0.000479204609291628, "global_step": 57868, "epoch": 486, "lr": 8.720835415904589e-06} +{"train_loss": 0.00035192316863685846, "global_step": 57869, "epoch": 486, "lr": 8.719585288046528e-06} +{"train_loss": 0.0005430118180811405, "global_step": 57870, "epoch": 486, "lr": 8.718335241238163e-06} +{"train_loss": 0.0009614375303499401, "global_step": 57871, "epoch": 486, "lr": 8.717085275481924e-06} +{"train_loss": 0.00029439973877742887, "global_step": 57872, "epoch": 486, "lr": 8.715835390780291e-06} +{"train_loss": 0.0006973916897550225, "global_step": 57873, "epoch": 486, "lr": 8.714585587135704e-06} +{"train_loss": 0.0005676612490788102, "global_step": 57874, "epoch": 486, "lr": 8.71333586455061e-06} +{"train_loss": 0.0005741323111578822, "global_step": 57875, "epoch": 486, "lr": 8.712086223027477e-06} +{"train_loss": 0.0003749572788365185, "global_step": 57876, "epoch": 486, "lr": 8.71083666256874e-06} +{"train_loss": 0.0003809300542343408, "global_step": 57877, "epoch": 486, "lr": 8.709587183176877e-06} +{"train_loss": 0.0004818663001060486, "global_step": 57878, "epoch": 486, "lr": 8.708337784854314e-06} +{"train_loss": 0.0006042985478416085, "global_step": 57879, "epoch": 486, "lr": 8.707088467603536e-06} +{"train_loss": 0.0005107246688567102, "global_step": 57880, "epoch": 486, "lr": 8.705839231426959e-06} +{"train_loss": 0.0005193675169721246, "global_step": 57881, "epoch": 486, "lr": 8.704590076327075e-06} +{"train_loss": 0.00037778663681820035, "global_step": 57882, "epoch": 486, "lr": 8.703341002306299e-06} +{"train_loss": 0.00034974043956026435, "global_step": 57883, "epoch": 486, "lr": 8.702092009367113e-06} +{"train_loss": 0.00043220308725722134, "global_step": 57884, "epoch": 486, "lr": 8.700843097511946e-06} +{"train_loss": 0.0005033320630900562, "global_step": 57885, "epoch": 486, "lr": 8.699594266743278e-06} +{"train_loss": 0.0007029708358459175, "global_step": 57886, "epoch": 486, "lr": 8.698345517063527e-06} +{"train_loss": 0.0003845219616778195, "global_step": 57887, "epoch": 486, "lr": 8.697096848475178e-06} +{"train_loss": 0.000901838531717658, "global_step": 57888, "epoch": 486, "lr": 8.69584826098065e-06} +{"train_loss": 0.0006985885556787252, "global_step": 57889, "epoch": 486, "lr": 8.694599754582427e-06} +{"train_loss": 0.000547458534128964, "global_step": 57890, "epoch": 486, "lr": 8.693351329282933e-06} +{"train_loss": 0.0008740941993892193, "global_step": 57891, "epoch": 486, "lr": 8.692102985084638e-06} +{"train_loss": 0.0002728945983108133, "global_step": 57892, "epoch": 486, "lr": 8.690854721989989e-06} +{"train_loss": 0.00045521912397816777, "global_step": 57893, "epoch": 486, "lr": 8.68960654000142e-06} +{"train_loss": 0.0004577779909595847, "global_step": 57894, "epoch": 486, "lr": 8.688358439121414e-06} +{"train_loss": 0.00034515527659095824, "global_step": 57895, "epoch": 486, "lr": 8.687110419352384e-06} +{"train_loss": 0.000467548641609028, "global_step": 57896, "epoch": 486, "lr": 8.68586248069681e-06} +{"train_loss": 0.0004128669679630548, "global_step": 57897, "epoch": 486, "lr": 8.684614623157133e-06} +{"train_loss": 0.00022912272834219038, "global_step": 57898, "epoch": 486, "lr": 8.68336684673579e-06} +{"train_loss": 0.00042243339703418314, "global_step": 57899, "epoch": 486, "lr": 8.682119151435259e-06} +{"train_loss": 0.0005059314426034689, "global_step": 57900, "epoch": 486, "lr": 8.680871537257951e-06} +{"train_loss": 0.000423252466134727, "global_step": 57901, "epoch": 486, "lr": 8.679624004206355e-06} +{"train_loss": 0.0006571278790943325, "global_step": 57902, "epoch": 486, "lr": 8.67837655228289e-06} +{"train_loss": 0.0003779068938456476, "global_step": 57903, "epoch": 486, "lr": 8.677129181490029e-06} +{"train_loss": 0.00038326173671521246, "global_step": 57904, "epoch": 486, "lr": 8.675881891830212e-06} +{"train_loss": 0.0005691329715773463, "global_step": 57905, "epoch": 486, "lr": 8.674634683305876e-06} +{"train_loss": 0.0004922195221297443, "global_step": 57906, "epoch": 486, "lr": 8.673387555919487e-06} +{"train_loss": 0.0004086426051799208, "global_step": 57907, "epoch": 486, "lr": 8.672140509673476e-06} +{"train_loss": 0.0004686984757427126, "global_step": 57908, "epoch": 486, "lr": 8.670893544570319e-06} +{"train_loss": 0.0003001278964802623, "global_step": 57909, "epoch": 486, "lr": 8.669646660612429e-06} +{"train_loss": 0.0005119412089698017, "global_step": 57910, "epoch": 486, "lr": 8.668399857802284e-06} +{"train_loss": 0.0002740605268627405, "global_step": 57911, "epoch": 486, "lr": 8.667153136142325e-06} +{"train_loss": 0.0006462172023020685, "global_step": 57912, "epoch": 486, "lr": 8.665906495634979e-06} +{"train_loss": 0.00039663369534537196, "global_step": 57913, "epoch": 486, "lr": 8.664659936282727e-06} +{"train_loss": 0.0006389081827364862, "global_step": 57914, "epoch": 486, "lr": 8.663413458087982e-06} +{"train_loss": 0.000813436636235565, "global_step": 57915, "epoch": 486, "lr": 8.662167061053223e-06} +{"train_loss": 0.0003861016302835196, "global_step": 57916, "epoch": 486, "lr": 8.660920745180868e-06} +{"train_loss": 0.0009657850605435669, "global_step": 57917, "epoch": 486, "lr": 8.65967451047338e-06} +{"train_loss": 0.0003727542934939265, "global_step": 57918, "epoch": 486, "lr": 8.658428356933218e-06} +{"train_loss": 0.0008971277857199311, "global_step": 57919, "epoch": 486, "lr": 8.657182284562799e-06} +{"train_loss": 0.00031788661726750433, "global_step": 57920, "epoch": 486, "lr": 8.655936293364603e-06} +{"train_loss": 0.0006642753724008799, "global_step": 57921, "epoch": 486, "lr": 8.654690383341042e-06} +{"train_loss": 0.0005817010533064604, "global_step": 57922, "epoch": 486, "lr": 8.653444554494594e-06} +{"train_loss": 0.00021580245811492205, "global_step": 57923, "epoch": 486, "lr": 8.652198806827694e-06} +{"train_loss": 0.0003726726572494954, "global_step": 57924, "epoch": 486, "lr": 8.650953140342765e-06} +{"train_loss": 0.000790488556958735, "global_step": 57925, "epoch": 486, "lr": 8.649707555042291e-06} +{"train_loss": 0.0005061127594672143, "global_step": 57926, "epoch": 486, "lr": 8.648462050928679e-06} +{"train_loss": 0.0006139373290352523, "global_step": 57927, "epoch": 486, "lr": 8.647216628004413e-06} +{"train_loss": 0.0003270924207754433, "global_step": 57928, "epoch": 486, "lr": 8.645971286271904e-06} +{"train_loss": 0.0004915963509120047, "global_step": 57929, "epoch": 486, "lr": 8.644726025733623e-06} +{"train_loss": 0.00038033080636523664, "global_step": 57930, "epoch": 486, "lr": 8.64348084639201e-06} +{"train_loss": 0.00041267817141488194, "global_step": 57931, "epoch": 486, "lr": 8.642235748249489e-06} +{"train_loss": 0.0004464979574549943, "global_step": 57932, "epoch": 486, "lr": 8.64099073130853e-06} +{"train_loss": 0.0006051856908015907, "global_step": 57933, "epoch": 486, "lr": 8.639745795571558e-06} +{"train_loss": 0.000529628072399646, "global_step": 57934, "epoch": 486, "lr": 8.638500941041033e-06} +{"train_loss": 0.0003740261890925467, "global_step": 57935, "epoch": 486, "lr": 8.637256167719399e-06} +{"train_loss": 0.0011887388536706567, "global_step": 57936, "epoch": 486, "lr": 8.63601147560908e-06} +{"train_loss": 0.00023740995675325394, "global_step": 57937, "epoch": 486, "lr": 8.63476686471254e-06} +{"train_loss": 0.00022212043404579163, "global_step": 57938, "epoch": 486, "lr": 8.633522335032207e-06} +{"train_loss": 0.00038606076850555837, "global_step": 57939, "epoch": 486, "lr": 8.63227788657055e-06} +{"train_loss": 0.0002793514868244529, "global_step": 57940, "epoch": 486, "lr": 8.631033519329979e-06} +{"train_loss": 0.0007599095115438104, "global_step": 57941, "epoch": 486, "lr": 8.629789233312969e-06} +{"train_loss": 0.00024716765619814396, "global_step": 57942, "epoch": 486, "lr": 8.628545028521944e-06} +{"train_loss": 0.0003982342022936791, "global_step": 57943, "epoch": 486, "lr": 8.627300904959346e-06} +{"train_loss": 0.0006337130907922983, "global_step": 57944, "epoch": 486, "lr": 8.62605686262763e-06} +{"train_loss": 0.00042544008465483785, "global_step": 57945, "epoch": 486, "lr": 8.624812901529216e-06} +{"train_loss": 0.00035452013253234327, "global_step": 57946, "epoch": 486, "lr": 8.623569021666578e-06} +{"train_loss": 0.00039801569073460996, "global_step": 57947, "epoch": 486, "lr": 8.622325223042132e-06} +{"train_loss": 0.00038031855365261436, "global_step": 57948, "epoch": 486, "lr": 8.621081505658335e-06} +{"train_loss": 0.0004938647616654634, "global_step": 57949, "epoch": 486, "lr": 8.619837869517616e-06} +{"train_loss": 0.00033192423870787024, "global_step": 57950, "epoch": 486, "lr": 8.618594314622436e-06} +{"train_loss": 0.00036417105002328753, "global_step": 57951, "epoch": 486, "lr": 8.617350840975213e-06} +{"train_loss": 0.0005036861064184472, "global_step": 57952, "epoch": 486, "lr": 8.616107448578403e-06, "val_loss": 0.012082371860742569} +{"train_loss": 0.00024087850761134177, "global_step": 57953, "epoch": 487, "lr": 8.614864137434453e-06} +{"train_loss": 0.00028997843037359416, "global_step": 57954, "epoch": 487, "lr": 8.613620907545799e-06} +{"train_loss": 0.00018954317783936858, "global_step": 57955, "epoch": 487, "lr": 8.612377758914864e-06} +{"train_loss": 0.0002604530309326947, "global_step": 57956, "epoch": 487, "lr": 8.61113469154412e-06} +{"train_loss": 0.000549285439774394, "global_step": 57957, "epoch": 487, "lr": 8.609891705435973e-06} +{"train_loss": 0.0003566126397345215, "global_step": 57958, "epoch": 487, "lr": 8.6086488005929e-06} +{"train_loss": 0.0004002197820227593, "global_step": 57959, "epoch": 487, "lr": 8.607405977017307e-06} +{"train_loss": 0.000536116654984653, "global_step": 57960, "epoch": 487, "lr": 8.606163234711662e-06} +{"train_loss": 0.0006421635625883937, "global_step": 57961, "epoch": 487, "lr": 8.604920573678394e-06} +{"train_loss": 0.00039957964327186346, "global_step": 57962, "epoch": 487, "lr": 8.603677993919935e-06} +{"train_loss": 0.00023615211830474436, "global_step": 57963, "epoch": 487, "lr": 8.602435495438737e-06} +{"train_loss": 0.000544107926543802, "global_step": 57964, "epoch": 487, "lr": 8.601193078237224e-06} +{"train_loss": 0.0002521346905268729, "global_step": 57965, "epoch": 487, "lr": 8.599950742317858e-06} +{"train_loss": 0.00032424225355498493, "global_step": 57966, "epoch": 487, "lr": 8.598708487683066e-06} +{"train_loss": 0.000737089547328651, "global_step": 57967, "epoch": 487, "lr": 8.597466314335272e-06} +{"train_loss": 0.0002728715480770916, "global_step": 57968, "epoch": 487, "lr": 8.59622422227695e-06} +{"train_loss": 0.0007086361874826252, "global_step": 57969, "epoch": 487, "lr": 8.594982211510499e-06} +{"train_loss": 0.0004965112311765552, "global_step": 57970, "epoch": 487, "lr": 8.593740282038386e-06} +{"train_loss": 0.0002445746213197708, "global_step": 57971, "epoch": 487, "lr": 8.59249843386304e-06} +{"train_loss": 0.0003088400699198246, "global_step": 57972, "epoch": 487, "lr": 8.591256666986902e-06} +{"train_loss": 0.0007929496350698173, "global_step": 57973, "epoch": 487, "lr": 8.59001498141241e-06} +{"train_loss": 0.00036427061422728, "global_step": 57974, "epoch": 487, "lr": 8.588773377141985e-06} +{"train_loss": 0.00038530267192982137, "global_step": 57975, "epoch": 487, "lr": 8.587531854178099e-06} +{"train_loss": 0.00047922207158990204, "global_step": 57976, "epoch": 487, "lr": 8.586290412523152e-06} +{"train_loss": 0.000683231686707586, "global_step": 57977, "epoch": 487, "lr": 8.58504905217961e-06} +{"train_loss": 0.00034010139643214643, "global_step": 57978, "epoch": 487, "lr": 8.583807773149894e-06} +{"train_loss": 0.0005578345153480768, "global_step": 57979, "epoch": 487, "lr": 8.582566575436451e-06} +{"train_loss": 0.0005476350779645145, "global_step": 57980, "epoch": 487, "lr": 8.581325459041707e-06} +{"train_loss": 0.00041752340621314943, "global_step": 57981, "epoch": 487, "lr": 8.580084423968116e-06} +{"train_loss": 0.0006199435447342694, "global_step": 57982, "epoch": 487, "lr": 8.57884347021809e-06} +{"train_loss": 0.0007707352051511407, "global_step": 57983, "epoch": 487, "lr": 8.577602597794098e-06} +{"train_loss": 0.0003520490718074143, "global_step": 57984, "epoch": 487, "lr": 8.57636180669854e-06} +{"train_loss": 0.0008469070307910442, "global_step": 57985, "epoch": 487, "lr": 8.575121096933886e-06} +{"train_loss": 0.000510163779836148, "global_step": 57986, "epoch": 487, "lr": 8.573880468502544e-06} +{"train_loss": 0.0002013428893405944, "global_step": 57987, "epoch": 487, "lr": 8.572639921406966e-06} +{"train_loss": 0.00023806086392141879, "global_step": 57988, "epoch": 487, "lr": 8.571399455649581e-06} +{"train_loss": 0.0002786426921375096, "global_step": 57989, "epoch": 487, "lr": 8.570159071232836e-06} +{"train_loss": 0.0003593727888073772, "global_step": 57990, "epoch": 487, "lr": 8.568918768159146e-06} +{"train_loss": 0.0007524045067839324, "global_step": 57991, "epoch": 487, "lr": 8.567678546430969e-06} +{"train_loss": 0.0004220679693389684, "global_step": 57992, "epoch": 487, "lr": 8.566438406050731e-06} +{"train_loss": 0.0005244914209470153, "global_step": 57993, "epoch": 487, "lr": 8.565198347020847e-06} +{"train_loss": 0.0005000158562324941, "global_step": 57994, "epoch": 487, "lr": 8.563958369343788e-06} +{"train_loss": 0.0004443485231604427, "global_step": 57995, "epoch": 487, "lr": 8.562718473021952e-06} +{"train_loss": 0.00034940423211082816, "global_step": 57996, "epoch": 487, "lr": 8.561478658057809e-06} +{"train_loss": 0.0009313758346252143, "global_step": 57997, "epoch": 487, "lr": 8.560238924453761e-06} +{"train_loss": 0.0003136511368211359, "global_step": 57998, "epoch": 487, "lr": 8.55899927221227e-06} +{"train_loss": 0.00023798568872734904, "global_step": 57999, "epoch": 487, "lr": 8.557759701335754e-06} +{"train_loss": 0.0005392176099121571, "global_step": 58000, "epoch": 487, "lr": 8.556520211826641e-06} +{"train_loss": 0.00024189840769395232, "global_step": 58001, "epoch": 487, "lr": 8.555280803687382e-06} +{"train_loss": 0.0008032642654143274, "global_step": 58002, "epoch": 487, "lr": 8.554041476920388e-06} +{"train_loss": 0.0005901654367335141, "global_step": 58003, "epoch": 487, "lr": 8.552802231528117e-06} +{"train_loss": 0.0002863524714484811, "global_step": 58004, "epoch": 487, "lr": 8.551563067512997e-06} +{"train_loss": 0.0004626355366781354, "global_step": 58005, "epoch": 487, "lr": 8.55032398487744e-06} +{"train_loss": 0.0005287263775244355, "global_step": 58006, "epoch": 487, "lr": 8.549084983623907e-06} +{"train_loss": 0.0003815463569480926, "global_step": 58007, "epoch": 487, "lr": 8.5478460637548e-06} +{"train_loss": 0.0007788104703649879, "global_step": 58008, "epoch": 487, "lr": 8.546607225272584e-06} +{"train_loss": 0.000518182700034231, "global_step": 58009, "epoch": 487, "lr": 8.545368468179666e-06} +{"train_loss": 0.00045602471800521016, "global_step": 58010, "epoch": 487, "lr": 8.544129792478495e-06} +{"train_loss": 0.000734651111997664, "global_step": 58011, "epoch": 487, "lr": 8.542891198171504e-06} +{"train_loss": 0.0005619724397547543, "global_step": 58012, "epoch": 487, "lr": 8.541652685261098e-06} +{"train_loss": 0.0012922369642183185, "global_step": 58013, "epoch": 487, "lr": 8.54041425374973e-06} +{"train_loss": 0.0006340640829876065, "global_step": 58014, "epoch": 487, "lr": 8.539175903639845e-06} +{"train_loss": 0.0006023795576766133, "global_step": 58015, "epoch": 487, "lr": 8.53793763493384e-06} +{"train_loss": 0.0004288015188649297, "global_step": 58016, "epoch": 487, "lr": 8.536699447634183e-06} +{"train_loss": 0.0003632103034760803, "global_step": 58017, "epoch": 487, "lr": 8.535461341743272e-06} +{"train_loss": 0.0005763288936577737, "global_step": 58018, "epoch": 487, "lr": 8.534223317263563e-06} +{"train_loss": 0.0006817943649366498, "global_step": 58019, "epoch": 487, "lr": 8.532985374197467e-06} +{"train_loss": 0.000742852920666337, "global_step": 58020, "epoch": 487, "lr": 8.53174751254744e-06} +{"train_loss": 0.0005311337299644947, "global_step": 58021, "epoch": 487, "lr": 8.530509732315877e-06} +{"train_loss": 0.0003510675160214305, "global_step": 58022, "epoch": 487, "lr": 8.529272033505242e-06} +{"train_loss": 0.00041326283826492727, "global_step": 58023, "epoch": 487, "lr": 8.528034416117953e-06} +{"train_loss": 0.0003034921537619084, "global_step": 58024, "epoch": 487, "lr": 8.526796880156423e-06} +{"train_loss": 0.0005976324900984764, "global_step": 58025, "epoch": 487, "lr": 8.525559425623114e-06} +{"train_loss": 0.0003415980318095535, "global_step": 58026, "epoch": 487, "lr": 8.524322052520423e-06} +{"train_loss": 0.0003980585315730423, "global_step": 58027, "epoch": 487, "lr": 8.523084760850802e-06} +{"train_loss": 0.00046291909529827535, "global_step": 58028, "epoch": 487, "lr": 8.521847550616668e-06} +{"train_loss": 0.00031091400887817144, "global_step": 58029, "epoch": 487, "lr": 8.520610421820463e-06} +{"train_loss": 0.0008962351712398231, "global_step": 58030, "epoch": 487, "lr": 8.519373374464612e-06} +{"train_loss": 0.0006199150229804218, "global_step": 58031, "epoch": 487, "lr": 8.518136408551525e-06} +{"train_loss": 0.000546660739928484, "global_step": 58032, "epoch": 487, "lr": 8.516899524083654e-06} +{"train_loss": 0.0004481423238757998, "global_step": 58033, "epoch": 487, "lr": 8.515662721063412e-06} +{"train_loss": 0.0004629657487384975, "global_step": 58034, "epoch": 487, "lr": 8.514425999493241e-06} +{"train_loss": 0.0007089732098393142, "global_step": 58035, "epoch": 487, "lr": 8.513189359375568e-06} +{"train_loss": 0.0004023564397357404, "global_step": 58036, "epoch": 487, "lr": 8.511952800712803e-06} +{"train_loss": 0.0003733386693056673, "global_step": 58037, "epoch": 487, "lr": 8.510716323507395e-06} +{"train_loss": 0.0007004559738561511, "global_step": 58038, "epoch": 487, "lr": 8.509479927761755e-06} +{"train_loss": 0.0009380181436426938, "global_step": 58039, "epoch": 487, "lr": 8.508243613478329e-06} +{"train_loss": 0.0003870436630677432, "global_step": 58040, "epoch": 487, "lr": 8.507007380659521e-06} +{"train_loss": 0.0005353434826247394, "global_step": 58041, "epoch": 487, "lr": 8.505771229307785e-06} +{"train_loss": 0.0004365125496406108, "global_step": 58042, "epoch": 487, "lr": 8.504535159425531e-06} +{"train_loss": 0.00028852481045760214, "global_step": 58043, "epoch": 487, "lr": 8.503299171015177e-06} +{"train_loss": 0.0003152840363327414, "global_step": 58044, "epoch": 487, "lr": 8.502063264079179e-06} +{"train_loss": 0.00033691953285597265, "global_step": 58045, "epoch": 487, "lr": 8.500827438619929e-06} +{"train_loss": 0.0008026938303373754, "global_step": 58046, "epoch": 487, "lr": 8.499591694639886e-06} +{"train_loss": 0.00082194380229339, "global_step": 58047, "epoch": 487, "lr": 8.498356032141447e-06} +{"train_loss": 0.000839479558635503, "global_step": 58048, "epoch": 487, "lr": 8.497120451127056e-06} +{"train_loss": 0.0006121547194197774, "global_step": 58049, "epoch": 487, "lr": 8.495884951599142e-06} +{"train_loss": 0.0005114592495374382, "global_step": 58050, "epoch": 487, "lr": 8.494649533560112e-06} +{"train_loss": 0.0011361216893419623, "global_step": 58051, "epoch": 487, "lr": 8.493414197012422e-06} +{"train_loss": 0.00045871749171055853, "global_step": 58052, "epoch": 487, "lr": 8.492178941958462e-06} +{"train_loss": 0.000491616316139698, "global_step": 58053, "epoch": 487, "lr": 8.490943768400683e-06} +{"train_loss": 0.0003260077501181513, "global_step": 58054, "epoch": 487, "lr": 8.489708676341507e-06} +{"train_loss": 0.0003953854029532522, "global_step": 58055, "epoch": 487, "lr": 8.488473665783336e-06} +{"train_loss": 0.0003181478241458535, "global_step": 58056, "epoch": 487, "lr": 8.48723873672863e-06} +{"train_loss": 0.0002550983044784516, "global_step": 58057, "epoch": 487, "lr": 8.486003889179783e-06} +{"train_loss": 0.0003371533821336925, "global_step": 58058, "epoch": 487, "lr": 8.484769123139242e-06} +{"train_loss": 0.0003738527884706855, "global_step": 58059, "epoch": 487, "lr": 8.483534438609409e-06} +{"train_loss": 0.0005669600213877857, "global_step": 58060, "epoch": 487, "lr": 8.482299835592733e-06} +{"train_loss": 0.00039609044324606657, "global_step": 58061, "epoch": 487, "lr": 8.481065314091625e-06} +{"train_loss": 0.00041837606113404036, "global_step": 58062, "epoch": 487, "lr": 8.479830874108501e-06} +{"train_loss": 0.0005064402357675135, "global_step": 58063, "epoch": 487, "lr": 8.478596515645804e-06} +{"train_loss": 0.00046912144171074033, "global_step": 58064, "epoch": 487, "lr": 8.477362238705933e-06} +{"train_loss": 0.000551333068870008, "global_step": 58065, "epoch": 487, "lr": 8.476128043291337e-06} +{"train_loss": 0.0004102570819668472, "global_step": 58066, "epoch": 487, "lr": 8.474893929404414e-06} +{"train_loss": 0.00024089656653814018, "global_step": 58067, "epoch": 487, "lr": 8.47365989704762e-06} +{"train_loss": 0.0006188626284711063, "global_step": 58068, "epoch": 487, "lr": 8.47242594622335e-06} +{"train_loss": 0.0007438135799020529, "global_step": 58069, "epoch": 487, "lr": 8.471192076934027e-06} +{"train_loss": 0.00032391288550570607, "global_step": 58070, "epoch": 487, "lr": 8.469958289182095e-06} +{"train_loss": 0.0004982057971803535, "global_step": 58071, "epoch": 487, "lr": 8.46872458296995e-06, "val_loss": 0.017512395977973938} +{"train_loss": 0.00047616547090001404, "global_step": 58072, "epoch": 488, "lr": 8.46749095830004e-06} +{"train_loss": 0.00024141196627169847, "global_step": 58073, "epoch": 488, "lr": 8.466257415174772e-06} +{"train_loss": 0.0006378876278176904, "global_step": 58074, "epoch": 488, "lr": 8.465023953596557e-06} +{"train_loss": 0.000522205897141248, "global_step": 58075, "epoch": 488, "lr": 8.463790573567848e-06} +{"train_loss": 0.0003898422874044627, "global_step": 58076, "epoch": 488, "lr": 8.462557275091033e-06} +{"train_loss": 0.00034884337219409645, "global_step": 58077, "epoch": 488, "lr": 8.461324058168557e-06} +{"train_loss": 0.0003253735485486686, "global_step": 58078, "epoch": 488, "lr": 8.460090922802828e-06} +{"train_loss": 0.0004129184235353023, "global_step": 58079, "epoch": 488, "lr": 8.458857868996283e-06} +{"train_loss": 0.0004922306397929788, "global_step": 58080, "epoch": 488, "lr": 8.45762489675132e-06} +{"train_loss": 0.00023873856116551906, "global_step": 58081, "epoch": 488, "lr": 8.456392006070384e-06} +{"train_loss": 0.0004644212604034692, "global_step": 58082, "epoch": 488, "lr": 8.45515919695587e-06} +{"train_loss": 0.0005196937127038836, "global_step": 58083, "epoch": 488, "lr": 8.453926469410218e-06} +{"train_loss": 0.0002595951082184911, "global_step": 58084, "epoch": 488, "lr": 8.452693823435848e-06} +{"train_loss": 0.0005660110036842525, "global_step": 58085, "epoch": 488, "lr": 8.451461259035181e-06} +{"train_loss": 0.0007915932801552117, "global_step": 58086, "epoch": 488, "lr": 8.450228776210617e-06} +{"train_loss": 0.0008482977864332497, "global_step": 58087, "epoch": 488, "lr": 8.448996374964602e-06} +{"train_loss": 0.0005305481026880443, "global_step": 58088, "epoch": 488, "lr": 8.447764055299529e-06} +{"train_loss": 0.00025693365023471415, "global_step": 58089, "epoch": 488, "lr": 8.446531817217846e-06} +{"train_loss": 0.000373024377040565, "global_step": 58090, "epoch": 488, "lr": 8.445299660721951e-06} +{"train_loss": 0.000452423031674698, "global_step": 58091, "epoch": 488, "lr": 8.444067585814275e-06} +{"train_loss": 0.0006049037328921258, "global_step": 58092, "epoch": 488, "lr": 8.442835592497233e-06} +{"train_loss": 0.0005649311351589859, "global_step": 58093, "epoch": 488, "lr": 8.441603680773236e-06} +{"train_loss": 0.0005259299650788307, "global_step": 58094, "epoch": 488, "lr": 8.440371850644723e-06} +{"train_loss": 0.0005007499712519348, "global_step": 58095, "epoch": 488, "lr": 8.439140102114085e-06} +{"train_loss": 0.00043881862075068057, "global_step": 58096, "epoch": 488, "lr": 8.437908435183768e-06} +{"train_loss": 0.00032929208828136325, "global_step": 58097, "epoch": 488, "lr": 8.436676849856168e-06} +{"train_loss": 0.0004034068842884153, "global_step": 58098, "epoch": 488, "lr": 8.435445346133719e-06} +{"train_loss": 0.0004919061320833862, "global_step": 58099, "epoch": 488, "lr": 8.434213924018835e-06} +{"train_loss": 0.0004565490526147187, "global_step": 58100, "epoch": 488, "lr": 8.43298258351392e-06} +{"train_loss": 0.0002842228568624705, "global_step": 58101, "epoch": 488, "lr": 8.431751324621417e-06} +{"train_loss": 0.00030907109612599015, "global_step": 58102, "epoch": 488, "lr": 8.430520147343712e-06} +{"train_loss": 0.0005480788531713188, "global_step": 58103, "epoch": 488, "lr": 8.42928905168326e-06} +{"train_loss": 0.0004902358050458133, "global_step": 58104, "epoch": 488, "lr": 8.42805803764245e-06} +{"train_loss": 0.0005401743692345917, "global_step": 58105, "epoch": 488, "lr": 8.4268271052237e-06} +{"train_loss": 0.00042646739166229963, "global_step": 58106, "epoch": 488, "lr": 8.425596254429441e-06} +{"train_loss": 0.0003046104102395475, "global_step": 58107, "epoch": 488, "lr": 8.42436548526207e-06} +{"train_loss": 0.0005945641896687448, "global_step": 58108, "epoch": 488, "lr": 8.42313479772403e-06} +{"train_loss": 0.0006169859552755952, "global_step": 58109, "epoch": 488, "lr": 8.421904191817715e-06} +{"train_loss": 0.0005485505680553615, "global_step": 58110, "epoch": 488, "lr": 8.420673667545553e-06} +{"train_loss": 0.00022524619998876005, "global_step": 58111, "epoch": 488, "lr": 8.41944322490995e-06} +{"train_loss": 0.00023125545703805983, "global_step": 58112, "epoch": 488, "lr": 8.418212863913338e-06} +{"train_loss": 0.0005570577923208475, "global_step": 58113, "epoch": 488, "lr": 8.416982584558115e-06} +{"train_loss": 0.0006374543881975114, "global_step": 58114, "epoch": 488, "lr": 8.415752386846708e-06} +{"train_loss": 0.0003187183756381273, "global_step": 58115, "epoch": 488, "lr": 8.414522270781521e-06} +{"train_loss": 0.0004521169466897845, "global_step": 58116, "epoch": 488, "lr": 8.413292236364989e-06} +{"train_loss": 0.000629670568741858, "global_step": 58117, "epoch": 488, "lr": 8.412062283599504e-06} +{"train_loss": 0.00020935219072271138, "global_step": 58118, "epoch": 488, "lr": 8.410832412487502e-06} +{"train_loss": 0.0003702118410728872, "global_step": 58119, "epoch": 488, "lr": 8.409602623031371e-06} +{"train_loss": 0.0003223555686417967, "global_step": 58120, "epoch": 488, "lr": 8.408372915233559e-06} +{"train_loss": 0.00041950741433538496, "global_step": 58121, "epoch": 488, "lr": 8.407143289096454e-06} +{"train_loss": 0.00039889043546281755, "global_step": 58122, "epoch": 488, "lr": 8.405913744622484e-06} +{"train_loss": 0.0007977292407304049, "global_step": 58123, "epoch": 488, "lr": 8.404684281814062e-06} +{"train_loss": 0.00034626468550413847, "global_step": 58124, "epoch": 488, "lr": 8.403454900673591e-06} +{"train_loss": 0.00048531347420066595, "global_step": 58125, "epoch": 488, "lr": 8.4022256012035e-06} +{"train_loss": 0.0005671994294971228, "global_step": 58126, "epoch": 488, "lr": 8.400996383406184e-06} +{"train_loss": 0.0004448821709956974, "global_step": 58127, "epoch": 488, "lr": 8.39976724728408e-06} +{"train_loss": 0.0008971142233349383, "global_step": 58128, "epoch": 488, "lr": 8.398538192839578e-06} +{"train_loss": 0.0003460767911747098, "global_step": 58129, "epoch": 488, "lr": 8.39730922007511e-06} +{"train_loss": 0.0005530763883143663, "global_step": 58130, "epoch": 488, "lr": 8.396080328993083e-06} +{"train_loss": 0.0004007693787571043, "global_step": 58131, "epoch": 488, "lr": 8.394851519595893e-06} +{"train_loss": 0.0008179540163837373, "global_step": 58132, "epoch": 488, "lr": 8.39362279188598e-06} +{"train_loss": 0.0007844569627195597, "global_step": 58133, "epoch": 488, "lr": 8.392394145865734e-06} +{"train_loss": 0.0004112719907425344, "global_step": 58134, "epoch": 488, "lr": 8.391165581537591e-06} +{"train_loss": 0.0006761577096767724, "global_step": 58135, "epoch": 488, "lr": 8.389937098903933e-06} +{"train_loss": 0.00023695309937465936, "global_step": 58136, "epoch": 488, "lr": 8.388708697967202e-06} +{"train_loss": 0.00036009802715852857, "global_step": 58137, "epoch": 488, "lr": 8.387480378729795e-06} +{"train_loss": 0.0002456946240272373, "global_step": 58138, "epoch": 488, "lr": 8.386252141194112e-06} +{"train_loss": 0.000565238471608609, "global_step": 58139, "epoch": 488, "lr": 8.385023985362589e-06} +{"train_loss": 0.0005846739513799548, "global_step": 58140, "epoch": 488, "lr": 8.383795911237613e-06} +{"train_loss": 0.0010032524587586522, "global_step": 58141, "epoch": 488, "lr": 8.382567918821622e-06} +{"train_loss": 0.0007318552234210074, "global_step": 58142, "epoch": 488, "lr": 8.381340008117012e-06} +{"train_loss": 0.00040734990034252405, "global_step": 58143, "epoch": 488, "lr": 8.380112179126181e-06} +{"train_loss": 0.00038714605034328997, "global_step": 58144, "epoch": 488, "lr": 8.378884431851569e-06} +{"train_loss": 0.0002787893172353506, "global_step": 58145, "epoch": 488, "lr": 8.377656766295555e-06} +{"train_loss": 0.0002759672934189439, "global_step": 58146, "epoch": 488, "lr": 8.376429182460566e-06} +{"train_loss": 0.00047695799730718136, "global_step": 58147, "epoch": 488, "lr": 8.375201680349027e-06} +{"train_loss": 0.0005277876043692231, "global_step": 58148, "epoch": 488, "lr": 8.37397425996332e-06} +{"train_loss": 0.0005188141367398202, "global_step": 58149, "epoch": 488, "lr": 8.372746921305874e-06} +{"train_loss": 0.0004505408287514001, "global_step": 58150, "epoch": 488, "lr": 8.371519664379086e-06} +{"train_loss": 0.00042605752241797745, "global_step": 58151, "epoch": 488, "lr": 8.370292489185378e-06} +{"train_loss": 0.0005108760669827461, "global_step": 58152, "epoch": 488, "lr": 8.369065395727144e-06} +{"train_loss": 0.00033643931965343654, "global_step": 58153, "epoch": 488, "lr": 8.367838384006815e-06} +{"train_loss": 0.0002824394905474037, "global_step": 58154, "epoch": 488, "lr": 8.36661145402679e-06} +{"train_loss": 0.0006062875618226826, "global_step": 58155, "epoch": 488, "lr": 8.365384605789462e-06} +{"train_loss": 0.00040602227090857923, "global_step": 58156, "epoch": 488, "lr": 8.364157839297259e-06} +{"train_loss": 0.000336819066433236, "global_step": 58157, "epoch": 488, "lr": 8.362931154552578e-06} +{"train_loss": 0.0005133836530148983, "global_step": 58158, "epoch": 488, "lr": 8.361704551557847e-06} +{"train_loss": 0.0004989155568182468, "global_step": 58159, "epoch": 488, "lr": 8.360478030315444e-06} +{"train_loss": 0.00044199201511219144, "global_step": 58160, "epoch": 488, "lr": 8.359251590827811e-06} +{"train_loss": 0.0004776292771566659, "global_step": 58161, "epoch": 488, "lr": 8.358025233097338e-06} +{"train_loss": 0.0004721053410321474, "global_step": 58162, "epoch": 488, "lr": 8.356798957126416e-06} +{"train_loss": 0.0003118661406915635, "global_step": 58163, "epoch": 488, "lr": 8.35557276291749e-06} +{"train_loss": 0.000500320631545037, "global_step": 58164, "epoch": 488, "lr": 8.354346650472933e-06} +{"train_loss": 0.0007043306832201779, "global_step": 58165, "epoch": 488, "lr": 8.353120619795174e-06} +{"train_loss": 0.0003556170267984271, "global_step": 58166, "epoch": 488, "lr": 8.351894670886607e-06} +{"train_loss": 0.0006436010589823127, "global_step": 58167, "epoch": 488, "lr": 8.350668803749655e-06} +{"train_loss": 0.0006773839122615755, "global_step": 58168, "epoch": 488, "lr": 8.349443018386716e-06} +{"train_loss": 0.0004108407301828265, "global_step": 58169, "epoch": 488, "lr": 8.348217314800183e-06} +{"train_loss": 0.00046276327339001, "global_step": 58170, "epoch": 488, "lr": 8.34699169299249e-06} +{"train_loss": 0.0003839785058517009, "global_step": 58171, "epoch": 488, "lr": 8.345766152966016e-06} +{"train_loss": 0.00027881620917469263, "global_step": 58172, "epoch": 488, "lr": 8.344540694723192e-06} +{"train_loss": 0.0005073075299151242, "global_step": 58173, "epoch": 488, "lr": 8.343315318266409e-06} +{"train_loss": 0.0005178514984436333, "global_step": 58174, "epoch": 488, "lr": 8.34209002359807e-06} +{"train_loss": 0.0005654834094457328, "global_step": 58175, "epoch": 488, "lr": 8.340864810720594e-06} +{"train_loss": 0.0001893239823402837, "global_step": 58176, "epoch": 488, "lr": 8.33963967963637e-06} +{"train_loss": 0.0005044542485848069, "global_step": 58177, "epoch": 488, "lr": 8.338414630347824e-06} +{"train_loss": 0.00026877946220338345, "global_step": 58178, "epoch": 488, "lr": 8.337189662857336e-06} +{"train_loss": 0.0006428459892049432, "global_step": 58179, "epoch": 488, "lr": 8.335964777167338e-06} +{"train_loss": 0.000502803479321301, "global_step": 58180, "epoch": 488, "lr": 8.33473997328021e-06} +{"train_loss": 0.0006306517752818763, "global_step": 58181, "epoch": 488, "lr": 8.333515251198371e-06} +{"train_loss": 0.000374908180674538, "global_step": 58182, "epoch": 488, "lr": 8.332290610924232e-06} +{"train_loss": 0.0003977883025072515, "global_step": 58183, "epoch": 488, "lr": 8.331066052460178e-06} +{"train_loss": 0.00028277296223677695, "global_step": 58184, "epoch": 488, "lr": 8.329841575808639e-06} +{"train_loss": 0.0004025509988423437, "global_step": 58185, "epoch": 488, "lr": 8.328617180971987e-06} +{"train_loss": 0.0003591787244658917, "global_step": 58186, "epoch": 488, "lr": 8.327392867952661e-06} +{"train_loss": 0.00038539167144335806, "global_step": 58187, "epoch": 488, "lr": 8.32616863675304e-06} +{"train_loss": 0.000983168836683035, "global_step": 58188, "epoch": 488, "lr": 8.32494448737553e-06} +{"train_loss": 0.00035405007656663656, "global_step": 58189, "epoch": 488, "lr": 8.323720419822545e-06} +{"train_loss": 0.0004692654446512852, "global_step": 58190, "epoch": 488, "lr": 8.322496434096477e-06, "val_loss": 0.017478398978710175} +{"train_loss": 0.00022164388792589307, "global_step": 58191, "epoch": 489, "lr": 8.321272530199743e-06} +{"train_loss": 0.00024690150166861713, "global_step": 58192, "epoch": 489, "lr": 8.320048708134736e-06} +{"train_loss": 0.0005271253176033497, "global_step": 58193, "epoch": 489, "lr": 8.318824967903849e-06} +{"train_loss": 0.0005935032968409359, "global_step": 58194, "epoch": 489, "lr": 8.317601309509509e-06} +{"train_loss": 0.0003395214444026351, "global_step": 58195, "epoch": 489, "lr": 8.316377732954095e-06} +{"train_loss": 0.000442053540609777, "global_step": 58196, "epoch": 489, "lr": 8.315154238240031e-06} +{"train_loss": 0.0002760820207186043, "global_step": 58197, "epoch": 489, "lr": 8.313930825369697e-06} +{"train_loss": 0.0006740732351318002, "global_step": 58198, "epoch": 489, "lr": 8.312707494345518e-06} +{"train_loss": 0.00037077328306622803, "global_step": 58199, "epoch": 489, "lr": 8.311484245169886e-06} +{"train_loss": 0.00021491377265192568, "global_step": 58200, "epoch": 489, "lr": 8.310261077845188e-06} +{"train_loss": 0.0007576591451652348, "global_step": 58201, "epoch": 489, "lr": 8.309037992373847e-06} +{"train_loss": 0.0005475152283906937, "global_step": 58202, "epoch": 489, "lr": 8.30781498875825e-06} +{"train_loss": 0.00021588699019048363, "global_step": 58203, "epoch": 489, "lr": 8.306592067000812e-06} +{"train_loss": 0.0002810168080031872, "global_step": 58204, "epoch": 489, "lr": 8.305369227103926e-06} +{"train_loss": 0.0005400060908868909, "global_step": 58205, "epoch": 489, "lr": 8.304146469069978e-06} +{"train_loss": 0.0005885694990865886, "global_step": 58206, "epoch": 489, "lr": 8.302923792901402e-06} +{"train_loss": 0.0003538118035066873, "global_step": 58207, "epoch": 489, "lr": 8.30170119860057e-06} +{"train_loss": 0.0006473573157563806, "global_step": 58208, "epoch": 489, "lr": 8.300478686169899e-06} +{"train_loss": 0.0005584144964814186, "global_step": 58209, "epoch": 489, "lr": 8.29925625561177e-06} +{"train_loss": 0.0003566895902622491, "global_step": 58210, "epoch": 489, "lr": 8.298033906928615e-06} +{"train_loss": 0.0009782954584807158, "global_step": 58211, "epoch": 489, "lr": 8.296811640122798e-06} +{"train_loss": 0.0002559910644777119, "global_step": 58212, "epoch": 489, "lr": 8.29558945519675e-06} +{"train_loss": 0.00036332092713564634, "global_step": 58213, "epoch": 489, "lr": 8.294367352152843e-06} +{"train_loss": 0.0006595810409635305, "global_step": 58214, "epoch": 489, "lr": 8.293145330993506e-06} +{"train_loss": 0.0005335861351341009, "global_step": 58215, "epoch": 489, "lr": 8.291923391721107e-06} +{"train_loss": 0.00033235654700547457, "global_step": 58216, "epoch": 489, "lr": 8.290701534338063e-06} +{"train_loss": 0.0006967476801946759, "global_step": 58217, "epoch": 489, "lr": 8.28947975884678e-06} +{"train_loss": 0.0003870078653562814, "global_step": 58218, "epoch": 489, "lr": 8.288258065249648e-06} +{"train_loss": 0.0004152519104536623, "global_step": 58219, "epoch": 489, "lr": 8.287036453549052e-06} +{"train_loss": 0.0006467074854299426, "global_step": 58220, "epoch": 489, "lr": 8.28581492374742e-06} +{"train_loss": 0.0006008282653056085, "global_step": 58221, "epoch": 489, "lr": 8.284593475847119e-06} +{"train_loss": 0.000751402520108968, "global_step": 58222, "epoch": 489, "lr": 8.283372109850574e-06} +{"train_loss": 0.0006180834025144577, "global_step": 58223, "epoch": 489, "lr": 8.28215082576017e-06} +{"train_loss": 0.00036045245360583067, "global_step": 58224, "epoch": 489, "lr": 8.280929623578293e-06} +{"train_loss": 0.0004452370048966259, "global_step": 58225, "epoch": 489, "lr": 8.27970850330737e-06} +{"train_loss": 0.000740588700864464, "global_step": 58226, "epoch": 489, "lr": 8.27848746494977e-06} +{"train_loss": 0.0006315427599474788, "global_step": 58227, "epoch": 489, "lr": 8.277266508507908e-06} +{"train_loss": 0.0004919787752442062, "global_step": 58228, "epoch": 489, "lr": 8.276045633984169e-06} +{"train_loss": 0.0002236121945315972, "global_step": 58229, "epoch": 489, "lr": 8.274824841380969e-06} +{"train_loss": 0.0002959984412882477, "global_step": 58230, "epoch": 489, "lr": 8.273604130700691e-06} +{"train_loss": 0.0008131427457556129, "global_step": 58231, "epoch": 489, "lr": 8.272383501945723e-06} +{"train_loss": 0.00029954055207781494, "global_step": 58232, "epoch": 489, "lr": 8.271162955118484e-06} +{"train_loss": 0.00037800773861818016, "global_step": 58233, "epoch": 489, "lr": 8.269942490221343e-06} +{"train_loss": 0.0004942803061567247, "global_step": 58234, "epoch": 489, "lr": 8.268722107256732e-06} +{"train_loss": 0.00040913588600233197, "global_step": 58235, "epoch": 489, "lr": 8.267501806227007e-06} +{"train_loss": 0.0005816639750264585, "global_step": 58236, "epoch": 489, "lr": 8.2662815871346e-06} +{"train_loss": 0.00023586182214785367, "global_step": 58237, "epoch": 489, "lr": 8.265061449981887e-06} +{"train_loss": 0.0003242341917939484, "global_step": 58238, "epoch": 489, "lr": 8.26384139477126e-06} +{"train_loss": 0.0006547056837007403, "global_step": 58239, "epoch": 489, "lr": 8.26262142150513e-06} +{"train_loss": 0.00045037578092888, "global_step": 58240, "epoch": 489, "lr": 8.26140153018587e-06} +{"train_loss": 0.00048192666145041585, "global_step": 58241, "epoch": 489, "lr": 8.260181720815901e-06} +{"train_loss": 0.0005179326981306076, "global_step": 58242, "epoch": 489, "lr": 8.258961993397613e-06} +{"train_loss": 0.00036600950988940895, "global_step": 58243, "epoch": 489, "lr": 8.257742347933373e-06} +{"train_loss": 0.00023398148186970502, "global_step": 58244, "epoch": 489, "lr": 8.256522784425603e-06} +{"train_loss": 0.0005184016190469265, "global_step": 58245, "epoch": 489, "lr": 8.255303302876698e-06} +{"train_loss": 0.0005558048724196851, "global_step": 58246, "epoch": 489, "lr": 8.254083903289033e-06} +{"train_loss": 0.0005853152251802385, "global_step": 58247, "epoch": 489, "lr": 8.252864585665033e-06} +{"train_loss": 0.0004592108307406306, "global_step": 58248, "epoch": 489, "lr": 8.251645350007054e-06} +{"train_loss": 0.00068471027771011, "global_step": 58249, "epoch": 489, "lr": 8.250426196317528e-06} +{"train_loss": 0.0005318447365425527, "global_step": 58250, "epoch": 489, "lr": 8.249207124598812e-06} +{"train_loss": 0.0002557459520176053, "global_step": 58251, "epoch": 489, "lr": 8.247988134853329e-06} +{"train_loss": 0.0006542355404235423, "global_step": 58252, "epoch": 489, "lr": 8.246769227083455e-06} +{"train_loss": 0.0002810792066156864, "global_step": 58253, "epoch": 489, "lr": 8.245550401291596e-06} +{"train_loss": 0.0006381268030963838, "global_step": 58254, "epoch": 489, "lr": 8.244331657480126e-06} +{"train_loss": 0.0005956402164883912, "global_step": 58255, "epoch": 489, "lr": 8.243112995651465e-06} +{"train_loss": 0.0002879699459299445, "global_step": 58256, "epoch": 489, "lr": 8.241894415807988e-06} +{"train_loss": 0.00036364648258313537, "global_step": 58257, "epoch": 489, "lr": 8.240675917952079e-06} +{"train_loss": 0.0007138639921322465, "global_step": 58258, "epoch": 489, "lr": 8.239457502086156e-06} +{"train_loss": 0.0003328359453007579, "global_step": 58259, "epoch": 489, "lr": 8.23823916821258e-06} +{"train_loss": 0.00047273284872062504, "global_step": 58260, "epoch": 489, "lr": 8.237020916333777e-06} +{"train_loss": 0.0005801981315016747, "global_step": 58261, "epoch": 489, "lr": 8.235802746452115e-06} +{"train_loss": 0.00035749710514210165, "global_step": 58262, "epoch": 489, "lr": 8.234584658569982e-06} +{"train_loss": 0.0006515450659208, "global_step": 58263, "epoch": 489, "lr": 8.233366652689794e-06} +{"train_loss": 0.0005313805304467678, "global_step": 58264, "epoch": 489, "lr": 8.23214872881392e-06} +{"train_loss": 0.0006166723906062543, "global_step": 58265, "epoch": 489, "lr": 8.230930886944765e-06} +{"train_loss": 0.00035165625740773976, "global_step": 58266, "epoch": 489, "lr": 8.22971312708471e-06} +{"train_loss": 0.0003372634237166494, "global_step": 58267, "epoch": 489, "lr": 8.228495449236157e-06} +{"train_loss": 0.00032395319431088865, "global_step": 58268, "epoch": 489, "lr": 8.227277853401494e-06} +{"train_loss": 0.0009008419001474977, "global_step": 58269, "epoch": 489, "lr": 8.22606033958309e-06} +{"train_loss": 0.00037371349753811955, "global_step": 58270, "epoch": 489, "lr": 8.224842907783376e-06} +{"train_loss": 0.00046826250036247075, "global_step": 58271, "epoch": 489, "lr": 8.2236255580047e-06} +{"train_loss": 0.0004360632156021893, "global_step": 58272, "epoch": 489, "lr": 8.22240829024949e-06} +{"train_loss": 0.00043303362326696515, "global_step": 58273, "epoch": 489, "lr": 8.221191104520109e-06} +{"train_loss": 0.0003066682838834822, "global_step": 58274, "epoch": 489, "lr": 8.219974000818954e-06} +{"train_loss": 0.0004976748023182154, "global_step": 58275, "epoch": 489, "lr": 8.218756979148423e-06} +{"train_loss": 0.00035781582118943334, "global_step": 58276, "epoch": 489, "lr": 8.217540039510885e-06} +{"train_loss": 0.0004399063182063401, "global_step": 58277, "epoch": 489, "lr": 8.216323181908758e-06} +{"train_loss": 0.00031004881020635366, "global_step": 58278, "epoch": 489, "lr": 8.215106406344402e-06} +{"train_loss": 0.00025373438256792724, "global_step": 58279, "epoch": 489, "lr": 8.213889712820227e-06} +{"train_loss": 0.00023081025574356318, "global_step": 58280, "epoch": 489, "lr": 8.212673101338625e-06} +{"train_loss": 0.0006832793005742133, "global_step": 58281, "epoch": 489, "lr": 8.211456571901959e-06} +{"train_loss": 0.0007765077752992511, "global_step": 58282, "epoch": 489, "lr": 8.210240124512646e-06} +{"train_loss": 0.0004123403923586011, "global_step": 58283, "epoch": 489, "lr": 8.20902375917305e-06} +{"train_loss": 0.0003877439594361931, "global_step": 58284, "epoch": 489, "lr": 8.207807475885587e-06} +{"train_loss": 0.0004847103264182806, "global_step": 58285, "epoch": 489, "lr": 8.20659127465262e-06} +{"train_loss": 0.0007080046343617141, "global_step": 58286, "epoch": 489, "lr": 8.205375155476553e-06} +{"train_loss": 0.0012023154413327575, "global_step": 58287, "epoch": 489, "lr": 8.204159118359767e-06} +{"train_loss": 0.00028580607613548636, "global_step": 58288, "epoch": 489, "lr": 8.202943163304634e-06} +{"train_loss": 0.00038350498653016984, "global_step": 58289, "epoch": 489, "lr": 8.201727290313572e-06} +{"train_loss": 0.0004039103223476559, "global_step": 58290, "epoch": 489, "lr": 8.20051149938894e-06} +{"train_loss": 0.0006340981344692409, "global_step": 58291, "epoch": 489, "lr": 8.199295790533152e-06} +{"train_loss": 0.0004379874444566667, "global_step": 58292, "epoch": 489, "lr": 8.198080163748584e-06} +{"train_loss": 0.0005338268238119781, "global_step": 58293, "epoch": 489, "lr": 8.196864619037603e-06} +{"train_loss": 0.0007313717505894601, "global_step": 58294, "epoch": 489, "lr": 8.195649156402624e-06} +{"train_loss": 0.0015619059558957815, "global_step": 58295, "epoch": 489, "lr": 8.19443377584601e-06} +{"train_loss": 0.0003211390576325357, "global_step": 58296, "epoch": 489, "lr": 8.193218477370173e-06} +{"train_loss": 0.0003944384807255119, "global_step": 58297, "epoch": 489, "lr": 8.192003260977472e-06} +{"train_loss": 0.0003150803968310356, "global_step": 58298, "epoch": 489, "lr": 8.190788126670318e-06} +{"train_loss": 0.0005043562850914896, "global_step": 58299, "epoch": 489, "lr": 8.189573074451084e-06} +{"train_loss": 0.00039477137033827603, "global_step": 58300, "epoch": 489, "lr": 8.188358104322148e-06} +{"train_loss": 0.000802052381914109, "global_step": 58301, "epoch": 489, "lr": 8.187143216285913e-06} +{"train_loss": 0.0004891559947282076, "global_step": 58302, "epoch": 489, "lr": 8.185928410344746e-06} +{"train_loss": 0.0006415607640519738, "global_step": 58303, "epoch": 489, "lr": 8.18471368650105e-06} +{"train_loss": 0.0005238222656771541, "global_step": 58304, "epoch": 489, "lr": 8.183499044757186e-06} +{"train_loss": 0.00037926118238829076, "global_step": 58305, "epoch": 489, "lr": 8.182284485115572e-06} +{"train_loss": 0.0007202778360806406, "global_step": 58306, "epoch": 489, "lr": 8.181070007578573e-06} +{"train_loss": 0.0008642468601465225, "global_step": 58307, "epoch": 489, "lr": 8.179855612148568e-06} +{"train_loss": 0.00042970135109499097, "global_step": 58308, "epoch": 489, "lr": 8.178641298827956e-06} +{"train_loss": 0.0005030119412543424, "global_step": 58309, "epoch": 489, "lr": 8.177427067619104e-06, "val_loss": 0.026072189211845398} +{"train_loss": 0.0005975304520688951, "global_step": 58310, "epoch": 490, "lr": 8.176212918524411e-06} +{"train_loss": 0.00033969947253353894, "global_step": 58311, "epoch": 490, "lr": 8.17499885154625e-06} +{"train_loss": 0.0005874198977835476, "global_step": 58312, "epoch": 490, "lr": 8.173784866687023e-06} +{"train_loss": 0.0004833560378756374, "global_step": 58313, "epoch": 490, "lr": 8.17257096394909e-06} +{"train_loss": 0.00032362816273234785, "global_step": 58314, "epoch": 490, "lr": 8.171357143334841e-06} +{"train_loss": 0.00033173509291373193, "global_step": 58315, "epoch": 490, "lr": 8.170143404846676e-06} +{"train_loss": 0.0005640272283926606, "global_step": 58316, "epoch": 490, "lr": 8.168929748486954e-06} +{"train_loss": 0.0006638261256739497, "global_step": 58317, "epoch": 490, "lr": 8.167716174258083e-06} +{"train_loss": 0.0008401992963626981, "global_step": 58318, "epoch": 490, "lr": 8.16650268216243e-06} +{"train_loss": 0.00042883239802904427, "global_step": 58319, "epoch": 490, "lr": 8.16528927220237e-06} +{"train_loss": 0.0004077058983966708, "global_step": 58320, "epoch": 490, "lr": 8.164075944380306e-06} +{"train_loss": 0.00040814009844325483, "global_step": 58321, "epoch": 490, "lr": 8.162862698698598e-06} +{"train_loss": 0.0005643132608383894, "global_step": 58322, "epoch": 490, "lr": 8.161649535159648e-06} +{"train_loss": 0.00041520045488141477, "global_step": 58323, "epoch": 490, "lr": 8.160436453765835e-06} +{"train_loss": 0.00044557341607287526, "global_step": 58324, "epoch": 490, "lr": 8.15922345451952e-06} +{"train_loss": 0.0005007847212255001, "global_step": 58325, "epoch": 490, "lr": 8.158010537423116e-06} +{"train_loss": 0.0005975830135867, "global_step": 58326, "epoch": 490, "lr": 8.156797702478968e-06} +{"train_loss": 0.0004381508915685117, "global_step": 58327, "epoch": 490, "lr": 8.155584949689498e-06} +{"train_loss": 0.0009881845908239484, "global_step": 58328, "epoch": 490, "lr": 8.154372279057049e-06} +{"train_loss": 0.00048386017442680895, "global_step": 58329, "epoch": 490, "lr": 8.153159690584034e-06} +{"train_loss": 0.0003176203172188252, "global_step": 58330, "epoch": 490, "lr": 8.151947184272818e-06} +{"train_loss": 0.0005996960680931807, "global_step": 58331, "epoch": 490, "lr": 8.150734760125772e-06} +{"train_loss": 0.00039742907392792404, "global_step": 58332, "epoch": 490, "lr": 8.149522418145294e-06} +{"train_loss": 0.00039746047696098685, "global_step": 58333, "epoch": 490, "lr": 8.14831015833375e-06} +{"train_loss": 0.0003736339567694813, "global_step": 58334, "epoch": 490, "lr": 8.14709798069354e-06} +{"train_loss": 0.0004604794376064092, "global_step": 58335, "epoch": 490, "lr": 8.145885885227023e-06} +{"train_loss": 0.00021843363356310874, "global_step": 58336, "epoch": 490, "lr": 8.144673871936593e-06} +{"train_loss": 0.0006693977047689259, "global_step": 58337, "epoch": 490, "lr": 8.143461940824632e-06} +{"train_loss": 0.0007577181095257401, "global_step": 58338, "epoch": 490, "lr": 8.142250091893495e-06} +{"train_loss": 0.0006493354449048638, "global_step": 58339, "epoch": 490, "lr": 8.141038325145589e-06} +{"train_loss": 0.00040069405804388225, "global_step": 58340, "epoch": 490, "lr": 8.13982664058327e-06} +{"train_loss": 0.0003399859124328941, "global_step": 58341, "epoch": 490, "lr": 8.138615038208946e-06} +{"train_loss": 0.000345405685948208, "global_step": 58342, "epoch": 490, "lr": 8.13740351802496e-06} +{"train_loss": 0.0004151832254137844, "global_step": 58343, "epoch": 490, "lr": 8.136192080033727e-06} +{"train_loss": 0.0003660139045678079, "global_step": 58344, "epoch": 490, "lr": 8.134980724237594e-06} +{"train_loss": 0.0005418463842943311, "global_step": 58345, "epoch": 490, "lr": 8.133769450638967e-06} +{"train_loss": 0.0004390563117340207, "global_step": 58346, "epoch": 490, "lr": 8.132558259240203e-06} +{"train_loss": 0.0002539138658903539, "global_step": 58347, "epoch": 490, "lr": 8.131347150043694e-06} +{"train_loss": 0.0004563563852570951, "global_step": 58348, "epoch": 490, "lr": 8.130136123051802e-06} +{"train_loss": 0.0008635781705379486, "global_step": 58349, "epoch": 490, "lr": 8.128925178266928e-06} +{"train_loss": 0.0003310859901830554, "global_step": 58350, "epoch": 490, "lr": 8.12771431569142e-06} +{"train_loss": 0.0005229992093518376, "global_step": 58351, "epoch": 490, "lr": 8.12650353532769e-06} +{"train_loss": 0.0005267890519462526, "global_step": 58352, "epoch": 490, "lr": 8.125292837178078e-06} +{"train_loss": 0.0009753737831488252, "global_step": 58353, "epoch": 490, "lr": 8.124082221244994e-06} +{"train_loss": 0.00047546386485919356, "global_step": 58354, "epoch": 490, "lr": 8.122871687530792e-06} +{"train_loss": 0.00027964863693341613, "global_step": 58355, "epoch": 490, "lr": 8.121661236037864e-06} +{"train_loss": 0.0009310349123552442, "global_step": 58356, "epoch": 490, "lr": 8.120450866768586e-06} +{"train_loss": 0.00039897405076771975, "global_step": 58357, "epoch": 490, "lr": 8.119240579725312e-06} +{"train_loss": 0.0002021524269366637, "global_step": 58358, "epoch": 490, "lr": 8.118030374910451e-06} +{"train_loss": 0.0003173117293044925, "global_step": 58359, "epoch": 490, "lr": 8.116820252326346e-06} +{"train_loss": 0.0006887399358674884, "global_step": 58360, "epoch": 490, "lr": 8.115610211975406e-06} +{"train_loss": 0.0003672254388220608, "global_step": 58361, "epoch": 490, "lr": 8.114400253859989e-06} +{"train_loss": 0.00044815268483944237, "global_step": 58362, "epoch": 490, "lr": 8.11319037798246e-06} +{"train_loss": 0.0002821560192387551, "global_step": 58363, "epoch": 490, "lr": 8.11198058434522e-06} +{"train_loss": 0.0007590489112772048, "global_step": 58364, "epoch": 490, "lr": 8.110770872950619e-06} +{"train_loss": 0.0007099948707036674, "global_step": 58365, "epoch": 490, "lr": 8.10956124380105e-06} +{"train_loss": 0.00039422421832568944, "global_step": 58366, "epoch": 490, "lr": 8.108351696898881e-06} +{"train_loss": 0.00032555597135797143, "global_step": 58367, "epoch": 490, "lr": 8.107142232246489e-06} +{"train_loss": 0.0004018397303298116, "global_step": 58368, "epoch": 490, "lr": 8.105932849846254e-06} +{"train_loss": 0.00030588440131396055, "global_step": 58369, "epoch": 490, "lr": 8.104723549700532e-06} +{"train_loss": 0.0005185685004107654, "global_step": 58370, "epoch": 490, "lr": 8.103514331811723e-06} +{"train_loss": 0.0003891145170200616, "global_step": 58371, "epoch": 490, "lr": 8.102305196182169e-06} +{"train_loss": 0.00048052496276795864, "global_step": 58372, "epoch": 490, "lr": 8.10109614281428e-06} +{"train_loss": 0.0013105871621519327, "global_step": 58373, "epoch": 490, "lr": 8.099887171710402e-06} +{"train_loss": 0.00047674126108177006, "global_step": 58374, "epoch": 490, "lr": 8.098678282872928e-06} +{"train_loss": 0.0007066779653541744, "global_step": 58375, "epoch": 490, "lr": 8.097469476304226e-06} +{"train_loss": 0.0004527707351371646, "global_step": 58376, "epoch": 490, "lr": 8.096260752006652e-06} +{"train_loss": 0.0003038126742467284, "global_step": 58377, "epoch": 490, "lr": 8.095052109982587e-06} +{"train_loss": 0.000418799405451864, "global_step": 58378, "epoch": 490, "lr": 8.093843550234432e-06} +{"train_loss": 0.0004702851874753833, "global_step": 58379, "epoch": 490, "lr": 8.092635072764521e-06} +{"train_loss": 0.0005280558252707124, "global_step": 58380, "epoch": 490, "lr": 8.091426677575254e-06} +{"train_loss": 0.0007456194143742323, "global_step": 58381, "epoch": 490, "lr": 8.090218364668989e-06} +{"train_loss": 0.00042803105316124856, "global_step": 58382, "epoch": 490, "lr": 8.089010134048108e-06} +{"train_loss": 0.00031959061743691564, "global_step": 58383, "epoch": 490, "lr": 8.087801985714965e-06} +{"train_loss": 0.00017196671979036182, "global_step": 58384, "epoch": 490, "lr": 8.086593919671964e-06} +{"train_loss": 0.0007302313460968435, "global_step": 58385, "epoch": 490, "lr": 8.085385935921441e-06} +{"train_loss": 0.0006861949223093688, "global_step": 58386, "epoch": 490, "lr": 8.0841780344658e-06} +{"train_loss": 0.00039896724047139287, "global_step": 58387, "epoch": 490, "lr": 8.082970215307395e-06} +{"train_loss": 0.00037616543704643846, "global_step": 58388, "epoch": 490, "lr": 8.08176247844859e-06} +{"train_loss": 0.0006919889128766954, "global_step": 58389, "epoch": 490, "lr": 8.080554823891773e-06} +{"train_loss": 0.000258611049503088, "global_step": 58390, "epoch": 490, "lr": 8.079347251639302e-06} +{"train_loss": 0.0003144791699014604, "global_step": 58391, "epoch": 490, "lr": 8.078139761693564e-06} +{"train_loss": 0.0006779291434213519, "global_step": 58392, "epoch": 490, "lr": 8.07693235405692e-06} +{"train_loss": 0.0005119884153828025, "global_step": 58393, "epoch": 490, "lr": 8.075725028731728e-06} +{"train_loss": 0.00044241390423849225, "global_step": 58394, "epoch": 490, "lr": 8.074517785720381e-06} +{"train_loss": 0.000688303669448942, "global_step": 58395, "epoch": 490, "lr": 8.073310625025232e-06} +{"train_loss": 0.00037370159407146275, "global_step": 58396, "epoch": 490, "lr": 8.072103546648669e-06} +{"train_loss": 0.00045482045970857143, "global_step": 58397, "epoch": 490, "lr": 8.070896550593037e-06} +{"train_loss": 0.00031792238587513566, "global_step": 58398, "epoch": 490, "lr": 8.069689636860734e-06} +{"train_loss": 0.00031304554431699216, "global_step": 58399, "epoch": 490, "lr": 8.068482805454114e-06} +{"train_loss": 0.0007748765638098121, "global_step": 58400, "epoch": 490, "lr": 8.067276056375539e-06} +{"train_loss": 0.00029827276011928916, "global_step": 58401, "epoch": 490, "lr": 8.066069389627396e-06} +{"train_loss": 0.0003820443816948682, "global_step": 58402, "epoch": 490, "lr": 8.064862805212036e-06} +{"train_loss": 0.00024232250871136785, "global_step": 58403, "epoch": 490, "lr": 8.06365630313185e-06} +{"train_loss": 0.00028566381661221385, "global_step": 58404, "epoch": 490, "lr": 8.062449883389184e-06} +{"train_loss": 0.0003873115638270974, "global_step": 58405, "epoch": 490, "lr": 8.061243545986424e-06} +{"train_loss": 0.00039953592931851745, "global_step": 58406, "epoch": 490, "lr": 8.060037290925938e-06} +{"train_loss": 0.0005269196117296815, "global_step": 58407, "epoch": 490, "lr": 8.05883111821007e-06} +{"train_loss": 0.00029160664416849613, "global_step": 58408, "epoch": 490, "lr": 8.057625027841227e-06} +{"train_loss": 0.0003286070714239031, "global_step": 58409, "epoch": 490, "lr": 8.056419019821736e-06} +{"train_loss": 0.0005467548035085201, "global_step": 58410, "epoch": 490, "lr": 8.055213094154001e-06} +{"train_loss": 0.0003070839447900653, "global_step": 58411, "epoch": 490, "lr": 8.054007250840363e-06} +{"train_loss": 0.00020683980255853385, "global_step": 58412, "epoch": 490, "lr": 8.052801489883199e-06} +{"train_loss": 0.0005199657753109932, "global_step": 58413, "epoch": 490, "lr": 8.05159581128489e-06} +{"train_loss": 0.00036840507527813315, "global_step": 58414, "epoch": 490, "lr": 8.050390215047777e-06} +{"train_loss": 0.0006547201774083078, "global_step": 58415, "epoch": 490, "lr": 8.049184701174255e-06} +{"train_loss": 0.0007890413980931044, "global_step": 58416, "epoch": 490, "lr": 8.047979269666667e-06} +{"train_loss": 0.0005744446534663439, "global_step": 58417, "epoch": 490, "lr": 8.046773920527396e-06} +{"train_loss": 0.00022829808585811406, "global_step": 58418, "epoch": 490, "lr": 8.045568653758806e-06} +{"train_loss": 0.0005031966720707715, "global_step": 58419, "epoch": 490, "lr": 8.044363469363247e-06} +{"train_loss": 0.0006730628083460033, "global_step": 58420, "epoch": 490, "lr": 8.043158367343112e-06} +{"train_loss": 0.00047072715824469924, "global_step": 58421, "epoch": 490, "lr": 8.041953347700743e-06} +{"train_loss": 0.00020381809736136347, "global_step": 58422, "epoch": 490, "lr": 8.040748410438526e-06} +{"train_loss": 0.00030170142417773604, "global_step": 58423, "epoch": 490, "lr": 8.039543555558804e-06} +{"train_loss": 0.0006990406545810401, "global_step": 58424, "epoch": 490, "lr": 8.038338783063965e-06} +{"train_loss": 0.0007272381917573512, "global_step": 58425, "epoch": 490, "lr": 8.037134092956366e-06} +{"train_loss": 0.000617613026406616, "global_step": 58426, "epoch": 490, "lr": 8.035929485238363e-06} +{"train_loss": 0.000891979958396405, "global_step": 58427, "epoch": 490, "lr": 8.034724959912337e-06} +{"train_loss": 0.00048553192999777425, "global_step": 58428, "epoch": 490, "lr": 8.033520516980637e-06, "val_loss": 0.02744932286441326, "train_action_mse_error": 5.826873803016497e-06} +{"train_loss": 0.0005108434124849737, "global_step": 58429, "epoch": 491, "lr": 8.032316156445647e-06} +{"train_loss": 0.00022613725741393864, "global_step": 58430, "epoch": 491, "lr": 8.031111878309717e-06} +{"train_loss": 0.0005121871363371611, "global_step": 58431, "epoch": 491, "lr": 8.029907682575205e-06} +{"train_loss": 0.0003587055834941566, "global_step": 58432, "epoch": 491, "lr": 8.0287035692445e-06} +{"train_loss": 0.00031063315691426396, "global_step": 58433, "epoch": 491, "lr": 8.027499538319938e-06} +{"train_loss": 0.00040129281114786863, "global_step": 58434, "epoch": 491, "lr": 8.026295589803906e-06} +{"train_loss": 0.00041190089541487396, "global_step": 58435, "epoch": 491, "lr": 8.025091723698747e-06} +{"train_loss": 0.0003980470937676728, "global_step": 58436, "epoch": 491, "lr": 8.023887940006852e-06} +{"train_loss": 0.0005283053615130484, "global_step": 58437, "epoch": 491, "lr": 8.022684238730566e-06} +{"train_loss": 0.0004355036944616586, "global_step": 58438, "epoch": 491, "lr": 8.021480619872241e-06} +{"train_loss": 0.00036078793345950544, "global_step": 58439, "epoch": 491, "lr": 8.020277083434269e-06} +{"train_loss": 0.0003890465304721147, "global_step": 58440, "epoch": 491, "lr": 8.019073629418982e-06} +{"train_loss": 0.0002513190556783229, "global_step": 58441, "epoch": 491, "lr": 8.01787025782878e-06} +{"train_loss": 0.0004688833432737738, "global_step": 58442, "epoch": 491, "lr": 8.016666968665987e-06} +{"train_loss": 0.0007835695287212729, "global_step": 58443, "epoch": 491, "lr": 8.01546376193299e-06} +{"train_loss": 0.0007401934126392007, "global_step": 58444, "epoch": 491, "lr": 8.014260637632136e-06} +{"train_loss": 0.0002004322741413489, "global_step": 58445, "epoch": 491, "lr": 8.013057595765811e-06} +{"train_loss": 0.0007711011567153037, "global_step": 58446, "epoch": 491, "lr": 8.011854636336347e-06} +{"train_loss": 0.00028541075880639255, "global_step": 58447, "epoch": 491, "lr": 8.010651759346122e-06} +{"train_loss": 0.0003465992340352386, "global_step": 58448, "epoch": 491, "lr": 8.009448964797511e-06} +{"train_loss": 0.0002859228989109397, "global_step": 58449, "epoch": 491, "lr": 8.008246252692859e-06} +{"train_loss": 0.0005330254789441824, "global_step": 58450, "epoch": 491, "lr": 8.007043623034516e-06} +{"train_loss": 0.00029534584609791636, "global_step": 58451, "epoch": 491, "lr": 8.005841075824866e-06} +{"train_loss": 0.00032799868495203555, "global_step": 58452, "epoch": 491, "lr": 8.004638611066251e-06} +{"train_loss": 0.0004508997080847621, "global_step": 58453, "epoch": 491, "lr": 8.003436228761051e-06} +{"train_loss": 0.0004571115132421255, "global_step": 58454, "epoch": 491, "lr": 8.002233928911612e-06} +{"train_loss": 0.00035474091419018805, "global_step": 58455, "epoch": 491, "lr": 8.001031711520307e-06} +{"train_loss": 0.0008707136148586869, "global_step": 58456, "epoch": 491, "lr": 7.99982957658949e-06} +{"train_loss": 0.00047995481872931123, "global_step": 58457, "epoch": 491, "lr": 7.99862752412151e-06} +{"train_loss": 0.00033971815719269216, "global_step": 58458, "epoch": 491, "lr": 7.997425554118748e-06} +{"train_loss": 0.0003629018901847303, "global_step": 58459, "epoch": 491, "lr": 7.996223666583541e-06} +{"train_loss": 0.0002578955318313092, "global_step": 58460, "epoch": 491, "lr": 7.995021861518276e-06} +{"train_loss": 0.0005845861742272973, "global_step": 58461, "epoch": 491, "lr": 7.993820138925295e-06} +{"train_loss": 0.00027345327544026077, "global_step": 58462, "epoch": 491, "lr": 7.992618498806953e-06} +{"train_loss": 0.0005745731177739799, "global_step": 58463, "epoch": 491, "lr": 7.991416941165624e-06} +{"train_loss": 0.0015029446221888065, "global_step": 58464, "epoch": 491, "lr": 7.990215466003647e-06} +{"train_loss": 0.000879517407156527, "global_step": 58465, "epoch": 491, "lr": 7.989014073323415e-06} +{"train_loss": 0.0006690263980999589, "global_step": 58466, "epoch": 491, "lr": 7.987812763127245e-06} +{"train_loss": 0.00032417240436188877, "global_step": 58467, "epoch": 491, "lr": 7.986611535417526e-06} +{"train_loss": 0.000438384129665792, "global_step": 58468, "epoch": 491, "lr": 7.985410390196612e-06} +{"train_loss": 0.00038573233177885413, "global_step": 58469, "epoch": 491, "lr": 7.984209327466846e-06} +{"train_loss": 0.000253509875619784, "global_step": 58470, "epoch": 491, "lr": 7.983008347230603e-06} +{"train_loss": 0.00029282280593179166, "global_step": 58471, "epoch": 491, "lr": 7.981807449490225e-06} +{"train_loss": 0.000803206698037684, "global_step": 58472, "epoch": 491, "lr": 7.980606634248094e-06} +{"train_loss": 0.00032574537908658385, "global_step": 58473, "epoch": 491, "lr": 7.979405901506536e-06} +{"train_loss": 0.00025978987105190754, "global_step": 58474, "epoch": 491, "lr": 7.97820525126794e-06} +{"train_loss": 0.00021055994147900492, "global_step": 58475, "epoch": 491, "lr": 7.977004683534634e-06} +{"train_loss": 0.0004737636772915721, "global_step": 58476, "epoch": 491, "lr": 7.975804198309005e-06} +{"train_loss": 0.0005084807053208351, "global_step": 58477, "epoch": 491, "lr": 7.974603795593383e-06} +{"train_loss": 0.00040356229874305427, "global_step": 58478, "epoch": 491, "lr": 7.973403475390146e-06} +{"train_loss": 0.00018454388191457838, "global_step": 58479, "epoch": 491, "lr": 7.97220323770163e-06} +{"train_loss": 0.0003522641200106591, "global_step": 58480, "epoch": 491, "lr": 7.971003082530215e-06} +{"train_loss": 0.0005086680175736547, "global_step": 58481, "epoch": 491, "lr": 7.969803009878235e-06} +{"train_loss": 0.0006078016012907028, "global_step": 58482, "epoch": 491, "lr": 7.968603019748067e-06} +{"train_loss": 0.000641311053186655, "global_step": 58483, "epoch": 491, "lr": 7.967403112142042e-06} +{"train_loss": 0.0005378230707719922, "global_step": 58484, "epoch": 491, "lr": 7.966203287062546e-06} +{"train_loss": 0.00030348822474479675, "global_step": 58485, "epoch": 491, "lr": 7.965003544511907e-06} +{"train_loss": 0.0006676180637441576, "global_step": 58486, "epoch": 491, "lr": 7.963803884492505e-06} +{"train_loss": 0.00034916208824142814, "global_step": 58487, "epoch": 491, "lr": 7.962604307006682e-06} +{"train_loss": 0.0004070866561960429, "global_step": 58488, "epoch": 491, "lr": 7.961404812056782e-06} +{"train_loss": 0.0001938342466019094, "global_step": 58489, "epoch": 491, "lr": 7.960205399645182e-06} +{"train_loss": 0.00048613749095238745, "global_step": 58490, "epoch": 491, "lr": 7.959006069774221e-06} +{"train_loss": 0.00024794292403385043, "global_step": 58491, "epoch": 491, "lr": 7.957806822446268e-06} +{"train_loss": 0.00044392404379323125, "global_step": 58492, "epoch": 491, "lr": 7.956607657663662e-06} +{"train_loss": 0.0002082365972455591, "global_step": 58493, "epoch": 491, "lr": 7.955408575428774e-06} +{"train_loss": 0.0006267960416153073, "global_step": 58494, "epoch": 491, "lr": 7.954209575743948e-06} +{"train_loss": 0.0007171054021455348, "global_step": 58495, "epoch": 491, "lr": 7.953010658611531e-06} +{"train_loss": 0.0002274087310070172, "global_step": 58496, "epoch": 491, "lr": 7.9518118240339e-06} +{"train_loss": 0.0002414286573184654, "global_step": 58497, "epoch": 491, "lr": 7.950613072013374e-06} +{"train_loss": 0.0004404516366776079, "global_step": 58498, "epoch": 491, "lr": 7.949414402552346e-06} +{"train_loss": 0.0005114278756082058, "global_step": 58499, "epoch": 491, "lr": 7.948215815653149e-06} +{"train_loss": 0.0003237332566641271, "global_step": 58500, "epoch": 491, "lr": 7.947017311318122e-06} +{"train_loss": 0.00018510954396333545, "global_step": 58501, "epoch": 491, "lr": 7.94581888954965e-06} +{"train_loss": 0.0003034386900253594, "global_step": 58502, "epoch": 491, "lr": 7.944620550350057e-06} +{"train_loss": 0.000380947400117293, "global_step": 58503, "epoch": 491, "lr": 7.94342229372172e-06} +{"train_loss": 0.0009663569508120418, "global_step": 58504, "epoch": 491, "lr": 7.942224119666964e-06} +{"train_loss": 0.0005155757535248995, "global_step": 58505, "epoch": 491, "lr": 7.941026028188176e-06} +{"train_loss": 0.00041647834586910903, "global_step": 58506, "epoch": 491, "lr": 7.939828019287687e-06} +{"train_loss": 0.0002825419360306114, "global_step": 58507, "epoch": 491, "lr": 7.938630092967842e-06} +{"train_loss": 0.0002806257107295096, "global_step": 58508, "epoch": 491, "lr": 7.937432249231002e-06} +{"train_loss": 0.0004797043511644006, "global_step": 58509, "epoch": 491, "lr": 7.93623448807953e-06} +{"train_loss": 0.00052403419977054, "global_step": 58510, "epoch": 491, "lr": 7.935036809515762e-06} +{"train_loss": 0.0004781616444233805, "global_step": 58511, "epoch": 491, "lr": 7.93383921354206e-06} +{"train_loss": 0.0008169157081283629, "global_step": 58512, "epoch": 491, "lr": 7.932641700160764e-06} +{"train_loss": 0.00044421787606552243, "global_step": 58513, "epoch": 491, "lr": 7.931444269374238e-06} +{"train_loss": 0.0005685027572326362, "global_step": 58514, "epoch": 491, "lr": 7.93024692118482e-06} +{"train_loss": 0.0003753741621039808, "global_step": 58515, "epoch": 491, "lr": 7.929049655594877e-06} +{"train_loss": 0.0003055960114579648, "global_step": 58516, "epoch": 491, "lr": 7.92785247260674e-06} +{"train_loss": 0.0004659655096475035, "global_step": 58517, "epoch": 491, "lr": 7.926655372222779e-06} +{"train_loss": 0.0004614796780515462, "global_step": 58518, "epoch": 491, "lr": 7.925458354445342e-06} +{"train_loss": 0.0004479355120565742, "global_step": 58519, "epoch": 491, "lr": 7.924261419276757e-06} +{"train_loss": 0.0006706839194521308, "global_step": 58520, "epoch": 491, "lr": 7.923064566719396e-06} +{"train_loss": 0.00034544902155175805, "global_step": 58521, "epoch": 491, "lr": 7.9218677967756e-06} +{"train_loss": 0.0004126409476157278, "global_step": 58522, "epoch": 491, "lr": 7.920671109447725e-06} +{"train_loss": 0.0006761263939552009, "global_step": 58523, "epoch": 491, "lr": 7.919474504738112e-06} +{"train_loss": 0.0002352750743739307, "global_step": 58524, "epoch": 491, "lr": 7.91827798264912e-06} +{"train_loss": 0.00031690773903392255, "global_step": 58525, "epoch": 491, "lr": 7.917081543183097e-06} +{"train_loss": 0.0004692391084972769, "global_step": 58526, "epoch": 491, "lr": 7.915885186342375e-06} +{"train_loss": 0.0005309233674779534, "global_step": 58527, "epoch": 491, "lr": 7.914688912129331e-06} +{"train_loss": 0.0003664804098661989, "global_step": 58528, "epoch": 491, "lr": 7.913492720546284e-06} +{"train_loss": 0.0003653789171949029, "global_step": 58529, "epoch": 491, "lr": 7.912296611595616e-06} +{"train_loss": 0.0006013073725625873, "global_step": 58530, "epoch": 491, "lr": 7.911100585279652e-06} +{"train_loss": 0.00033880575210787356, "global_step": 58531, "epoch": 491, "lr": 7.909904641600735e-06} +{"train_loss": 0.000636972370557487, "global_step": 58532, "epoch": 491, "lr": 7.90870878056123e-06} +{"train_loss": 0.000584586407057941, "global_step": 58533, "epoch": 491, "lr": 7.907513002163475e-06} +{"train_loss": 0.000255470717092976, "global_step": 58534, "epoch": 491, "lr": 7.906317306409827e-06} +{"train_loss": 0.0006038963911123574, "global_step": 58535, "epoch": 491, "lr": 7.90512169330262e-06} +{"train_loss": 0.00038730475353077054, "global_step": 58536, "epoch": 491, "lr": 7.903926162844222e-06} +{"train_loss": 0.0003121192567050457, "global_step": 58537, "epoch": 491, "lr": 7.902730715036966e-06} +{"train_loss": 0.0005625025369226933, "global_step": 58538, "epoch": 491, "lr": 7.901535349883188e-06} +{"train_loss": 0.0006593322614207864, "global_step": 58539, "epoch": 491, "lr": 7.90034006738526e-06} +{"train_loss": 0.00020217882411088794, "global_step": 58540, "epoch": 491, "lr": 7.899144867545504e-06} +{"train_loss": 0.00039914119406603277, "global_step": 58541, "epoch": 491, "lr": 7.89794975036629e-06} +{"train_loss": 0.0003496644785627723, "global_step": 58542, "epoch": 491, "lr": 7.896754715849947e-06} +{"train_loss": 0.00022739545966032892, "global_step": 58543, "epoch": 491, "lr": 7.895559763998833e-06} +{"train_loss": 0.00037002822500653565, "global_step": 58544, "epoch": 491, "lr": 7.894364894815282e-06} +{"train_loss": 0.00034509648685343564, "global_step": 58545, "epoch": 491, "lr": 7.893170108301645e-06} +{"train_loss": 0.00026015492039732635, "global_step": 58546, "epoch": 491, "lr": 7.891975404460284e-06} +{"train_loss": 0.0004437296842557511, "global_step": 58547, "epoch": 491, "lr": 7.890780783293523e-06, "val_loss": 0.04545079916715622} +{"train_loss": 0.0005544103914871812, "global_step": 58548, "epoch": 492, "lr": 7.889586244803721e-06} +{"train_loss": 0.0006671045557595789, "global_step": 58549, "epoch": 492, "lr": 7.888391788993216e-06} +{"train_loss": 0.0006517905276268721, "global_step": 58550, "epoch": 492, "lr": 7.887197415864344e-06} +{"train_loss": 0.0005385228432714939, "global_step": 58551, "epoch": 492, "lr": 7.886003125419478e-06} +{"train_loss": 0.00027194712311029434, "global_step": 58552, "epoch": 492, "lr": 7.884808917660929e-06} +{"train_loss": 0.0003579572367016226, "global_step": 58553, "epoch": 492, "lr": 7.88361479259107e-06} +{"train_loss": 0.00041104049887508154, "global_step": 58554, "epoch": 492, "lr": 7.882420750212222e-06} +{"train_loss": 0.0006567946402356029, "global_step": 58555, "epoch": 492, "lr": 7.881226790526757e-06} +{"train_loss": 0.0004939627833664417, "global_step": 58556, "epoch": 492, "lr": 7.880032913537e-06} +{"train_loss": 0.0005094073712825775, "global_step": 58557, "epoch": 492, "lr": 7.878839119245285e-06} +{"train_loss": 0.000390835280995816, "global_step": 58558, "epoch": 492, "lr": 7.877645407653988e-06} +{"train_loss": 0.00015956436982378364, "global_step": 58559, "epoch": 492, "lr": 7.876451778765415e-06} +{"train_loss": 0.0007686408935114741, "global_step": 58560, "epoch": 492, "lr": 7.875258232581945e-06} +{"train_loss": 0.00026719222660176456, "global_step": 58561, "epoch": 492, "lr": 7.874064769105894e-06} +{"train_loss": 0.000429368345066905, "global_step": 58562, "epoch": 492, "lr": 7.872871388339625e-06} +{"train_loss": 0.0004120727826375514, "global_step": 58563, "epoch": 492, "lr": 7.871678090285473e-06} +{"train_loss": 0.00033401435939595103, "global_step": 58564, "epoch": 492, "lr": 7.870484874945766e-06} +{"train_loss": 0.00024336525530088693, "global_step": 58565, "epoch": 492, "lr": 7.869291742322876e-06} +{"train_loss": 0.000421484699472785, "global_step": 58566, "epoch": 492, "lr": 7.868098692419119e-06} +{"train_loss": 0.00038576399674639106, "global_step": 58567, "epoch": 492, "lr": 7.866905725236861e-06} +{"train_loss": 0.0002782015362754464, "global_step": 58568, "epoch": 492, "lr": 7.865712840778433e-06} +{"train_loss": 0.0006706571439281106, "global_step": 58569, "epoch": 492, "lr": 7.864520039046164e-06} +{"train_loss": 0.00044572772458195686, "global_step": 58570, "epoch": 492, "lr": 7.86332732004242e-06} +{"train_loss": 0.0004597681690938771, "global_step": 58571, "epoch": 492, "lr": 7.862134683769517e-06} +{"train_loss": 0.0005646829959005117, "global_step": 58572, "epoch": 492, "lr": 7.860942130229826e-06} +{"train_loss": 0.0003888576466124505, "global_step": 58573, "epoch": 492, "lr": 7.859749659425659e-06} +{"train_loss": 0.0003180764033459127, "global_step": 58574, "epoch": 492, "lr": 7.858557271359385e-06} +{"train_loss": 0.0005835244664922357, "global_step": 58575, "epoch": 492, "lr": 7.857364966033321e-06} +{"train_loss": 0.0004799630260095, "global_step": 58576, "epoch": 492, "lr": 7.85617274344983e-06} +{"train_loss": 0.0004582024703267962, "global_step": 58577, "epoch": 492, "lr": 7.854980603611229e-06} +{"train_loss": 0.0005823338287882507, "global_step": 58578, "epoch": 492, "lr": 7.85378854651988e-06} +{"train_loss": 0.0004245942400302738, "global_step": 58579, "epoch": 492, "lr": 7.852596572178105e-06} +{"train_loss": 0.00045141324517317116, "global_step": 58580, "epoch": 492, "lr": 7.851404680588264e-06} +{"train_loss": 0.0004088607965968549, "global_step": 58581, "epoch": 492, "lr": 7.850212871752676e-06} +{"train_loss": 0.0005034859059378505, "global_step": 58582, "epoch": 492, "lr": 7.849021145673707e-06} +{"train_loss": 0.0003281011595390737, "global_step": 58583, "epoch": 492, "lr": 7.847829502353666e-06} +{"train_loss": 0.00030939740827307105, "global_step": 58584, "epoch": 492, "lr": 7.84663794179492e-06} +{"train_loss": 0.00023990795307327062, "global_step": 58585, "epoch": 492, "lr": 7.845446463999789e-06} +{"train_loss": 0.0003878226852975786, "global_step": 58586, "epoch": 492, "lr": 7.844255068970629e-06} +{"train_loss": 0.0002890508621931076, "global_step": 58587, "epoch": 492, "lr": 7.843063756709774e-06} +{"train_loss": 0.000245191011345014, "global_step": 58588, "epoch": 492, "lr": 7.841872527219546e-06} +{"train_loss": 0.0005816129851154983, "global_step": 58589, "epoch": 492, "lr": 7.840681380502307e-06} +{"train_loss": 0.0006305652786977589, "global_step": 58590, "epoch": 492, "lr": 7.839490316560378e-06} +{"train_loss": 0.000598088838160038, "global_step": 58591, "epoch": 492, "lr": 7.838299335396116e-06} +{"train_loss": 0.0007652544882148504, "global_step": 58592, "epoch": 492, "lr": 7.837108437011831e-06} +{"train_loss": 0.000672346621286124, "global_step": 58593, "epoch": 492, "lr": 7.8359176214099e-06} +{"train_loss": 0.0005757830222137272, "global_step": 58594, "epoch": 492, "lr": 7.834726888592637e-06} +{"train_loss": 0.0006478754803538322, "global_step": 58595, "epoch": 492, "lr": 7.833536238562366e-06} +{"train_loss": 0.0005428465083241463, "global_step": 58596, "epoch": 492, "lr": 7.832345671321462e-06} +{"train_loss": 0.00032380965421907604, "global_step": 58597, "epoch": 492, "lr": 7.831155186872225e-06} +{"train_loss": 0.00024094662512652576, "global_step": 58598, "epoch": 492, "lr": 7.829964785217026e-06} +{"train_loss": 0.0005085264565423131, "global_step": 58599, "epoch": 492, "lr": 7.82877446635818e-06} +{"train_loss": 0.00038475406472571194, "global_step": 58600, "epoch": 492, "lr": 7.827584230298023e-06} +{"train_loss": 0.0003796883102040738, "global_step": 58601, "epoch": 492, "lr": 7.826394077038907e-06} +{"train_loss": 0.0005650093662552536, "global_step": 58602, "epoch": 492, "lr": 7.825204006583154e-06} +{"train_loss": 0.0006532057304866612, "global_step": 58603, "epoch": 492, "lr": 7.824014018933112e-06} +{"train_loss": 0.00041119297384284437, "global_step": 58604, "epoch": 492, "lr": 7.822824114091104e-06} +{"train_loss": 0.00029975190409459174, "global_step": 58605, "epoch": 492, "lr": 7.821634292059487e-06} +{"train_loss": 0.0003474815166555345, "global_step": 58606, "epoch": 492, "lr": 7.820444552840577e-06} +{"train_loss": 0.00040878079016692936, "global_step": 58607, "epoch": 492, "lr": 7.819254896436729e-06} +{"train_loss": 0.0006396540557034314, "global_step": 58608, "epoch": 492, "lr": 7.818065322850248e-06} +{"train_loss": 0.0003045703051611781, "global_step": 58609, "epoch": 492, "lr": 7.816875832083508e-06} +{"train_loss": 0.0008742691716179252, "global_step": 58610, "epoch": 492, "lr": 7.815686424138813e-06} +{"train_loss": 0.0005712589481845498, "global_step": 58611, "epoch": 492, "lr": 7.814497099018519e-06} +{"train_loss": 0.0003585090453270823, "global_step": 58612, "epoch": 492, "lr": 7.81330785672495e-06} +{"train_loss": 0.0002474991197232157, "global_step": 58613, "epoch": 492, "lr": 7.812118697260446e-06} +{"train_loss": 0.0006051675300113857, "global_step": 58614, "epoch": 492, "lr": 7.810929620627333e-06} +{"train_loss": 0.00040735179209150374, "global_step": 58615, "epoch": 492, "lr": 7.809740626827966e-06} +{"train_loss": 0.0006456554983742535, "global_step": 58616, "epoch": 492, "lr": 7.808551715864648e-06} +{"train_loss": 0.0004938815254718065, "global_step": 58617, "epoch": 492, "lr": 7.80736288773975e-06} +{"train_loss": 0.000558330852072686, "global_step": 58618, "epoch": 492, "lr": 7.80617414245558e-06} +{"train_loss": 0.0006151612033136189, "global_step": 58619, "epoch": 492, "lr": 7.80498548001447e-06} +{"train_loss": 0.0006642178050242364, "global_step": 58620, "epoch": 492, "lr": 7.80379690041878e-06} +{"train_loss": 0.00024406149168498814, "global_step": 58621, "epoch": 492, "lr": 7.802608403670807e-06} +{"train_loss": 0.0005993567174300551, "global_step": 58622, "epoch": 492, "lr": 7.801419989772923e-06} +{"train_loss": 0.0003608077531680465, "global_step": 58623, "epoch": 492, "lr": 7.80023165872743e-06} +{"train_loss": 0.0006369056063704193, "global_step": 58624, "epoch": 492, "lr": 7.799043410536683e-06} +{"train_loss": 0.00045914098154753447, "global_step": 58625, "epoch": 492, "lr": 7.797855245203006e-06} +{"train_loss": 0.0005904304562136531, "global_step": 58626, "epoch": 492, "lr": 7.796667162728721e-06} +{"train_loss": 0.0002898837556131184, "global_step": 58627, "epoch": 492, "lr": 7.795479163116182e-06} +{"train_loss": 0.0003446084738243371, "global_step": 58628, "epoch": 492, "lr": 7.794291246367696e-06} +{"train_loss": 0.0004366170905996114, "global_step": 58629, "epoch": 492, "lr": 7.793103412485631e-06} +{"train_loss": 0.0003357228997629136, "global_step": 58630, "epoch": 492, "lr": 7.791915661472288e-06} +{"train_loss": 0.000349659618223086, "global_step": 58631, "epoch": 492, "lr": 7.790727993330005e-06} +{"train_loss": 0.0006083998596295714, "global_step": 58632, "epoch": 492, "lr": 7.789540408061124e-06} +{"train_loss": 0.00034352560760453343, "global_step": 58633, "epoch": 492, "lr": 7.788352905667961e-06} +{"train_loss": 0.00037302784039638937, "global_step": 58634, "epoch": 492, "lr": 7.787165486152876e-06} +{"train_loss": 0.0003493906988296658, "global_step": 58635, "epoch": 492, "lr": 7.785978149518164e-06} +{"train_loss": 0.0007447824464179575, "global_step": 58636, "epoch": 492, "lr": 7.784790895766181e-06} +{"train_loss": 0.0004161655087955296, "global_step": 58637, "epoch": 492, "lr": 7.783603724899257e-06} +{"train_loss": 0.0004194224311504513, "global_step": 58638, "epoch": 492, "lr": 7.782416636919703e-06} +{"train_loss": 0.00043859591824002564, "global_step": 58639, "epoch": 492, "lr": 7.781229631829879e-06} +{"train_loss": 0.00044494157191365957, "global_step": 58640, "epoch": 492, "lr": 7.780042709632085e-06} +{"train_loss": 0.0003776377416215837, "global_step": 58641, "epoch": 492, "lr": 7.778855870328672e-06} +{"train_loss": 0.0003552085836417973, "global_step": 58642, "epoch": 492, "lr": 7.777669113921971e-06} +{"train_loss": 0.00015619541227351874, "global_step": 58643, "epoch": 492, "lr": 7.776482440414296e-06} +{"train_loss": 0.0003036301350221038, "global_step": 58644, "epoch": 492, "lr": 7.775295849807994e-06} +{"train_loss": 0.00033609403180889785, "global_step": 58645, "epoch": 492, "lr": 7.774109342105384e-06} +{"train_loss": 0.0005014676135033369, "global_step": 58646, "epoch": 492, "lr": 7.772922917308806e-06} +{"train_loss": 0.0006283984403125942, "global_step": 58647, "epoch": 492, "lr": 7.771736575420568e-06} +{"train_loss": 0.00041882655932568014, "global_step": 58648, "epoch": 492, "lr": 7.770550316443032e-06} +{"train_loss": 0.00036223625647835433, "global_step": 58649, "epoch": 492, "lr": 7.769364140378505e-06} +{"train_loss": 0.0005495036020874977, "global_step": 58650, "epoch": 492, "lr": 7.768178047229308e-06} +{"train_loss": 0.0007498307386413217, "global_step": 58651, "epoch": 492, "lr": 7.766992036997794e-06} +{"train_loss": 0.0004839136963710189, "global_step": 58652, "epoch": 492, "lr": 7.765806109686268e-06} +{"train_loss": 0.00035598024260252714, "global_step": 58653, "epoch": 492, "lr": 7.764620265297085e-06} +{"train_loss": 0.000510521000251174, "global_step": 58654, "epoch": 492, "lr": 7.76343450383254e-06} +{"train_loss": 0.0007024662918411195, "global_step": 58655, "epoch": 492, "lr": 7.762248825294993e-06} +{"train_loss": 0.00029470931622199714, "global_step": 58656, "epoch": 492, "lr": 7.76106322968676e-06} +{"train_loss": 0.0002967925393022597, "global_step": 58657, "epoch": 492, "lr": 7.759877717010156e-06} +{"train_loss": 0.00030319474171847105, "global_step": 58658, "epoch": 492, "lr": 7.758692287267526e-06} +{"train_loss": 0.0004895192687399685, "global_step": 58659, "epoch": 492, "lr": 7.757506940461179e-06} +{"train_loss": 0.0004754025430884212, "global_step": 58660, "epoch": 492, "lr": 7.75632167659347e-06} +{"train_loss": 0.0009490731754340231, "global_step": 58661, "epoch": 492, "lr": 7.755136495666698e-06} +{"train_loss": 0.00040403581806458533, "global_step": 58662, "epoch": 492, "lr": 7.753951397683212e-06} +{"train_loss": 0.00032638953416608274, "global_step": 58663, "epoch": 492, "lr": 7.752766382645331e-06} +{"train_loss": 0.0002914586802944541, "global_step": 58664, "epoch": 492, "lr": 7.751581450555368e-06} +{"train_loss": 0.0006285256240516901, "global_step": 58665, "epoch": 492, "lr": 7.750396601415671e-06} +{"train_loss": 0.00046076013487978925, "global_step": 58666, "epoch": 492, "lr": 7.749211835228547e-06, "val_loss": 0.029165906831622124} +{"train_loss": 0.0004882159410044551, "global_step": 58667, "epoch": 493, "lr": 7.74802715199634e-06} +{"train_loss": 0.0002878164523281157, "global_step": 58668, "epoch": 493, "lr": 7.746842551721373e-06} +{"train_loss": 0.0005120424320921302, "global_step": 58669, "epoch": 493, "lr": 7.745658034405951e-06} +{"train_loss": 0.00046434992691501975, "global_step": 58670, "epoch": 493, "lr": 7.744473600052427e-06} +{"train_loss": 0.0003984132199548185, "global_step": 58671, "epoch": 493, "lr": 7.743289248663104e-06} +{"train_loss": 0.0004412358975969255, "global_step": 58672, "epoch": 493, "lr": 7.742104980240333e-06} +{"train_loss": 0.00031519250478595495, "global_step": 58673, "epoch": 493, "lr": 7.74092079478641e-06} +{"train_loss": 0.00026090603205375373, "global_step": 58674, "epoch": 493, "lr": 7.739736692303684e-06} +{"train_loss": 0.00036223221104592085, "global_step": 58675, "epoch": 493, "lr": 7.738552672794458e-06} +{"train_loss": 0.00034252056502737105, "global_step": 58676, "epoch": 493, "lr": 7.737368736261074e-06} +{"train_loss": 0.0005198471480980515, "global_step": 58677, "epoch": 493, "lr": 7.73618488270586e-06} +{"train_loss": 0.0003625900426413864, "global_step": 58678, "epoch": 493, "lr": 7.735001112131118e-06} +{"train_loss": 0.0006139978650026023, "global_step": 58679, "epoch": 493, "lr": 7.733817424539197e-06} +{"train_loss": 0.0005491962074302137, "global_step": 58680, "epoch": 493, "lr": 7.732633819932406e-06} +{"train_loss": 0.0007477879989892244, "global_step": 58681, "epoch": 493, "lr": 7.731450298313075e-06} +{"train_loss": 0.0003591689164750278, "global_step": 58682, "epoch": 493, "lr": 7.730266859683533e-06} +{"train_loss": 0.0006935148267075419, "global_step": 58683, "epoch": 493, "lr": 7.72908350404608e-06} +{"train_loss": 0.00023377589241135865, "global_step": 58684, "epoch": 493, "lr": 7.727900231403068e-06} +{"train_loss": 0.0008293738937936723, "global_step": 58685, "epoch": 493, "lr": 7.726717041756798e-06} +{"train_loss": 0.00027448893524706364, "global_step": 58686, "epoch": 493, "lr": 7.725533935109613e-06} +{"train_loss": 0.0003857881820295006, "global_step": 58687, "epoch": 493, "lr": 7.72435091146383e-06} +{"train_loss": 0.0006508630467578769, "global_step": 58688, "epoch": 493, "lr": 7.723167970821748e-06} +{"train_loss": 0.0004756715497933328, "global_step": 58689, "epoch": 493, "lr": 7.721985113185725e-06} +{"train_loss": 0.0010519723873585463, "global_step": 58690, "epoch": 493, "lr": 7.720802338558059e-06} +{"train_loss": 0.00036684598308056593, "global_step": 58691, "epoch": 493, "lr": 7.719619646941085e-06} +{"train_loss": 0.000741775322239846, "global_step": 58692, "epoch": 493, "lr": 7.718437038337118e-06} +{"train_loss": 0.0003265186387579888, "global_step": 58693, "epoch": 493, "lr": 7.717254512748485e-06} +{"train_loss": 0.0003674172912724316, "global_step": 58694, "epoch": 493, "lr": 7.71607207017751e-06} +{"train_loss": 0.0006273987819440663, "global_step": 58695, "epoch": 493, "lr": 7.7148897106265e-06} +{"train_loss": 0.0003713623736985028, "global_step": 58696, "epoch": 493, "lr": 7.713707434097795e-06} +{"train_loss": 0.00035905407276004553, "global_step": 58697, "epoch": 493, "lr": 7.7125252405937e-06} +{"train_loss": 0.0003136540181003511, "global_step": 58698, "epoch": 493, "lr": 7.711343130116556e-06} +{"train_loss": 0.0005647809011861682, "global_step": 58699, "epoch": 493, "lr": 7.710161102668666e-06} +{"train_loss": 0.0005055753863416612, "global_step": 58700, "epoch": 493, "lr": 7.708979158252349e-06} +{"train_loss": 0.0004963221726939082, "global_step": 58701, "epoch": 493, "lr": 7.707797296869945e-06} +{"train_loss": 0.0006866722251288593, "global_step": 58702, "epoch": 493, "lr": 7.706615518523752e-06} +{"train_loss": 0.0005559598794206977, "global_step": 58703, "epoch": 493, "lr": 7.705433823216106e-06} +{"train_loss": 0.0003480978193692863, "global_step": 58704, "epoch": 493, "lr": 7.704252210949319e-06} +{"train_loss": 0.00028790393844246864, "global_step": 58705, "epoch": 493, "lr": 7.703070681725722e-06} +{"train_loss": 0.0004715692193713039, "global_step": 58706, "epoch": 493, "lr": 7.701889235547616e-06} +{"train_loss": 0.0003800137201324105, "global_step": 58707, "epoch": 493, "lr": 7.700707872417345e-06} +{"train_loss": 0.00041024593519978225, "global_step": 58708, "epoch": 493, "lr": 7.699526592337203e-06} +{"train_loss": 0.0006757093360647559, "global_step": 58709, "epoch": 493, "lr": 7.698345395309531e-06} +{"train_loss": 0.0003591466520447284, "global_step": 58710, "epoch": 493, "lr": 7.697164281336628e-06} +{"train_loss": 0.0005507217720150948, "global_step": 58711, "epoch": 493, "lr": 7.69598325042082e-06} +{"train_loss": 0.00033486465690657496, "global_step": 58712, "epoch": 493, "lr": 7.694802302564446e-06} +{"train_loss": 0.0005190788651816547, "global_step": 58713, "epoch": 493, "lr": 7.693621437769805e-06} +{"train_loss": 0.0007295128307305276, "global_step": 58714, "epoch": 493, "lr": 7.692440656039207e-06} +{"train_loss": 0.0004740044823847711, "global_step": 58715, "epoch": 493, "lr": 7.691259957374997e-06} +{"train_loss": 0.0004536201013252139, "global_step": 58716, "epoch": 493, "lr": 7.69007934177946e-06} +{"train_loss": 0.00037901822361163795, "global_step": 58717, "epoch": 493, "lr": 7.688898809254952e-06} +{"train_loss": 0.00032072135945782065, "global_step": 58718, "epoch": 493, "lr": 7.687718359803763e-06} +{"train_loss": 0.00033804462873376906, "global_step": 58719, "epoch": 493, "lr": 7.68653799342821e-06} +{"train_loss": 0.00024097863934002817, "global_step": 58720, "epoch": 493, "lr": 7.68535771013063e-06} +{"train_loss": 0.00019129292923025787, "global_step": 58721, "epoch": 493, "lr": 7.684177509913321e-06} +{"train_loss": 0.0004311766824685037, "global_step": 58722, "epoch": 493, "lr": 7.682997392778618e-06} +{"train_loss": 0.0005204807966947556, "global_step": 58723, "epoch": 493, "lr": 7.681817358728815e-06} +{"train_loss": 0.00028710259357467294, "global_step": 58724, "epoch": 493, "lr": 7.680637407766262e-06} +{"train_loss": 0.0005077412351965904, "global_step": 58725, "epoch": 493, "lr": 7.679457539893248e-06} +{"train_loss": 0.0003214053576812148, "global_step": 58726, "epoch": 493, "lr": 7.67827775511209e-06} +{"train_loss": 0.0002778561902232468, "global_step": 58727, "epoch": 493, "lr": 7.677098053425125e-06} +{"train_loss": 0.00043088712845928967, "global_step": 58728, "epoch": 493, "lr": 7.67591843483464e-06} +{"train_loss": 0.00045921473065391183, "global_step": 58729, "epoch": 493, "lr": 7.674738899342982e-06} +{"train_loss": 0.00027868631877936423, "global_step": 58730, "epoch": 493, "lr": 7.673559446952444e-06} +{"train_loss": 0.0002760031202342361, "global_step": 58731, "epoch": 493, "lr": 7.672380077665354e-06} +{"train_loss": 0.0004877345636487007, "global_step": 58732, "epoch": 493, "lr": 7.671200791484029e-06} +{"train_loss": 0.00026642298325896263, "global_step": 58733, "epoch": 493, "lr": 7.67002158841077e-06} +{"train_loss": 0.00025836832355707884, "global_step": 58734, "epoch": 493, "lr": 7.668842468447907e-06} +{"train_loss": 0.00019368699577171355, "global_step": 58735, "epoch": 493, "lr": 7.667663431597739e-06} +{"train_loss": 0.0006655639153905213, "global_step": 58736, "epoch": 493, "lr": 7.666484477862607e-06} +{"train_loss": 0.0010590155143290758, "global_step": 58737, "epoch": 493, "lr": 7.665305607244804e-06} +{"train_loss": 0.00039779109647497535, "global_step": 58738, "epoch": 493, "lr": 7.664126819746643e-06} +{"train_loss": 0.00034204666735604405, "global_step": 58739, "epoch": 493, "lr": 7.662948115370445e-06} +{"train_loss": 0.0005997823900543153, "global_step": 58740, "epoch": 493, "lr": 7.661769494118537e-06} +{"train_loss": 0.0003057009889744222, "global_step": 58741, "epoch": 493, "lr": 7.660590955993213e-06} +{"train_loss": 0.0003422472218517214, "global_step": 58742, "epoch": 493, "lr": 7.659412500996804e-06} +{"train_loss": 0.0003968037781305611, "global_step": 58743, "epoch": 493, "lr": 7.658234129131603e-06} +{"train_loss": 0.0002757906331680715, "global_step": 58744, "epoch": 493, "lr": 7.657055840399946e-06} +{"train_loss": 0.00024570096866227686, "global_step": 58745, "epoch": 493, "lr": 7.655877634804125e-06} +{"train_loss": 0.0003250049485359341, "global_step": 58746, "epoch": 493, "lr": 7.654699512346481e-06} +{"train_loss": 0.00037483155028894544, "global_step": 58747, "epoch": 493, "lr": 7.653521473029296e-06} +{"train_loss": 0.00021774668130092323, "global_step": 58748, "epoch": 493, "lr": 7.652343516854909e-06} +{"train_loss": 0.0002513734216336161, "global_step": 58749, "epoch": 493, "lr": 7.651165643825608e-06} +{"train_loss": 0.0002473684726282954, "global_step": 58750, "epoch": 493, "lr": 7.64998785394373e-06} +{"train_loss": 0.00033519291901029646, "global_step": 58751, "epoch": 493, "lr": 7.648810147211583e-06} +{"train_loss": 0.0004878481267951429, "global_step": 58752, "epoch": 493, "lr": 7.647632523631454e-06} +{"train_loss": 0.0002495745138730854, "global_step": 58753, "epoch": 493, "lr": 7.646454983205687e-06} +{"train_loss": 0.0005333316512405872, "global_step": 58754, "epoch": 493, "lr": 7.645277525936572e-06} +{"train_loss": 0.0003380347625352442, "global_step": 58755, "epoch": 493, "lr": 7.64410015182644e-06} +{"train_loss": 0.0003293760819360614, "global_step": 58756, "epoch": 493, "lr": 7.642922860877588e-06} +{"train_loss": 0.00021875367383472621, "global_step": 58757, "epoch": 493, "lr": 7.641745653092324e-06} +{"train_loss": 0.0002157678100047633, "global_step": 58758, "epoch": 493, "lr": 7.64056852847298e-06} +{"train_loss": 0.0005104589508846402, "global_step": 58759, "epoch": 493, "lr": 7.639391487021841e-06} +{"train_loss": 0.00042524555465206504, "global_step": 58760, "epoch": 493, "lr": 7.638214528741245e-06} +{"train_loss": 0.0002897700178436935, "global_step": 58761, "epoch": 493, "lr": 7.637037653633478e-06} +{"train_loss": 0.0002997757983393967, "global_step": 58762, "epoch": 493, "lr": 7.635860861700866e-06} +{"train_loss": 0.0006005692412145436, "global_step": 58763, "epoch": 493, "lr": 7.63468415294572e-06} +{"train_loss": 0.0003915088891517371, "global_step": 58764, "epoch": 493, "lr": 7.633507527370338e-06} +{"train_loss": 0.001021986361593008, "global_step": 58765, "epoch": 493, "lr": 7.632330984977044e-06} +{"train_loss": 0.0007591868052259088, "global_step": 58766, "epoch": 493, "lr": 7.631154525768131e-06} +{"train_loss": 0.00031749167828820646, "global_step": 58767, "epoch": 493, "lr": 7.629978149745931e-06} +{"train_loss": 0.00031746432068757713, "global_step": 58768, "epoch": 493, "lr": 7.628801856912743e-06} +{"train_loss": 0.000643183768261224, "global_step": 58769, "epoch": 493, "lr": 7.627625647270869e-06} +{"train_loss": 0.0002315333840670064, "global_step": 58770, "epoch": 493, "lr": 7.626449520822632e-06} +{"train_loss": 0.000947785098105669, "global_step": 58771, "epoch": 493, "lr": 7.625273477570322e-06} +{"train_loss": 0.0005427211290225387, "global_step": 58772, "epoch": 493, "lr": 7.624097517516271e-06} +{"train_loss": 0.0005190508672967553, "global_step": 58773, "epoch": 493, "lr": 7.622921640662772e-06} +{"train_loss": 0.0006290663150139153, "global_step": 58774, "epoch": 493, "lr": 7.621745847012135e-06} +{"train_loss": 0.0007795390556566417, "global_step": 58775, "epoch": 493, "lr": 7.620570136566685e-06} +{"train_loss": 0.000385540712159127, "global_step": 58776, "epoch": 493, "lr": 7.6193945093287036e-06} +{"train_loss": 0.0002486119628883898, "global_step": 58777, "epoch": 493, "lr": 7.6182189653005275e-06} +{"train_loss": 0.0011206152848899364, "global_step": 58778, "epoch": 493, "lr": 7.617043504484439e-06} +{"train_loss": 0.0011047400766983628, "global_step": 58779, "epoch": 493, "lr": 7.615868126882769e-06} +{"train_loss": 0.0006263715913519263, "global_step": 58780, "epoch": 493, "lr": 7.614692832497799e-06} +{"train_loss": 0.0007946233963593841, "global_step": 58781, "epoch": 493, "lr": 7.613517621331867e-06} +{"train_loss": 0.00023081828840076923, "global_step": 58782, "epoch": 493, "lr": 7.612342493387264e-06} +{"train_loss": 0.0002709974942263216, "global_step": 58783, "epoch": 493, "lr": 7.611167448666284e-06} +{"train_loss": 0.0006844886229373515, "global_step": 58784, "epoch": 493, "lr": 7.609992487171264e-06} +{"train_loss": 0.00045450832014864295, "global_step": 58785, "epoch": 493, "lr": 7.608817608904484e-06, "val_loss": 0.016982121393084526} +{"train_loss": 0.00030419911490753293, "global_step": 58786, "epoch": 494, "lr": 7.607642813868271e-06} +{"train_loss": 0.0011545814340934157, "global_step": 58787, "epoch": 494, "lr": 7.606468102064918e-06} +{"train_loss": 0.0008929370087571442, "global_step": 58788, "epoch": 494, "lr": 7.605293473496733e-06} +{"train_loss": 0.0008968281326815486, "global_step": 58789, "epoch": 494, "lr": 7.604118928166032e-06} +{"train_loss": 0.0005409863078966737, "global_step": 58790, "epoch": 494, "lr": 7.602944466075101e-06} +{"train_loss": 0.0006684164982289076, "global_step": 58791, "epoch": 494, "lr": 7.601770087226273e-06} +{"train_loss": 0.0005288663087412715, "global_step": 58792, "epoch": 494, "lr": 7.600595791621828e-06} +{"train_loss": 0.0010018227621912956, "global_step": 58793, "epoch": 494, "lr": 7.599421579264093e-06} +{"train_loss": 0.0004132950271014124, "global_step": 58794, "epoch": 494, "lr": 7.598247450155366e-06} +{"train_loss": 0.0007714530802331865, "global_step": 58795, "epoch": 494, "lr": 7.597073404297939e-06} +{"train_loss": 0.0003924315969925374, "global_step": 58796, "epoch": 494, "lr": 7.595899441694138e-06} +{"train_loss": 0.0003153385187033564, "global_step": 58797, "epoch": 494, "lr": 7.59472556234625e-06} +{"train_loss": 0.00027724713436327875, "global_step": 58798, "epoch": 494, "lr": 7.593551766256596e-06} +{"train_loss": 0.0005589303909800947, "global_step": 58799, "epoch": 494, "lr": 7.592378053427462e-06} +{"train_loss": 0.00030115569825284183, "global_step": 58800, "epoch": 494, "lr": 7.591204423861176e-06} +{"train_loss": 0.0007264515734277666, "global_step": 58801, "epoch": 494, "lr": 7.590030877560028e-06} +{"train_loss": 0.0005458331434056163, "global_step": 58802, "epoch": 494, "lr": 7.588857414526313e-06} +{"train_loss": 0.0006060974556021392, "global_step": 58803, "epoch": 494, "lr": 7.587684034762355e-06} +{"train_loss": 0.0007115152548067272, "global_step": 58804, "epoch": 494, "lr": 7.5865107382704355e-06} +{"train_loss": 0.0003349852340761572, "global_step": 58805, "epoch": 494, "lr": 7.5853375250528876e-06} +{"train_loss": 0.0008105041342787445, "global_step": 58806, "epoch": 494, "lr": 7.584164395111981e-06} +{"train_loss": 0.0004974933690391481, "global_step": 58807, "epoch": 494, "lr": 7.582991348450053e-06} +{"train_loss": 0.0006586101371794939, "global_step": 58808, "epoch": 494, "lr": 7.581818385069378e-06} +{"train_loss": 0.00039872524212114513, "global_step": 58809, "epoch": 494, "lr": 7.5806455049722666e-06} +{"train_loss": 0.0003089510428253561, "global_step": 58810, "epoch": 494, "lr": 7.579472708161039e-06} +{"train_loss": 0.0005400748923420906, "global_step": 58811, "epoch": 494, "lr": 7.578299994637977e-06} +{"train_loss": 0.0005706482916139066, "global_step": 58812, "epoch": 494, "lr": 7.5771273644054006e-06} +{"train_loss": 0.0005218205042183399, "global_step": 58813, "epoch": 494, "lr": 7.575954817465597e-06} +{"train_loss": 0.0009187177056446671, "global_step": 58814, "epoch": 494, "lr": 7.5747823538208695e-06} +{"train_loss": 0.00044084727414883673, "global_step": 58815, "epoch": 494, "lr": 7.573609973473533e-06} +{"train_loss": 0.0003918228030670434, "global_step": 58816, "epoch": 494, "lr": 7.57243767642587e-06} +{"train_loss": 0.0003845168394036591, "global_step": 58817, "epoch": 494, "lr": 7.571265462680205e-06} +{"train_loss": 0.0006040438893251121, "global_step": 58818, "epoch": 494, "lr": 7.570093332238826e-06} +{"train_loss": 0.0004351603565737605, "global_step": 58819, "epoch": 494, "lr": 7.568921285104025e-06} +{"train_loss": 0.0005344278179109097, "global_step": 58820, "epoch": 494, "lr": 7.5677493212781225e-06} +{"train_loss": 0.00040863879257813096, "global_step": 58821, "epoch": 494, "lr": 7.5665774407634e-06} +{"train_loss": 0.0004252759099472314, "global_step": 58822, "epoch": 494, "lr": 7.565405643562185e-06} +{"train_loss": 0.0003767543239519, "global_step": 58823, "epoch": 494, "lr": 7.564233929676745e-06} +{"train_loss": 0.0005210338858887553, "global_step": 58824, "epoch": 494, "lr": 7.563062299109413e-06} +{"train_loss": 0.0003842478326987475, "global_step": 58825, "epoch": 494, "lr": 7.561890751862477e-06} +{"train_loss": 0.0005620549200102687, "global_step": 58826, "epoch": 494, "lr": 7.5607192879382225e-06} +{"train_loss": 0.0006114456336945295, "global_step": 58827, "epoch": 494, "lr": 7.559547907338971e-06} +{"train_loss": 0.0006200596690177917, "global_step": 58828, "epoch": 494, "lr": 7.558376610067003e-06} +{"train_loss": 0.0002491594641469419, "global_step": 58829, "epoch": 494, "lr": 7.557205396124639e-06} +{"train_loss": 0.0005758309853263199, "global_step": 58830, "epoch": 494, "lr": 7.556034265514156e-06} +{"train_loss": 0.000436530914157629, "global_step": 58831, "epoch": 494, "lr": 7.554863218237879e-06} +{"train_loss": 0.0004370558017399162, "global_step": 58832, "epoch": 494, "lr": 7.553692254298089e-06} +{"train_loss": 0.0002858448715414852, "global_step": 58833, "epoch": 494, "lr": 7.55252137369708e-06} +{"train_loss": 0.0005086544551886618, "global_step": 58834, "epoch": 494, "lr": 7.551350576437172e-06} +{"train_loss": 0.00020378842600621283, "global_step": 58835, "epoch": 494, "lr": 7.550179862520645e-06} +{"train_loss": 0.0003422410518396646, "global_step": 58836, "epoch": 494, "lr": 7.5490092319498104e-06} +{"train_loss": 0.0010826917132362723, "global_step": 58837, "epoch": 494, "lr": 7.547838684726954e-06} +{"train_loss": 0.00044283230090513825, "global_step": 58838, "epoch": 494, "lr": 7.546668220854386e-06} +{"train_loss": 0.000811619043815881, "global_step": 58839, "epoch": 494, "lr": 7.545497840334392e-06} +{"train_loss": 0.00032705740886740386, "global_step": 58840, "epoch": 494, "lr": 7.544327543169288e-06} +{"train_loss": 0.0004714095557574183, "global_step": 58841, "epoch": 494, "lr": 7.543157329361356e-06} +{"train_loss": 0.0005003937403671443, "global_step": 58842, "epoch": 494, "lr": 7.541987198912903e-06} +{"train_loss": 0.00039797386853024364, "global_step": 58843, "epoch": 494, "lr": 7.540817151826213e-06} +{"train_loss": 0.0005774469464085996, "global_step": 58844, "epoch": 494, "lr": 7.539647188103604e-06} +{"train_loss": 0.0004494256863836199, "global_step": 58845, "epoch": 494, "lr": 7.538477307747349e-06} +{"train_loss": 0.0003021432494278997, "global_step": 58846, "epoch": 494, "lr": 7.537307510759767e-06} +{"train_loss": 0.00046628390555270016, "global_step": 58847, "epoch": 494, "lr": 7.536137797143139e-06} +{"train_loss": 0.00028835010016337037, "global_step": 58848, "epoch": 494, "lr": 7.534968166899775e-06} +{"train_loss": 0.0003802118881139904, "global_step": 58849, "epoch": 494, "lr": 7.533798620031951e-06} +{"train_loss": 0.000358749384758994, "global_step": 58850, "epoch": 494, "lr": 7.532629156541993e-06} +{"train_loss": 0.00030873343348503113, "global_step": 58851, "epoch": 494, "lr": 7.531459776432181e-06} +{"train_loss": 0.0008735746960155666, "global_step": 58852, "epoch": 494, "lr": 7.530290479704794e-06} +{"train_loss": 0.0003635050670709461, "global_step": 58853, "epoch": 494, "lr": 7.52912126636216e-06} +{"train_loss": 0.00042528234189376235, "global_step": 58854, "epoch": 494, "lr": 7.527952136406547e-06} +{"train_loss": 0.0006187091930769384, "global_step": 58855, "epoch": 494, "lr": 7.526783089840272e-06} +{"train_loss": 0.0003456707636360079, "global_step": 58856, "epoch": 494, "lr": 7.525614126665626e-06} +{"train_loss": 0.0006089739035815, "global_step": 58857, "epoch": 494, "lr": 7.524445246884881e-06} +{"train_loss": 0.0004951629671268165, "global_step": 58858, "epoch": 494, "lr": 7.5232764505003664e-06} +{"train_loss": 0.0005698896129615605, "global_step": 58859, "epoch": 494, "lr": 7.522107737514345e-06} +{"train_loss": 0.0002983607118949294, "global_step": 58860, "epoch": 494, "lr": 7.5209391079291426e-06} +{"train_loss": 0.0006357660749927163, "global_step": 58861, "epoch": 494, "lr": 7.519770561747025e-06} +{"train_loss": 0.00041264656465500593, "global_step": 58862, "epoch": 494, "lr": 7.518602098970307e-06} +{"train_loss": 0.0004876671882811934, "global_step": 58863, "epoch": 494, "lr": 7.51743371960128e-06} +{"train_loss": 0.00030121859163045883, "global_step": 58864, "epoch": 494, "lr": 7.516265423642221e-06} +{"train_loss": 0.0004197507514618337, "global_step": 58865, "epoch": 494, "lr": 7.515097211095446e-06} +{"train_loss": 0.0005183209432289004, "global_step": 58866, "epoch": 494, "lr": 7.513929081963228e-06} +{"train_loss": 0.0004044634406454861, "global_step": 58867, "epoch": 494, "lr": 7.512761036247884e-06} +{"train_loss": 0.0006242034141905606, "global_step": 58868, "epoch": 494, "lr": 7.511593073951684e-06} +{"train_loss": 0.0009143597562797368, "global_step": 58869, "epoch": 494, "lr": 7.510425195076942e-06} +{"train_loss": 0.0002593003446236253, "global_step": 58870, "epoch": 494, "lr": 7.509257399625941e-06} +{"train_loss": 0.0006853517261333764, "global_step": 58871, "epoch": 494, "lr": 7.508089687600961e-06} +{"train_loss": 0.00047420462942682207, "global_step": 58872, "epoch": 494, "lr": 7.506922059004307e-06} +{"train_loss": 0.0007061453652568161, "global_step": 58873, "epoch": 494, "lr": 7.505754513838281e-06} +{"train_loss": 0.0002390993176959455, "global_step": 58874, "epoch": 494, "lr": 7.504587052105161e-06} +{"train_loss": 0.0005350198480300605, "global_step": 58875, "epoch": 494, "lr": 7.503419673807255e-06} +{"train_loss": 0.0009333030320703983, "global_step": 58876, "epoch": 494, "lr": 7.502252378946828e-06} +{"train_loss": 0.0008529707556590438, "global_step": 58877, "epoch": 494, "lr": 7.501085167526201e-06} +{"train_loss": 0.0002282118221046403, "global_step": 58878, "epoch": 494, "lr": 7.499918039547643e-06} +{"train_loss": 0.0005627431673929095, "global_step": 58879, "epoch": 494, "lr": 7.498750995013465e-06} +{"train_loss": 0.00023937091464176774, "global_step": 58880, "epoch": 494, "lr": 7.497584033925942e-06} +{"train_loss": 0.0005514565273188055, "global_step": 58881, "epoch": 494, "lr": 7.496417156287378e-06} +{"train_loss": 0.00034372470690868795, "global_step": 58882, "epoch": 494, "lr": 7.4952503621000644e-06} +{"train_loss": 0.0006683747633360326, "global_step": 58883, "epoch": 494, "lr": 7.494083651366268e-06} +{"train_loss": 0.0006400531274266541, "global_step": 58884, "epoch": 494, "lr": 7.492917024088314e-06} +{"train_loss": 0.00036881931009702384, "global_step": 58885, "epoch": 494, "lr": 7.491750480268461e-06} +{"train_loss": 0.0007018368341960013, "global_step": 58886, "epoch": 494, "lr": 7.490584019909025e-06} +{"train_loss": 0.0004583295376505703, "global_step": 58887, "epoch": 494, "lr": 7.489417643012287e-06} +{"train_loss": 0.0002920636907219887, "global_step": 58888, "epoch": 494, "lr": 7.488251349580527e-06} +{"train_loss": 0.0003688902943395078, "global_step": 58889, "epoch": 494, "lr": 7.4870851396160516e-06} +{"train_loss": 0.0006261979578994215, "global_step": 58890, "epoch": 494, "lr": 7.485919013121134e-06} +{"train_loss": 0.00045384152326732874, "global_step": 58891, "epoch": 494, "lr": 7.484752970098086e-06} +{"train_loss": 0.00027275236789137125, "global_step": 58892, "epoch": 494, "lr": 7.483587010549164e-06} +{"train_loss": 0.0004784047487191856, "global_step": 58893, "epoch": 494, "lr": 7.482421134476697e-06} +{"train_loss": 0.0004913675365969539, "global_step": 58894, "epoch": 494, "lr": 7.4812553418829475e-06} +{"train_loss": 0.0008776937611401081, "global_step": 58895, "epoch": 494, "lr": 7.480089632770204e-06} +{"train_loss": 0.0007585401181131601, "global_step": 58896, "epoch": 494, "lr": 7.478924007140769e-06} +{"train_loss": 0.00031796289840713143, "global_step": 58897, "epoch": 494, "lr": 7.4777584649969145e-06} +{"train_loss": 0.0006934510311111808, "global_step": 58898, "epoch": 494, "lr": 7.4765930063409485e-06} +{"train_loss": 0.0002823651011567563, "global_step": 58899, "epoch": 494, "lr": 7.4754276311751414e-06} +{"train_loss": 0.00031865446362644434, "global_step": 58900, "epoch": 494, "lr": 7.474262339501797e-06} +{"train_loss": 0.0005793951568193734, "global_step": 58901, "epoch": 494, "lr": 7.473097131323198e-06} +{"train_loss": 0.0004668265173677355, "global_step": 58902, "epoch": 494, "lr": 7.471932006641619e-06} +{"train_loss": 0.0003821268037427217, "global_step": 58903, "epoch": 494, "lr": 7.470766965459364e-06} +{"train_loss": 0.0005112050362606337, "global_step": 58904, "epoch": 494, "lr": 7.4696020077787085e-06, "val_loss": 0.030148319900035858} +{"train_loss": 0.00032406681566499174, "global_step": 58905, "epoch": 495, "lr": 7.468437133601952e-06} +{"train_loss": 0.0005388866411522031, "global_step": 58906, "epoch": 495, "lr": 7.46727234293137e-06} +{"train_loss": 0.0006465119658969343, "global_step": 58907, "epoch": 495, "lr": 7.4661076357692485e-06} +{"train_loss": 0.0002796915068756789, "global_step": 58908, "epoch": 495, "lr": 7.464943012117898e-06} +{"train_loss": 0.00033971614902839065, "global_step": 58909, "epoch": 495, "lr": 7.4637784719795715e-06} +{"train_loss": 0.0004777373105753213, "global_step": 58910, "epoch": 495, "lr": 7.462614015356584e-06} +{"train_loss": 0.0001842471829149872, "global_step": 58911, "epoch": 495, "lr": 7.4614496422512e-06} +{"train_loss": 0.00021271857258398086, "global_step": 58912, "epoch": 495, "lr": 7.4602853526657245e-06} +{"train_loss": 0.00038911160663701594, "global_step": 58913, "epoch": 495, "lr": 7.459121146602432e-06} +{"train_loss": 0.0009655609028413892, "global_step": 58914, "epoch": 495, "lr": 7.457957024063606e-06} +{"train_loss": 0.00043337297393009067, "global_step": 58915, "epoch": 495, "lr": 7.456792985051542e-06} +{"train_loss": 0.0004804065392818302, "global_step": 58916, "epoch": 495, "lr": 7.455629029568512e-06} +{"train_loss": 0.0002344990789424628, "global_step": 58917, "epoch": 495, "lr": 7.454465157616819e-06} +{"train_loss": 0.00022362859454005957, "global_step": 58918, "epoch": 495, "lr": 7.453301369198723e-06} +{"train_loss": 0.0008033711928874254, "global_step": 58919, "epoch": 495, "lr": 7.452137664316538e-06} +{"train_loss": 0.0006474814144894481, "global_step": 58920, "epoch": 495, "lr": 7.450974042972542e-06} +{"train_loss": 0.00030507089104503393, "global_step": 58921, "epoch": 495, "lr": 7.449810505168991e-06} +{"train_loss": 0.00030387192964553833, "global_step": 58922, "epoch": 495, "lr": 7.4486470509082086e-06} +{"train_loss": 0.0003514603595249355, "global_step": 58923, "epoch": 495, "lr": 7.447483680192452e-06} +{"train_loss": 0.00030486821196973324, "global_step": 58924, "epoch": 495, "lr": 7.44632039302402e-06} +{"train_loss": 0.0004020522756036371, "global_step": 58925, "epoch": 495, "lr": 7.445157189405199e-06} +{"train_loss": 0.0006288589793257415, "global_step": 58926, "epoch": 495, "lr": 7.4439940693382505e-06} +{"train_loss": 0.00025504795485176146, "global_step": 58927, "epoch": 495, "lr": 7.442831032825487e-06} +{"train_loss": 0.00034675243659876287, "global_step": 58928, "epoch": 495, "lr": 7.441668079869163e-06} +{"train_loss": 0.0005714193102903664, "global_step": 58929, "epoch": 495, "lr": 7.4405052104715875e-06} +{"train_loss": 0.00042389577720314264, "global_step": 58930, "epoch": 495, "lr": 7.439342424635026e-06} +{"train_loss": 0.0004026555398013443, "global_step": 58931, "epoch": 495, "lr": 7.438179722361776e-06} +{"train_loss": 0.000735724694095552, "global_step": 58932, "epoch": 495, "lr": 7.43701710365412e-06} +{"train_loss": 0.00041198619874194264, "global_step": 58933, "epoch": 495, "lr": 7.4358545685143165e-06} +{"train_loss": 0.00035534834023565054, "global_step": 58934, "epoch": 495, "lr": 7.434692116944675e-06} +{"train_loss": 0.00031541980570182204, "global_step": 58935, "epoch": 495, "lr": 7.43352974894746e-06} +{"train_loss": 0.0006217400077730417, "global_step": 58936, "epoch": 495, "lr": 7.432367464524975e-06} +{"train_loss": 0.0002845238777808845, "global_step": 58937, "epoch": 495, "lr": 7.431205263679475e-06} +{"train_loss": 0.0006978936726227403, "global_step": 58938, "epoch": 495, "lr": 7.430043146413268e-06} +{"train_loss": 0.000841963104903698, "global_step": 58939, "epoch": 495, "lr": 7.428881112728609e-06} +{"train_loss": 0.0005274815484881401, "global_step": 58940, "epoch": 495, "lr": 7.4277191626278105e-06} +{"train_loss": 0.0005081845447421074, "global_step": 58941, "epoch": 495, "lr": 7.426557296113123e-06} +{"train_loss": 0.0005006719729863107, "global_step": 58942, "epoch": 495, "lr": 7.425395513186839e-06} +{"train_loss": 0.0002041947445832193, "global_step": 58943, "epoch": 495, "lr": 7.424233813851256e-06} +{"train_loss": 0.00038265209877863526, "global_step": 58944, "epoch": 495, "lr": 7.423072198108644e-06} +{"train_loss": 0.00039296215982176363, "global_step": 58945, "epoch": 495, "lr": 7.421910665961268e-06} +{"train_loss": 0.0005022368859499693, "global_step": 58946, "epoch": 495, "lr": 7.420749217411433e-06} +{"train_loss": 0.000246027106186375, "global_step": 58947, "epoch": 495, "lr": 7.419587852461396e-06} +{"train_loss": 0.00043398476555012167, "global_step": 58948, "epoch": 495, "lr": 7.4184265711134625e-06} +{"train_loss": 0.0003218190686311573, "global_step": 58949, "epoch": 495, "lr": 7.417265373369886e-06} +{"train_loss": 0.000261238485109061, "global_step": 58950, "epoch": 495, "lr": 7.41610425923297e-06} +{"train_loss": 0.00030025863088667393, "global_step": 58951, "epoch": 495, "lr": 7.414943228704984e-06} +{"train_loss": 0.000444683333626017, "global_step": 58952, "epoch": 495, "lr": 7.413782281788201e-06} +{"train_loss": 0.00041770178359001875, "global_step": 58953, "epoch": 495, "lr": 7.412621418484911e-06} +{"train_loss": 0.0002335972385481, "global_step": 58954, "epoch": 495, "lr": 7.41146063879738e-06} +{"train_loss": 0.00019036729645449668, "global_step": 58955, "epoch": 495, "lr": 7.4102999427279105e-06} +{"train_loss": 0.00041216114186681807, "global_step": 58956, "epoch": 495, "lr": 7.409139330278764e-06} +{"train_loss": 0.00041550147579982877, "global_step": 58957, "epoch": 495, "lr": 7.4079788014522145e-06} +{"train_loss": 0.00039102049777284265, "global_step": 58958, "epoch": 495, "lr": 7.406818356250556e-06} +{"train_loss": 0.0007334608817473054, "global_step": 58959, "epoch": 495, "lr": 7.405657994676052e-06} +{"train_loss": 0.0006321886321529746, "global_step": 58960, "epoch": 495, "lr": 7.404497716730996e-06} +{"train_loss": 0.0005076931556686759, "global_step": 58961, "epoch": 495, "lr": 7.403337522417647e-06} +{"train_loss": 0.0003600813797675073, "global_step": 58962, "epoch": 495, "lr": 7.402177411738304e-06} +{"train_loss": 0.0005352634470909834, "global_step": 58963, "epoch": 495, "lr": 7.401017384695236e-06} +{"train_loss": 0.00035697303246706724, "global_step": 58964, "epoch": 495, "lr": 7.399857441290709e-06} +{"train_loss": 0.0007087277481332421, "global_step": 58965, "epoch": 495, "lr": 7.39869758152702e-06} +{"train_loss": 0.00022601342061534524, "global_step": 58966, "epoch": 495, "lr": 7.397537805406429e-06} +{"train_loss": 0.00024574974668212235, "global_step": 58967, "epoch": 495, "lr": 7.396378112931229e-06} +{"train_loss": 0.0002813240571413189, "global_step": 58968, "epoch": 495, "lr": 7.3952185041036795e-06} +{"train_loss": 0.0004190239415038377, "global_step": 58969, "epoch": 495, "lr": 7.394058978926077e-06} +{"train_loss": 0.0008133664377965033, "global_step": 58970, "epoch": 495, "lr": 7.392899537400677e-06} +{"train_loss": 0.0002759822818916291, "global_step": 58971, "epoch": 495, "lr": 7.391740179529783e-06} +{"train_loss": 0.00031269140890799463, "global_step": 58972, "epoch": 495, "lr": 7.390580905315636e-06} +{"train_loss": 0.0003854899841826409, "global_step": 58973, "epoch": 495, "lr": 7.389421714760547e-06} +{"train_loss": 0.00033646004158072174, "global_step": 58974, "epoch": 495, "lr": 7.388262607866764e-06} +{"train_loss": 0.00039054162334650755, "global_step": 58975, "epoch": 495, "lr": 7.3871035846365845e-06} +{"train_loss": 0.0002701885241549462, "global_step": 58976, "epoch": 495, "lr": 7.385944645072268e-06} +{"train_loss": 0.0005938030662946403, "global_step": 58977, "epoch": 495, "lr": 7.3847857891761016e-06} +{"train_loss": 0.00040691805770620704, "global_step": 58978, "epoch": 495, "lr": 7.383627016950351e-06} +{"train_loss": 0.00041787693044170737, "global_step": 58979, "epoch": 495, "lr": 7.382468328397302e-06} +{"train_loss": 0.0004805948701687157, "global_step": 58980, "epoch": 495, "lr": 7.381309723519214e-06} +{"train_loss": 0.0002940532867796719, "global_step": 58981, "epoch": 495, "lr": 7.380151202318381e-06} +{"train_loss": 0.0002717238967306912, "global_step": 58982, "epoch": 495, "lr": 7.378992764797071e-06} +{"train_loss": 0.00040694500785320997, "global_step": 58983, "epoch": 495, "lr": 7.37783441095754e-06} +{"train_loss": 0.00040182872908189893, "global_step": 58984, "epoch": 495, "lr": 7.376676140802091e-06} +{"train_loss": 0.0005931549821980298, "global_step": 58985, "epoch": 495, "lr": 7.3755179543329725e-06} +{"train_loss": 0.0005869101732969284, "global_step": 58986, "epoch": 495, "lr": 7.374359851552487e-06} +{"train_loss": 0.0005017642397433519, "global_step": 58987, "epoch": 495, "lr": 7.373201832462873e-06} +{"train_loss": 0.00023257796419784427, "global_step": 58988, "epoch": 495, "lr": 7.372043897066438e-06} +{"train_loss": 0.0003809029294643551, "global_step": 58989, "epoch": 495, "lr": 7.370886045365444e-06} +{"train_loss": 0.0002667478402145207, "global_step": 58990, "epoch": 495, "lr": 7.369728277362148e-06} +{"train_loss": 0.0007500048377551138, "global_step": 58991, "epoch": 495, "lr": 7.368570593058843e-06} +{"train_loss": 0.00043137939064763486, "global_step": 58992, "epoch": 495, "lr": 7.36741299245779e-06} +{"train_loss": 0.000240741137531586, "global_step": 58993, "epoch": 495, "lr": 7.366255475561273e-06} +{"train_loss": 0.0003752642951440066, "global_step": 58994, "epoch": 495, "lr": 7.36509804237156e-06} +{"train_loss": 0.00040843666647560894, "global_step": 58995, "epoch": 495, "lr": 7.363940692890914e-06} +{"train_loss": 0.00034386085462756455, "global_step": 58996, "epoch": 495, "lr": 7.362783427121622e-06} +{"train_loss": 0.0004311329103074968, "global_step": 58997, "epoch": 495, "lr": 7.361626245065944e-06} +{"train_loss": 0.00034097657771781087, "global_step": 58998, "epoch": 495, "lr": 7.360469146726162e-06} +{"train_loss": 0.00020419088832568377, "global_step": 58999, "epoch": 495, "lr": 7.35931213210454e-06} +{"train_loss": 0.0002177751885028556, "global_step": 59000, "epoch": 495, "lr": 7.35815520120336e-06} +{"train_loss": 0.00023292744299396873, "global_step": 59001, "epoch": 495, "lr": 7.356998354024886e-06} +{"train_loss": 0.000703304132912308, "global_step": 59002, "epoch": 495, "lr": 7.355841590571377e-06} +{"train_loss": 0.0005168088246136904, "global_step": 59003, "epoch": 495, "lr": 7.354684910845133e-06} +{"train_loss": 0.00028149562422186136, "global_step": 59004, "epoch": 495, "lr": 7.353528314848396e-06} +{"train_loss": 0.0002952733775600791, "global_step": 59005, "epoch": 495, "lr": 7.352371802583452e-06} +{"train_loss": 0.0005177041748538613, "global_step": 59006, "epoch": 495, "lr": 7.351215374052578e-06} +{"train_loss": 0.0004339484730735421, "global_step": 59007, "epoch": 495, "lr": 7.350059029258027e-06} +{"train_loss": 0.00027724786195904016, "global_step": 59008, "epoch": 495, "lr": 7.348902768202088e-06} +{"train_loss": 0.0004310954827815294, "global_step": 59009, "epoch": 495, "lr": 7.347746590887011e-06} +{"train_loss": 0.00037619288195855916, "global_step": 59010, "epoch": 495, "lr": 7.346590497315093e-06} +{"train_loss": 0.0005357870250009, "global_step": 59011, "epoch": 495, "lr": 7.345434487488567e-06} +{"train_loss": 0.0004607998125720769, "global_step": 59012, "epoch": 495, "lr": 7.34427856140974e-06} +{"train_loss": 0.0005568102351389825, "global_step": 59013, "epoch": 495, "lr": 7.343122719080864e-06} +{"train_loss": 0.0007491396390832961, "global_step": 59014, "epoch": 495, "lr": 7.341966960504199e-06} +{"train_loss": 0.0006403548177331686, "global_step": 59015, "epoch": 495, "lr": 7.340811285682036e-06} +{"train_loss": 0.0006122415070421994, "global_step": 59016, "epoch": 495, "lr": 7.33965569461662e-06} +{"train_loss": 0.0005131161888130009, "global_step": 59017, "epoch": 495, "lr": 7.338500187310249e-06} +{"train_loss": 0.0003954360436182469, "global_step": 59018, "epoch": 495, "lr": 7.337344763765159e-06} +{"train_loss": 0.00020458651124499738, "global_step": 59019, "epoch": 495, "lr": 7.336189423983647e-06} +{"train_loss": 0.00037259369855746627, "global_step": 59020, "epoch": 495, "lr": 7.335034167967969e-06} +{"train_loss": 0.0004591795732267201, "global_step": 59021, "epoch": 495, "lr": 7.333878995720378e-06} +{"train_loss": 0.00042866080184467137, "global_step": 59022, "epoch": 495, "lr": 7.332723907243178e-06} +{"train_loss": 0.0004248322730447643, "global_step": 59023, "epoch": 495, "lr": 7.331568902538594e-06, "val_loss": 0.019513951614499092, "train_action_mse_error": 4.922959305986296e-06} +{"train_loss": 0.000586490728892386, "global_step": 59024, "epoch": 496, "lr": 7.330413981608935e-06} +{"train_loss": 0.0003899986040778458, "global_step": 59025, "epoch": 496, "lr": 7.329259144456446e-06} +{"train_loss": 0.0002816009509842843, "global_step": 59026, "epoch": 496, "lr": 7.32810439108339e-06} +{"train_loss": 0.00020266564388293773, "global_step": 59027, "epoch": 496, "lr": 7.3269497214920494e-06} +{"train_loss": 0.0005570889916270971, "global_step": 59028, "epoch": 496, "lr": 7.325795135684676e-06} +{"train_loss": 0.00030118372524157166, "global_step": 59029, "epoch": 496, "lr": 7.324640633663554e-06} +{"train_loss": 0.0002521446440368891, "global_step": 59030, "epoch": 496, "lr": 7.3234862154309305e-06} +{"train_loss": 0.0005580255528911948, "global_step": 59031, "epoch": 496, "lr": 7.322331880989097e-06} +{"train_loss": 0.0003484278277028352, "global_step": 59032, "epoch": 496, "lr": 7.321177630340298e-06} +{"train_loss": 0.0005714829894714057, "global_step": 59033, "epoch": 496, "lr": 7.320023463486803e-06} +{"train_loss": 0.0007639917312189937, "global_step": 59034, "epoch": 496, "lr": 7.318869380430893e-06} +{"train_loss": 0.00018714592442847788, "global_step": 59035, "epoch": 496, "lr": 7.317715381174806e-06} +{"train_loss": 0.0002916427329182625, "global_step": 59036, "epoch": 496, "lr": 7.316561465720839e-06} +{"train_loss": 0.0006153874564915895, "global_step": 59037, "epoch": 496, "lr": 7.315407634071236e-06} +{"train_loss": 0.000273609854048118, "global_step": 59038, "epoch": 496, "lr": 7.314253886228278e-06} +{"train_loss": 0.0004511297447606921, "global_step": 59039, "epoch": 496, "lr": 7.313100222194208e-06} +{"train_loss": 0.0007412892882712185, "global_step": 59040, "epoch": 496, "lr": 7.3119466419713125e-06} +{"train_loss": 0.00028604656108655035, "global_step": 59041, "epoch": 496, "lr": 7.310793145561856e-06} +{"train_loss": 0.0004623382701538503, "global_step": 59042, "epoch": 496, "lr": 7.309639732968082e-06} +{"train_loss": 0.0005613118410110474, "global_step": 59043, "epoch": 496, "lr": 7.308486404192288e-06} +{"train_loss": 0.0003633601008914411, "global_step": 59044, "epoch": 496, "lr": 7.307333159236712e-06} +{"train_loss": 0.0004572091274894774, "global_step": 59045, "epoch": 496, "lr": 7.3061799981036236e-06} +{"train_loss": 0.0005107716424390674, "global_step": 59046, "epoch": 496, "lr": 7.305026920795293e-06} +{"train_loss": 0.00040891734533943236, "global_step": 59047, "epoch": 496, "lr": 7.303873927313975e-06} +{"train_loss": 0.0003069625818170607, "global_step": 59048, "epoch": 496, "lr": 7.302721017661951e-06} +{"train_loss": 0.00024344108533114195, "global_step": 59049, "epoch": 496, "lr": 7.301568191841457e-06} +{"train_loss": 0.0003316009242553264, "global_step": 59050, "epoch": 496, "lr": 7.300415449854786e-06} +{"train_loss": 0.00021622661733999848, "global_step": 59051, "epoch": 496, "lr": 7.299262791704187e-06} +{"train_loss": 0.0003183209919370711, "global_step": 59052, "epoch": 496, "lr": 7.2981102173919126e-06} +{"train_loss": 0.0006037044222466648, "global_step": 59053, "epoch": 496, "lr": 7.29695772692025e-06} +{"train_loss": 0.0005205448251217604, "global_step": 59054, "epoch": 496, "lr": 7.295805320291432e-06} +{"train_loss": 0.0003737478400580585, "global_step": 59055, "epoch": 496, "lr": 7.294652997507756e-06} +{"train_loss": 0.0004045853565912694, "global_step": 59056, "epoch": 496, "lr": 7.2935007585714534e-06} +{"train_loss": 0.0005879302625544369, "global_step": 59057, "epoch": 496, "lr": 7.292348603484805e-06} +{"train_loss": 0.00021985081548336893, "global_step": 59058, "epoch": 496, "lr": 7.2911965322500715e-06} +{"train_loss": 0.0003069759695790708, "global_step": 59059, "epoch": 496, "lr": 7.290044544869501e-06} +{"train_loss": 0.00034635505289770663, "global_step": 59060, "epoch": 496, "lr": 7.288892641345374e-06} +{"train_loss": 0.0002564538735896349, "global_step": 59061, "epoch": 496, "lr": 7.287740821679934e-06} +{"train_loss": 0.00018962153990287334, "global_step": 59062, "epoch": 496, "lr": 7.286589085875462e-06} +{"train_loss": 0.0003739396051969379, "global_step": 59063, "epoch": 496, "lr": 7.285437433934212e-06} +{"train_loss": 0.0006274755578488111, "global_step": 59064, "epoch": 496, "lr": 7.284285865858425e-06} +{"train_loss": 0.0005307397223077714, "global_step": 59065, "epoch": 496, "lr": 7.2831343816503975e-06} +{"train_loss": 0.00042418233351781964, "global_step": 59066, "epoch": 496, "lr": 7.281982981312358e-06} +{"train_loss": 0.00029625731986016035, "global_step": 59067, "epoch": 496, "lr": 7.280831664846588e-06} +{"train_loss": 0.0006350179901346564, "global_step": 59068, "epoch": 496, "lr": 7.279680432255331e-06} +{"train_loss": 0.00028105342062190175, "global_step": 59069, "epoch": 496, "lr": 7.278529283540875e-06} +{"train_loss": 0.0009094728739000857, "global_step": 59070, "epoch": 496, "lr": 7.277378218705444e-06} +{"train_loss": 0.0004977613571099937, "global_step": 59071, "epoch": 496, "lr": 7.276227237751332e-06} +{"train_loss": 0.0003595939197111875, "global_step": 59072, "epoch": 496, "lr": 7.275076340680775e-06} +{"train_loss": 0.00028282630955800414, "global_step": 59073, "epoch": 496, "lr": 7.273925527496045e-06} +{"train_loss": 0.00022192500182427466, "global_step": 59074, "epoch": 496, "lr": 7.2727747981993944e-06} +{"train_loss": 0.0007044545491226017, "global_step": 59075, "epoch": 496, "lr": 7.271624152793094e-06} +{"train_loss": 0.0011310247937217355, "global_step": 59076, "epoch": 496, "lr": 7.270473591279381e-06} +{"train_loss": 0.00027859609690494835, "global_step": 59077, "epoch": 496, "lr": 7.269323113660542e-06} +{"train_loss": 0.0005167518393136561, "global_step": 59078, "epoch": 496, "lr": 7.26817271993881e-06} +{"train_loss": 0.000258820247836411, "global_step": 59079, "epoch": 496, "lr": 7.267022410116464e-06} +{"train_loss": 0.0006034616380929947, "global_step": 59080, "epoch": 496, "lr": 7.2658721841957435e-06} +{"train_loss": 0.0005815013428218663, "global_step": 59081, "epoch": 496, "lr": 7.264722042178934e-06} +{"train_loss": 0.0005703022470697761, "global_step": 59082, "epoch": 496, "lr": 7.263571984068274e-06} +{"train_loss": 0.0004234636726323515, "global_step": 59083, "epoch": 496, "lr": 7.26242200986601e-06} +{"train_loss": 0.00038432038854807615, "global_step": 59084, "epoch": 496, "lr": 7.26127211957443e-06} +{"train_loss": 0.0005995050305500627, "global_step": 59085, "epoch": 496, "lr": 7.2601223131957604e-06} +{"train_loss": 0.00040671901660971344, "global_step": 59086, "epoch": 496, "lr": 7.258972590732294e-06} +{"train_loss": 0.0004355821292847395, "global_step": 59087, "epoch": 496, "lr": 7.2578229521862494e-06} +{"train_loss": 0.0005091548664495349, "global_step": 59088, "epoch": 496, "lr": 7.256673397559921e-06} +{"train_loss": 0.00031441019382327795, "global_step": 59089, "epoch": 496, "lr": 7.255523926855546e-06} +{"train_loss": 0.00033147158683277667, "global_step": 59090, "epoch": 496, "lr": 7.254374540075365e-06} +{"train_loss": 0.0003732048498932272, "global_step": 59091, "epoch": 496, "lr": 7.253225237221672e-06} +{"train_loss": 0.0003492050454951823, "global_step": 59092, "epoch": 496, "lr": 7.252076018296688e-06} +{"train_loss": 0.00022809200163464993, "global_step": 59093, "epoch": 496, "lr": 7.2509268833027055e-06} +{"train_loss": 0.0007000793120823801, "global_step": 59094, "epoch": 496, "lr": 7.2497778322419555e-06} +{"train_loss": 0.00046238460345193744, "global_step": 59095, "epoch": 496, "lr": 7.248628865116686e-06} +{"train_loss": 0.0003342141571920365, "global_step": 59096, "epoch": 496, "lr": 7.247479981929178e-06} +{"train_loss": 0.000416175345890224, "global_step": 59097, "epoch": 496, "lr": 7.24633118268167e-06} +{"train_loss": 0.0004981224774383008, "global_step": 59098, "epoch": 496, "lr": 7.245182467376427e-06} +{"train_loss": 0.0004659424303099513, "global_step": 59099, "epoch": 496, "lr": 7.2440338360156955e-06} +{"train_loss": 0.0008394325850531459, "global_step": 59100, "epoch": 496, "lr": 7.242885288601742e-06} +{"train_loss": 0.0003475888224784285, "global_step": 59101, "epoch": 496, "lr": 7.241736825136808e-06} +{"train_loss": 0.00042261710041202605, "global_step": 59102, "epoch": 496, "lr": 7.240588445623164e-06} +{"train_loss": 0.0005263859638944268, "global_step": 59103, "epoch": 496, "lr": 7.239440150063048e-06} +{"train_loss": 0.0011223920155316591, "global_step": 59104, "epoch": 496, "lr": 7.238291938458735e-06} +{"train_loss": 0.0002508058096282184, "global_step": 59105, "epoch": 496, "lr": 7.237143810812452e-06} +{"train_loss": 0.0002837228530552238, "global_step": 59106, "epoch": 496, "lr": 7.23599576712648e-06} +{"train_loss": 0.00039862230187281966, "global_step": 59107, "epoch": 496, "lr": 7.234847807403056e-06} +{"train_loss": 0.00021101997117511928, "global_step": 59108, "epoch": 496, "lr": 7.233699931644444e-06} +{"train_loss": 0.0008022409747354686, "global_step": 59109, "epoch": 496, "lr": 7.232552139852889e-06} +{"train_loss": 0.0007317374693229795, "global_step": 59110, "epoch": 496, "lr": 7.231404432030653e-06} +{"train_loss": 0.0007158966618590057, "global_step": 59111, "epoch": 496, "lr": 7.23025680817998e-06} +{"train_loss": 0.0003162407665513456, "global_step": 59112, "epoch": 496, "lr": 7.229109268303135e-06} +{"train_loss": 0.000420455849962309, "global_step": 59113, "epoch": 496, "lr": 7.227961812402367e-06} +{"train_loss": 0.0002860984532162547, "global_step": 59114, "epoch": 496, "lr": 7.226814440479912e-06} +{"train_loss": 0.0003751889744307846, "global_step": 59115, "epoch": 496, "lr": 7.225667152538052e-06} +{"train_loss": 0.0002698157331906259, "global_step": 59116, "epoch": 496, "lr": 7.224519948579011e-06} +{"train_loss": 0.0001896817411761731, "global_step": 59117, "epoch": 496, "lr": 7.223372828605068e-06} +{"train_loss": 0.0004065360117238015, "global_step": 59118, "epoch": 496, "lr": 7.222225792618453e-06} +{"train_loss": 0.000347029825206846, "global_step": 59119, "epoch": 496, "lr": 7.221078840621437e-06} +{"train_loss": 0.000225370517000556, "global_step": 59120, "epoch": 496, "lr": 7.219931972616262e-06} +{"train_loss": 0.000464266020571813, "global_step": 59121, "epoch": 496, "lr": 7.218785188605171e-06} +{"train_loss": 0.00043416174594312906, "global_step": 59122, "epoch": 496, "lr": 7.217638488590434e-06} +{"train_loss": 0.00043339471449144185, "global_step": 59123, "epoch": 496, "lr": 7.216491872574283e-06} +{"train_loss": 0.0004636694211512804, "global_step": 59124, "epoch": 496, "lr": 7.215345340558993e-06} +{"train_loss": 0.00019074442388955504, "global_step": 59125, "epoch": 496, "lr": 7.214198892546797e-06} +{"train_loss": 0.00040297332452610135, "global_step": 59126, "epoch": 496, "lr": 7.213052528539943e-06} +{"train_loss": 0.0003944171767216176, "global_step": 59127, "epoch": 496, "lr": 7.211906248540695e-06} +{"train_loss": 0.00046081264736130834, "global_step": 59128, "epoch": 496, "lr": 7.2107600525512905e-06} +{"train_loss": 0.00048414425691589713, "global_step": 59129, "epoch": 496, "lr": 7.209613940574e-06} +{"train_loss": 0.00044979623635299504, "global_step": 59130, "epoch": 496, "lr": 7.208467912611045e-06} +{"train_loss": 0.0003602711367420852, "global_step": 59131, "epoch": 496, "lr": 7.20732196866471e-06} +{"train_loss": 0.00040201173396781087, "global_step": 59132, "epoch": 496, "lr": 7.206176108737217e-06} +{"train_loss": 0.0005025891587138176, "global_step": 59133, "epoch": 496, "lr": 7.20503033283082e-06} +{"train_loss": 0.0005587089108303189, "global_step": 59134, "epoch": 496, "lr": 7.203884640947789e-06} +{"train_loss": 0.00029272399842739105, "global_step": 59135, "epoch": 496, "lr": 7.202739033090339e-06} +{"train_loss": 0.00046838363050483167, "global_step": 59136, "epoch": 496, "lr": 7.201593509260745e-06} +{"train_loss": 0.00028551596915349364, "global_step": 59137, "epoch": 496, "lr": 7.200448069461257e-06} +{"train_loss": 0.0005094512598589063, "global_step": 59138, "epoch": 496, "lr": 7.199302713694106e-06} +{"train_loss": 0.0004238926339894533, "global_step": 59139, "epoch": 496, "lr": 7.198157441961567e-06} +{"train_loss": 0.0004120568046346307, "global_step": 59140, "epoch": 496, "lr": 7.197012254265856e-06} +{"train_loss": 0.000723223784007132, "global_step": 59141, "epoch": 496, "lr": 7.1958671506092535e-06} +{"train_loss": 0.0004360543984866959, "global_step": 59142, "epoch": 496, "lr": 7.194722130993981e-06, "val_loss": 0.025385763496160507} +{"train_loss": 0.00045221546315588057, "global_step": 59143, "epoch": 497, "lr": 7.193577195422313e-06} +{"train_loss": 0.0008535108645446599, "global_step": 59144, "epoch": 497, "lr": 7.192432343896477e-06} +{"train_loss": 0.00032649573404341936, "global_step": 59145, "epoch": 497, "lr": 7.1912875764187205e-06} +{"train_loss": 0.00030063159647397697, "global_step": 59146, "epoch": 497, "lr": 7.190142892991303e-06} +{"train_loss": 0.0003558161261025816, "global_step": 59147, "epoch": 497, "lr": 7.188998293616461e-06} +{"train_loss": 0.0004147286235820502, "global_step": 59148, "epoch": 497, "lr": 7.187853778296455e-06} +{"train_loss": 0.0007428879616782069, "global_step": 59149, "epoch": 497, "lr": 7.186709347033516e-06} +{"train_loss": 0.0002863015979528427, "global_step": 59150, "epoch": 497, "lr": 7.185564999829908e-06} +{"train_loss": 0.0004794624401256442, "global_step": 59151, "epoch": 497, "lr": 7.184420736687869e-06} +{"train_loss": 0.0003538693708833307, "global_step": 59152, "epoch": 497, "lr": 7.183276557609631e-06} +{"train_loss": 0.0005296366289258003, "global_step": 59153, "epoch": 497, "lr": 7.182132462597474e-06} +{"train_loss": 0.00034487174707464874, "global_step": 59154, "epoch": 497, "lr": 7.180988451653609e-06} +{"train_loss": 0.000433346867794171, "global_step": 59155, "epoch": 497, "lr": 7.17984452478031e-06} +{"train_loss": 0.0004488483536988497, "global_step": 59156, "epoch": 497, "lr": 7.178700681979805e-06} +{"train_loss": 0.00022827069915365428, "global_step": 59157, "epoch": 497, "lr": 7.177556923254352e-06} +{"train_loss": 0.000296327838441357, "global_step": 59158, "epoch": 497, "lr": 7.1764132486061954e-06} +{"train_loss": 0.0006152509013190866, "global_step": 59159, "epoch": 497, "lr": 7.175269658037565e-06} +{"train_loss": 0.0003985508228652179, "global_step": 59160, "epoch": 497, "lr": 7.174126151550725e-06} +{"train_loss": 0.00028942213975824416, "global_step": 59161, "epoch": 497, "lr": 7.172982729147903e-06} +{"train_loss": 0.00030865296139381826, "global_step": 59162, "epoch": 497, "lr": 7.171839390831364e-06} +{"train_loss": 0.0004573978076223284, "global_step": 59163, "epoch": 497, "lr": 7.17069613660335e-06} +{"train_loss": 0.0001812832779251039, "global_step": 59164, "epoch": 497, "lr": 7.169552966466081e-06} +{"train_loss": 0.0003429149801377207, "global_step": 59165, "epoch": 497, "lr": 7.1684098804218284e-06} +{"train_loss": 0.0004807853256352246, "global_step": 59166, "epoch": 497, "lr": 7.1672668784728226e-06} +{"train_loss": 0.0002930732152890414, "global_step": 59167, "epoch": 497, "lr": 7.1661239606213185e-06} +{"train_loss": 0.00025750260101631284, "global_step": 59168, "epoch": 497, "lr": 7.164981126869541e-06} +{"train_loss": 0.0006737950025126338, "global_step": 59169, "epoch": 497, "lr": 7.1638383772197615e-06} +{"train_loss": 0.00030037376563996077, "global_step": 59170, "epoch": 497, "lr": 7.1626957116741995e-06} +{"train_loss": 0.00048763820086605847, "global_step": 59171, "epoch": 497, "lr": 7.161553130235104e-06} +{"train_loss": 0.00040660606464371085, "global_step": 59172, "epoch": 497, "lr": 7.160410632904735e-06} +{"train_loss": 0.0005970174679532647, "global_step": 59173, "epoch": 497, "lr": 7.159268219685311e-06} +{"train_loss": 0.0004440431948751211, "global_step": 59174, "epoch": 497, "lr": 7.1581258905791035e-06} +{"train_loss": 0.0008364081149920821, "global_step": 59175, "epoch": 497, "lr": 7.156983645588322e-06} +{"train_loss": 0.0002087484608637169, "global_step": 59176, "epoch": 497, "lr": 7.155841484715237e-06} +{"train_loss": 0.0003743410634342581, "global_step": 59177, "epoch": 497, "lr": 7.154699407962084e-06} +{"train_loss": 0.00045999910798855126, "global_step": 59178, "epoch": 497, "lr": 7.1535574153310855e-06} +{"train_loss": 0.0005918003153055906, "global_step": 59179, "epoch": 497, "lr": 7.152415506824517e-06} +{"train_loss": 0.00033484792220406234, "global_step": 59180, "epoch": 497, "lr": 7.151273682444587e-06} +{"train_loss": 0.0006110642571002245, "global_step": 59181, "epoch": 497, "lr": 7.150131942193566e-06} +{"train_loss": 0.00034721012343652546, "global_step": 59182, "epoch": 497, "lr": 7.148990286073681e-06} +{"train_loss": 0.0005469007301144302, "global_step": 59183, "epoch": 497, "lr": 7.147848714087163e-06} +{"train_loss": 0.00035743883927352726, "global_step": 59184, "epoch": 497, "lr": 7.146707226236282e-06} +{"train_loss": 0.00037655115011148155, "global_step": 59185, "epoch": 497, "lr": 7.1455658225232535e-06} +{"train_loss": 0.0002665486535988748, "global_step": 59186, "epoch": 497, "lr": 7.144424502950336e-06} +{"train_loss": 0.0006051514646969736, "global_step": 59187, "epoch": 497, "lr": 7.1432832675197515e-06} +{"train_loss": 0.00030219342443160713, "global_step": 59188, "epoch": 497, "lr": 7.142142116233763e-06} +{"train_loss": 0.0006915867561474442, "global_step": 59189, "epoch": 497, "lr": 7.141001049094598e-06} +{"train_loss": 0.00030239243642427027, "global_step": 59190, "epoch": 497, "lr": 7.139860066104486e-06} +{"train_loss": 0.0006320684333331883, "global_step": 59191, "epoch": 497, "lr": 7.138719167265695e-06} +{"train_loss": 0.0005170992226339877, "global_step": 59192, "epoch": 497, "lr": 7.137578352580437e-06} +{"train_loss": 0.00044954847544431686, "global_step": 59193, "epoch": 497, "lr": 7.136437622050979e-06} +{"train_loss": 0.00023495001369155943, "global_step": 59194, "epoch": 497, "lr": 7.135296975679545e-06} +{"train_loss": 0.0006604532827623188, "global_step": 59195, "epoch": 497, "lr": 7.134156413468362e-06} +{"train_loss": 0.0002916076919063926, "global_step": 59196, "epoch": 497, "lr": 7.1330159354196955e-06} +{"train_loss": 0.000602369022089988, "global_step": 59197, "epoch": 497, "lr": 7.131875541535765e-06} +{"train_loss": 0.0004859548935201019, "global_step": 59198, "epoch": 497, "lr": 7.130735231818825e-06} +{"train_loss": 0.0006356352241709828, "global_step": 59199, "epoch": 497, "lr": 7.129595006271095e-06} +{"train_loss": 0.0006057868013158441, "global_step": 59200, "epoch": 497, "lr": 7.128454864894835e-06} +{"train_loss": 0.00044031054130755365, "global_step": 59201, "epoch": 497, "lr": 7.127314807692264e-06} +{"train_loss": 0.0006326481234282255, "global_step": 59202, "epoch": 497, "lr": 7.126174834665645e-06} +{"train_loss": 0.00032331375405192375, "global_step": 59203, "epoch": 497, "lr": 7.125034945817188e-06} +{"train_loss": 0.00043895337148569524, "global_step": 59204, "epoch": 497, "lr": 7.123895141149156e-06} +{"train_loss": 0.0010228686733171344, "global_step": 59205, "epoch": 497, "lr": 7.122755420663762e-06} +{"train_loss": 0.00048688420793041587, "global_step": 59206, "epoch": 497, "lr": 7.121615784363267e-06} +{"train_loss": 0.000736975867766887, "global_step": 59207, "epoch": 497, "lr": 7.12047623224989e-06} +{"train_loss": 0.0006850158097222447, "global_step": 59208, "epoch": 497, "lr": 7.119336764325885e-06} +{"train_loss": 0.0002830829471349716, "global_step": 59209, "epoch": 497, "lr": 7.118197380593472e-06} +{"train_loss": 0.0008117395918816328, "global_step": 59210, "epoch": 497, "lr": 7.117058081054911e-06} +{"train_loss": 0.00033550491207279265, "global_step": 59211, "epoch": 497, "lr": 7.115918865712412e-06} +{"train_loss": 0.0004037625330965966, "global_step": 59212, "epoch": 497, "lr": 7.114779734568233e-06} +{"train_loss": 0.000753785774577409, "global_step": 59213, "epoch": 497, "lr": 7.113640687624606e-06} +{"train_loss": 0.0004875477752648294, "global_step": 59214, "epoch": 497, "lr": 7.112501724883752e-06} +{"train_loss": 0.0005849211593158543, "global_step": 59215, "epoch": 497, "lr": 7.11136284634793e-06} +{"train_loss": 0.0005633424152620137, "global_step": 59216, "epoch": 497, "lr": 7.110224052019354e-06} +{"train_loss": 0.0004646883753594011, "global_step": 59217, "epoch": 497, "lr": 7.1090853419002846e-06} +{"train_loss": 0.0003005475737154484, "global_step": 59218, "epoch": 497, "lr": 7.1079467159929245e-06} +{"train_loss": 0.0006874307873658836, "global_step": 59219, "epoch": 497, "lr": 7.10680817429955e-06} +{"train_loss": 0.0004516044573392719, "global_step": 59220, "epoch": 497, "lr": 7.105669716822366e-06} +{"train_loss": 0.0006113079725764692, "global_step": 59221, "epoch": 497, "lr": 7.104531343563614e-06} +{"train_loss": 0.00038123835111036897, "global_step": 59222, "epoch": 497, "lr": 7.1033930545255366e-06} +{"train_loss": 0.0009225485846400261, "global_step": 59223, "epoch": 497, "lr": 7.1022548497103605e-06} +{"train_loss": 0.0005281557678245008, "global_step": 59224, "epoch": 497, "lr": 7.1011167291203275e-06} +{"train_loss": 0.00048716095625422895, "global_step": 59225, "epoch": 497, "lr": 7.099978692757658e-06} +{"train_loss": 0.0005354612949304283, "global_step": 59226, "epoch": 497, "lr": 7.098840740624613e-06} +{"train_loss": 0.00034966127714142203, "global_step": 59227, "epoch": 497, "lr": 7.097702872723411e-06} +{"train_loss": 0.000588390335906297, "global_step": 59228, "epoch": 497, "lr": 7.096565089056273e-06} +{"train_loss": 0.0004421884659677744, "global_step": 59229, "epoch": 497, "lr": 7.095427389625453e-06} +{"train_loss": 0.0005913365166634321, "global_step": 59230, "epoch": 497, "lr": 7.094289774433171e-06} +{"train_loss": 0.0004893715376965702, "global_step": 59231, "epoch": 497, "lr": 7.093152243481677e-06} +{"train_loss": 0.0007736568222753704, "global_step": 59232, "epoch": 497, "lr": 7.0920147967731945e-06} +{"train_loss": 0.0002720977645367384, "global_step": 59233, "epoch": 497, "lr": 7.090877434309951e-06} +{"train_loss": 0.0003994965518359095, "global_step": 59234, "epoch": 497, "lr": 7.089740156094177e-06} +{"train_loss": 0.0004484547534957528, "global_step": 59235, "epoch": 497, "lr": 7.088602962128132e-06} +{"train_loss": 0.00030611883266828954, "global_step": 59236, "epoch": 497, "lr": 7.087465852414016e-06} +{"train_loss": 0.00027334317564964294, "global_step": 59237, "epoch": 497, "lr": 7.0863288269540865e-06} +{"train_loss": 0.00035049751750193536, "global_step": 59238, "epoch": 497, "lr": 7.085191885750558e-06} +{"train_loss": 0.0003562791971489787, "global_step": 59239, "epoch": 497, "lr": 7.084055028805675e-06} +{"train_loss": 0.0003057712165173143, "global_step": 59240, "epoch": 497, "lr": 7.0829182561216624e-06} +{"train_loss": 0.00033158290898427367, "global_step": 59241, "epoch": 497, "lr": 7.0817815677007625e-06} +{"train_loss": 0.0004738940915558487, "global_step": 59242, "epoch": 497, "lr": 7.080644963545185e-06} +{"train_loss": 0.0004706906620413065, "global_step": 59243, "epoch": 497, "lr": 7.07950844365719e-06} +{"train_loss": 0.0007423167699016631, "global_step": 59244, "epoch": 497, "lr": 7.078372008038997e-06} +{"train_loss": 0.000498804438393563, "global_step": 59245, "epoch": 497, "lr": 7.077235656692821e-06} +{"train_loss": 0.000697959796525538, "global_step": 59246, "epoch": 497, "lr": 7.076099389620916e-06} +{"train_loss": 0.0004107855202164501, "global_step": 59247, "epoch": 497, "lr": 7.074963206825497e-06} +{"train_loss": 0.00040215946501120925, "global_step": 59248, "epoch": 497, "lr": 7.073827108308812e-06} +{"train_loss": 0.0003632523294072598, "global_step": 59249, "epoch": 497, "lr": 7.0726910940730695e-06} +{"train_loss": 0.0006062111933715641, "global_step": 59250, "epoch": 497, "lr": 7.071555164120525e-06} +{"train_loss": 0.0007368370424956083, "global_step": 59251, "epoch": 497, "lr": 7.070419318453391e-06} +{"train_loss": 0.00032469897996634245, "global_step": 59252, "epoch": 497, "lr": 7.069283557073897e-06} +{"train_loss": 0.0005491044721566141, "global_step": 59253, "epoch": 497, "lr": 7.0681478799842886e-06} +{"train_loss": 0.0006561411428265274, "global_step": 59254, "epoch": 497, "lr": 7.0670122871867695e-06} +{"train_loss": 0.0002365594991715625, "global_step": 59255, "epoch": 497, "lr": 7.0658767786836e-06} +{"train_loss": 0.00041004904778674245, "global_step": 59256, "epoch": 497, "lr": 7.064741354476984e-06} +{"train_loss": 0.0003288228763267398, "global_step": 59257, "epoch": 497, "lr": 7.0636060145691685e-06} +{"train_loss": 0.000686985848005861, "global_step": 59258, "epoch": 497, "lr": 7.062470758962381e-06} +{"train_loss": 0.0003462388995103538, "global_step": 59259, "epoch": 497, "lr": 7.061335587658829e-06} +{"train_loss": 0.00036758638452738523, "global_step": 59260, "epoch": 497, "lr": 7.060200500660768e-06} +{"train_loss": 0.0004733850815804957, "global_step": 59261, "epoch": 497, "lr": 7.059065497970407e-06, "val_loss": 0.031218741089105606} +{"train_loss": 0.0004577577637974173, "global_step": 59262, "epoch": 498, "lr": 7.05793057959e-06} +{"train_loss": 0.0005908318562433124, "global_step": 59263, "epoch": 498, "lr": 7.0567957455217495e-06} +{"train_loss": 0.0003326458972878754, "global_step": 59264, "epoch": 498, "lr": 7.055660995767888e-06} +{"train_loss": 0.00035565922735258937, "global_step": 59265, "epoch": 498, "lr": 7.0545263303306575e-06} +{"train_loss": 0.00046390952775254846, "global_step": 59266, "epoch": 498, "lr": 7.053391749212263e-06} +{"train_loss": 0.0006290232995525002, "global_step": 59267, "epoch": 498, "lr": 7.052257252414957e-06} +{"train_loss": 0.000363740575267002, "global_step": 59268, "epoch": 498, "lr": 7.051122839940943e-06} +{"train_loss": 0.0002954843803308904, "global_step": 59269, "epoch": 498, "lr": 7.049988511792466e-06} +{"train_loss": 0.0003853565431199968, "global_step": 59270, "epoch": 498, "lr": 7.048854267971755e-06} +{"train_loss": 0.00046208922867663205, "global_step": 59271, "epoch": 498, "lr": 7.047720108481021e-06} +{"train_loss": 0.0004113978357054293, "global_step": 59272, "epoch": 498, "lr": 7.046586033322511e-06} +{"train_loss": 0.00024803096312098205, "global_step": 59273, "epoch": 498, "lr": 7.04545204249843e-06} +{"train_loss": 0.0008784107631072402, "global_step": 59274, "epoch": 498, "lr": 7.044318136011024e-06} +{"train_loss": 0.0003522111801430583, "global_step": 59275, "epoch": 498, "lr": 7.0431843138625e-06} +{"train_loss": 0.0004536328779067844, "global_step": 59276, "epoch": 498, "lr": 7.042050576055109e-06} +{"train_loss": 0.0003569525433704257, "global_step": 59277, "epoch": 498, "lr": 7.040916922591056e-06} +{"train_loss": 0.00038354838034138083, "global_step": 59278, "epoch": 498, "lr": 7.039783353472567e-06} +{"train_loss": 0.0004759809235110879, "global_step": 59279, "epoch": 498, "lr": 7.03864986870188e-06} +{"train_loss": 0.00041203966247849166, "global_step": 59280, "epoch": 498, "lr": 7.037516468281208e-06} +{"train_loss": 0.0006384543958120048, "global_step": 59281, "epoch": 498, "lr": 7.036383152212789e-06} +{"train_loss": 0.00038794553256593645, "global_step": 59282, "epoch": 498, "lr": 7.035249920498843e-06} +{"train_loss": 0.0006690702284686267, "global_step": 59283, "epoch": 498, "lr": 7.034116773141586e-06} +{"train_loss": 0.0006986100925132632, "global_step": 59284, "epoch": 498, "lr": 7.032983710143259e-06} +{"train_loss": 0.0005208460497669876, "global_step": 59285, "epoch": 498, "lr": 7.031850731506068e-06} +{"train_loss": 0.0004216264351271093, "global_step": 59286, "epoch": 498, "lr": 7.0307178372322595e-06} +{"train_loss": 0.0010463662911206484, "global_step": 59287, "epoch": 498, "lr": 7.029585027324031e-06} +{"train_loss": 0.0002736249880399555, "global_step": 59288, "epoch": 498, "lr": 7.028452301783634e-06} +{"train_loss": 0.0008991089416667819, "global_step": 59289, "epoch": 498, "lr": 7.027319660613285e-06} +{"train_loss": 0.0004467789549380541, "global_step": 59290, "epoch": 498, "lr": 7.026187103815185e-06} +{"train_loss": 0.000370035064406693, "global_step": 59291, "epoch": 498, "lr": 7.025054631391592e-06} +{"train_loss": 0.00031548060360364616, "global_step": 59292, "epoch": 498, "lr": 7.023922243344699e-06} +{"train_loss": 0.00037497602170333266, "global_step": 59293, "epoch": 498, "lr": 7.022789939676755e-06} +{"train_loss": 0.0006171324057504535, "global_step": 59294, "epoch": 498, "lr": 7.021657720389957e-06} +{"train_loss": 0.0007390317623503506, "global_step": 59295, "epoch": 498, "lr": 7.020525585486559e-06} +{"train_loss": 0.0011335571762174368, "global_step": 59296, "epoch": 498, "lr": 7.019393534968766e-06} +{"train_loss": 0.0005481961998157203, "global_step": 59297, "epoch": 498, "lr": 7.018261568838791e-06} +{"train_loss": 0.00025022507179528475, "global_step": 59298, "epoch": 498, "lr": 7.0171296870988775e-06} +{"train_loss": 0.00046481634490191936, "global_step": 59299, "epoch": 498, "lr": 7.015997889751225e-06} +{"train_loss": 0.000485622207634151, "global_step": 59300, "epoch": 498, "lr": 7.014866176798079e-06} +{"train_loss": 0.0004720124416053295, "global_step": 59301, "epoch": 498, "lr": 7.0137345482416465e-06} +{"train_loss": 0.00048289255937561393, "global_step": 59302, "epoch": 498, "lr": 7.012603004084162e-06} +{"train_loss": 0.0004948130226694047, "global_step": 59303, "epoch": 498, "lr": 7.0114715443278244e-06} +{"train_loss": 0.0004777772701345384, "global_step": 59304, "epoch": 498, "lr": 7.010340168974872e-06} +{"train_loss": 0.0002002015826292336, "global_step": 59305, "epoch": 498, "lr": 7.0092088780275345e-06} +{"train_loss": 0.0003113067359663546, "global_step": 59306, "epoch": 498, "lr": 7.008077671488011e-06} +{"train_loss": 0.0005811959854327142, "global_step": 59307, "epoch": 498, "lr": 7.006946549358545e-06} +{"train_loss": 0.0004070737340953201, "global_step": 59308, "epoch": 498, "lr": 7.0058155116413504e-06} +{"train_loss": 0.0002708591637201607, "global_step": 59309, "epoch": 498, "lr": 7.004684558338631e-06} +{"train_loss": 0.00039790512528270483, "global_step": 59310, "epoch": 498, "lr": 7.00355368945263e-06} +{"train_loss": 0.0012500176671892405, "global_step": 59311, "epoch": 498, "lr": 7.002422904985545e-06} +{"train_loss": 0.00027751154266297817, "global_step": 59312, "epoch": 498, "lr": 7.001292204939625e-06} +{"train_loss": 0.00044847774552181363, "global_step": 59313, "epoch": 498, "lr": 7.000161589317067e-06} +{"train_loss": 0.00048298912588506937, "global_step": 59314, "epoch": 498, "lr": 6.999031058120092e-06} +{"train_loss": 0.00028974804445169866, "global_step": 59315, "epoch": 498, "lr": 6.997900611350933e-06} +{"train_loss": 0.000366402295185253, "global_step": 59316, "epoch": 498, "lr": 6.996770249011797e-06} +{"train_loss": 0.0003300276293884963, "global_step": 59317, "epoch": 498, "lr": 6.995639971104912e-06} +{"train_loss": 0.0004594161291606724, "global_step": 59318, "epoch": 498, "lr": 6.994509777632485e-06} +{"train_loss": 0.0006009139469824731, "global_step": 59319, "epoch": 498, "lr": 6.993379668596755e-06} +{"train_loss": 0.00044382992200553417, "global_step": 59320, "epoch": 498, "lr": 6.992249643999932e-06} +{"train_loss": 0.0002593676035758108, "global_step": 59321, "epoch": 498, "lr": 6.991119703844218e-06} +{"train_loss": 0.0003803772560786456, "global_step": 59322, "epoch": 498, "lr": 6.9899898481318614e-06} +{"train_loss": 0.00044055189937353134, "global_step": 59323, "epoch": 498, "lr": 6.98886007686505e-06} +{"train_loss": 0.0005810066359117627, "global_step": 59324, "epoch": 498, "lr": 6.9877303900460264e-06} +{"train_loss": 0.0003313959459774196, "global_step": 59325, "epoch": 498, "lr": 6.986600787676989e-06} +{"train_loss": 0.0005403967807069421, "global_step": 59326, "epoch": 498, "lr": 6.98547126976018e-06} +{"train_loss": 0.00047971069579944015, "global_step": 59327, "epoch": 498, "lr": 6.984341836297797e-06} +{"train_loss": 0.0005100855487398803, "global_step": 59328, "epoch": 498, "lr": 6.9832124872920565e-06} +{"train_loss": 0.00042392549221403897, "global_step": 59329, "epoch": 498, "lr": 6.982083222745195e-06} +{"train_loss": 0.0001898063492262736, "global_step": 59330, "epoch": 498, "lr": 6.980954042659405e-06} +{"train_loss": 0.0004938651109114289, "global_step": 59331, "epoch": 498, "lr": 6.979824947036923e-06} +{"train_loss": 0.0005152460071258247, "global_step": 59332, "epoch": 498, "lr": 6.978695935879948e-06} +{"train_loss": 0.00023727279040031135, "global_step": 59333, "epoch": 498, "lr": 6.977567009190722e-06} +{"train_loss": 0.000752644264139235, "global_step": 59334, "epoch": 498, "lr": 6.976438166971433e-06} +{"train_loss": 0.0006693190080113709, "global_step": 59335, "epoch": 498, "lr": 6.975309409224329e-06} +{"train_loss": 0.0005268949898891151, "global_step": 59336, "epoch": 498, "lr": 6.974180735951591e-06} +{"train_loss": 0.0005024989368394017, "global_step": 59337, "epoch": 498, "lr": 6.973052147155462e-06} +{"train_loss": 0.00040616357000544667, "global_step": 59338, "epoch": 498, "lr": 6.971923642838141e-06} +{"train_loss": 0.00044503144454210997, "global_step": 59339, "epoch": 498, "lr": 6.970795223001864e-06} +{"train_loss": 0.0002888895687647164, "global_step": 59340, "epoch": 498, "lr": 6.969666887648818e-06} +{"train_loss": 0.000215584208490327, "global_step": 59341, "epoch": 498, "lr": 6.968538636781247e-06} +{"train_loss": 0.0004489741113502532, "global_step": 59342, "epoch": 498, "lr": 6.9674104704013425e-06} +{"train_loss": 0.00033100825385190547, "global_step": 59343, "epoch": 498, "lr": 6.966282388511342e-06} +{"train_loss": 0.0004917420446872711, "global_step": 59344, "epoch": 498, "lr": 6.965154391113432e-06} +{"train_loss": 0.00033754660398699343, "global_step": 59345, "epoch": 498, "lr": 6.964026478209862e-06} +{"train_loss": 0.0003709231677930802, "global_step": 59346, "epoch": 498, "lr": 6.962898649802823e-06} +{"train_loss": 0.00042440748075023293, "global_step": 59347, "epoch": 498, "lr": 6.961770905894527e-06} +{"train_loss": 0.0005293876165524125, "global_step": 59348, "epoch": 498, "lr": 6.960643246487203e-06} +{"train_loss": 0.00044047864503227174, "global_step": 59349, "epoch": 498, "lr": 6.95951567158305e-06} +{"train_loss": 0.0002922579587902874, "global_step": 59350, "epoch": 498, "lr": 6.9583881811842995e-06} +{"train_loss": 0.0006890845252200961, "global_step": 59351, "epoch": 498, "lr": 6.957260775293156e-06} +{"train_loss": 0.00048818395589478314, "global_step": 59352, "epoch": 498, "lr": 6.956133453911823e-06} +{"train_loss": 0.0003725712886080146, "global_step": 59353, "epoch": 498, "lr": 6.955006217042537e-06} +{"train_loss": 0.00024604465579614043, "global_step": 59354, "epoch": 498, "lr": 6.95387906468748e-06} +{"train_loss": 0.00041878194315358996, "global_step": 59355, "epoch": 498, "lr": 6.9527519968488995e-06} +{"train_loss": 0.0005241318140178919, "global_step": 59356, "epoch": 498, "lr": 6.9516250135289726e-06} +{"train_loss": 0.00023881492961663753, "global_step": 59357, "epoch": 498, "lr": 6.950498114729947e-06} +{"train_loss": 0.0006737372605130076, "global_step": 59358, "epoch": 498, "lr": 6.949371300454022e-06} +{"train_loss": 0.0005683198687620461, "global_step": 59359, "epoch": 498, "lr": 6.9482445707033934e-06} +{"train_loss": 0.00031004109769128263, "global_step": 59360, "epoch": 498, "lr": 6.947117925480301e-06} +{"train_loss": 0.00027422592393122613, "global_step": 59361, "epoch": 498, "lr": 6.945991364786925e-06} +{"train_loss": 0.0004510864382609725, "global_step": 59362, "epoch": 498, "lr": 6.944864888625513e-06} +{"train_loss": 0.00023890790180303156, "global_step": 59363, "epoch": 498, "lr": 6.943738496998242e-06} +{"train_loss": 0.0005760107305832207, "global_step": 59364, "epoch": 498, "lr": 6.942612189907355e-06} +{"train_loss": 0.00040848884964361787, "global_step": 59365, "epoch": 498, "lr": 6.941485967355049e-06} +{"train_loss": 0.0003342751588206738, "global_step": 59366, "epoch": 498, "lr": 6.940359829343529e-06} +{"train_loss": 0.0004280243592802435, "global_step": 59367, "epoch": 498, "lr": 6.9392337758750035e-06} +{"train_loss": 0.0002758376067504287, "global_step": 59368, "epoch": 498, "lr": 6.93810780695171e-06} +{"train_loss": 0.0006477141287177801, "global_step": 59369, "epoch": 498, "lr": 6.936981922575825e-06} +{"train_loss": 0.00021096576529089361, "global_step": 59370, "epoch": 498, "lr": 6.93585612274959e-06} +{"train_loss": 0.0007376660360023379, "global_step": 59371, "epoch": 498, "lr": 6.934730407475187e-06} +{"train_loss": 0.0003117580199614167, "global_step": 59372, "epoch": 498, "lr": 6.933604776754854e-06} +{"train_loss": 0.00042590335942804813, "global_step": 59373, "epoch": 498, "lr": 6.932479230590777e-06} +{"train_loss": 0.0007523958338424563, "global_step": 59374, "epoch": 498, "lr": 6.931353768985183e-06} +{"train_loss": 0.000469507765956223, "global_step": 59375, "epoch": 498, "lr": 6.930228391940264e-06} +{"train_loss": 0.00030696517205797136, "global_step": 59376, "epoch": 498, "lr": 6.9291030994582505e-06} +{"train_loss": 0.00033786793937906623, "global_step": 59377, "epoch": 498, "lr": 6.927977891541349e-06} +{"train_loss": 0.0003262069949414581, "global_step": 59378, "epoch": 498, "lr": 6.926852768191744e-06} +{"train_loss": 0.0007371708052232862, "global_step": 59379, "epoch": 498, "lr": 6.925727729411674e-06} +{"train_loss": 0.00045852381219997407, "global_step": 59380, "epoch": 498, "lr": 6.92460277520332e-06, "val_loss": 0.02587086707353592} +{"train_loss": 0.0003507609653752297, "global_step": 59381, "epoch": 499, "lr": 6.9234779055689254e-06} +{"train_loss": 0.00027750033768825233, "global_step": 59382, "epoch": 499, "lr": 6.922353120510677e-06} +{"train_loss": 0.0005375132313929498, "global_step": 59383, "epoch": 499, "lr": 6.921228420030773e-06} +{"train_loss": 0.0003840713179670274, "global_step": 59384, "epoch": 499, "lr": 6.92010380413145e-06} +{"train_loss": 0.0006223246455192566, "global_step": 59385, "epoch": 499, "lr": 6.918979272814885e-06} +{"train_loss": 0.00037971168057993054, "global_step": 59386, "epoch": 499, "lr": 6.917854826083314e-06} +{"train_loss": 0.0005744578666053712, "global_step": 59387, "epoch": 499, "lr": 6.916730463938925e-06} +{"train_loss": 0.0004758539726026356, "global_step": 59388, "epoch": 499, "lr": 6.9156061863839385e-06} +{"train_loss": 0.0005538174300454557, "global_step": 59389, "epoch": 499, "lr": 6.914481993420558e-06} +{"train_loss": 0.00033312832238152623, "global_step": 59390, "epoch": 499, "lr": 6.9133578850509805e-06} +{"train_loss": 0.0002354077878408134, "global_step": 59391, "epoch": 499, "lr": 6.912233861277434e-06} +{"train_loss": 0.0004564534465316683, "global_step": 59392, "epoch": 499, "lr": 6.911109922102099e-06} +{"train_loss": 0.0004112533060833812, "global_step": 59393, "epoch": 499, "lr": 6.909986067527208e-06} +{"train_loss": 0.00024439109256491065, "global_step": 59394, "epoch": 499, "lr": 6.908862297554941e-06} +{"train_loss": 0.00028355675749480724, "global_step": 59395, "epoch": 499, "lr": 6.907738612187536e-06} +{"train_loss": 0.00044129748130217195, "global_step": 59396, "epoch": 499, "lr": 6.906615011427181e-06} +{"train_loss": 0.0006697755889035761, "global_step": 59397, "epoch": 499, "lr": 6.905491495276073e-06} +{"train_loss": 0.0005788260605186224, "global_step": 59398, "epoch": 499, "lr": 6.904368063736439e-06} +{"train_loss": 0.0005734722944907844, "global_step": 59399, "epoch": 499, "lr": 6.903244716810458e-06} +{"train_loss": 0.00030361596145667136, "global_step": 59400, "epoch": 499, "lr": 6.902121454500371e-06} +{"train_loss": 0.000783233845140785, "global_step": 59401, "epoch": 499, "lr": 6.900998276808346e-06} +{"train_loss": 0.0003050864615943283, "global_step": 59402, "epoch": 499, "lr": 6.8998751837366096e-06} +{"train_loss": 0.000551536912098527, "global_step": 59403, "epoch": 499, "lr": 6.898752175287376e-06} +{"train_loss": 0.0004522665694821626, "global_step": 59404, "epoch": 499, "lr": 6.897629251462828e-06} +{"train_loss": 0.00031395553378388286, "global_step": 59405, "epoch": 499, "lr": 6.896506412265186e-06} +{"train_loss": 0.00019312700896989554, "global_step": 59406, "epoch": 499, "lr": 6.895383657696641e-06} +{"train_loss": 0.00035493128234520555, "global_step": 59407, "epoch": 499, "lr": 6.894260987759415e-06} +{"train_loss": 0.00025634185294620693, "global_step": 59408, "epoch": 499, "lr": 6.8931384024557066e-06} +{"train_loss": 0.00041746304486878216, "global_step": 59409, "epoch": 499, "lr": 6.892015901787702e-06} +{"train_loss": 0.0004061499785166234, "global_step": 59410, "epoch": 499, "lr": 6.8908934857576264e-06} +{"train_loss": 0.0005123635637573898, "global_step": 59411, "epoch": 499, "lr": 6.889771154367669e-06} +{"train_loss": 0.0001781270548235625, "global_step": 59412, "epoch": 499, "lr": 6.8886489076200485e-06} +{"train_loss": 0.00020840621436946094, "global_step": 59413, "epoch": 499, "lr": 6.887526745516953e-06} +{"train_loss": 0.00043091055704280734, "global_step": 59414, "epoch": 499, "lr": 6.886404668060603e-06} +{"train_loss": 0.00040283246198669076, "global_step": 59415, "epoch": 499, "lr": 6.885282675253185e-06} +{"train_loss": 0.00037180137587711215, "global_step": 59416, "epoch": 499, "lr": 6.884160767096903e-06} +{"train_loss": 0.00030569941736757755, "global_step": 59417, "epoch": 499, "lr": 6.883038943593978e-06} +{"train_loss": 0.0006512535037472844, "global_step": 59418, "epoch": 499, "lr": 6.881917204746585e-06} +{"train_loss": 0.0002471735642757267, "global_step": 59419, "epoch": 499, "lr": 6.880795550556951e-06} +{"train_loss": 0.0002961834834422916, "global_step": 59420, "epoch": 499, "lr": 6.8796739810272735e-06} +{"train_loss": 0.0003971673722844571, "global_step": 59421, "epoch": 499, "lr": 6.8785524961597345e-06} +{"train_loss": 0.00028958875918760896, "global_step": 59422, "epoch": 499, "lr": 6.8774310959565605e-06} +{"train_loss": 0.00046102626947686076, "global_step": 59423, "epoch": 499, "lr": 6.876309780419937e-06} +{"train_loss": 0.0006228163838386536, "global_step": 59424, "epoch": 499, "lr": 6.8751885495520805e-06} +{"train_loss": 0.0003062278847210109, "global_step": 59425, "epoch": 499, "lr": 6.874067403355172e-06} +{"train_loss": 0.00042397412471473217, "global_step": 59426, "epoch": 499, "lr": 6.8729463418314375e-06} +{"train_loss": 0.0007354955305345356, "global_step": 59427, "epoch": 499, "lr": 6.871825364983064e-06} +{"train_loss": 0.0005803609383292496, "global_step": 59428, "epoch": 499, "lr": 6.870704472812245e-06} +{"train_loss": 0.0005099980626255274, "global_step": 59429, "epoch": 499, "lr": 6.8695836653212e-06} +{"train_loss": 0.0002579909050837159, "global_step": 59430, "epoch": 499, "lr": 6.86846294251211e-06} +{"train_loss": 0.00042052712524309754, "global_step": 59431, "epoch": 499, "lr": 6.867342304387192e-06} +{"train_loss": 0.0004166644357610494, "global_step": 59432, "epoch": 499, "lr": 6.866221750948632e-06} +{"train_loss": 0.0005042878910899162, "global_step": 59433, "epoch": 499, "lr": 6.8651012821986495e-06} +{"train_loss": 0.00023968287860043347, "global_step": 59434, "epoch": 499, "lr": 6.863980898139416e-06} +{"train_loss": 0.00020738592138513923, "global_step": 59435, "epoch": 499, "lr": 6.862860598773163e-06} +{"train_loss": 0.0006475344998762012, "global_step": 59436, "epoch": 499, "lr": 6.8617403841020665e-06} +{"train_loss": 0.0002609013463370502, "global_step": 59437, "epoch": 499, "lr": 6.8606202541283306e-06} +{"train_loss": 0.0004243317525833845, "global_step": 59438, "epoch": 499, "lr": 6.859500208854164e-06} +{"train_loss": 0.0004737013950943947, "global_step": 59439, "epoch": 499, "lr": 6.858380248281765e-06} +{"train_loss": 0.00024892381043173373, "global_step": 59440, "epoch": 499, "lr": 6.857260372413316e-06} +{"train_loss": 0.00025214487686753273, "global_step": 59441, "epoch": 499, "lr": 6.856140581251041e-06} +{"train_loss": 0.0003209292481187731, "global_step": 59442, "epoch": 499, "lr": 6.855020874797108e-06} +{"train_loss": 0.000709629850462079, "global_step": 59443, "epoch": 499, "lr": 6.853901253053746e-06} +{"train_loss": 0.0003937714791391045, "global_step": 59444, "epoch": 499, "lr": 6.8527817160231325e-06} +{"train_loss": 0.0004583892005030066, "global_step": 59445, "epoch": 499, "lr": 6.851662263707476e-06} +{"train_loss": 0.00034055658034048975, "global_step": 59446, "epoch": 499, "lr": 6.850542896108975e-06} +{"train_loss": 0.0004840596520807594, "global_step": 59447, "epoch": 499, "lr": 6.84942361322981e-06} +{"train_loss": 0.0004516926419455558, "global_step": 59448, "epoch": 499, "lr": 6.848304415072204e-06} +{"train_loss": 0.0006236823974177241, "global_step": 59449, "epoch": 499, "lr": 6.847185301638331e-06} +{"train_loss": 0.00034104674705304205, "global_step": 59450, "epoch": 499, "lr": 6.846066272930412e-06} +{"train_loss": 0.0003257971548009664, "global_step": 59451, "epoch": 499, "lr": 6.844947328950635e-06} +{"train_loss": 0.00040602186345495284, "global_step": 59452, "epoch": 499, "lr": 6.843828469701174e-06} +{"train_loss": 0.0003517945879139006, "global_step": 59453, "epoch": 499, "lr": 6.8427096951842625e-06} +{"train_loss": 0.0004959539510309696, "global_step": 59454, "epoch": 499, "lr": 6.841591005402065e-06} +{"train_loss": 0.00025068543618544936, "global_step": 59455, "epoch": 499, "lr": 6.8404724003568065e-06} +{"train_loss": 0.00045161001617088914, "global_step": 59456, "epoch": 499, "lr": 6.839353880050658e-06} +{"train_loss": 0.0004433896392583847, "global_step": 59457, "epoch": 499, "lr": 6.8382354444858355e-06} +{"train_loss": 0.0004110615118406713, "global_step": 59458, "epoch": 499, "lr": 6.83711709366453e-06} +{"train_loss": 0.0003758040547836572, "global_step": 59459, "epoch": 499, "lr": 6.835998827588919e-06} +{"train_loss": 0.0002500354021321982, "global_step": 59460, "epoch": 499, "lr": 6.8348806462612265e-06} +{"train_loss": 0.00027952264645136893, "global_step": 59461, "epoch": 499, "lr": 6.833762549683625e-06} +{"train_loss": 0.00033809294109232724, "global_step": 59462, "epoch": 499, "lr": 6.8326445378583295e-06} +{"train_loss": 0.00047856959281489253, "global_step": 59463, "epoch": 499, "lr": 6.831526610787509e-06} +{"train_loss": 0.00038722221506759524, "global_step": 59464, "epoch": 499, "lr": 6.83040876847339e-06} +{"train_loss": 0.0004030304553452879, "global_step": 59465, "epoch": 499, "lr": 6.829291010918137e-06} +{"train_loss": 0.00028479890897870064, "global_step": 59466, "epoch": 499, "lr": 6.828173338123972e-06} +{"train_loss": 0.0004824810312129557, "global_step": 59467, "epoch": 499, "lr": 6.8270557500930695e-06} +{"train_loss": 0.0008186238701455295, "global_step": 59468, "epoch": 499, "lr": 6.825938246827634e-06} +{"train_loss": 0.0005782748339697719, "global_step": 59469, "epoch": 499, "lr": 6.824820828329847e-06} +{"train_loss": 0.0003740538959391415, "global_step": 59470, "epoch": 499, "lr": 6.823703494601929e-06} +{"train_loss": 0.0005117386463098228, "global_step": 59471, "epoch": 499, "lr": 6.82258624564604e-06} +{"train_loss": 0.0002224241616204381, "global_step": 59472, "epoch": 499, "lr": 6.821469081464404e-06} +{"train_loss": 0.0004814074491150677, "global_step": 59473, "epoch": 499, "lr": 6.820352002059182e-06} +{"train_loss": 0.000479592417832464, "global_step": 59474, "epoch": 499, "lr": 6.819235007432606e-06} +{"train_loss": 0.0002503885771147907, "global_step": 59475, "epoch": 499, "lr": 6.8181180975868345e-06} +{"train_loss": 0.0010264575248584151, "global_step": 59476, "epoch": 499, "lr": 6.817001272524087e-06} +{"train_loss": 0.00021823520364705473, "global_step": 59477, "epoch": 499, "lr": 6.815884532246541e-06} +{"train_loss": 0.0005789549322798848, "global_step": 59478, "epoch": 499, "lr": 6.814767876756384e-06} +{"train_loss": 0.0006009740754961967, "global_step": 59479, "epoch": 499, "lr": 6.8136513060558236e-06} +{"train_loss": 0.00038353033596649766, "global_step": 59480, "epoch": 499, "lr": 6.812534820147037e-06} +{"train_loss": 0.00019832918769679964, "global_step": 59481, "epoch": 499, "lr": 6.8114184190322335e-06} +{"train_loss": 0.0002895376819651574, "global_step": 59482, "epoch": 499, "lr": 6.81030210271359e-06} +{"train_loss": 0.000302901171380654, "global_step": 59483, "epoch": 499, "lr": 6.809185871193313e-06} +{"train_loss": 0.0004887809045612812, "global_step": 59484, "epoch": 499, "lr": 6.808069724473581e-06} +{"train_loss": 0.0003213966265320778, "global_step": 59485, "epoch": 499, "lr": 6.806953662556581e-06} +{"train_loss": 0.00042269707773812115, "global_step": 59486, "epoch": 499, "lr": 6.8058376854445275e-06} +{"train_loss": 0.00041492615127936006, "global_step": 59487, "epoch": 499, "lr": 6.804721793139584e-06} +{"train_loss": 0.0004228566540405154, "global_step": 59488, "epoch": 499, "lr": 6.803605985643962e-06} +{"train_loss": 0.00030097083072178066, "global_step": 59489, "epoch": 499, "lr": 6.8024902629598485e-06} +{"train_loss": 0.00047575365169905126, "global_step": 59490, "epoch": 499, "lr": 6.801374625089418e-06} +{"train_loss": 0.0005008911248296499, "global_step": 59491, "epoch": 499, "lr": 6.800259072034887e-06} +{"train_loss": 0.0003376741660758853, "global_step": 59492, "epoch": 499, "lr": 6.799143603798419e-06} +{"train_loss": 0.000797137210611254, "global_step": 59493, "epoch": 499, "lr": 6.79802822038223e-06} +{"train_loss": 0.00018814664508681744, "global_step": 59494, "epoch": 499, "lr": 6.796912921788484e-06} +{"train_loss": 0.0002852886391337961, "global_step": 59495, "epoch": 499, "lr": 6.795797708019397e-06} +{"train_loss": 0.000598694896325469, "global_step": 59496, "epoch": 499, "lr": 6.794682579077144e-06} +{"train_loss": 0.0002886377915274352, "global_step": 59497, "epoch": 499, "lr": 6.793567534963901e-06} +{"train_loss": 0.00028536003082990646, "global_step": 59498, "epoch": 499, "lr": 6.7924525756818905e-06} +{"train_loss": 0.00041699364594039074, "global_step": 59499, "epoch": 499, "lr": 6.7913377012332694e-06, "val_loss": 0.013159927912056446} +{"train_loss": 0.0005429575103335083, "global_step": 59500, "epoch": 500, "lr": 6.790222911620236e-06} +{"train_loss": 0.00022866865037940443, "global_step": 59501, "epoch": 500, "lr": 6.789108206845002e-06} +{"train_loss": 0.0003694001352414489, "global_step": 59502, "epoch": 500, "lr": 6.787993586909719e-06} +{"train_loss": 0.00020867367857135832, "global_step": 59503, "epoch": 500, "lr": 6.786879051816614e-06} +{"train_loss": 0.001032606465741992, "global_step": 59504, "epoch": 500, "lr": 6.785764601567834e-06} +{"train_loss": 0.00035863497760146856, "global_step": 59505, "epoch": 500, "lr": 6.7846502361656076e-06} +{"train_loss": 0.0003989440738223493, "global_step": 59506, "epoch": 500, "lr": 6.783535955612091e-06} +{"train_loss": 0.0003137096937280148, "global_step": 59507, "epoch": 500, "lr": 6.782421759909496e-06} +{"train_loss": 0.000307030335534364, "global_step": 59508, "epoch": 500, "lr": 6.781307649059998e-06} +{"train_loss": 0.00015315022028516978, "global_step": 59509, "epoch": 500, "lr": 6.780193623065772e-06} +{"train_loss": 0.0003986479132436216, "global_step": 59510, "epoch": 500, "lr": 6.7790796819290295e-06} +{"train_loss": 0.00036700410419143736, "global_step": 59511, "epoch": 500, "lr": 6.7779658256519386e-06} +{"train_loss": 0.00032557707163505256, "global_step": 59512, "epoch": 500, "lr": 6.776852054236704e-06} +{"train_loss": 0.00045308656990528107, "global_step": 59513, "epoch": 500, "lr": 6.775738367685491e-06} +{"train_loss": 0.00028801418375223875, "global_step": 59514, "epoch": 500, "lr": 6.774624766000509e-06} +{"train_loss": 0.0006028556381352246, "global_step": 59515, "epoch": 500, "lr": 6.773511249183933e-06} +{"train_loss": 0.0003737477236427367, "global_step": 59516, "epoch": 500, "lr": 6.772397817237941e-06} +{"train_loss": 0.0005082570714876056, "global_step": 59517, "epoch": 500, "lr": 6.771284470164735e-06} +{"train_loss": 0.0003174866724293679, "global_step": 59518, "epoch": 500, "lr": 6.770171207966486e-06} +{"train_loss": 0.0003736197541002184, "global_step": 59519, "epoch": 500, "lr": 6.769058030645397e-06} +{"train_loss": 0.00027647678507491946, "global_step": 59520, "epoch": 500, "lr": 6.7679449382036405e-06} +{"train_loss": 0.00041355780558660626, "global_step": 59521, "epoch": 500, "lr": 6.7668319306434026e-06} +{"train_loss": 0.00035671063233166933, "global_step": 59522, "epoch": 500, "lr": 6.765719007966876e-06} +{"train_loss": 0.0005431001773104072, "global_step": 59523, "epoch": 500, "lr": 6.76460617017623e-06} +{"train_loss": 0.0002668765955604613, "global_step": 59524, "epoch": 500, "lr": 6.763493417273675e-06} +{"train_loss": 0.0005347759579308331, "global_step": 59525, "epoch": 500, "lr": 6.762380749261371e-06} +{"train_loss": 0.000761649978812784, "global_step": 59526, "epoch": 500, "lr": 6.761268166141521e-06} +{"train_loss": 0.00047812380944378674, "global_step": 59527, "epoch": 500, "lr": 6.760155667916301e-06} +{"train_loss": 0.00020516864606179297, "global_step": 59528, "epoch": 500, "lr": 6.759043254587888e-06} +{"train_loss": 0.0001615166838746518, "global_step": 59529, "epoch": 500, "lr": 6.757930926158485e-06} +{"train_loss": 0.0002647392393555492, "global_step": 59530, "epoch": 500, "lr": 6.75681868263025e-06} +{"train_loss": 0.000644302403088659, "global_step": 59531, "epoch": 500, "lr": 6.7557065240053955e-06} +{"train_loss": 0.00025702224229462445, "global_step": 59532, "epoch": 500, "lr": 6.754594450286083e-06} +{"train_loss": 0.00016688965843059123, "global_step": 59533, "epoch": 500, "lr": 6.753482461474508e-06} +{"train_loss": 0.0001430477568646893, "global_step": 59534, "epoch": 500, "lr": 6.752370557572846e-06} +{"train_loss": 0.00014902482507750392, "global_step": 59535, "epoch": 500, "lr": 6.751258738583282e-06} +{"train_loss": 0.0004087751149199903, "global_step": 59536, "epoch": 500, "lr": 6.750147004508012e-06} +{"train_loss": 0.0003464120381977409, "global_step": 59537, "epoch": 500, "lr": 6.749035355349192e-06} +{"train_loss": 0.0002684285573195666, "global_step": 59538, "epoch": 500, "lr": 6.74792379110904e-06} +{"train_loss": 0.00037978857289999723, "global_step": 59539, "epoch": 500, "lr": 6.746812311789713e-06} +{"train_loss": 0.00047024182276800275, "global_step": 59540, "epoch": 500, "lr": 6.745700917393389e-06} +{"train_loss": 0.00028636041679419577, "global_step": 59541, "epoch": 500, "lr": 6.744589607922275e-06} +{"train_loss": 0.00022018412710167468, "global_step": 59542, "epoch": 500, "lr": 6.743478383378521e-06} +{"train_loss": 0.00018230434216093272, "global_step": 59543, "epoch": 500, "lr": 6.742367243764341e-06} +{"train_loss": 0.0004995570634491742, "global_step": 59544, "epoch": 500, "lr": 6.741256189081891e-06} +{"train_loss": 0.000409746979130432, "global_step": 59545, "epoch": 500, "lr": 6.740145219333372e-06} +{"train_loss": 0.000254456652328372, "global_step": 59546, "epoch": 500, "lr": 6.739034334520955e-06} +{"train_loss": 0.0005459490930661559, "global_step": 59547, "epoch": 500, "lr": 6.737923534646812e-06} +{"train_loss": 0.00037184666143730283, "global_step": 59548, "epoch": 500, "lr": 6.7368128197131455e-06} +{"train_loss": 0.00023848730779718608, "global_step": 59549, "epoch": 500, "lr": 6.735702189722115e-06} +{"train_loss": 0.0003461602027527988, "global_step": 59550, "epoch": 500, "lr": 6.734591644675919e-06} +{"train_loss": 0.0003722929104696959, "global_step": 59551, "epoch": 500, "lr": 6.733481184576723e-06} +{"train_loss": 0.0007961568189784884, "global_step": 59552, "epoch": 500, "lr": 6.732370809426725e-06} +{"train_loss": 0.00023416693147737533, "global_step": 59553, "epoch": 500, "lr": 6.731260519228094e-06} +{"train_loss": 0.00031842075986787677, "global_step": 59554, "epoch": 500, "lr": 6.730150313982997e-06} +{"train_loss": 0.0005298127653077245, "global_step": 59555, "epoch": 500, "lr": 6.729040193693642e-06} +{"train_loss": 0.0007391276303678751, "global_step": 59556, "epoch": 500, "lr": 6.727930158362184e-06} +{"train_loss": 0.00048348109703511, "global_step": 59557, "epoch": 500, "lr": 6.726820207990819e-06} +{"train_loss": 0.00018851013737730682, "global_step": 59558, "epoch": 500, "lr": 6.7257103425817205e-06} +{"train_loss": 0.00032004155218601227, "global_step": 59559, "epoch": 500, "lr": 6.724600562137057e-06} +{"train_loss": 0.0003386247262824327, "global_step": 59560, "epoch": 500, "lr": 6.723490866659027e-06} +{"train_loss": 0.0006859588902443647, "global_step": 59561, "epoch": 500, "lr": 6.722381256149784e-06} +{"train_loss": 0.0004574411432258785, "global_step": 59562, "epoch": 500, "lr": 6.721271730611539e-06} +{"train_loss": 0.00021970452507957816, "global_step": 59563, "epoch": 500, "lr": 6.720162290046439e-06} +{"train_loss": 0.00027870104531757534, "global_step": 59564, "epoch": 500, "lr": 6.7190529344566875e-06} +{"train_loss": 0.00036975540569983423, "global_step": 59565, "epoch": 500, "lr": 6.717943663844445e-06} +{"train_loss": 0.00036217624437995255, "global_step": 59566, "epoch": 500, "lr": 6.716834478211903e-06} +{"train_loss": 0.0003354868676979095, "global_step": 59567, "epoch": 500, "lr": 6.715725377561222e-06} +{"train_loss": 0.00019112609152216464, "global_step": 59568, "epoch": 500, "lr": 6.714616361894599e-06} +{"train_loss": 0.0004784872289747, "global_step": 59569, "epoch": 500, "lr": 6.713507431214194e-06} +{"train_loss": 0.0005242734332568944, "global_step": 59570, "epoch": 500, "lr": 6.712398585522206e-06} +{"train_loss": 0.00024496641708537936, "global_step": 59571, "epoch": 500, "lr": 6.7112898248207825e-06} +{"train_loss": 0.00035852339351549745, "global_step": 59572, "epoch": 500, "lr": 6.710181149112133e-06} +{"train_loss": 0.00042870049946941435, "global_step": 59573, "epoch": 500, "lr": 6.709072558398405e-06} +{"train_loss": 0.000324014516081661, "global_step": 59574, "epoch": 500, "lr": 6.707964052681798e-06} +{"train_loss": 0.0004494663153309375, "global_step": 59575, "epoch": 500, "lr": 6.7068556319644645e-06} +{"train_loss": 0.00031594294705428183, "global_step": 59576, "epoch": 500, "lr": 6.70574729624861e-06} +{"train_loss": 0.0003479749138932675, "global_step": 59577, "epoch": 500, "lr": 6.704639045536398e-06} +{"train_loss": 0.0003956332220695913, "global_step": 59578, "epoch": 500, "lr": 6.703530879829983e-06} +{"train_loss": 0.0004026307142339647, "global_step": 59579, "epoch": 500, "lr": 6.7024227991315745e-06} +{"train_loss": 0.0002524817828088999, "global_step": 59580, "epoch": 500, "lr": 6.701314803443326e-06} +{"train_loss": 0.0006081716273911297, "global_step": 59581, "epoch": 500, "lr": 6.70020689276743e-06} +{"train_loss": 0.00030189764220267534, "global_step": 59582, "epoch": 500, "lr": 6.699099067106035e-06} +{"train_loss": 0.000649358844384551, "global_step": 59583, "epoch": 500, "lr": 6.69799132646135e-06} +{"train_loss": 0.0002899029350373894, "global_step": 59584, "epoch": 500, "lr": 6.69688367083553e-06} +{"train_loss": 0.00046978448517620564, "global_step": 59585, "epoch": 500, "lr": 6.695776100230738e-06} +{"train_loss": 0.00036308736889623106, "global_step": 59586, "epoch": 500, "lr": 6.69466861464918e-06} +{"train_loss": 0.00046592680155299604, "global_step": 59587, "epoch": 500, "lr": 6.693561214093002e-06} +{"train_loss": 0.00026732560945674777, "global_step": 59588, "epoch": 500, "lr": 6.692453898564399e-06} +{"train_loss": 0.0004638081882148981, "global_step": 59589, "epoch": 500, "lr": 6.69134666806554e-06} +{"train_loss": 0.0004488458507694304, "global_step": 59590, "epoch": 500, "lr": 6.6902395225985795e-06} +{"train_loss": 0.0003596408059820533, "global_step": 59591, "epoch": 500, "lr": 6.6891324621657206e-06} +{"train_loss": 0.0007004392682574689, "global_step": 59592, "epoch": 500, "lr": 6.6880254867691115e-06} +{"train_loss": 0.0002836555358953774, "global_step": 59593, "epoch": 500, "lr": 6.686918596410946e-06} +{"train_loss": 0.0005354058230295777, "global_step": 59594, "epoch": 500, "lr": 6.6858117910933774e-06} +{"train_loss": 0.00034972172579728067, "global_step": 59595, "epoch": 500, "lr": 6.684705070818603e-06} +{"train_loss": 0.00040687763248570263, "global_step": 59596, "epoch": 500, "lr": 6.683598435588773e-06} +{"train_loss": 0.00047257417463697493, "global_step": 59597, "epoch": 500, "lr": 6.682491885406078e-06} +{"train_loss": 0.00032445648685097694, "global_step": 59598, "epoch": 500, "lr": 6.681385420272674e-06} +{"train_loss": 0.0006342835258692503, "global_step": 59599, "epoch": 500, "lr": 6.6802790401907455e-06} +{"train_loss": 0.0005084174918010831, "global_step": 59600, "epoch": 500, "lr": 6.67917274516246e-06} +{"train_loss": 0.00043574883602559566, "global_step": 59601, "epoch": 500, "lr": 6.678066535189997e-06} +{"train_loss": 0.0003187684342265129, "global_step": 59602, "epoch": 500, "lr": 6.676960410275513e-06} +{"train_loss": 0.0003367414465174079, "global_step": 59603, "epoch": 500, "lr": 6.6758543704211975e-06} +{"train_loss": 0.0002926736488007009, "global_step": 59604, "epoch": 500, "lr": 6.6747484156292e-06} +{"train_loss": 0.0003410176432225853, "global_step": 59605, "epoch": 500, "lr": 6.67364254590172e-06} +{"train_loss": 0.0006425347528420389, "global_step": 59606, "epoch": 500, "lr": 6.672536761240905e-06} +{"train_loss": 0.00020872503228019923, "global_step": 59607, "epoch": 500, "lr": 6.671431061648942e-06} +{"train_loss": 0.0004097963101230562, "global_step": 59608, "epoch": 500, "lr": 6.670325447127995e-06} +{"train_loss": 0.0003625502868089825, "global_step": 59609, "epoch": 500, "lr": 6.669219917680225e-06} +{"train_loss": 0.00020749577379319817, "global_step": 59610, "epoch": 500, "lr": 6.66811447330783e-06} +{"train_loss": 0.0004334768746048212, "global_step": 59611, "epoch": 500, "lr": 6.667009114012946e-06} +{"train_loss": 0.0005282392958179116, "global_step": 59612, "epoch": 500, "lr": 6.665903839797766e-06} +{"train_loss": 0.0008120772545225918, "global_step": 59613, "epoch": 500, "lr": 6.66479865066445e-06} +{"train_loss": 0.0005536821554414928, "global_step": 59614, "epoch": 500, "lr": 6.663693546615185e-06} +{"train_loss": 0.00031987621332518756, "global_step": 59615, "epoch": 500, "lr": 6.662588527652125e-06} +{"train_loss": 0.000390899513149634, "global_step": 59616, "epoch": 500, "lr": 6.661483593777429e-06} +{"train_loss": 0.0006729340530000627, "global_step": 59617, "epoch": 500, "lr": 6.660378744993295e-06} +{"train_loss": 0.0003973014624358914, "global_step": 59618, "epoch": 500, "lr": 6.659273981301861e-06, "val_loss": 0.021711019799113274, "train_action_mse_error": 6.411842605302809e-06} +{"train_loss": 0.0003209818678442389, "global_step": 59619, "epoch": 501, "lr": 6.658169302705325e-06} +{"train_loss": 0.0002946397289633751, "global_step": 59620, "epoch": 501, "lr": 6.657064709205846e-06} +{"train_loss": 0.0002790464204736054, "global_step": 59621, "epoch": 501, "lr": 6.655960200805577e-06} +{"train_loss": 0.00041545118438079953, "global_step": 59622, "epoch": 501, "lr": 6.654855777506713e-06} +{"train_loss": 0.0002611051022540778, "global_step": 59623, "epoch": 501, "lr": 6.653751439311395e-06} +{"train_loss": 0.0005473373457789421, "global_step": 59624, "epoch": 501, "lr": 6.652647186221816e-06} +{"train_loss": 0.00023319607134908438, "global_step": 59625, "epoch": 501, "lr": 6.651543018240125e-06} +{"train_loss": 0.000418224954046309, "global_step": 59626, "epoch": 501, "lr": 6.650438935368508e-06} +{"train_loss": 0.00038165051955729723, "global_step": 59627, "epoch": 501, "lr": 6.649334937609125e-06} +{"train_loss": 0.000281042157439515, "global_step": 59628, "epoch": 501, "lr": 6.648231024964124e-06} +{"train_loss": 0.0003390223137103021, "global_step": 59629, "epoch": 501, "lr": 6.64712719743571e-06} +{"train_loss": 0.0003728088631760329, "global_step": 59630, "epoch": 501, "lr": 6.646023455026013e-06} +{"train_loss": 0.00044489189167506993, "global_step": 59631, "epoch": 501, "lr": 6.6449197977372315e-06} +{"train_loss": 0.00019187018915545195, "global_step": 59632, "epoch": 501, "lr": 6.643816225571503e-06} +{"train_loss": 0.0005804051761515439, "global_step": 59633, "epoch": 501, "lr": 6.642712738531009e-06} +{"train_loss": 0.00034513769787736237, "global_step": 59634, "epoch": 501, "lr": 6.641609336617932e-06} +{"train_loss": 0.0004805669595953077, "global_step": 59635, "epoch": 501, "lr": 6.640506019834408e-06} +{"train_loss": 0.0004511254373937845, "global_step": 59636, "epoch": 501, "lr": 6.639402788182636e-06} +{"train_loss": 0.0002585301408544183, "global_step": 59637, "epoch": 501, "lr": 6.638299641664747e-06} +{"train_loss": 0.0005636878195218742, "global_step": 59638, "epoch": 501, "lr": 6.637196580282934e-06} +{"train_loss": 0.00040865832124836743, "global_step": 59639, "epoch": 501, "lr": 6.6360936040393565e-06} +{"train_loss": 0.00036008437746204436, "global_step": 59640, "epoch": 501, "lr": 6.634990712936168e-06} +{"train_loss": 0.0005886571598239243, "global_step": 59641, "epoch": 501, "lr": 6.63388790697555e-06} +{"train_loss": 0.0003215497999917716, "global_step": 59642, "epoch": 501, "lr": 6.632785186159646e-06} +{"train_loss": 0.0003714827762451023, "global_step": 59643, "epoch": 501, "lr": 6.631682550490648e-06} +{"train_loss": 0.0005253065610304475, "global_step": 59644, "epoch": 501, "lr": 6.6305799999706986e-06} +{"train_loss": 0.0003255086194258183, "global_step": 59645, "epoch": 501, "lr": 6.629477534601985e-06} +{"train_loss": 0.00025660861865617335, "global_step": 59646, "epoch": 501, "lr": 6.628375154386657e-06} +{"train_loss": 0.00034202143433503807, "global_step": 59647, "epoch": 501, "lr": 6.627272859326867e-06} +{"train_loss": 0.00034116400638595223, "global_step": 59648, "epoch": 501, "lr": 6.626170649424806e-06} +{"train_loss": 0.0003562612400855869, "global_step": 59649, "epoch": 501, "lr": 6.625068524682615e-06} +{"train_loss": 0.00024355892674066126, "global_step": 59650, "epoch": 501, "lr": 6.623966485102478e-06} +{"train_loss": 0.000507170450873673, "global_step": 59651, "epoch": 501, "lr": 6.62286453068654e-06} +{"train_loss": 0.00036419855314306915, "global_step": 59652, "epoch": 501, "lr": 6.621762661436981e-06} +{"train_loss": 0.0004653488867916167, "global_step": 59653, "epoch": 501, "lr": 6.620660877355956e-06} +{"train_loss": 0.0002729206462390721, "global_step": 59654, "epoch": 501, "lr": 6.619559178445622e-06} +{"train_loss": 0.000410112232202664, "global_step": 59655, "epoch": 501, "lr": 6.6184575647081586e-06} +{"train_loss": 0.0003830480563919991, "global_step": 59656, "epoch": 501, "lr": 6.6173560361457055e-06} +{"train_loss": 0.0004987891879864037, "global_step": 59657, "epoch": 501, "lr": 6.616254592760457e-06} +{"train_loss": 0.00036633547279052436, "global_step": 59658, "epoch": 501, "lr": 6.61515323455455e-06} +{"train_loss": 0.0005361232324503362, "global_step": 59659, "epoch": 501, "lr": 6.614051961530149e-06} +{"train_loss": 0.0005354161257855594, "global_step": 59660, "epoch": 501, "lr": 6.612950773689431e-06} +{"train_loss": 0.0003510003734845668, "global_step": 59661, "epoch": 501, "lr": 6.611849671034537e-06} +{"train_loss": 0.0008459645905531943, "global_step": 59662, "epoch": 501, "lr": 6.6107486535676496e-06} +{"train_loss": 0.0005410233861766756, "global_step": 59663, "epoch": 501, "lr": 6.609647721290913e-06} +{"train_loss": 0.0002569085918366909, "global_step": 59664, "epoch": 501, "lr": 6.608546874206512e-06} +{"train_loss": 0.0006654871394857764, "global_step": 59665, "epoch": 501, "lr": 6.607446112316579e-06} +{"train_loss": 0.0003435417893342674, "global_step": 59666, "epoch": 501, "lr": 6.606345435623301e-06} +{"train_loss": 0.00040285338764078915, "global_step": 59667, "epoch": 501, "lr": 6.605244844128816e-06} +{"train_loss": 0.0003731708275154233, "global_step": 59668, "epoch": 501, "lr": 6.604144337835299e-06} +{"train_loss": 0.00023570333723910153, "global_step": 59669, "epoch": 501, "lr": 6.603043916744916e-06} +{"train_loss": 0.00033991268719546497, "global_step": 59670, "epoch": 501, "lr": 6.601943580859815e-06} +{"train_loss": 0.0004666812310460955, "global_step": 59671, "epoch": 501, "lr": 6.600843330182166e-06} +{"train_loss": 0.00032473463215865195, "global_step": 59672, "epoch": 501, "lr": 6.599743164714128e-06} +{"train_loss": 0.0002433690387988463, "global_step": 59673, "epoch": 501, "lr": 6.598643084457845e-06} +{"train_loss": 0.00019467363017611206, "global_step": 59674, "epoch": 501, "lr": 6.597543089415503e-06} +{"train_loss": 0.0004388244415167719, "global_step": 59675, "epoch": 501, "lr": 6.596443179589234e-06} +{"train_loss": 0.0004121628880966455, "global_step": 59676, "epoch": 501, "lr": 6.595343354981226e-06} +{"train_loss": 0.00036428924067877233, "global_step": 59677, "epoch": 501, "lr": 6.594243615593621e-06} +{"train_loss": 0.0003475642006378621, "global_step": 59678, "epoch": 501, "lr": 6.593143961428572e-06} +{"train_loss": 0.0003152849094476551, "global_step": 59679, "epoch": 501, "lr": 6.592044392488261e-06} +{"train_loss": 0.00032327225198969245, "global_step": 59680, "epoch": 501, "lr": 6.5909449087748206e-06} +{"train_loss": 0.0007015515002422035, "global_step": 59681, "epoch": 501, "lr": 6.5898455102904325e-06} +{"train_loss": 0.0003645479155238718, "global_step": 59682, "epoch": 501, "lr": 6.588746197037232e-06} +{"train_loss": 0.00032733954139985144, "global_step": 59683, "epoch": 501, "lr": 6.587646969017402e-06} +{"train_loss": 0.0004860842600464821, "global_step": 59684, "epoch": 501, "lr": 6.586547826233092e-06} +{"train_loss": 0.00030574132688343525, "global_step": 59685, "epoch": 501, "lr": 6.585448768686448e-06} +{"train_loss": 0.0006117109442129731, "global_step": 59686, "epoch": 501, "lr": 6.5843497963796465e-06} +{"train_loss": 0.0006904836627654731, "global_step": 59687, "epoch": 501, "lr": 6.58325090931482e-06} +{"train_loss": 0.0003071590035688132, "global_step": 59688, "epoch": 501, "lr": 6.58215210749416e-06} +{"train_loss": 0.0005271947011351585, "global_step": 59689, "epoch": 501, "lr": 6.5810533909198e-06} +{"train_loss": 0.0002499774273019284, "global_step": 59690, "epoch": 501, "lr": 6.579954759593898e-06} +{"train_loss": 0.0006575658335350454, "global_step": 59691, "epoch": 501, "lr": 6.578856213518625e-06} +{"train_loss": 0.0005805628607049584, "global_step": 59692, "epoch": 501, "lr": 6.577757752696112e-06} +{"train_loss": 0.0004740958393085748, "global_step": 59693, "epoch": 501, "lr": 6.576659377128552e-06} +{"train_loss": 0.00033059538691304624, "global_step": 59694, "epoch": 501, "lr": 6.575561086818066e-06} +{"train_loss": 0.0003266565327066928, "global_step": 59695, "epoch": 501, "lr": 6.574462881766841e-06} +{"train_loss": 0.000257165142102167, "global_step": 59696, "epoch": 501, "lr": 6.5733647619770025e-06} +{"train_loss": 0.00034785494790412486, "global_step": 59697, "epoch": 501, "lr": 6.572266727450737e-06} +{"train_loss": 0.0004692876827903092, "global_step": 59698, "epoch": 501, "lr": 6.571168778190179e-06} +{"train_loss": 0.0004379942547529936, "global_step": 59699, "epoch": 501, "lr": 6.570070914197496e-06} +{"train_loss": 0.00027512694941833615, "global_step": 59700, "epoch": 501, "lr": 6.568973135474832e-06} +{"train_loss": 0.0002568452910054475, "global_step": 59701, "epoch": 501, "lr": 6.567875442024362e-06} +{"train_loss": 0.00017181823204737157, "global_step": 59702, "epoch": 501, "lr": 6.5667778338482145e-06} +{"train_loss": 0.0003768285096157342, "global_step": 59703, "epoch": 501, "lr": 6.565680310948569e-06} +{"train_loss": 0.0003208170528523624, "global_step": 59704, "epoch": 501, "lr": 6.564582873327557e-06} +{"train_loss": 0.00036349627771414816, "global_step": 59705, "epoch": 501, "lr": 6.563485520987362e-06} +{"train_loss": 0.0004973973263986409, "global_step": 59706, "epoch": 501, "lr": 6.562388253930107e-06} +{"train_loss": 0.00034972248249687254, "global_step": 59707, "epoch": 501, "lr": 6.561291072157977e-06} +{"train_loss": 0.00047871333663351834, "global_step": 59708, "epoch": 501, "lr": 6.560193975673113e-06} +{"train_loss": 0.0004625010769814253, "global_step": 59709, "epoch": 501, "lr": 6.559096964477651e-06} +{"train_loss": 0.00039690049015916884, "global_step": 59710, "epoch": 501, "lr": 6.558000038573775e-06} +{"train_loss": 0.00028320192359387875, "global_step": 59711, "epoch": 501, "lr": 6.5569031979636155e-06} +{"train_loss": 0.00021860598644707352, "global_step": 59712, "epoch": 501, "lr": 6.5558064426493425e-06} +{"train_loss": 0.00026173933292739093, "global_step": 59713, "epoch": 501, "lr": 6.554709772633094e-06} +{"train_loss": 0.00030352556495927274, "global_step": 59714, "epoch": 501, "lr": 6.55361318791704e-06} +{"train_loss": 0.0008685995126143098, "global_step": 59715, "epoch": 501, "lr": 6.552516688503324e-06} +{"train_loss": 0.00037782255094498396, "global_step": 59716, "epoch": 501, "lr": 6.551420274394093e-06} +{"train_loss": 0.00048391835298389196, "global_step": 59717, "epoch": 501, "lr": 6.550323945591513e-06} +{"train_loss": 0.0004983700346201658, "global_step": 59718, "epoch": 501, "lr": 6.549227702097721e-06} +{"train_loss": 0.0006331451586447656, "global_step": 59719, "epoch": 501, "lr": 6.548131543914893e-06} +{"train_loss": 0.00043156612082384527, "global_step": 59720, "epoch": 501, "lr": 6.547035471045148e-06} +{"train_loss": 0.00043033709516748786, "global_step": 59721, "epoch": 501, "lr": 6.5459394834906765e-06} +{"train_loss": 0.000250592187512666, "global_step": 59722, "epoch": 501, "lr": 6.544843581253607e-06} +{"train_loss": 0.000434128480264917, "global_step": 59723, "epoch": 501, "lr": 6.543747764336078e-06} +{"train_loss": 0.00036399628152139485, "global_step": 59724, "epoch": 501, "lr": 6.542652032740276e-06} +{"train_loss": 0.0005178573192097247, "global_step": 59725, "epoch": 501, "lr": 6.541556386468317e-06} +{"train_loss": 0.0003368580073583871, "global_step": 59726, "epoch": 501, "lr": 6.540460825522387e-06} +{"train_loss": 0.0003454689576756209, "global_step": 59727, "epoch": 501, "lr": 6.539365349904613e-06} +{"train_loss": 0.00025036625447683036, "global_step": 59728, "epoch": 501, "lr": 6.538269959617144e-06} +{"train_loss": 0.00029634253587573767, "global_step": 59729, "epoch": 501, "lr": 6.537174654662137e-06} +{"train_loss": 0.0004949445137754083, "global_step": 59730, "epoch": 501, "lr": 6.536079435041759e-06} +{"train_loss": 0.0002511122729629278, "global_step": 59731, "epoch": 501, "lr": 6.534984300758135e-06} +{"train_loss": 0.0005753878504037857, "global_step": 59732, "epoch": 501, "lr": 6.53388925181343e-06} +{"train_loss": 0.00031180764199234545, "global_step": 59733, "epoch": 501, "lr": 6.532794288209781e-06} +{"train_loss": 0.0003965483629144728, "global_step": 59734, "epoch": 501, "lr": 6.53169940994936e-06} +{"train_loss": 0.0004433846042957157, "global_step": 59735, "epoch": 501, "lr": 6.530604617034291e-06} +{"train_loss": 0.0007593042100779712, "global_step": 59736, "epoch": 501, "lr": 6.529509909466753e-06} +{"train_loss": 0.0004001662231484788, "global_step": 59737, "epoch": 501, "lr": 6.528415287248857e-06, "val_loss": 0.03102118708193302} +{"train_loss": 0.00019786307530011982, "global_step": 59738, "epoch": 502, "lr": 6.527320750382793e-06} +{"train_loss": 0.00032441155053675175, "global_step": 59739, "epoch": 502, "lr": 6.526226298870686e-06} +{"train_loss": 0.0003050366067327559, "global_step": 59740, "epoch": 502, "lr": 6.525131932714679e-06} +{"train_loss": 0.0002506000455468893, "global_step": 59741, "epoch": 502, "lr": 6.524037651916937e-06} +{"train_loss": 0.0007496012258343399, "global_step": 59742, "epoch": 502, "lr": 6.522943456479597e-06} +{"train_loss": 0.000346911110682413, "global_step": 59743, "epoch": 502, "lr": 6.521849346404823e-06} +{"train_loss": 0.00029281299794092774, "global_step": 59744, "epoch": 502, "lr": 6.5207553216947435e-06} +{"train_loss": 0.0003305130230728537, "global_step": 59745, "epoch": 502, "lr": 6.5196613823515215e-06} +{"train_loss": 0.00024052910157479346, "global_step": 59746, "epoch": 502, "lr": 6.5185675283773e-06} +{"train_loss": 0.0003663086681626737, "global_step": 59747, "epoch": 502, "lr": 6.517473759774218e-06} +{"train_loss": 0.00026117762899957597, "global_step": 59748, "epoch": 502, "lr": 6.516380076544442e-06} +{"train_loss": 0.0005240881000645459, "global_step": 59749, "epoch": 502, "lr": 6.515286478690097e-06} +{"train_loss": 0.0002361187944188714, "global_step": 59750, "epoch": 502, "lr": 6.51419296621335e-06} +{"train_loss": 0.000298282946459949, "global_step": 59751, "epoch": 502, "lr": 6.5130995391163295e-06} +{"train_loss": 0.0003836749237962067, "global_step": 59752, "epoch": 502, "lr": 6.512006197401205e-06} +{"train_loss": 0.00022271915804594755, "global_step": 59753, "epoch": 502, "lr": 6.510912941070107e-06} +{"train_loss": 0.0004891410353593528, "global_step": 59754, "epoch": 502, "lr": 6.509819770125181e-06} +{"train_loss": 0.00022843065380584449, "global_step": 59755, "epoch": 502, "lr": 6.5087266845685834e-06} +{"train_loss": 0.0004892213619314134, "global_step": 59756, "epoch": 502, "lr": 6.507633684402442e-06} +{"train_loss": 0.00048769594286568463, "global_step": 59757, "epoch": 502, "lr": 6.506540769628927e-06} +{"train_loss": 0.0003098668239545077, "global_step": 59758, "epoch": 502, "lr": 6.505447940250176e-06} +{"train_loss": 0.0005919670220464468, "global_step": 59759, "epoch": 502, "lr": 6.504355196268319e-06} +{"train_loss": 0.000289830204565078, "global_step": 59760, "epoch": 502, "lr": 6.503262537685522e-06} +{"train_loss": 0.0003556717128958553, "global_step": 59761, "epoch": 502, "lr": 6.502169964503913e-06} +{"train_loss": 0.0005801304359920323, "global_step": 59762, "epoch": 502, "lr": 6.5010774767256586e-06} +{"train_loss": 0.0003463306638877839, "global_step": 59763, "epoch": 502, "lr": 6.499985074352877e-06} +{"train_loss": 0.0003086372744292021, "global_step": 59764, "epoch": 502, "lr": 6.4988927573877315e-06} +{"train_loss": 0.0002467199810780585, "global_step": 59765, "epoch": 502, "lr": 6.497800525832371e-06} +{"train_loss": 0.0002503404102753848, "global_step": 59766, "epoch": 502, "lr": 6.496708379688921e-06} +{"train_loss": 0.0004265990573912859, "global_step": 59767, "epoch": 502, "lr": 6.495616318959546e-06} +{"train_loss": 0.0003365157754160464, "global_step": 59768, "epoch": 502, "lr": 6.494524343646374e-06} +{"train_loss": 0.0004162004333920777, "global_step": 59769, "epoch": 502, "lr": 6.493432453751563e-06} +{"train_loss": 0.00031168677378445864, "global_step": 59770, "epoch": 502, "lr": 6.49234064927724e-06} +{"train_loss": 0.0004799567977897823, "global_step": 59771, "epoch": 502, "lr": 6.491248930225568e-06} +{"train_loss": 0.00026309239910915494, "global_step": 59772, "epoch": 502, "lr": 6.4901572965986814e-06} +{"train_loss": 0.0006830318598076701, "global_step": 59773, "epoch": 502, "lr": 6.4890657483987095e-06} +{"train_loss": 0.00022114689636509866, "global_step": 59774, "epoch": 502, "lr": 6.4879742856278235e-06} +{"train_loss": 0.0006534030544571579, "global_step": 59775, "epoch": 502, "lr": 6.4868829082881334e-06} +{"train_loss": 0.0005084284930489957, "global_step": 59776, "epoch": 502, "lr": 6.48579161638182e-06} +{"train_loss": 0.0008496011723764241, "global_step": 59777, "epoch": 502, "lr": 6.484700409910998e-06} +{"train_loss": 0.000695400929544121, "global_step": 59778, "epoch": 502, "lr": 6.483609288877812e-06} +{"train_loss": 0.00043453663238324225, "global_step": 59779, "epoch": 502, "lr": 6.4825182532844195e-06} +{"train_loss": 0.0004224172735121101, "global_step": 59780, "epoch": 502, "lr": 6.481427303132942e-06} +{"train_loss": 0.0005596208502538502, "global_step": 59781, "epoch": 502, "lr": 6.480336438425544e-06} +{"train_loss": 0.0005626099300570786, "global_step": 59782, "epoch": 502, "lr": 6.479245659164346e-06} +{"train_loss": 0.0004518738714978099, "global_step": 59783, "epoch": 502, "lr": 6.478154965351507e-06} +{"train_loss": 0.00023276303545571864, "global_step": 59784, "epoch": 502, "lr": 6.477064356989165e-06} +{"train_loss": 0.00030041194986552, "global_step": 59785, "epoch": 502, "lr": 6.475973834079446e-06} +{"train_loss": 0.0007868555258028209, "global_step": 59786, "epoch": 502, "lr": 6.474883396624509e-06} +{"train_loss": 0.0004483918601181358, "global_step": 59787, "epoch": 502, "lr": 6.473793044626486e-06} +{"train_loss": 0.0002004452544497326, "global_step": 59788, "epoch": 502, "lr": 6.472702778087525e-06} +{"train_loss": 0.00024426577147096395, "global_step": 59789, "epoch": 502, "lr": 6.471612597009752e-06} +{"train_loss": 0.0004968924331478775, "global_step": 59790, "epoch": 502, "lr": 6.470522501395327e-06} +{"train_loss": 0.0008054127683863044, "global_step": 59791, "epoch": 502, "lr": 6.4694324912463854e-06} +{"train_loss": 0.0002602168533485383, "global_step": 59792, "epoch": 502, "lr": 6.468342566565045e-06} +{"train_loss": 0.0005109274061396718, "global_step": 59793, "epoch": 502, "lr": 6.467252727353479e-06} +{"train_loss": 0.000537073879968375, "global_step": 59794, "epoch": 502, "lr": 6.4661629736137985e-06} +{"train_loss": 0.000542435038369149, "global_step": 59795, "epoch": 502, "lr": 6.465073305348168e-06} +{"train_loss": 0.00023968266032170504, "global_step": 59796, "epoch": 502, "lr": 6.463983722558703e-06} +{"train_loss": 0.0004515022155828774, "global_step": 59797, "epoch": 502, "lr": 6.4628942252475675e-06} +{"train_loss": 0.0004453473666217178, "global_step": 59798, "epoch": 502, "lr": 6.4618048134168775e-06} +{"train_loss": 0.0004027094109915197, "global_step": 59799, "epoch": 502, "lr": 6.4607154870687806e-06} +{"train_loss": 0.0005188144859857857, "global_step": 59800, "epoch": 502, "lr": 6.459626246205425e-06} +{"train_loss": 0.0008361421059817076, "global_step": 59801, "epoch": 502, "lr": 6.458537090828937e-06} +{"train_loss": 0.0004730677464976907, "global_step": 59802, "epoch": 502, "lr": 6.45744802094147e-06} +{"train_loss": 0.0003373905783519149, "global_step": 59803, "epoch": 502, "lr": 6.456359036545145e-06} +{"train_loss": 0.0005293184658512473, "global_step": 59804, "epoch": 502, "lr": 6.4552701376421054e-06} +{"train_loss": 0.00034072011476382613, "global_step": 59805, "epoch": 502, "lr": 6.454181324234493e-06} +{"train_loss": 0.0003629086131695658, "global_step": 59806, "epoch": 502, "lr": 6.453092596324439e-06} +{"train_loss": 0.00048777315532788634, "global_step": 59807, "epoch": 502, "lr": 6.452003953914093e-06} +{"train_loss": 0.0004153653862886131, "global_step": 59808, "epoch": 502, "lr": 6.4509153970055855e-06} +{"train_loss": 0.000539979140739888, "global_step": 59809, "epoch": 502, "lr": 6.449826925601043e-06} +{"train_loss": 0.00036695931339636445, "global_step": 59810, "epoch": 502, "lr": 6.448738539702626e-06} +{"train_loss": 0.0003494935226626694, "global_step": 59811, "epoch": 502, "lr": 6.447650239312441e-06} +{"train_loss": 0.0002506219025235623, "global_step": 59812, "epoch": 502, "lr": 6.4465620244326565e-06} +{"train_loss": 0.00049855891847983, "global_step": 59813, "epoch": 502, "lr": 6.445473895065384e-06} +{"train_loss": 0.000576834543608129, "global_step": 59814, "epoch": 502, "lr": 6.444385851212781e-06} +{"train_loss": 0.00041913348832167685, "global_step": 59815, "epoch": 502, "lr": 6.443297892876976e-06} +{"train_loss": 0.00044989478192292154, "global_step": 59816, "epoch": 502, "lr": 6.442210020060085e-06} +{"train_loss": 0.0003097128646913916, "global_step": 59817, "epoch": 502, "lr": 6.441122232764274e-06} +{"train_loss": 0.00035153955104760826, "global_step": 59818, "epoch": 502, "lr": 6.440034530991657e-06} +{"train_loss": 0.00024531909730285406, "global_step": 59819, "epoch": 502, "lr": 6.438946914744393e-06} +{"train_loss": 0.0008457486401312053, "global_step": 59820, "epoch": 502, "lr": 6.437859384024586e-06} +{"train_loss": 0.0003030471852980554, "global_step": 59821, "epoch": 502, "lr": 6.4367719388344016e-06} +{"train_loss": 0.00033634345163591206, "global_step": 59822, "epoch": 502, "lr": 6.43568457917596e-06} +{"train_loss": 0.0004602130502462387, "global_step": 59823, "epoch": 502, "lr": 6.434597305051388e-06} +{"train_loss": 0.000531132856849581, "global_step": 59824, "epoch": 502, "lr": 6.433510116462838e-06} +{"train_loss": 0.0007128759752959013, "global_step": 59825, "epoch": 502, "lr": 6.432423013412425e-06} +{"train_loss": 0.0002961887512356043, "global_step": 59826, "epoch": 502, "lr": 6.43133599590231e-06} +{"train_loss": 0.00066657445859164, "global_step": 59827, "epoch": 502, "lr": 6.430249063934601e-06} +{"train_loss": 0.0006149917026050389, "global_step": 59828, "epoch": 502, "lr": 6.429162217511453e-06} +{"train_loss": 0.00037360770511440933, "global_step": 59829, "epoch": 502, "lr": 6.42807545663498e-06} +{"train_loss": 0.00034296594094485044, "global_step": 59830, "epoch": 502, "lr": 6.426988781307336e-06} +{"train_loss": 0.00025383394677191973, "global_step": 59831, "epoch": 502, "lr": 6.42590219153063e-06} +{"train_loss": 0.0002616884303279221, "global_step": 59832, "epoch": 502, "lr": 6.424815687307023e-06} +{"train_loss": 0.0002684112114366144, "global_step": 59833, "epoch": 502, "lr": 6.423729268638629e-06} +{"train_loss": 0.00034953985596075654, "global_step": 59834, "epoch": 502, "lr": 6.422642935527595e-06} +{"train_loss": 0.0003837778349407017, "global_step": 59835, "epoch": 502, "lr": 6.4215566879760324e-06} +{"train_loss": 0.00037759917904622853, "global_step": 59836, "epoch": 502, "lr": 6.4204705259861e-06} +{"train_loss": 0.00046365606249310076, "global_step": 59837, "epoch": 502, "lr": 6.419384449559906e-06} +{"train_loss": 0.00032752694096416235, "global_step": 59838, "epoch": 502, "lr": 6.418298458699612e-06} +{"train_loss": 0.00035409716656431556, "global_step": 59839, "epoch": 502, "lr": 6.417212553407315e-06} +{"train_loss": 0.00029844100936315954, "global_step": 59840, "epoch": 502, "lr": 6.416126733685179e-06} +{"train_loss": 0.0006072188843972981, "global_step": 59841, "epoch": 502, "lr": 6.415040999535321e-06} +{"train_loss": 0.00033182124025188386, "global_step": 59842, "epoch": 502, "lr": 6.41395535095986e-06} +{"train_loss": 0.00025505395024083555, "global_step": 59843, "epoch": 502, "lr": 6.412869787960957e-06} +{"train_loss": 0.00032826128881424665, "global_step": 59844, "epoch": 502, "lr": 6.411784310540714e-06} +{"train_loss": 0.0005571552901528776, "global_step": 59845, "epoch": 502, "lr": 6.410698918701286e-06} +{"train_loss": 0.00042977792327292264, "global_step": 59846, "epoch": 502, "lr": 6.4096136124447984e-06} +{"train_loss": 0.0007039810298010707, "global_step": 59847, "epoch": 502, "lr": 6.4085283917733605e-06} +{"train_loss": 0.0006019325228407979, "global_step": 59848, "epoch": 502, "lr": 6.4074432566891325e-06} +{"train_loss": 0.0004961979575455189, "global_step": 59849, "epoch": 502, "lr": 6.406358207194224e-06} +{"train_loss": 0.00030429736943915486, "global_step": 59850, "epoch": 502, "lr": 6.405273243290782e-06} +{"train_loss": 0.0006698555080220103, "global_step": 59851, "epoch": 502, "lr": 6.404188364980923e-06} +{"train_loss": 0.00042147625936195254, "global_step": 59852, "epoch": 502, "lr": 6.403103572266789e-06} +{"train_loss": 0.0005548602202907205, "global_step": 59853, "epoch": 502, "lr": 6.402018865150505e-06} +{"train_loss": 0.0003009149804711342, "global_step": 59854, "epoch": 502, "lr": 6.400934243634188e-06} +{"train_loss": 0.0004092560848221183, "global_step": 59855, "epoch": 502, "lr": 6.399849707719985e-06} +{"train_loss": 0.0004231072061043624, "global_step": 59856, "epoch": 502, "lr": 6.398765257410017e-06, "val_loss": 0.015159238129854202} +{"train_loss": 0.0005328943370841444, "global_step": 59857, "epoch": 503, "lr": 6.39768089270642e-06} +{"train_loss": 0.00037434001569636166, "global_step": 59858, "epoch": 503, "lr": 6.396596613611311e-06} +{"train_loss": 0.0006123359780758619, "global_step": 59859, "epoch": 503, "lr": 6.395512420126831e-06} +{"train_loss": 0.0003299677337054163, "global_step": 59860, "epoch": 503, "lr": 6.394428312255107e-06} +{"train_loss": 0.0002625123888719827, "global_step": 59861, "epoch": 503, "lr": 6.39334428999826e-06} +{"train_loss": 0.00035572651540860534, "global_step": 59862, "epoch": 503, "lr": 6.392260353358415e-06} +{"train_loss": 0.00019744674500543624, "global_step": 59863, "epoch": 503, "lr": 6.39117650233772e-06} +{"train_loss": 0.0007887791725806892, "global_step": 59864, "epoch": 503, "lr": 6.39009273693828e-06} +{"train_loss": 0.0002706644299905747, "global_step": 59865, "epoch": 503, "lr": 6.389009057162249e-06} +{"train_loss": 0.0004004306101705879, "global_step": 59866, "epoch": 503, "lr": 6.387925463011724e-06} +{"train_loss": 0.0003386841563042253, "global_step": 59867, "epoch": 503, "lr": 6.386841954488865e-06} +{"train_loss": 0.00035812181886285543, "global_step": 59868, "epoch": 503, "lr": 6.385758531595764e-06} +{"train_loss": 0.0003807965258602053, "global_step": 59869, "epoch": 503, "lr": 6.384675194334583e-06} +{"train_loss": 0.0004927408299408853, "global_step": 59870, "epoch": 503, "lr": 6.383591942707417e-06} +{"train_loss": 0.00029663523309864104, "global_step": 59871, "epoch": 503, "lr": 6.382508776716423e-06} +{"train_loss": 0.00029578167595900595, "global_step": 59872, "epoch": 503, "lr": 6.381425696363713e-06} +{"train_loss": 0.00043171492870897055, "global_step": 59873, "epoch": 503, "lr": 6.380342701651404e-06} +{"train_loss": 0.0002768370322883129, "global_step": 59874, "epoch": 503, "lr": 6.379259792581638e-06} +{"train_loss": 0.00022761226864531636, "global_step": 59875, "epoch": 503, "lr": 6.37817696915653e-06} +{"train_loss": 0.00032869441201910377, "global_step": 59876, "epoch": 503, "lr": 6.3770942313782166e-06} +{"train_loss": 0.0003614961460698396, "global_step": 59877, "epoch": 503, "lr": 6.3760115792488255e-06} +{"train_loss": 0.0004994797054678202, "global_step": 59878, "epoch": 503, "lr": 6.374929012770459e-06} +{"train_loss": 0.0003497573488857597, "global_step": 59879, "epoch": 503, "lr": 6.373846531945271e-06} +{"train_loss": 0.0003952987608499825, "global_step": 59880, "epoch": 503, "lr": 6.372764136775361e-06} +{"train_loss": 0.0002483176358509809, "global_step": 59881, "epoch": 503, "lr": 6.371681827262882e-06} +{"train_loss": 0.00029673188691958785, "global_step": 59882, "epoch": 503, "lr": 6.370599603409933e-06} +{"train_loss": 0.00022912440181244165, "global_step": 59883, "epoch": 503, "lr": 6.369517465218661e-06} +{"train_loss": 0.000390992674510926, "global_step": 59884, "epoch": 503, "lr": 6.368435412691176e-06} +{"train_loss": 0.00038377888267859817, "global_step": 59885, "epoch": 503, "lr": 6.367353445829605e-06} +{"train_loss": 0.0002663101477082819, "global_step": 59886, "epoch": 503, "lr": 6.366271564636078e-06} +{"train_loss": 0.0004938083002343774, "global_step": 59887, "epoch": 503, "lr": 6.365189769112706e-06} +{"train_loss": 0.00027278586640022695, "global_step": 59888, "epoch": 503, "lr": 6.364108059261631e-06} +{"train_loss": 0.0009684762917459011, "global_step": 59889, "epoch": 503, "lr": 6.363026435084962e-06} +{"train_loss": 0.00027848067111335695, "global_step": 59890, "epoch": 503, "lr": 6.3619448965848375e-06} +{"train_loss": 0.00026437011547386646, "global_step": 59891, "epoch": 503, "lr": 6.360863443763371e-06} +{"train_loss": 0.0004111262387596071, "global_step": 59892, "epoch": 503, "lr": 6.359782076622678e-06} +{"train_loss": 0.00037292405613698065, "global_step": 59893, "epoch": 503, "lr": 6.3587007951649015e-06} +{"train_loss": 0.0004349545924924314, "global_step": 59894, "epoch": 503, "lr": 6.357619599392139e-06} +{"train_loss": 0.0004128968867007643, "global_step": 59895, "epoch": 503, "lr": 6.356538489306541e-06} +{"train_loss": 0.00028287002351135015, "global_step": 59896, "epoch": 503, "lr": 6.355457464910208e-06} +{"train_loss": 0.0005453256308101118, "global_step": 59897, "epoch": 503, "lr": 6.354376526205269e-06} +{"train_loss": 0.00031293928623199463, "global_step": 59898, "epoch": 503, "lr": 6.35329567319386e-06} +{"train_loss": 0.00021669373381882906, "global_step": 59899, "epoch": 503, "lr": 6.3522149058780844e-06} +{"train_loss": 0.0006567995296791196, "global_step": 59900, "epoch": 503, "lr": 6.35113422426008e-06} +{"train_loss": 0.0004366859211586416, "global_step": 59901, "epoch": 503, "lr": 6.350053628341951e-06} +{"train_loss": 0.00027318811044096947, "global_step": 59902, "epoch": 503, "lr": 6.348973118125834e-06} +{"train_loss": 0.0005356970359571278, "global_step": 59903, "epoch": 503, "lr": 6.347892693613849e-06} +{"train_loss": 0.0004988525761291385, "global_step": 59904, "epoch": 503, "lr": 6.346812354808101e-06} +{"train_loss": 0.0007148055592551827, "global_step": 59905, "epoch": 503, "lr": 6.345732101710738e-06} +{"train_loss": 0.0005774192395620048, "global_step": 59906, "epoch": 503, "lr": 6.344651934323853e-06} +{"train_loss": 0.0003845763567369431, "global_step": 59907, "epoch": 503, "lr": 6.343571852649588e-06} +{"train_loss": 0.0005037455121055245, "global_step": 59908, "epoch": 503, "lr": 6.342491856690047e-06} +{"train_loss": 0.0003900254669133574, "global_step": 59909, "epoch": 503, "lr": 6.341411946447373e-06} +{"train_loss": 0.00019416688883211464, "global_step": 59910, "epoch": 503, "lr": 6.34033212192367e-06} +{"train_loss": 0.00014783520600758493, "global_step": 59911, "epoch": 503, "lr": 6.339252383121047e-06} +{"train_loss": 0.0003004188765771687, "global_step": 59912, "epoch": 503, "lr": 6.3381727300416525e-06} +{"train_loss": 0.0004934463067911565, "global_step": 59913, "epoch": 503, "lr": 6.337093162687579e-06} +{"train_loss": 0.0005761705106124282, "global_step": 59914, "epoch": 503, "lr": 6.336013681060965e-06} +{"train_loss": 0.0004912869189865887, "global_step": 59915, "epoch": 503, "lr": 6.3349342851639295e-06} +{"train_loss": 0.0005070450133644044, "global_step": 59916, "epoch": 503, "lr": 6.333854974998571e-06} +{"train_loss": 0.0005222929758019745, "global_step": 59917, "epoch": 503, "lr": 6.332775750567038e-06} +{"train_loss": 0.00027781177777796984, "global_step": 59918, "epoch": 503, "lr": 6.3316966118714186e-06} +{"train_loss": 0.0004911892465315759, "global_step": 59919, "epoch": 503, "lr": 6.330617558913865e-06} +{"train_loss": 0.00036131328670307994, "global_step": 59920, "epoch": 503, "lr": 6.32953859169646e-06} +{"train_loss": 0.0006484129698947072, "global_step": 59921, "epoch": 503, "lr": 6.328459710221357e-06} +{"train_loss": 0.00020426166884135455, "global_step": 59922, "epoch": 503, "lr": 6.327380914490655e-06} +{"train_loss": 0.0006265551201067865, "global_step": 59923, "epoch": 503, "lr": 6.326302204506468e-06} +{"train_loss": 0.0003605398233048618, "global_step": 59924, "epoch": 503, "lr": 6.325223580270928e-06} +{"train_loss": 0.00037094674189575016, "global_step": 59925, "epoch": 503, "lr": 6.324145041786133e-06} +{"train_loss": 0.000260552711552009, "global_step": 59926, "epoch": 503, "lr": 6.323066589054227e-06} +{"train_loss": 0.00017578947881702334, "global_step": 59927, "epoch": 503, "lr": 6.3219882220773015e-06} +{"train_loss": 0.0010517856571823359, "global_step": 59928, "epoch": 503, "lr": 6.320909940857495e-06} +{"train_loss": 0.0007247606990858912, "global_step": 59929, "epoch": 503, "lr": 6.319831745396909e-06} +{"train_loss": 0.00043854524847120047, "global_step": 59930, "epoch": 503, "lr": 6.318753635697671e-06} +{"train_loss": 0.00021323109103832394, "global_step": 59931, "epoch": 503, "lr": 6.317675611761892e-06} +{"train_loss": 0.00027402472915127873, "global_step": 59932, "epoch": 503, "lr": 6.316597673591684e-06} +{"train_loss": 0.00038547077565453947, "global_step": 59933, "epoch": 503, "lr": 6.315519821189181e-06} +{"train_loss": 0.0006000582361593843, "global_step": 59934, "epoch": 503, "lr": 6.314442054556491e-06} +{"train_loss": 0.0003391319187358022, "global_step": 59935, "epoch": 503, "lr": 6.313364373695713e-06} +{"train_loss": 0.0005311385029926896, "global_step": 59936, "epoch": 503, "lr": 6.3122867786089834e-06} +{"train_loss": 0.0005864726845175028, "global_step": 59937, "epoch": 503, "lr": 6.3112092692984075e-06} +{"train_loss": 0.0002476549125276506, "global_step": 59938, "epoch": 503, "lr": 6.310131845766115e-06} +{"train_loss": 0.00033587179495953023, "global_step": 59939, "epoch": 503, "lr": 6.309054508014195e-06} +{"train_loss": 0.0003798917168751359, "global_step": 59940, "epoch": 503, "lr": 6.3079772560447946e-06} +{"train_loss": 0.0003854050883091986, "global_step": 59941, "epoch": 503, "lr": 6.306900089860012e-06} +{"train_loss": 0.0004293788515496999, "global_step": 59942, "epoch": 503, "lr": 6.305823009461953e-06} +{"train_loss": 0.00021856592502444983, "global_step": 59943, "epoch": 503, "lr": 6.304746014852752e-06} +{"train_loss": 0.0004264322924427688, "global_step": 59944, "epoch": 503, "lr": 6.3036691060345046e-06} +{"train_loss": 0.0003725917194969952, "global_step": 59945, "epoch": 503, "lr": 6.302592283009345e-06} +{"train_loss": 0.0003437378618400544, "global_step": 59946, "epoch": 503, "lr": 6.301515545779374e-06} +{"train_loss": 0.0006955702556297183, "global_step": 59947, "epoch": 503, "lr": 6.3004388943467e-06} +{"train_loss": 0.0004221890412736684, "global_step": 59948, "epoch": 503, "lr": 6.299362328713459e-06} +{"train_loss": 0.000348236586432904, "global_step": 59949, "epoch": 503, "lr": 6.298285848881736e-06} +{"train_loss": 0.0006327979499474168, "global_step": 59950, "epoch": 503, "lr": 6.297209454853676e-06} +{"train_loss": 0.0005368094425648451, "global_step": 59951, "epoch": 503, "lr": 6.296133146631361e-06} +{"train_loss": 0.00043056230060756207, "global_step": 59952, "epoch": 503, "lr": 6.29505692421693e-06} +{"train_loss": 0.00031368026975542307, "global_step": 59953, "epoch": 503, "lr": 6.293980787612485e-06} +{"train_loss": 0.0003981390327680856, "global_step": 59954, "epoch": 503, "lr": 6.292904736820132e-06} +{"train_loss": 0.0009974417043849826, "global_step": 59955, "epoch": 503, "lr": 6.291828771842001e-06} +{"train_loss": 0.00027940195286646485, "global_step": 59956, "epoch": 503, "lr": 6.290752892680185e-06} +{"train_loss": 0.00034093373687937856, "global_step": 59957, "epoch": 503, "lr": 6.289677099336816e-06} +{"train_loss": 0.000226469652261585, "global_step": 59958, "epoch": 503, "lr": 6.288601391813987e-06} +{"train_loss": 0.00031579332426190376, "global_step": 59959, "epoch": 503, "lr": 6.287525770113828e-06} +{"train_loss": 0.0007476701866835356, "global_step": 59960, "epoch": 503, "lr": 6.286450234238428e-06} +{"train_loss": 0.00027445005252957344, "global_step": 59961, "epoch": 503, "lr": 6.285374784189929e-06} +{"train_loss": 0.00027258822228759527, "global_step": 59962, "epoch": 503, "lr": 6.284299419970413e-06} +{"train_loss": 0.000509140023496002, "global_step": 59963, "epoch": 503, "lr": 6.283224141582017e-06} +{"train_loss": 0.0003705901326611638, "global_step": 59964, "epoch": 503, "lr": 6.282148949026828e-06} +{"train_loss": 0.0002785741235129535, "global_step": 59965, "epoch": 503, "lr": 6.281073842306978e-06} +{"train_loss": 0.0004471236024983227, "global_step": 59966, "epoch": 503, "lr": 6.279998821424565e-06} +{"train_loss": 0.00043345591984689236, "global_step": 59967, "epoch": 503, "lr": 6.27892388638171e-06} +{"train_loss": 0.0006101605831645429, "global_step": 59968, "epoch": 503, "lr": 6.2778490371805054e-06} +{"train_loss": 0.00041479666833765805, "global_step": 59969, "epoch": 503, "lr": 6.276774273823083e-06} +{"train_loss": 0.00039959800778888166, "global_step": 59970, "epoch": 503, "lr": 6.275699596311535e-06} +{"train_loss": 0.00021778320660814643, "global_step": 59971, "epoch": 503, "lr": 6.274625004647988e-06} +{"train_loss": 0.0003285730490460992, "global_step": 59972, "epoch": 503, "lr": 6.273550498834546e-06} +{"train_loss": 0.00040349323535338044, "global_step": 59973, "epoch": 503, "lr": 6.2724760788733015e-06} +{"train_loss": 0.00031597420456819236, "global_step": 59974, "epoch": 503, "lr": 6.271401744766392e-06} +{"train_loss": 0.000410920731721352, "global_step": 59975, "epoch": 503, "lr": 6.270327496515905e-06, "val_loss": 0.025234023109078407} +{"train_loss": 0.0005615592235699296, "global_step": 59976, "epoch": 504, "lr": 6.269253334123965e-06} +{"train_loss": 0.00027451090863905847, "global_step": 59977, "epoch": 504, "lr": 6.2681792575926656e-06} +{"train_loss": 0.001034909626469016, "global_step": 59978, "epoch": 504, "lr": 6.267105266924134e-06} +{"train_loss": 0.00036272648139856756, "global_step": 59979, "epoch": 504, "lr": 6.266031362120467e-06} +{"train_loss": 0.00043177910265512764, "global_step": 59980, "epoch": 504, "lr": 6.264957543183769e-06} +{"train_loss": 0.0002583295863587409, "global_step": 59981, "epoch": 504, "lr": 6.263883810116161e-06} +{"train_loss": 0.0003565005608834326, "global_step": 59982, "epoch": 504, "lr": 6.262810162919735e-06} +{"train_loss": 0.0004822330956812948, "global_step": 59983, "epoch": 504, "lr": 6.2617366015966185e-06} +{"train_loss": 0.0005513050127774477, "global_step": 59984, "epoch": 504, "lr": 6.260663126148914e-06} +{"train_loss": 0.00029415416065603495, "global_step": 59985, "epoch": 504, "lr": 6.259589736578708e-06} +{"train_loss": 0.00042931680218316615, "global_step": 59986, "epoch": 504, "lr": 6.258516432888139e-06} +{"train_loss": 0.0003779387043323368, "global_step": 59987, "epoch": 504, "lr": 6.257443215079289e-06} +{"train_loss": 0.00044953604810871184, "global_step": 59988, "epoch": 504, "lr": 6.256370083154284e-06} +{"train_loss": 0.00025467792875133455, "global_step": 59989, "epoch": 504, "lr": 6.255297037115215e-06} +{"train_loss": 0.000316090154228732, "global_step": 59990, "epoch": 504, "lr": 6.2542240769642105e-06} +{"train_loss": 0.0010782411554828286, "global_step": 59991, "epoch": 504, "lr": 6.253151202703355e-06} +{"train_loss": 0.00042467168532311916, "global_step": 59992, "epoch": 504, "lr": 6.252078414334761e-06} +{"train_loss": 0.0004614419594872743, "global_step": 59993, "epoch": 504, "lr": 6.2510057118605415e-06} +{"train_loss": 0.0003541451587807387, "global_step": 59994, "epoch": 504, "lr": 6.249933095282795e-06} +{"train_loss": 0.00041973459883593023, "global_step": 59995, "epoch": 504, "lr": 6.2488605646036254e-06} +{"train_loss": 0.0006854844396002591, "global_step": 59996, "epoch": 504, "lr": 6.2477881198251544e-06} +{"train_loss": 0.0004985803971067071, "global_step": 59997, "epoch": 504, "lr": 6.2467157609494674e-06} +{"train_loss": 0.000517911568749696, "global_step": 59998, "epoch": 504, "lr": 6.245643487978692e-06} +{"train_loss": 0.0003829153429251164, "global_step": 59999, "epoch": 504, "lr": 6.244571300914909e-06} +{"train_loss": 0.0002802198869176209, "global_step": 60000, "epoch": 504, "lr": 6.24349919976025e-06} +{"train_loss": 0.0002260827604914084, "global_step": 60001, "epoch": 504, "lr": 6.242427184516792e-06} +{"train_loss": 0.00046135683078318834, "global_step": 60002, "epoch": 504, "lr": 6.241355255186659e-06} +{"train_loss": 0.0005027662846259773, "global_step": 60003, "epoch": 504, "lr": 6.240283411771958e-06} +{"train_loss": 0.000461749907117337, "global_step": 60004, "epoch": 504, "lr": 6.239211654274768e-06} +{"train_loss": 0.00051191943930462, "global_step": 60005, "epoch": 504, "lr": 6.2381399826972276e-06} +{"train_loss": 0.0003577838942874223, "global_step": 60006, "epoch": 504, "lr": 6.237068397041413e-06} +{"train_loss": 0.0002443761331960559, "global_step": 60007, "epoch": 504, "lr": 6.235996897309443e-06} +{"train_loss": 0.0003663577663246542, "global_step": 60008, "epoch": 504, "lr": 6.2349254835034125e-06} +{"train_loss": 0.00027119318838231266, "global_step": 60009, "epoch": 504, "lr": 6.23385415562544e-06} +{"train_loss": 0.0002823451941367239, "global_step": 60010, "epoch": 504, "lr": 6.2327829136776205e-06} +{"train_loss": 0.00039722732617519796, "global_step": 60011, "epoch": 504, "lr": 6.231711757662045e-06} +{"train_loss": 0.00047938767238520086, "global_step": 60012, "epoch": 504, "lr": 6.230640687580835e-06} +{"train_loss": 0.0002735006273724139, "global_step": 60013, "epoch": 504, "lr": 6.2295697034360775e-06} +{"train_loss": 0.0005721092456951737, "global_step": 60014, "epoch": 504, "lr": 6.228498805229893e-06} +{"train_loss": 0.0002569564385339618, "global_step": 60015, "epoch": 504, "lr": 6.22742799296438e-06} +{"train_loss": 0.0004277945845387876, "global_step": 60016, "epoch": 504, "lr": 6.226357266641619e-06} +{"train_loss": 0.0002964447485283017, "global_step": 60017, "epoch": 504, "lr": 6.225286626263743e-06} +{"train_loss": 0.00034670313470996916, "global_step": 60018, "epoch": 504, "lr": 6.224216071832828e-06} +{"train_loss": 0.0002636302378959954, "global_step": 60019, "epoch": 504, "lr": 6.2231456033509996e-06} +{"train_loss": 0.00040953169809654355, "global_step": 60020, "epoch": 504, "lr": 6.222075220820334e-06} +{"train_loss": 0.00032412121072411537, "global_step": 60021, "epoch": 504, "lr": 6.221004924242963e-06} +{"train_loss": 0.0005205101333558559, "global_step": 60022, "epoch": 504, "lr": 6.219934713620967e-06} +{"train_loss": 0.00031794828828424215, "global_step": 60023, "epoch": 504, "lr": 6.218864588956441e-06} +{"train_loss": 0.00035110051976516843, "global_step": 60024, "epoch": 504, "lr": 6.21779455025151e-06} +{"train_loss": 0.0003581311902962625, "global_step": 60025, "epoch": 504, "lr": 6.216724597508256e-06} +{"train_loss": 0.00028058834141120315, "global_step": 60026, "epoch": 504, "lr": 6.2156547307287875e-06} +{"train_loss": 0.0002647206129040569, "global_step": 60027, "epoch": 504, "lr": 6.214584949915197e-06} +{"train_loss": 0.0003991733829025179, "global_step": 60028, "epoch": 504, "lr": 6.213515255069602e-06} +{"train_loss": 0.0003851819201372564, "global_step": 60029, "epoch": 504, "lr": 6.212445646194081e-06} +{"train_loss": 0.0005901292315684259, "global_step": 60030, "epoch": 504, "lr": 6.211376123290741e-06} +{"train_loss": 0.0003382572322152555, "global_step": 60031, "epoch": 504, "lr": 6.2103066863616996e-06} +{"train_loss": 0.0003408961638342589, "global_step": 60032, "epoch": 504, "lr": 6.209237335409035e-06} +{"train_loss": 0.00028918750467710197, "global_step": 60033, "epoch": 504, "lr": 6.208168070434861e-06} +{"train_loss": 0.0003523874911479652, "global_step": 60034, "epoch": 504, "lr": 6.207098891441277e-06} +{"train_loss": 0.0003322460106573999, "global_step": 60035, "epoch": 504, "lr": 6.206029798430357e-06} +{"train_loss": 0.0004293376987334341, "global_step": 60036, "epoch": 504, "lr": 6.204960791404235e-06} +{"train_loss": 0.00047361667384393513, "global_step": 60037, "epoch": 504, "lr": 6.203891870364981e-06} +{"train_loss": 0.0004384265630505979, "global_step": 60038, "epoch": 504, "lr": 6.202823035314714e-06} +{"train_loss": 0.00036826933501288295, "global_step": 60039, "epoch": 504, "lr": 6.201754286255518e-06} +{"train_loss": 0.00017687112267594784, "global_step": 60040, "epoch": 504, "lr": 6.2006856231895065e-06} +{"train_loss": 0.0007720094290561974, "global_step": 60041, "epoch": 504, "lr": 6.199617046118772e-06} +{"train_loss": 0.00033252922003157437, "global_step": 60042, "epoch": 504, "lr": 6.198548555045397e-06} +{"train_loss": 0.0003429039497859776, "global_step": 60043, "epoch": 504, "lr": 6.197480149971507e-06} +{"train_loss": 0.00039489715709351003, "global_step": 60044, "epoch": 504, "lr": 6.196411830899173e-06} +{"train_loss": 0.0005816988996230066, "global_step": 60045, "epoch": 504, "lr": 6.195343597830511e-06} +{"train_loss": 0.0003177992766723037, "global_step": 60046, "epoch": 504, "lr": 6.194275450767617e-06} +{"train_loss": 0.00020718162704724818, "global_step": 60047, "epoch": 504, "lr": 6.193207389712569e-06} +{"train_loss": 0.0002708778774831444, "global_step": 60048, "epoch": 504, "lr": 6.192139414667491e-06} +{"train_loss": 0.0003903783217538148, "global_step": 60049, "epoch": 504, "lr": 6.191071525634456e-06} +{"train_loss": 0.00033175182761624455, "global_step": 60050, "epoch": 504, "lr": 6.1900037226155835e-06} +{"train_loss": 0.0007434692815877497, "global_step": 60051, "epoch": 504, "lr": 6.18893600561295e-06} +{"train_loss": 0.00028480851324275136, "global_step": 60052, "epoch": 504, "lr": 6.187868374628664e-06} +{"train_loss": 0.00025180488592013717, "global_step": 60053, "epoch": 504, "lr": 6.186800829664824e-06} +{"train_loss": 0.00040767143946141005, "global_step": 60054, "epoch": 504, "lr": 6.185733370723506e-06} +{"train_loss": 0.0007356369169428945, "global_step": 60055, "epoch": 504, "lr": 6.184665997806832e-06} +{"train_loss": 0.0005129038472659886, "global_step": 60056, "epoch": 504, "lr": 6.183598710916871e-06} +{"train_loss": 0.0004284936876501888, "global_step": 60057, "epoch": 504, "lr": 6.182531510055745e-06} +{"train_loss": 0.00034401967423036695, "global_step": 60058, "epoch": 504, "lr": 6.181464395225528e-06} +{"train_loss": 0.0004631705232895911, "global_step": 60059, "epoch": 504, "lr": 6.180397366428336e-06} +{"train_loss": 0.0004086557019036263, "global_step": 60060, "epoch": 504, "lr": 6.179330423666241e-06} +{"train_loss": 0.00036613672273233533, "global_step": 60061, "epoch": 504, "lr": 6.178263566941356e-06} +{"train_loss": 0.00031978479819372296, "global_step": 60062, "epoch": 504, "lr": 6.177196796255763e-06} +{"train_loss": 0.00027057703118771315, "global_step": 60063, "epoch": 504, "lr": 6.176130111611572e-06} +{"train_loss": 0.0005433107144199312, "global_step": 60064, "epoch": 504, "lr": 6.1750635130108535e-06} +{"train_loss": 0.0002598668506834656, "global_step": 60065, "epoch": 504, "lr": 6.173997000455728e-06} +{"train_loss": 0.00027012109057977796, "global_step": 60066, "epoch": 504, "lr": 6.172930573948272e-06} +{"train_loss": 0.00025103031657636166, "global_step": 60067, "epoch": 504, "lr": 6.171864233490587e-06} +{"train_loss": 0.00032656334224157035, "global_step": 60068, "epoch": 504, "lr": 6.170797979084758e-06} +{"train_loss": 0.0002865355054382235, "global_step": 60069, "epoch": 504, "lr": 6.169731810732898e-06} +{"train_loss": 0.00018925973563455045, "global_step": 60070, "epoch": 504, "lr": 6.168665728437073e-06} +{"train_loss": 0.00019559603242669255, "global_step": 60071, "epoch": 504, "lr": 6.167599732199397e-06} +{"train_loss": 0.0002105707098962739, "global_step": 60072, "epoch": 504, "lr": 6.166533822021964e-06} +{"train_loss": 0.0004203599237371236, "global_step": 60073, "epoch": 504, "lr": 6.165467997906843e-06} +{"train_loss": 0.00037918344605714083, "global_step": 60074, "epoch": 504, "lr": 6.164402259856156e-06} +{"train_loss": 0.0005489556933753192, "global_step": 60075, "epoch": 504, "lr": 6.1633366078719665e-06} +{"train_loss": 0.0005180349107831717, "global_step": 60076, "epoch": 504, "lr": 6.1622710419563965e-06} +{"train_loss": 0.0004097349301446229, "global_step": 60077, "epoch": 504, "lr": 6.161205562111516e-06} +{"train_loss": 0.0003168522089254111, "global_step": 60078, "epoch": 504, "lr": 6.160140168339429e-06} +{"train_loss": 0.0005526440218091011, "global_step": 60079, "epoch": 504, "lr": 6.159074860642228e-06} +{"train_loss": 0.0002920708211604506, "global_step": 60080, "epoch": 504, "lr": 6.158009639021989e-06} +{"train_loss": 0.00044980531674809754, "global_step": 60081, "epoch": 504, "lr": 6.156944503480827e-06} +{"train_loss": 0.00038263635360635817, "global_step": 60082, "epoch": 504, "lr": 6.155879454020802e-06} +{"train_loss": 0.0004482853692024946, "global_step": 60083, "epoch": 504, "lr": 6.1548144906440396e-06} +{"train_loss": 0.00020827146363444626, "global_step": 60084, "epoch": 504, "lr": 6.153749613352616e-06} +{"train_loss": 0.0002325177629245445, "global_step": 60085, "epoch": 504, "lr": 6.1526848221486075e-06} +{"train_loss": 0.0003603362711146474, "global_step": 60086, "epoch": 504, "lr": 6.151620117034129e-06} +{"train_loss": 0.00048610244994051754, "global_step": 60087, "epoch": 504, "lr": 6.150555498011251e-06} +{"train_loss": 0.00042839423986151814, "global_step": 60088, "epoch": 504, "lr": 6.149490965082083e-06} +{"train_loss": 0.000430485320976004, "global_step": 60089, "epoch": 504, "lr": 6.148426518248696e-06} +{"train_loss": 0.00035436026519164443, "global_step": 60090, "epoch": 504, "lr": 6.147362157513192e-06} +{"train_loss": 0.0005021871766075492, "global_step": 60091, "epoch": 504, "lr": 6.1462978828776605e-06} +{"train_loss": 0.0004055440367665142, "global_step": 60092, "epoch": 504, "lr": 6.145233694344182e-06} +{"train_loss": 0.0004707752668764442, "global_step": 60093, "epoch": 504, "lr": 6.14416959191485e-06} +{"train_loss": 0.0003993053929860696, "global_step": 60094, "epoch": 504, "lr": 6.143105575591762e-06, "val_loss": 0.04680126532912254} +{"train_loss": 0.00037004289333708584, "global_step": 60095, "epoch": 505, "lr": 6.142041645376995e-06} +{"train_loss": 0.0004407971864566207, "global_step": 60096, "epoch": 505, "lr": 6.140977801272652e-06} +{"train_loss": 0.0006677934434264898, "global_step": 60097, "epoch": 505, "lr": 6.139914043280803e-06} +{"train_loss": 0.00022649296442978084, "global_step": 60098, "epoch": 505, "lr": 6.13885037140356e-06} +{"train_loss": 0.0005221675965003669, "global_step": 60099, "epoch": 505, "lr": 6.137786785642985e-06} +{"train_loss": 0.0003362014831509441, "global_step": 60100, "epoch": 505, "lr": 6.136723286001189e-06} +{"train_loss": 0.00038531605969183147, "global_step": 60101, "epoch": 505, "lr": 6.135659872480243e-06} +{"train_loss": 0.00037000569864176214, "global_step": 60102, "epoch": 505, "lr": 6.1345965450822555e-06} +{"train_loss": 0.00031909774406813085, "global_step": 60103, "epoch": 505, "lr": 6.133533303809297e-06} +{"train_loss": 0.0003820850106421858, "global_step": 60104, "epoch": 505, "lr": 6.1324701486634494e-06} +{"train_loss": 0.00025739215197972953, "global_step": 60105, "epoch": 505, "lr": 6.1314070796468225e-06} +{"train_loss": 0.00032358962926082313, "global_step": 60106, "epoch": 505, "lr": 6.130344096761481e-06} +{"train_loss": 0.0002217359869973734, "global_step": 60107, "epoch": 505, "lr": 6.129281200009529e-06} +{"train_loss": 0.00041176305967383087, "global_step": 60108, "epoch": 505, "lr": 6.1282183893930366e-06} +{"train_loss": 0.00031571497675031424, "global_step": 60109, "epoch": 505, "lr": 6.127155664914113e-06} +{"train_loss": 0.00036461788113228977, "global_step": 60110, "epoch": 505, "lr": 6.126093026574831e-06} +{"train_loss": 0.0004983917460776865, "global_step": 60111, "epoch": 505, "lr": 6.125030474377269e-06} +{"train_loss": 0.0005045242141932249, "global_step": 60112, "epoch": 505, "lr": 6.123968008323533e-06} +{"train_loss": 0.0004604615969583392, "global_step": 60113, "epoch": 505, "lr": 6.122905628415687e-06} +{"train_loss": 0.0003007483610417694, "global_step": 60114, "epoch": 505, "lr": 6.121843334655836e-06} +{"train_loss": 0.00037772071664221585, "global_step": 60115, "epoch": 505, "lr": 6.1207811270460605e-06} +{"train_loss": 0.00028660654788836837, "global_step": 60116, "epoch": 505, "lr": 6.119719005588437e-06} +{"train_loss": 0.00024978964938782156, "global_step": 60117, "epoch": 505, "lr": 6.118656970285064e-06} +{"train_loss": 0.0003301073156762868, "global_step": 60118, "epoch": 505, "lr": 6.117595021138006e-06} +{"train_loss": 0.00026913295732811093, "global_step": 60119, "epoch": 505, "lr": 6.116533158149379e-06} +{"train_loss": 0.0004524633113760501, "global_step": 60120, "epoch": 505, "lr": 6.115471381321236e-06} +{"train_loss": 0.00026879081269726157, "global_step": 60121, "epoch": 505, "lr": 6.114409690655687e-06} +{"train_loss": 0.00034593199961818755, "global_step": 60122, "epoch": 505, "lr": 6.113348086154808e-06} +{"train_loss": 0.0003458167193457484, "global_step": 60123, "epoch": 505, "lr": 6.112286567820669e-06} +{"train_loss": 0.0010940753854811192, "global_step": 60124, "epoch": 505, "lr": 6.111225135655379e-06} +{"train_loss": 0.0003329058235976845, "global_step": 60125, "epoch": 505, "lr": 6.110163789661e-06} +{"train_loss": 0.00041966960998252034, "global_step": 60126, "epoch": 505, "lr": 6.109102529839633e-06} +{"train_loss": 0.00033739692298695445, "global_step": 60127, "epoch": 505, "lr": 6.108041356193345e-06} +{"train_loss": 0.00020358023175504059, "global_step": 60128, "epoch": 505, "lr": 6.106980268724227e-06} +{"train_loss": 0.0002966081374324858, "global_step": 60129, "epoch": 505, "lr": 6.105919267434379e-06} +{"train_loss": 0.0002814539766404778, "global_step": 60130, "epoch": 505, "lr": 6.104858352325854e-06} +{"train_loss": 0.0002917250385507941, "global_step": 60131, "epoch": 505, "lr": 6.103797523400761e-06} +{"train_loss": 0.000541453598998487, "global_step": 60132, "epoch": 505, "lr": 6.102736780661167e-06} +{"train_loss": 0.0009079108713194728, "global_step": 60133, "epoch": 505, "lr": 6.101676124109163e-06} +{"train_loss": 0.0002498130197636783, "global_step": 60134, "epoch": 505, "lr": 6.10061555374683e-06} +{"train_loss": 0.00021843303693458438, "global_step": 60135, "epoch": 505, "lr": 6.09955506957624e-06} +{"train_loss": 0.00022064850782044232, "global_step": 60136, "epoch": 505, "lr": 6.098494671599492e-06} +{"train_loss": 0.00020259516895748675, "global_step": 60137, "epoch": 505, "lr": 6.097434359818649e-06} +{"train_loss": 0.00048042889102362096, "global_step": 60138, "epoch": 505, "lr": 6.096374134235816e-06} +{"train_loss": 0.0006424002349376678, "global_step": 60139, "epoch": 505, "lr": 6.0953139948530524e-06} +{"train_loss": 0.0005226523499004543, "global_step": 60140, "epoch": 505, "lr": 6.094253941672457e-06} +{"train_loss": 0.0009010256035253406, "global_step": 60141, "epoch": 505, "lr": 6.093193974696104e-06} +{"train_loss": 0.00023458965006284416, "global_step": 60142, "epoch": 505, "lr": 6.092134093926061e-06} +{"train_loss": 0.000560350832529366, "global_step": 60143, "epoch": 505, "lr": 6.091074299364435e-06} +{"train_loss": 0.0005250297836028039, "global_step": 60144, "epoch": 505, "lr": 6.0900145910132826e-06} +{"train_loss": 0.0003690350567921996, "global_step": 60145, "epoch": 505, "lr": 6.08895496887471e-06} +{"train_loss": 0.00025207819999195635, "global_step": 60146, "epoch": 505, "lr": 6.087895432950768e-06} +{"train_loss": 0.0005712199490517378, "global_step": 60147, "epoch": 505, "lr": 6.086835983243561e-06} +{"train_loss": 0.0003117861342616379, "global_step": 60148, "epoch": 505, "lr": 6.085776619755162e-06} +{"train_loss": 0.0003321458352729678, "global_step": 60149, "epoch": 505, "lr": 6.084717342487639e-06} +{"train_loss": 0.00037342574796639383, "global_step": 60150, "epoch": 505, "lr": 6.083658151443095e-06} +{"train_loss": 0.00040778450784273446, "global_step": 60151, "epoch": 505, "lr": 6.082599046623582e-06} +{"train_loss": 0.0004480357747524977, "global_step": 60152, "epoch": 505, "lr": 6.081540028031207e-06} +{"train_loss": 0.000412001769291237, "global_step": 60153, "epoch": 505, "lr": 6.080481095668034e-06} +{"train_loss": 0.00040719719254411757, "global_step": 60154, "epoch": 505, "lr": 6.0794222495361374e-06} +{"train_loss": 0.00028363894671201706, "global_step": 60155, "epoch": 505, "lr": 6.078363489637606e-06} +{"train_loss": 0.0003672995662782341, "global_step": 60156, "epoch": 505, "lr": 6.07730481597451e-06} +{"train_loss": 0.0003734087513294071, "global_step": 60157, "epoch": 505, "lr": 6.076246228548943e-06} +{"train_loss": 0.0004469621053431183, "global_step": 60158, "epoch": 505, "lr": 6.075187727362969e-06} +{"train_loss": 0.0003521183680277318, "global_step": 60159, "epoch": 505, "lr": 6.074129312418675e-06} +{"train_loss": 0.00024937765556387603, "global_step": 60160, "epoch": 505, "lr": 6.073070983718126e-06} +{"train_loss": 0.00044783626799471676, "global_step": 60161, "epoch": 505, "lr": 6.072012741263422e-06} +{"train_loss": 0.0003620363131631166, "global_step": 60162, "epoch": 505, "lr": 6.0709545850566156e-06} +{"train_loss": 0.0005656766588799655, "global_step": 60163, "epoch": 505, "lr": 6.0698965150997985e-06} +{"train_loss": 0.00038646828033961356, "global_step": 60164, "epoch": 505, "lr": 6.068838531395055e-06} +{"train_loss": 0.00027345100534148514, "global_step": 60165, "epoch": 505, "lr": 6.067780633944442e-06} +{"train_loss": 0.0006796069792471826, "global_step": 60166, "epoch": 505, "lr": 6.066722822750059e-06} +{"train_loss": 0.00029425323009490967, "global_step": 60167, "epoch": 505, "lr": 6.065665097813978e-06} +{"train_loss": 0.00046004907926544547, "global_step": 60168, "epoch": 505, "lr": 6.064607459138255e-06} +{"train_loss": 0.0003653625608421862, "global_step": 60169, "epoch": 505, "lr": 6.063549906724992e-06} +{"train_loss": 0.0003774918441195041, "global_step": 60170, "epoch": 505, "lr": 6.0624924405762396e-06} +{"train_loss": 0.0006379400147125125, "global_step": 60171, "epoch": 505, "lr": 6.061435060694104e-06} +{"train_loss": 0.00019052854622714221, "global_step": 60172, "epoch": 505, "lr": 6.060377767080649e-06} +{"train_loss": 0.0006574023864232004, "global_step": 60173, "epoch": 505, "lr": 6.059320559737935e-06} +{"train_loss": 0.0005065351142548025, "global_step": 60174, "epoch": 505, "lr": 6.058263438668061e-06} +{"train_loss": 0.00027974124532192945, "global_step": 60175, "epoch": 505, "lr": 6.057206403873083e-06} +{"train_loss": 0.0003352389030624181, "global_step": 60176, "epoch": 505, "lr": 6.056149455355098e-06} +{"train_loss": 0.0003630218852777034, "global_step": 60177, "epoch": 505, "lr": 6.0550925931161515e-06} +{"train_loss": 0.00041812253766693175, "global_step": 60178, "epoch": 505, "lr": 6.054035817158354e-06} +{"train_loss": 0.0005912489723414183, "global_step": 60179, "epoch": 505, "lr": 6.05297912748376e-06} +{"train_loss": 0.0003505102067720145, "global_step": 60180, "epoch": 505, "lr": 6.051922524094434e-06} +{"train_loss": 0.000434571091318503, "global_step": 60181, "epoch": 505, "lr": 6.050866006992472e-06} +{"train_loss": 0.00044772063847631216, "global_step": 60182, "epoch": 505, "lr": 6.049809576179932e-06} +{"train_loss": 0.0004129156586714089, "global_step": 60183, "epoch": 505, "lr": 6.048753231658904e-06} +{"train_loss": 0.00023235804110299796, "global_step": 60184, "epoch": 505, "lr": 6.0476969734314545e-06} +{"train_loss": 0.0005482553970068693, "global_step": 60185, "epoch": 505, "lr": 6.046640801499648e-06} +{"train_loss": 0.0003554101858753711, "global_step": 60186, "epoch": 505, "lr": 6.045584715865576e-06} +{"train_loss": 0.00031296350061893463, "global_step": 60187, "epoch": 505, "lr": 6.0445287165312894e-06} +{"train_loss": 0.00042629390372894704, "global_step": 60188, "epoch": 505, "lr": 6.04347280349889e-06} +{"train_loss": 0.0004807096265722066, "global_step": 60189, "epoch": 505, "lr": 6.042416976770421e-06} +{"train_loss": 0.00031817107810638845, "global_step": 60190, "epoch": 505, "lr": 6.041361236347981e-06} +{"train_loss": 0.0003429703356232494, "global_step": 60191, "epoch": 505, "lr": 6.040305582233624e-06} +{"train_loss": 0.00035361264599487185, "global_step": 60192, "epoch": 505, "lr": 6.039250014429437e-06} +{"train_loss": 0.0006418669945560396, "global_step": 60193, "epoch": 505, "lr": 6.03819453293748e-06} +{"train_loss": 0.00047198942047543824, "global_step": 60194, "epoch": 505, "lr": 6.0371391377598395e-06} +{"train_loss": 0.0006641194922849536, "global_step": 60195, "epoch": 505, "lr": 6.03608382889857e-06} +{"train_loss": 0.0007391266990453005, "global_step": 60196, "epoch": 505, "lr": 6.035028606355764e-06} +{"train_loss": 0.0002831268066074699, "global_step": 60197, "epoch": 505, "lr": 6.033973470133469e-06} +{"train_loss": 0.00027446402236819267, "global_step": 60198, "epoch": 505, "lr": 6.032918420233785e-06} +{"train_loss": 0.0004752109234686941, "global_step": 60199, "epoch": 505, "lr": 6.031863456658754e-06} +{"train_loss": 0.0005890723550692201, "global_step": 60200, "epoch": 505, "lr": 6.030808579410474e-06} +{"train_loss": 0.0007927244296297431, "global_step": 60201, "epoch": 505, "lr": 6.029753788490994e-06} +{"train_loss": 0.00028901241603307426, "global_step": 60202, "epoch": 505, "lr": 6.028699083902401e-06} +{"train_loss": 0.00027825491270050406, "global_step": 60203, "epoch": 505, "lr": 6.027644465646764e-06} +{"train_loss": 0.00030314200557768345, "global_step": 60204, "epoch": 505, "lr": 6.02658993372614e-06} +{"train_loss": 0.000498597917612642, "global_step": 60205, "epoch": 505, "lr": 6.025535488142614e-06} +{"train_loss": 0.00044821167830377817, "global_step": 60206, "epoch": 505, "lr": 6.024481128898246e-06} +{"train_loss": 0.0004741332959383726, "global_step": 60207, "epoch": 505, "lr": 6.0234268559951175e-06} +{"train_loss": 0.00045570620568469167, "global_step": 60208, "epoch": 505, "lr": 6.0223726694352835e-06} +{"train_loss": 0.00042978947749361396, "global_step": 60209, "epoch": 505, "lr": 6.021318569220835e-06} +{"train_loss": 0.0007658720714971423, "global_step": 60210, "epoch": 505, "lr": 6.020264555353827e-06} +{"train_loss": 0.0005769853596575558, "global_step": 60211, "epoch": 505, "lr": 6.019210627836319e-06} +{"train_loss": 0.0002089271292788908, "global_step": 60212, "epoch": 505, "lr": 6.018156786670409e-06} +{"train_loss": 0.00041504858693640145, "global_step": 60213, "epoch": 505, "lr": 6.017103031858134e-06, "val_loss": 0.021547513082623482, "train_action_mse_error": 5.191572654439369e-06} +{"train_loss": 0.0005262665799818933, "global_step": 60214, "epoch": 506, "lr": 6.016049363401588e-06} +{"train_loss": 0.00023717223666608334, "global_step": 60215, "epoch": 506, "lr": 6.0149957813028234e-06} +{"train_loss": 0.00048006101860664785, "global_step": 60216, "epoch": 506, "lr": 6.0139422855639225e-06} +{"train_loss": 0.00038797938032075763, "global_step": 60217, "epoch": 506, "lr": 6.012888876186945e-06} +{"train_loss": 0.0004342898027971387, "global_step": 60218, "epoch": 506, "lr": 6.0118355531739555e-06} +{"train_loss": 0.00044462678488343954, "global_step": 60219, "epoch": 506, "lr": 6.010782316527036e-06} +{"train_loss": 0.00019657287339214236, "global_step": 60220, "epoch": 506, "lr": 6.009729166248234e-06} +{"train_loss": 0.00038053272874094546, "global_step": 60221, "epoch": 506, "lr": 6.008676102339639e-06} +{"train_loss": 0.0002479793911334127, "global_step": 60222, "epoch": 506, "lr": 6.007623124803313e-06} +{"train_loss": 0.0002927959430962801, "global_step": 60223, "epoch": 506, "lr": 6.006570233641301e-06} +{"train_loss": 0.0003473548567853868, "global_step": 60224, "epoch": 506, "lr": 6.005517428855695e-06} +{"train_loss": 0.0004821990441996604, "global_step": 60225, "epoch": 506, "lr": 6.004464710448565e-06} +{"train_loss": 0.0002534370869398117, "global_step": 60226, "epoch": 506, "lr": 6.003412078421955e-06} +{"train_loss": 0.000308044720441103, "global_step": 60227, "epoch": 506, "lr": 6.002359532777957e-06} +{"train_loss": 0.00048133195377886295, "global_step": 60228, "epoch": 506, "lr": 6.00130707351862e-06} +{"train_loss": 0.00039434482459910214, "global_step": 60229, "epoch": 506, "lr": 6.000254700646019e-06} +{"train_loss": 0.00024779682280495763, "global_step": 60230, "epoch": 506, "lr": 5.999202414162208e-06} +{"train_loss": 0.00021054600074421614, "global_step": 60231, "epoch": 506, "lr": 5.998150214069276e-06} +{"train_loss": 0.0005141994333826005, "global_step": 60232, "epoch": 506, "lr": 5.997098100369264e-06} +{"train_loss": 0.0004438274772837758, "global_step": 60233, "epoch": 506, "lr": 5.99604607306426e-06} +{"train_loss": 0.0004991316236555576, "global_step": 60234, "epoch": 506, "lr": 5.994994132156312e-06} +{"train_loss": 0.0004288194759283215, "global_step": 60235, "epoch": 506, "lr": 5.993942277647491e-06} +{"train_loss": 0.0005686054355464876, "global_step": 60236, "epoch": 506, "lr": 5.992890509539867e-06} +{"train_loss": 0.0003377875837031752, "global_step": 60237, "epoch": 506, "lr": 5.991838827835489e-06} +{"train_loss": 0.00027975294506177306, "global_step": 60238, "epoch": 506, "lr": 5.9907872325364486e-06} +{"train_loss": 0.0002602062013465911, "global_step": 60239, "epoch": 506, "lr": 5.989735723644785e-06} +{"train_loss": 0.0003246930427849293, "global_step": 60240, "epoch": 506, "lr": 5.988684301162583e-06} +{"train_loss": 0.00028960953932255507, "global_step": 60241, "epoch": 506, "lr": 5.9876329650919e-06} +{"train_loss": 0.00023085209249984473, "global_step": 60242, "epoch": 506, "lr": 5.986581715434781e-06} +{"train_loss": 0.00027202971978113055, "global_step": 60243, "epoch": 506, "lr": 5.985530552193325e-06} +{"train_loss": 0.0005212696269154549, "global_step": 60244, "epoch": 506, "lr": 5.984479475369559e-06} +{"train_loss": 0.000388933636713773, "global_step": 60245, "epoch": 506, "lr": 5.983428484965581e-06} +{"train_loss": 0.0003951604594476521, "global_step": 60246, "epoch": 506, "lr": 5.982377580983428e-06} +{"train_loss": 0.000891790259629488, "global_step": 60247, "epoch": 506, "lr": 5.981326763425182e-06} +{"train_loss": 0.0003671564918477088, "global_step": 60248, "epoch": 506, "lr": 5.980276032292898e-06} +{"train_loss": 0.0008151153451763093, "global_step": 60249, "epoch": 506, "lr": 5.979225387588633e-06} +{"train_loss": 0.000416458846302703, "global_step": 60250, "epoch": 506, "lr": 5.978174829314464e-06} +{"train_loss": 0.0008012360194697976, "global_step": 60251, "epoch": 506, "lr": 5.977124357472435e-06} +{"train_loss": 0.0003169765113852918, "global_step": 60252, "epoch": 506, "lr": 5.976073972064627e-06} +{"train_loss": 0.000550720258615911, "global_step": 60253, "epoch": 506, "lr": 5.9750236730931e-06} +{"train_loss": 0.0006942074396647513, "global_step": 60254, "epoch": 506, "lr": 5.973973460559895e-06} +{"train_loss": 0.00024897916591726243, "global_step": 60255, "epoch": 506, "lr": 5.972923334467101e-06} +{"train_loss": 0.0005594048998318613, "global_step": 60256, "epoch": 506, "lr": 5.97187329481676e-06} +{"train_loss": 0.0005574080860242248, "global_step": 60257, "epoch": 506, "lr": 5.970823341610954e-06} +{"train_loss": 0.0003070311213377863, "global_step": 60258, "epoch": 506, "lr": 5.96977347485172e-06} +{"train_loss": 0.0003296054492238909, "global_step": 60259, "epoch": 506, "lr": 5.968723694541134e-06} +{"train_loss": 0.0004222289426252246, "global_step": 60260, "epoch": 506, "lr": 5.967674000681261e-06} +{"train_loss": 0.0004549089935608208, "global_step": 60261, "epoch": 506, "lr": 5.966624393274145e-06} +{"train_loss": 0.00033846477163024247, "global_step": 60262, "epoch": 506, "lr": 5.965574872321872e-06} +{"train_loss": 0.0005307953106239438, "global_step": 60263, "epoch": 506, "lr": 5.964525437826479e-06} +{"train_loss": 0.00043631432345137, "global_step": 60264, "epoch": 506, "lr": 5.9634760897900434e-06} +{"train_loss": 0.00026156092644669116, "global_step": 60265, "epoch": 506, "lr": 5.962426828214607e-06} +{"train_loss": 0.0003504377091303468, "global_step": 60266, "epoch": 506, "lr": 5.961377653102252e-06} +{"train_loss": 0.0005821547820232809, "global_step": 60267, "epoch": 506, "lr": 5.960328564455031e-06} +{"train_loss": 0.00045020401012152433, "global_step": 60268, "epoch": 506, "lr": 5.959279562274983e-06} +{"train_loss": 0.0005024643032811582, "global_step": 60269, "epoch": 506, "lr": 5.9582306465642006e-06} +{"train_loss": 0.0008594586979597807, "global_step": 60270, "epoch": 506, "lr": 5.957181817324714e-06} +{"train_loss": 0.0003042467578779906, "global_step": 60271, "epoch": 506, "lr": 5.956133074558606e-06} +{"train_loss": 0.00033904911833815277, "global_step": 60272, "epoch": 506, "lr": 5.955084418267926e-06} +{"train_loss": 0.0003714075137395412, "global_step": 60273, "epoch": 506, "lr": 5.95403584845472e-06} +{"train_loss": 0.0002179155999328941, "global_step": 60274, "epoch": 506, "lr": 5.952987365121071e-06} +{"train_loss": 0.0004159134114161134, "global_step": 60275, "epoch": 506, "lr": 5.9519389682690105e-06} +{"train_loss": 0.0004026008246000856, "global_step": 60276, "epoch": 506, "lr": 5.950890657900632e-06} +{"train_loss": 0.0009299934608861804, "global_step": 60277, "epoch": 506, "lr": 5.949842434017955e-06} +{"train_loss": 0.000309231982100755, "global_step": 60278, "epoch": 506, "lr": 5.9487942966230725e-06} +{"train_loss": 0.0003436224942561239, "global_step": 60279, "epoch": 506, "lr": 5.947746245718022e-06} +{"train_loss": 0.0003453903482295573, "global_step": 60280, "epoch": 506, "lr": 5.9466982813048575e-06} +{"train_loss": 0.0006914729601703584, "global_step": 60281, "epoch": 506, "lr": 5.945650403385649e-06} +{"train_loss": 0.0003633066371548921, "global_step": 60282, "epoch": 506, "lr": 5.944602611962446e-06} +{"train_loss": 0.00026112853083759546, "global_step": 60283, "epoch": 506, "lr": 5.943554907037319e-06} +{"train_loss": 0.00040184281533584, "global_step": 60284, "epoch": 506, "lr": 5.942507288612304e-06} +{"train_loss": 0.000473249820061028, "global_step": 60285, "epoch": 506, "lr": 5.941459756689477e-06} +{"train_loss": 0.0003705018316395581, "global_step": 60286, "epoch": 506, "lr": 5.940412311270887e-06} +{"train_loss": 0.0008462716941721737, "global_step": 60287, "epoch": 506, "lr": 5.939364952358584e-06} +{"train_loss": 0.00017890484014060348, "global_step": 60288, "epoch": 506, "lr": 5.9383176799546415e-06} +{"train_loss": 0.00023099036479834467, "global_step": 60289, "epoch": 506, "lr": 5.937270494061087e-06} +{"train_loss": 0.00034409930231049657, "global_step": 60290, "epoch": 506, "lr": 5.936223394680012e-06} +{"train_loss": 0.00032423099037259817, "global_step": 60291, "epoch": 506, "lr": 5.93517638181344e-06} +{"train_loss": 0.00037699032691307366, "global_step": 60292, "epoch": 506, "lr": 5.934129455463455e-06} +{"train_loss": 0.00033742416417226195, "global_step": 60293, "epoch": 506, "lr": 5.933082615632091e-06} +{"train_loss": 0.0010717753320932388, "global_step": 60294, "epoch": 506, "lr": 5.932035862321417e-06} +{"train_loss": 0.0004068146809004247, "global_step": 60295, "epoch": 506, "lr": 5.930989195533471e-06} +{"train_loss": 0.0003287850704509765, "global_step": 60296, "epoch": 506, "lr": 5.929942615270323e-06} +{"train_loss": 0.00040112706483341753, "global_step": 60297, "epoch": 506, "lr": 5.928896121534033e-06} +{"train_loss": 0.0006961757899262011, "global_step": 60298, "epoch": 506, "lr": 5.92784971432665e-06} +{"train_loss": 0.00037093620630912483, "global_step": 60299, "epoch": 506, "lr": 5.926803393650215e-06} +{"train_loss": 0.00036078356788493693, "global_step": 60300, "epoch": 506, "lr": 5.9257571595068e-06} +{"train_loss": 0.00041881398647092283, "global_step": 60301, "epoch": 506, "lr": 5.924711011898443e-06} +{"train_loss": 0.0008146910113282502, "global_step": 60302, "epoch": 506, "lr": 5.923664950827223e-06} +{"train_loss": 0.0005581824225373566, "global_step": 60303, "epoch": 506, "lr": 5.922618976295169e-06} +{"train_loss": 0.00036349910078570247, "global_step": 60304, "epoch": 506, "lr": 5.921573088304339e-06} +{"train_loss": 0.0005261970800347626, "global_step": 60305, "epoch": 506, "lr": 5.920527286856803e-06} +{"train_loss": 0.000497673696372658, "global_step": 60306, "epoch": 506, "lr": 5.919481571954588e-06} +{"train_loss": 0.00017210091755259782, "global_step": 60307, "epoch": 506, "lr": 5.918435943599771e-06} +{"train_loss": 0.0006903044413775206, "global_step": 60308, "epoch": 506, "lr": 5.917390401794387e-06} +{"train_loss": 0.0004349200753495097, "global_step": 60309, "epoch": 506, "lr": 5.9163449465405084e-06} +{"train_loss": 0.00048491806956008077, "global_step": 60310, "epoch": 506, "lr": 5.9152995778401775e-06} +{"train_loss": 0.00030169254750944674, "global_step": 60311, "epoch": 506, "lr": 5.914254295695437e-06} +{"train_loss": 0.0005981967551633716, "global_step": 60312, "epoch": 506, "lr": 5.9132091001083575e-06} +{"train_loss": 0.0003528291417751461, "global_step": 60313, "epoch": 506, "lr": 5.9121639910809715e-06} +{"train_loss": 0.0005728866090066731, "global_step": 60314, "epoch": 506, "lr": 5.911118968615348e-06} +{"train_loss": 0.0004505193210206926, "global_step": 60315, "epoch": 506, "lr": 5.9100740327135255e-06} +{"train_loss": 0.000729520688764751, "global_step": 60316, "epoch": 506, "lr": 5.909029183377574e-06} +{"train_loss": 0.00028309153276495636, "global_step": 60317, "epoch": 506, "lr": 5.907984420609531e-06} +{"train_loss": 0.00020052203035447747, "global_step": 60318, "epoch": 506, "lr": 5.906939744411438e-06} +{"train_loss": 0.0005456584040075541, "global_step": 60319, "epoch": 506, "lr": 5.905895154785374e-06} +{"train_loss": 0.00025495002046227455, "global_step": 60320, "epoch": 506, "lr": 5.904850651733357e-06} +{"train_loss": 0.0002944523876067251, "global_step": 60321, "epoch": 506, "lr": 5.90380623525747e-06} +{"train_loss": 0.0003861832956317812, "global_step": 60322, "epoch": 506, "lr": 5.902761905359738e-06} +{"train_loss": 0.0005521774874068797, "global_step": 60323, "epoch": 506, "lr": 5.901717662042228e-06} +{"train_loss": 0.000636087846942246, "global_step": 60324, "epoch": 506, "lr": 5.900673505306981e-06} +{"train_loss": 0.0003687632561195642, "global_step": 60325, "epoch": 506, "lr": 5.899629435156057e-06} +{"train_loss": 0.00029581075068563223, "global_step": 60326, "epoch": 506, "lr": 5.898585451591487e-06} +{"train_loss": 0.00040948286186903715, "global_step": 60327, "epoch": 506, "lr": 5.897541554615344e-06} +{"train_loss": 0.0007360852905549109, "global_step": 60328, "epoch": 506, "lr": 5.8964977442296565e-06} +{"train_loss": 0.00041503895772621036, "global_step": 60329, "epoch": 506, "lr": 5.8954540204364915e-06} +{"train_loss": 0.0010373822879046202, "global_step": 60330, "epoch": 506, "lr": 5.894410383237886e-06} +{"train_loss": 0.00029679149156436324, "global_step": 60331, "epoch": 506, "lr": 5.893366832635899e-06} +{"train_loss": 0.00043676982322187326, "global_step": 60332, "epoch": 506, "lr": 5.892323368632569e-06, "val_loss": 0.031950559467077255} +{"train_loss": 0.00047858580364845693, "global_step": 60333, "epoch": 507, "lr": 5.891279991229953e-06} +{"train_loss": 0.0005728843389078975, "global_step": 60334, "epoch": 507, "lr": 5.890236700430091e-06} +{"train_loss": 0.00041164117283187807, "global_step": 60335, "epoch": 507, "lr": 5.889193496235051e-06} +{"train_loss": 0.00023017475905362517, "global_step": 60336, "epoch": 507, "lr": 5.888150378646861e-06} +{"train_loss": 0.00019986745610367507, "global_step": 60337, "epoch": 507, "lr": 5.887107347667564e-06} +{"train_loss": 0.000576696009375155, "global_step": 60338, "epoch": 507, "lr": 5.886064403299235e-06} +{"train_loss": 0.0003019033174496144, "global_step": 60339, "epoch": 507, "lr": 5.885021545543889e-06} +{"train_loss": 0.0003735785139724612, "global_step": 60340, "epoch": 507, "lr": 5.883978774403604e-06} +{"train_loss": 0.0003951008548028767, "global_step": 60341, "epoch": 507, "lr": 5.8829360898804145e-06} +{"train_loss": 0.00025576516054570675, "global_step": 60342, "epoch": 507, "lr": 5.8818934919763535e-06} +{"train_loss": 0.00034446263452991843, "global_step": 60343, "epoch": 507, "lr": 5.880850980693492e-06} +{"train_loss": 0.0005836159689351916, "global_step": 60344, "epoch": 507, "lr": 5.879808556033855e-06} +{"train_loss": 0.0001802721235435456, "global_step": 60345, "epoch": 507, "lr": 5.878766217999515e-06} +{"train_loss": 0.00034327973844483495, "global_step": 60346, "epoch": 507, "lr": 5.877723966592491e-06} +{"train_loss": 0.00028213203768245876, "global_step": 60347, "epoch": 507, "lr": 5.876681801814854e-06} +{"train_loss": 0.00027916915132664144, "global_step": 60348, "epoch": 507, "lr": 5.8756397236686354e-06} +{"train_loss": 0.0001968028664123267, "global_step": 60349, "epoch": 507, "lr": 5.874597732155879e-06} +{"train_loss": 0.0003576135786715895, "global_step": 60350, "epoch": 507, "lr": 5.8735558272786424e-06} +{"train_loss": 0.000283821631455794, "global_step": 60351, "epoch": 507, "lr": 5.872514009038954e-06} +{"train_loss": 0.0003055363486055285, "global_step": 60352, "epoch": 507, "lr": 5.871472277438877e-06} +{"train_loss": 0.00029016967164352536, "global_step": 60353, "epoch": 507, "lr": 5.870430632480456e-06} +{"train_loss": 0.00047977070789784193, "global_step": 60354, "epoch": 507, "lr": 5.869389074165715e-06} +{"train_loss": 0.00046253998880274594, "global_step": 60355, "epoch": 507, "lr": 5.868347602496732e-06} +{"train_loss": 0.0006517526344396174, "global_step": 60356, "epoch": 507, "lr": 5.8673062174755155e-06} +{"train_loss": 0.00038125261198729277, "global_step": 60357, "epoch": 507, "lr": 5.86626491910413e-06} +{"train_loss": 0.0003663926327135414, "global_step": 60358, "epoch": 507, "lr": 5.865223707384632e-06} +{"train_loss": 0.0002196245186496526, "global_step": 60359, "epoch": 507, "lr": 5.864182582319039e-06} +{"train_loss": 0.00017014244804158807, "global_step": 60360, "epoch": 507, "lr": 5.863141543909417e-06} +{"train_loss": 0.0002771294384729117, "global_step": 60361, "epoch": 507, "lr": 5.8621005921577935e-06} +{"train_loss": 0.00031075201695784926, "global_step": 60362, "epoch": 507, "lr": 5.861059727066232e-06} +{"train_loss": 0.0007544446852989495, "global_step": 60363, "epoch": 507, "lr": 5.860018948636747e-06} +{"train_loss": 0.00046268184087239206, "global_step": 60364, "epoch": 507, "lr": 5.8589782568714165e-06} +{"train_loss": 0.0002127121842931956, "global_step": 60365, "epoch": 507, "lr": 5.857937651772255e-06} +{"train_loss": 0.0004721501609310508, "global_step": 60366, "epoch": 507, "lr": 5.856897133341327e-06} +{"train_loss": 0.00024813052732497454, "global_step": 60367, "epoch": 507, "lr": 5.8558567015806645e-06} +{"train_loss": 0.0006915723788551986, "global_step": 60368, "epoch": 507, "lr": 5.854816356492299e-06} +{"train_loss": 0.0002844587143044919, "global_step": 60369, "epoch": 507, "lr": 5.8537760980782956e-06} +{"train_loss": 0.0003219502395950258, "global_step": 60370, "epoch": 507, "lr": 5.85273592634068e-06} +{"train_loss": 0.00045388666330836713, "global_step": 60371, "epoch": 507, "lr": 5.851695841281507e-06} +{"train_loss": 0.0005207824287936091, "global_step": 60372, "epoch": 507, "lr": 5.850655842902819e-06} +{"train_loss": 0.00075962656410411, "global_step": 60373, "epoch": 507, "lr": 5.849615931206636e-06} +{"train_loss": 0.000490193662699312, "global_step": 60374, "epoch": 507, "lr": 5.848576106195025e-06} +{"train_loss": 0.0005339774070307612, "global_step": 60375, "epoch": 507, "lr": 5.84753636787001e-06} +{"train_loss": 0.00021616992307826877, "global_step": 60376, "epoch": 507, "lr": 5.846496716233652e-06} +{"train_loss": 0.0004166935686953366, "global_step": 60377, "epoch": 507, "lr": 5.8454571512879695e-06} +{"train_loss": 0.000391130248317495, "global_step": 60378, "epoch": 507, "lr": 5.844417673035024e-06} +{"train_loss": 0.00036935386015102267, "global_step": 60379, "epoch": 507, "lr": 5.843378281476847e-06} +{"train_loss": 0.00036105330218560994, "global_step": 60380, "epoch": 507, "lr": 5.842338976615469e-06} +{"train_loss": 0.0003796887176577002, "global_step": 60381, "epoch": 507, "lr": 5.8412997584529505e-06} +{"train_loss": 0.00021391276095528156, "global_step": 60382, "epoch": 507, "lr": 5.840260626991312e-06} +{"train_loss": 0.0003460627340245992, "global_step": 60383, "epoch": 507, "lr": 5.839221582232618e-06} +{"train_loss": 0.00028420324088074267, "global_step": 60384, "epoch": 507, "lr": 5.838182624178878e-06} +{"train_loss": 0.0005581536097452044, "global_step": 60385, "epoch": 507, "lr": 5.837143752832164e-06} +{"train_loss": 0.0006516760913655162, "global_step": 60386, "epoch": 507, "lr": 5.836104968194495e-06} +{"train_loss": 0.0001677517284406349, "global_step": 60387, "epoch": 507, "lr": 5.835066270267908e-06} +{"train_loss": 0.0003534099378157407, "global_step": 60388, "epoch": 507, "lr": 5.834027659054464e-06} +{"train_loss": 0.0008123602019622922, "global_step": 60389, "epoch": 507, "lr": 5.832989134556177e-06} +{"train_loss": 0.00047988331061787903, "global_step": 60390, "epoch": 507, "lr": 5.831950696775101e-06} +{"train_loss": 0.0004067234112881124, "global_step": 60391, "epoch": 507, "lr": 5.830912345713268e-06} +{"train_loss": 0.0003905801277142018, "global_step": 60392, "epoch": 507, "lr": 5.829874081372716e-06} +{"train_loss": 0.000625849817879498, "global_step": 60393, "epoch": 507, "lr": 5.828835903755497e-06} +{"train_loss": 0.00017540196131449193, "global_step": 60394, "epoch": 507, "lr": 5.8277978128636336e-06} +{"train_loss": 0.00024813442723825574, "global_step": 60395, "epoch": 507, "lr": 5.826759808699178e-06} +{"train_loss": 0.0006506724166683853, "global_step": 60396, "epoch": 507, "lr": 5.825721891264152e-06} +{"train_loss": 0.0004293335950933397, "global_step": 60397, "epoch": 507, "lr": 5.824684060560609e-06} +{"train_loss": 0.0004929102142341435, "global_step": 60398, "epoch": 507, "lr": 5.8236463165905805e-06} +{"train_loss": 0.0005144787719473243, "global_step": 60399, "epoch": 507, "lr": 5.822608659356094e-06} +{"train_loss": 0.0004820582107640803, "global_step": 60400, "epoch": 507, "lr": 5.821571088859201e-06} +{"train_loss": 0.00048076259554363787, "global_step": 60401, "epoch": 507, "lr": 5.82053360510193e-06} +{"train_loss": 0.00029046356212347746, "global_step": 60402, "epoch": 507, "lr": 5.819496208086328e-06} +{"train_loss": 0.0004216518718749285, "global_step": 60403, "epoch": 507, "lr": 5.818458897814411e-06} +{"train_loss": 0.0004280898137949407, "global_step": 60404, "epoch": 507, "lr": 5.817421674288248e-06} +{"train_loss": 0.0005644739721901715, "global_step": 60405, "epoch": 507, "lr": 5.81638453750985e-06} +{"train_loss": 0.00033247817191295326, "global_step": 60406, "epoch": 507, "lr": 5.8153474874812545e-06} +{"train_loss": 0.00019725263700820506, "global_step": 60407, "epoch": 507, "lr": 5.814310524204514e-06} +{"train_loss": 0.00028779642889276147, "global_step": 60408, "epoch": 507, "lr": 5.813273647681644e-06} +{"train_loss": 0.000404332677135244, "global_step": 60409, "epoch": 507, "lr": 5.812236857914699e-06} +{"train_loss": 0.00027882104041054845, "global_step": 60410, "epoch": 507, "lr": 5.81120015490571e-06} +{"train_loss": 0.0003362478455528617, "global_step": 60411, "epoch": 507, "lr": 5.810163538656693e-06} +{"train_loss": 0.000309091032249853, "global_step": 60412, "epoch": 507, "lr": 5.809127009169712e-06} +{"train_loss": 0.00043295518844388425, "global_step": 60413, "epoch": 507, "lr": 5.808090566446783e-06} +{"train_loss": 0.0006099003367125988, "global_step": 60414, "epoch": 507, "lr": 5.807054210489954e-06} +{"train_loss": 0.00036330538569018245, "global_step": 60415, "epoch": 507, "lr": 5.806017941301239e-06} +{"train_loss": 0.0003015916736330837, "global_step": 60416, "epoch": 507, "lr": 5.804981758882699e-06} +{"train_loss": 0.0005659518064931035, "global_step": 60417, "epoch": 507, "lr": 5.803945663236354e-06} +{"train_loss": 0.0003474522673059255, "global_step": 60418, "epoch": 507, "lr": 5.802909654364236e-06} +{"train_loss": 0.0003222374361939728, "global_step": 60419, "epoch": 507, "lr": 5.801873732268387e-06} +{"train_loss": 0.000499306945130229, "global_step": 60420, "epoch": 507, "lr": 5.800837896950828e-06} +{"train_loss": 0.0010443194769322872, "global_step": 60421, "epoch": 507, "lr": 5.7998021484136135e-06} +{"train_loss": 0.00038597939419560134, "global_step": 60422, "epoch": 507, "lr": 5.798766486658758e-06} +{"train_loss": 0.00041772809345275164, "global_step": 60423, "epoch": 507, "lr": 5.7977309116883096e-06} +{"train_loss": 0.0005372082232497633, "global_step": 60424, "epoch": 507, "lr": 5.7966954235042785e-06} +{"train_loss": 0.0005090940394438803, "global_step": 60425, "epoch": 507, "lr": 5.795660022108729e-06} +{"train_loss": 0.00027970169321633875, "global_step": 60426, "epoch": 507, "lr": 5.794624707503671e-06} +{"train_loss": 0.00022866892686579376, "global_step": 60427, "epoch": 507, "lr": 5.793589479691142e-06} +{"train_loss": 0.0004451424174476415, "global_step": 60428, "epoch": 507, "lr": 5.792554338673184e-06} +{"train_loss": 0.0003017640847247094, "global_step": 60429, "epoch": 507, "lr": 5.79151928445183e-06} +{"train_loss": 0.00032959526288323104, "global_step": 60430, "epoch": 507, "lr": 5.790484317029088e-06} +{"train_loss": 0.00031100003980100155, "global_step": 60431, "epoch": 507, "lr": 5.789449436407018e-06} +{"train_loss": 0.000808107026387006, "global_step": 60432, "epoch": 507, "lr": 5.788414642587637e-06} +{"train_loss": 0.0002822244423441589, "global_step": 60433, "epoch": 507, "lr": 5.787379935572984e-06} +{"train_loss": 0.00026767110102809966, "global_step": 60434, "epoch": 507, "lr": 5.786345315365077e-06} +{"train_loss": 0.00019669892208185047, "global_step": 60435, "epoch": 507, "lr": 5.7853107819659745e-06} +{"train_loss": 0.0005644246120937169, "global_step": 60436, "epoch": 507, "lr": 5.784276335377681e-06} +{"train_loss": 0.00045750360004603863, "global_step": 60437, "epoch": 507, "lr": 5.783241975602233e-06} +{"train_loss": 0.0006729463348165154, "global_step": 60438, "epoch": 507, "lr": 5.782207702641673e-06} +{"train_loss": 0.0003913407272193581, "global_step": 60439, "epoch": 507, "lr": 5.781173516498017e-06} +{"train_loss": 0.00025115557946264744, "global_step": 60440, "epoch": 507, "lr": 5.780139417173314e-06} +{"train_loss": 0.0003305215504951775, "global_step": 60441, "epoch": 507, "lr": 5.779105404669577e-06} +{"train_loss": 0.0002074085787171498, "global_step": 60442, "epoch": 507, "lr": 5.778071478988839e-06} +{"train_loss": 0.0006983072962611914, "global_step": 60443, "epoch": 507, "lr": 5.7770376401331376e-06} +{"train_loss": 0.0002812586899381131, "global_step": 60444, "epoch": 507, "lr": 5.776003888104492e-06} +{"train_loss": 0.0003571563574951142, "global_step": 60445, "epoch": 507, "lr": 5.774970222904947e-06} +{"train_loss": 0.0005174243124201894, "global_step": 60446, "epoch": 507, "lr": 5.773936644536509e-06} +{"train_loss": 0.0002196457498939708, "global_step": 60447, "epoch": 507, "lr": 5.772903153001241e-06} +{"train_loss": 0.0003282879770267755, "global_step": 60448, "epoch": 507, "lr": 5.771869748301145e-06} +{"train_loss": 0.0003644095850177109, "global_step": 60449, "epoch": 507, "lr": 5.770836430438248e-06} +{"train_loss": 0.0003044702752958983, "global_step": 60450, "epoch": 507, "lr": 5.769803199414603e-06} +{"train_loss": 0.0003984493368301353, "global_step": 60451, "epoch": 507, "lr": 5.768770055232209e-06, "val_loss": 0.021584633737802505} +{"train_loss": 0.00027380252140574157, "global_step": 60452, "epoch": 508, "lr": 5.767736997893125e-06} +{"train_loss": 0.0003799653786700219, "global_step": 60453, "epoch": 508, "lr": 5.76670402739935e-06} +{"train_loss": 0.0005022605764679611, "global_step": 60454, "epoch": 508, "lr": 5.7656711437529375e-06} +{"train_loss": 0.00023693278490100056, "global_step": 60455, "epoch": 508, "lr": 5.764638346955892e-06} +{"train_loss": 0.00045095107634551823, "global_step": 60456, "epoch": 508, "lr": 5.763605637010266e-06} +{"train_loss": 0.0005089229089207947, "global_step": 60457, "epoch": 508, "lr": 5.76257301391806e-06} +{"train_loss": 0.00057980976998806, "global_step": 60458, "epoch": 508, "lr": 5.761540477681332e-06} +{"train_loss": 0.0006606941460631788, "global_step": 60459, "epoch": 508, "lr": 5.760508028302081e-06} +{"train_loss": 0.00021955704141873866, "global_step": 60460, "epoch": 508, "lr": 5.759475665782354e-06} +{"train_loss": 0.0003363019204698503, "global_step": 60461, "epoch": 508, "lr": 5.758443390124157e-06} +{"train_loss": 0.00036036435631103814, "global_step": 60462, "epoch": 508, "lr": 5.757411201329549e-06} +{"train_loss": 0.0003199692291673273, "global_step": 60463, "epoch": 508, "lr": 5.756379099400521e-06} +{"train_loss": 0.0004692187358159572, "global_step": 60464, "epoch": 508, "lr": 5.755347084339125e-06} +{"train_loss": 0.0004965594853274524, "global_step": 60465, "epoch": 508, "lr": 5.7543151561473715e-06} +{"train_loss": 0.000812936807051301, "global_step": 60466, "epoch": 508, "lr": 5.753283314827301e-06} +{"train_loss": 0.00033522132434882224, "global_step": 60467, "epoch": 508, "lr": 5.752251560380933e-06} +{"train_loss": 0.00022471377451438457, "global_step": 60468, "epoch": 508, "lr": 5.751219892810283e-06} +{"train_loss": 0.00019988797430414706, "global_step": 60469, "epoch": 508, "lr": 5.750188312117394e-06} +{"train_loss": 0.0005641707684844732, "global_step": 60470, "epoch": 508, "lr": 5.749156818304274e-06} +{"train_loss": 0.0003725526621565223, "global_step": 60471, "epoch": 508, "lr": 5.748125411372967e-06} +{"train_loss": 0.0003630534920375794, "global_step": 60472, "epoch": 508, "lr": 5.747094091325478e-06} +{"train_loss": 0.0002197821595473215, "global_step": 60473, "epoch": 508, "lr": 5.746062858163853e-06} +{"train_loss": 0.0008729642140679061, "global_step": 60474, "epoch": 508, "lr": 5.745031711890103e-06} +{"train_loss": 0.0005430206074379385, "global_step": 60475, "epoch": 508, "lr": 5.744000652506243e-06} +{"train_loss": 0.0006691002054139972, "global_step": 60476, "epoch": 508, "lr": 5.742969680014326e-06} +{"train_loss": 0.00047487294068560004, "global_step": 60477, "epoch": 508, "lr": 5.741938794416346e-06} +{"train_loss": 0.0003335256187710911, "global_step": 60478, "epoch": 508, "lr": 5.740907995714351e-06} +{"train_loss": 0.0005670447135344148, "global_step": 60479, "epoch": 508, "lr": 5.739877283910355e-06} +{"train_loss": 0.000466423254692927, "global_step": 60480, "epoch": 508, "lr": 5.738846659006375e-06} +{"train_loss": 0.0003403589653316885, "global_step": 60481, "epoch": 508, "lr": 5.737816121004447e-06} +{"train_loss": 0.0004606175934895873, "global_step": 60482, "epoch": 508, "lr": 5.7367856699065805e-06} +{"train_loss": 0.00022479606559500098, "global_step": 60483, "epoch": 508, "lr": 5.735755305714813e-06} +{"train_loss": 0.0003612440195865929, "global_step": 60484, "epoch": 508, "lr": 5.734725028431153e-06} +{"train_loss": 0.00020902328833471984, "global_step": 60485, "epoch": 508, "lr": 5.7336948380576465e-06} +{"train_loss": 0.000505079107824713, "global_step": 60486, "epoch": 508, "lr": 5.732664734596294e-06} +{"train_loss": 0.00021219886548351496, "global_step": 60487, "epoch": 508, "lr": 5.731634718049117e-06} +{"train_loss": 0.00043788846232928336, "global_step": 60488, "epoch": 508, "lr": 5.730604788418159e-06} +{"train_loss": 0.000800501205958426, "global_step": 60489, "epoch": 508, "lr": 5.729574945705413e-06} +{"train_loss": 0.0003803102590609342, "global_step": 60490, "epoch": 508, "lr": 5.728545189912921e-06} +{"train_loss": 0.0006073011318221688, "global_step": 60491, "epoch": 508, "lr": 5.727515521042709e-06} +{"train_loss": 0.00022029461979400367, "global_step": 60492, "epoch": 508, "lr": 5.726485939096782e-06} +{"train_loss": 0.0004971697344444692, "global_step": 60493, "epoch": 508, "lr": 5.725456444077182e-06} +{"train_loss": 0.0005249343812465668, "global_step": 60494, "epoch": 508, "lr": 5.724427035985902e-06} +{"train_loss": 0.00035765141365118325, "global_step": 60495, "epoch": 508, "lr": 5.723397714824996e-06} +{"train_loss": 0.0003568251559045166, "global_step": 60496, "epoch": 508, "lr": 5.7223684805964514e-06} +{"train_loss": 0.00027578813023865223, "global_step": 60497, "epoch": 508, "lr": 5.721339333302322e-06} +{"train_loss": 0.00029060212546028197, "global_step": 60498, "epoch": 508, "lr": 5.720310272944612e-06} +{"train_loss": 0.0004369246889837086, "global_step": 60499, "epoch": 508, "lr": 5.719281299525331e-06} +{"train_loss": 0.0002488130412530154, "global_step": 60500, "epoch": 508, "lr": 5.718252413046516e-06} +{"train_loss": 0.0007330347434617579, "global_step": 60501, "epoch": 508, "lr": 5.717223613510176e-06} +{"train_loss": 0.0002670946705620736, "global_step": 60502, "epoch": 508, "lr": 5.716194900918348e-06} +{"train_loss": 0.0006633701850660145, "global_step": 60503, "epoch": 508, "lr": 5.715166275273026e-06} +{"train_loss": 0.0003610340936575085, "global_step": 60504, "epoch": 508, "lr": 5.714137736576258e-06} +{"train_loss": 0.00032188958721235394, "global_step": 60505, "epoch": 508, "lr": 5.713109284830048e-06} +{"train_loss": 0.00022908332175575197, "global_step": 60506, "epoch": 508, "lr": 5.712080920036406e-06} +{"train_loss": 0.0007063419325277209, "global_step": 60507, "epoch": 508, "lr": 5.711052642197373e-06} +{"train_loss": 0.0004607017617672682, "global_step": 60508, "epoch": 508, "lr": 5.710024451314944e-06} +{"train_loss": 0.00048400944797322154, "global_step": 60509, "epoch": 508, "lr": 5.70899634739116e-06} +{"train_loss": 0.0003384322044439614, "global_step": 60510, "epoch": 508, "lr": 5.7079683304280315e-06} +{"train_loss": 0.00035493538598529994, "global_step": 60511, "epoch": 508, "lr": 5.706940400427563e-06} +{"train_loss": 0.0005423327093012631, "global_step": 60512, "epoch": 508, "lr": 5.7059125573918014e-06} +{"train_loss": 0.00021098167053423822, "global_step": 60513, "epoch": 508, "lr": 5.704884801322729e-06} +{"train_loss": 0.00033927292679436505, "global_step": 60514, "epoch": 508, "lr": 5.703857132222401e-06} +{"train_loss": 0.00047076266491785645, "global_step": 60515, "epoch": 508, "lr": 5.702829550092803e-06} +{"train_loss": 0.0004754515830427408, "global_step": 60516, "epoch": 508, "lr": 5.701802054935978e-06} +{"train_loss": 0.0005470119067467749, "global_step": 60517, "epoch": 508, "lr": 5.700774646753937e-06} +{"train_loss": 0.0002972910297103226, "global_step": 60518, "epoch": 508, "lr": 5.699747325548677e-06} +{"train_loss": 0.0001883881923276931, "global_step": 60519, "epoch": 508, "lr": 5.6987200913222404e-06} +{"train_loss": 0.0005079766269773245, "global_step": 60520, "epoch": 508, "lr": 5.697692944076621e-06} +{"train_loss": 0.00016571122978348285, "global_step": 60521, "epoch": 508, "lr": 5.696665883813862e-06} +{"train_loss": 0.0002299489133292809, "global_step": 60522, "epoch": 508, "lr": 5.695638910535955e-06} +{"train_loss": 0.0003259431687183678, "global_step": 60523, "epoch": 508, "lr": 5.694612024244944e-06} +{"train_loss": 0.0002208361547673121, "global_step": 60524, "epoch": 508, "lr": 5.69358522494281e-06} +{"train_loss": 0.00031515915179625154, "global_step": 60525, "epoch": 508, "lr": 5.692558512631596e-06} +{"train_loss": 0.0002395772171439603, "global_step": 60526, "epoch": 508, "lr": 5.691531887313311e-06} +{"train_loss": 0.0003083394840359688, "global_step": 60527, "epoch": 508, "lr": 5.690505348989966e-06} +{"train_loss": 0.0004969040164723992, "global_step": 60528, "epoch": 508, "lr": 5.689478897663591e-06} +{"train_loss": 0.0004361791943665594, "global_step": 60529, "epoch": 508, "lr": 5.688452533336186e-06} +{"train_loss": 0.00017935896175913513, "global_step": 60530, "epoch": 508, "lr": 5.687426256009765e-06} +{"train_loss": 0.00032203711452893913, "global_step": 60531, "epoch": 508, "lr": 5.686400065686353e-06} +{"train_loss": 0.0004654958611354232, "global_step": 60532, "epoch": 508, "lr": 5.685373962367951e-06} +{"train_loss": 0.0002999014686793089, "global_step": 60533, "epoch": 508, "lr": 5.684347946056595e-06} +{"train_loss": 0.0004410149122122675, "global_step": 60534, "epoch": 508, "lr": 5.6833220167542774e-06} +{"train_loss": 0.000498505134601146, "global_step": 60535, "epoch": 508, "lr": 5.682296174463031e-06} +{"train_loss": 0.00035934263723902404, "global_step": 60536, "epoch": 508, "lr": 5.681270419184865e-06} +{"train_loss": 0.00020022514217998832, "global_step": 60537, "epoch": 508, "lr": 5.680244750921776e-06} +{"train_loss": 0.00023237642017193139, "global_step": 60538, "epoch": 508, "lr": 5.679219169675804e-06} +{"train_loss": 0.0004809514502994716, "global_step": 60539, "epoch": 508, "lr": 5.6781936754489395e-06} +{"train_loss": 0.0006691450835205615, "global_step": 60540, "epoch": 508, "lr": 5.677168268243216e-06} +{"train_loss": 0.00018871124484576285, "global_step": 60541, "epoch": 508, "lr": 5.676142948060637e-06} +{"train_loss": 0.0003378442779649049, "global_step": 60542, "epoch": 508, "lr": 5.675117714903205e-06} +{"train_loss": 0.00025903910864144564, "global_step": 60543, "epoch": 508, "lr": 5.67409256877296e-06} +{"train_loss": 0.0005140546709299088, "global_step": 60544, "epoch": 508, "lr": 5.673067509671881e-06} +{"train_loss": 0.00044379878090694547, "global_step": 60545, "epoch": 508, "lr": 5.672042537602012e-06} +{"train_loss": 0.0003214783500880003, "global_step": 60546, "epoch": 508, "lr": 5.671017652565342e-06} +{"train_loss": 0.00021432149515021592, "global_step": 60547, "epoch": 508, "lr": 5.669992854563905e-06} +{"train_loss": 0.0003504851774778217, "global_step": 60548, "epoch": 508, "lr": 5.6689681435996955e-06} +{"train_loss": 0.000355754658812657, "global_step": 60549, "epoch": 508, "lr": 5.667943519674723e-06} +{"train_loss": 0.0004076843324583024, "global_step": 60550, "epoch": 508, "lr": 5.66691898279102e-06} +{"train_loss": 0.00037984485970810056, "global_step": 60551, "epoch": 508, "lr": 5.665894532950572e-06} +{"train_loss": 0.0003918413713108748, "global_step": 60552, "epoch": 508, "lr": 5.664870170155418e-06} +{"train_loss": 0.0003486680216155946, "global_step": 60553, "epoch": 508, "lr": 5.663845894407538e-06} +{"train_loss": 0.00027182576013728976, "global_step": 60554, "epoch": 508, "lr": 5.662821705708976e-06} +{"train_loss": 0.00037292324122972786, "global_step": 60555, "epoch": 508, "lr": 5.661797604061714e-06} +{"train_loss": 0.00032105809077620506, "global_step": 60556, "epoch": 508, "lr": 5.660773589467788e-06} +{"train_loss": 0.00040741657721810043, "global_step": 60557, "epoch": 508, "lr": 5.659749661929181e-06} +{"train_loss": 0.00018181110499426723, "global_step": 60558, "epoch": 508, "lr": 5.658725821447936e-06} +{"train_loss": 0.0003095654828939587, "global_step": 60559, "epoch": 508, "lr": 5.657702068026033e-06} +{"train_loss": 0.00022532782168127596, "global_step": 60560, "epoch": 508, "lr": 5.6566784016655e-06} +{"train_loss": 0.00035639017005451024, "global_step": 60561, "epoch": 508, "lr": 5.655654822368334e-06} +{"train_loss": 0.00026918697403743863, "global_step": 60562, "epoch": 508, "lr": 5.654631330136567e-06} +{"train_loss": 0.0004791174433194101, "global_step": 60563, "epoch": 508, "lr": 5.653607924972176e-06} +{"train_loss": 0.00026275371783412993, "global_step": 60564, "epoch": 508, "lr": 5.6525846068772036e-06} +{"train_loss": 0.0005656683351844549, "global_step": 60565, "epoch": 508, "lr": 5.651561375853631e-06} +{"train_loss": 0.0004401065525598824, "global_step": 60566, "epoch": 508, "lr": 5.650538231903491e-06} +{"train_loss": 0.0003120037727057934, "global_step": 60567, "epoch": 508, "lr": 5.64951517502878e-06} +{"train_loss": 0.0002527476754039526, "global_step": 60568, "epoch": 508, "lr": 5.648492205231498e-06} +{"train_loss": 0.00021496044064406306, "global_step": 60569, "epoch": 508, "lr": 5.647469322513676e-06} +{"train_loss": 0.0003875804887233427, "global_step": 60570, "epoch": 508, "lr": 5.646446526877297e-06, "val_loss": 0.02613825723528862} +{"train_loss": 0.0005601835437119007, "global_step": 60571, "epoch": 509, "lr": 5.645423818324392e-06} +{"train_loss": 0.00035549013409763575, "global_step": 60572, "epoch": 509, "lr": 5.644401196856952e-06} +{"train_loss": 0.0004991393070667982, "global_step": 60573, "epoch": 509, "lr": 5.643378662476995e-06} +{"train_loss": 0.0003600746567826718, "global_step": 60574, "epoch": 509, "lr": 5.642356215186528e-06} +{"train_loss": 0.0005686574731953442, "global_step": 60575, "epoch": 509, "lr": 5.641333854987551e-06} +{"train_loss": 0.00018263094534631819, "global_step": 60576, "epoch": 509, "lr": 5.640311581882079e-06} +{"train_loss": 0.0004450577835086733, "global_step": 60577, "epoch": 509, "lr": 5.63928939587211e-06} +{"train_loss": 0.00047536264173686504, "global_step": 60578, "epoch": 509, "lr": 5.638267296959665e-06} +{"train_loss": 0.00032303956686519086, "global_step": 60579, "epoch": 509, "lr": 5.6372452851467415e-06} +{"train_loss": 0.0004802743496838957, "global_step": 60580, "epoch": 509, "lr": 5.636223360435339e-06} +{"train_loss": 0.0003388900659047067, "global_step": 60581, "epoch": 509, "lr": 5.635201522827483e-06} +{"train_loss": 0.0004102036473341286, "global_step": 60582, "epoch": 509, "lr": 5.63417977232516e-06} +{"train_loss": 0.00020512855553533882, "global_step": 60583, "epoch": 509, "lr": 5.633158108930392e-06} +{"train_loss": 0.00030518361018039286, "global_step": 60584, "epoch": 509, "lr": 5.632136532645171e-06} +{"train_loss": 0.0007131964666768909, "global_step": 60585, "epoch": 509, "lr": 5.6311150434715185e-06} +{"train_loss": 0.0004973597242496908, "global_step": 60586, "epoch": 509, "lr": 5.6300936414114325e-06} +{"train_loss": 0.00042537826811894774, "global_step": 60587, "epoch": 509, "lr": 5.629072326466911e-06} +{"train_loss": 0.0002871024771593511, "global_step": 60588, "epoch": 509, "lr": 5.628051098639958e-06} +{"train_loss": 0.0005049695610068738, "global_step": 60589, "epoch": 509, "lr": 5.6270299579326e-06} +{"train_loss": 0.00021432567154988647, "global_step": 60590, "epoch": 509, "lr": 5.626008904346819e-06} +{"train_loss": 0.000506004667840898, "global_step": 60591, "epoch": 509, "lr": 5.6249879378846345e-06} +{"train_loss": 0.00023062838590703905, "global_step": 60592, "epoch": 509, "lr": 5.623967058548041e-06} +{"train_loss": 0.0002699202159419656, "global_step": 60593, "epoch": 509, "lr": 5.622946266339058e-06} +{"train_loss": 0.00020144744485151023, "global_step": 60594, "epoch": 509, "lr": 5.621925561259661e-06} +{"train_loss": 0.00024488294729962945, "global_step": 60595, "epoch": 509, "lr": 5.620904943311889e-06} +{"train_loss": 0.0005129729397594929, "global_step": 60596, "epoch": 509, "lr": 5.6198844124977165e-06} +{"train_loss": 0.0003968425444327295, "global_step": 60597, "epoch": 509, "lr": 5.618863968819171e-06} +{"train_loss": 0.0002489019825588912, "global_step": 60598, "epoch": 509, "lr": 5.617843612278245e-06} +{"train_loss": 0.0003075379063375294, "global_step": 60599, "epoch": 509, "lr": 5.616823342876931e-06} +{"train_loss": 0.0003017596318386495, "global_step": 60600, "epoch": 509, "lr": 5.61580316061725e-06} +{"train_loss": 0.00022865773644298315, "global_step": 60601, "epoch": 509, "lr": 5.614783065501189e-06} +{"train_loss": 0.00041660276474431157, "global_step": 60602, "epoch": 509, "lr": 5.613763057530774e-06} +{"train_loss": 0.00035996377118863165, "global_step": 60603, "epoch": 509, "lr": 5.612743136707977e-06} +{"train_loss": 0.0003972429549321532, "global_step": 60604, "epoch": 509, "lr": 5.611723303034827e-06} +{"train_loss": 0.0003302722761873156, "global_step": 60605, "epoch": 509, "lr": 5.610703556513319e-06} +{"train_loss": 0.00038621496059931815, "global_step": 60606, "epoch": 509, "lr": 5.609683897145446e-06} +{"train_loss": 0.00023561742273159325, "global_step": 60607, "epoch": 509, "lr": 5.608664324933222e-06} +{"train_loss": 0.00045830413000658154, "global_step": 60608, "epoch": 509, "lr": 5.607644839878628e-06} +{"train_loss": 0.0005628378130495548, "global_step": 60609, "epoch": 509, "lr": 5.606625441983698e-06} +{"train_loss": 0.00020614186360035092, "global_step": 60610, "epoch": 509, "lr": 5.605606131250418e-06} +{"train_loss": 0.0004638266109395772, "global_step": 60611, "epoch": 509, "lr": 5.60458690768077e-06} +{"train_loss": 0.0007013590657152236, "global_step": 60612, "epoch": 509, "lr": 5.603567771276785e-06} +{"train_loss": 0.0006232709856703877, "global_step": 60613, "epoch": 509, "lr": 5.602548722040446e-06} +{"train_loss": 0.0003210489812772721, "global_step": 60614, "epoch": 509, "lr": 5.601529759973767e-06} +{"train_loss": 0.00036256678868085146, "global_step": 60615, "epoch": 509, "lr": 5.6005108850787304e-06} +{"train_loss": 0.00029781917692162097, "global_step": 60616, "epoch": 509, "lr": 5.599492097357356e-06} +{"train_loss": 0.0001713372184894979, "global_step": 60617, "epoch": 509, "lr": 5.5984733968116375e-06} +{"train_loss": 0.000822651491034776, "global_step": 60618, "epoch": 509, "lr": 5.597454783443562e-06} +{"train_loss": 0.0003297609800938517, "global_step": 60619, "epoch": 509, "lr": 5.59643625725515e-06} +{"train_loss": 0.0011457899818196893, "global_step": 60620, "epoch": 509, "lr": 5.595417818248383e-06} +{"train_loss": 0.00018085696501657367, "global_step": 60621, "epoch": 509, "lr": 5.594399466425276e-06} +{"train_loss": 0.00027342868270352483, "global_step": 60622, "epoch": 509, "lr": 5.593381201787811e-06} +{"train_loss": 0.0006712704780511558, "global_step": 60623, "epoch": 509, "lr": 5.592363024338004e-06} +{"train_loss": 0.0003428373602218926, "global_step": 60624, "epoch": 509, "lr": 5.591344934077852e-06} +{"train_loss": 0.0006967316148802638, "global_step": 60625, "epoch": 509, "lr": 5.590326931009343e-06} +{"train_loss": 0.00029277443536557257, "global_step": 60626, "epoch": 509, "lr": 5.589309015134492e-06} +{"train_loss": 0.0004933396121487021, "global_step": 60627, "epoch": 509, "lr": 5.58829118645528e-06} +{"train_loss": 0.0009421539143659174, "global_step": 60628, "epoch": 509, "lr": 5.587273444973723e-06} +{"train_loss": 0.00019280420383438468, "global_step": 60629, "epoch": 509, "lr": 5.5862557906918075e-06} +{"train_loss": 0.00043452114914543927, "global_step": 60630, "epoch": 509, "lr": 5.585238223611522e-06} +{"train_loss": 0.0002981782890856266, "global_step": 60631, "epoch": 509, "lr": 5.584220743734891e-06} +{"train_loss": 0.00023408708511851728, "global_step": 60632, "epoch": 509, "lr": 5.583203351063887e-06} +{"train_loss": 0.00027461914578452706, "global_step": 60633, "epoch": 509, "lr": 5.582186045600524e-06} +{"train_loss": 0.0003178687475156039, "global_step": 60634, "epoch": 509, "lr": 5.5811688273467886e-06} +{"train_loss": 0.0002132591762347147, "global_step": 60635, "epoch": 509, "lr": 5.580151696304686e-06} +{"train_loss": 0.0003644927346613258, "global_step": 60636, "epoch": 509, "lr": 5.579134652476214e-06} +{"train_loss": 0.00043515668949112296, "global_step": 60637, "epoch": 509, "lr": 5.578117695863355e-06} +{"train_loss": 0.00045417185174301267, "global_step": 60638, "epoch": 509, "lr": 5.5771008264681295e-06} +{"train_loss": 0.0005082401330582798, "global_step": 60639, "epoch": 509, "lr": 5.576084044292507e-06} +{"train_loss": 0.00028643920086324215, "global_step": 60640, "epoch": 509, "lr": 5.5750673493385085e-06} +{"train_loss": 0.00029462689417414367, "global_step": 60641, "epoch": 509, "lr": 5.574050741608111e-06} +{"train_loss": 0.0003507903020363301, "global_step": 60642, "epoch": 509, "lr": 5.573034221103324e-06} +{"train_loss": 0.00029873003950342536, "global_step": 60643, "epoch": 509, "lr": 5.57201778782614e-06} +{"train_loss": 0.0003619318304117769, "global_step": 60644, "epoch": 509, "lr": 5.571001441778545e-06} +{"train_loss": 0.00032099796226248145, "global_step": 60645, "epoch": 509, "lr": 5.56998518296255e-06} +{"train_loss": 0.00035890593426302075, "global_step": 60646, "epoch": 509, "lr": 5.568969011380132e-06} +{"train_loss": 0.0006542006158269942, "global_step": 60647, "epoch": 509, "lr": 5.567952927033304e-06} +{"train_loss": 0.0003680888330563903, "global_step": 60648, "epoch": 509, "lr": 5.56693692992406e-06} +{"train_loss": 0.00034169069840572774, "global_step": 60649, "epoch": 509, "lr": 5.565921020054377e-06} +{"train_loss": 0.000218686880543828, "global_step": 60650, "epoch": 509, "lr": 5.564905197426268e-06} +{"train_loss": 0.0002954807714559138, "global_step": 60651, "epoch": 509, "lr": 5.563889462041711e-06} +{"train_loss": 0.00033712407457642257, "global_step": 60652, "epoch": 509, "lr": 5.562873813902719e-06} +{"train_loss": 0.000382770987926051, "global_step": 60653, "epoch": 509, "lr": 5.561858253011271e-06} +{"train_loss": 0.00018060703587252647, "global_step": 60654, "epoch": 509, "lr": 5.560842779369374e-06} +{"train_loss": 0.00018611870473250747, "global_step": 60655, "epoch": 509, "lr": 5.559827392979e-06} +{"train_loss": 0.00037256782525219023, "global_step": 60656, "epoch": 509, "lr": 5.558812093842175e-06} +{"train_loss": 0.0002896305522881448, "global_step": 60657, "epoch": 509, "lr": 5.5577968819608585e-06} +{"train_loss": 0.00023085239809006453, "global_step": 60658, "epoch": 509, "lr": 5.5567817573370654e-06} +{"train_loss": 0.0003348073805682361, "global_step": 60659, "epoch": 509, "lr": 5.555766719972788e-06} +{"train_loss": 0.0003282036923337728, "global_step": 60660, "epoch": 509, "lr": 5.55475176987002e-06} +{"train_loss": 0.0004709855420514941, "global_step": 60661, "epoch": 509, "lr": 5.553736907030738e-06} +{"train_loss": 0.00018898016423918307, "global_step": 60662, "epoch": 509, "lr": 5.55272213145695e-06} +{"train_loss": 0.0005592979723587632, "global_step": 60663, "epoch": 509, "lr": 5.551707443150639e-06} +{"train_loss": 0.00030162022449076176, "global_step": 60664, "epoch": 509, "lr": 5.550692842113808e-06} +{"train_loss": 0.00018533765978645533, "global_step": 60665, "epoch": 509, "lr": 5.549678328348434e-06} +{"train_loss": 0.0003868841449730098, "global_step": 60666, "epoch": 509, "lr": 5.548663901856527e-06} +{"train_loss": 0.00024538495927117765, "global_step": 60667, "epoch": 509, "lr": 5.547649562640072e-06} +{"train_loss": 0.00020880710508208722, "global_step": 60668, "epoch": 509, "lr": 5.5466353107010485e-06} +{"train_loss": 0.0005088428733870387, "global_step": 60669, "epoch": 509, "lr": 5.545621146041463e-06} +{"train_loss": 0.00025423115584999323, "global_step": 60670, "epoch": 509, "lr": 5.544607068663294e-06} +{"train_loss": 0.0004801219329237938, "global_step": 60671, "epoch": 509, "lr": 5.543593078568548e-06} +{"train_loss": 0.0002620304876472801, "global_step": 60672, "epoch": 509, "lr": 5.5425791757591995e-06} +{"train_loss": 0.0004105143598280847, "global_step": 60673, "epoch": 509, "lr": 5.541565360237255e-06} +{"train_loss": 0.00037861851160414517, "global_step": 60674, "epoch": 509, "lr": 5.540551632004698e-06} +{"train_loss": 0.000227368829655461, "global_step": 60675, "epoch": 509, "lr": 5.539537991063509e-06} +{"train_loss": 0.0003408791380934417, "global_step": 60676, "epoch": 509, "lr": 5.538524437415698e-06} +{"train_loss": 0.00022656697547063231, "global_step": 60677, "epoch": 509, "lr": 5.537510971063237e-06} +{"train_loss": 0.0002717703173402697, "global_step": 60678, "epoch": 509, "lr": 5.536497592008127e-06} +{"train_loss": 0.0003534451243467629, "global_step": 60679, "epoch": 509, "lr": 5.535484300252358e-06} +{"train_loss": 0.00033893410000018775, "global_step": 60680, "epoch": 509, "lr": 5.5344710957979e-06} +{"train_loss": 0.0003565346705727279, "global_step": 60681, "epoch": 509, "lr": 5.533457978646772e-06} +{"train_loss": 0.0005964440642856061, "global_step": 60682, "epoch": 509, "lr": 5.532444948800941e-06} +{"train_loss": 0.0004327901406213641, "global_step": 60683, "epoch": 509, "lr": 5.53143200626241e-06} +{"train_loss": 0.000317486614221707, "global_step": 60684, "epoch": 509, "lr": 5.5304191510331505e-06} +{"train_loss": 0.00031780352583155036, "global_step": 60685, "epoch": 509, "lr": 5.529406383115171e-06} +{"train_loss": 0.0006909872754476964, "global_step": 60686, "epoch": 509, "lr": 5.528393702510448e-06} +{"train_loss": 0.0002826998243108392, "global_step": 60687, "epoch": 509, "lr": 5.527381109220975e-06} +{"train_loss": 0.00047270883806049824, "global_step": 60688, "epoch": 509, "lr": 5.526368603248733e-06} +{"train_loss": 0.00037781058499069116, "global_step": 60689, "epoch": 509, "lr": 5.525356184595726e-06, "val_loss": 0.01533050648868084} +{"train_loss": 0.00026555644581094384, "global_step": 60690, "epoch": 510, "lr": 5.524343853263914e-06} +{"train_loss": 0.00047034252202138305, "global_step": 60691, "epoch": 510, "lr": 5.523331609255317e-06} +{"train_loss": 0.0002748348633758724, "global_step": 60692, "epoch": 510, "lr": 5.522319452571895e-06} +{"train_loss": 0.00023250999220181257, "global_step": 60693, "epoch": 510, "lr": 5.521307383215657e-06} +{"train_loss": 0.0004490331339184195, "global_step": 60694, "epoch": 510, "lr": 5.520295401188569e-06} +{"train_loss": 0.0004566699208226055, "global_step": 60695, "epoch": 510, "lr": 5.519283506492639e-06} +{"train_loss": 0.00029328992241062224, "global_step": 60696, "epoch": 510, "lr": 5.51827169912984e-06} +{"train_loss": 0.0002903815475292504, "global_step": 60697, "epoch": 510, "lr": 5.5172599791021686e-06} +{"train_loss": 0.0004725746694020927, "global_step": 60698, "epoch": 510, "lr": 5.516248346411601e-06} +{"train_loss": 0.00024350540479645133, "global_step": 60699, "epoch": 510, "lr": 5.51523680106012e-06} +{"train_loss": 0.0003865584440063685, "global_step": 60700, "epoch": 510, "lr": 5.514225343049728e-06} +{"train_loss": 0.0004807539808098227, "global_step": 60701, "epoch": 510, "lr": 5.5132139723823975e-06} +{"train_loss": 0.0002625027555041015, "global_step": 60702, "epoch": 510, "lr": 5.51220268906012e-06} +{"train_loss": 0.0003162545326631516, "global_step": 60703, "epoch": 510, "lr": 5.511191493084877e-06} +{"train_loss": 0.0003019833529833704, "global_step": 60704, "epoch": 510, "lr": 5.510180384458663e-06} +{"train_loss": 0.0002861499378923327, "global_step": 60705, "epoch": 510, "lr": 5.5091693631834585e-06} +{"train_loss": 0.00032956310315057635, "global_step": 60706, "epoch": 510, "lr": 5.508158429261234e-06} +{"train_loss": 0.0002449085586704314, "global_step": 60707, "epoch": 510, "lr": 5.507147582694e-06} +{"train_loss": 0.00023812179279047996, "global_step": 60708, "epoch": 510, "lr": 5.506136823483715e-06} +{"train_loss": 0.00038005554233677685, "global_step": 60709, "epoch": 510, "lr": 5.505126151632389e-06} +{"train_loss": 0.0002968020271509886, "global_step": 60710, "epoch": 510, "lr": 5.504115567141988e-06} +{"train_loss": 0.0003224496904294938, "global_step": 60711, "epoch": 510, "lr": 5.503105070014508e-06} +{"train_loss": 0.0005878121010027826, "global_step": 60712, "epoch": 510, "lr": 5.502094660251928e-06} +{"train_loss": 0.0003599297197069973, "global_step": 60713, "epoch": 510, "lr": 5.5010843378562215e-06} +{"train_loss": 0.0001742372551234439, "global_step": 60714, "epoch": 510, "lr": 5.500074102829389e-06} +{"train_loss": 0.0004713198868557811, "global_step": 60715, "epoch": 510, "lr": 5.4990639551734006e-06} +{"train_loss": 0.0004560156085062772, "global_step": 60716, "epoch": 510, "lr": 5.498053894890253e-06} +{"train_loss": 0.00021645826927851886, "global_step": 60717, "epoch": 510, "lr": 5.497043921981926e-06} +{"train_loss": 0.0005792512674815953, "global_step": 60718, "epoch": 510, "lr": 5.496034036450387e-06} +{"train_loss": 0.0002168251376133412, "global_step": 60719, "epoch": 510, "lr": 5.495024238297641e-06} +{"train_loss": 0.00031601625960320234, "global_step": 60720, "epoch": 510, "lr": 5.4940145275256484e-06} +{"train_loss": 0.0003497564175631851, "global_step": 60721, "epoch": 510, "lr": 5.493004904136406e-06} +{"train_loss": 0.0004227310710120946, "global_step": 60722, "epoch": 510, "lr": 5.491995368131903e-06} +{"train_loss": 0.00015385878214146942, "global_step": 60723, "epoch": 510, "lr": 5.490985919514102e-06} +{"train_loss": 0.0005021576653234661, "global_step": 60724, "epoch": 510, "lr": 5.4899765582850035e-06} +{"train_loss": 0.00035703007597476244, "global_step": 60725, "epoch": 510, "lr": 5.4889672844465725e-06} +{"train_loss": 0.00033118578721769154, "global_step": 60726, "epoch": 510, "lr": 5.4879580980008115e-06} +{"train_loss": 0.0003887111088261008, "global_step": 60727, "epoch": 510, "lr": 5.4869489989496756e-06} +{"train_loss": 0.0002492605708539486, "global_step": 60728, "epoch": 510, "lr": 5.485939987295169e-06} +{"train_loss": 0.0004476098110899329, "global_step": 60729, "epoch": 510, "lr": 5.484931063039267e-06} +{"train_loss": 0.00032384751830250025, "global_step": 60730, "epoch": 510, "lr": 5.483922226183935e-06} +{"train_loss": 0.00048293298459611833, "global_step": 60731, "epoch": 510, "lr": 5.482913476731177e-06} +{"train_loss": 0.0002468423335812986, "global_step": 60732, "epoch": 510, "lr": 5.481904814682947e-06} +{"train_loss": 0.00034512029378674924, "global_step": 60733, "epoch": 510, "lr": 5.480896240041256e-06} +{"train_loss": 0.00041876561590470374, "global_step": 60734, "epoch": 510, "lr": 5.47988775280806e-06} +{"train_loss": 0.00023366714594885707, "global_step": 60735, "epoch": 510, "lr": 5.478879352985356e-06} +{"train_loss": 0.0002701395424082875, "global_step": 60736, "epoch": 510, "lr": 5.477871040575116e-06} +{"train_loss": 0.0005655873101204634, "global_step": 60737, "epoch": 510, "lr": 5.476862815579314e-06} +{"train_loss": 0.00033233765861950815, "global_step": 60738, "epoch": 510, "lr": 5.475854677999942e-06} +{"train_loss": 0.0003450509684626013, "global_step": 60739, "epoch": 510, "lr": 5.4748466278389585e-06} +{"train_loss": 0.0001868082326836884, "global_step": 60740, "epoch": 510, "lr": 5.473838665098374e-06} +{"train_loss": 0.0007124891853891313, "global_step": 60741, "epoch": 510, "lr": 5.472830789780137e-06} +{"train_loss": 0.0002667434746399522, "global_step": 60742, "epoch": 510, "lr": 5.47182300188625e-06} +{"train_loss": 0.0007478339248336852, "global_step": 60743, "epoch": 510, "lr": 5.4708153014186805e-06} +{"train_loss": 0.00032563769491389394, "global_step": 60744, "epoch": 510, "lr": 5.469807688379397e-06} +{"train_loss": 0.0006260012160055339, "global_step": 60745, "epoch": 510, "lr": 5.468800162770399e-06} +{"train_loss": 0.00030315195908769965, "global_step": 60746, "epoch": 510, "lr": 5.4677927245936454e-06} +{"train_loss": 0.0003556206065695733, "global_step": 60747, "epoch": 510, "lr": 5.466785373851135e-06} +{"train_loss": 0.00030023843282833695, "global_step": 60748, "epoch": 510, "lr": 5.4657781105448334e-06} +{"train_loss": 0.00047091342275962234, "global_step": 60749, "epoch": 510, "lr": 5.464770934676705e-06} +{"train_loss": 0.00023821057402528822, "global_step": 60750, "epoch": 510, "lr": 5.463763846248754e-06} +{"train_loss": 0.0002709212130866945, "global_step": 60751, "epoch": 510, "lr": 5.46275684526294e-06} +{"train_loss": 0.0003244994150009006, "global_step": 60752, "epoch": 510, "lr": 5.461749931721244e-06} +{"train_loss": 0.00030185203650034964, "global_step": 60753, "epoch": 510, "lr": 5.460743105625643e-06} +{"train_loss": 0.0002443414705339819, "global_step": 60754, "epoch": 510, "lr": 5.4597363669781185e-06} +{"train_loss": 0.00026898123905994, "global_step": 60755, "epoch": 510, "lr": 5.458729715780636e-06} +{"train_loss": 0.0007956972112879157, "global_step": 60756, "epoch": 510, "lr": 5.457723152035177e-06} +{"train_loss": 0.00025098337209783494, "global_step": 60757, "epoch": 510, "lr": 5.456716675743734e-06} +{"train_loss": 0.00029747828375548124, "global_step": 60758, "epoch": 510, "lr": 5.455710286908255e-06} +{"train_loss": 0.00022891334083396941, "global_step": 60759, "epoch": 510, "lr": 5.45470398553074e-06} +{"train_loss": 0.0002995508839376271, "global_step": 60760, "epoch": 510, "lr": 5.453697771613147e-06} +{"train_loss": 0.00041822518687695265, "global_step": 60761, "epoch": 510, "lr": 5.452691645157471e-06} +{"train_loss": 0.0004563269321806729, "global_step": 60762, "epoch": 510, "lr": 5.451685606165674e-06} +{"train_loss": 0.0006187864346429706, "global_step": 60763, "epoch": 510, "lr": 5.450679654639718e-06} +{"train_loss": 0.00022041186457499862, "global_step": 60764, "epoch": 510, "lr": 5.449673790581611e-06} +{"train_loss": 0.0007908771513029933, "global_step": 60765, "epoch": 510, "lr": 5.448668013993297e-06} +{"train_loss": 0.000250190612860024, "global_step": 60766, "epoch": 510, "lr": 5.447662324876774e-06} +{"train_loss": 0.00018569285748526454, "global_step": 60767, "epoch": 510, "lr": 5.446656723234e-06} +{"train_loss": 0.00030084222089499235, "global_step": 60768, "epoch": 510, "lr": 5.445651209066954e-06} +{"train_loss": 0.0005551867070607841, "global_step": 60769, "epoch": 510, "lr": 5.444645782377622e-06} +{"train_loss": 0.0005830004811286926, "global_step": 60770, "epoch": 510, "lr": 5.443640443167952e-06} +{"train_loss": 0.0003304541460238397, "global_step": 60771, "epoch": 510, "lr": 5.4426351914399486e-06} +{"train_loss": 0.0002506663149688393, "global_step": 60772, "epoch": 510, "lr": 5.44163002719556e-06} +{"train_loss": 0.0003666892589535564, "global_step": 60773, "epoch": 510, "lr": 5.440624950436779e-06} +{"train_loss": 0.0003535180876497179, "global_step": 60774, "epoch": 510, "lr": 5.439619961165571e-06} +{"train_loss": 0.0002512535429559648, "global_step": 60775, "epoch": 510, "lr": 5.4386150593839e-06} +{"train_loss": 0.0002422765246592462, "global_step": 60776, "epoch": 510, "lr": 5.437610245093755e-06} +{"train_loss": 0.0004591440374497324, "global_step": 60777, "epoch": 510, "lr": 5.436605518297094e-06} +{"train_loss": 0.0003019941214006394, "global_step": 60778, "epoch": 510, "lr": 5.435600878995906e-06} +{"train_loss": 0.0001626618904992938, "global_step": 60779, "epoch": 510, "lr": 5.434596327192143e-06} +{"train_loss": 0.0002256455336464569, "global_step": 60780, "epoch": 510, "lr": 5.433591862887799e-06} +{"train_loss": 0.0002915053046308458, "global_step": 60781, "epoch": 510, "lr": 5.432587486084839e-06} +{"train_loss": 0.00027466402389109135, "global_step": 60782, "epoch": 510, "lr": 5.431583196785223e-06} +{"train_loss": 0.0003838686097878963, "global_step": 60783, "epoch": 510, "lr": 5.430578994990937e-06} +{"train_loss": 0.0005276961601339281, "global_step": 60784, "epoch": 510, "lr": 5.429574880703941e-06} +{"train_loss": 0.0007541694794781506, "global_step": 60785, "epoch": 510, "lr": 5.428570853926224e-06} +{"train_loss": 0.0004326098714955151, "global_step": 60786, "epoch": 510, "lr": 5.4275669146597315e-06} +{"train_loss": 0.0002534157538320869, "global_step": 60787, "epoch": 510, "lr": 5.426563062906465e-06} +{"train_loss": 0.0003706167044583708, "global_step": 60788, "epoch": 510, "lr": 5.42555929866837e-06} +{"train_loss": 0.0002869110321626067, "global_step": 60789, "epoch": 510, "lr": 5.4245556219474355e-06} +{"train_loss": 0.0002049087343038991, "global_step": 60790, "epoch": 510, "lr": 5.423552032745611e-06} +{"train_loss": 0.0002582112210802734, "global_step": 60791, "epoch": 510, "lr": 5.42254853106488e-06} +{"train_loss": 0.00027027103351429105, "global_step": 60792, "epoch": 510, "lr": 5.4215451169072285e-06} +{"train_loss": 0.00022262349375523627, "global_step": 60793, "epoch": 510, "lr": 5.420541790274608e-06} +{"train_loss": 0.0003782348067034036, "global_step": 60794, "epoch": 510, "lr": 5.419538551168979e-06} +{"train_loss": 0.00015428150072693825, "global_step": 60795, "epoch": 510, "lr": 5.418535399592334e-06} +{"train_loss": 0.0004140162782277912, "global_step": 60796, "epoch": 510, "lr": 5.417532335546621e-06} +{"train_loss": 0.0003884577890858054, "global_step": 60797, "epoch": 510, "lr": 5.416529359033834e-06} +{"train_loss": 0.00045834825141355395, "global_step": 60798, "epoch": 510, "lr": 5.415526470055926e-06} +{"train_loss": 0.00023527038865722716, "global_step": 60799, "epoch": 510, "lr": 5.414523668614857e-06} +{"train_loss": 0.0003535540890879929, "global_step": 60800, "epoch": 510, "lr": 5.41352095471262e-06} +{"train_loss": 0.0003541177720762789, "global_step": 60801, "epoch": 510, "lr": 5.412518328351163e-06} +{"train_loss": 0.00018560739408712834, "global_step": 60802, "epoch": 510, "lr": 5.411515789532467e-06} +{"train_loss": 0.0004977777134627104, "global_step": 60803, "epoch": 510, "lr": 5.410513338258494e-06} +{"train_loss": 0.00037489502574317157, "global_step": 60804, "epoch": 510, "lr": 5.409510974531217e-06} +{"train_loss": 0.0003347457677591592, "global_step": 60805, "epoch": 510, "lr": 5.4085086983526045e-06} +{"train_loss": 0.0004007062816526741, "global_step": 60806, "epoch": 510, "lr": 5.407506509724614e-06} +{"train_loss": 0.00022163552057463676, "global_step": 60807, "epoch": 510, "lr": 5.406504408649227e-06} +{"train_loss": 0.0003556099274203557, "global_step": 60808, "epoch": 510, "lr": 5.405502395128392e-06, "val_loss": 0.013631581328809261, "train_action_mse_error": 5.149336175236385e-06} +{"train_loss": 0.0003805801970884204, "global_step": 60809, "epoch": 511, "lr": 5.404500469164103e-06} +{"train_loss": 0.0002219653397332877, "global_step": 60810, "epoch": 511, "lr": 5.403498630758302e-06} +{"train_loss": 0.00025761648430489004, "global_step": 60811, "epoch": 511, "lr": 5.402496879912977e-06} +{"train_loss": 0.00013787888747174293, "global_step": 60812, "epoch": 511, "lr": 5.401495216630087e-06} +{"train_loss": 0.0003480133891571313, "global_step": 60813, "epoch": 511, "lr": 5.40049364091158e-06} +{"train_loss": 0.00033674659789539874, "global_step": 60814, "epoch": 511, "lr": 5.399492152759456e-06} +{"train_loss": 0.00017572940851096064, "global_step": 60815, "epoch": 511, "lr": 5.39849075217565e-06} +{"train_loss": 0.00035420761560089886, "global_step": 60816, "epoch": 511, "lr": 5.397489439162157e-06} +{"train_loss": 0.0004165636491961777, "global_step": 60817, "epoch": 511, "lr": 5.3964882137209125e-06} +{"train_loss": 0.00023627409245818853, "global_step": 60818, "epoch": 511, "lr": 5.395487075853911e-06} +{"train_loss": 0.0006762855919077992, "global_step": 60819, "epoch": 511, "lr": 5.394486025563095e-06} +{"train_loss": 0.0002904157154262066, "global_step": 60820, "epoch": 511, "lr": 5.393485062850451e-06} +{"train_loss": 0.00023527075245510787, "global_step": 60821, "epoch": 511, "lr": 5.392484187717922e-06} +{"train_loss": 0.00024838148965500295, "global_step": 60822, "epoch": 511, "lr": 5.391483400167496e-06} +{"train_loss": 0.00020616808615159243, "global_step": 60823, "epoch": 511, "lr": 5.390482700201122e-06} +{"train_loss": 0.00031809182837605476, "global_step": 60824, "epoch": 511, "lr": 5.389482087820774e-06} +{"train_loss": 0.00034290540497750044, "global_step": 60825, "epoch": 511, "lr": 5.388481563028397e-06} +{"train_loss": 0.00015670892025809735, "global_step": 60826, "epoch": 511, "lr": 5.387481125825988e-06} +{"train_loss": 0.0003351831983309239, "global_step": 60827, "epoch": 511, "lr": 5.38648077621548e-06} +{"train_loss": 0.00032828046823851764, "global_step": 60828, "epoch": 511, "lr": 5.385480514198865e-06} +{"train_loss": 0.00023965568107087165, "global_step": 60829, "epoch": 511, "lr": 5.384480339778075e-06} +{"train_loss": 0.0010493913432583213, "global_step": 60830, "epoch": 511, "lr": 5.3834802529551086e-06} +{"train_loss": 0.0003776002849917859, "global_step": 60831, "epoch": 511, "lr": 5.3824802537319084e-06} +{"train_loss": 0.00037297719973139465, "global_step": 60832, "epoch": 511, "lr": 5.3814803421104346e-06} +{"train_loss": 0.0003243916144128889, "global_step": 60833, "epoch": 511, "lr": 5.380480518092662e-06} +{"train_loss": 0.00049520906759426, "global_step": 60834, "epoch": 511, "lr": 5.379480781680546e-06} +{"train_loss": 0.0002445834397803992, "global_step": 60835, "epoch": 511, "lr": 5.3784811328760565e-06} +{"train_loss": 0.00014538886898662895, "global_step": 60836, "epoch": 511, "lr": 5.377481571681153e-06} +{"train_loss": 0.0003148743126075715, "global_step": 60837, "epoch": 511, "lr": 5.37648209809779e-06} +{"train_loss": 0.00032379437470808625, "global_step": 60838, "epoch": 511, "lr": 5.375482712127944e-06} +{"train_loss": 0.0004420802288223058, "global_step": 60839, "epoch": 511, "lr": 5.374483413773562e-06} +{"train_loss": 0.0004979649093002081, "global_step": 60840, "epoch": 511, "lr": 5.373484203036627e-06} +{"train_loss": 0.00021214930166024715, "global_step": 60841, "epoch": 511, "lr": 5.372485079919076e-06} +{"train_loss": 0.0003815111122094095, "global_step": 60842, "epoch": 511, "lr": 5.371486044422891e-06} +{"train_loss": 0.00020123440481256694, "global_step": 60843, "epoch": 511, "lr": 5.370487096550025e-06} +{"train_loss": 0.0003967819211538881, "global_step": 60844, "epoch": 511, "lr": 5.369488236302433e-06} +{"train_loss": 0.00047691771760582924, "global_step": 60845, "epoch": 511, "lr": 5.368489463682092e-06} +{"train_loss": 0.00031950988341122866, "global_step": 60846, "epoch": 511, "lr": 5.367490778690943e-06} +{"train_loss": 0.0004318417049944401, "global_step": 60847, "epoch": 511, "lr": 5.366492181330968e-06} +{"train_loss": 0.00017083024431485683, "global_step": 60848, "epoch": 511, "lr": 5.365493671604116e-06} +{"train_loss": 0.00042306986870244145, "global_step": 60849, "epoch": 511, "lr": 5.364495249512336e-06} +{"train_loss": 0.00042869275785051286, "global_step": 60850, "epoch": 511, "lr": 5.363496915057614e-06} +{"train_loss": 0.0005201370804570615, "global_step": 60851, "epoch": 511, "lr": 5.362498668241889e-06} +{"train_loss": 0.0003479112347122282, "global_step": 60852, "epoch": 511, "lr": 5.36150050906713e-06} +{"train_loss": 0.00043903113692067564, "global_step": 60853, "epoch": 511, "lr": 5.360502437535303e-06} +{"train_loss": 0.00015146183432079852, "global_step": 60854, "epoch": 511, "lr": 5.35950445364835e-06} +{"train_loss": 0.00041022637742571533, "global_step": 60855, "epoch": 511, "lr": 5.358506557408249e-06} +{"train_loss": 0.00025572715094313025, "global_step": 60856, "epoch": 511, "lr": 5.357508748816947e-06} +{"train_loss": 0.0005396536435000598, "global_step": 60857, "epoch": 511, "lr": 5.3565110278764095e-06} +{"train_loss": 0.00043409326463006437, "global_step": 60858, "epoch": 511, "lr": 5.35551339458859e-06} +{"train_loss": 0.00038719718577340245, "global_step": 60859, "epoch": 511, "lr": 5.35451584895546e-06} +{"train_loss": 0.0002371392911300063, "global_step": 60860, "epoch": 511, "lr": 5.353518390978956e-06} +{"train_loss": 0.0005372638697735965, "global_step": 60861, "epoch": 511, "lr": 5.3525210206610554e-06} +{"train_loss": 0.0006220599752850831, "global_step": 60862, "epoch": 511, "lr": 5.351523738003717e-06} +{"train_loss": 0.00028810882940888405, "global_step": 60863, "epoch": 511, "lr": 5.350526543008877e-06} +{"train_loss": 0.0002513097133487463, "global_step": 60864, "epoch": 511, "lr": 5.349529435678519e-06} +{"train_loss": 0.000842362002003938, "global_step": 60865, "epoch": 511, "lr": 5.348532416014579e-06} +{"train_loss": 0.00022491301933769137, "global_step": 60866, "epoch": 511, "lr": 5.347535484019039e-06} +{"train_loss": 0.00027085389592684805, "global_step": 60867, "epoch": 511, "lr": 5.346538639693837e-06} +{"train_loss": 0.0003648365964181721, "global_step": 60868, "epoch": 511, "lr": 5.345541883040933e-06} +{"train_loss": 0.00047537218779325485, "global_step": 60869, "epoch": 511, "lr": 5.344545214062291e-06} +{"train_loss": 0.0003235301701352, "global_step": 60870, "epoch": 511, "lr": 5.343548632759854e-06} +{"train_loss": 0.0006807356257922947, "global_step": 60871, "epoch": 511, "lr": 5.342552139135604e-06} +{"train_loss": 0.00029224029276520014, "global_step": 60872, "epoch": 511, "lr": 5.341555733191467e-06} +{"train_loss": 0.0008216766291297972, "global_step": 60873, "epoch": 511, "lr": 5.340559414929424e-06} +{"train_loss": 0.0002103478618664667, "global_step": 60874, "epoch": 511, "lr": 5.339563184351426e-06} +{"train_loss": 0.0004427000239957124, "global_step": 60875, "epoch": 511, "lr": 5.338567041459408e-06} +{"train_loss": 0.00027022906579077244, "global_step": 60876, "epoch": 511, "lr": 5.337570986255358e-06} +{"train_loss": 0.0007565270643681288, "global_step": 60877, "epoch": 511, "lr": 5.336575018741203e-06} +{"train_loss": 0.00022152956807985902, "global_step": 60878, "epoch": 511, "lr": 5.335579138918923e-06} +{"train_loss": 0.00018234866729471833, "global_step": 60879, "epoch": 511, "lr": 5.334583346790445e-06} +{"train_loss": 0.000385079940315336, "global_step": 60880, "epoch": 511, "lr": 5.333587642357757e-06} +{"train_loss": 0.0005330645362846553, "global_step": 60881, "epoch": 511, "lr": 5.332592025622796e-06} +{"train_loss": 0.00020874576875939965, "global_step": 60882, "epoch": 511, "lr": 5.33159649658751e-06} +{"train_loss": 0.00042735799797810614, "global_step": 60883, "epoch": 511, "lr": 5.330601055253876e-06} +{"train_loss": 0.00022557385091204196, "global_step": 60884, "epoch": 511, "lr": 5.329605701623819e-06} +{"train_loss": 0.000470653671072796, "global_step": 60885, "epoch": 511, "lr": 5.328610435699316e-06} +{"train_loss": 0.00023793337459210306, "global_step": 60886, "epoch": 511, "lr": 5.32761525748231e-06} +{"train_loss": 0.00045970745850354433, "global_step": 60887, "epoch": 511, "lr": 5.326620166974755e-06} +{"train_loss": 0.0006045548361726105, "global_step": 60888, "epoch": 511, "lr": 5.325625164178621e-06} +{"train_loss": 0.0002640068414621055, "global_step": 60889, "epoch": 511, "lr": 5.324630249095841e-06} +{"train_loss": 0.0007006312371231616, "global_step": 60890, "epoch": 511, "lr": 5.323635421728385e-06} +{"train_loss": 0.0005882200784981251, "global_step": 60891, "epoch": 511, "lr": 5.322640682078189e-06} +{"train_loss": 0.00042048378963954747, "global_step": 60892, "epoch": 511, "lr": 5.321646030147221e-06} +{"train_loss": 0.00022603706747759134, "global_step": 60893, "epoch": 511, "lr": 5.320651465937432e-06} +{"train_loss": 0.00022893871937412769, "global_step": 60894, "epoch": 511, "lr": 5.319656989450755e-06} +{"train_loss": 0.0007733695092611015, "global_step": 60895, "epoch": 511, "lr": 5.3186626006891725e-06} +{"train_loss": 0.0005064887227490544, "global_step": 60896, "epoch": 511, "lr": 5.317668299654615e-06} +{"train_loss": 0.00042311594006605446, "global_step": 60897, "epoch": 511, "lr": 5.316674086349049e-06} +{"train_loss": 0.00046830426435917616, "global_step": 60898, "epoch": 511, "lr": 5.315679960774406e-06} +{"train_loss": 0.00017535893130116165, "global_step": 60899, "epoch": 511, "lr": 5.314685922932666e-06} +{"train_loss": 0.00040583140798844397, "global_step": 60900, "epoch": 511, "lr": 5.313691972825769e-06} +{"train_loss": 0.00046253198524937034, "global_step": 60901, "epoch": 511, "lr": 5.31269811045565e-06} +{"train_loss": 0.0006151989218778908, "global_step": 60902, "epoch": 511, "lr": 5.3117043358242855e-06} +{"train_loss": 0.0003403102164156735, "global_step": 60903, "epoch": 511, "lr": 5.3107106489336034e-06} +{"train_loss": 0.0003360392583999783, "global_step": 60904, "epoch": 511, "lr": 5.309717049785579e-06} +{"train_loss": 0.00016580420196987689, "global_step": 60905, "epoch": 511, "lr": 5.308723538382148e-06} +{"train_loss": 0.00039627219666726887, "global_step": 60906, "epoch": 511, "lr": 5.307730114725251e-06} +{"train_loss": 0.00021244843082968146, "global_step": 60907, "epoch": 511, "lr": 5.306736778816867e-06} +{"train_loss": 0.00029294576961547136, "global_step": 60908, "epoch": 511, "lr": 5.305743530658919e-06} +{"train_loss": 0.0002890399773605168, "global_step": 60909, "epoch": 511, "lr": 5.30475037025338e-06} +{"train_loss": 0.0005217412253841758, "global_step": 60910, "epoch": 511, "lr": 5.303757297602175e-06} +{"train_loss": 0.00054441939573735, "global_step": 60911, "epoch": 511, "lr": 5.302764312707281e-06} +{"train_loss": 0.0002365741675021127, "global_step": 60912, "epoch": 511, "lr": 5.301771415570633e-06} +{"train_loss": 0.00022555276518687606, "global_step": 60913, "epoch": 511, "lr": 5.300778606194168e-06} +{"train_loss": 0.00034957489697262645, "global_step": 60914, "epoch": 511, "lr": 5.2997858845798666e-06} +{"train_loss": 0.0002789426071103662, "global_step": 60915, "epoch": 511, "lr": 5.298793250729644e-06} +{"train_loss": 0.00025562866358086467, "global_step": 60916, "epoch": 511, "lr": 5.297800704645478e-06} +{"train_loss": 0.0005223364569246769, "global_step": 60917, "epoch": 511, "lr": 5.296808246329294e-06} +{"train_loss": 0.00028048056992702186, "global_step": 60918, "epoch": 511, "lr": 5.295815875783056e-06} +{"train_loss": 0.0005760460626333952, "global_step": 60919, "epoch": 511, "lr": 5.294823593008702e-06} +{"train_loss": 0.00029637390980497, "global_step": 60920, "epoch": 511, "lr": 5.293831398008197e-06} +{"train_loss": 0.00034309393959119916, "global_step": 60921, "epoch": 511, "lr": 5.292839290783469e-06} +{"train_loss": 0.00019604926637839526, "global_step": 60922, "epoch": 511, "lr": 5.291847271336481e-06} +{"train_loss": 0.00033378854277543724, "global_step": 60923, "epoch": 511, "lr": 5.290855339669165e-06} +{"train_loss": 0.0004188126767985523, "global_step": 60924, "epoch": 511, "lr": 5.289863495783492e-06} +{"train_loss": 0.0004421778430696577, "global_step": 60925, "epoch": 511, "lr": 5.288871739681383e-06} +{"train_loss": 0.0005199663573876023, "global_step": 60926, "epoch": 511, "lr": 5.287880071364804e-06} +{"train_loss": 0.00037484458880499005, "global_step": 60927, "epoch": 511, "lr": 5.28688849083569e-06, "val_loss": 0.023414887487888336} +{"train_loss": 0.0002879809762816876, "global_step": 60928, "epoch": 512, "lr": 5.285896998096002e-06} +{"train_loss": 0.000323556741932407, "global_step": 60929, "epoch": 512, "lr": 5.284905593147671e-06} +{"train_loss": 0.0007295060786418617, "global_step": 60930, "epoch": 512, "lr": 5.283914275992657e-06} +{"train_loss": 0.00016721647989470512, "global_step": 60931, "epoch": 512, "lr": 5.282923046632904e-06} +{"train_loss": 0.00036571460077539086, "global_step": 60932, "epoch": 512, "lr": 5.281931905070342e-06} +{"train_loss": 0.00022633367916569114, "global_step": 60933, "epoch": 512, "lr": 5.2809408513069366e-06} +{"train_loss": 0.0005018031224608421, "global_step": 60934, "epoch": 512, "lr": 5.279949885344621e-06} +{"train_loss": 0.0003814218216575682, "global_step": 60935, "epoch": 512, "lr": 5.278959007185353e-06} +{"train_loss": 0.0006937736179679632, "global_step": 60936, "epoch": 512, "lr": 5.277968216831075e-06} +{"train_loss": 0.0002634644042700529, "global_step": 60937, "epoch": 512, "lr": 5.276977514283715e-06} +{"train_loss": 0.0003533806011546403, "global_step": 60938, "epoch": 512, "lr": 5.2759868995452436e-06} +{"train_loss": 0.00041442285873927176, "global_step": 60939, "epoch": 512, "lr": 5.27499637261758e-06} +{"train_loss": 0.0002444526762701571, "global_step": 60940, "epoch": 512, "lr": 5.2740059335026955e-06} +{"train_loss": 0.0005296217277646065, "global_step": 60941, "epoch": 512, "lr": 5.273015582202512e-06} +{"train_loss": 0.00033907368197105825, "global_step": 60942, "epoch": 512, "lr": 5.272025318718998e-06} +{"train_loss": 0.00018790176545735449, "global_step": 60943, "epoch": 512, "lr": 5.271035143054076e-06} +{"train_loss": 0.00023628040798939764, "global_step": 60944, "epoch": 512, "lr": 5.270045055209694e-06} +{"train_loss": 0.00035491041489876807, "global_step": 60945, "epoch": 512, "lr": 5.26905505518781e-06} +{"train_loss": 0.000248377415118739, "global_step": 60946, "epoch": 512, "lr": 5.268065142990342e-06} +{"train_loss": 0.00032258793362416327, "global_step": 60947, "epoch": 512, "lr": 5.267075318619264e-06} +{"train_loss": 0.0002892272314056754, "global_step": 60948, "epoch": 512, "lr": 5.266085582076491e-06} +{"train_loss": 0.00025941539206542075, "global_step": 60949, "epoch": 512, "lr": 5.265095933363995e-06} +{"train_loss": 0.0004445417725946754, "global_step": 60950, "epoch": 512, "lr": 5.2641063724836905e-06} +{"train_loss": 0.0004786345234606415, "global_step": 60951, "epoch": 512, "lr": 5.2631168994375425e-06} +{"train_loss": 0.00041394392610527575, "global_step": 60952, "epoch": 512, "lr": 5.262127514227477e-06} +{"train_loss": 0.0006731207249686122, "global_step": 60953, "epoch": 512, "lr": 5.261138216855454e-06} +{"train_loss": 0.00036573392571881413, "global_step": 60954, "epoch": 512, "lr": 5.260149007323401e-06} +{"train_loss": 0.00020823643717449158, "global_step": 60955, "epoch": 512, "lr": 5.259159885633269e-06} +{"train_loss": 0.00033656504820100963, "global_step": 60956, "epoch": 512, "lr": 5.258170851786992e-06} +{"train_loss": 0.00018379456014372408, "global_step": 60957, "epoch": 512, "lr": 5.257181905786524e-06} +{"train_loss": 0.000376965559553355, "global_step": 60958, "epoch": 512, "lr": 5.2561930476337895e-06} +{"train_loss": 0.00033274281304329634, "global_step": 60959, "epoch": 512, "lr": 5.25520427733075e-06} +{"train_loss": 0.0003058873990084976, "global_step": 60960, "epoch": 512, "lr": 5.2542155948793244e-06} +{"train_loss": 0.00035940538509748876, "global_step": 60961, "epoch": 512, "lr": 5.25322700028148e-06} +{"train_loss": 0.0004572432953864336, "global_step": 60962, "epoch": 512, "lr": 5.252238493539141e-06} +{"train_loss": 0.0006833345396444201, "global_step": 60963, "epoch": 512, "lr": 5.251250074654241e-06} +{"train_loss": 0.0005678928573615849, "global_step": 60964, "epoch": 512, "lr": 5.250261743628743e-06} +{"train_loss": 0.0005931141204200685, "global_step": 60965, "epoch": 512, "lr": 5.2492735004645636e-06} +{"train_loss": 0.00029277504654601216, "global_step": 60966, "epoch": 512, "lr": 5.248285345163662e-06} +{"train_loss": 0.00019796707783825696, "global_step": 60967, "epoch": 512, "lr": 5.247297277727964e-06} +{"train_loss": 0.00039388833101838827, "global_step": 60968, "epoch": 512, "lr": 5.24630929815943e-06} +{"train_loss": 0.0006307189469225705, "global_step": 60969, "epoch": 512, "lr": 5.24532140645998e-06} +{"train_loss": 0.0002991490764543414, "global_step": 60970, "epoch": 512, "lr": 5.244333602631557e-06} +{"train_loss": 0.0002847971045412123, "global_step": 60971, "epoch": 512, "lr": 5.24334588667611e-06} +{"train_loss": 0.0004106211999896914, "global_step": 60972, "epoch": 512, "lr": 5.242358258595559e-06} +{"train_loss": 0.0003860952565446496, "global_step": 60973, "epoch": 512, "lr": 5.241370718391869e-06} +{"train_loss": 0.0002440817916067317, "global_step": 60974, "epoch": 512, "lr": 5.240383266066967e-06} +{"train_loss": 0.0002262685593450442, "global_step": 60975, "epoch": 512, "lr": 5.239395901622779e-06} +{"train_loss": 0.00039609623490832746, "global_step": 60976, "epoch": 512, "lr": 5.238408625061264e-06} +{"train_loss": 0.0012583443894982338, "global_step": 60977, "epoch": 512, "lr": 5.237421436384343e-06} +{"train_loss": 0.0002961153513751924, "global_step": 60978, "epoch": 512, "lr": 5.23643433559397e-06} +{"train_loss": 0.00041112498729489744, "global_step": 60979, "epoch": 512, "lr": 5.235447322692072e-06} +{"train_loss": 0.00015580322360619903, "global_step": 60980, "epoch": 512, "lr": 5.234460397680596e-06} +{"train_loss": 0.00024488428607583046, "global_step": 60981, "epoch": 512, "lr": 5.233473560561475e-06} +{"train_loss": 0.0003521808539517224, "global_step": 60982, "epoch": 512, "lr": 5.23248681133664e-06} +{"train_loss": 0.00048395831254310906, "global_step": 60983, "epoch": 512, "lr": 5.23150015000804e-06} +{"train_loss": 0.0003849995555356145, "global_step": 60984, "epoch": 512, "lr": 5.2305135765776005e-06} +{"train_loss": 0.00037497689481824636, "global_step": 60985, "epoch": 512, "lr": 5.229527091047259e-06} +{"train_loss": 0.0001911358704091981, "global_step": 60986, "epoch": 512, "lr": 5.2285406934189706e-06} +{"train_loss": 0.0004175107169430703, "global_step": 60987, "epoch": 512, "lr": 5.227554383694649e-06} +{"train_loss": 0.0003874615940731019, "global_step": 60988, "epoch": 512, "lr": 5.226568161876255e-06} +{"train_loss": 0.0005429686862044036, "global_step": 60989, "epoch": 512, "lr": 5.225582027965698e-06} +{"train_loss": 0.0002668884990271181, "global_step": 60990, "epoch": 512, "lr": 5.224595981964936e-06} +{"train_loss": 0.00025205378187820315, "global_step": 60991, "epoch": 512, "lr": 5.223610023875891e-06} +{"train_loss": 0.00024132624093908817, "global_step": 60992, "epoch": 512, "lr": 5.222624153700512e-06} +{"train_loss": 0.0004171469481661916, "global_step": 60993, "epoch": 512, "lr": 5.221638371440724e-06} +{"train_loss": 0.0003623421071097255, "global_step": 60994, "epoch": 512, "lr": 5.220652677098453e-06} +{"train_loss": 0.00025862493203021586, "global_step": 60995, "epoch": 512, "lr": 5.21966707067566e-06} +{"train_loss": 0.00042068155016750097, "global_step": 60996, "epoch": 512, "lr": 5.21868155217426e-06} +{"train_loss": 0.00025647826259955764, "global_step": 60997, "epoch": 512, "lr": 5.217696121596199e-06} +{"train_loss": 0.0002053517528111115, "global_step": 60998, "epoch": 512, "lr": 5.216710778943401e-06} +{"train_loss": 0.000309760682284832, "global_step": 60999, "epoch": 512, "lr": 5.2157255242178185e-06} +{"train_loss": 0.00046107734669931233, "global_step": 61000, "epoch": 512, "lr": 5.214740357421372e-06} +{"train_loss": 0.0003462952154222876, "global_step": 61001, "epoch": 512, "lr": 5.213755278555987e-06} +{"train_loss": 0.0003167346294503659, "global_step": 61002, "epoch": 512, "lr": 5.212770287623619e-06} +{"train_loss": 0.00026888333377428353, "global_step": 61003, "epoch": 512, "lr": 5.211785384626184e-06} +{"train_loss": 0.00033247482497245073, "global_step": 61004, "epoch": 512, "lr": 5.2108005695656325e-06} +{"train_loss": 0.0002161558368243277, "global_step": 61005, "epoch": 512, "lr": 5.209815842443888e-06} +{"train_loss": 0.00027865084121003747, "global_step": 61006, "epoch": 512, "lr": 5.2088312032628765e-06} +{"train_loss": 0.0003421996079850942, "global_step": 61007, "epoch": 512, "lr": 5.207846652024545e-06} +{"train_loss": 0.00034938621683977544, "global_step": 61008, "epoch": 512, "lr": 5.2068621887308155e-06} +{"train_loss": 0.0002341906219953671, "global_step": 61009, "epoch": 512, "lr": 5.205877813383636e-06} +{"train_loss": 0.0005591766093857586, "global_step": 61010, "epoch": 512, "lr": 5.2048935259849215e-06} +{"train_loss": 0.0002870737516786903, "global_step": 61011, "epoch": 512, "lr": 5.203909326536621e-06} +{"train_loss": 0.00040715941577218473, "global_step": 61012, "epoch": 512, "lr": 5.20292521504066e-06} +{"train_loss": 0.0005436110659502447, "global_step": 61013, "epoch": 512, "lr": 5.20194119149896e-06} +{"train_loss": 0.0003673352475743741, "global_step": 61014, "epoch": 512, "lr": 5.200957255913469e-06} +{"train_loss": 0.0006243247771635652, "global_step": 61015, "epoch": 512, "lr": 5.199973408286108e-06} +{"train_loss": 0.00023261633759830147, "global_step": 61016, "epoch": 512, "lr": 5.198989648618818e-06} +{"train_loss": 0.0005137237603776157, "global_step": 61017, "epoch": 512, "lr": 5.198005976913517e-06} +{"train_loss": 0.0004141537065152079, "global_step": 61018, "epoch": 512, "lr": 5.197022393172152e-06} +{"train_loss": 0.00046933445264585316, "global_step": 61019, "epoch": 512, "lr": 5.196038897396643e-06} +{"train_loss": 0.00031990944989956915, "global_step": 61020, "epoch": 512, "lr": 5.195055489588924e-06} +{"train_loss": 0.0003278204530943185, "global_step": 61021, "epoch": 512, "lr": 5.1940721697509296e-06} +{"train_loss": 0.000407897838158533, "global_step": 61022, "epoch": 512, "lr": 5.193088937884582e-06} +{"train_loss": 0.0004657023528125137, "global_step": 61023, "epoch": 512, "lr": 5.192105793991831e-06} +{"train_loss": 0.000728666374925524, "global_step": 61024, "epoch": 512, "lr": 5.191122738074588e-06} +{"train_loss": 0.0002440678799757734, "global_step": 61025, "epoch": 512, "lr": 5.190139770134783e-06} +{"train_loss": 0.0005806783447042108, "global_step": 61026, "epoch": 512, "lr": 5.189156890174363e-06} +{"train_loss": 0.00025686106528155506, "global_step": 61027, "epoch": 512, "lr": 5.1881740981952305e-06} +{"train_loss": 0.0001726246118778363, "global_step": 61028, "epoch": 512, "lr": 5.187191394199342e-06} +{"train_loss": 0.0008706353837624192, "global_step": 61029, "epoch": 512, "lr": 5.186208778188606e-06} +{"train_loss": 0.0006073659169487655, "global_step": 61030, "epoch": 512, "lr": 5.185226250164971e-06} +{"train_loss": 0.0004117699572816491, "global_step": 61031, "epoch": 512, "lr": 5.184243810130357e-06} +{"train_loss": 0.00024228084657806903, "global_step": 61032, "epoch": 512, "lr": 5.183261458086686e-06} +{"train_loss": 0.0006733688060194254, "global_step": 61033, "epoch": 512, "lr": 5.1822791940359e-06} +{"train_loss": 0.00025520281633362174, "global_step": 61034, "epoch": 512, "lr": 5.181297017979908e-06} +{"train_loss": 0.0002705115475691855, "global_step": 61035, "epoch": 512, "lr": 5.180314929920665e-06} +{"train_loss": 0.0003842456208076328, "global_step": 61036, "epoch": 512, "lr": 5.1793329298600815e-06} +{"train_loss": 0.00022704846924170852, "global_step": 61037, "epoch": 512, "lr": 5.178351017800082e-06} +{"train_loss": 0.0004358086152933538, "global_step": 61038, "epoch": 512, "lr": 5.177369193742615e-06} +{"train_loss": 0.0005344089004211128, "global_step": 61039, "epoch": 512, "lr": 5.1763874576895795e-06} +{"train_loss": 0.0007808826048858464, "global_step": 61040, "epoch": 512, "lr": 5.17540580964293e-06} +{"train_loss": 0.00035734238917939365, "global_step": 61041, "epoch": 512, "lr": 5.174424249604576e-06} +{"train_loss": 0.0004955398035235703, "global_step": 61042, "epoch": 512, "lr": 5.173442777576459e-06} +{"train_loss": 0.000309739145450294, "global_step": 61043, "epoch": 512, "lr": 5.172461393560496e-06} +{"train_loss": 0.0005332473083399236, "global_step": 61044, "epoch": 512, "lr": 5.171480097558606e-06} +{"train_loss": 0.0004956695483997464, "global_step": 61045, "epoch": 512, "lr": 5.170498889572739e-06} +{"train_loss": 0.0003871648045826093, "global_step": 61046, "epoch": 512, "lr": 5.169517769604792e-06, "val_loss": 0.030792411416769028} +{"train_loss": 0.00027812522603198886, "global_step": 61047, "epoch": 513, "lr": 5.168536737656726e-06} +{"train_loss": 0.0004438218893483281, "global_step": 61048, "epoch": 513, "lr": 5.167555793730433e-06} +{"train_loss": 0.000455041037639603, "global_step": 61049, "epoch": 513, "lr": 5.166574937827867e-06} +{"train_loss": 0.0001964495168067515, "global_step": 61050, "epoch": 513, "lr": 5.165594169950927e-06} +{"train_loss": 0.00043549740803427994, "global_step": 61051, "epoch": 513, "lr": 5.164613490101566e-06} +{"train_loss": 0.0002714037836994976, "global_step": 61052, "epoch": 513, "lr": 5.16363289828169e-06} +{"train_loss": 0.0003643642703536898, "global_step": 61053, "epoch": 513, "lr": 5.162652394493234e-06} +{"train_loss": 0.000560728192795068, "global_step": 61054, "epoch": 513, "lr": 5.161671978738114e-06} +{"train_loss": 0.00017326665692962706, "global_step": 61055, "epoch": 513, "lr": 5.160691651018268e-06} +{"train_loss": 0.0005038853269070387, "global_step": 61056, "epoch": 513, "lr": 5.1597114113356045e-06} +{"train_loss": 0.00045616773422807455, "global_step": 61057, "epoch": 513, "lr": 5.158731259692068e-06} +{"train_loss": 0.0009247667039744556, "global_step": 61058, "epoch": 513, "lr": 5.1577511960895665e-06} +{"train_loss": 0.00031142905936576426, "global_step": 61059, "epoch": 513, "lr": 5.156771220530032e-06} +{"train_loss": 0.0002110200875904411, "global_step": 61060, "epoch": 513, "lr": 5.155791333015381e-06} +{"train_loss": 0.0003093275590799749, "global_step": 61061, "epoch": 513, "lr": 5.154811533547549e-06} +{"train_loss": 0.0002008871379075572, "global_step": 61062, "epoch": 513, "lr": 5.153831822128458e-06} +{"train_loss": 0.0004221505078021437, "global_step": 61063, "epoch": 513, "lr": 5.152852198760016e-06} +{"train_loss": 0.00023716043506283313, "global_step": 61064, "epoch": 513, "lr": 5.151872663444168e-06} +{"train_loss": 0.0004505995020736009, "global_step": 61065, "epoch": 513, "lr": 5.150893216182812e-06} +{"train_loss": 0.000714448862709105, "global_step": 61066, "epoch": 513, "lr": 5.1499138569779e-06} +{"train_loss": 0.0009180197375826538, "global_step": 61067, "epoch": 513, "lr": 5.1489345858313336e-06} +{"train_loss": 0.0005426466814242303, "global_step": 61068, "epoch": 513, "lr": 5.147955402745047e-06} +{"train_loss": 0.0002945398446172476, "global_step": 61069, "epoch": 513, "lr": 5.146976307720958e-06} +{"train_loss": 0.0003913816763088107, "global_step": 61070, "epoch": 513, "lr": 5.145997300760985e-06} +{"train_loss": 0.0004311471711844206, "global_step": 61071, "epoch": 513, "lr": 5.145018381867056e-06} +{"train_loss": 0.0008545674500055611, "global_step": 61072, "epoch": 513, "lr": 5.1440395510410856e-06} +{"train_loss": 0.00022019402240402997, "global_step": 61073, "epoch": 513, "lr": 5.1430608082850165e-06} +{"train_loss": 0.0005356305046007037, "global_step": 61074, "epoch": 513, "lr": 5.1420821536007465e-06} +{"train_loss": 0.00039640863542445004, "global_step": 61075, "epoch": 513, "lr": 5.141103586990203e-06} +{"train_loss": 0.000269914569798857, "global_step": 61076, "epoch": 513, "lr": 5.1401251084553185e-06} +{"train_loss": 0.00034684440470300615, "global_step": 61077, "epoch": 513, "lr": 5.139146717997989e-06} +{"train_loss": 0.0004757822316605598, "global_step": 61078, "epoch": 513, "lr": 5.13816841562017e-06} +{"train_loss": 0.00041961518581956625, "global_step": 61079, "epoch": 513, "lr": 5.13719020132375e-06} +{"train_loss": 0.0006366324378177524, "global_step": 61080, "epoch": 513, "lr": 5.13621207511068e-06} +{"train_loss": 0.0003166274109389633, "global_step": 61081, "epoch": 513, "lr": 5.135234036982861e-06} +{"train_loss": 0.00033902013092301786, "global_step": 61082, "epoch": 513, "lr": 5.134256086942202e-06} +{"train_loss": 0.0003002141020260751, "global_step": 61083, "epoch": 513, "lr": 5.133278224990645e-06} +{"train_loss": 0.00039645947981625795, "global_step": 61084, "epoch": 513, "lr": 5.132300451130112e-06} +{"train_loss": 0.00025330076459795237, "global_step": 61085, "epoch": 513, "lr": 5.131322765362501e-06} +{"train_loss": 0.00039296879549510777, "global_step": 61086, "epoch": 513, "lr": 5.130345167689754e-06} +{"train_loss": 0.0003643561212811619, "global_step": 61087, "epoch": 513, "lr": 5.129367658113771e-06} +{"train_loss": 0.0005713033606298268, "global_step": 61088, "epoch": 513, "lr": 5.128390236636493e-06} +{"train_loss": 0.0004205693257972598, "global_step": 61089, "epoch": 513, "lr": 5.127412903259815e-06} +{"train_loss": 0.00045485631562769413, "global_step": 61090, "epoch": 513, "lr": 5.1264356579856785e-06} +{"train_loss": 0.00027839848189614713, "global_step": 61091, "epoch": 513, "lr": 5.1254585008159825e-06} +{"train_loss": 0.0002494614745955914, "global_step": 61092, "epoch": 513, "lr": 5.124481431752665e-06} +{"train_loss": 0.00020810715795960277, "global_step": 61093, "epoch": 513, "lr": 5.123504450797634e-06} +{"train_loss": 0.0006141601479612291, "global_step": 61094, "epoch": 513, "lr": 5.122527557952794e-06} +{"train_loss": 0.0005211380193941295, "global_step": 61095, "epoch": 513, "lr": 5.1215507532200894e-06} +{"train_loss": 0.0007706835749559104, "global_step": 61096, "epoch": 513, "lr": 5.120574036601416e-06} +{"train_loss": 0.00039561689482070506, "global_step": 61097, "epoch": 513, "lr": 5.119597408098709e-06} +{"train_loss": 0.00028816884150728583, "global_step": 61098, "epoch": 513, "lr": 5.118620867713869e-06} +{"train_loss": 0.00016228915774263442, "global_step": 61099, "epoch": 513, "lr": 5.11764441544883e-06} +{"train_loss": 0.0003903402539435774, "global_step": 61100, "epoch": 513, "lr": 5.116668051305507e-06} +{"train_loss": 0.00024265896354336292, "global_step": 61101, "epoch": 513, "lr": 5.115691775285797e-06} +{"train_loss": 0.0003300062962807715, "global_step": 61102, "epoch": 513, "lr": 5.114715587391639e-06} +{"train_loss": 0.00026679603615775704, "global_step": 61103, "epoch": 513, "lr": 5.1137394876249354e-06} +{"train_loss": 0.00030000341939739883, "global_step": 61104, "epoch": 513, "lr": 5.112763475987614e-06} +{"train_loss": 0.00023214996326714754, "global_step": 61105, "epoch": 513, "lr": 5.1117875524815896e-06} +{"train_loss": 0.00037058271118439734, "global_step": 61106, "epoch": 513, "lr": 5.110811717108765e-06} +{"train_loss": 0.0003491722163744271, "global_step": 61107, "epoch": 513, "lr": 5.1098359698710795e-06} +{"train_loss": 0.0002975765382871032, "global_step": 61108, "epoch": 513, "lr": 5.108860310770419e-06} +{"train_loss": 0.00032692827517166734, "global_step": 61109, "epoch": 513, "lr": 5.107884739808727e-06} +{"train_loss": 0.0011549044866114855, "global_step": 61110, "epoch": 513, "lr": 5.106909256987896e-06} +{"train_loss": 0.00027637960738502443, "global_step": 61111, "epoch": 513, "lr": 5.105933862309864e-06} +{"train_loss": 0.000334464042680338, "global_step": 61112, "epoch": 513, "lr": 5.10495855577654e-06} +{"train_loss": 0.00017466311692260206, "global_step": 61113, "epoch": 513, "lr": 5.103983337389817e-06} +{"train_loss": 0.0003193432348780334, "global_step": 61114, "epoch": 513, "lr": 5.103008207151638e-06} +{"train_loss": 0.00024198944447562099, "global_step": 61115, "epoch": 513, "lr": 5.102033165063896e-06} +{"train_loss": 0.00041908136336132884, "global_step": 61116, "epoch": 513, "lr": 5.101058211128523e-06} +{"train_loss": 0.00023203680757433176, "global_step": 61117, "epoch": 513, "lr": 5.100083345347417e-06} +{"train_loss": 0.00024357455549761653, "global_step": 61118, "epoch": 513, "lr": 5.099108567722505e-06} +{"train_loss": 0.00026968520251102746, "global_step": 61119, "epoch": 513, "lr": 5.098133878255701e-06} +{"train_loss": 0.00025929237017408013, "global_step": 61120, "epoch": 513, "lr": 5.097159276948904e-06} +{"train_loss": 0.00031185903935693204, "global_step": 61121, "epoch": 513, "lr": 5.096184763804046e-06} +{"train_loss": 0.00037516967859119177, "global_step": 61122, "epoch": 513, "lr": 5.0952103388230255e-06} +{"train_loss": 0.0004009482800029218, "global_step": 61123, "epoch": 513, "lr": 5.094236002007774e-06} +{"train_loss": 0.0002695614530239254, "global_step": 61124, "epoch": 513, "lr": 5.09326175336019e-06} +{"train_loss": 0.00034327778848819435, "global_step": 61125, "epoch": 513, "lr": 5.0922875928821774e-06} +{"train_loss": 0.0005321078351698816, "global_step": 61126, "epoch": 513, "lr": 5.091313520575675e-06} +{"train_loss": 0.00023156656243372709, "global_step": 61127, "epoch": 513, "lr": 5.0903395364425676e-06} +{"train_loss": 0.00043447004281915724, "global_step": 61128, "epoch": 513, "lr": 5.089365640484789e-06} +{"train_loss": 0.0005127996555529535, "global_step": 61129, "epoch": 513, "lr": 5.088391832704237e-06} +{"train_loss": 0.00041911783046089113, "global_step": 61130, "epoch": 513, "lr": 5.087418113102837e-06} +{"train_loss": 0.0003091169928666204, "global_step": 61131, "epoch": 513, "lr": 5.086444481682495e-06} +{"train_loss": 0.0004815232241526246, "global_step": 61132, "epoch": 513, "lr": 5.085470938445108e-06} +{"train_loss": 0.0003024347824975848, "global_step": 61133, "epoch": 513, "lr": 5.084497483392614e-06} +{"train_loss": 0.00017883772670757025, "global_step": 61134, "epoch": 513, "lr": 5.083524116526895e-06} +{"train_loss": 0.0005750323180109262, "global_step": 61135, "epoch": 513, "lr": 5.082550837849892e-06} +{"train_loss": 0.000597983889747411, "global_step": 61136, "epoch": 513, "lr": 5.0815776473634945e-06} +{"train_loss": 0.0003902913013007492, "global_step": 61137, "epoch": 513, "lr": 5.080604545069623e-06} +{"train_loss": 0.00030835013603791595, "global_step": 61138, "epoch": 513, "lr": 5.079631530970192e-06} +{"train_loss": 0.0002232838305644691, "global_step": 61139, "epoch": 513, "lr": 5.078658605067093e-06} +{"train_loss": 0.000279122032225132, "global_step": 61140, "epoch": 513, "lr": 5.077685767362256e-06} +{"train_loss": 0.0003759292303584516, "global_step": 61141, "epoch": 513, "lr": 5.076713017857582e-06} +{"train_loss": 0.0006902272580191493, "global_step": 61142, "epoch": 513, "lr": 5.075740356554987e-06} +{"train_loss": 0.0006473517278209329, "global_step": 61143, "epoch": 513, "lr": 5.074767783456374e-06} +{"train_loss": 0.00016287309699691832, "global_step": 61144, "epoch": 513, "lr": 5.07379529856365e-06} +{"train_loss": 0.00025792940868996084, "global_step": 61145, "epoch": 513, "lr": 5.072822901878732e-06} +{"train_loss": 0.0004700617282651365, "global_step": 61146, "epoch": 513, "lr": 5.071850593403527e-06} +{"train_loss": 0.00047807605005800724, "global_step": 61147, "epoch": 513, "lr": 5.070878373139942e-06} +{"train_loss": 0.0005159453721717, "global_step": 61148, "epoch": 513, "lr": 5.069906241089883e-06} +{"train_loss": 0.0004962459206581116, "global_step": 61149, "epoch": 513, "lr": 5.068934197255276e-06} +{"train_loss": 0.000648524786811322, "global_step": 61150, "epoch": 513, "lr": 5.067962241638002e-06} +{"train_loss": 0.0002640916791278869, "global_step": 61151, "epoch": 513, "lr": 5.066990374239999e-06} +{"train_loss": 0.0004965864354744554, "global_step": 61152, "epoch": 513, "lr": 5.066018595063143e-06} +{"train_loss": 0.00021998779266141355, "global_step": 61153, "epoch": 513, "lr": 5.065046904109366e-06} +{"train_loss": 0.00029495195485651493, "global_step": 61154, "epoch": 513, "lr": 5.064075301380572e-06} +{"train_loss": 0.00029094002093188465, "global_step": 61155, "epoch": 513, "lr": 5.06310378687867e-06} +{"train_loss": 0.00016793067334219813, "global_step": 61156, "epoch": 513, "lr": 5.062132360605554e-06} +{"train_loss": 0.00027731055160984397, "global_step": 61157, "epoch": 513, "lr": 5.061161022563149e-06} +{"train_loss": 0.0004062031803186983, "global_step": 61158, "epoch": 513, "lr": 5.0601897727533376e-06} +{"train_loss": 0.0006536206929013133, "global_step": 61159, "epoch": 513, "lr": 5.059218611178057e-06} +{"train_loss": 0.0007798869046382606, "global_step": 61160, "epoch": 513, "lr": 5.0582475378391895e-06} +{"train_loss": 0.0004054612363688648, "global_step": 61161, "epoch": 513, "lr": 5.057276552738666e-06} +{"train_loss": 0.00043456119601614773, "global_step": 61162, "epoch": 513, "lr": 5.056305655878374e-06} +{"train_loss": 0.00017655690317042172, "global_step": 61163, "epoch": 513, "lr": 5.055334847260212e-06} +{"train_loss": 0.00029489988810382783, "global_step": 61164, "epoch": 513, "lr": 5.054364126886113e-06} +{"train_loss": 0.0003915859667335817, "global_step": 61165, "epoch": 513, "lr": 5.053393494757957e-06, "val_loss": 0.030304618179798126} +{"train_loss": 0.0006034296238794923, "global_step": 61166, "epoch": 514, "lr": 5.0524229508776665e-06} +{"train_loss": 0.00035891131847165525, "global_step": 61167, "epoch": 514, "lr": 5.051452495247139e-06} +{"train_loss": 0.0003046261554118246, "global_step": 61168, "epoch": 514, "lr": 5.050482127868289e-06} +{"train_loss": 0.0004904756788164377, "global_step": 61169, "epoch": 514, "lr": 5.049511848743016e-06} +{"train_loss": 0.0003500938764773309, "global_step": 61170, "epoch": 514, "lr": 5.048541657873213e-06} +{"train_loss": 0.00031388684874400496, "global_step": 61171, "epoch": 514, "lr": 5.047571555260805e-06} +{"train_loss": 0.0002690536202862859, "global_step": 61172, "epoch": 514, "lr": 5.046601540907681e-06} +{"train_loss": 0.00021320173982530832, "global_step": 61173, "epoch": 514, "lr": 5.04563161481576e-06} +{"train_loss": 0.0005233616102486849, "global_step": 61174, "epoch": 514, "lr": 5.044661776986936e-06} +{"train_loss": 0.00037624372635036707, "global_step": 61175, "epoch": 514, "lr": 5.043692027423108e-06} +{"train_loss": 0.00023432832676917315, "global_step": 61176, "epoch": 514, "lr": 5.042722366126201e-06} +{"train_loss": 0.0002299704501638189, "global_step": 61177, "epoch": 514, "lr": 5.041752793098092e-06} +{"train_loss": 0.00028724397998303175, "global_step": 61178, "epoch": 514, "lr": 5.040783308340713e-06} +{"train_loss": 0.0002596417907625437, "global_step": 61179, "epoch": 514, "lr": 5.039813911855939e-06} +{"train_loss": 0.0003766497829928994, "global_step": 61180, "epoch": 514, "lr": 5.038844603645698e-06} +{"train_loss": 0.00025762151926755905, "global_step": 61181, "epoch": 514, "lr": 5.037875383711871e-06} +{"train_loss": 0.00024951936211436987, "global_step": 61182, "epoch": 514, "lr": 5.036906252056384e-06} +{"train_loss": 0.0003486085624899715, "global_step": 61183, "epoch": 514, "lr": 5.0359372086811185e-06} +{"train_loss": 0.00031480882898904383, "global_step": 61184, "epoch": 514, "lr": 5.034968253587991e-06} +{"train_loss": 0.0004168521845713258, "global_step": 61185, "epoch": 514, "lr": 5.033999386778898e-06} +{"train_loss": 0.0003836912219412625, "global_step": 61186, "epoch": 514, "lr": 5.0330306082557455e-06} +{"train_loss": 0.00043829288915731013, "global_step": 61187, "epoch": 514, "lr": 5.032061918020431e-06} +{"train_loss": 0.0005643393378704786, "global_step": 61188, "epoch": 514, "lr": 5.031093316074864e-06} +{"train_loss": 0.0002689540560822934, "global_step": 61189, "epoch": 514, "lr": 5.0301248024209325e-06} +{"train_loss": 0.0003800690465141088, "global_step": 61190, "epoch": 514, "lr": 5.029156377060551e-06} +{"train_loss": 0.0003852943773381412, "global_step": 61191, "epoch": 514, "lr": 5.028188039995613e-06} +{"train_loss": 0.00016958247579168528, "global_step": 61192, "epoch": 514, "lr": 5.0272197912280325e-06} +{"train_loss": 0.0005228740046732128, "global_step": 61193, "epoch": 514, "lr": 5.0262516307596985e-06} +{"train_loss": 0.00027448992477729917, "global_step": 61194, "epoch": 514, "lr": 5.025283558592509e-06} +{"train_loss": 0.0002429519809084013, "global_step": 61195, "epoch": 514, "lr": 5.0243155747283775e-06} +{"train_loss": 0.00028782724984921515, "global_step": 61196, "epoch": 514, "lr": 5.023347679169188e-06} +{"train_loss": 0.00021705334074795246, "global_step": 61197, "epoch": 514, "lr": 5.0223798719168606e-06} +{"train_loss": 0.00016767521447036415, "global_step": 61198, "epoch": 514, "lr": 5.021412152973276e-06} +{"train_loss": 0.0004102055972907692, "global_step": 61199, "epoch": 514, "lr": 5.02044452234035e-06} +{"train_loss": 0.0003080819733440876, "global_step": 61200, "epoch": 514, "lr": 5.019476980019977e-06} +{"train_loss": 0.0004710670036729425, "global_step": 61201, "epoch": 514, "lr": 5.018509526014048e-06} +{"train_loss": 0.0003517925797495991, "global_step": 61202, "epoch": 514, "lr": 5.017542160324479e-06} +{"train_loss": 0.000435481546446681, "global_step": 61203, "epoch": 514, "lr": 5.0165748829531515e-06} +{"train_loss": 0.0003346245503053069, "global_step": 61204, "epoch": 514, "lr": 5.0156076939019806e-06} +{"train_loss": 0.0002867658040486276, "global_step": 61205, "epoch": 514, "lr": 5.014640593172848e-06} +{"train_loss": 0.00019813385733868927, "global_step": 61206, "epoch": 514, "lr": 5.013673580767675e-06} +{"train_loss": 0.0002973873633891344, "global_step": 61207, "epoch": 514, "lr": 5.012706656688349e-06} +{"train_loss": 0.0002880973624996841, "global_step": 61208, "epoch": 514, "lr": 5.0117398209367505e-06} +{"train_loss": 0.00046252948231995106, "global_step": 61209, "epoch": 514, "lr": 5.010773073514813e-06} +{"train_loss": 0.00041695829713717103, "global_step": 61210, "epoch": 514, "lr": 5.0098064144244e-06} +{"train_loss": 0.00022040822659619153, "global_step": 61211, "epoch": 514, "lr": 5.00883984366744e-06} +{"train_loss": 0.00020763535576406866, "global_step": 61212, "epoch": 514, "lr": 5.0078733612458125e-06} +{"train_loss": 0.0002665157080627978, "global_step": 61213, "epoch": 514, "lr": 5.006906967161412e-06} +{"train_loss": 0.0002794639440253377, "global_step": 61214, "epoch": 514, "lr": 5.005940661416147e-06} +{"train_loss": 0.000197658795514144, "global_step": 61215, "epoch": 514, "lr": 5.004974444011906e-06} +{"train_loss": 0.0002706224040593952, "global_step": 61216, "epoch": 514, "lr": 5.004008314950592e-06} +{"train_loss": 0.00032618612749502063, "global_step": 61217, "epoch": 514, "lr": 5.00304227423411e-06} +{"train_loss": 0.00030362606048583984, "global_step": 61218, "epoch": 514, "lr": 5.002076321864335e-06} +{"train_loss": 0.00034513164428062737, "global_step": 61219, "epoch": 514, "lr": 5.001110457843184e-06} +{"train_loss": 0.0006816716631874442, "global_step": 61220, "epoch": 514, "lr": 5.000144682172541e-06} +{"train_loss": 0.00028665002901107073, "global_step": 61221, "epoch": 514, "lr": 4.999178994854314e-06} +{"train_loss": 0.0005004771519452333, "global_step": 61222, "epoch": 514, "lr": 4.998213395890378e-06} +{"train_loss": 0.00024790148017928004, "global_step": 61223, "epoch": 514, "lr": 4.997247885282658e-06} +{"train_loss": 0.000196217602933757, "global_step": 61224, "epoch": 514, "lr": 4.996282463033025e-06} +{"train_loss": 0.0003667925193440169, "global_step": 61225, "epoch": 514, "lr": 4.995317129143384e-06} +{"train_loss": 0.0002665601787157357, "global_step": 61226, "epoch": 514, "lr": 4.994351883615634e-06} +{"train_loss": 0.0004735560214612633, "global_step": 61227, "epoch": 514, "lr": 4.993386726451654e-06} +{"train_loss": 0.00020897820650134236, "global_step": 61228, "epoch": 514, "lr": 4.992421657653368e-06} +{"train_loss": 0.0002609092916827649, "global_step": 61229, "epoch": 514, "lr": 4.991456677222639e-06} +{"train_loss": 0.00028665983700193465, "global_step": 61230, "epoch": 514, "lr": 4.990491785161383e-06} +{"train_loss": 0.00036565258051268756, "global_step": 61231, "epoch": 514, "lr": 4.989526981471493e-06} +{"train_loss": 0.00042867675074376166, "global_step": 61232, "epoch": 514, "lr": 4.9885622661548504e-06} +{"train_loss": 0.00037516842712648213, "global_step": 61233, "epoch": 514, "lr": 4.987597639213359e-06} +{"train_loss": 0.00016972536104731262, "global_step": 61234, "epoch": 514, "lr": 4.986633100648908e-06} +{"train_loss": 0.0003214057069271803, "global_step": 61235, "epoch": 514, "lr": 4.985668650463399e-06} +{"train_loss": 0.0007742905290797353, "global_step": 61236, "epoch": 514, "lr": 4.984704288658715e-06} +{"train_loss": 0.00030649008112959564, "global_step": 61237, "epoch": 514, "lr": 4.9837400152367595e-06} +{"train_loss": 0.0008443392580375075, "global_step": 61238, "epoch": 514, "lr": 4.982775830199427e-06} +{"train_loss": 0.00020033895270898938, "global_step": 61239, "epoch": 514, "lr": 4.9818117335485915e-06} +{"train_loss": 0.00031249021412804723, "global_step": 61240, "epoch": 514, "lr": 4.980847725286169e-06} +{"train_loss": 0.0004138934600632638, "global_step": 61241, "epoch": 514, "lr": 4.979883805414031e-06} +{"train_loss": 0.00040554392035119236, "global_step": 61242, "epoch": 514, "lr": 4.978919973934099e-06} +{"train_loss": 0.0004077834018971771, "global_step": 61243, "epoch": 514, "lr": 4.977956230848241e-06} +{"train_loss": 0.0002729922125581652, "global_step": 61244, "epoch": 514, "lr": 4.976992576158346e-06} +{"train_loss": 0.00015367944433819503, "global_step": 61245, "epoch": 514, "lr": 4.976029009866328e-06} +{"train_loss": 0.00040452604298479855, "global_step": 61246, "epoch": 514, "lr": 4.9750655319740545e-06} +{"train_loss": 0.0002969739434774965, "global_step": 61247, "epoch": 514, "lr": 4.974102142483445e-06} +{"train_loss": 0.00047714626998640597, "global_step": 61248, "epoch": 514, "lr": 4.973138841396363e-06} +{"train_loss": 0.0004151643661316484, "global_step": 61249, "epoch": 514, "lr": 4.97217562871472e-06} +{"train_loss": 0.0002339944039704278, "global_step": 61250, "epoch": 514, "lr": 4.971212504440392e-06} +{"train_loss": 0.0002370515139773488, "global_step": 61251, "epoch": 514, "lr": 4.970249468575277e-06} +{"train_loss": 0.0002435510978102684, "global_step": 61252, "epoch": 514, "lr": 4.9692865211212745e-06} +{"train_loss": 0.00020413397578522563, "global_step": 61253, "epoch": 514, "lr": 4.96832366208026e-06} +{"train_loss": 0.00038660652353428304, "global_step": 61254, "epoch": 514, "lr": 4.967360891454142e-06} +{"train_loss": 0.00029719568556174636, "global_step": 61255, "epoch": 514, "lr": 4.9663982092447885e-06} +{"train_loss": 0.0002533446822781116, "global_step": 61256, "epoch": 514, "lr": 4.965435615454111e-06} +{"train_loss": 0.0002684309729374945, "global_step": 61257, "epoch": 514, "lr": 4.964473110083989e-06} +{"train_loss": 0.0005497161182574928, "global_step": 61258, "epoch": 514, "lr": 4.9635106931363026e-06} +{"train_loss": 0.00023339154722634703, "global_step": 61259, "epoch": 514, "lr": 4.962548364612957e-06} +{"train_loss": 0.0004608511517290026, "global_step": 61260, "epoch": 514, "lr": 4.961586124515832e-06} +{"train_loss": 0.001014869543723762, "global_step": 61261, "epoch": 514, "lr": 4.9606239728468285e-06} +{"train_loss": 0.00019562903617043048, "global_step": 61262, "epoch": 514, "lr": 4.9596619096078325e-06} +{"train_loss": 0.0005963363801129162, "global_step": 61263, "epoch": 514, "lr": 4.958699934800714e-06} +{"train_loss": 0.00024114300322253257, "global_step": 61264, "epoch": 514, "lr": 4.957738048427391e-06} +{"train_loss": 0.00028023647610098124, "global_step": 61265, "epoch": 514, "lr": 4.9567762504897195e-06} +{"train_loss": 0.00040296840597875416, "global_step": 61266, "epoch": 514, "lr": 4.955814540989623e-06} +{"train_loss": 0.00024914671666920185, "global_step": 61267, "epoch": 514, "lr": 4.9548529199289594e-06} +{"train_loss": 0.00024442115682177246, "global_step": 61268, "epoch": 514, "lr": 4.953891387309639e-06} +{"train_loss": 0.0006045062327757478, "global_step": 61269, "epoch": 514, "lr": 4.9529299431335385e-06} +{"train_loss": 0.00023696852440480143, "global_step": 61270, "epoch": 514, "lr": 4.951968587402539e-06} +{"train_loss": 0.000287970615318045, "global_step": 61271, "epoch": 514, "lr": 4.95100732011855e-06} +{"train_loss": 0.0002582322049420327, "global_step": 61272, "epoch": 514, "lr": 4.950046141283432e-06} +{"train_loss": 0.00031321318238042295, "global_step": 61273, "epoch": 514, "lr": 4.9490850508991e-06} +{"train_loss": 0.0003889239451382309, "global_step": 61274, "epoch": 514, "lr": 4.948124048967412e-06} +{"train_loss": 0.00033558535506017506, "global_step": 61275, "epoch": 514, "lr": 4.947163135490279e-06} +{"train_loss": 0.00033840766991488636, "global_step": 61276, "epoch": 514, "lr": 4.946202310469578e-06} +{"train_loss": 0.00029791673296131194, "global_step": 61277, "epoch": 514, "lr": 4.945241573907189e-06} +{"train_loss": 0.0004937836201861501, "global_step": 61278, "epoch": 514, "lr": 4.944280925805011e-06} +{"train_loss": 0.000364618405001238, "global_step": 61279, "epoch": 514, "lr": 4.943320366164917e-06} +{"train_loss": 0.0004279662389308214, "global_step": 61280, "epoch": 514, "lr": 4.9423598949888075e-06} +{"train_loss": 0.00027636816957965493, "global_step": 61281, "epoch": 514, "lr": 4.941399512278549e-06} +{"train_loss": 0.0004395289870444685, "global_step": 61282, "epoch": 514, "lr": 4.940439218036052e-06} +{"train_loss": 0.0003469176881480962, "global_step": 61283, "epoch": 514, "lr": 4.939479012263182e-06} +{"train_loss": 0.00034618307677383275, "global_step": 61284, "epoch": 514, "lr": 4.938518894961835e-06, "val_loss": 0.02152068167924881} +{"train_loss": 0.0006999794277362525, "global_step": 61285, "epoch": 515, "lr": 4.937558866133884e-06} +{"train_loss": 0.00024431070778518915, "global_step": 61286, "epoch": 515, "lr": 4.9365989257812216e-06} +{"train_loss": 0.0003211599832866341, "global_step": 61287, "epoch": 515, "lr": 4.93563907390574e-06} +{"train_loss": 0.00024081472656689584, "global_step": 61288, "epoch": 515, "lr": 4.934679310509322e-06} +{"train_loss": 0.00020411987497936934, "global_step": 61289, "epoch": 515, "lr": 4.933719635593836e-06} +{"train_loss": 0.00041867035906761885, "global_step": 61290, "epoch": 515, "lr": 4.9327600491611834e-06} +{"train_loss": 0.0005042950506322086, "global_step": 61291, "epoch": 515, "lr": 4.931800551213234e-06} +{"train_loss": 0.0004691403009928763, "global_step": 61292, "epoch": 515, "lr": 4.93084114175189e-06} +{"train_loss": 0.00022279047698248178, "global_step": 61293, "epoch": 515, "lr": 4.92988182077902e-06} +{"train_loss": 0.0004435949376784265, "global_step": 61294, "epoch": 515, "lr": 4.928922588296509e-06} +{"train_loss": 0.00022187750437296927, "global_step": 61295, "epoch": 515, "lr": 4.927963444306249e-06} +{"train_loss": 0.00026664818869903684, "global_step": 61296, "epoch": 515, "lr": 4.927004388810108e-06} +{"train_loss": 0.0007447270909324288, "global_step": 61297, "epoch": 515, "lr": 4.926045421809988e-06} +{"train_loss": 0.00032085986458696425, "global_step": 61298, "epoch": 515, "lr": 4.9250865433077555e-06} +{"train_loss": 0.0005102480063214898, "global_step": 61299, "epoch": 515, "lr": 4.924127753305307e-06} +{"train_loss": 0.0003079850284848362, "global_step": 61300, "epoch": 515, "lr": 4.9231690518045214e-06} +{"train_loss": 0.0001864376536104828, "global_step": 61301, "epoch": 515, "lr": 4.922210438807262e-06} +{"train_loss": 0.00020258310541976243, "global_step": 61302, "epoch": 515, "lr": 4.921251914315439e-06} +{"train_loss": 0.0004723745514638722, "global_step": 61303, "epoch": 515, "lr": 4.920293478330912e-06} +{"train_loss": 0.00035498992656357586, "global_step": 61304, "epoch": 515, "lr": 4.919335130855584e-06} +{"train_loss": 0.0002329183043912053, "global_step": 61305, "epoch": 515, "lr": 4.918376871891317e-06} +{"train_loss": 0.00022065856319386512, "global_step": 61306, "epoch": 515, "lr": 4.917418701440008e-06} +{"train_loss": 0.0003450371150393039, "global_step": 61307, "epoch": 515, "lr": 4.916460619503532e-06} +{"train_loss": 0.00038729337393306196, "global_step": 61308, "epoch": 515, "lr": 4.915502626083757e-06} +{"train_loss": 0.0007934557506814599, "global_step": 61309, "epoch": 515, "lr": 4.91454472118259e-06} +{"train_loss": 0.0005529022309929132, "global_step": 61310, "epoch": 515, "lr": 4.913586904801882e-06} +{"train_loss": 0.00039809226291254163, "global_step": 61311, "epoch": 515, "lr": 4.912629176943545e-06} +{"train_loss": 0.0002452742191962898, "global_step": 61312, "epoch": 515, "lr": 4.91167153760943e-06} +{"train_loss": 0.00029773631831631064, "global_step": 61313, "epoch": 515, "lr": 4.9107139868014405e-06} +{"train_loss": 0.0003331444750074297, "global_step": 61314, "epoch": 515, "lr": 4.909756524521441e-06} +{"train_loss": 0.00025665719294920564, "global_step": 61315, "epoch": 515, "lr": 4.908799150771326e-06} +{"train_loss": 0.00031978514743968844, "global_step": 61316, "epoch": 515, "lr": 4.907841865552954e-06} +{"train_loss": 0.000253256963333115, "global_step": 61317, "epoch": 515, "lr": 4.906884668868228e-06} +{"train_loss": 0.0003088052326347679, "global_step": 61318, "epoch": 515, "lr": 4.905927560719009e-06} +{"train_loss": 0.0002309157425770536, "global_step": 61319, "epoch": 515, "lr": 4.90497054110719e-06} +{"train_loss": 0.00033181163598783314, "global_step": 61320, "epoch": 515, "lr": 4.904013610034636e-06} +{"train_loss": 0.0002846528950612992, "global_step": 61321, "epoch": 515, "lr": 4.903056767503244e-06} +{"train_loss": 0.0002599129220470786, "global_step": 61322, "epoch": 515, "lr": 4.902100013514871e-06} +{"train_loss": 0.00035648755147121847, "global_step": 61323, "epoch": 515, "lr": 4.901143348071419e-06} +{"train_loss": 0.0003171681601088494, "global_step": 61324, "epoch": 515, "lr": 4.900186771174742e-06} +{"train_loss": 0.00031436351127922535, "global_step": 61325, "epoch": 515, "lr": 4.899230282826739e-06} +{"train_loss": 0.0004199198738206178, "global_step": 61326, "epoch": 515, "lr": 4.898273883029281e-06} +{"train_loss": 0.0003246718551963568, "global_step": 61327, "epoch": 515, "lr": 4.897317571784232e-06} +{"train_loss": 0.0001620584516786039, "global_step": 61328, "epoch": 515, "lr": 4.896361349093493e-06} +{"train_loss": 0.00030943332239985466, "global_step": 61329, "epoch": 515, "lr": 4.895405214958914e-06} +{"train_loss": 0.00017470699094701558, "global_step": 61330, "epoch": 515, "lr": 4.894449169382403e-06} +{"train_loss": 0.0003070460807066411, "global_step": 61331, "epoch": 515, "lr": 4.8934932123658235e-06} +{"train_loss": 0.00041834625881165266, "global_step": 61332, "epoch": 515, "lr": 4.892537343911041e-06} +{"train_loss": 0.00038315291749313474, "global_step": 61333, "epoch": 515, "lr": 4.891581564019954e-06} +{"train_loss": 0.00025213032495230436, "global_step": 61334, "epoch": 515, "lr": 4.8906258726944155e-06} +{"train_loss": 0.00022779652499593794, "global_step": 61335, "epoch": 515, "lr": 4.889670269936319e-06} +{"train_loss": 0.0002660990576259792, "global_step": 61336, "epoch": 515, "lr": 4.888714755747531e-06} +{"train_loss": 0.0003711508761625737, "global_step": 61337, "epoch": 515, "lr": 4.887759330129943e-06} +{"train_loss": 0.0005177180282771587, "global_step": 61338, "epoch": 515, "lr": 4.886803993085415e-06} +{"train_loss": 0.00029502841061912477, "global_step": 61339, "epoch": 515, "lr": 4.885848744615823e-06} +{"train_loss": 0.0003838533884845674, "global_step": 61340, "epoch": 515, "lr": 4.8848935847230545e-06} +{"train_loss": 0.00037424135371111333, "global_step": 61341, "epoch": 515, "lr": 4.88393851340897e-06} +{"train_loss": 0.00020516129734460264, "global_step": 61342, "epoch": 515, "lr": 4.882983530675461e-06} +{"train_loss": 0.00029441702645272017, "global_step": 61343, "epoch": 515, "lr": 4.882028636524394e-06} +{"train_loss": 0.0002905670553445816, "global_step": 61344, "epoch": 515, "lr": 4.881073830957627e-06} +{"train_loss": 0.00040203009848482907, "global_step": 61345, "epoch": 515, "lr": 4.880119113977072e-06} +{"train_loss": 0.0004043793596792966, "global_step": 61346, "epoch": 515, "lr": 4.879164485584564e-06} +{"train_loss": 0.00032520346576347947, "global_step": 61347, "epoch": 515, "lr": 4.878209945782003e-06} +{"train_loss": 0.0004574156191665679, "global_step": 61348, "epoch": 515, "lr": 4.877255494571265e-06} +{"train_loss": 0.0003009852662216872, "global_step": 61349, "epoch": 515, "lr": 4.876301131954203e-06} +{"train_loss": 0.00024287181440740824, "global_step": 61350, "epoch": 515, "lr": 4.875346857932711e-06} +{"train_loss": 0.0002808560384437442, "global_step": 61351, "epoch": 515, "lr": 4.874392672508648e-06} +{"train_loss": 0.00023130534100346267, "global_step": 61352, "epoch": 515, "lr": 4.873438575683903e-06} +{"train_loss": 0.0004919967614114285, "global_step": 61353, "epoch": 515, "lr": 4.8724845674603285e-06} +{"train_loss": 0.0003508135268930346, "global_step": 61354, "epoch": 515, "lr": 4.871530647839823e-06} +{"train_loss": 0.00022027446539141238, "global_step": 61355, "epoch": 515, "lr": 4.870576816824235e-06} +{"train_loss": 0.00040378636913374066, "global_step": 61356, "epoch": 515, "lr": 4.869623074415458e-06} +{"train_loss": 0.0005070685874670744, "global_step": 61357, "epoch": 515, "lr": 4.868669420615352e-06} +{"train_loss": 0.0003398758708499372, "global_step": 61358, "epoch": 515, "lr": 4.867715855425781e-06} +{"train_loss": 0.00033792329486459494, "global_step": 61359, "epoch": 515, "lr": 4.866762378848643e-06} +{"train_loss": 0.0002280981425428763, "global_step": 61360, "epoch": 515, "lr": 4.865808990885784e-06} +{"train_loss": 0.0003291958710178733, "global_step": 61361, "epoch": 515, "lr": 4.864855691539094e-06} +{"train_loss": 0.00028787271003238857, "global_step": 61362, "epoch": 515, "lr": 4.863902480810439e-06} +{"train_loss": 0.0006246979464776814, "global_step": 61363, "epoch": 515, "lr": 4.862949358701685e-06} +{"train_loss": 0.00029909072327427566, "global_step": 61364, "epoch": 515, "lr": 4.861996325214713e-06} +{"train_loss": 0.00030536047415807843, "global_step": 61365, "epoch": 515, "lr": 4.861043380351376e-06} +{"train_loss": 0.0003316843940410763, "global_step": 61366, "epoch": 515, "lr": 4.8600905241135755e-06} +{"train_loss": 0.0007695857784710824, "global_step": 61367, "epoch": 515, "lr": 4.859137756503146e-06} +{"train_loss": 0.00036441005067899823, "global_step": 61368, "epoch": 515, "lr": 4.858185077521993e-06} +{"train_loss": 0.0006514846463687718, "global_step": 61369, "epoch": 515, "lr": 4.85723248717197e-06} +{"train_loss": 0.00015973133849911392, "global_step": 61370, "epoch": 515, "lr": 4.8562799854549364e-06} +{"train_loss": 0.00038554443744942546, "global_step": 61371, "epoch": 515, "lr": 4.855327572372786e-06} +{"train_loss": 0.00032077275682240725, "global_step": 61372, "epoch": 515, "lr": 4.854375247927367e-06} +{"train_loss": 0.00021925852342974395, "global_step": 61373, "epoch": 515, "lr": 4.853423012120567e-06} +{"train_loss": 0.00023478285584133118, "global_step": 61374, "epoch": 515, "lr": 4.852470864954239e-06} +{"train_loss": 0.00025614554760977626, "global_step": 61375, "epoch": 515, "lr": 4.851518806430272e-06} +{"train_loss": 0.0007154960767365992, "global_step": 61376, "epoch": 515, "lr": 4.850566836550524e-06} +{"train_loss": 0.00020806847896892577, "global_step": 61377, "epoch": 515, "lr": 4.849614955316856e-06} +{"train_loss": 0.0001957377971848473, "global_step": 61378, "epoch": 515, "lr": 4.8486631627311544e-06} +{"train_loss": 0.00042451792978681624, "global_step": 61379, "epoch": 515, "lr": 4.847711458795267e-06} +{"train_loss": 0.00017210257647093385, "global_step": 61380, "epoch": 515, "lr": 4.846759843511084e-06} +{"train_loss": 0.00023329009127337486, "global_step": 61381, "epoch": 515, "lr": 4.845808316880457e-06} +{"train_loss": 0.00019277572573628277, "global_step": 61382, "epoch": 515, "lr": 4.844856878905269e-06} +{"train_loss": 0.00021963563631288707, "global_step": 61383, "epoch": 515, "lr": 4.843905529587373e-06} +{"train_loss": 0.0002581045846454799, "global_step": 61384, "epoch": 515, "lr": 4.84295426892864e-06} +{"train_loss": 0.0004870904958806932, "global_step": 61385, "epoch": 515, "lr": 4.8420030969309584e-06} +{"train_loss": 0.00020777330792043358, "global_step": 61386, "epoch": 515, "lr": 4.841052013596164e-06} +{"train_loss": 0.0004203902499284595, "global_step": 61387, "epoch": 515, "lr": 4.840101018926152e-06} +{"train_loss": 0.0002535964304115623, "global_step": 61388, "epoch": 515, "lr": 4.839150112922774e-06} +{"train_loss": 0.000254214828601107, "global_step": 61389, "epoch": 515, "lr": 4.838199295587892e-06} +{"train_loss": 0.00032640009885653853, "global_step": 61390, "epoch": 515, "lr": 4.8372485669233915e-06} +{"train_loss": 0.00021802395349368453, "global_step": 61391, "epoch": 515, "lr": 4.836297926931116e-06} +{"train_loss": 0.00025204994017258286, "global_step": 61392, "epoch": 515, "lr": 4.8353473756129585e-06} +{"train_loss": 0.00023383811640087515, "global_step": 61393, "epoch": 515, "lr": 4.834396912970757e-06} +{"train_loss": 0.00032990341424010694, "global_step": 61394, "epoch": 515, "lr": 4.833446539006403e-06} +{"train_loss": 0.0002951631904579699, "global_step": 61395, "epoch": 515, "lr": 4.832496253721752e-06} +{"train_loss": 0.00026462634559720755, "global_step": 61396, "epoch": 515, "lr": 4.831546057118663e-06} +{"train_loss": 0.0002342741354368627, "global_step": 61397, "epoch": 515, "lr": 4.8305959491990125e-06} +{"train_loss": 0.00037719443207606673, "global_step": 61398, "epoch": 515, "lr": 4.829645929964655e-06} +{"train_loss": 0.0006074990378692746, "global_step": 61399, "epoch": 515, "lr": 4.828695999417471e-06} +{"train_loss": 0.00023824106028769165, "global_step": 61400, "epoch": 515, "lr": 4.827746157559315e-06} +{"train_loss": 0.00014759025361854583, "global_step": 61401, "epoch": 515, "lr": 4.826796404392042e-06} +{"train_loss": 0.0003824423183687031, "global_step": 61402, "epoch": 515, "lr": 4.825846739917539e-06} +{"train_loss": 0.0003345603542255645, "global_step": 61403, "epoch": 515, "lr": 4.824897164137654e-06, "val_loss": 0.029268398880958557, "train_action_mse_error": 6.61016520098201e-06} +{"train_loss": 0.0006128111854195595, "global_step": 61404, "epoch": 516, "lr": 4.823947677054263e-06} +{"train_loss": 0.00019505697127897292, "global_step": 61405, "epoch": 516, "lr": 4.822998278669216e-06} +{"train_loss": 0.0005229451926425099, "global_step": 61406, "epoch": 516, "lr": 4.822048968984394e-06} +{"train_loss": 0.0001496900658821687, "global_step": 61407, "epoch": 516, "lr": 4.821099748001657e-06} +{"train_loss": 0.00014239635493140668, "global_step": 61408, "epoch": 516, "lr": 4.820150615722851e-06} +{"train_loss": 0.00018916842236649245, "global_step": 61409, "epoch": 516, "lr": 4.819201572149862e-06} +{"train_loss": 0.000289456220343709, "global_step": 61410, "epoch": 516, "lr": 4.81825261728453e-06} +{"train_loss": 0.00029818236362189054, "global_step": 61411, "epoch": 516, "lr": 4.817303751128749e-06} +{"train_loss": 0.00037420698208734393, "global_step": 61412, "epoch": 516, "lr": 4.81635497368435e-06} +{"train_loss": 0.0002904580323956907, "global_step": 61413, "epoch": 516, "lr": 4.815406284953222e-06} +{"train_loss": 0.0005567061598412693, "global_step": 61414, "epoch": 516, "lr": 4.814457684937207e-06} +{"train_loss": 0.0002640542224980891, "global_step": 61415, "epoch": 516, "lr": 4.813509173638187e-06} +{"train_loss": 0.00030091425287537277, "global_step": 61416, "epoch": 516, "lr": 4.812560751058004e-06} +{"train_loss": 0.00033161055762320757, "global_step": 61417, "epoch": 516, "lr": 4.811612417198541e-06} +{"train_loss": 0.0006536443834193051, "global_step": 61418, "epoch": 516, "lr": 4.810664172061641e-06} +{"train_loss": 0.00039000011747702956, "global_step": 61419, "epoch": 516, "lr": 4.80971601564918e-06} +{"train_loss": 0.0003248995344620198, "global_step": 61420, "epoch": 516, "lr": 4.808767947963011e-06} +{"train_loss": 0.0003874133399222046, "global_step": 61421, "epoch": 516, "lr": 4.807819969005001e-06} +{"train_loss": 0.00017916511569637805, "global_step": 61422, "epoch": 516, "lr": 4.806872078777003e-06} +{"train_loss": 0.0001777323632268235, "global_step": 61423, "epoch": 516, "lr": 4.805924277280888e-06} +{"train_loss": 0.0005643786862492561, "global_step": 61424, "epoch": 516, "lr": 4.804976564518504e-06} +{"train_loss": 0.0004474147572182119, "global_step": 61425, "epoch": 516, "lr": 4.8040289404917336e-06} +{"train_loss": 0.00031825510086491704, "global_step": 61426, "epoch": 516, "lr": 4.80308140520242e-06} +{"train_loss": 0.0003005493199452758, "global_step": 61427, "epoch": 516, "lr": 4.802133958652422e-06} +{"train_loss": 0.000525555806234479, "global_step": 61428, "epoch": 516, "lr": 4.8011866008436105e-06} +{"train_loss": 0.0003141855413559824, "global_step": 61429, "epoch": 516, "lr": 4.800239331777834e-06} +{"train_loss": 0.00030331825837492943, "global_step": 61430, "epoch": 516, "lr": 4.799292151456969e-06} +{"train_loss": 0.0002908480819314718, "global_step": 61431, "epoch": 516, "lr": 4.798345059882864e-06} +{"train_loss": 0.0005715519073419273, "global_step": 61432, "epoch": 516, "lr": 4.797398057057367e-06} +{"train_loss": 0.0003049929509870708, "global_step": 61433, "epoch": 516, "lr": 4.7964511429823614e-06} +{"train_loss": 0.00035903576645068824, "global_step": 61434, "epoch": 516, "lr": 4.795504317659682e-06} +{"train_loss": 0.0006589156691916287, "global_step": 61435, "epoch": 516, "lr": 4.7945575810912136e-06} +{"train_loss": 0.0002645152562763542, "global_step": 61436, "epoch": 516, "lr": 4.7936109332787915e-06} +{"train_loss": 0.00016241839330177754, "global_step": 61437, "epoch": 516, "lr": 4.792664374224293e-06} +{"train_loss": 0.00041144280112348497, "global_step": 61438, "epoch": 516, "lr": 4.791717903929571e-06} +{"train_loss": 0.00035285146441310644, "global_step": 61439, "epoch": 516, "lr": 4.79077152239647e-06} +{"train_loss": 0.000292874698061496, "global_step": 61440, "epoch": 516, "lr": 4.789825229626871e-06} +{"train_loss": 0.00039426758303306997, "global_step": 61441, "epoch": 516, "lr": 4.788879025622606e-06} +{"train_loss": 0.00019378693832550198, "global_step": 61442, "epoch": 516, "lr": 4.787932910385562e-06} +{"train_loss": 0.0004540513036772609, "global_step": 61443, "epoch": 516, "lr": 4.786986883917565e-06} +{"train_loss": 0.00025586754782125354, "global_step": 61444, "epoch": 516, "lr": 4.786040946220504e-06} +{"train_loss": 0.0005094977677799761, "global_step": 61445, "epoch": 516, "lr": 4.7850950972962104e-06} +{"train_loss": 0.000255044549703598, "global_step": 61446, "epoch": 516, "lr": 4.784149337146565e-06} +{"train_loss": 0.0002519771514926106, "global_step": 61447, "epoch": 516, "lr": 4.783203665773395e-06} +{"train_loss": 0.00033666653325781226, "global_step": 61448, "epoch": 516, "lr": 4.782258083178587e-06} +{"train_loss": 0.0004530263540800661, "global_step": 61449, "epoch": 516, "lr": 4.781312589363979e-06} +{"train_loss": 0.0004605816793628037, "global_step": 61450, "epoch": 516, "lr": 4.780367184331436e-06} +{"train_loss": 0.0007999401423148811, "global_step": 61451, "epoch": 516, "lr": 4.779421868082806e-06} +{"train_loss": 0.00020304090867284685, "global_step": 61452, "epoch": 516, "lr": 4.778476640619955e-06} +{"train_loss": 0.0005958712426945567, "global_step": 61453, "epoch": 516, "lr": 4.7775315019447266e-06} +{"train_loss": 0.0002546693431213498, "global_step": 61454, "epoch": 516, "lr": 4.7765864520589955e-06} +{"train_loss": 0.00028563692467287183, "global_step": 61455, "epoch": 516, "lr": 4.775641490964594e-06} +{"train_loss": 0.00030600393074564636, "global_step": 61456, "epoch": 516, "lr": 4.774696618663399e-06} +{"train_loss": 0.0002959592966362834, "global_step": 61457, "epoch": 516, "lr": 4.773751835157253e-06} +{"train_loss": 0.00016273927758447826, "global_step": 61458, "epoch": 516, "lr": 4.7728071404480045e-06} +{"train_loss": 0.00041025999234989285, "global_step": 61459, "epoch": 516, "lr": 4.77186253453753e-06} +{"train_loss": 0.0003014336107298732, "global_step": 61460, "epoch": 516, "lr": 4.770918017427661e-06} +{"train_loss": 0.0004260859568603337, "global_step": 61461, "epoch": 516, "lr": 4.769973589120269e-06} +{"train_loss": 0.0005089994519948959, "global_step": 61462, "epoch": 516, "lr": 4.769029249617208e-06} +{"train_loss": 0.0003190278948750347, "global_step": 61463, "epoch": 516, "lr": 4.768084998920313e-06} +{"train_loss": 0.0005268939421512187, "global_step": 61464, "epoch": 516, "lr": 4.767140837031458e-06} +{"train_loss": 0.00028016712167300284, "global_step": 61465, "epoch": 516, "lr": 4.76619676395248e-06} +{"train_loss": 0.0006684661493636668, "global_step": 61466, "epoch": 516, "lr": 4.765252779685253e-06} +{"train_loss": 0.0003380725102033466, "global_step": 61467, "epoch": 516, "lr": 4.764308884231611e-06} +{"train_loss": 0.0003524462808854878, "global_step": 61468, "epoch": 516, "lr": 4.763365077593429e-06} +{"train_loss": 0.00016126796253956854, "global_step": 61469, "epoch": 516, "lr": 4.762421359772539e-06} +{"train_loss": 0.0005916225491091609, "global_step": 61470, "epoch": 516, "lr": 4.761477730770797e-06} +{"train_loss": 0.0003666697593871504, "global_step": 61471, "epoch": 516, "lr": 4.760534190590071e-06} +{"train_loss": 0.00044429791159927845, "global_step": 61472, "epoch": 516, "lr": 4.759590739232189e-06} +{"train_loss": 0.00030338193755596876, "global_step": 61473, "epoch": 516, "lr": 4.758647376699032e-06} +{"train_loss": 0.000224514544242993, "global_step": 61474, "epoch": 516, "lr": 4.757704102992422e-06} +{"train_loss": 0.00048390161828137934, "global_step": 61475, "epoch": 516, "lr": 4.756760918114239e-06} +{"train_loss": 0.0002619781589601189, "global_step": 61476, "epoch": 516, "lr": 4.755817822066322e-06} +{"train_loss": 0.00035910875885747373, "global_step": 61477, "epoch": 516, "lr": 4.754874814850519e-06} +{"train_loss": 0.0002909853064920753, "global_step": 61478, "epoch": 516, "lr": 4.753931896468689e-06} +{"train_loss": 0.00041859049815684557, "global_step": 61479, "epoch": 516, "lr": 4.75298906692267e-06} +{"train_loss": 0.0005041823606006801, "global_step": 61480, "epoch": 516, "lr": 4.7520463262143266e-06} +{"train_loss": 0.00048510869964957237, "global_step": 61481, "epoch": 516, "lr": 4.751103674345514e-06} +{"train_loss": 0.0005681197508238256, "global_step": 61482, "epoch": 516, "lr": 4.750161111318063e-06} +{"train_loss": 0.0004629447066690773, "global_step": 61483, "epoch": 516, "lr": 4.749218637133851e-06} +{"train_loss": 0.0008967961766757071, "global_step": 61484, "epoch": 516, "lr": 4.7482762517947035e-06} +{"train_loss": 0.000803115894086659, "global_step": 61485, "epoch": 516, "lr": 4.7473339553024855e-06} +{"train_loss": 0.0003598382754717022, "global_step": 61486, "epoch": 516, "lr": 4.7463917476590406e-06} +{"train_loss": 0.00033736511250026524, "global_step": 61487, "epoch": 516, "lr": 4.745449628866222e-06} +{"train_loss": 0.0002077875251416117, "global_step": 61488, "epoch": 516, "lr": 4.744507598925885e-06} +{"train_loss": 0.0002664584608282894, "global_step": 61489, "epoch": 516, "lr": 4.74356565783986e-06} +{"train_loss": 0.00018522789468988776, "global_step": 61490, "epoch": 516, "lr": 4.7426238056100196e-06} +{"train_loss": 0.000675913121085614, "global_step": 61491, "epoch": 516, "lr": 4.741682042238194e-06} +{"train_loss": 0.0004816250002477318, "global_step": 61492, "epoch": 516, "lr": 4.740740367726248e-06} +{"train_loss": 0.0003066854551434517, "global_step": 61493, "epoch": 516, "lr": 4.739798782076016e-06} +{"train_loss": 0.00045487858005799353, "global_step": 61494, "epoch": 516, "lr": 4.738857285289361e-06} +{"train_loss": 0.00022625079145655036, "global_step": 61495, "epoch": 516, "lr": 4.737915877368121e-06} +{"train_loss": 0.00018838231335394084, "global_step": 61496, "epoch": 516, "lr": 4.736974558314144e-06} +{"train_loss": 0.00040065610664896667, "global_step": 61497, "epoch": 516, "lr": 4.736033328129291e-06} +{"train_loss": 0.00039628130616620183, "global_step": 61498, "epoch": 516, "lr": 4.735092186815388e-06} +{"train_loss": 0.00039144192123785615, "global_step": 61499, "epoch": 516, "lr": 4.734151134374304e-06} +{"train_loss": 0.00044551503378897905, "global_step": 61500, "epoch": 516, "lr": 4.733210170807883e-06} +{"train_loss": 0.0003930412058252841, "global_step": 61501, "epoch": 516, "lr": 4.732269296117958e-06} +{"train_loss": 0.0006028114585205913, "global_step": 61502, "epoch": 516, "lr": 4.731328510306393e-06} +{"train_loss": 0.0004628689493983984, "global_step": 61503, "epoch": 516, "lr": 4.73038781337502e-06} +{"train_loss": 0.0003864917962346226, "global_step": 61504, "epoch": 516, "lr": 4.729447205325699e-06} +{"train_loss": 0.0004023243091069162, "global_step": 61505, "epoch": 516, "lr": 4.728506686160267e-06} +{"train_loss": 0.00039556363481096923, "global_step": 61506, "epoch": 516, "lr": 4.7275662558805885e-06} +{"train_loss": 0.0002780411159619689, "global_step": 61507, "epoch": 516, "lr": 4.726625914488492e-06} +{"train_loss": 0.0004093596071470529, "global_step": 61508, "epoch": 516, "lr": 4.725685661985818e-06} +{"train_loss": 0.0003467245551291853, "global_step": 61509, "epoch": 516, "lr": 4.724745498374439e-06} +{"train_loss": 0.00048702105414122343, "global_step": 61510, "epoch": 516, "lr": 4.723805423656169e-06} +{"train_loss": 0.0003163624496664852, "global_step": 61511, "epoch": 516, "lr": 4.722865437832885e-06} +{"train_loss": 0.0002086147287627682, "global_step": 61512, "epoch": 516, "lr": 4.721925540906402e-06} +{"train_loss": 0.0006645827670581639, "global_step": 61513, "epoch": 516, "lr": 4.7209857328785965e-06} +{"train_loss": 0.0006761407712474465, "global_step": 61514, "epoch": 516, "lr": 4.720046013751284e-06} +{"train_loss": 0.0004741908051073551, "global_step": 61515, "epoch": 516, "lr": 4.719106383526328e-06} +{"train_loss": 0.0004643592401407659, "global_step": 61516, "epoch": 516, "lr": 4.718166842205579e-06} +{"train_loss": 0.00023194080858957022, "global_step": 61517, "epoch": 516, "lr": 4.717227389790857e-06} +{"train_loss": 0.00033125144545920193, "global_step": 61518, "epoch": 516, "lr": 4.716288026284033e-06} +{"train_loss": 0.0003194592136424035, "global_step": 61519, "epoch": 516, "lr": 4.715348751686944e-06} +{"train_loss": 0.00023855669132899493, "global_step": 61520, "epoch": 516, "lr": 4.714409566001416e-06} +{"train_loss": 0.0002992133377119899, "global_step": 61521, "epoch": 516, "lr": 4.713470469229314e-06} +{"train_loss": 0.00038419994148973594, "global_step": 61522, "epoch": 516, "lr": 4.712531461372466e-06, "val_loss": 0.03296903520822525} +{"train_loss": 0.0004049092240165919, "global_step": 61523, "epoch": 517, "lr": 4.711592542432736e-06} +{"train_loss": 0.00041224429151043296, "global_step": 61524, "epoch": 517, "lr": 4.71065371241195e-06} +{"train_loss": 0.0004278209526091814, "global_step": 61525, "epoch": 517, "lr": 4.709714971311957e-06} +{"train_loss": 0.00023128261091187596, "global_step": 61526, "epoch": 517, "lr": 4.708776319134606e-06} +{"train_loss": 0.000612009025644511, "global_step": 61527, "epoch": 517, "lr": 4.707837755881727e-06} +{"train_loss": 0.00023364994558505714, "global_step": 61528, "epoch": 517, "lr": 4.706899281555177e-06} +{"train_loss": 0.0005033224588260055, "global_step": 61529, "epoch": 517, "lr": 4.705960896156781e-06} +{"train_loss": 0.00047581284889020026, "global_step": 61530, "epoch": 517, "lr": 4.7050225996883966e-06} +{"train_loss": 0.0004499669303186238, "global_step": 61531, "epoch": 517, "lr": 4.704084392151869e-06} +{"train_loss": 0.00018376967636868358, "global_step": 61532, "epoch": 517, "lr": 4.703146273549019e-06} +{"train_loss": 0.00021349370945245028, "global_step": 61533, "epoch": 517, "lr": 4.702208243881711e-06} +{"train_loss": 0.0003928568330593407, "global_step": 61534, "epoch": 517, "lr": 4.701270303151773e-06} +{"train_loss": 0.00026789517141878605, "global_step": 61535, "epoch": 517, "lr": 4.700332451361056e-06} +{"train_loss": 0.00017527730960864574, "global_step": 61536, "epoch": 517, "lr": 4.699394688511388e-06} +{"train_loss": 0.0005729915574193001, "global_step": 61537, "epoch": 517, "lr": 4.698457014604629e-06} +{"train_loss": 0.00022394991538021713, "global_step": 61538, "epoch": 517, "lr": 4.6975194296426104e-06} +{"train_loss": 0.00019394072296563536, "global_step": 61539, "epoch": 517, "lr": 4.696581933627164e-06} +{"train_loss": 0.00025876666768454015, "global_step": 61540, "epoch": 517, "lr": 4.69564452656015e-06} +{"train_loss": 0.0003641600487753749, "global_step": 61541, "epoch": 517, "lr": 4.694707208443383e-06} +{"train_loss": 0.000475612236186862, "global_step": 61542, "epoch": 517, "lr": 4.6937699792787335e-06} +{"train_loss": 0.00041201073327101767, "global_step": 61543, "epoch": 517, "lr": 4.692832839068012e-06} +{"train_loss": 0.0001729058858472854, "global_step": 61544, "epoch": 517, "lr": 4.691895787813083e-06} +{"train_loss": 0.00016213086200878024, "global_step": 61545, "epoch": 517, "lr": 4.690958825515767e-06} +{"train_loss": 0.0004363691550679505, "global_step": 61546, "epoch": 517, "lr": 4.690021952177925e-06} +{"train_loss": 0.0002146796468878165, "global_step": 61547, "epoch": 517, "lr": 4.689085167801372e-06} +{"train_loss": 0.00019146798877045512, "global_step": 61548, "epoch": 517, "lr": 4.688148472387971e-06} +{"train_loss": 0.0004715943068731576, "global_step": 61549, "epoch": 517, "lr": 4.687211865939539e-06} +{"train_loss": 0.0002463643904775381, "global_step": 61550, "epoch": 517, "lr": 4.686275348457936e-06} +{"train_loss": 0.0004581321554724127, "global_step": 61551, "epoch": 517, "lr": 4.685338919944976e-06} +{"train_loss": 0.00030574543052352965, "global_step": 61552, "epoch": 517, "lr": 4.68440258040253e-06} +{"train_loss": 0.0006071598618291318, "global_step": 61553, "epoch": 517, "lr": 4.683466329832403e-06} +{"train_loss": 0.00048252716078422964, "global_step": 61554, "epoch": 517, "lr": 4.68253016823646e-06} +{"train_loss": 0.00018028976046480238, "global_step": 61555, "epoch": 517, "lr": 4.681594095616515e-06} +{"train_loss": 0.0002729855477809906, "global_step": 61556, "epoch": 517, "lr": 4.6806581119744285e-06} +{"train_loss": 0.00029147902387194335, "global_step": 61557, "epoch": 517, "lr": 4.679722217312032e-06} +{"train_loss": 0.00021737185306847095, "global_step": 61558, "epoch": 517, "lr": 4.678786411631148e-06} +{"train_loss": 0.00026504043489694595, "global_step": 61559, "epoch": 517, "lr": 4.677850694933633e-06} +{"train_loss": 0.00034655019408091903, "global_step": 61560, "epoch": 517, "lr": 4.676915067221305e-06} +{"train_loss": 0.00016701703134458512, "global_step": 61561, "epoch": 517, "lr": 4.675979528496028e-06} +{"train_loss": 0.00020773302821908146, "global_step": 61562, "epoch": 517, "lr": 4.675044078759605e-06} +{"train_loss": 0.0001463353110011667, "global_step": 61563, "epoch": 517, "lr": 4.674108718013909e-06} +{"train_loss": 0.00029934552730992436, "global_step": 61564, "epoch": 517, "lr": 4.673173446260753e-06} +{"train_loss": 0.0002501570852473378, "global_step": 61565, "epoch": 517, "lr": 4.6722382635019715e-06} +{"train_loss": 0.00028486046358011663, "global_step": 61566, "epoch": 517, "lr": 4.671303169739416e-06} +{"train_loss": 0.00021130425739102066, "global_step": 61567, "epoch": 517, "lr": 4.670368164974903e-06} +{"train_loss": 0.00035590320476330817, "global_step": 61568, "epoch": 517, "lr": 4.669433249210292e-06} +{"train_loss": 0.00048185396008193493, "global_step": 61569, "epoch": 517, "lr": 4.6684984224474035e-06} +{"train_loss": 0.0001732234813971445, "global_step": 61570, "epoch": 517, "lr": 4.667563684688064e-06} +{"train_loss": 0.00022008562518749386, "global_step": 61571, "epoch": 517, "lr": 4.666629035934133e-06} +{"train_loss": 0.00042908755131065845, "global_step": 61572, "epoch": 517, "lr": 4.665694476187421e-06} +{"train_loss": 0.00028149172430858016, "global_step": 61573, "epoch": 517, "lr": 4.664760005449787e-06} +{"train_loss": 0.00047863577492535114, "global_step": 61574, "epoch": 517, "lr": 4.66382562372304e-06} +{"train_loss": 0.00027881551068276167, "global_step": 61575, "epoch": 517, "lr": 4.662891331009039e-06} +{"train_loss": 0.001076473854482174, "global_step": 61576, "epoch": 517, "lr": 4.661957127309613e-06} +{"train_loss": 0.00036311271833255887, "global_step": 61577, "epoch": 517, "lr": 4.661023012626576e-06} +{"train_loss": 0.0006424932507798076, "global_step": 61578, "epoch": 517, "lr": 4.660088986961775e-06} +{"train_loss": 0.00022506601817440242, "global_step": 61579, "epoch": 517, "lr": 4.659155050317054e-06} +{"train_loss": 0.00041783819324336946, "global_step": 61580, "epoch": 517, "lr": 4.658221202694235e-06} +{"train_loss": 0.0003876855771522969, "global_step": 61581, "epoch": 517, "lr": 4.65728744409516e-06} +{"train_loss": 0.00025780100258998573, "global_step": 61582, "epoch": 517, "lr": 4.656353774521649e-06} +{"train_loss": 0.00013949703134130687, "global_step": 61583, "epoch": 517, "lr": 4.655420193975552e-06} +{"train_loss": 0.0005175520200282335, "global_step": 61584, "epoch": 517, "lr": 4.654486702458682e-06} +{"train_loss": 0.00042957160621881485, "global_step": 61585, "epoch": 517, "lr": 4.65355329997289e-06} +{"train_loss": 0.0002712483983486891, "global_step": 61586, "epoch": 517, "lr": 4.652619986519996e-06} +{"train_loss": 0.0003255166229791939, "global_step": 61587, "epoch": 517, "lr": 4.651686762101848e-06} +{"train_loss": 0.0005432105390354991, "global_step": 61588, "epoch": 517, "lr": 4.6507536267202666e-06} +{"train_loss": 0.00031279673567041755, "global_step": 61589, "epoch": 517, "lr": 4.649820580377079e-06} +{"train_loss": 0.00031823976314626634, "global_step": 61590, "epoch": 517, "lr": 4.648887623074127e-06} +{"train_loss": 0.00043774105142802, "global_step": 61591, "epoch": 517, "lr": 4.647954754813238e-06} +{"train_loss": 0.00033047582837753, "global_step": 61592, "epoch": 517, "lr": 4.64702197559625e-06} +{"train_loss": 0.00027770601445809007, "global_step": 61593, "epoch": 517, "lr": 4.646089285424976e-06} +{"train_loss": 0.0002594008983578533, "global_step": 61594, "epoch": 517, "lr": 4.645156684301272e-06} +{"train_loss": 0.000389254855690524, "global_step": 61595, "epoch": 517, "lr": 4.644224172226963e-06} +{"train_loss": 0.0005650988314300776, "global_step": 61596, "epoch": 517, "lr": 4.643291749203859e-06} +{"train_loss": 0.0005214004777371883, "global_step": 61597, "epoch": 517, "lr": 4.6423594152338155e-06} +{"train_loss": 0.000359637284418568, "global_step": 61598, "epoch": 517, "lr": 4.641427170318646e-06} +{"train_loss": 0.0003350492042955011, "global_step": 61599, "epoch": 517, "lr": 4.6404950144601996e-06} +{"train_loss": 0.00025944403023459017, "global_step": 61600, "epoch": 517, "lr": 4.639562947660292e-06} +{"train_loss": 0.00040382222505286336, "global_step": 61601, "epoch": 517, "lr": 4.6386309699207485e-06} +{"train_loss": 0.00020510893955361098, "global_step": 61602, "epoch": 517, "lr": 4.637699081243413e-06} +{"train_loss": 0.0003215497126802802, "global_step": 61603, "epoch": 517, "lr": 4.636767281630106e-06} +{"train_loss": 0.00031482515623793006, "global_step": 61604, "epoch": 517, "lr": 4.635835571082664e-06} +{"train_loss": 0.00044341973261907697, "global_step": 61605, "epoch": 517, "lr": 4.634903949602904e-06} +{"train_loss": 0.00034611980663612485, "global_step": 61606, "epoch": 517, "lr": 4.633972417192678e-06} +{"train_loss": 0.0005757704493589699, "global_step": 61607, "epoch": 517, "lr": 4.633040973853791e-06} +{"train_loss": 0.0003639548958744854, "global_step": 61608, "epoch": 517, "lr": 4.632109619588082e-06} +{"train_loss": 0.00023850348952692002, "global_step": 61609, "epoch": 517, "lr": 4.631178354397381e-06} +{"train_loss": 0.00031651524477638304, "global_step": 61610, "epoch": 517, "lr": 4.630247178283509e-06} +{"train_loss": 0.00043206370901316404, "global_step": 61611, "epoch": 517, "lr": 4.629316091248309e-06} +{"train_loss": 0.00048099004197865725, "global_step": 61612, "epoch": 517, "lr": 4.6283850932935855e-06} +{"train_loss": 0.00029990437906235456, "global_step": 61613, "epoch": 517, "lr": 4.627454184421187e-06} +{"train_loss": 0.00016952017904259264, "global_step": 61614, "epoch": 517, "lr": 4.62652336463294e-06} +{"train_loss": 0.0003600688942242414, "global_step": 61615, "epoch": 517, "lr": 4.625592633930659e-06} +{"train_loss": 0.00038948917062953115, "global_step": 61616, "epoch": 517, "lr": 4.6246619923161925e-06} +{"train_loss": 0.00038880747160874307, "global_step": 61617, "epoch": 517, "lr": 4.62373143979134e-06} +{"train_loss": 0.000275011028861627, "global_step": 61618, "epoch": 517, "lr": 4.622800976357955e-06} +{"train_loss": 0.00017442580428905785, "global_step": 61619, "epoch": 517, "lr": 4.6218706020178474e-06} +{"train_loss": 0.0003749484312720597, "global_step": 61620, "epoch": 517, "lr": 4.620940316772842e-06} +{"train_loss": 0.00046712910989299417, "global_step": 61621, "epoch": 517, "lr": 4.620010120624785e-06} +{"train_loss": 0.00044850129052065313, "global_step": 61622, "epoch": 517, "lr": 4.619080013575477e-06} +{"train_loss": 0.00018490200454834849, "global_step": 61623, "epoch": 517, "lr": 4.61814999562677e-06} +{"train_loss": 0.00027382178814150393, "global_step": 61624, "epoch": 517, "lr": 4.617220066780464e-06} +{"train_loss": 0.0005450351163744926, "global_step": 61625, "epoch": 517, "lr": 4.616290227038411e-06} +{"train_loss": 0.00042284352821297944, "global_step": 61626, "epoch": 517, "lr": 4.615360476402425e-06} +{"train_loss": 0.0003742568369489163, "global_step": 61627, "epoch": 517, "lr": 4.6144308148743155e-06} +{"train_loss": 0.0003171409189235419, "global_step": 61628, "epoch": 517, "lr": 4.613501242455937e-06} +{"train_loss": 0.00029134159558452666, "global_step": 61629, "epoch": 517, "lr": 4.6125717591490865e-06} +{"train_loss": 0.0002834083279594779, "global_step": 61630, "epoch": 517, "lr": 4.61164236495561e-06} +{"train_loss": 0.0004088565765414387, "global_step": 61631, "epoch": 517, "lr": 4.610713059877319e-06} +{"train_loss": 0.00038601510459557176, "global_step": 61632, "epoch": 517, "lr": 4.6097838439160545e-06} +{"train_loss": 0.00038019343628548086, "global_step": 61633, "epoch": 517, "lr": 4.608854717073624e-06} +{"train_loss": 0.00039829275920055807, "global_step": 61634, "epoch": 517, "lr": 4.607925679351854e-06} +{"train_loss": 0.00038858471089042723, "global_step": 61635, "epoch": 517, "lr": 4.606996730752583e-06} +{"train_loss": 0.0002731245185714215, "global_step": 61636, "epoch": 517, "lr": 4.606067871277608e-06} +{"train_loss": 0.00037750491173937917, "global_step": 61637, "epoch": 517, "lr": 4.6051391009287845e-06} +{"train_loss": 0.00039949530037119985, "global_step": 61638, "epoch": 517, "lr": 4.604210419707922e-06} +{"train_loss": 0.00019624424749054015, "global_step": 61639, "epoch": 517, "lr": 4.603281827616829e-06} +{"train_loss": 0.0002666484797373414, "global_step": 61640, "epoch": 517, "lr": 4.602353324657349e-06} +{"train_loss": 0.00034702758580160587, "global_step": 61641, "epoch": 517, "lr": 4.601424910831292e-06, "val_loss": 0.05979235842823982} +{"train_loss": 0.00038841302739456296, "global_step": 61642, "epoch": 518, "lr": 4.600496586140501e-06} +{"train_loss": 0.00021158020535949618, "global_step": 61643, "epoch": 518, "lr": 4.599568350586769e-06} +{"train_loss": 0.00033344788243994117, "global_step": 61644, "epoch": 518, "lr": 4.598640204171944e-06} +{"train_loss": 0.00047429659753106534, "global_step": 61645, "epoch": 518, "lr": 4.597712146897837e-06} +{"train_loss": 0.00019630664610303938, "global_step": 61646, "epoch": 518, "lr": 4.596784178766272e-06} +{"train_loss": 0.0002665273495949805, "global_step": 61647, "epoch": 518, "lr": 4.5958562997790665e-06} +{"train_loss": 0.00024084147298708558, "global_step": 61648, "epoch": 518, "lr": 4.5949285099380405e-06} +{"train_loss": 0.0002704482467379421, "global_step": 61649, "epoch": 518, "lr": 4.594000809245036e-06} +{"train_loss": 0.00022941516363061965, "global_step": 61650, "epoch": 518, "lr": 4.5930731977018585e-06} +{"train_loss": 0.00017808920529205352, "global_step": 61651, "epoch": 518, "lr": 4.592145675310322e-06} +{"train_loss": 0.00041916206828318536, "global_step": 61652, "epoch": 518, "lr": 4.591218242072265e-06} +{"train_loss": 0.0001610939798410982, "global_step": 61653, "epoch": 518, "lr": 4.590290897989491e-06} +{"train_loss": 0.00019420038734097034, "global_step": 61654, "epoch": 518, "lr": 4.5893636430638375e-06} +{"train_loss": 0.00030012684874236584, "global_step": 61655, "epoch": 518, "lr": 4.588436477297109e-06} +{"train_loss": 0.0005056145018897951, "global_step": 61656, "epoch": 518, "lr": 4.5875094006911475e-06} +{"train_loss": 0.000312209187541157, "global_step": 61657, "epoch": 518, "lr": 4.586582413247753e-06} +{"train_loss": 0.00021854584338143468, "global_step": 61658, "epoch": 518, "lr": 4.585655514968745e-06} +{"train_loss": 0.000545353745110333, "global_step": 61659, "epoch": 518, "lr": 4.584728705855962e-06} +{"train_loss": 0.00033714884193614125, "global_step": 61660, "epoch": 518, "lr": 4.5838019859112016e-06} +{"train_loss": 0.00024378590751439333, "global_step": 61661, "epoch": 518, "lr": 4.582875355136301e-06} +{"train_loss": 0.0001502323430031538, "global_step": 61662, "epoch": 518, "lr": 4.581948813533066e-06} +{"train_loss": 0.0003621151263359934, "global_step": 61663, "epoch": 518, "lr": 4.581022361103332e-06} +{"train_loss": 0.00033696836908347905, "global_step": 61664, "epoch": 518, "lr": 4.580095997848904e-06} +{"train_loss": 0.0004028320836368948, "global_step": 61665, "epoch": 518, "lr": 4.579169723771598e-06} +{"train_loss": 0.00040736625669524074, "global_step": 61666, "epoch": 518, "lr": 4.57824353887325e-06} +{"train_loss": 0.00022915328736416996, "global_step": 61667, "epoch": 518, "lr": 4.57731744315566e-06} +{"train_loss": 0.0002887444570660591, "global_step": 61668, "epoch": 518, "lr": 4.576391436620664e-06} +{"train_loss": 0.00021384820865932852, "global_step": 61669, "epoch": 518, "lr": 4.575465519270067e-06} +{"train_loss": 0.0001615878863958642, "global_step": 61670, "epoch": 518, "lr": 4.5745396911056835e-06} +{"train_loss": 0.0004922025837004185, "global_step": 61671, "epoch": 518, "lr": 4.573613952129352e-06} +{"train_loss": 0.00017970266344491392, "global_step": 61672, "epoch": 518, "lr": 4.572688302342859e-06} +{"train_loss": 0.000888059614226222, "global_step": 61673, "epoch": 518, "lr": 4.571762741748053e-06} +{"train_loss": 0.0004940260550938547, "global_step": 61674, "epoch": 518, "lr": 4.570837270346728e-06} +{"train_loss": 0.00019257554959040135, "global_step": 61675, "epoch": 518, "lr": 4.569911888140721e-06} +{"train_loss": 0.0001986863644560799, "global_step": 61676, "epoch": 518, "lr": 4.568986595131824e-06} +{"train_loss": 0.0002488621976226568, "global_step": 61677, "epoch": 518, "lr": 4.568061391321882e-06} +{"train_loss": 0.0006210992578417063, "global_step": 61678, "epoch": 518, "lr": 4.5671362767126916e-06} +{"train_loss": 0.0002353495656279847, "global_step": 61679, "epoch": 518, "lr": 4.5662112513060794e-06} +{"train_loss": 0.00030439288821071386, "global_step": 61680, "epoch": 518, "lr": 4.56528631510385e-06} +{"train_loss": 0.00019179344235453755, "global_step": 61681, "epoch": 518, "lr": 4.564361468107836e-06} +{"train_loss": 0.0002571311197243631, "global_step": 61682, "epoch": 518, "lr": 4.563436710319835e-06} +{"train_loss": 0.0005096428794786334, "global_step": 61683, "epoch": 518, "lr": 4.562512041741679e-06} +{"train_loss": 0.00020394304010551423, "global_step": 61684, "epoch": 518, "lr": 4.561587462375166e-06} +{"train_loss": 0.000488107034470886, "global_step": 61685, "epoch": 518, "lr": 4.560662972222135e-06} +{"train_loss": 0.0002919753605965525, "global_step": 61686, "epoch": 518, "lr": 4.559738571284378e-06} +{"train_loss": 0.00022330257343128324, "global_step": 61687, "epoch": 518, "lr": 4.558814259563726e-06} +{"train_loss": 0.0002743881777860224, "global_step": 61688, "epoch": 518, "lr": 4.55789003706199e-06} +{"train_loss": 0.0003904994227923453, "global_step": 61689, "epoch": 518, "lr": 4.556965903780974e-06} +{"train_loss": 0.0002549265627749264, "global_step": 61690, "epoch": 518, "lr": 4.556041859722509e-06} +{"train_loss": 0.00039169940282590687, "global_step": 61691, "epoch": 518, "lr": 4.55511790488839e-06} +{"train_loss": 0.0003764408465940505, "global_step": 61692, "epoch": 518, "lr": 4.554194039280451e-06} +{"train_loss": 0.0005518364487215877, "global_step": 61693, "epoch": 518, "lr": 4.553270262900494e-06} +{"train_loss": 0.0002955083327833563, "global_step": 61694, "epoch": 518, "lr": 4.552346575750338e-06} +{"train_loss": 0.00037026326754130423, "global_step": 61695, "epoch": 518, "lr": 4.551422977831793e-06} +{"train_loss": 0.0002936058153863996, "global_step": 61696, "epoch": 518, "lr": 4.550499469146668e-06} +{"train_loss": 0.00023009632423054427, "global_step": 61697, "epoch": 518, "lr": 4.549576049696791e-06} +{"train_loss": 0.00023892491299193352, "global_step": 61698, "epoch": 518, "lr": 4.548652719483959e-06} +{"train_loss": 0.0003149811818730086, "global_step": 61699, "epoch": 518, "lr": 4.5477294785099935e-06} +{"train_loss": 0.00021666893735527992, "global_step": 61700, "epoch": 518, "lr": 4.5468063267767035e-06} +{"train_loss": 0.0003122914640698582, "global_step": 61701, "epoch": 518, "lr": 4.545883264285905e-06} +{"train_loss": 0.00035056620254181325, "global_step": 61702, "epoch": 518, "lr": 4.544960291039413e-06} +{"train_loss": 0.0005619926378130913, "global_step": 61703, "epoch": 518, "lr": 4.544037407039026e-06} +{"train_loss": 0.0009624816593714058, "global_step": 61704, "epoch": 518, "lr": 4.543114612286576e-06} +{"train_loss": 0.0004315570113249123, "global_step": 61705, "epoch": 518, "lr": 4.542191906783855e-06} +{"train_loss": 0.00023763977515045553, "global_step": 61706, "epoch": 518, "lr": 4.54126929053269e-06} +{"train_loss": 0.0003002985322382301, "global_step": 61707, "epoch": 518, "lr": 4.540346763534886e-06} +{"train_loss": 0.0002349240385228768, "global_step": 61708, "epoch": 518, "lr": 4.539424325792246e-06} +{"train_loss": 0.0006568895187228918, "global_step": 61709, "epoch": 518, "lr": 4.538501977306603e-06} +{"train_loss": 0.00024820928229019046, "global_step": 61710, "epoch": 518, "lr": 4.537579718079738e-06} +{"train_loss": 0.0002756153990048915, "global_step": 61711, "epoch": 518, "lr": 4.536657548113482e-06} +{"train_loss": 0.0001852514105848968, "global_step": 61712, "epoch": 518, "lr": 4.535735467409652e-06} +{"train_loss": 0.0002761673822533339, "global_step": 61713, "epoch": 518, "lr": 4.53481347597004e-06} +{"train_loss": 0.00047565283603034914, "global_step": 61714, "epoch": 518, "lr": 4.5338915737964724e-06} +{"train_loss": 0.00022154430916998535, "global_step": 61715, "epoch": 518, "lr": 4.532969760890737e-06} +{"train_loss": 0.0002861810498870909, "global_step": 61716, "epoch": 518, "lr": 4.532048037254677e-06} +{"train_loss": 0.00038424815284088254, "global_step": 61717, "epoch": 518, "lr": 4.531126402890068e-06} +{"train_loss": 0.0003887904167640954, "global_step": 61718, "epoch": 518, "lr": 4.530204857798742e-06} +{"train_loss": 0.00030192703707143664, "global_step": 61719, "epoch": 518, "lr": 4.529283401982503e-06} +{"train_loss": 0.00021044386085122824, "global_step": 61720, "epoch": 518, "lr": 4.528362035443151e-06} +{"train_loss": 0.00027478006086312234, "global_step": 61721, "epoch": 518, "lr": 4.527440758182511e-06} +{"train_loss": 0.0004476330941542983, "global_step": 61722, "epoch": 518, "lr": 4.52651957020237e-06} +{"train_loss": 0.0002816604683175683, "global_step": 61723, "epoch": 518, "lr": 4.525598471504566e-06} +{"train_loss": 0.0004734140238724649, "global_step": 61724, "epoch": 518, "lr": 4.524677462090876e-06} +{"train_loss": 0.0002124856400769204, "global_step": 61725, "epoch": 518, "lr": 4.523756541963137e-06} +{"train_loss": 0.00038551315083168447, "global_step": 61726, "epoch": 518, "lr": 4.522835711123141e-06} +{"train_loss": 0.0006298633525148034, "global_step": 61727, "epoch": 518, "lr": 4.521914969572688e-06} +{"train_loss": 0.0005408466095104814, "global_step": 61728, "epoch": 518, "lr": 4.520994317313604e-06} +{"train_loss": 0.0006018158746883273, "global_step": 61729, "epoch": 518, "lr": 4.520073754347687e-06} +{"train_loss": 0.00024274919996969402, "global_step": 61730, "epoch": 518, "lr": 4.519153280676752e-06} +{"train_loss": 0.00046911678509786725, "global_step": 61731, "epoch": 518, "lr": 4.518232896302587e-06} +{"train_loss": 0.000280505046248436, "global_step": 61732, "epoch": 518, "lr": 4.517312601227025e-06} +{"train_loss": 0.00021170669060666114, "global_step": 61733, "epoch": 518, "lr": 4.5163923954518626e-06} +{"train_loss": 0.00046403511078096926, "global_step": 61734, "epoch": 518, "lr": 4.515472278978894e-06} +{"train_loss": 0.00028824707260355353, "global_step": 61735, "epoch": 518, "lr": 4.514552251809944e-06} +{"train_loss": 0.0005431391764432192, "global_step": 61736, "epoch": 518, "lr": 4.5136323139468084e-06} +{"train_loss": 0.00022826397616881877, "global_step": 61737, "epoch": 518, "lr": 4.5127124653913e-06} +{"train_loss": 0.00036490551428869367, "global_step": 61738, "epoch": 518, "lr": 4.511792706145218e-06} +{"train_loss": 0.000386888044886291, "global_step": 61739, "epoch": 518, "lr": 4.510873036210367e-06} +{"train_loss": 0.00045334655442275107, "global_step": 61740, "epoch": 518, "lr": 4.509953455588567e-06} +{"train_loss": 0.00040540233021602035, "global_step": 61741, "epoch": 518, "lr": 4.509033964281601e-06} +{"train_loss": 0.0004095410695299506, "global_step": 61742, "epoch": 518, "lr": 4.508114562291299e-06} +{"train_loss": 0.00032519802334718406, "global_step": 61743, "epoch": 518, "lr": 4.507195249619439e-06} +{"train_loss": 0.0004985948908142745, "global_step": 61744, "epoch": 518, "lr": 4.5062760262678585e-06} +{"train_loss": 0.0002474802895449102, "global_step": 61745, "epoch": 518, "lr": 4.505356892238327e-06} +{"train_loss": 0.0002718295727390796, "global_step": 61746, "epoch": 518, "lr": 4.504437847532672e-06} +{"train_loss": 0.0003088408848270774, "global_step": 61747, "epoch": 518, "lr": 4.503518892152703e-06} +{"train_loss": 0.0006241396768018603, "global_step": 61748, "epoch": 518, "lr": 4.502600026100201e-06} +{"train_loss": 0.00041504346881993115, "global_step": 61749, "epoch": 518, "lr": 4.501681249376994e-06} +{"train_loss": 0.0002783542440738529, "global_step": 61750, "epoch": 518, "lr": 4.500762561984867e-06} +{"train_loss": 0.0003382417489774525, "global_step": 61751, "epoch": 518, "lr": 4.499843963925643e-06} +{"train_loss": 0.000388806511182338, "global_step": 61752, "epoch": 518, "lr": 4.4989254552011084e-06} +{"train_loss": 0.00023741887707728893, "global_step": 61753, "epoch": 518, "lr": 4.498007035813068e-06} +{"train_loss": 0.00036032023490406573, "global_step": 61754, "epoch": 518, "lr": 4.497088705763336e-06} +{"train_loss": 0.00022768479539081454, "global_step": 61755, "epoch": 518, "lr": 4.4961704650537e-06} +{"train_loss": 0.00047741911839693785, "global_step": 61756, "epoch": 518, "lr": 4.4952523136859824e-06} +{"train_loss": 0.0005842407699674368, "global_step": 61757, "epoch": 518, "lr": 4.49433425166198e-06} +{"train_loss": 0.00016524497186765075, "global_step": 61758, "epoch": 518, "lr": 4.4934162789834756e-06} +{"train_loss": 0.00020080052490811795, "global_step": 61759, "epoch": 518, "lr": 4.492498395652295e-06} +{"train_loss": 0.00034576246124582696, "global_step": 61760, "epoch": 518, "lr": 4.4915806016702256e-06, "val_loss": 0.04200589284300804} +{"train_loss": 0.00034715174115262926, "global_step": 61761, "epoch": 519, "lr": 4.4906628970390826e-06} +{"train_loss": 0.0002601669984869659, "global_step": 61762, "epoch": 519, "lr": 4.489745281760655e-06} +{"train_loss": 0.0002463757700752467, "global_step": 61763, "epoch": 519, "lr": 4.488827755836761e-06} +{"train_loss": 0.0001836895098676905, "global_step": 61764, "epoch": 519, "lr": 4.487910319269189e-06} +{"train_loss": 0.00028627028223127127, "global_step": 61765, "epoch": 519, "lr": 4.4869929720597335e-06} +{"train_loss": 0.00019367063941899687, "global_step": 61766, "epoch": 519, "lr": 4.486075714210214e-06} +{"train_loss": 0.0004889810807071626, "global_step": 61767, "epoch": 519, "lr": 4.485158545722412e-06} +{"train_loss": 0.0004720425931736827, "global_step": 61768, "epoch": 519, "lr": 4.484241466598149e-06} +{"train_loss": 0.0006997577729634941, "global_step": 61769, "epoch": 519, "lr": 4.4833244768392176e-06} +{"train_loss": 0.000584710855036974, "global_step": 61770, "epoch": 519, "lr": 4.482407576447406e-06} +{"train_loss": 0.0002714429865591228, "global_step": 61771, "epoch": 519, "lr": 4.481490765424528e-06} +{"train_loss": 0.00035911606391891837, "global_step": 61772, "epoch": 519, "lr": 4.480574043772379e-06} +{"train_loss": 0.00037488137604668736, "global_step": 61773, "epoch": 519, "lr": 4.47965741149276e-06} +{"train_loss": 0.0002457777736708522, "global_step": 61774, "epoch": 519, "lr": 4.478740868587467e-06} +{"train_loss": 0.0003461181477177888, "global_step": 61775, "epoch": 519, "lr": 4.477824415058313e-06} +{"train_loss": 0.00016707854229025543, "global_step": 61776, "epoch": 519, "lr": 4.4769080509070745e-06} +{"train_loss": 0.0003624562523327768, "global_step": 61777, "epoch": 519, "lr": 4.475991776135579e-06} +{"train_loss": 0.00044703285675495863, "global_step": 61778, "epoch": 519, "lr": 4.475075590745598e-06} +{"train_loss": 0.0003047354693990201, "global_step": 61779, "epoch": 519, "lr": 4.47415949473895e-06} +{"train_loss": 0.0004418842145241797, "global_step": 61780, "epoch": 519, "lr": 4.473243488117418e-06} +{"train_loss": 0.0002893425989896059, "global_step": 61781, "epoch": 519, "lr": 4.472327570882806e-06} +{"train_loss": 0.0003814449009951204, "global_step": 61782, "epoch": 519, "lr": 4.471411743036924e-06} +{"train_loss": 0.00034620266524143517, "global_step": 61783, "epoch": 519, "lr": 4.4704960045815645e-06} +{"train_loss": 0.0002751847787294537, "global_step": 61784, "epoch": 519, "lr": 4.46958035551851e-06} +{"train_loss": 0.00028099550399929285, "global_step": 61785, "epoch": 519, "lr": 4.468664795849581e-06} +{"train_loss": 0.0004365684580989182, "global_step": 61786, "epoch": 519, "lr": 4.467749325576559e-06} +{"train_loss": 0.0003814604424405843, "global_step": 61787, "epoch": 519, "lr": 4.466833944701249e-06} +{"train_loss": 0.0003733153862413019, "global_step": 61788, "epoch": 519, "lr": 4.4659186532254485e-06} +{"train_loss": 0.0002682983176782727, "global_step": 61789, "epoch": 519, "lr": 4.465003451150945e-06} +{"train_loss": 0.000809837831184268, "global_step": 61790, "epoch": 519, "lr": 4.464088338479549e-06} +{"train_loss": 0.000648862449452281, "global_step": 61791, "epoch": 519, "lr": 4.463173315213043e-06} +{"train_loss": 0.00032974471105262637, "global_step": 61792, "epoch": 519, "lr": 4.46225838135324e-06} +{"train_loss": 0.00026138522662222385, "global_step": 61793, "epoch": 519, "lr": 4.4613435369019185e-06} +{"train_loss": 0.0003110031539108604, "global_step": 61794, "epoch": 519, "lr": 4.460428781860898e-06} +{"train_loss": 0.0002644607156980783, "global_step": 61795, "epoch": 519, "lr": 4.459514116231955e-06} +{"train_loss": 0.0005437051295302808, "global_step": 61796, "epoch": 519, "lr": 4.4585995400168835e-06} +{"train_loss": 0.0004198907990939915, "global_step": 61797, "epoch": 519, "lr": 4.457685053217492e-06} +{"train_loss": 0.0002617494319565594, "global_step": 61798, "epoch": 519, "lr": 4.456770655835563e-06} +{"train_loss": 0.0004795807763002813, "global_step": 61799, "epoch": 519, "lr": 4.455856347872911e-06} +{"train_loss": 0.00040546254604123533, "global_step": 61800, "epoch": 519, "lr": 4.454942129331308e-06} +{"train_loss": 0.0003122097405139357, "global_step": 61801, "epoch": 519, "lr": 4.454028000212568e-06} +{"train_loss": 0.0002451775362715125, "global_step": 61802, "epoch": 519, "lr": 4.4531139605184845e-06} +{"train_loss": 0.0008025629795156419, "global_step": 61803, "epoch": 519, "lr": 4.452200010250829e-06} +{"train_loss": 0.0001542679383419454, "global_step": 61804, "epoch": 519, "lr": 4.4512861494114265e-06} +{"train_loss": 0.0006736303330399096, "global_step": 61805, "epoch": 519, "lr": 4.450372378002043e-06} +{"train_loss": 0.0002126527833752334, "global_step": 61806, "epoch": 519, "lr": 4.449458696024505e-06} +{"train_loss": 0.0005446106661111116, "global_step": 61807, "epoch": 519, "lr": 4.448545103480583e-06} +{"train_loss": 0.0005243861814960837, "global_step": 61808, "epoch": 519, "lr": 4.447631600372065e-06} +{"train_loss": 0.0005989668425172567, "global_step": 61809, "epoch": 519, "lr": 4.44671818670076e-06} +{"train_loss": 0.0001780186576070264, "global_step": 61810, "epoch": 519, "lr": 4.445804862468467e-06} +{"train_loss": 0.00045436230720952153, "global_step": 61811, "epoch": 519, "lr": 4.444891627676956e-06} +{"train_loss": 0.00022428572992794216, "global_step": 61812, "epoch": 519, "lr": 4.443978482328043e-06} +{"train_loss": 0.00042710232082754374, "global_step": 61813, "epoch": 519, "lr": 4.443065426423504e-06} +{"train_loss": 0.0002780685608740896, "global_step": 61814, "epoch": 519, "lr": 4.442152459965148e-06} +{"train_loss": 0.0004406261723488569, "global_step": 61815, "epoch": 519, "lr": 4.441239582954748e-06} +{"train_loss": 0.000380870362278074, "global_step": 61816, "epoch": 519, "lr": 4.440326795394117e-06} +{"train_loss": 0.0004205558798275888, "global_step": 61817, "epoch": 519, "lr": 4.4394140972850325e-06} +{"train_loss": 0.0004350590461399406, "global_step": 61818, "epoch": 519, "lr": 4.438501488629293e-06} +{"train_loss": 0.0007007213425822556, "global_step": 61819, "epoch": 519, "lr": 4.437588969428686e-06} +{"train_loss": 0.00041220910497941077, "global_step": 61820, "epoch": 519, "lr": 4.436676539685008e-06} +{"train_loss": 0.00020793134171981364, "global_step": 61821, "epoch": 519, "lr": 4.43576419940005e-06} +{"train_loss": 0.0006930941017344594, "global_step": 61822, "epoch": 519, "lr": 4.434851948575591e-06} +{"train_loss": 0.00046309910248965025, "global_step": 61823, "epoch": 519, "lr": 4.433939787213443e-06} +{"train_loss": 0.0009485681657679379, "global_step": 61824, "epoch": 519, "lr": 4.43302771531538e-06} +{"train_loss": 0.000321942672599107, "global_step": 61825, "epoch": 519, "lr": 4.432115732883202e-06} +{"train_loss": 0.00033650349359959364, "global_step": 61826, "epoch": 519, "lr": 4.431203839918701e-06} +{"train_loss": 0.00029968531453050673, "global_step": 61827, "epoch": 519, "lr": 4.43029203642365e-06} +{"train_loss": 0.00026076548965647817, "global_step": 61828, "epoch": 519, "lr": 4.429380322399867e-06} +{"train_loss": 0.0004490118008106947, "global_step": 61829, "epoch": 519, "lr": 4.428468697849114e-06} +{"train_loss": 0.00037240952951833606, "global_step": 61830, "epoch": 519, "lr": 4.427557162773205e-06} +{"train_loss": 0.0002929503680206835, "global_step": 61831, "epoch": 519, "lr": 4.426645717173911e-06} +{"train_loss": 0.000370851659681648, "global_step": 61832, "epoch": 519, "lr": 4.4257343610530355e-06} +{"train_loss": 0.00030871416674926877, "global_step": 61833, "epoch": 519, "lr": 4.4248230944123616e-06} +{"train_loss": 0.00048700475599616766, "global_step": 61834, "epoch": 519, "lr": 4.42391191725367e-06} +{"train_loss": 0.0002521351270843297, "global_step": 61835, "epoch": 519, "lr": 4.423000829578766e-06} +{"train_loss": 0.00025505165103822947, "global_step": 61836, "epoch": 519, "lr": 4.4220898313894256e-06} +{"train_loss": 0.00030523299938067794, "global_step": 61837, "epoch": 519, "lr": 4.4211789226874465e-06} +{"train_loss": 0.00036324310349300504, "global_step": 61838, "epoch": 519, "lr": 4.420268103474617e-06} +{"train_loss": 0.0002592112577985972, "global_step": 61839, "epoch": 519, "lr": 4.419357373752714e-06} +{"train_loss": 0.0005379071226343513, "global_step": 61840, "epoch": 519, "lr": 4.418446733523535e-06} +{"train_loss": 0.0005502478452399373, "global_step": 61841, "epoch": 519, "lr": 4.417536182788862e-06} +{"train_loss": 0.0003983390342909843, "global_step": 61842, "epoch": 519, "lr": 4.416625721550499e-06} +{"train_loss": 0.0003615930036175996, "global_step": 61843, "epoch": 519, "lr": 4.415715349810207e-06} +{"train_loss": 0.00022567377891391516, "global_step": 61844, "epoch": 519, "lr": 4.4148050675697935e-06} +{"train_loss": 0.0006407024338841438, "global_step": 61845, "epoch": 519, "lr": 4.413894874831043e-06} +{"train_loss": 0.0006341527914628386, "global_step": 61846, "epoch": 519, "lr": 4.412984771595735e-06} +{"train_loss": 0.000430309068178758, "global_step": 61847, "epoch": 519, "lr": 4.41207475786567e-06} +{"train_loss": 0.0003063410986214876, "global_step": 61848, "epoch": 519, "lr": 4.411164833642612e-06} +{"train_loss": 0.0003798324032686651, "global_step": 61849, "epoch": 519, "lr": 4.410254998928376e-06} +{"train_loss": 0.00036444023135118186, "global_step": 61850, "epoch": 519, "lr": 4.409345253724722e-06} +{"train_loss": 0.00029389336123131216, "global_step": 61851, "epoch": 519, "lr": 4.408435598033461e-06} +{"train_loss": 0.0002204531047027558, "global_step": 61852, "epoch": 519, "lr": 4.407526031856363e-06} +{"train_loss": 0.0008036473300307989, "global_step": 61853, "epoch": 519, "lr": 4.406616555195203e-06} +{"train_loss": 0.00032437534537166357, "global_step": 61854, "epoch": 519, "lr": 4.405707168051798e-06} +{"train_loss": 0.0005274387076497078, "global_step": 61855, "epoch": 519, "lr": 4.404797870427901e-06} +{"train_loss": 0.0006370773771777749, "global_step": 61856, "epoch": 519, "lr": 4.4038886623253225e-06} +{"train_loss": 0.0002802143862936646, "global_step": 61857, "epoch": 519, "lr": 4.402979543745839e-06} +{"train_loss": 0.00048348502605222166, "global_step": 61858, "epoch": 519, "lr": 4.402070514691226e-06} +{"train_loss": 0.0005842268001288176, "global_step": 61859, "epoch": 519, "lr": 4.401161575163282e-06} +{"train_loss": 0.0005596759729087353, "global_step": 61860, "epoch": 519, "lr": 4.4002527251637784e-06} +{"train_loss": 0.00019456601876299828, "global_step": 61861, "epoch": 519, "lr": 4.399343964694513e-06} +{"train_loss": 0.00035364634823054075, "global_step": 61862, "epoch": 519, "lr": 4.398435293757258e-06} +{"train_loss": 0.00044664315646514297, "global_step": 61863, "epoch": 519, "lr": 4.397526712353811e-06} +{"train_loss": 0.0004591324832290411, "global_step": 61864, "epoch": 519, "lr": 4.396618220485954e-06} +{"train_loss": 0.0005494006909430027, "global_step": 61865, "epoch": 519, "lr": 4.395709818155447e-06} +{"train_loss": 0.0003113156126346439, "global_step": 61866, "epoch": 519, "lr": 4.394801505364104e-06} +{"train_loss": 0.00026463408721610904, "global_step": 61867, "epoch": 519, "lr": 4.3938932821136925e-06} +{"train_loss": 0.0004426398081704974, "global_step": 61868, "epoch": 519, "lr": 4.392985148406003e-06} +{"train_loss": 0.00032138096867129207, "global_step": 61869, "epoch": 519, "lr": 4.3920771042428086e-06} +{"train_loss": 0.000743640644941479, "global_step": 61870, "epoch": 519, "lr": 4.391169149625901e-06} +{"train_loss": 0.0004863979993388057, "global_step": 61871, "epoch": 519, "lr": 4.390261284557068e-06} +{"train_loss": 0.00062914117006585, "global_step": 61872, "epoch": 519, "lr": 4.389353509038069e-06} +{"train_loss": 0.00013895297888666391, "global_step": 61873, "epoch": 519, "lr": 4.388445823070714e-06} +{"train_loss": 0.00034658072399906814, "global_step": 61874, "epoch": 519, "lr": 4.3875382266567625e-06} +{"train_loss": 0.0003052634128835052, "global_step": 61875, "epoch": 519, "lr": 4.386630719798018e-06} +{"train_loss": 0.0003078483568970114, "global_step": 61876, "epoch": 519, "lr": 4.385723302496242e-06} +{"train_loss": 0.0004830013494938612, "global_step": 61877, "epoch": 519, "lr": 4.384815974753231e-06} +{"train_loss": 0.00021368375746533275, "global_step": 61878, "epoch": 519, "lr": 4.383908736570752e-06} +{"train_loss": 0.0004014954397194635, "global_step": 61879, "epoch": 519, "lr": 4.383001587950597e-06, "val_loss": 0.01699654385447502} +{"train_loss": 0.0005895071080885828, "global_step": 61880, "epoch": 520, "lr": 4.382094528894554e-06} +{"train_loss": 0.0005694206920452416, "global_step": 61881, "epoch": 520, "lr": 4.381187559404382e-06} +{"train_loss": 0.0002556414110586047, "global_step": 61882, "epoch": 520, "lr": 4.380280679481891e-06} +{"train_loss": 0.0002172838430851698, "global_step": 61883, "epoch": 520, "lr": 4.379373889128841e-06} +{"train_loss": 0.0003874773974530399, "global_step": 61884, "epoch": 520, "lr": 4.378467188347002e-06} +{"train_loss": 0.0004383905616123229, "global_step": 61885, "epoch": 520, "lr": 4.377560577138185e-06} +{"train_loss": 0.00042431059409864247, "global_step": 61886, "epoch": 520, "lr": 4.376654055504143e-06} +{"train_loss": 0.0005088824545964599, "global_step": 61887, "epoch": 520, "lr": 4.375747623446674e-06} +{"train_loss": 0.0004925547982566059, "global_step": 61888, "epoch": 520, "lr": 4.37484128096754e-06} +{"train_loss": 0.0004519357462413609, "global_step": 61889, "epoch": 520, "lr": 4.373935028068543e-06} +{"train_loss": 0.0002328003174625337, "global_step": 61890, "epoch": 520, "lr": 4.3730288647514495e-06} +{"train_loss": 0.00033085691393353045, "global_step": 61891, "epoch": 520, "lr": 4.372122791018029e-06} +{"train_loss": 0.0004290210781618953, "global_step": 61892, "epoch": 520, "lr": 4.371216806870082e-06} +{"train_loss": 0.0004748909268528223, "global_step": 61893, "epoch": 520, "lr": 4.370310912309367e-06} +{"train_loss": 0.0003508837544359267, "global_step": 61894, "epoch": 520, "lr": 4.369405107337682e-06} +{"train_loss": 0.00029276846908032894, "global_step": 61895, "epoch": 520, "lr": 4.368499391956793e-06} +{"train_loss": 0.0004555709601845592, "global_step": 61896, "epoch": 520, "lr": 4.3675937661684706e-06} +{"train_loss": 0.00018013527733273804, "global_step": 61897, "epoch": 520, "lr": 4.3666882299745135e-06} +{"train_loss": 0.00044943401007913053, "global_step": 61898, "epoch": 520, "lr": 4.365782783376676e-06} +{"train_loss": 0.0003761240222956985, "global_step": 61899, "epoch": 520, "lr": 4.364877426376762e-06} +{"train_loss": 0.00028468668460845947, "global_step": 61900, "epoch": 520, "lr": 4.363972158976526e-06} +{"train_loss": 0.000185004246304743, "global_step": 61901, "epoch": 520, "lr": 4.36306698117776e-06} +{"train_loss": 0.00037957783206366, "global_step": 61902, "epoch": 520, "lr": 4.362161892982242e-06} +{"train_loss": 0.00030772772151976824, "global_step": 61903, "epoch": 520, "lr": 4.3612568943917356e-06} +{"train_loss": 0.00031186226988211274, "global_step": 61904, "epoch": 520, "lr": 4.360351985408029e-06} +{"train_loss": 0.0005948061589151621, "global_step": 61905, "epoch": 520, "lr": 4.359447166032887e-06} +{"train_loss": 0.00023577276442665607, "global_step": 61906, "epoch": 520, "lr": 4.358542436268104e-06} +{"train_loss": 0.000311888346914202, "global_step": 61907, "epoch": 520, "lr": 4.357637796115444e-06} +{"train_loss": 0.0006001031142659485, "global_step": 61908, "epoch": 520, "lr": 4.356733245576688e-06} +{"train_loss": 0.00026269591762684286, "global_step": 61909, "epoch": 520, "lr": 4.355828784653604e-06} +{"train_loss": 0.00045419129310175776, "global_step": 61910, "epoch": 520, "lr": 4.354924413347983e-06} +{"train_loss": 0.0008255313732661307, "global_step": 61911, "epoch": 520, "lr": 4.354020131661579e-06} +{"train_loss": 0.00038093881448730826, "global_step": 61912, "epoch": 520, "lr": 4.353115939596192e-06} +{"train_loss": 0.0002947912726085633, "global_step": 61913, "epoch": 520, "lr": 4.352211837153575e-06} +{"train_loss": 0.00032879592617973685, "global_step": 61914, "epoch": 520, "lr": 4.351307824335521e-06} +{"train_loss": 0.0006156029994599521, "global_step": 61915, "epoch": 520, "lr": 4.35040390114379e-06} +{"train_loss": 0.000395662325900048, "global_step": 61916, "epoch": 520, "lr": 4.349500067580175e-06} +{"train_loss": 0.0003528448869474232, "global_step": 61917, "epoch": 520, "lr": 4.3485963236464255e-06} +{"train_loss": 0.000403811369324103, "global_step": 61918, "epoch": 520, "lr": 4.347692669344345e-06} +{"train_loss": 0.00042912852950394154, "global_step": 61919, "epoch": 520, "lr": 4.346789104675681e-06} +{"train_loss": 0.000353202543919906, "global_step": 61920, "epoch": 520, "lr": 4.345885629642227e-06} +{"train_loss": 0.0004410420951899141, "global_step": 61921, "epoch": 520, "lr": 4.344982244245749e-06} +{"train_loss": 0.0005291683482937515, "global_step": 61922, "epoch": 520, "lr": 4.344078948488012e-06} +{"train_loss": 0.00023783408687449992, "global_step": 61923, "epoch": 520, "lr": 4.343175742370809e-06} +{"train_loss": 0.00048458040691912174, "global_step": 61924, "epoch": 520, "lr": 4.342272625895893e-06} +{"train_loss": 0.0005416559870354831, "global_step": 61925, "epoch": 520, "lr": 4.34136959906506e-06} +{"train_loss": 0.0004213769279886037, "global_step": 61926, "epoch": 520, "lr": 4.340466661880066e-06} +{"train_loss": 0.00024398049572482705, "global_step": 61927, "epoch": 520, "lr": 4.339563814342673e-06} +{"train_loss": 0.0003948607773054391, "global_step": 61928, "epoch": 520, "lr": 4.3386610564546846e-06} +{"train_loss": 0.0002703510399442166, "global_step": 61929, "epoch": 520, "lr": 4.33775838821785e-06} +{"train_loss": 0.0006466400227509439, "global_step": 61930, "epoch": 520, "lr": 4.336855809633949e-06} +{"train_loss": 0.00017781958740670234, "global_step": 61931, "epoch": 520, "lr": 4.33595332070475e-06} +{"train_loss": 0.0001983410766115412, "global_step": 61932, "epoch": 520, "lr": 4.335050921432038e-06} +{"train_loss": 0.0003284828853793442, "global_step": 61933, "epoch": 520, "lr": 4.334148611817573e-06} +{"train_loss": 0.00029330700635910034, "global_step": 61934, "epoch": 520, "lr": 4.333246391863122e-06} +{"train_loss": 0.00035073820617981255, "global_step": 61935, "epoch": 520, "lr": 4.33234426157047e-06} +{"train_loss": 0.0006720829987898469, "global_step": 61936, "epoch": 520, "lr": 4.331442220941368e-06} +{"train_loss": 0.00046188972191885114, "global_step": 61937, "epoch": 520, "lr": 4.330540269977612e-06} +{"train_loss": 0.00047827200614847243, "global_step": 61938, "epoch": 520, "lr": 4.329638408680953e-06} +{"train_loss": 0.00043282299884594977, "global_step": 61939, "epoch": 520, "lr": 4.328736637053182e-06} +{"train_loss": 0.0002486482262611389, "global_step": 61940, "epoch": 520, "lr": 4.327834955096044e-06} +{"train_loss": 0.00024434749502688646, "global_step": 61941, "epoch": 520, "lr": 4.326933362811336e-06} +{"train_loss": 0.00035118445521220565, "global_step": 61942, "epoch": 520, "lr": 4.326031860200802e-06} +{"train_loss": 0.000394674192648381, "global_step": 61943, "epoch": 520, "lr": 4.325130447266235e-06} +{"train_loss": 0.0003123483620584011, "global_step": 61944, "epoch": 520, "lr": 4.324229124009383e-06} +{"train_loss": 0.00019345439795870334, "global_step": 61945, "epoch": 520, "lr": 4.323327890432038e-06} +{"train_loss": 0.00036538447602652013, "global_step": 61946, "epoch": 520, "lr": 4.322426746535951e-06} +{"train_loss": 0.00016563657845836133, "global_step": 61947, "epoch": 520, "lr": 4.321525692322909e-06} +{"train_loss": 0.00038945444975979626, "global_step": 61948, "epoch": 520, "lr": 4.3206247277946645e-06} +{"train_loss": 0.0003456665435805917, "global_step": 61949, "epoch": 520, "lr": 4.319723852952995e-06} +{"train_loss": 0.00028778929845429957, "global_step": 61950, "epoch": 520, "lr": 4.318823067799665e-06} +{"train_loss": 0.0005674121202901006, "global_step": 61951, "epoch": 520, "lr": 4.3179223723364525e-06} +{"train_loss": 0.00036903482396155596, "global_step": 61952, "epoch": 520, "lr": 4.317021766565116e-06} +{"train_loss": 0.0005845798877999187, "global_step": 61953, "epoch": 520, "lr": 4.316121250487421e-06} +{"train_loss": 0.0002472504274919629, "global_step": 61954, "epoch": 520, "lr": 4.315220824105148e-06} +{"train_loss": 0.00028674339409917593, "global_step": 61955, "epoch": 520, "lr": 4.314320487420054e-06} +{"train_loss": 0.0003688409342430532, "global_step": 61956, "epoch": 520, "lr": 4.313420240433919e-06} +{"train_loss": 0.0004009122203569859, "global_step": 61957, "epoch": 520, "lr": 4.312520083148497e-06} +{"train_loss": 0.000462259107735008, "global_step": 61958, "epoch": 520, "lr": 4.3116200155655535e-06} +{"train_loss": 0.000551955250557512, "global_step": 61959, "epoch": 520, "lr": 4.3107200376868775e-06} +{"train_loss": 0.00016672916535753757, "global_step": 61960, "epoch": 520, "lr": 4.309820149514204e-06} +{"train_loss": 0.00037027645157650113, "global_step": 61961, "epoch": 520, "lr": 4.308920351049334e-06} +{"train_loss": 0.0003839920391328633, "global_step": 61962, "epoch": 520, "lr": 4.308020642294003e-06} +{"train_loss": 0.0002535328676458448, "global_step": 61963, "epoch": 520, "lr": 4.307121023250005e-06} +{"train_loss": 0.00019374580006115139, "global_step": 61964, "epoch": 520, "lr": 4.306221493919094e-06} +{"train_loss": 0.00036728495615534484, "global_step": 61965, "epoch": 520, "lr": 4.305322054303023e-06} +{"train_loss": 0.0003039782459381968, "global_step": 61966, "epoch": 520, "lr": 4.304422704403582e-06} +{"train_loss": 0.0004116016789339483, "global_step": 61967, "epoch": 520, "lr": 4.3035234442225125e-06} +{"train_loss": 0.00022788871137890965, "global_step": 61968, "epoch": 520, "lr": 4.3026242737616075e-06} +{"train_loss": 0.00027586883516050875, "global_step": 61969, "epoch": 520, "lr": 4.301725193022604e-06} +{"train_loss": 0.0002904603024944663, "global_step": 61970, "epoch": 520, "lr": 4.300826202007291e-06} +{"train_loss": 0.00035404195659793913, "global_step": 61971, "epoch": 520, "lr": 4.299927300717421e-06} +{"train_loss": 0.0003534237330313772, "global_step": 61972, "epoch": 520, "lr": 4.299028489154755e-06} +{"train_loss": 0.0006420112331397831, "global_step": 61973, "epoch": 520, "lr": 4.298129767321074e-06} +{"train_loss": 0.0006055405247025192, "global_step": 61974, "epoch": 520, "lr": 4.297231135218121e-06} +{"train_loss": 0.0003537486190907657, "global_step": 61975, "epoch": 520, "lr": 4.2963325928476796e-06} +{"train_loss": 0.0004312254022806883, "global_step": 61976, "epoch": 520, "lr": 4.295434140211507e-06} +{"train_loss": 0.0002996963157784194, "global_step": 61977, "epoch": 520, "lr": 4.294535777311359e-06} +{"train_loss": 0.0002788343990687281, "global_step": 61978, "epoch": 520, "lr": 4.293637504149017e-06} +{"train_loss": 0.00023744150530546904, "global_step": 61979, "epoch": 520, "lr": 4.29273932072623e-06} +{"train_loss": 0.0006693876930512488, "global_step": 61980, "epoch": 520, "lr": 4.291841227044768e-06} +{"train_loss": 0.00030424364376813173, "global_step": 61981, "epoch": 520, "lr": 4.290943223106392e-06} +{"train_loss": 0.000480616552522406, "global_step": 61982, "epoch": 520, "lr": 4.290045308912865e-06} +{"train_loss": 0.0002041562256636098, "global_step": 61983, "epoch": 520, "lr": 4.289147484465955e-06} +{"train_loss": 0.0007502256776206195, "global_step": 61984, "epoch": 520, "lr": 4.288249749767414e-06} +{"train_loss": 0.00017500536341685802, "global_step": 61985, "epoch": 520, "lr": 4.2873521048190204e-06} +{"train_loss": 0.00027458506519906223, "global_step": 61986, "epoch": 520, "lr": 4.286454549622515e-06} +{"train_loss": 0.0002596007543615997, "global_step": 61987, "epoch": 520, "lr": 4.285557084179681e-06} +{"train_loss": 0.0006754666101187468, "global_step": 61988, "epoch": 520, "lr": 4.2846597084922614e-06} +{"train_loss": 0.00020928685262333602, "global_step": 61989, "epoch": 520, "lr": 4.2837624225620434e-06} +{"train_loss": 0.0002516060194466263, "global_step": 61990, "epoch": 520, "lr": 4.28286522639077e-06} +{"train_loss": 0.0006962916231714189, "global_step": 61991, "epoch": 520, "lr": 4.281968119980195e-06} +{"train_loss": 0.00020098479581065476, "global_step": 61992, "epoch": 520, "lr": 4.2810711033321075e-06} +{"train_loss": 0.00022443130728788674, "global_step": 61993, "epoch": 520, "lr": 4.280174176448238e-06} +{"train_loss": 0.00017849757568910718, "global_step": 61994, "epoch": 520, "lr": 4.279277339330373e-06} +{"train_loss": 0.00044849052210338414, "global_step": 61995, "epoch": 520, "lr": 4.278380591980264e-06} +{"train_loss": 0.00037011338281445205, "global_step": 61996, "epoch": 520, "lr": 4.277483934399656e-06} +{"train_loss": 0.00025439279852434993, "global_step": 61997, "epoch": 520, "lr": 4.2765873665903345e-06} +{"train_loss": 0.00038176399551453303, "global_step": 61998, "epoch": 520, "lr": 4.27569088855404e-06, "val_loss": 0.016495438292622566, "train_action_mse_error": 3.957329681725241e-06} +{"train_loss": 0.00021210004342719913, "global_step": 61999, "epoch": 521, "lr": 4.274794500292551e-06} +{"train_loss": 0.0004936835030093789, "global_step": 62000, "epoch": 521, "lr": 4.273898201807613e-06} +{"train_loss": 0.00034294312354177237, "global_step": 62001, "epoch": 521, "lr": 4.273001993100995e-06} +{"train_loss": 0.0002753825392574072, "global_step": 62002, "epoch": 521, "lr": 4.272105874174453e-06} +{"train_loss": 0.0002096673269988969, "global_step": 62003, "epoch": 521, "lr": 4.271209845029739e-06} +{"train_loss": 0.00025477749295532703, "global_step": 62004, "epoch": 521, "lr": 4.270313905668627e-06} +{"train_loss": 0.0006222327356226742, "global_step": 62005, "epoch": 521, "lr": 4.2694180560928556e-06} +{"train_loss": 0.0005389360012486577, "global_step": 62006, "epoch": 521, "lr": 4.268522296304211e-06} +{"train_loss": 0.0003704346308950335, "global_step": 62007, "epoch": 521, "lr": 4.267626626304422e-06} +{"train_loss": 0.00031621631933376193, "global_step": 62008, "epoch": 521, "lr": 4.266731046095274e-06} +{"train_loss": 0.0008987047476693988, "global_step": 62009, "epoch": 521, "lr": 4.26583555567851e-06} +{"train_loss": 0.0004228484758641571, "global_step": 62010, "epoch": 521, "lr": 4.264940155055891e-06} +{"train_loss": 0.0006323272245936096, "global_step": 62011, "epoch": 521, "lr": 4.2640448442291756e-06} +{"train_loss": 0.0005822770181111991, "global_step": 62012, "epoch": 521, "lr": 4.263149623200119e-06} +{"train_loss": 0.00026452328893356025, "global_step": 62013, "epoch": 521, "lr": 4.2622544919704906e-06} +{"train_loss": 0.00018583495693746954, "global_step": 62014, "epoch": 521, "lr": 4.2613594505420406e-06} +{"train_loss": 0.00017734550056047738, "global_step": 62015, "epoch": 521, "lr": 4.260464498916511e-06} +{"train_loss": 0.00039838041993789375, "global_step": 62016, "epoch": 521, "lr": 4.259569637095684e-06} +{"train_loss": 0.00023435137700289488, "global_step": 62017, "epoch": 521, "lr": 4.258674865081297e-06} +{"train_loss": 0.00025935028679668903, "global_step": 62018, "epoch": 521, "lr": 4.257780182875126e-06} +{"train_loss": 0.0004235701053403318, "global_step": 62019, "epoch": 521, "lr": 4.256885590478909e-06} +{"train_loss": 0.0005777952610515058, "global_step": 62020, "epoch": 521, "lr": 4.255991087894418e-06} +{"train_loss": 0.00035030575236305594, "global_step": 62021, "epoch": 521, "lr": 4.255096675123399e-06} +{"train_loss": 0.00043805138557218015, "global_step": 62022, "epoch": 521, "lr": 4.254202352167602e-06} +{"train_loss": 0.0003207409754395485, "global_step": 62023, "epoch": 521, "lr": 4.253308119028798e-06} +{"train_loss": 0.0003039954463019967, "global_step": 62024, "epoch": 521, "lr": 4.25241397570873e-06} +{"train_loss": 0.00044595380313694477, "global_step": 62025, "epoch": 521, "lr": 4.251519922209169e-06} +{"train_loss": 0.00030322218663059175, "global_step": 62026, "epoch": 521, "lr": 4.250625958531862e-06} +{"train_loss": 0.0003466125053819269, "global_step": 62027, "epoch": 521, "lr": 4.249732084678554e-06} +{"train_loss": 0.00022067438112571836, "global_step": 62028, "epoch": 521, "lr": 4.2488383006510205e-06} +{"train_loss": 0.0001621614646865055, "global_step": 62029, "epoch": 521, "lr": 4.247944606450993e-06} +{"train_loss": 0.00020232579845469445, "global_step": 62030, "epoch": 521, "lr": 4.247051002080249e-06} +{"train_loss": 0.000423663790570572, "global_step": 62031, "epoch": 521, "lr": 4.246157487540519e-06} +{"train_loss": 0.0003310329921077937, "global_step": 62032, "epoch": 521, "lr": 4.245264062833581e-06} +{"train_loss": 0.00019019623869098723, "global_step": 62033, "epoch": 521, "lr": 4.244370727961183e-06} +{"train_loss": 0.0003344731230754405, "global_step": 62034, "epoch": 521, "lr": 4.243477482925062e-06} +{"train_loss": 0.0001694710663286969, "global_step": 62035, "epoch": 521, "lr": 4.242584327727e-06} +{"train_loss": 0.00033937065745703876, "global_step": 62036, "epoch": 521, "lr": 4.241691262368719e-06} +{"train_loss": 0.0001849014952313155, "global_step": 62037, "epoch": 521, "lr": 4.240798286851999e-06} +{"train_loss": 0.00034736504312604666, "global_step": 62038, "epoch": 521, "lr": 4.2399054011785785e-06} +{"train_loss": 0.0003829469787888229, "global_step": 62039, "epoch": 521, "lr": 4.239012605350218e-06} +{"train_loss": 0.0004052086442243308, "global_step": 62040, "epoch": 521, "lr": 4.238119899368665e-06} +{"train_loss": 0.0004262372967787087, "global_step": 62041, "epoch": 521, "lr": 4.237227283235678e-06} +{"train_loss": 0.0004146867722738534, "global_step": 62042, "epoch": 521, "lr": 4.2363347569529975e-06} +{"train_loss": 0.00016738049453124404, "global_step": 62043, "epoch": 521, "lr": 4.235442320522393e-06} +{"train_loss": 0.00041399532346986234, "global_step": 62044, "epoch": 521, "lr": 4.234549973945601e-06} +{"train_loss": 0.00024578673765063286, "global_step": 62045, "epoch": 521, "lr": 4.233657717224393e-06} +{"train_loss": 0.0002787229896057397, "global_step": 62046, "epoch": 521, "lr": 4.232765550360496e-06} +{"train_loss": 0.00033951917430385947, "global_step": 62047, "epoch": 521, "lr": 4.231873473355685e-06} +{"train_loss": 0.00019784893083851784, "global_step": 62048, "epoch": 521, "lr": 4.230981486211688e-06} +{"train_loss": 0.0002677039010450244, "global_step": 62049, "epoch": 521, "lr": 4.2300895889302805e-06} +{"train_loss": 0.0006803398719057441, "global_step": 62050, "epoch": 521, "lr": 4.229197781513195e-06} +{"train_loss": 0.00040267957956530154, "global_step": 62051, "epoch": 521, "lr": 4.228306063962195e-06} +{"train_loss": 0.00026659711147658527, "global_step": 62052, "epoch": 521, "lr": 4.227414436279031e-06} +{"train_loss": 0.00027551865787245333, "global_step": 62053, "epoch": 521, "lr": 4.226522898465434e-06} +{"train_loss": 0.00036530225770547986, "global_step": 62054, "epoch": 521, "lr": 4.225631450523188e-06} +{"train_loss": 0.00021194404689595103, "global_step": 62055, "epoch": 521, "lr": 4.224740092454005e-06} +{"train_loss": 0.0003809166664723307, "global_step": 62056, "epoch": 521, "lr": 4.223848824259668e-06} +{"train_loss": 0.00017710024258121848, "global_step": 62057, "epoch": 521, "lr": 4.222957645941905e-06} +{"train_loss": 0.0002768328122328967, "global_step": 62058, "epoch": 521, "lr": 4.22206655750248e-06} +{"train_loss": 0.0002087164029944688, "global_step": 62059, "epoch": 521, "lr": 4.221175558943136e-06} +{"train_loss": 0.00029782485216856003, "global_step": 62060, "epoch": 521, "lr": 4.220284650265621e-06} +{"train_loss": 0.000389549823012203, "global_step": 62061, "epoch": 521, "lr": 4.219393831471691e-06} +{"train_loss": 0.0003829569322988391, "global_step": 62062, "epoch": 521, "lr": 4.218503102563076e-06} +{"train_loss": 0.00027976924320682883, "global_step": 62063, "epoch": 521, "lr": 4.217612463541554e-06} +{"train_loss": 0.0005247308872640133, "global_step": 62064, "epoch": 521, "lr": 4.216721914408861e-06} +{"train_loss": 0.0003420162829570472, "global_step": 62065, "epoch": 521, "lr": 4.21583145516673e-06} +{"train_loss": 0.00028609918081201613, "global_step": 62066, "epoch": 521, "lr": 4.214941085816931e-06} +{"train_loss": 0.00062093063024804, "global_step": 62067, "epoch": 521, "lr": 4.214050806361197e-06} +{"train_loss": 0.00039558979915454984, "global_step": 62068, "epoch": 521, "lr": 4.213160616801292e-06} +{"train_loss": 0.0001860374177340418, "global_step": 62069, "epoch": 521, "lr": 4.212270517138944e-06} +{"train_loss": 0.0005246664513833821, "global_step": 62070, "epoch": 521, "lr": 4.211380507375923e-06} +{"train_loss": 0.000276318343821913, "global_step": 62071, "epoch": 521, "lr": 4.21049058751396e-06} +{"train_loss": 0.0002670707763172686, "global_step": 62072, "epoch": 521, "lr": 4.209600757554799e-06} +{"train_loss": 0.0004128038708586246, "global_step": 62073, "epoch": 521, "lr": 4.2087110175002e-06} +{"train_loss": 0.00015060012810863554, "global_step": 62074, "epoch": 521, "lr": 4.207821367351911e-06} +{"train_loss": 0.0003299586824141443, "global_step": 62075, "epoch": 521, "lr": 4.206931807111658e-06} +{"train_loss": 0.0011979466071352363, "global_step": 62076, "epoch": 521, "lr": 4.206042336781219e-06} +{"train_loss": 0.00021438219118863344, "global_step": 62077, "epoch": 521, "lr": 4.2051529563623124e-06} +{"train_loss": 0.00030700949719175696, "global_step": 62078, "epoch": 521, "lr": 4.2042636658567005e-06} +{"train_loss": 0.00020509921887423843, "global_step": 62079, "epoch": 521, "lr": 4.2033744652661186e-06} +{"train_loss": 0.0003778665268328041, "global_step": 62080, "epoch": 521, "lr": 4.2024853545923285e-06} +{"train_loss": 0.0001778604491846636, "global_step": 62081, "epoch": 521, "lr": 4.201596333837055e-06} +{"train_loss": 0.0002683976199477911, "global_step": 62082, "epoch": 521, "lr": 4.2007074030020635e-06} +{"train_loss": 0.000463625299744308, "global_step": 62083, "epoch": 521, "lr": 4.199818562089086e-06} +{"train_loss": 0.0003234379692003131, "global_step": 62084, "epoch": 521, "lr": 4.198929811099872e-06} +{"train_loss": 0.00030001995037309825, "global_step": 62085, "epoch": 521, "lr": 4.198041150036169e-06} +{"train_loss": 0.00022010522661730647, "global_step": 62086, "epoch": 521, "lr": 4.19715257889971e-06} +{"train_loss": 0.0005398158682510257, "global_step": 62087, "epoch": 521, "lr": 4.196264097692259e-06} +{"train_loss": 0.0001996009232243523, "global_step": 62088, "epoch": 521, "lr": 4.1953757064155385e-06} +{"train_loss": 0.00021755283523816615, "global_step": 62089, "epoch": 521, "lr": 4.194487405071318e-06} +{"train_loss": 0.0002887170703615993, "global_step": 62090, "epoch": 521, "lr": 4.193599193661324e-06} +{"train_loss": 0.0002448921441100538, "global_step": 62091, "epoch": 521, "lr": 4.192711072187294e-06} +{"train_loss": 0.00029818102484568954, "global_step": 62092, "epoch": 521, "lr": 4.191823040650994e-06} +{"train_loss": 0.0001753328542690724, "global_step": 62093, "epoch": 521, "lr": 4.1909350990541495e-06} +{"train_loss": 0.0002805550757329911, "global_step": 62094, "epoch": 521, "lr": 4.190047247398515e-06} +{"train_loss": 0.0007204866269603372, "global_step": 62095, "epoch": 521, "lr": 4.189159485685828e-06} +{"train_loss": 0.00031092591234482825, "global_step": 62096, "epoch": 521, "lr": 4.1882718139178215e-06} +{"train_loss": 0.0005505034932866693, "global_step": 62097, "epoch": 521, "lr": 4.187384232096264e-06} +{"train_loss": 0.0005312236025929451, "global_step": 62098, "epoch": 521, "lr": 4.186496740222873e-06} +{"train_loss": 0.0002639897575136274, "global_step": 62099, "epoch": 521, "lr": 4.185609338299407e-06} +{"train_loss": 0.00020552209753077477, "global_step": 62100, "epoch": 521, "lr": 4.1847220263275925e-06} +{"train_loss": 0.0005100978305563331, "global_step": 62101, "epoch": 521, "lr": 4.183834804309194e-06} +{"train_loss": 0.00021758434013463557, "global_step": 62102, "epoch": 521, "lr": 4.182947672245941e-06} +{"train_loss": 0.0002775734174065292, "global_step": 62103, "epoch": 521, "lr": 4.182060630139561e-06} +{"train_loss": 0.00022462962078861892, "global_step": 62104, "epoch": 521, "lr": 4.181173677991829e-06} +{"train_loss": 0.00023410691937897354, "global_step": 62105, "epoch": 521, "lr": 4.1802868158044515e-06} +{"train_loss": 0.0003563827776815742, "global_step": 62106, "epoch": 521, "lr": 4.179400043579196e-06} +{"train_loss": 0.0004230531048960984, "global_step": 62107, "epoch": 521, "lr": 4.178513361317782e-06} +{"train_loss": 0.0002976128307636827, "global_step": 62108, "epoch": 521, "lr": 4.177626769021964e-06} +{"train_loss": 0.00018883247685153037, "global_step": 62109, "epoch": 521, "lr": 4.176740266693491e-06} +{"train_loss": 0.00022110607824288309, "global_step": 62110, "epoch": 521, "lr": 4.175853854334083e-06} +{"train_loss": 0.000468619866296649, "global_step": 62111, "epoch": 521, "lr": 4.1749675319455004e-06} +{"train_loss": 0.0004216344386804849, "global_step": 62112, "epoch": 521, "lr": 4.174081299529465e-06} +{"train_loss": 0.0003730584285221994, "global_step": 62113, "epoch": 521, "lr": 4.173195157087728e-06} +{"train_loss": 0.0005830684094689786, "global_step": 62114, "epoch": 521, "lr": 4.1723091046220295e-06} +{"train_loss": 0.00045929604675620794, "global_step": 62115, "epoch": 521, "lr": 4.171423142134101e-06} +{"train_loss": 0.0002793322200886905, "global_step": 62116, "epoch": 521, "lr": 4.17053726962569e-06} +{"train_loss": 0.00034743751276444893, "global_step": 62117, "epoch": 521, "lr": 4.16965148709853e-06, "val_loss": 0.014571852050721645} +{"train_loss": 0.000196609427803196, "global_step": 62118, "epoch": 522, "lr": 4.168765794554369e-06} +{"train_loss": 0.0002922241692431271, "global_step": 62119, "epoch": 522, "lr": 4.167880191994933e-06} +{"train_loss": 0.0003013685345649719, "global_step": 62120, "epoch": 522, "lr": 4.166994679421976e-06} +{"train_loss": 0.0004496746987570077, "global_step": 62121, "epoch": 522, "lr": 4.1661092568372255e-06} +{"train_loss": 0.0002455870562698692, "global_step": 62122, "epoch": 522, "lr": 4.165223924242418e-06} +{"train_loss": 0.00017996081442106515, "global_step": 62123, "epoch": 522, "lr": 4.164338681639302e-06} +{"train_loss": 0.00032815293525345623, "global_step": 62124, "epoch": 522, "lr": 4.163453529029604e-06} +{"train_loss": 0.000416531169321388, "global_step": 62125, "epoch": 522, "lr": 4.162568466415074e-06} +{"train_loss": 0.0006021651206538081, "global_step": 62126, "epoch": 522, "lr": 4.161683493797435e-06} +{"train_loss": 0.00022656501096207649, "global_step": 62127, "epoch": 522, "lr": 4.1607986111784455e-06} +{"train_loss": 0.00022733790683560073, "global_step": 62128, "epoch": 522, "lr": 4.15991381855983e-06} +{"train_loss": 0.00025537164765410125, "global_step": 62129, "epoch": 522, "lr": 4.159029115943314e-06} +{"train_loss": 0.00030054207309149206, "global_step": 62130, "epoch": 522, "lr": 4.158144503330657e-06} +{"train_loss": 0.00019254117796663195, "global_step": 62131, "epoch": 522, "lr": 4.157259980723582e-06} +{"train_loss": 0.00028713810024783015, "global_step": 62132, "epoch": 522, "lr": 4.156375548123831e-06} +{"train_loss": 0.0004579344531521201, "global_step": 62133, "epoch": 522, "lr": 4.155491205533147e-06} +{"train_loss": 0.00042837890214286745, "global_step": 62134, "epoch": 522, "lr": 4.154606952953244e-06} +{"train_loss": 0.0002577179402578622, "global_step": 62135, "epoch": 522, "lr": 4.153722790385883e-06} +{"train_loss": 0.0003083948977291584, "global_step": 62136, "epoch": 522, "lr": 4.15283871783278e-06} +{"train_loss": 0.00022260399418883026, "global_step": 62137, "epoch": 522, "lr": 4.151954735295687e-06} +{"train_loss": 0.0001924537937156856, "global_step": 62138, "epoch": 522, "lr": 4.1510708427763276e-06} +{"train_loss": 0.000276535953162238, "global_step": 62139, "epoch": 522, "lr": 4.150187040276449e-06} +{"train_loss": 0.00026188671472482383, "global_step": 62140, "epoch": 522, "lr": 4.149303327797771e-06} +{"train_loss": 0.00045086638419888914, "global_step": 62141, "epoch": 522, "lr": 4.1484197053420435e-06} +{"train_loss": 0.00041371554834768176, "global_step": 62142, "epoch": 522, "lr": 4.147536172910993e-06} +{"train_loss": 0.0002737388713285327, "global_step": 62143, "epoch": 522, "lr": 4.146652730506351e-06} +{"train_loss": 0.00030572712421417236, "global_step": 62144, "epoch": 522, "lr": 4.145769378129871e-06} +{"train_loss": 0.00025320288841612637, "global_step": 62145, "epoch": 522, "lr": 4.14488611578327e-06} +{"train_loss": 0.000325348082697019, "global_step": 62146, "epoch": 522, "lr": 4.144002943468278e-06} +{"train_loss": 0.00024441356072202325, "global_step": 62147, "epoch": 522, "lr": 4.143119861186645e-06} +{"train_loss": 0.00032293665572069585, "global_step": 62148, "epoch": 522, "lr": 4.142236868940092e-06} +{"train_loss": 0.0004310729564167559, "global_step": 62149, "epoch": 522, "lr": 4.141353966730366e-06} +{"train_loss": 0.0003614006855059415, "global_step": 62150, "epoch": 522, "lr": 4.140471154559184e-06} +{"train_loss": 0.00027322195819579065, "global_step": 62151, "epoch": 522, "lr": 4.139588432428293e-06} +{"train_loss": 0.00026547940797172487, "global_step": 62152, "epoch": 522, "lr": 4.138705800339421e-06} +{"train_loss": 0.0003315548528917134, "global_step": 62153, "epoch": 522, "lr": 4.137823258294293e-06} +{"train_loss": 0.00034304874134249985, "global_step": 62154, "epoch": 522, "lr": 4.136940806294659e-06} +{"train_loss": 0.00019507012621033937, "global_step": 62155, "epoch": 522, "lr": 4.136058444342233e-06} +{"train_loss": 0.0005941201816312969, "global_step": 62156, "epoch": 522, "lr": 4.135176172438765e-06} +{"train_loss": 0.00045778744970448315, "global_step": 62157, "epoch": 522, "lr": 4.134293990585969e-06} +{"train_loss": 0.00030496830004267395, "global_step": 62158, "epoch": 522, "lr": 4.133411898785594e-06} +{"train_loss": 0.0002882842964027077, "global_step": 62159, "epoch": 522, "lr": 4.132529897039367e-06} +{"train_loss": 0.0001988866424653679, "global_step": 62160, "epoch": 522, "lr": 4.1316479853490134e-06} +{"train_loss": 0.0002798292553052306, "global_step": 62161, "epoch": 522, "lr": 4.130766163716271e-06} +{"train_loss": 0.00047903915401548147, "global_step": 62162, "epoch": 522, "lr": 4.129884432142861e-06} +{"train_loss": 0.0003780894330702722, "global_step": 62163, "epoch": 522, "lr": 4.129002790630532e-06} +{"train_loss": 0.00040019475272856653, "global_step": 62164, "epoch": 522, "lr": 4.128121239181004e-06} +{"train_loss": 0.00034197221975773573, "global_step": 62165, "epoch": 522, "lr": 4.127239777795999e-06} +{"train_loss": 0.0008865987765602767, "global_step": 62166, "epoch": 522, "lr": 4.126358406477271e-06} +{"train_loss": 0.0002991235814988613, "global_step": 62167, "epoch": 522, "lr": 4.125477125226529e-06} +{"train_loss": 0.0003389374469406903, "global_step": 62168, "epoch": 522, "lr": 4.124595934045516e-06} +{"train_loss": 0.0006003350135870278, "global_step": 62169, "epoch": 522, "lr": 4.123714832935949e-06} +{"train_loss": 0.0003812127106357366, "global_step": 62170, "epoch": 522, "lr": 4.12283382189958e-06} +{"train_loss": 0.0002850097371265292, "global_step": 62171, "epoch": 522, "lr": 4.121952900938114e-06} +{"train_loss": 0.0009604929946362972, "global_step": 62172, "epoch": 522, "lr": 4.1210720700533e-06} +{"train_loss": 0.00023565476294606924, "global_step": 62173, "epoch": 522, "lr": 4.120191329246853e-06} +{"train_loss": 0.00025945258676074445, "global_step": 62174, "epoch": 522, "lr": 4.119310678520516e-06} +{"train_loss": 0.00034279172541573644, "global_step": 62175, "epoch": 522, "lr": 4.118430117876004e-06} +{"train_loss": 0.0002638667938299477, "global_step": 62176, "epoch": 522, "lr": 4.117549647315061e-06} +{"train_loss": 0.0002483700809534639, "global_step": 62177, "epoch": 522, "lr": 4.116669266839396e-06} +{"train_loss": 0.0005637923604808748, "global_step": 62178, "epoch": 522, "lr": 4.115788976450763e-06} +{"train_loss": 0.0004011275595985353, "global_step": 62179, "epoch": 522, "lr": 4.114908776150861e-06} +{"train_loss": 0.0002446628059260547, "global_step": 62180, "epoch": 522, "lr": 4.114028665941449e-06} +{"train_loss": 0.0005546444444917142, "global_step": 62181, "epoch": 522, "lr": 4.113148645824227e-06} +{"train_loss": 0.00031815856345929205, "global_step": 62182, "epoch": 522, "lr": 4.112268715800943e-06} +{"train_loss": 0.0004242976719979197, "global_step": 62183, "epoch": 522, "lr": 4.111388875873318e-06} +{"train_loss": 0.00018566900689620525, "global_step": 62184, "epoch": 522, "lr": 4.110509126043072e-06} +{"train_loss": 0.0002978667034767568, "global_step": 62185, "epoch": 522, "lr": 4.109629466311943e-06} +{"train_loss": 0.00019775042892433703, "global_step": 62186, "epoch": 522, "lr": 4.108749896681652e-06} +{"train_loss": 0.00028060763725079596, "global_step": 62187, "epoch": 522, "lr": 4.10787041715393e-06} +{"train_loss": 0.00028018082957714796, "global_step": 62188, "epoch": 522, "lr": 4.106991027730494e-06} +{"train_loss": 0.0007066523539833724, "global_step": 62189, "epoch": 522, "lr": 4.106111728413093e-06} +{"train_loss": 0.00019057834288105369, "global_step": 62190, "epoch": 522, "lr": 4.105232519203428e-06} +{"train_loss": 0.0004148765583522618, "global_step": 62191, "epoch": 522, "lr": 4.104353400103233e-06} +{"train_loss": 0.00021182447380851954, "global_step": 62192, "epoch": 522, "lr": 4.103474371114246e-06} +{"train_loss": 0.00032984893186949193, "global_step": 62193, "epoch": 522, "lr": 4.102595432238176e-06} +{"train_loss": 0.0004985605482943356, "global_step": 62194, "epoch": 522, "lr": 4.1017165834767616e-06} +{"train_loss": 0.00018640696362126619, "global_step": 62195, "epoch": 522, "lr": 4.100837824831722e-06} +{"train_loss": 0.0006206537364050746, "global_step": 62196, "epoch": 522, "lr": 4.099959156304784e-06} +{"train_loss": 0.00021685368847101927, "global_step": 62197, "epoch": 522, "lr": 4.099080577897674e-06} +{"train_loss": 0.00035792560083791614, "global_step": 62198, "epoch": 522, "lr": 4.098202089612108e-06} +{"train_loss": 0.00023653768585063517, "global_step": 62199, "epoch": 522, "lr": 4.097323691449828e-06} +{"train_loss": 0.00027633027639240026, "global_step": 62200, "epoch": 522, "lr": 4.096445383412539e-06} +{"train_loss": 0.00020943852723576128, "global_step": 62201, "epoch": 522, "lr": 4.095567165501984e-06} +{"train_loss": 0.0003167247341480106, "global_step": 62202, "epoch": 522, "lr": 4.094689037719879e-06} +{"train_loss": 0.0001925425312947482, "global_step": 62203, "epoch": 522, "lr": 4.093811000067943e-06} +{"train_loss": 0.0002497373498044908, "global_step": 62204, "epoch": 522, "lr": 4.0929330525479095e-06} +{"train_loss": 0.00046375967212952673, "global_step": 62205, "epoch": 522, "lr": 4.092055195161487e-06} +{"train_loss": 0.0004132871108595282, "global_step": 62206, "epoch": 522, "lr": 4.091177427910414e-06} +{"train_loss": 0.00020846827828790992, "global_step": 62207, "epoch": 522, "lr": 4.0902997507964166e-06} +{"train_loss": 0.0001773325348040089, "global_step": 62208, "epoch": 522, "lr": 4.0894221638211995e-06} +{"train_loss": 0.0004957318888045847, "global_step": 62209, "epoch": 522, "lr": 4.08854466698651e-06} +{"train_loss": 0.0002220496244262904, "global_step": 62210, "epoch": 522, "lr": 4.087667260294048e-06} +{"train_loss": 0.00019812650862149894, "global_step": 62211, "epoch": 522, "lr": 4.08678994374555e-06} +{"train_loss": 0.0004500828217715025, "global_step": 62212, "epoch": 522, "lr": 4.085912717342733e-06} +{"train_loss": 0.0004879642801824957, "global_step": 62213, "epoch": 522, "lr": 4.085035581087327e-06} +{"train_loss": 0.00027239148039370775, "global_step": 62214, "epoch": 522, "lr": 4.0841585349810475e-06} +{"train_loss": 0.0001754545228322968, "global_step": 62215, "epoch": 522, "lr": 4.083281579025611e-06} +{"train_loss": 0.0004885917296633124, "global_step": 62216, "epoch": 522, "lr": 4.082404713222754e-06} +{"train_loss": 0.0003234523464925587, "global_step": 62217, "epoch": 522, "lr": 4.0815279375741814e-06} +{"train_loss": 0.00021398856188170612, "global_step": 62218, "epoch": 522, "lr": 4.08065125208163e-06} +{"train_loss": 0.00019867329683620483, "global_step": 62219, "epoch": 522, "lr": 4.079774656746804e-06} +{"train_loss": 0.00026235642144456506, "global_step": 62220, "epoch": 522, "lr": 4.078898151571447e-06} +{"train_loss": 0.00033091616933234036, "global_step": 62221, "epoch": 522, "lr": 4.078021736557264e-06} +{"train_loss": 0.00039873772766441107, "global_step": 62222, "epoch": 522, "lr": 4.077145411705974e-06} +{"train_loss": 0.00031957696774043143, "global_step": 62223, "epoch": 522, "lr": 4.0762691770193095e-06} +{"train_loss": 0.0002373484312556684, "global_step": 62224, "epoch": 522, "lr": 4.075393032498975e-06} +{"train_loss": 0.00046798030962236226, "global_step": 62225, "epoch": 522, "lr": 4.074516978146709e-06} +{"train_loss": 0.000593446777202189, "global_step": 62226, "epoch": 522, "lr": 4.073641013964219e-06} +{"train_loss": 0.0007404159987345338, "global_step": 62227, "epoch": 522, "lr": 4.072765139953233e-06} +{"train_loss": 0.0004812132683582604, "global_step": 62228, "epoch": 522, "lr": 4.071889356115461e-06} +{"train_loss": 0.00021427753381431103, "global_step": 62229, "epoch": 522, "lr": 4.071013662452628e-06} +{"train_loss": 0.0003739834937732667, "global_step": 62230, "epoch": 522, "lr": 4.070138058966455e-06} +{"train_loss": 0.0001805332285584882, "global_step": 62231, "epoch": 522, "lr": 4.069262545658653e-06} +{"train_loss": 0.00031165609834715724, "global_step": 62232, "epoch": 522, "lr": 4.068387122530954e-06} +{"train_loss": 0.0003198429476469755, "global_step": 62233, "epoch": 522, "lr": 4.067511789585071e-06} +{"train_loss": 0.000279528321698308, "global_step": 62234, "epoch": 522, "lr": 4.066636546822711e-06} +{"train_loss": 0.0003147203824482858, "global_step": 62235, "epoch": 522, "lr": 4.0657613942456154e-06} +{"train_loss": 0.0003381858770823607, "global_step": 62236, "epoch": 522, "lr": 4.064886331855477e-06, "val_loss": 0.02880941890180111} +{"train_loss": 0.00028137676417827606, "global_step": 62237, "epoch": 523, "lr": 4.0640113596540405e-06} +{"train_loss": 0.00021582750196103007, "global_step": 62238, "epoch": 523, "lr": 4.063136477642998e-06} +{"train_loss": 0.00024942460004240274, "global_step": 62239, "epoch": 523, "lr": 4.062261685824087e-06} +{"train_loss": 0.0007299702265299857, "global_step": 62240, "epoch": 523, "lr": 4.061386984199011e-06} +{"train_loss": 0.00017098078387789428, "global_step": 62241, "epoch": 523, "lr": 4.060512372769493e-06} +{"train_loss": 0.0003099085879512131, "global_step": 62242, "epoch": 523, "lr": 4.059637851537262e-06} +{"train_loss": 0.0001691204379312694, "global_step": 62243, "epoch": 523, "lr": 4.058763420504014e-06} +{"train_loss": 0.0005580276483669877, "global_step": 62244, "epoch": 523, "lr": 4.057889079671484e-06} +{"train_loss": 0.0002302482898812741, "global_step": 62245, "epoch": 523, "lr": 4.057014829041372e-06} +{"train_loss": 0.0002577363629825413, "global_step": 62246, "epoch": 523, "lr": 4.05614066861541e-06} +{"train_loss": 0.00019390639499761164, "global_step": 62247, "epoch": 523, "lr": 4.055266598395308e-06} +{"train_loss": 0.0004228528414387256, "global_step": 62248, "epoch": 523, "lr": 4.054392618382774e-06} +{"train_loss": 0.00033704782254062593, "global_step": 62249, "epoch": 523, "lr": 4.053518728579542e-06} +{"train_loss": 0.0004939381033182144, "global_step": 62250, "epoch": 523, "lr": 4.052644928987304e-06} +{"train_loss": 0.0003188069094903767, "global_step": 62251, "epoch": 523, "lr": 4.051771219607803e-06} +{"train_loss": 0.0004373465199023485, "global_step": 62252, "epoch": 523, "lr": 4.0508976004427376e-06} +{"train_loss": 0.0002644227060955018, "global_step": 62253, "epoch": 523, "lr": 4.0500240714938185e-06} +{"train_loss": 0.0003034250403288752, "global_step": 62254, "epoch": 523, "lr": 4.049150632762777e-06} +{"train_loss": 0.00036404255661182106, "global_step": 62255, "epoch": 523, "lr": 4.048277284251306e-06} +{"train_loss": 0.00021985081548336893, "global_step": 62256, "epoch": 523, "lr": 4.047404025961144e-06} +{"train_loss": 0.0003630186547525227, "global_step": 62257, "epoch": 523, "lr": 4.046530857893988e-06} +{"train_loss": 0.00018808087042998523, "global_step": 62258, "epoch": 523, "lr": 4.0456577800515706e-06} +{"train_loss": 0.00016751476505305618, "global_step": 62259, "epoch": 523, "lr": 4.044784792435591e-06} +{"train_loss": 0.00037552410503849387, "global_step": 62260, "epoch": 523, "lr": 4.043911895047758e-06} +{"train_loss": 0.0003788066387642175, "global_step": 62261, "epoch": 523, "lr": 4.0430390878898e-06} +{"train_loss": 0.0003644353128038347, "global_step": 62262, "epoch": 523, "lr": 4.0421663709634235e-06} +{"train_loss": 0.00036678623291663826, "global_step": 62263, "epoch": 523, "lr": 4.041293744270347e-06} +{"train_loss": 0.0002423308469587937, "global_step": 62264, "epoch": 523, "lr": 4.040421207812284e-06} +{"train_loss": 0.00020205770852044225, "global_step": 62265, "epoch": 523, "lr": 4.039548761590928e-06} +{"train_loss": 0.0002521115820854902, "global_step": 62266, "epoch": 523, "lr": 4.038676405608022e-06} +{"train_loss": 0.0001830577093642205, "global_step": 62267, "epoch": 523, "lr": 4.037804139865259e-06} +{"train_loss": 0.0002192288520745933, "global_step": 62268, "epoch": 523, "lr": 4.03693196436436e-06} +{"train_loss": 0.00017149662016890943, "global_step": 62269, "epoch": 523, "lr": 4.0360598791070294e-06} +{"train_loss": 0.0003410613862797618, "global_step": 62270, "epoch": 523, "lr": 4.035187884094993e-06} +{"train_loss": 0.00017733486311044544, "global_step": 62271, "epoch": 523, "lr": 4.034315979329945e-06} +{"train_loss": 0.0006661389488726854, "global_step": 62272, "epoch": 523, "lr": 4.033444164813616e-06} +{"train_loss": 0.00023343812790699303, "global_step": 62273, "epoch": 523, "lr": 4.032572440547699e-06} +{"train_loss": 0.00038483028765767813, "global_step": 62274, "epoch": 523, "lr": 4.031700806533923e-06} +{"train_loss": 0.0002624513581395149, "global_step": 62275, "epoch": 523, "lr": 4.030829262773983e-06} +{"train_loss": 0.00033134923432953656, "global_step": 62276, "epoch": 523, "lr": 4.029957809269602e-06} +{"train_loss": 0.00040186874684877694, "global_step": 62277, "epoch": 523, "lr": 4.029086446022495e-06} +{"train_loss": 0.00019529509881976992, "global_step": 62278, "epoch": 523, "lr": 4.028215173034361e-06} +{"train_loss": 0.0002594097168184817, "global_step": 62279, "epoch": 523, "lr": 4.027343990306914e-06} +{"train_loss": 0.0003097597509622574, "global_step": 62280, "epoch": 523, "lr": 4.026472897841871e-06} +{"train_loss": 0.00022634858032688498, "global_step": 62281, "epoch": 523, "lr": 4.025601895640923e-06} +{"train_loss": 0.0002640613238327205, "global_step": 62282, "epoch": 523, "lr": 4.02473098370581e-06} +{"train_loss": 0.0004333301039878279, "global_step": 62283, "epoch": 523, "lr": 4.023860162038223e-06} +{"train_loss": 0.0003353222564328462, "global_step": 62284, "epoch": 523, "lr": 4.022989430639868e-06} +{"train_loss": 0.00038902219966985285, "global_step": 62285, "epoch": 523, "lr": 4.022118789512469e-06} +{"train_loss": 0.0005182040622457862, "global_step": 62286, "epoch": 523, "lr": 4.021248238657716e-06} +{"train_loss": 0.000229466546443291, "global_step": 62287, "epoch": 523, "lr": 4.020377778077344e-06} +{"train_loss": 0.0002629261580295861, "global_step": 62288, "epoch": 523, "lr": 4.0195074077730324e-06} +{"train_loss": 0.0001853670837590471, "global_step": 62289, "epoch": 523, "lr": 4.018637127746522e-06} +{"train_loss": 0.0002195242850575596, "global_step": 62290, "epoch": 523, "lr": 4.017766937999501e-06} +{"train_loss": 0.00021361245308071375, "global_step": 62291, "epoch": 523, "lr": 4.016896838533673e-06} +{"train_loss": 0.0004367827787064016, "global_step": 62292, "epoch": 523, "lr": 4.0160268293507665e-06} +{"train_loss": 0.0006610552663914859, "global_step": 62293, "epoch": 523, "lr": 4.015156910452467e-06} +{"train_loss": 0.00024298598873429, "global_step": 62294, "epoch": 523, "lr": 4.0142870818405064e-06} +{"train_loss": 0.000213969629839994, "global_step": 62295, "epoch": 523, "lr": 4.013417343516568e-06} +{"train_loss": 0.000644457817543298, "global_step": 62296, "epoch": 523, "lr": 4.012547695482383e-06} +{"train_loss": 0.0005168003845028579, "global_step": 62297, "epoch": 523, "lr": 4.011678137739649e-06} +{"train_loss": 0.0003385573800187558, "global_step": 62298, "epoch": 523, "lr": 4.0108086702900615e-06} +{"train_loss": 0.0002047958259936422, "global_step": 62299, "epoch": 523, "lr": 4.009939293135345e-06} +{"train_loss": 0.00023018752108328044, "global_step": 62300, "epoch": 523, "lr": 4.009070006277193e-06} +{"train_loss": 0.00018728226132225245, "global_step": 62301, "epoch": 523, "lr": 4.0082008097173275e-06} +{"train_loss": 0.0005137954140082002, "global_step": 62302, "epoch": 523, "lr": 4.00733170345744e-06} +{"train_loss": 0.00040719128446653485, "global_step": 62303, "epoch": 523, "lr": 4.006462687499241e-06} +{"train_loss": 0.0005135605460964143, "global_step": 62304, "epoch": 523, "lr": 4.005593761844439e-06} +{"train_loss": 0.00047453411389142275, "global_step": 62305, "epoch": 523, "lr": 4.004724926494746e-06} +{"train_loss": 0.0002560557040851563, "global_step": 62306, "epoch": 523, "lr": 4.003856181451854e-06} +{"train_loss": 0.00021302158711478114, "global_step": 62307, "epoch": 523, "lr": 4.002987526717483e-06} +{"train_loss": 0.00021635956363752484, "global_step": 62308, "epoch": 523, "lr": 4.002118962293328e-06} +{"train_loss": 0.0002065696899080649, "global_step": 62309, "epoch": 523, "lr": 4.001250488181102e-06} +{"train_loss": 0.0003120995534118265, "global_step": 62310, "epoch": 523, "lr": 4.0003821043825e-06} +{"train_loss": 0.0003329583560116589, "global_step": 62311, "epoch": 523, "lr": 3.999513810899241e-06} +{"train_loss": 0.00046020446461625397, "global_step": 62312, "epoch": 523, "lr": 3.998645607733015e-06} +{"train_loss": 0.0002088401815854013, "global_step": 62313, "epoch": 523, "lr": 3.997777494885541e-06} +{"train_loss": 0.00044959818478673697, "global_step": 62314, "epoch": 523, "lr": 3.996909472358506e-06} +{"train_loss": 0.00036334714968688786, "global_step": 62315, "epoch": 523, "lr": 3.996041540153639e-06} +{"train_loss": 0.0004164588754065335, "global_step": 62316, "epoch": 523, "lr": 3.995173698272625e-06} +{"train_loss": 0.000628755777142942, "global_step": 62317, "epoch": 523, "lr": 3.994305946717164e-06} +{"train_loss": 0.0002915000659413636, "global_step": 62318, "epoch": 523, "lr": 3.9934382854889816e-06} +{"train_loss": 0.00025938902399502695, "global_step": 62319, "epoch": 523, "lr": 3.992570714589755e-06} +{"train_loss": 0.0004631507326848805, "global_step": 62320, "epoch": 523, "lr": 3.9917032340212105e-06} +{"train_loss": 0.00047018774785101414, "global_step": 62321, "epoch": 523, "lr": 3.99083584378504e-06} +{"train_loss": 0.0002985166502185166, "global_step": 62322, "epoch": 523, "lr": 3.989968543882944e-06} +{"train_loss": 0.00032192590879276395, "global_step": 62323, "epoch": 523, "lr": 3.989101334316631e-06} +{"train_loss": 0.0004255032690707594, "global_step": 62324, "epoch": 523, "lr": 3.9882342150877995e-06} +{"train_loss": 0.0003439259307924658, "global_step": 62325, "epoch": 523, "lr": 3.9873671861981595e-06} +{"train_loss": 0.0004369599628262222, "global_step": 62326, "epoch": 523, "lr": 3.9865002476493994e-06} +{"train_loss": 0.00022712757345288992, "global_step": 62327, "epoch": 523, "lr": 3.985633399443239e-06} +{"train_loss": 0.00035938856308348477, "global_step": 62328, "epoch": 523, "lr": 3.984766641581372e-06} +{"train_loss": 0.0002460666000843048, "global_step": 62329, "epoch": 523, "lr": 3.983899974065491e-06} +{"train_loss": 0.0001911615690914914, "global_step": 62330, "epoch": 523, "lr": 3.983033396897317e-06} +{"train_loss": 0.0003429624775890261, "global_step": 62331, "epoch": 523, "lr": 3.982166910078533e-06} +{"train_loss": 0.0003450455260463059, "global_step": 62332, "epoch": 523, "lr": 3.981300513610853e-06} +{"train_loss": 0.00026259978767484426, "global_step": 62333, "epoch": 523, "lr": 3.980434207495975e-06} +{"train_loss": 0.00027253100415691733, "global_step": 62334, "epoch": 523, "lr": 3.979567991735588e-06} +{"train_loss": 0.0005847980501130223, "global_step": 62335, "epoch": 523, "lr": 3.978701866331414e-06} +{"train_loss": 0.00022284637088887393, "global_step": 62336, "epoch": 523, "lr": 3.977835831285132e-06} +{"train_loss": 0.0003794092044699937, "global_step": 62337, "epoch": 523, "lr": 3.976969886598458e-06} +{"train_loss": 0.00023214210523292422, "global_step": 62338, "epoch": 523, "lr": 3.976104032273081e-06} +{"train_loss": 0.00020116489031352103, "global_step": 62339, "epoch": 523, "lr": 3.97523826831071e-06} +{"train_loss": 0.0004133972979616374, "global_step": 62340, "epoch": 523, "lr": 3.974372594713044e-06} +{"train_loss": 0.00040149304550141096, "global_step": 62341, "epoch": 523, "lr": 3.973507011481775e-06} +{"train_loss": 0.0003414337697904557, "global_step": 62342, "epoch": 523, "lr": 3.9726415186186194e-06} +{"train_loss": 0.0006061709718778729, "global_step": 62343, "epoch": 523, "lr": 3.971776116125253e-06} +{"train_loss": 0.0002898376842495054, "global_step": 62344, "epoch": 523, "lr": 3.970910804003392e-06} +{"train_loss": 0.00019406045612413436, "global_step": 62345, "epoch": 523, "lr": 3.970045582254728e-06} +{"train_loss": 0.0004072030424140394, "global_step": 62346, "epoch": 523, "lr": 3.969180450880966e-06} +{"train_loss": 0.00021645650849677622, "global_step": 62347, "epoch": 523, "lr": 3.968315409883805e-06} +{"train_loss": 0.00039553610258735716, "global_step": 62348, "epoch": 523, "lr": 3.967450459264926e-06} +{"train_loss": 0.00030827330192551017, "global_step": 62349, "epoch": 523, "lr": 3.966585599026052e-06} +{"train_loss": 0.00018520603771321476, "global_step": 62350, "epoch": 523, "lr": 3.965720829168856e-06} +{"train_loss": 0.00020656778360716999, "global_step": 62351, "epoch": 523, "lr": 3.964856149695062e-06} +{"train_loss": 0.0006141072954051197, "global_step": 62352, "epoch": 523, "lr": 3.963991560606351e-06} +{"train_loss": 0.0002012337208725512, "global_step": 62353, "epoch": 523, "lr": 3.96312706190442e-06} +{"train_loss": 0.0002241938200313598, "global_step": 62354, "epoch": 523, "lr": 3.962262653590976e-06} +{"train_loss": 0.0003275269871878931, "global_step": 62355, "epoch": 523, "lr": 3.9613983356677045e-06, "val_loss": 0.01721854880452156} +{"train_loss": 0.0004904552479274571, "global_step": 62356, "epoch": 524, "lr": 3.960534108136316e-06} +{"train_loss": 0.0003075782733503729, "global_step": 62357, "epoch": 524, "lr": 3.959669970998492e-06} +{"train_loss": 0.0002773646847344935, "global_step": 62358, "epoch": 524, "lr": 3.958805924255948e-06} +{"train_loss": 0.00022197423095349222, "global_step": 62359, "epoch": 524, "lr": 3.957941967910367e-06} +{"train_loss": 0.00045442377449944615, "global_step": 62360, "epoch": 524, "lr": 3.9570781019634405e-06} +{"train_loss": 0.0003845164901576936, "global_step": 62361, "epoch": 524, "lr": 3.956214326416879e-06} +{"train_loss": 0.0002526604803279042, "global_step": 62362, "epoch": 524, "lr": 3.955350641272365e-06} +{"train_loss": 0.00029386734240688384, "global_step": 62363, "epoch": 524, "lr": 3.954487046531608e-06} +{"train_loss": 0.00045576499542221427, "global_step": 62364, "epoch": 524, "lr": 3.953623542196289e-06} +{"train_loss": 0.000517527456395328, "global_step": 62365, "epoch": 524, "lr": 3.952760128268118e-06} +{"train_loss": 0.0003412057412788272, "global_step": 62366, "epoch": 524, "lr": 3.951896804748789e-06} +{"train_loss": 0.0007695864769630134, "global_step": 62367, "epoch": 524, "lr": 3.951033571639978e-06} +{"train_loss": 0.0005524326115846634, "global_step": 62368, "epoch": 524, "lr": 3.9501704289434005e-06} +{"train_loss": 0.0002596242993604392, "global_step": 62369, "epoch": 524, "lr": 3.949307376660738e-06} +{"train_loss": 0.0002748641127254814, "global_step": 62370, "epoch": 524, "lr": 3.948444414793695e-06} +{"train_loss": 0.00025138407363556325, "global_step": 62371, "epoch": 524, "lr": 3.947581543343954e-06} +{"train_loss": 0.00022368454665411264, "global_step": 62372, "epoch": 524, "lr": 3.9467187623132285e-06} +{"train_loss": 0.0002854737685993314, "global_step": 62373, "epoch": 524, "lr": 3.945856071703191e-06} +{"train_loss": 0.00036247368552722037, "global_step": 62374, "epoch": 524, "lr": 3.94499347151554e-06} +{"train_loss": 0.0005505512817762792, "global_step": 62375, "epoch": 524, "lr": 3.944130961751991e-06} +{"train_loss": 0.0003544591600075364, "global_step": 62376, "epoch": 524, "lr": 3.943268542414208e-06} +{"train_loss": 0.00022943860676605254, "global_step": 62377, "epoch": 524, "lr": 3.942406213503902e-06} +{"train_loss": 0.00030173728009685874, "global_step": 62378, "epoch": 524, "lr": 3.941543975022766e-06} +{"train_loss": 0.00034959788899868727, "global_step": 62379, "epoch": 524, "lr": 3.940681826972475e-06} +{"train_loss": 0.0005782548687420785, "global_step": 62380, "epoch": 524, "lr": 3.939819769354747e-06} +{"train_loss": 0.00023620249703526497, "global_step": 62381, "epoch": 524, "lr": 3.9389578021712505e-06} +{"train_loss": 0.00026578374672681093, "global_step": 62382, "epoch": 524, "lr": 3.938095925423702e-06} +{"train_loss": 0.0005677514709532261, "global_step": 62383, "epoch": 524, "lr": 3.9372341391137765e-06} +{"train_loss": 0.0002084833540720865, "global_step": 62384, "epoch": 524, "lr": 3.936372443243164e-06} +{"train_loss": 0.00022298401745501906, "global_step": 62385, "epoch": 524, "lr": 3.935510837813572e-06} +{"train_loss": 0.000644730287604034, "global_step": 62386, "epoch": 524, "lr": 3.934649322826672e-06} +{"train_loss": 0.0006971508846618235, "global_step": 62387, "epoch": 524, "lr": 3.93378789828418e-06} +{"train_loss": 0.00021675637981388718, "global_step": 62388, "epoch": 524, "lr": 3.932926564187761e-06} +{"train_loss": 0.00048436864744871855, "global_step": 62389, "epoch": 524, "lr": 3.93206532053913e-06} +{"train_loss": 0.00048228594823740423, "global_step": 62390, "epoch": 524, "lr": 3.9312041673399695e-06} +{"train_loss": 0.0005378341302275658, "global_step": 62391, "epoch": 524, "lr": 3.930343104591955e-06} +{"train_loss": 0.00031513068825006485, "global_step": 62392, "epoch": 524, "lr": 3.929482132296802e-06} +{"train_loss": 0.00042551071965135634, "global_step": 62393, "epoch": 524, "lr": 3.928621250456177e-06} +{"train_loss": 0.0005217351135797799, "global_step": 62394, "epoch": 524, "lr": 3.927760459071794e-06} +{"train_loss": 0.0002624655608087778, "global_step": 62395, "epoch": 524, "lr": 3.926899758145319e-06} +{"train_loss": 0.0006504927878268063, "global_step": 62396, "epoch": 524, "lr": 3.9260391476784675e-06} +{"train_loss": 0.0002969754859805107, "global_step": 62397, "epoch": 524, "lr": 3.92517862767291e-06} +{"train_loss": 0.00037123815855011344, "global_step": 62398, "epoch": 524, "lr": 3.924318198130339e-06} +{"train_loss": 0.00029377915780059993, "global_step": 62399, "epoch": 524, "lr": 3.923457859052449e-06} +{"train_loss": 0.00020497287914622575, "global_step": 62400, "epoch": 524, "lr": 3.9225976104409255e-06} +{"train_loss": 0.0003082639304921031, "global_step": 62401, "epoch": 524, "lr": 3.9217374522974636e-06} +{"train_loss": 0.00025547793484292924, "global_step": 62402, "epoch": 524, "lr": 3.920877384623739e-06} +{"train_loss": 0.00020984222646802664, "global_step": 62403, "epoch": 524, "lr": 3.9200174074214555e-06} +{"train_loss": 0.0002275307779200375, "global_step": 62404, "epoch": 524, "lr": 3.919157520692291e-06} +{"train_loss": 0.0003640226204879582, "global_step": 62405, "epoch": 524, "lr": 3.9182977244379415e-06} +{"train_loss": 0.00022499360784422606, "global_step": 62406, "epoch": 524, "lr": 3.917438018660086e-06} +{"train_loss": 0.0006850433419458568, "global_step": 62407, "epoch": 524, "lr": 3.9165784033604265e-06} +{"train_loss": 0.00046710058813914657, "global_step": 62408, "epoch": 524, "lr": 3.91571887854063e-06} +{"train_loss": 0.0002532897051423788, "global_step": 62409, "epoch": 524, "lr": 3.914859444202406e-06} +{"train_loss": 0.0001732090167934075, "global_step": 62410, "epoch": 524, "lr": 3.914000100347426e-06} +{"train_loss": 0.00045465922448784113, "global_step": 62411, "epoch": 524, "lr": 3.913140846977392e-06} +{"train_loss": 0.0007993221515789628, "global_step": 62412, "epoch": 524, "lr": 3.912281684093971e-06} +{"train_loss": 0.00028002349426969886, "global_step": 62413, "epoch": 524, "lr": 3.911422611698873e-06} +{"train_loss": 0.00035839976044371724, "global_step": 62414, "epoch": 524, "lr": 3.910563629793762e-06} +{"train_loss": 0.00024696195032447577, "global_step": 62415, "epoch": 524, "lr": 3.909704738380343e-06} +{"train_loss": 0.00039277452742680907, "global_step": 62416, "epoch": 524, "lr": 3.908845937460293e-06} +{"train_loss": 0.00047936232294887304, "global_step": 62417, "epoch": 524, "lr": 3.907987227035298e-06} +{"train_loss": 0.0005931217456236482, "global_step": 62418, "epoch": 524, "lr": 3.907128607107047e-06} +{"train_loss": 0.0003755727375391871, "global_step": 62419, "epoch": 524, "lr": 3.906270077677221e-06} +{"train_loss": 0.0006010229117237031, "global_step": 62420, "epoch": 524, "lr": 3.905411638747519e-06} +{"train_loss": 0.000345563399605453, "global_step": 62421, "epoch": 524, "lr": 3.904553290319612e-06} +{"train_loss": 0.00037414769758470356, "global_step": 62422, "epoch": 524, "lr": 3.9036950323951826e-06} +{"train_loss": 0.00024202416534535587, "global_step": 62423, "epoch": 524, "lr": 3.902836864975934e-06} +{"train_loss": 0.00018498365534469485, "global_step": 62424, "epoch": 524, "lr": 3.9019787880635315e-06} +{"train_loss": 0.0002657382283359766, "global_step": 62425, "epoch": 524, "lr": 3.9011208016596745e-06} +{"train_loss": 0.0006036154227331281, "global_step": 62426, "epoch": 524, "lr": 3.900262905766039e-06} +{"train_loss": 0.0002790334983728826, "global_step": 62427, "epoch": 524, "lr": 3.899405100384318e-06} +{"train_loss": 0.00031539349583908916, "global_step": 62428, "epoch": 524, "lr": 3.898547385516188e-06} +{"train_loss": 0.00019889358372893184, "global_step": 62429, "epoch": 524, "lr": 3.897689761163325e-06} +{"train_loss": 0.0003385145391803235, "global_step": 62430, "epoch": 524, "lr": 3.896832227327435e-06} +{"train_loss": 0.0005467328592203557, "global_step": 62431, "epoch": 524, "lr": 3.895974784010181e-06} +{"train_loss": 0.00033567979699000716, "global_step": 62432, "epoch": 524, "lr": 3.895117431213263e-06} +{"train_loss": 0.0002570246870163828, "global_step": 62433, "epoch": 524, "lr": 3.894260168938346e-06} +{"train_loss": 0.0003124902432318777, "global_step": 62434, "epoch": 524, "lr": 3.893402997187135e-06} +{"train_loss": 0.0003741885011550039, "global_step": 62435, "epoch": 524, "lr": 3.892545915961293e-06} +{"train_loss": 0.000224394301767461, "global_step": 62436, "epoch": 524, "lr": 3.891688925262516e-06} +{"train_loss": 0.0003702374524436891, "global_step": 62437, "epoch": 524, "lr": 3.890832025092478e-06} +{"train_loss": 0.00021384500723797828, "global_step": 62438, "epoch": 524, "lr": 3.889975215452868e-06} +{"train_loss": 0.0001803646591724828, "global_step": 62439, "epoch": 524, "lr": 3.889118496345362e-06} +{"train_loss": 0.0001287124614464119, "global_step": 62440, "epoch": 524, "lr": 3.888261867771653e-06} +{"train_loss": 0.000481502094771713, "global_step": 62441, "epoch": 524, "lr": 3.8874053297334064e-06} +{"train_loss": 0.0002225041826022789, "global_step": 62442, "epoch": 524, "lr": 3.886548882232322e-06} +{"train_loss": 0.00032355583971366286, "global_step": 62443, "epoch": 524, "lr": 3.885692525270063e-06} +{"train_loss": 0.000251205638051033, "global_step": 62444, "epoch": 524, "lr": 3.8848362588483286e-06} +{"train_loss": 0.00033437920501455665, "global_step": 62445, "epoch": 524, "lr": 3.883980082968785e-06} +{"train_loss": 0.0005419097142294049, "global_step": 62446, "epoch": 524, "lr": 3.883123997633126e-06} +{"train_loss": 0.0003809010668192059, "global_step": 62447, "epoch": 524, "lr": 3.8822680028430255e-06} +{"train_loss": 0.00017359211051370949, "global_step": 62448, "epoch": 524, "lr": 3.881412098600162e-06} +{"train_loss": 0.00041544955456629395, "global_step": 62449, "epoch": 524, "lr": 3.880556284906223e-06} +{"train_loss": 0.00019110004359390587, "global_step": 62450, "epoch": 524, "lr": 3.879700561762873e-06} +{"train_loss": 0.0007967908168211579, "global_step": 62451, "epoch": 524, "lr": 3.878844929171815e-06} +{"train_loss": 0.0003535322321113199, "global_step": 62452, "epoch": 524, "lr": 3.877989387134717e-06} +{"train_loss": 0.0003421804285608232, "global_step": 62453, "epoch": 524, "lr": 3.877133935653254e-06} +{"train_loss": 0.0002106124593410641, "global_step": 62454, "epoch": 524, "lr": 3.87627857472912e-06} +{"train_loss": 0.00024339501396752894, "global_step": 62455, "epoch": 524, "lr": 3.8754233043639735e-06} +{"train_loss": 0.00025264552095904946, "global_step": 62456, "epoch": 524, "lr": 3.874568124559514e-06} +{"train_loss": 0.0006295953644439578, "global_step": 62457, "epoch": 524, "lr": 3.873713035317406e-06} +{"train_loss": 0.0007602536934427917, "global_step": 62458, "epoch": 524, "lr": 3.872858036639343e-06} +{"train_loss": 0.00023251074890140444, "global_step": 62459, "epoch": 524, "lr": 3.872003128526991e-06} +{"train_loss": 0.00028378545539453626, "global_step": 62460, "epoch": 524, "lr": 3.8711483109820316e-06} +{"train_loss": 0.00040079557220451534, "global_step": 62461, "epoch": 524, "lr": 3.870293584006146e-06} +{"train_loss": 0.0003568873507902026, "global_step": 62462, "epoch": 524, "lr": 3.869438947601006e-06} +{"train_loss": 0.00034912151750177145, "global_step": 62463, "epoch": 524, "lr": 3.868584401768299e-06} +{"train_loss": 0.000337194767780602, "global_step": 62464, "epoch": 524, "lr": 3.867729946509696e-06} +{"train_loss": 0.0002830226148944348, "global_step": 62465, "epoch": 524, "lr": 3.866875581826879e-06} +{"train_loss": 0.0002874887431971729, "global_step": 62466, "epoch": 524, "lr": 3.866021307721529e-06} +{"train_loss": 0.00031482582562603056, "global_step": 62467, "epoch": 524, "lr": 3.865167124195302e-06} +{"train_loss": 0.0004671058268286288, "global_step": 62468, "epoch": 524, "lr": 3.864313031249905e-06} +{"train_loss": 0.0003760128456633538, "global_step": 62469, "epoch": 524, "lr": 3.86345902888699e-06} +{"train_loss": 0.000514744024258107, "global_step": 62470, "epoch": 524, "lr": 3.862605117108253e-06} +{"train_loss": 0.00021967144857626408, "global_step": 62471, "epoch": 524, "lr": 3.8617512959153504e-06} +{"train_loss": 0.0009282745304517448, "global_step": 62472, "epoch": 524, "lr": 3.8608975653099735e-06} +{"train_loss": 0.0002920846454799175, "global_step": 62473, "epoch": 524, "lr": 3.860043925293805e-06} +{"train_loss": 0.0003686729683335323, "global_step": 62474, "epoch": 524, "lr": 3.859190375868499e-06, "val_loss": 0.028480514883995056} +{"train_loss": 0.0003153001016471535, "global_step": 62475, "epoch": 525, "lr": 3.858336917035749e-06} +{"train_loss": 0.00043892726534977555, "global_step": 62476, "epoch": 525, "lr": 3.857483548797225e-06} +{"train_loss": 0.00030511280056089163, "global_step": 62477, "epoch": 525, "lr": 3.8566302711546045e-06} +{"train_loss": 0.00024161739565897733, "global_step": 62478, "epoch": 525, "lr": 3.855777084109563e-06} +{"train_loss": 0.00027941944426856935, "global_step": 62479, "epoch": 525, "lr": 3.854923987663761e-06} +{"train_loss": 0.0004078044439665973, "global_step": 62480, "epoch": 525, "lr": 3.854070981818897e-06} +{"train_loss": 0.0002551102079451084, "global_step": 62481, "epoch": 525, "lr": 3.85321806657663e-06} +{"train_loss": 0.00025458927848376334, "global_step": 62482, "epoch": 525, "lr": 3.852365241938644e-06} +{"train_loss": 0.00019421704928390682, "global_step": 62483, "epoch": 525, "lr": 3.8515125079066014e-06} +{"train_loss": 0.0002354855096200481, "global_step": 62484, "epoch": 525, "lr": 3.8506598644821925e-06} +{"train_loss": 0.00013390005915425718, "global_step": 62485, "epoch": 525, "lr": 3.849807311667081e-06} +{"train_loss": 0.0003827514301519841, "global_step": 62486, "epoch": 525, "lr": 3.848954849462932e-06} +{"train_loss": 0.00015518625150434673, "global_step": 62487, "epoch": 525, "lr": 3.84810247787144e-06} +{"train_loss": 0.0005938968388363719, "global_step": 62488, "epoch": 525, "lr": 3.847250196894264e-06} +{"train_loss": 0.00034884896012954414, "global_step": 62489, "epoch": 525, "lr": 3.846398006533086e-06} +{"train_loss": 0.0002730555133894086, "global_step": 62490, "epoch": 525, "lr": 3.845545906789577e-06} +{"train_loss": 0.0003807774337474257, "global_step": 62491, "epoch": 525, "lr": 3.844693897665397e-06} +{"train_loss": 0.00043230262235738337, "global_step": 62492, "epoch": 525, "lr": 3.8438419791622384e-06} +{"train_loss": 0.00019961553334724158, "global_step": 62493, "epoch": 525, "lr": 3.842990151281756e-06} +{"train_loss": 0.00014994075172580779, "global_step": 62494, "epoch": 525, "lr": 3.842138414025642e-06} +{"train_loss": 0.0005215032724663615, "global_step": 62495, "epoch": 525, "lr": 3.8412867673955465e-06} +{"train_loss": 0.0002794999163597822, "global_step": 62496, "epoch": 525, "lr": 3.840435211393162e-06} +{"train_loss": 0.0006602043868042529, "global_step": 62497, "epoch": 525, "lr": 3.839583746020153e-06} +{"train_loss": 0.0006591079290956259, "global_step": 62498, "epoch": 525, "lr": 3.838732371278181e-06} +{"train_loss": 0.0003249376022722572, "global_step": 62499, "epoch": 525, "lr": 3.837881087168932e-06} +{"train_loss": 0.0002943410654552281, "global_step": 62500, "epoch": 525, "lr": 3.837029893694066e-06} +{"train_loss": 0.00021154273417778313, "global_step": 62501, "epoch": 525, "lr": 3.836178790855271e-06} +{"train_loss": 0.00034413562389090657, "global_step": 62502, "epoch": 525, "lr": 3.835327778654197e-06} +{"train_loss": 0.0002815478073898703, "global_step": 62503, "epoch": 525, "lr": 3.834476857092534e-06} +{"train_loss": 0.0005082364077679813, "global_step": 62504, "epoch": 525, "lr": 3.833626026171933e-06} +{"train_loss": 0.00027113669784739614, "global_step": 62505, "epoch": 525, "lr": 3.832775285894086e-06} +{"train_loss": 0.0001815243886085227, "global_step": 62506, "epoch": 525, "lr": 3.831924636260642e-06} +{"train_loss": 0.001545117935165763, "global_step": 62507, "epoch": 525, "lr": 3.831074077273278e-06} +{"train_loss": 0.00034808661439456046, "global_step": 62508, "epoch": 525, "lr": 3.8302236089336805e-06} +{"train_loss": 0.0004063736414536834, "global_step": 62509, "epoch": 525, "lr": 3.829373231243505e-06} +{"train_loss": 0.000490016711410135, "global_step": 62510, "epoch": 525, "lr": 3.828522944204415e-06} +{"train_loss": 0.00031305846641771495, "global_step": 62511, "epoch": 525, "lr": 3.827672747818101e-06} +{"train_loss": 0.00034729024628177285, "global_step": 62512, "epoch": 525, "lr": 3.826822642086203e-06} +{"train_loss": 0.00018468812049832195, "global_step": 62513, "epoch": 525, "lr": 3.825972627010415e-06} +{"train_loss": 0.00028434430714696646, "global_step": 62514, "epoch": 525, "lr": 3.825122702592393e-06} +{"train_loss": 0.00022445074864663184, "global_step": 62515, "epoch": 525, "lr": 3.824272868833812e-06} +{"train_loss": 0.00022439900203607976, "global_step": 62516, "epoch": 525, "lr": 3.8234231257363414e-06} +{"train_loss": 0.0003275784256402403, "global_step": 62517, "epoch": 525, "lr": 3.822573473301638e-06} +{"train_loss": 0.0002303685323568061, "global_step": 62518, "epoch": 525, "lr": 3.821723911531389e-06} +{"train_loss": 0.0002712169080041349, "global_step": 62519, "epoch": 525, "lr": 3.8208744404272355e-06} +{"train_loss": 0.00034174221218563616, "global_step": 62520, "epoch": 525, "lr": 3.820025059990878e-06} +{"train_loss": 0.00045882188715040684, "global_step": 62521, "epoch": 525, "lr": 3.819175770223965e-06} +{"train_loss": 0.0003768599999602884, "global_step": 62522, "epoch": 525, "lr": 3.8183265711281555e-06} +{"train_loss": 0.0008122593862935901, "global_step": 62523, "epoch": 525, "lr": 3.817477462705138e-06} +{"train_loss": 0.0003880242584273219, "global_step": 62524, "epoch": 525, "lr": 3.816628444956566e-06} +{"train_loss": 0.0004291074874345213, "global_step": 62525, "epoch": 525, "lr": 3.81577951788411e-06} +{"train_loss": 0.00019827618962153792, "global_step": 62526, "epoch": 525, "lr": 3.814930681489437e-06} +{"train_loss": 0.00042118632700294256, "global_step": 62527, "epoch": 525, "lr": 3.8140819357742163e-06} +{"train_loss": 0.00023329630494117737, "global_step": 62528, "epoch": 525, "lr": 3.813233280740114e-06} +{"train_loss": 0.0002810561563819647, "global_step": 62529, "epoch": 525, "lr": 3.8123847163887836e-06} +{"train_loss": 0.0008250108803622425, "global_step": 62530, "epoch": 525, "lr": 3.811536242721908e-06} +{"train_loss": 0.00047526563866995275, "global_step": 62531, "epoch": 525, "lr": 3.810687859741141e-06} +{"train_loss": 0.00031703917193226516, "global_step": 62532, "epoch": 525, "lr": 3.8098395674481647e-06} +{"train_loss": 0.00032910695881582797, "global_step": 62533, "epoch": 525, "lr": 3.808991365844622e-06} +{"train_loss": 0.00035851047141477466, "global_step": 62534, "epoch": 525, "lr": 3.8081432549322004e-06} +{"train_loss": 0.00034269073512405157, "global_step": 62535, "epoch": 525, "lr": 3.8072952347125434e-06} +{"train_loss": 0.00022586902196053416, "global_step": 62536, "epoch": 525, "lr": 3.8064473051873383e-06} +{"train_loss": 0.0002829187433235347, "global_step": 62537, "epoch": 525, "lr": 3.8055994663582285e-06} +{"train_loss": 0.00028140764334239066, "global_step": 62538, "epoch": 525, "lr": 3.8047517182268955e-06} +{"train_loss": 0.00023772551503498107, "global_step": 62539, "epoch": 525, "lr": 3.803904060794994e-06} +{"train_loss": 0.00021959093282930553, "global_step": 62540, "epoch": 525, "lr": 3.8030564940641945e-06} +{"train_loss": 0.00026079468079842627, "global_step": 62541, "epoch": 525, "lr": 3.8022090180361515e-06} +{"train_loss": 0.0003243209794163704, "global_step": 62542, "epoch": 525, "lr": 3.801361632712547e-06} +{"train_loss": 0.0006284110131673515, "global_step": 62543, "epoch": 525, "lr": 3.8005143380950235e-06} +{"train_loss": 0.00042652367847040296, "global_step": 62544, "epoch": 525, "lr": 3.799667134185264e-06} +{"train_loss": 0.00024827508605085313, "global_step": 62545, "epoch": 525, "lr": 3.798820020984911e-06} +{"train_loss": 0.00022253603674471378, "global_step": 62546, "epoch": 525, "lr": 3.797972998495647e-06} +{"train_loss": 0.0005593231180682778, "global_step": 62547, "epoch": 525, "lr": 3.797126066719131e-06} +{"train_loss": 0.0002426602877676487, "global_step": 62548, "epoch": 525, "lr": 3.7962792256570124e-06} +{"train_loss": 0.00031859628506936133, "global_step": 62549, "epoch": 525, "lr": 3.7954324753109673e-06} +{"train_loss": 0.0006531390827149153, "global_step": 62550, "epoch": 525, "lr": 3.7945858156826496e-06} +{"train_loss": 0.0003736431826837361, "global_step": 62551, "epoch": 525, "lr": 3.7937392467737367e-06} +{"train_loss": 0.00028932717395946383, "global_step": 62552, "epoch": 525, "lr": 3.792892768585865e-06} +{"train_loss": 0.0005550088826566935, "global_step": 62553, "epoch": 525, "lr": 3.7920463811207283e-06} +{"train_loss": 0.00024796900106593966, "global_step": 62554, "epoch": 525, "lr": 3.79120008437997e-06} +{"train_loss": 0.00024512637173756957, "global_step": 62555, "epoch": 525, "lr": 3.7903538783652435e-06} +{"train_loss": 0.00026134680956602097, "global_step": 62556, "epoch": 525, "lr": 3.7895077630782262e-06} +{"train_loss": 0.00017205721815116704, "global_step": 62557, "epoch": 525, "lr": 3.788661738520566e-06} +{"train_loss": 0.00023565908486489207, "global_step": 62558, "epoch": 525, "lr": 3.787815804693945e-06} +{"train_loss": 0.00039309676503762603, "global_step": 62559, "epoch": 525, "lr": 3.7869699616000065e-06} +{"train_loss": 0.00048357536434195936, "global_step": 62560, "epoch": 525, "lr": 3.7861242092404105e-06} +{"train_loss": 0.0002446502912789583, "global_step": 62561, "epoch": 525, "lr": 3.7852785476168274e-06} +{"train_loss": 0.00022613847977481782, "global_step": 62562, "epoch": 525, "lr": 3.7844329767309063e-06} +{"train_loss": 0.00024649364058859646, "global_step": 62563, "epoch": 525, "lr": 3.7835874965843177e-06} +{"train_loss": 0.00039930868661031127, "global_step": 62564, "epoch": 525, "lr": 3.7827421071787106e-06} +{"train_loss": 0.0002036829973803833, "global_step": 62565, "epoch": 525, "lr": 3.7818968085157613e-06} +{"train_loss": 0.0002937423123512417, "global_step": 62566, "epoch": 525, "lr": 3.7810516005971242e-06} +{"train_loss": 0.00028570264112204313, "global_step": 62567, "epoch": 525, "lr": 3.780206483424442e-06} +{"train_loss": 0.0006115761352702975, "global_step": 62568, "epoch": 525, "lr": 3.7793614569993864e-06} +{"train_loss": 0.0003142241621389985, "global_step": 62569, "epoch": 525, "lr": 3.778516521323627e-06} +{"train_loss": 0.0004238972323946655, "global_step": 62570, "epoch": 525, "lr": 3.777671676398803e-06} +{"train_loss": 0.00038541649701073766, "global_step": 62571, "epoch": 525, "lr": 3.7768269222265894e-06} +{"train_loss": 0.0002500750415492803, "global_step": 62572, "epoch": 525, "lr": 3.7759822588086303e-06} +{"train_loss": 0.00031320806010626256, "global_step": 62573, "epoch": 525, "lr": 3.7751376861466013e-06} +{"train_loss": 0.0003321973781567067, "global_step": 62574, "epoch": 525, "lr": 3.774293204242141e-06} +{"train_loss": 0.00031071933335624635, "global_step": 62575, "epoch": 525, "lr": 3.773448813096925e-06} +{"train_loss": 0.0004398224991746247, "global_step": 62576, "epoch": 525, "lr": 3.7726045127125965e-06} +{"train_loss": 0.0003498407604638487, "global_step": 62577, "epoch": 525, "lr": 3.7717603030908266e-06} +{"train_loss": 0.0005797194316983223, "global_step": 62578, "epoch": 525, "lr": 3.7709161842332695e-06} +{"train_loss": 0.00019166887796018273, "global_step": 62579, "epoch": 525, "lr": 3.7700721561415743e-06} +{"train_loss": 0.0001984880364034325, "global_step": 62580, "epoch": 525, "lr": 3.7692282188174054e-06} +{"train_loss": 0.0005996499676257372, "global_step": 62581, "epoch": 525, "lr": 3.7683843722624123e-06} +{"train_loss": 0.00031387642957270145, "global_step": 62582, "epoch": 525, "lr": 3.7675406164782656e-06} +{"train_loss": 0.00035443183151073754, "global_step": 62583, "epoch": 525, "lr": 3.7666969514666084e-06} +{"train_loss": 0.0003289732267148793, "global_step": 62584, "epoch": 525, "lr": 3.765853377229106e-06} +{"train_loss": 0.0005105582531541586, "global_step": 62585, "epoch": 525, "lr": 3.765009893767413e-06} +{"train_loss": 0.0004462676588445902, "global_step": 62586, "epoch": 525, "lr": 3.764166501083177e-06} +{"train_loss": 0.00019456825975794345, "global_step": 62587, "epoch": 525, "lr": 3.763323199178065e-06} +{"train_loss": 0.00033960959990508854, "global_step": 62588, "epoch": 525, "lr": 3.762479988053724e-06} +{"train_loss": 0.0004189394530840218, "global_step": 62589, "epoch": 525, "lr": 3.7616368677118208e-06} +{"train_loss": 0.0003308770537842065, "global_step": 62590, "epoch": 525, "lr": 3.7607938381540032e-06} +{"train_loss": 0.0004942964296787977, "global_step": 62591, "epoch": 525, "lr": 3.75995089938192e-06} +{"train_loss": 0.0002181931777158752, "global_step": 62592, "epoch": 525, "lr": 3.7591080513972367e-06} +{"train_loss": 0.00035414938213785, "global_step": 62593, "epoch": 525, "lr": 3.7582652942016016e-06, "val_loss": 0.034253086894750595, "train_action_mse_error": 4.535367679636693e-06} +{"train_loss": 0.00034959460026584566, "global_step": 62594, "epoch": 526, "lr": 3.7574226277966805e-06} +{"train_loss": 0.00017695345741230994, "global_step": 62595, "epoch": 526, "lr": 3.756580052184111e-06} +{"train_loss": 0.00030165319913066924, "global_step": 62596, "epoch": 526, "lr": 3.7557375673655636e-06} +{"train_loss": 0.00021150370594114065, "global_step": 62597, "epoch": 526, "lr": 3.754895173342682e-06} +{"train_loss": 0.000271842407528311, "global_step": 62598, "epoch": 526, "lr": 3.7540528701171198e-06} +{"train_loss": 0.00025788811035454273, "global_step": 62599, "epoch": 526, "lr": 3.7532106576905368e-06} +{"train_loss": 0.0005129731143824756, "global_step": 62600, "epoch": 526, "lr": 3.752368536064582e-06} +{"train_loss": 0.0005264236824586987, "global_step": 62601, "epoch": 526, "lr": 3.7515265052409156e-06} +{"train_loss": 0.0002619641600176692, "global_step": 62602, "epoch": 526, "lr": 3.7506845652211795e-06} +{"train_loss": 0.00026444089598953724, "global_step": 62603, "epoch": 526, "lr": 3.749842716007029e-06} +{"train_loss": 0.0004977901699021459, "global_step": 62604, "epoch": 526, "lr": 3.749000957600135e-06} +{"train_loss": 0.00019583365065045655, "global_step": 62605, "epoch": 526, "lr": 3.7481592900021234e-06} +{"train_loss": 0.00013145308184903115, "global_step": 62606, "epoch": 526, "lr": 3.7473177132146706e-06} +{"train_loss": 0.0004741264565382153, "global_step": 62607, "epoch": 526, "lr": 3.7464762272394095e-06} +{"train_loss": 0.0004236216191202402, "global_step": 62608, "epoch": 526, "lr": 3.74563483207801e-06} +{"train_loss": 0.00025177892530336976, "global_step": 62609, "epoch": 526, "lr": 3.7447935277321156e-06} +{"train_loss": 0.0002896713267546147, "global_step": 62610, "epoch": 526, "lr": 3.743952314203364e-06} +{"train_loss": 0.0002484176366124302, "global_step": 62611, "epoch": 526, "lr": 3.7431111914934368e-06} +{"train_loss": 0.00014873890904709697, "global_step": 62612, "epoch": 526, "lr": 3.7422701596039557e-06} +{"train_loss": 0.0002564432506915182, "global_step": 62613, "epoch": 526, "lr": 3.7414292185365905e-06} +{"train_loss": 0.00030034041265025735, "global_step": 62614, "epoch": 526, "lr": 3.7405883682929853e-06} +{"train_loss": 0.0003007149789482355, "global_step": 62615, "epoch": 526, "lr": 3.739747608874794e-06} +{"train_loss": 0.00026631582295522094, "global_step": 62616, "epoch": 526, "lr": 3.7389069402836706e-06} +{"train_loss": 0.0003541774640325457, "global_step": 62617, "epoch": 526, "lr": 3.738066362521253e-06} +{"train_loss": 0.00024894948001019657, "global_step": 62618, "epoch": 526, "lr": 3.7372258755892066e-06} +{"train_loss": 0.00030185715877451, "global_step": 62619, "epoch": 526, "lr": 3.7363854794891686e-06} +{"train_loss": 0.00022554214228875935, "global_step": 62620, "epoch": 526, "lr": 3.7355451742228042e-06} +{"train_loss": 0.0003471653035376221, "global_step": 62621, "epoch": 526, "lr": 3.7347049597917406e-06} +{"train_loss": 0.00026444197283126414, "global_step": 62622, "epoch": 526, "lr": 3.7338648361976537e-06} +{"train_loss": 0.00018104385526385158, "global_step": 62623, "epoch": 526, "lr": 3.7330248034421812e-06} +{"train_loss": 0.00019073674047831446, "global_step": 62624, "epoch": 526, "lr": 3.7321848615269604e-06} +{"train_loss": 0.00022711169731337577, "global_step": 62625, "epoch": 526, "lr": 3.731345010453663e-06} +{"train_loss": 0.00032943286350928247, "global_step": 62626, "epoch": 526, "lr": 3.7305052502239147e-06} +{"train_loss": 0.00026778384926728904, "global_step": 62627, "epoch": 526, "lr": 3.7296655808393865e-06} +{"train_loss": 0.0003596534370444715, "global_step": 62628, "epoch": 526, "lr": 3.7288260023017164e-06} +{"train_loss": 0.00026743215858004987, "global_step": 62629, "epoch": 526, "lr": 3.7279865146125413e-06} +{"train_loss": 0.00034627190325409174, "global_step": 62630, "epoch": 526, "lr": 3.727147117773533e-06} +{"train_loss": 0.0003328734601382166, "global_step": 62631, "epoch": 526, "lr": 3.7263078117863226e-06} +{"train_loss": 0.0003810183552559465, "global_step": 62632, "epoch": 526, "lr": 3.725468596652565e-06} +{"train_loss": 0.00024848367320373654, "global_step": 62633, "epoch": 526, "lr": 3.724629472373903e-06} +{"train_loss": 0.00025464833015576005, "global_step": 62634, "epoch": 526, "lr": 3.7237904389519906e-06} +{"train_loss": 0.00032297411235049367, "global_step": 62635, "epoch": 526, "lr": 3.722951496388466e-06} +{"train_loss": 0.0005576092517003417, "global_step": 62636, "epoch": 526, "lr": 3.7221126446849943e-06} +{"train_loss": 0.0003372341161593795, "global_step": 62637, "epoch": 526, "lr": 3.721273883843196e-06} +{"train_loss": 0.00027759274234995246, "global_step": 62638, "epoch": 526, "lr": 3.7204352138647424e-06} +{"train_loss": 0.00021975042182020843, "global_step": 62639, "epoch": 526, "lr": 3.7195966347512655e-06} +{"train_loss": 0.00024308671709150076, "global_step": 62640, "epoch": 526, "lr": 3.71875814650442e-06} +{"train_loss": 0.0002991516375914216, "global_step": 62641, "epoch": 526, "lr": 3.7179197491258424e-06} +{"train_loss": 0.0003519502643030137, "global_step": 62642, "epoch": 526, "lr": 3.717081442617193e-06} +{"train_loss": 0.00036212330451235175, "global_step": 62643, "epoch": 526, "lr": 3.7162432269800984e-06} +{"train_loss": 0.0004068761190865189, "global_step": 62644, "epoch": 526, "lr": 3.7154051022162294e-06} +{"train_loss": 0.00047829755931161344, "global_step": 62645, "epoch": 526, "lr": 3.714567068327207e-06} +{"train_loss": 0.00036251830169931054, "global_step": 62646, "epoch": 526, "lr": 3.713729125314691e-06} +{"train_loss": 0.0002911393530666828, "global_step": 62647, "epoch": 526, "lr": 3.71289127318033e-06} +{"train_loss": 0.0001587699807714671, "global_step": 62648, "epoch": 526, "lr": 3.7120535119257503e-06} +{"train_loss": 0.00018654893210623413, "global_step": 62649, "epoch": 526, "lr": 3.7112158415526178e-06} +{"train_loss": 0.00037518044700846076, "global_step": 62650, "epoch": 526, "lr": 3.7103782620625583e-06} +{"train_loss": 0.00037128489930182695, "global_step": 62651, "epoch": 526, "lr": 3.709540773457232e-06} +{"train_loss": 0.0004777975264005363, "global_step": 62652, "epoch": 526, "lr": 3.7087033757382703e-06} +{"train_loss": 0.0004051717114634812, "global_step": 62653, "epoch": 526, "lr": 3.7078660689073343e-06} +{"train_loss": 0.0005203657201491296, "global_step": 62654, "epoch": 526, "lr": 3.7070288529660545e-06} +{"train_loss": 0.00038547051372006536, "global_step": 62655, "epoch": 526, "lr": 3.706191727916075e-06} +{"train_loss": 0.0002736712631303817, "global_step": 62656, "epoch": 526, "lr": 3.7053546937590444e-06} +{"train_loss": 0.00022326390899252146, "global_step": 62657, "epoch": 526, "lr": 3.7045177504966e-06} +{"train_loss": 0.00019957304175477475, "global_step": 62658, "epoch": 526, "lr": 3.7036808981303962e-06} +{"train_loss": 0.000482378585729748, "global_step": 62659, "epoch": 526, "lr": 3.7028441366620646e-06} +{"train_loss": 0.00018165554502047598, "global_step": 62660, "epoch": 526, "lr": 3.702007466093249e-06} +{"train_loss": 0.0005075514782220125, "global_step": 62661, "epoch": 526, "lr": 3.7011708864256034e-06} +{"train_loss": 0.0003563315258361399, "global_step": 62662, "epoch": 526, "lr": 3.700334397660754e-06} +{"train_loss": 0.0004173977649770677, "global_step": 62663, "epoch": 526, "lr": 3.699497999800361e-06} +{"train_loss": 0.0006759435636922717, "global_step": 62664, "epoch": 526, "lr": 3.698661692846045e-06} +{"train_loss": 0.0002932615752797574, "global_step": 62665, "epoch": 526, "lr": 3.6978254767994713e-06} +{"train_loss": 0.0001790829555829987, "global_step": 62666, "epoch": 526, "lr": 3.696989351662261e-06} +{"train_loss": 0.0002690760884433985, "global_step": 62667, "epoch": 526, "lr": 3.696153317436074e-06} +{"train_loss": 0.0004306138725951314, "global_step": 62668, "epoch": 526, "lr": 3.6953173741225366e-06} +{"train_loss": 0.00026671733940020204, "global_step": 62669, "epoch": 526, "lr": 3.694481521723303e-06} +{"train_loss": 0.0004703241866081953, "global_step": 62670, "epoch": 526, "lr": 3.6936457602399997e-06} +{"train_loss": 0.0002930297050625086, "global_step": 62671, "epoch": 526, "lr": 3.6928100896742866e-06} +{"train_loss": 0.000334857904817909, "global_step": 62672, "epoch": 526, "lr": 3.6919745100277793e-06} +{"train_loss": 0.0008249063394032419, "global_step": 62673, "epoch": 526, "lr": 3.6911390213021478e-06} +{"train_loss": 0.0002753818698693067, "global_step": 62674, "epoch": 526, "lr": 3.6903036234990085e-06} +{"train_loss": 0.00044048199197277427, "global_step": 62675, "epoch": 526, "lr": 3.689468316620015e-06} +{"train_loss": 0.00025535235181450844, "global_step": 62676, "epoch": 526, "lr": 3.688633100666794e-06} +{"train_loss": 0.00023186720500234514, "global_step": 62677, "epoch": 526, "lr": 3.6877979756410054e-06} +{"train_loss": 0.00022187030117493123, "global_step": 62678, "epoch": 526, "lr": 3.6869629415442807e-06} +{"train_loss": 0.00036793964682146907, "global_step": 62679, "epoch": 526, "lr": 3.6861279983782416e-06} +{"train_loss": 0.00022515549790114164, "global_step": 62680, "epoch": 526, "lr": 3.685293146144553e-06} +{"train_loss": 0.00036867408198304474, "global_step": 62681, "epoch": 526, "lr": 3.6844583848448356e-06} +{"train_loss": 0.0002843234105966985, "global_step": 62682, "epoch": 526, "lr": 3.6836237144807497e-06} +{"train_loss": 0.0005548022454604506, "global_step": 62683, "epoch": 526, "lr": 3.6827891350539045e-06} +{"train_loss": 0.0003588594263419509, "global_step": 62684, "epoch": 526, "lr": 3.681954646565966e-06} +{"train_loss": 0.0003716964565683156, "global_step": 62685, "epoch": 526, "lr": 3.6811202490185605e-06} +{"train_loss": 0.0003327281738165766, "global_step": 62686, "epoch": 526, "lr": 3.6802859424133197e-06} +{"train_loss": 0.0002562754671089351, "global_step": 62687, "epoch": 526, "lr": 3.6794517267518926e-06} +{"train_loss": 0.000563375186175108, "global_step": 62688, "epoch": 526, "lr": 3.6786176020359107e-06} +{"train_loss": 0.0001525921543361619, "global_step": 62689, "epoch": 526, "lr": 3.6777835682670236e-06} +{"train_loss": 0.00033376074861735106, "global_step": 62690, "epoch": 526, "lr": 3.676949625446846e-06} +{"train_loss": 0.0002788290730677545, "global_step": 62691, "epoch": 526, "lr": 3.676115773577038e-06} +{"train_loss": 0.00019918431644327939, "global_step": 62692, "epoch": 526, "lr": 3.6752820126592315e-06} +{"train_loss": 0.00035612023202702403, "global_step": 62693, "epoch": 526, "lr": 3.6744483426950525e-06} +{"train_loss": 0.0002741551725193858, "global_step": 62694, "epoch": 526, "lr": 3.673614763686145e-06} +{"train_loss": 0.00033411631011404097, "global_step": 62695, "epoch": 526, "lr": 3.672781275634146e-06} +{"train_loss": 0.0004339097940828651, "global_step": 62696, "epoch": 526, "lr": 3.6719478785406935e-06} +{"train_loss": 0.00023310424876399338, "global_step": 62697, "epoch": 526, "lr": 3.6711145724074248e-06} +{"train_loss": 0.00023692358809057623, "global_step": 62698, "epoch": 526, "lr": 3.6702813572359663e-06} +{"train_loss": 0.0002989009371958673, "global_step": 62699, "epoch": 526, "lr": 3.669448233027967e-06} +{"train_loss": 0.0005358716007322073, "global_step": 62700, "epoch": 526, "lr": 3.6686151997850527e-06} +{"train_loss": 0.0003206112014595419, "global_step": 62701, "epoch": 526, "lr": 3.667782257508856e-06} +{"train_loss": 0.0004412813577800989, "global_step": 62702, "epoch": 526, "lr": 3.6669494062010313e-06} +{"train_loss": 0.0002292766876053065, "global_step": 62703, "epoch": 526, "lr": 3.6661166458631936e-06} +{"train_loss": 0.00031415148987434804, "global_step": 62704, "epoch": 526, "lr": 3.6652839764969917e-06} +{"train_loss": 0.0007003181963227689, "global_step": 62705, "epoch": 526, "lr": 3.664451398104046e-06} +{"train_loss": 0.00023441600205842406, "global_step": 62706, "epoch": 526, "lr": 3.663618910686012e-06} +{"train_loss": 0.00036421738332137465, "global_step": 62707, "epoch": 526, "lr": 3.6627865142444985e-06} +{"train_loss": 0.00041221987339667976, "global_step": 62708, "epoch": 526, "lr": 3.6619542087811653e-06} +{"train_loss": 0.0003895115223713219, "global_step": 62709, "epoch": 526, "lr": 3.6611219942976338e-06} +{"train_loss": 0.000282802851870656, "global_step": 62710, "epoch": 526, "lr": 3.6602898707955247e-06} +{"train_loss": 0.00019023922504857183, "global_step": 62711, "epoch": 526, "lr": 3.6594578382765033e-06} +{"train_loss": 0.00032955710800607226, "global_step": 62712, "epoch": 526, "lr": 3.658625896742174e-06, "val_loss": 0.018524959683418274} +{"train_loss": 0.00038557095103897154, "global_step": 62713, "epoch": 527, "lr": 3.657794046194185e-06} +{"train_loss": 0.00031043143826536834, "global_step": 62714, "epoch": 527, "lr": 3.6569622866341635e-06} +{"train_loss": 0.0001936716871568933, "global_step": 62715, "epoch": 527, "lr": 3.6561306180637523e-06} +{"train_loss": 0.00029950105817988515, "global_step": 62716, "epoch": 527, "lr": 3.6552990404845777e-06} +{"train_loss": 0.00044258852722123265, "global_step": 62717, "epoch": 527, "lr": 3.6544675538982664e-06} +{"train_loss": 0.00042833134648390114, "global_step": 62718, "epoch": 527, "lr": 3.6536361583064617e-06} +{"train_loss": 0.00046150307753123343, "global_step": 62719, "epoch": 527, "lr": 3.652804853710784e-06} +{"train_loss": 0.0005230577080510557, "global_step": 62720, "epoch": 527, "lr": 3.6519736401128824e-06} +{"train_loss": 0.0003241430385969579, "global_step": 62721, "epoch": 527, "lr": 3.6511425175143667e-06} +{"train_loss": 0.0005322211654856801, "global_step": 62722, "epoch": 527, "lr": 3.6503114859168908e-06} +{"train_loss": 0.00024412729544565082, "global_step": 62723, "epoch": 527, "lr": 3.6494805453220813e-06} +{"train_loss": 0.00035234156530350447, "global_step": 62724, "epoch": 527, "lr": 3.6486496957315485e-06} +{"train_loss": 0.00020839292847085744, "global_step": 62725, "epoch": 527, "lr": 3.6478189371469573e-06} +{"train_loss": 0.0004795223940163851, "global_step": 62726, "epoch": 527, "lr": 3.6469882695699063e-06} +{"train_loss": 0.0001905479875858873, "global_step": 62727, "epoch": 527, "lr": 3.6461576930020503e-06} +{"train_loss": 0.00034986596438102424, "global_step": 62728, "epoch": 527, "lr": 3.645327207445015e-06} +{"train_loss": 0.0006331143085844815, "global_step": 62729, "epoch": 527, "lr": 3.6444968129004166e-06} +{"train_loss": 0.0002598011342342943, "global_step": 62730, "epoch": 527, "lr": 3.6436665093699085e-06} +{"train_loss": 0.00030230171978473663, "global_step": 62731, "epoch": 527, "lr": 3.6428362968550955e-06} +{"train_loss": 0.00044078848441131413, "global_step": 62732, "epoch": 527, "lr": 3.642006175357632e-06} +{"train_loss": 0.0006013095262460411, "global_step": 62733, "epoch": 527, "lr": 3.641176144879127e-06} +{"train_loss": 0.00043586446554400027, "global_step": 62734, "epoch": 527, "lr": 3.6403462054212302e-06} +{"train_loss": 0.0004296101978980005, "global_step": 62735, "epoch": 527, "lr": 3.6395163569855505e-06} +{"train_loss": 0.0002107352192979306, "global_step": 62736, "epoch": 527, "lr": 3.6386865995737316e-06} +{"train_loss": 0.00046055938582867384, "global_step": 62737, "epoch": 527, "lr": 3.637856933187406e-06} +{"train_loss": 0.00018645012460183352, "global_step": 62738, "epoch": 527, "lr": 3.6370273578281823e-06} +{"train_loss": 0.0004811316030099988, "global_step": 62739, "epoch": 527, "lr": 3.6361978734977155e-06} +{"train_loss": 0.000428685249062255, "global_step": 62740, "epoch": 527, "lr": 3.6353684801976094e-06} +{"train_loss": 0.0003092024417128414, "global_step": 62741, "epoch": 527, "lr": 3.6345391779295134e-06} +{"train_loss": 0.0005062103737145662, "global_step": 62742, "epoch": 527, "lr": 3.6337099666950426e-06} +{"train_loss": 0.00040001317393034697, "global_step": 62743, "epoch": 527, "lr": 3.632880846495823e-06} +{"train_loss": 0.00017558001854922622, "global_step": 62744, "epoch": 527, "lr": 3.6320518173334984e-06} +{"train_loss": 0.00030465854797512293, "global_step": 62745, "epoch": 527, "lr": 3.631222879209678e-06} +{"train_loss": 0.0002960116835311055, "global_step": 62746, "epoch": 527, "lr": 3.6303940321260054e-06} +{"train_loss": 0.000194686945178546, "global_step": 62747, "epoch": 527, "lr": 3.6295652760841017e-06} +{"train_loss": 0.00031006024801172316, "global_step": 62748, "epoch": 527, "lr": 3.6287366110855813e-06} +{"train_loss": 0.00046294991625472903, "global_step": 62749, "epoch": 527, "lr": 3.6279080371320883e-06} +{"train_loss": 0.0002509404148440808, "global_step": 62750, "epoch": 527, "lr": 3.6270795542252436e-06} +{"train_loss": 0.000333104602759704, "global_step": 62751, "epoch": 527, "lr": 3.6262511623666784e-06} +{"train_loss": 0.0003018424613401294, "global_step": 62752, "epoch": 527, "lr": 3.625422861558003e-06} +{"train_loss": 0.00023425318067893386, "global_step": 62753, "epoch": 527, "lr": 3.624594651800867e-06} +{"train_loss": 0.00044406906818039715, "global_step": 62754, "epoch": 527, "lr": 3.623766533096884e-06} +{"train_loss": 0.00023769293329678476, "global_step": 62755, "epoch": 527, "lr": 3.6229385054476763e-06} +{"train_loss": 0.00030240515479817986, "global_step": 62756, "epoch": 527, "lr": 3.622110568854875e-06} +{"train_loss": 0.00024260208010673523, "global_step": 62757, "epoch": 527, "lr": 3.621282723320102e-06} +{"train_loss": 0.0004056582401972264, "global_step": 62758, "epoch": 527, "lr": 3.620454968844994e-06} +{"train_loss": 0.00045803203829564154, "global_step": 62759, "epoch": 527, "lr": 3.6196273054311668e-06} +{"train_loss": 0.0002931538037955761, "global_step": 62760, "epoch": 527, "lr": 3.618799733080236e-06} +{"train_loss": 0.0003318158851470798, "global_step": 62761, "epoch": 527, "lr": 3.6179722517938496e-06} +{"train_loss": 0.0005222497275099158, "global_step": 62762, "epoch": 527, "lr": 3.617144861573607e-06} +{"train_loss": 0.00032229788484983146, "global_step": 62763, "epoch": 527, "lr": 3.6163175624211566e-06} +{"train_loss": 0.00046281301183626056, "global_step": 62764, "epoch": 527, "lr": 3.615490354338097e-06} +{"train_loss": 0.00022950852871872485, "global_step": 62765, "epoch": 527, "lr": 3.6146632373260825e-06} +{"train_loss": 0.00036410882603377104, "global_step": 62766, "epoch": 527, "lr": 3.6138362113867063e-06} +{"train_loss": 0.0002851468452718109, "global_step": 62767, "epoch": 527, "lr": 3.613009276521623e-06} +{"train_loss": 0.0005171304801478982, "global_step": 62768, "epoch": 527, "lr": 3.612182432732425e-06} +{"train_loss": 0.00040848104981705546, "global_step": 62769, "epoch": 527, "lr": 3.6113556800207616e-06} +{"train_loss": 0.00034965641680173576, "global_step": 62770, "epoch": 527, "lr": 3.6105290183882367e-06} +{"train_loss": 0.000277292710961774, "global_step": 62771, "epoch": 527, "lr": 3.6097024478364827e-06} +{"train_loss": 0.0004958543577231467, "global_step": 62772, "epoch": 527, "lr": 3.6088759683671315e-06} +{"train_loss": 0.00043719381210394204, "global_step": 62773, "epoch": 527, "lr": 3.6080495799817925e-06} +{"train_loss": 0.00024191447300836444, "global_step": 62774, "epoch": 527, "lr": 3.607223282682087e-06} +{"train_loss": 0.00028388574719429016, "global_step": 62775, "epoch": 527, "lr": 3.606397076469653e-06} +{"train_loss": 0.0002576562692411244, "global_step": 62776, "epoch": 527, "lr": 3.6055709613460886e-06} +{"train_loss": 0.00020560933626256883, "global_step": 62777, "epoch": 527, "lr": 3.604744937313037e-06} +{"train_loss": 0.00026731067919172347, "global_step": 62778, "epoch": 527, "lr": 3.6039190043721137e-06} +{"train_loss": 0.00033577761496417224, "global_step": 62779, "epoch": 527, "lr": 3.603093162524934e-06} +{"train_loss": 0.0002723510842770338, "global_step": 62780, "epoch": 527, "lr": 3.6022674117731304e-06} +{"train_loss": 0.00023617123952135444, "global_step": 62781, "epoch": 527, "lr": 3.6014417521183066e-06} +{"train_loss": 0.0005436234059743583, "global_step": 62782, "epoch": 527, "lr": 3.6006161835621057e-06} +{"train_loss": 0.00022425585484597832, "global_step": 62783, "epoch": 527, "lr": 3.5997907061061267e-06} +{"train_loss": 0.00045193370897322893, "global_step": 62784, "epoch": 527, "lr": 3.5989653197520122e-06} +{"train_loss": 0.00027772324392572045, "global_step": 62785, "epoch": 527, "lr": 3.598140024501373e-06} +{"train_loss": 0.0003243554965592921, "global_step": 62786, "epoch": 527, "lr": 3.597314820355818e-06} +{"train_loss": 0.00016759925347287208, "global_step": 62787, "epoch": 527, "lr": 3.5964897073169913e-06} +{"train_loss": 0.0006283613620325923, "global_step": 62788, "epoch": 527, "lr": 3.595664685386485e-06} +{"train_loss": 0.0002033511846093461, "global_step": 62789, "epoch": 527, "lr": 3.594839754565943e-06} +{"train_loss": 0.00022345519391819835, "global_step": 62790, "epoch": 527, "lr": 3.594014914856969e-06} +{"train_loss": 0.0004951341543346643, "global_step": 62791, "epoch": 527, "lr": 3.5931901662611956e-06} +{"train_loss": 0.00019139309006277472, "global_step": 62792, "epoch": 527, "lr": 3.5923655087802376e-06} +{"train_loss": 0.00028368152561597526, "global_step": 62793, "epoch": 527, "lr": 3.5915409424157055e-06} +{"train_loss": 0.00035429850686341524, "global_step": 62794, "epoch": 527, "lr": 3.5907164671692307e-06} +{"train_loss": 0.00023658230202272534, "global_step": 62795, "epoch": 527, "lr": 3.5898920830424176e-06} +{"train_loss": 0.0005816011689603329, "global_step": 62796, "epoch": 527, "lr": 3.5890677900368984e-06} +{"train_loss": 0.00021063793974462897, "global_step": 62797, "epoch": 527, "lr": 3.5882435881542887e-06} +{"train_loss": 0.00023408126435242593, "global_step": 62798, "epoch": 527, "lr": 3.587419477396198e-06} +{"train_loss": 0.00020820948702748865, "global_step": 62799, "epoch": 527, "lr": 3.586595457764247e-06} +{"train_loss": 0.0001436685270164162, "global_step": 62800, "epoch": 527, "lr": 3.585771529260068e-06} +{"train_loss": 0.0003695302875712514, "global_step": 62801, "epoch": 527, "lr": 3.5849476918852596e-06} +{"train_loss": 0.0002473707718309015, "global_step": 62802, "epoch": 527, "lr": 3.5841239456414543e-06} +{"train_loss": 0.00038617377867922187, "global_step": 62803, "epoch": 527, "lr": 3.583300290530256e-06} +{"train_loss": 0.00039948325138539076, "global_step": 62804, "epoch": 527, "lr": 3.5824767265532964e-06} +{"train_loss": 0.0004224226577207446, "global_step": 62805, "epoch": 527, "lr": 3.5816532537121803e-06} +{"train_loss": 0.0004217094974592328, "global_step": 62806, "epoch": 527, "lr": 3.5808298720085343e-06} +{"train_loss": 0.00044989713933318853, "global_step": 62807, "epoch": 527, "lr": 3.5800065814439622e-06} +{"train_loss": 0.00013540091458708048, "global_step": 62808, "epoch": 527, "lr": 3.579183382020096e-06} +{"train_loss": 0.00027989610680378973, "global_step": 62809, "epoch": 527, "lr": 3.5783602737385345e-06} +{"train_loss": 0.00028689359896816313, "global_step": 62810, "epoch": 527, "lr": 3.5775372566009103e-06} +{"train_loss": 0.0005611091037280858, "global_step": 62811, "epoch": 527, "lr": 3.5767143306088326e-06} +{"train_loss": 0.00030134638654999435, "global_step": 62812, "epoch": 527, "lr": 3.575891495763911e-06} +{"train_loss": 0.00045714378939010203, "global_step": 62813, "epoch": 527, "lr": 3.575068752067773e-06} +{"train_loss": 0.0003080056922044605, "global_step": 62814, "epoch": 527, "lr": 3.5742460995220163e-06} +{"train_loss": 0.0003999706532340497, "global_step": 62815, "epoch": 527, "lr": 3.5734235381282844e-06} +{"train_loss": 0.0006333532510325313, "global_step": 62816, "epoch": 527, "lr": 3.5726010678881704e-06} +{"train_loss": 0.0005578416748903692, "global_step": 62817, "epoch": 527, "lr": 3.5717786888032846e-06} +{"train_loss": 0.00023705593775957823, "global_step": 62818, "epoch": 527, "lr": 3.5709564008752582e-06} +{"train_loss": 0.00032160678529180586, "global_step": 62819, "epoch": 527, "lr": 3.570134204105696e-06} +{"train_loss": 0.0003383067378308624, "global_step": 62820, "epoch": 527, "lr": 3.5693120984962193e-06} +{"train_loss": 0.0003185480018146336, "global_step": 62821, "epoch": 527, "lr": 3.5684900840484315e-06} +{"train_loss": 0.0003432798548601568, "global_step": 62822, "epoch": 527, "lr": 3.5676681607639596e-06} +{"train_loss": 0.0005292703281156719, "global_step": 62823, "epoch": 527, "lr": 3.566846328644413e-06} +{"train_loss": 0.0002826887648552656, "global_step": 62824, "epoch": 527, "lr": 3.5660245876913912e-06} +{"train_loss": 0.00045614116243086755, "global_step": 62825, "epoch": 527, "lr": 3.5652029379065312e-06} +{"train_loss": 0.00042760162614285946, "global_step": 62826, "epoch": 527, "lr": 3.5643813792914204e-06} +{"train_loss": 0.0002483196440152824, "global_step": 62827, "epoch": 527, "lr": 3.5635599118477025e-06} +{"train_loss": 0.0001900882343761623, "global_step": 62828, "epoch": 527, "lr": 3.5627385355769704e-06} +{"train_loss": 0.00031451854738406837, "global_step": 62829, "epoch": 527, "lr": 3.5619172504808287e-06} +{"train_loss": 0.00018848299805540591, "global_step": 62830, "epoch": 527, "lr": 3.5610960565609143e-06} +{"train_loss": 0.0003473455800005712, "global_step": 62831, "epoch": 527, "lr": 3.560274953818815e-06, "val_loss": 0.03631792962551117} +{"train_loss": 0.000232199759921059, "global_step": 62832, "epoch": 528, "lr": 3.5594539422561635e-06} +{"train_loss": 0.0004739492724183947, "global_step": 62833, "epoch": 528, "lr": 3.558633021874552e-06} +{"train_loss": 0.00021233172446954995, "global_step": 62834, "epoch": 528, "lr": 3.557812192675608e-06} +{"train_loss": 0.00028994944295845926, "global_step": 62835, "epoch": 528, "lr": 3.5569914546609408e-06} +{"train_loss": 0.0003449464275036007, "global_step": 62836, "epoch": 528, "lr": 3.5561708078321544e-06} +{"train_loss": 0.0001758789730956778, "global_step": 62837, "epoch": 528, "lr": 3.5553502521908753e-06} +{"train_loss": 0.00027542567113414407, "global_step": 62838, "epoch": 528, "lr": 3.5545297877386917e-06} +{"train_loss": 0.0006770811160095036, "global_step": 62839, "epoch": 528, "lr": 3.5537094144772353e-06} +{"train_loss": 0.00024260733334813267, "global_step": 62840, "epoch": 528, "lr": 3.552889132408105e-06} +{"train_loss": 0.0006011424120515585, "global_step": 62841, "epoch": 528, "lr": 3.5520689415329156e-06} +{"train_loss": 0.0002994136593770236, "global_step": 62842, "epoch": 528, "lr": 3.551248841853283e-06} +{"train_loss": 0.0004175962822046131, "global_step": 62843, "epoch": 528, "lr": 3.5504288333708003e-06} +{"train_loss": 0.0003321030526421964, "global_step": 62844, "epoch": 528, "lr": 3.5496089160870936e-06} +{"train_loss": 0.00028537336038425565, "global_step": 62845, "epoch": 528, "lr": 3.5487890900037623e-06} +{"train_loss": 0.0002735668676905334, "global_step": 62846, "epoch": 528, "lr": 3.5479693551224323e-06} +{"train_loss": 0.00033399026142433286, "global_step": 62847, "epoch": 528, "lr": 3.5471497114446973e-06} +{"train_loss": 0.00026043297839351, "global_step": 62848, "epoch": 528, "lr": 3.546330158972161e-06} +{"train_loss": 0.0004886548267677426, "global_step": 62849, "epoch": 528, "lr": 3.5455106977064555e-06} +{"train_loss": 0.00017538890824653208, "global_step": 62850, "epoch": 528, "lr": 3.5446913276491687e-06} +{"train_loss": 0.0006033339304849505, "global_step": 62851, "epoch": 528, "lr": 3.5438720488019216e-06} +{"train_loss": 0.00017101441335398704, "global_step": 62852, "epoch": 528, "lr": 3.543052861166313e-06} +{"train_loss": 0.0001825488725444302, "global_step": 62853, "epoch": 528, "lr": 3.542233764743963e-06} +{"train_loss": 0.0001719874271657318, "global_step": 62854, "epoch": 528, "lr": 3.5414147595364767e-06} +{"train_loss": 0.0002056638040812686, "global_step": 62855, "epoch": 528, "lr": 3.5405958455454525e-06} +{"train_loss": 0.0001496441545896232, "global_step": 62856, "epoch": 528, "lr": 3.5397770227725113e-06} +{"train_loss": 0.00024815776851028204, "global_step": 62857, "epoch": 528, "lr": 3.538958291219241e-06} +{"train_loss": 0.00031953485449776053, "global_step": 62858, "epoch": 528, "lr": 3.538139650887279e-06} +{"train_loss": 0.0002029721363214776, "global_step": 62859, "epoch": 528, "lr": 3.5373211017782016e-06} +{"train_loss": 0.00022311614884529263, "global_step": 62860, "epoch": 528, "lr": 3.5365026438936412e-06} +{"train_loss": 0.00019770125800278038, "global_step": 62861, "epoch": 528, "lr": 3.5356842772351905e-06} +{"train_loss": 0.00047381804324686527, "global_step": 62862, "epoch": 528, "lr": 3.5348660018044543e-06} +{"train_loss": 0.00044228759361431, "global_step": 62863, "epoch": 528, "lr": 3.5340478176030532e-06} +{"train_loss": 0.00020347886311355978, "global_step": 62864, "epoch": 528, "lr": 3.533229724632581e-06} +{"train_loss": 0.00015228339179884642, "global_step": 62865, "epoch": 528, "lr": 3.5324117228946517e-06} +{"train_loss": 0.00041812381823547184, "global_step": 62866, "epoch": 528, "lr": 3.5315938123908597e-06} +{"train_loss": 0.00021056461264379323, "global_step": 62867, "epoch": 528, "lr": 3.530775993122826e-06} +{"train_loss": 0.00021037466649431735, "global_step": 62868, "epoch": 528, "lr": 3.5299582650921426e-06} +{"train_loss": 0.00039665575604885817, "global_step": 62869, "epoch": 528, "lr": 3.5291406283004204e-06} +{"train_loss": 0.0002643046318553388, "global_step": 62870, "epoch": 528, "lr": 3.528323082749274e-06} +{"train_loss": 0.0002063646534224972, "global_step": 62871, "epoch": 528, "lr": 3.5275056284402917e-06} +{"train_loss": 0.000248888653004542, "global_step": 62872, "epoch": 528, "lr": 3.5266882653751e-06} +{"train_loss": 0.00022398571309167892, "global_step": 62873, "epoch": 528, "lr": 3.5258709935552857e-06} +{"train_loss": 0.0002457723021507263, "global_step": 62874, "epoch": 528, "lr": 3.525053812982454e-06} +{"train_loss": 0.00018524804909247905, "global_step": 62875, "epoch": 528, "lr": 3.5242367236582195e-06} +{"train_loss": 0.0003820362617261708, "global_step": 62876, "epoch": 528, "lr": 3.5234197255841706e-06} +{"train_loss": 0.0002862986584659666, "global_step": 62877, "epoch": 528, "lr": 3.522602818761933e-06} +{"train_loss": 0.00018498764256946743, "global_step": 62878, "epoch": 528, "lr": 3.5217860031931007e-06} +{"train_loss": 0.00013735487300436944, "global_step": 62879, "epoch": 528, "lr": 3.520969278879266e-06} +{"train_loss": 0.000624440610408783, "global_step": 62880, "epoch": 528, "lr": 3.520152645822056e-06} +{"train_loss": 0.0002386691194260493, "global_step": 62881, "epoch": 528, "lr": 3.5193361040230465e-06} +{"train_loss": 0.0004287861520424485, "global_step": 62882, "epoch": 528, "lr": 3.518519653483865e-06} +{"train_loss": 0.0003782546555157751, "global_step": 62883, "epoch": 528, "lr": 3.517703294206093e-06} +{"train_loss": 0.00016759989375714213, "global_step": 62884, "epoch": 528, "lr": 3.5168870261913565e-06} +{"train_loss": 0.0004715091781690717, "global_step": 62885, "epoch": 528, "lr": 3.516070849441244e-06} +{"train_loss": 0.0002880588872358203, "global_step": 62886, "epoch": 528, "lr": 3.5152547639573543e-06} +{"train_loss": 0.00031681812833994627, "global_step": 62887, "epoch": 528, "lr": 3.5144387697413017e-06} +{"train_loss": 0.0002227489894721657, "global_step": 62888, "epoch": 528, "lr": 3.5136228667946802e-06} +{"train_loss": 0.00013326395128387958, "global_step": 62889, "epoch": 528, "lr": 3.512807055119094e-06} +{"train_loss": 0.00029422331135720015, "global_step": 62890, "epoch": 528, "lr": 3.5119913347161415e-06} +{"train_loss": 0.00047933589667081833, "global_step": 62891, "epoch": 528, "lr": 3.511175705587433e-06} +{"train_loss": 0.0005402668612077832, "global_step": 62892, "epoch": 528, "lr": 3.5103601677345664e-06} +{"train_loss": 0.00038200931157916784, "global_step": 62893, "epoch": 528, "lr": 3.5095447211591303e-06} +{"train_loss": 0.0007745370385237038, "global_step": 62894, "epoch": 528, "lr": 3.508729365862745e-06} +{"train_loss": 0.0003149361291434616, "global_step": 62895, "epoch": 528, "lr": 3.5079141018469983e-06} +{"train_loss": 0.0002194759581470862, "global_step": 62896, "epoch": 528, "lr": 3.5070989291135004e-06} +{"train_loss": 0.00022678376990370452, "global_step": 62897, "epoch": 528, "lr": 3.506283847663838e-06} +{"train_loss": 0.0006129263201728463, "global_step": 62898, "epoch": 528, "lr": 3.505468857499633e-06} +{"train_loss": 0.00025188756990246475, "global_step": 62899, "epoch": 528, "lr": 3.504653958622456e-06} +{"train_loss": 0.00041627147584222257, "global_step": 62900, "epoch": 528, "lr": 3.5038391510339385e-06} +{"train_loss": 0.0001715530815999955, "global_step": 62901, "epoch": 528, "lr": 3.503024434735658e-06} +{"train_loss": 0.000248784403083846, "global_step": 62902, "epoch": 528, "lr": 3.5022098097292234e-06} +{"train_loss": 0.00034214131301268935, "global_step": 62903, "epoch": 528, "lr": 3.501395276016228e-06} +{"train_loss": 0.0004073510062880814, "global_step": 62904, "epoch": 528, "lr": 3.5005808335982825e-06} +{"train_loss": 0.0005486240843310952, "global_step": 62905, "epoch": 528, "lr": 3.4997664824769737e-06} +{"train_loss": 0.00030648778192698956, "global_step": 62906, "epoch": 528, "lr": 3.498952222653912e-06} +{"train_loss": 0.00027224092627875507, "global_step": 62907, "epoch": 528, "lr": 3.4981380541306783e-06} +{"train_loss": 0.0004438920004758984, "global_step": 62908, "epoch": 528, "lr": 3.497323976908895e-06} +{"train_loss": 0.00032227393239736557, "global_step": 62909, "epoch": 528, "lr": 3.496509990990138e-06} +{"train_loss": 0.00029051018645986915, "global_step": 62910, "epoch": 528, "lr": 3.4956960963760276e-06} +{"train_loss": 0.0004706021281890571, "global_step": 62911, "epoch": 528, "lr": 3.494882293068147e-06} +{"train_loss": 0.0002833370817825198, "global_step": 62912, "epoch": 528, "lr": 3.494068581068083e-06} +{"train_loss": 0.00040072904084809124, "global_step": 62913, "epoch": 528, "lr": 3.493254960377462e-06} +{"train_loss": 0.0003356526722200215, "global_step": 62914, "epoch": 528, "lr": 3.492441430997856e-06} +{"train_loss": 0.0003691158490255475, "global_step": 62915, "epoch": 528, "lr": 3.491627992930879e-06} +{"train_loss": 0.00022627570433542132, "global_step": 62916, "epoch": 528, "lr": 3.4908146461781256e-06} +{"train_loss": 0.00034493469865992665, "global_step": 62917, "epoch": 528, "lr": 3.4900013907411765e-06} +{"train_loss": 0.0001352538529317826, "global_step": 62918, "epoch": 528, "lr": 3.4891882266216534e-06} +{"train_loss": 0.0003518291050568223, "global_step": 62919, "epoch": 528, "lr": 3.488375153821127e-06} +{"train_loss": 0.00023974452051334083, "global_step": 62920, "epoch": 528, "lr": 3.487562172341219e-06} +{"train_loss": 0.00018000115233007818, "global_step": 62921, "epoch": 528, "lr": 3.4867492821835044e-06} +{"train_loss": 0.00023101111582946032, "global_step": 62922, "epoch": 528, "lr": 3.4859364833495945e-06} +{"train_loss": 0.00036159378942102194, "global_step": 62923, "epoch": 528, "lr": 3.4851237758410815e-06} +{"train_loss": 0.0005963264266029, "global_step": 62924, "epoch": 528, "lr": 3.484311159659548e-06} +{"train_loss": 0.00034184689866378903, "global_step": 62925, "epoch": 528, "lr": 3.4834986348066143e-06} +{"train_loss": 0.00017430265143048018, "global_step": 62926, "epoch": 528, "lr": 3.4826862012838466e-06} +{"train_loss": 0.00017760794435162097, "global_step": 62927, "epoch": 528, "lr": 3.4818738590928655e-06} +{"train_loss": 0.0006371778436005116, "global_step": 62928, "epoch": 528, "lr": 3.481061608235248e-06} +{"train_loss": 0.0001982448884518817, "global_step": 62929, "epoch": 528, "lr": 3.4802494487126024e-06} +{"train_loss": 0.0003710227319970727, "global_step": 62930, "epoch": 528, "lr": 3.479437380526518e-06} +{"train_loss": 0.00019010140385944396, "global_step": 62931, "epoch": 528, "lr": 3.4786254036785813e-06} +{"train_loss": 0.000449726969236508, "global_step": 62932, "epoch": 528, "lr": 3.4778135181703918e-06} +{"train_loss": 0.0001922420779010281, "global_step": 62933, "epoch": 528, "lr": 3.4770017240035535e-06} +{"train_loss": 0.0003156334860250354, "global_step": 62934, "epoch": 528, "lr": 3.4761900211796485e-06} +{"train_loss": 0.00037144013913348317, "global_step": 62935, "epoch": 528, "lr": 3.475378409700275e-06} +{"train_loss": 0.00036648617242462933, "global_step": 62936, "epoch": 528, "lr": 3.4745668895670214e-06} +{"train_loss": 0.00020286129438318312, "global_step": 62937, "epoch": 528, "lr": 3.4737554607814915e-06} +{"train_loss": 0.0003378214605618268, "global_step": 62938, "epoch": 528, "lr": 3.4729441233452675e-06} +{"train_loss": 0.0003047438513021916, "global_step": 62939, "epoch": 528, "lr": 3.472132877259954e-06} +{"train_loss": 0.000531101948581636, "global_step": 62940, "epoch": 528, "lr": 3.4713217225271267e-06} +{"train_loss": 0.0005673315608873963, "global_step": 62941, "epoch": 528, "lr": 3.470510659148396e-06} +{"train_loss": 0.0003145446244161576, "global_step": 62942, "epoch": 528, "lr": 3.4696996871253497e-06} +{"train_loss": 0.00028324799495749176, "global_step": 62943, "epoch": 528, "lr": 3.4688888064595694e-06} +{"train_loss": 0.0002949486661236733, "global_step": 62944, "epoch": 528, "lr": 3.4680780171526596e-06} +{"train_loss": 0.00026702164905145764, "global_step": 62945, "epoch": 528, "lr": 3.467267319206202e-06} +{"train_loss": 0.00029607859323732555, "global_step": 62946, "epoch": 528, "lr": 3.466456712621796e-06} +{"train_loss": 0.00038821244379505515, "global_step": 62947, "epoch": 528, "lr": 3.4656461974010346e-06} +{"train_loss": 0.00037943379720672965, "global_step": 62948, "epoch": 528, "lr": 3.4648357735454993e-06} +{"train_loss": 0.0003990100813098252, "global_step": 62949, "epoch": 528, "lr": 3.4640254410567953e-06} +{"train_loss": 0.00032057354990745106, "global_step": 62950, "epoch": 528, "lr": 3.463215199936498e-06, "val_loss": 0.017630960792303085} +{"train_loss": 0.00024008206673897803, "global_step": 62951, "epoch": 529, "lr": 3.4624050501862126e-06} +{"train_loss": 0.00045437971130013466, "global_step": 62952, "epoch": 529, "lr": 3.4615949918075152e-06} +{"train_loss": 0.00021200760966166854, "global_step": 62953, "epoch": 529, "lr": 3.46078502480201e-06} +{"train_loss": 0.00032928481232374907, "global_step": 62954, "epoch": 529, "lr": 3.459975149171285e-06} +{"train_loss": 0.0005699289031326771, "global_step": 62955, "epoch": 529, "lr": 3.4591653649169165e-06} +{"train_loss": 0.0003870904038194567, "global_step": 62956, "epoch": 529, "lr": 3.458355672040514e-06} +{"train_loss": 0.000288741517579183, "global_step": 62957, "epoch": 529, "lr": 3.457546070543649e-06} +{"train_loss": 0.00022302378783933818, "global_step": 62958, "epoch": 529, "lr": 3.4567365604279256e-06} +{"train_loss": 0.0003861351578962058, "global_step": 62959, "epoch": 529, "lr": 3.45592714169492e-06} +{"train_loss": 0.0004328858631197363, "global_step": 62960, "epoch": 529, "lr": 3.4551178143462427e-06} +{"train_loss": 0.00023962042178027332, "global_step": 62961, "epoch": 529, "lr": 3.4543085783834638e-06} +{"train_loss": 0.00039060719427652657, "global_step": 62962, "epoch": 529, "lr": 3.4534994338081715e-06} +{"train_loss": 0.0003680689842440188, "global_step": 62963, "epoch": 529, "lr": 3.45269038062197e-06} +{"train_loss": 0.0002610381634440273, "global_step": 62964, "epoch": 529, "lr": 3.4518814188264247e-06} +{"train_loss": 0.0003242372185923159, "global_step": 62965, "epoch": 529, "lr": 3.451072548423151e-06} +{"train_loss": 0.0002858572988770902, "global_step": 62966, "epoch": 529, "lr": 3.4502637694137087e-06} +{"train_loss": 0.0003333012282382697, "global_step": 62967, "epoch": 529, "lr": 3.4494550817997073e-06} +{"train_loss": 0.0002628384972922504, "global_step": 62968, "epoch": 529, "lr": 3.4486464855827293e-06} +{"train_loss": 0.0003410358040127903, "global_step": 62969, "epoch": 529, "lr": 3.447837980764357e-06} +{"train_loss": 0.00029062939574941993, "global_step": 62970, "epoch": 529, "lr": 3.4470295673461883e-06} +{"train_loss": 0.00038675672840327024, "global_step": 62971, "epoch": 529, "lr": 3.446221245329795e-06} +{"train_loss": 0.0001453736622352153, "global_step": 62972, "epoch": 529, "lr": 3.4454130147167805e-06} +{"train_loss": 0.00027204951038584113, "global_step": 62973, "epoch": 529, "lr": 3.444604875508728e-06} +{"train_loss": 0.0007595902425237, "global_step": 62974, "epoch": 529, "lr": 3.4437968277072073e-06} +{"train_loss": 0.00017708497762214392, "global_step": 62975, "epoch": 529, "lr": 3.4429888713138294e-06} +{"train_loss": 0.0004745115293189883, "global_step": 62976, "epoch": 529, "lr": 3.4421810063301584e-06} +{"train_loss": 0.0002767518162727356, "global_step": 62977, "epoch": 529, "lr": 3.4413732327578e-06} +{"train_loss": 0.00025016808649525046, "global_step": 62978, "epoch": 529, "lr": 3.4405655505983236e-06} +{"train_loss": 0.0003223526291549206, "global_step": 62979, "epoch": 529, "lr": 3.439757959853329e-06} +{"train_loss": 0.0003285001730546355, "global_step": 62980, "epoch": 529, "lr": 3.4389504605243984e-06} +{"train_loss": 0.0003418375563342124, "global_step": 62981, "epoch": 529, "lr": 3.438143052613102e-06} +{"train_loss": 0.000255792576353997, "global_step": 62982, "epoch": 529, "lr": 3.4373357361210445e-06} +{"train_loss": 0.0003143422945868224, "global_step": 62983, "epoch": 529, "lr": 3.4365285110498024e-06} +{"train_loss": 0.0004334718978498131, "global_step": 62984, "epoch": 529, "lr": 3.4357213774009633e-06} +{"train_loss": 0.00033019535476341844, "global_step": 62985, "epoch": 529, "lr": 3.434914335176115e-06} +{"train_loss": 0.0003447413328103721, "global_step": 62986, "epoch": 529, "lr": 3.434107384376828e-06} +{"train_loss": 0.00037690726458095014, "global_step": 62987, "epoch": 529, "lr": 3.433300525004707e-06} +{"train_loss": 0.0002048273745458573, "global_step": 62988, "epoch": 529, "lr": 3.4324937570613115e-06} +{"train_loss": 0.00037301782867871225, "global_step": 62989, "epoch": 529, "lr": 3.4316870805482516e-06} +{"train_loss": 0.00020034854242112488, "global_step": 62990, "epoch": 529, "lr": 3.4308804954670926e-06} +{"train_loss": 0.00024771085008978844, "global_step": 62991, "epoch": 529, "lr": 3.4300740018194277e-06} +{"train_loss": 0.0003794002695940435, "global_step": 62992, "epoch": 529, "lr": 3.4292675996068447e-06} +{"train_loss": 0.000340331404004246, "global_step": 62993, "epoch": 529, "lr": 3.428461288830903e-06} +{"train_loss": 0.0003708232252392918, "global_step": 62994, "epoch": 529, "lr": 3.427655069493213e-06} +{"train_loss": 0.0003440453438088298, "global_step": 62995, "epoch": 529, "lr": 3.4268489415953396e-06} +{"train_loss": 0.00032140861731022596, "global_step": 62996, "epoch": 529, "lr": 3.426042905138882e-06} +{"train_loss": 0.00030937479459680617, "global_step": 62997, "epoch": 529, "lr": 3.4252369601254054e-06} +{"train_loss": 0.0006334990612231195, "global_step": 62998, "epoch": 529, "lr": 3.4244311065565084e-06} +{"train_loss": 0.00028953561559319496, "global_step": 62999, "epoch": 529, "lr": 3.4236253444337564e-06} +{"train_loss": 0.0008028558222576976, "global_step": 63000, "epoch": 529, "lr": 3.4228196737587427e-06} +{"train_loss": 0.00039599317824468017, "global_step": 63001, "epoch": 529, "lr": 3.422014094533044e-06} +{"train_loss": 0.00028451753314584494, "global_step": 63002, "epoch": 529, "lr": 3.421208606758247e-06} +{"train_loss": 0.00033188232919201255, "global_step": 63003, "epoch": 529, "lr": 3.420403210435935e-06} +{"train_loss": 0.00025445190840400755, "global_step": 63004, "epoch": 529, "lr": 3.419597905567684e-06} +{"train_loss": 0.0006545834476128221, "global_step": 63005, "epoch": 529, "lr": 3.4187926921550705e-06} +{"train_loss": 0.0003522737242747098, "global_step": 63006, "epoch": 529, "lr": 3.4179875701996877e-06} +{"train_loss": 0.00023353933647740632, "global_step": 63007, "epoch": 529, "lr": 3.417182539703101e-06} +{"train_loss": 0.00028649671003222466, "global_step": 63008, "epoch": 529, "lr": 3.416377600666909e-06} +{"train_loss": 0.0003724017005879432, "global_step": 63009, "epoch": 529, "lr": 3.4155727530926774e-06} +{"train_loss": 0.00020426725677680224, "global_step": 63010, "epoch": 529, "lr": 3.4147679969819935e-06} +{"train_loss": 0.0002795819891616702, "global_step": 63011, "epoch": 529, "lr": 3.4139633323364396e-06} +{"train_loss": 0.000226695163291879, "global_step": 63012, "epoch": 529, "lr": 3.4131587591575865e-06} +{"train_loss": 0.00036836316576227546, "global_step": 63013, "epoch": 529, "lr": 3.412354277447022e-06} +{"train_loss": 0.0001694606035016477, "global_step": 63014, "epoch": 529, "lr": 3.4115498872063166e-06} +{"train_loss": 0.000604204076807946, "global_step": 63015, "epoch": 529, "lr": 3.4107455884370643e-06} +{"train_loss": 0.0002842718386091292, "global_step": 63016, "epoch": 529, "lr": 3.4099413811408356e-06} +{"train_loss": 0.0005816059419885278, "global_step": 63017, "epoch": 529, "lr": 3.409137265319201e-06} +{"train_loss": 0.0006332931807264686, "global_step": 63018, "epoch": 529, "lr": 3.4083332409737545e-06} +{"train_loss": 0.00018830425688065588, "global_step": 63019, "epoch": 529, "lr": 3.4075293081060667e-06} +{"train_loss": 0.0003684751281980425, "global_step": 63020, "epoch": 529, "lr": 3.4067254667177196e-06} +{"train_loss": 0.0004211563500575721, "global_step": 63021, "epoch": 529, "lr": 3.4059217168102788e-06} +{"train_loss": 0.000397006660932675, "global_step": 63022, "epoch": 529, "lr": 3.405118058385348e-06} +{"train_loss": 0.00029431862640194595, "global_step": 63023, "epoch": 529, "lr": 3.4043144914444826e-06} +{"train_loss": 0.00019296343089081347, "global_step": 63024, "epoch": 529, "lr": 3.4035110159892637e-06} +{"train_loss": 0.00019769843493122607, "global_step": 63025, "epoch": 529, "lr": 3.402707632021285e-06} +{"train_loss": 0.00031937408493831754, "global_step": 63026, "epoch": 529, "lr": 3.4019043395420945e-06} +{"train_loss": 0.0003891953092534095, "global_step": 63027, "epoch": 529, "lr": 3.401101138553303e-06} +{"train_loss": 0.0003667361452244222, "global_step": 63028, "epoch": 529, "lr": 3.400298029056459e-06} +{"train_loss": 0.00025531111168675125, "global_step": 63029, "epoch": 529, "lr": 3.399495011053161e-06} +{"train_loss": 0.0001716508559184149, "global_step": 63030, "epoch": 529, "lr": 3.398692084544963e-06} +{"train_loss": 0.0005220022867433727, "global_step": 63031, "epoch": 529, "lr": 3.3978892495334702e-06} +{"train_loss": 0.0002862908586394042, "global_step": 63032, "epoch": 529, "lr": 3.3970865060202306e-06} +{"train_loss": 0.0002855638740584254, "global_step": 63033, "epoch": 529, "lr": 3.3962838540068378e-06} +{"train_loss": 0.00016757358389440924, "global_step": 63034, "epoch": 529, "lr": 3.395481293494862e-06} +{"train_loss": 0.00032697751885280013, "global_step": 63035, "epoch": 529, "lr": 3.3946788244858807e-06} +{"train_loss": 0.0002547210024204105, "global_step": 63036, "epoch": 529, "lr": 3.3938764469814644e-06} +{"train_loss": 0.0003182891523465514, "global_step": 63037, "epoch": 529, "lr": 3.3930741609832007e-06} +{"train_loss": 0.00031555938767269254, "global_step": 63038, "epoch": 529, "lr": 3.3922719664926495e-06} +{"train_loss": 0.00017672096146270633, "global_step": 63039, "epoch": 529, "lr": 3.3914698635113984e-06} +{"train_loss": 0.00029016859480179846, "global_step": 63040, "epoch": 529, "lr": 3.3906678520410128e-06} +{"train_loss": 0.0003257484931964427, "global_step": 63041, "epoch": 529, "lr": 3.389865932083075e-06} +{"train_loss": 0.00038502237293869257, "global_step": 63042, "epoch": 529, "lr": 3.3890641036391556e-06} +{"train_loss": 0.00037312268977984786, "global_step": 63043, "epoch": 529, "lr": 3.388262366710826e-06} +{"train_loss": 0.00016903340292628855, "global_step": 63044, "epoch": 529, "lr": 3.387460721299668e-06} +{"train_loss": 0.0005027109873481095, "global_step": 63045, "epoch": 529, "lr": 3.386659167407241e-06} +{"train_loss": 0.0004593298363033682, "global_step": 63046, "epoch": 529, "lr": 3.3858577050351394e-06} +{"train_loss": 0.0002283219073433429, "global_step": 63047, "epoch": 529, "lr": 3.385056334184922e-06} +{"train_loss": 0.00020111125195398927, "global_step": 63048, "epoch": 529, "lr": 3.3842550548581707e-06} +{"train_loss": 0.0003803541185334325, "global_step": 63049, "epoch": 529, "lr": 3.383453867056452e-06} +{"train_loss": 0.0005095212254673243, "global_step": 63050, "epoch": 529, "lr": 3.382652770781336e-06} +{"train_loss": 0.0004768774379044771, "global_step": 63051, "epoch": 529, "lr": 3.3818517660344106e-06} +{"train_loss": 0.0001604102726560086, "global_step": 63052, "epoch": 529, "lr": 3.3810508528172247e-06} +{"train_loss": 0.00033413467463105917, "global_step": 63053, "epoch": 529, "lr": 3.3802500311313767e-06} +{"train_loss": 0.0003077167202718556, "global_step": 63054, "epoch": 529, "lr": 3.3794493009784322e-06} +{"train_loss": 0.0005670854006893933, "global_step": 63055, "epoch": 529, "lr": 3.3786486623599457e-06} +{"train_loss": 0.0003402011643629521, "global_step": 63056, "epoch": 529, "lr": 3.37784811527751e-06} +{"train_loss": 0.00023077234800439328, "global_step": 63057, "epoch": 529, "lr": 3.3770476597326795e-06} +{"train_loss": 0.00017430041043553501, "global_step": 63058, "epoch": 529, "lr": 3.376247295727042e-06} +{"train_loss": 0.00037158248596824706, "global_step": 63059, "epoch": 529, "lr": 3.375447023262157e-06} +{"train_loss": 0.0003345418081153184, "global_step": 63060, "epoch": 529, "lr": 3.374646842339607e-06} +{"train_loss": 0.0002867303555831313, "global_step": 63061, "epoch": 529, "lr": 3.3738467529609576e-06} +{"train_loss": 0.0002445541904307902, "global_step": 63062, "epoch": 529, "lr": 3.3730467551277733e-06} +{"train_loss": 0.00022700373665429652, "global_step": 63063, "epoch": 529, "lr": 3.3722468488416257e-06} +{"train_loss": 0.00021057443518657237, "global_step": 63064, "epoch": 529, "lr": 3.3714470341041026e-06} +{"train_loss": 0.0002477440284565091, "global_step": 63065, "epoch": 529, "lr": 3.370647310916747e-06} +{"train_loss": 0.0002674363204278052, "global_step": 63066, "epoch": 529, "lr": 3.369847679281157e-06} +{"train_loss": 0.00027213164139539003, "global_step": 63067, "epoch": 529, "lr": 3.3690481391988826e-06} +{"train_loss": 0.0006571906269527972, "global_step": 63068, "epoch": 529, "lr": 3.368248690671505e-06} +{"train_loss": 0.00033731705424994103, "global_step": 63069, "epoch": 529, "lr": 3.367449333700584e-06, "val_loss": 0.07105842232704163} +{"train_loss": 0.0005456228973343968, "global_step": 63070, "epoch": 530, "lr": 3.366650068287697e-06} +{"train_loss": 0.00019490225531626493, "global_step": 63071, "epoch": 530, "lr": 3.3658508944344083e-06} +{"train_loss": 0.00025677960366010666, "global_step": 63072, "epoch": 530, "lr": 3.3650518121422946e-06} +{"train_loss": 0.0005493165808729827, "global_step": 63073, "epoch": 530, "lr": 3.364252821412922e-06} +{"train_loss": 0.0002817551721818745, "global_step": 63074, "epoch": 530, "lr": 3.3634539222478444e-06} +{"train_loss": 0.00022997987980488688, "global_step": 63075, "epoch": 530, "lr": 3.3626551146486553e-06} +{"train_loss": 0.0003350717597641051, "global_step": 63076, "epoch": 530, "lr": 3.361856398616897e-06} +{"train_loss": 0.00025590285076759756, "global_step": 63077, "epoch": 530, "lr": 3.3610577741541636e-06} +{"train_loss": 0.0004325473273638636, "global_step": 63078, "epoch": 530, "lr": 3.3602592412619984e-06} +{"train_loss": 0.00021288904827088118, "global_step": 63079, "epoch": 530, "lr": 3.3594607999419938e-06} +{"train_loss": 0.00026800521300174296, "global_step": 63080, "epoch": 530, "lr": 3.358662450195704e-06} +{"train_loss": 0.00025349640054628253, "global_step": 63081, "epoch": 530, "lr": 3.35786419202469e-06} +{"train_loss": 0.0003789504698943347, "global_step": 63082, "epoch": 530, "lr": 3.357066025430533e-06} +{"train_loss": 0.0005506820161826909, "global_step": 63083, "epoch": 530, "lr": 3.3562679504147877e-06} +{"train_loss": 0.000313891185214743, "global_step": 63084, "epoch": 530, "lr": 3.3554699669790303e-06} +{"train_loss": 0.00019955656898673624, "global_step": 63085, "epoch": 530, "lr": 3.3546720751248318e-06} +{"train_loss": 0.000324070657370612, "global_step": 63086, "epoch": 530, "lr": 3.3538742748537354e-06} +{"train_loss": 0.00036857897066511214, "global_step": 63087, "epoch": 530, "lr": 3.3530765661673403e-06} +{"train_loss": 0.0001919329515658319, "global_step": 63088, "epoch": 530, "lr": 3.3522789490671835e-06} +{"train_loss": 0.0002503347350284457, "global_step": 63089, "epoch": 530, "lr": 3.3514814235548473e-06} +{"train_loss": 0.00023992787464521825, "global_step": 63090, "epoch": 530, "lr": 3.350683989631892e-06} +{"train_loss": 0.00041579976095817983, "global_step": 63091, "epoch": 530, "lr": 3.349886647299888e-06} +{"train_loss": 0.00026707665529102087, "global_step": 63092, "epoch": 530, "lr": 3.3490893965604007e-06} +{"train_loss": 0.00026661489391699433, "global_step": 63093, "epoch": 530, "lr": 3.348292237414985e-06} +{"train_loss": 0.0002433579065836966, "global_step": 63094, "epoch": 530, "lr": 3.3474951698652224e-06} +{"train_loss": 0.0005272843409329653, "global_step": 63095, "epoch": 530, "lr": 3.346698193912656e-06} +{"train_loss": 0.00021939299767836928, "global_step": 63096, "epoch": 530, "lr": 3.3459013095588745e-06} +{"train_loss": 0.00032094819471240044, "global_step": 63097, "epoch": 530, "lr": 3.3451045168054252e-06} +{"train_loss": 0.00023840258654672652, "global_step": 63098, "epoch": 530, "lr": 3.3443078156538853e-06} +{"train_loss": 0.0003139389446005225, "global_step": 63099, "epoch": 530, "lr": 3.3435112061058038e-06} +{"train_loss": 0.0001537978823762387, "global_step": 63100, "epoch": 530, "lr": 3.342714688162757e-06} +{"train_loss": 0.00037307041930034757, "global_step": 63101, "epoch": 530, "lr": 3.34191826182631e-06} +{"train_loss": 0.00021392230701167136, "global_step": 63102, "epoch": 530, "lr": 3.341121927098012e-06} +{"train_loss": 0.0003147423849441111, "global_step": 63103, "epoch": 530, "lr": 3.340325683979445e-06} +{"train_loss": 0.00021740309603046626, "global_step": 63104, "epoch": 530, "lr": 3.3395295324721687e-06} +{"train_loss": 0.0010485452366992831, "global_step": 63105, "epoch": 530, "lr": 3.3387334725777262e-06} +{"train_loss": 0.00015236128820106387, "global_step": 63106, "epoch": 530, "lr": 3.3379375042977113e-06} +{"train_loss": 0.00025109396665357053, "global_step": 63107, "epoch": 530, "lr": 3.3371416276336553e-06} +{"train_loss": 0.000460269016912207, "global_step": 63108, "epoch": 530, "lr": 3.336345842587152e-06} +{"train_loss": 0.0002904000284615904, "global_step": 63109, "epoch": 530, "lr": 3.335550149159733e-06} +{"train_loss": 0.00035302407923154533, "global_step": 63110, "epoch": 530, "lr": 3.3347545473529864e-06} +{"train_loss": 0.00024170230608433485, "global_step": 63111, "epoch": 530, "lr": 3.333959037168466e-06} +{"train_loss": 0.0002696781884878874, "global_step": 63112, "epoch": 530, "lr": 3.333163618607721e-06} +{"train_loss": 0.0005620291922241449, "global_step": 63113, "epoch": 530, "lr": 3.332368291672333e-06} +{"train_loss": 0.0001875671005109325, "global_step": 63114, "epoch": 530, "lr": 3.331573056363846e-06} +{"train_loss": 0.0008141350117512047, "global_step": 63115, "epoch": 530, "lr": 3.3307779126838413e-06} +{"train_loss": 0.00041055295150727034, "global_step": 63116, "epoch": 530, "lr": 3.3299828606338567e-06} +{"train_loss": 0.0003926978388335556, "global_step": 63117, "epoch": 530, "lr": 3.329187900215469e-06} +{"train_loss": 0.0005784195964224637, "global_step": 63118, "epoch": 530, "lr": 3.328393031430238e-06} +{"train_loss": 0.0002429129381198436, "global_step": 63119, "epoch": 530, "lr": 3.3275982542797177e-06} +{"train_loss": 0.00033441049163229764, "global_step": 63120, "epoch": 530, "lr": 3.326803568765474e-06} +{"train_loss": 0.0003240028745494783, "global_step": 63121, "epoch": 530, "lr": 3.326008974889061e-06} +{"train_loss": 0.000358874473022297, "global_step": 63122, "epoch": 530, "lr": 3.3252144726520497e-06} +{"train_loss": 0.00048372315359301865, "global_step": 63123, "epoch": 530, "lr": 3.3244200620559885e-06} +{"train_loss": 0.00021524740441236645, "global_step": 63124, "epoch": 530, "lr": 3.3236257431024433e-06} +{"train_loss": 0.0002811641898006201, "global_step": 63125, "epoch": 530, "lr": 3.3228315157929735e-06} +{"train_loss": 0.00019593254546634853, "global_step": 63126, "epoch": 530, "lr": 3.3220373801291283e-06} +{"train_loss": 0.00041170226177200675, "global_step": 63127, "epoch": 530, "lr": 3.3212433361124895e-06} +{"train_loss": 0.00024975609267130494, "global_step": 63128, "epoch": 530, "lr": 3.3204493837445895e-06} +{"train_loss": 0.0005364110111258924, "global_step": 63129, "epoch": 530, "lr": 3.31965552302701e-06} +{"train_loss": 0.0005650036036968231, "global_step": 63130, "epoch": 530, "lr": 3.3188617539612945e-06} +{"train_loss": 0.00029406286193989217, "global_step": 63131, "epoch": 530, "lr": 3.3180680765490136e-06} +{"train_loss": 0.00025749695487320423, "global_step": 63132, "epoch": 530, "lr": 3.317274490791705e-06} +{"train_loss": 0.0003285020065959543, "global_step": 63133, "epoch": 530, "lr": 3.316480996690957e-06} +{"train_loss": 0.00030483139562420547, "global_step": 63134, "epoch": 530, "lr": 3.315687594248296e-06} +{"train_loss": 0.0002821207162924111, "global_step": 63135, "epoch": 530, "lr": 3.3148942834653086e-06} +{"train_loss": 0.0005714299040846527, "global_step": 63136, "epoch": 530, "lr": 3.3141010643435276e-06} +{"train_loss": 0.0005871282774023712, "global_step": 63137, "epoch": 530, "lr": 3.31330793688453e-06} +{"train_loss": 0.0004290523356758058, "global_step": 63138, "epoch": 530, "lr": 3.312514901089858e-06} +{"train_loss": 0.00023473205510526896, "global_step": 63139, "epoch": 530, "lr": 3.3117219569610834e-06} +{"train_loss": 0.00027898681582883, "global_step": 63140, "epoch": 530, "lr": 3.3109291044997436e-06} +{"train_loss": 0.0003136381274089217, "global_step": 63141, "epoch": 530, "lr": 3.310136343707415e-06} +{"train_loss": 0.00019968200649600476, "global_step": 63142, "epoch": 530, "lr": 3.3093436745856467e-06} +{"train_loss": 0.00034590988070704043, "global_step": 63143, "epoch": 530, "lr": 3.308551097135987e-06} +{"train_loss": 0.0003547580272424966, "global_step": 63144, "epoch": 530, "lr": 3.3077586113600066e-06} +{"train_loss": 0.0006324111018329859, "global_step": 63145, "epoch": 530, "lr": 3.306966217259244e-06} +{"train_loss": 0.0008101971470750868, "global_step": 63146, "epoch": 530, "lr": 3.3061739148352755e-06} +{"train_loss": 0.00031742072314955294, "global_step": 63147, "epoch": 530, "lr": 3.3053817040896384e-06} +{"train_loss": 0.0005730187403969467, "global_step": 63148, "epoch": 530, "lr": 3.304589585023904e-06} +{"train_loss": 0.0003853927773889154, "global_step": 63149, "epoch": 530, "lr": 3.3037975576396153e-06} +{"train_loss": 0.0007756987470202148, "global_step": 63150, "epoch": 530, "lr": 3.3030056219383265e-06} +{"train_loss": 0.0002598277060315013, "global_step": 63151, "epoch": 530, "lr": 3.3022137779216034e-06} +{"train_loss": 0.00021523360919672996, "global_step": 63152, "epoch": 530, "lr": 3.301422025590989e-06} +{"train_loss": 0.0007157155778259039, "global_step": 63153, "epoch": 530, "lr": 3.3006303649480486e-06} +{"train_loss": 0.0005661816685460508, "global_step": 63154, "epoch": 530, "lr": 3.299838795994331e-06} +{"train_loss": 0.00024352100444957614, "global_step": 63155, "epoch": 530, "lr": 3.2990473187313854e-06} +{"train_loss": 0.0002510178601369262, "global_step": 63156, "epoch": 530, "lr": 3.2982559331607766e-06} +{"train_loss": 0.0004896807949990034, "global_step": 63157, "epoch": 530, "lr": 3.297464639284048e-06} +{"train_loss": 0.00014244834892451763, "global_step": 63158, "epoch": 530, "lr": 3.2966734371027652e-06} +{"train_loss": 0.0005478247767314315, "global_step": 63159, "epoch": 530, "lr": 3.295882326618466e-06} +{"train_loss": 0.0007165715796872973, "global_step": 63160, "epoch": 530, "lr": 3.2950913078327206e-06} +{"train_loss": 0.00019814263214357197, "global_step": 63161, "epoch": 530, "lr": 3.2943003807470674e-06} +{"train_loss": 0.00029156458913348615, "global_step": 63162, "epoch": 530, "lr": 3.2935095453630715e-06} +{"train_loss": 0.00019463255011942238, "global_step": 63163, "epoch": 530, "lr": 3.292718801682271e-06} +{"train_loss": 0.00029858946800231934, "global_step": 63164, "epoch": 530, "lr": 3.291928149706236e-06} +{"train_loss": 0.00026803213404491544, "global_step": 63165, "epoch": 530, "lr": 3.2911375894364994e-06} +{"train_loss": 0.00026906863786280155, "global_step": 63166, "epoch": 530, "lr": 3.2903471208746372e-06} +{"train_loss": 0.00021901342552155256, "global_step": 63167, "epoch": 530, "lr": 3.289556744022176e-06} +{"train_loss": 0.00028335824026726186, "global_step": 63168, "epoch": 530, "lr": 3.288766458880693e-06} +{"train_loss": 0.0002478207170497626, "global_step": 63169, "epoch": 530, "lr": 3.2879762654517145e-06} +{"train_loss": 0.00027512983069755137, "global_step": 63170, "epoch": 530, "lr": 3.2871861637368106e-06} +{"train_loss": 0.0002694893046282232, "global_step": 63171, "epoch": 530, "lr": 3.28639615373752e-06} +{"train_loss": 0.00028057172312401235, "global_step": 63172, "epoch": 530, "lr": 3.2856062354554075e-06} +{"train_loss": 0.00033147286740131676, "global_step": 63173, "epoch": 530, "lr": 3.284816408892022e-06} +{"train_loss": 0.0003821914142463356, "global_step": 63174, "epoch": 530, "lr": 3.2840266740488956e-06} +{"train_loss": 0.0002527264005038887, "global_step": 63175, "epoch": 530, "lr": 3.2832370309275994e-06} +{"train_loss": 0.00020073096675332636, "global_step": 63176, "epoch": 530, "lr": 3.282447479529671e-06} +{"train_loss": 0.00030849495669826865, "global_step": 63177, "epoch": 530, "lr": 3.2816580198566706e-06} +{"train_loss": 0.00019151349260937423, "global_step": 63178, "epoch": 530, "lr": 3.280868651910135e-06} +{"train_loss": 0.00018689480202738196, "global_step": 63179, "epoch": 530, "lr": 3.280079375691636e-06} +{"train_loss": 0.0002001789544010535, "global_step": 63180, "epoch": 530, "lr": 3.2792901912027053e-06} +{"train_loss": 0.000245338975219056, "global_step": 63181, "epoch": 530, "lr": 3.2785010984448918e-06} +{"train_loss": 0.00035627876059152186, "global_step": 63182, "epoch": 530, "lr": 3.277712097419755e-06} +{"train_loss": 0.0002589692594483495, "global_step": 63183, "epoch": 530, "lr": 3.276923188128833e-06} +{"train_loss": 0.0008058376843109727, "global_step": 63184, "epoch": 530, "lr": 3.2761343705736914e-06} +{"train_loss": 0.0002476824156474322, "global_step": 63185, "epoch": 530, "lr": 3.275345644755862e-06} +{"train_loss": 0.0008554898668080568, "global_step": 63186, "epoch": 530, "lr": 3.2745570106768984e-06} +{"train_loss": 0.00029114261269569397, "global_step": 63187, "epoch": 530, "lr": 3.2737684683383506e-06} +{"train_loss": 0.0003509744237511646, "global_step": 63188, "epoch": 530, "lr": 3.2729800177417612e-06, "val_loss": 0.035436540842056274, "train_action_mse_error": 4.190505933365785e-06} +{"train_loss": 0.00027208260144107044, "global_step": 63189, "epoch": 531, "lr": 3.2721916588886958e-06} +{"train_loss": 0.0003185550740454346, "global_step": 63190, "epoch": 531, "lr": 3.271403391780681e-06} +{"train_loss": 0.00025982363149523735, "global_step": 63191, "epoch": 531, "lr": 3.270615216419276e-06} +{"train_loss": 0.0002182278549298644, "global_step": 63192, "epoch": 531, "lr": 3.2698271328060304e-06} +{"train_loss": 0.0002942366118077189, "global_step": 63193, "epoch": 531, "lr": 3.269039140942476e-06} +{"train_loss": 0.0002467985323164612, "global_step": 63194, "epoch": 531, "lr": 3.2682512408301836e-06} +{"train_loss": 0.0007094164029695094, "global_step": 63195, "epoch": 531, "lr": 3.267463432470674e-06} +{"train_loss": 0.00044768318184651434, "global_step": 63196, "epoch": 531, "lr": 3.266675715865508e-06} +{"train_loss": 0.00020517705706879497, "global_step": 63197, "epoch": 531, "lr": 3.2658880910162394e-06} +{"train_loss": 0.00015695391630288213, "global_step": 63198, "epoch": 531, "lr": 3.2651005579243998e-06} +{"train_loss": 0.0004980852245353162, "global_step": 63199, "epoch": 531, "lr": 3.264313116591555e-06} +{"train_loss": 0.0004922648658975959, "global_step": 63200, "epoch": 531, "lr": 3.2635257670192265e-06} +{"train_loss": 0.0003171559947077185, "global_step": 63201, "epoch": 531, "lr": 3.262738509208979e-06} +{"train_loss": 0.00018034463573712856, "global_step": 63202, "epoch": 531, "lr": 3.261951343162345e-06} +{"train_loss": 0.0001792469120118767, "global_step": 63203, "epoch": 531, "lr": 3.2611642688808785e-06} +{"train_loss": 0.0005303311627358198, "global_step": 63204, "epoch": 531, "lr": 3.2603772863661284e-06} +{"train_loss": 0.0005017280345782638, "global_step": 63205, "epoch": 531, "lr": 3.259590395619627e-06} +{"train_loss": 0.00021815768559463322, "global_step": 63206, "epoch": 531, "lr": 3.2588035966429344e-06} +{"train_loss": 0.00039952542283572257, "global_step": 63207, "epoch": 531, "lr": 3.258016889437576e-06} +{"train_loss": 0.0003257253556512296, "global_step": 63208, "epoch": 531, "lr": 3.2572302740051185e-06} +{"train_loss": 0.0005477891536429524, "global_step": 63209, "epoch": 531, "lr": 3.2564437503470823e-06} +{"train_loss": 0.000432783825090155, "global_step": 63210, "epoch": 531, "lr": 3.2556573184650384e-06} +{"train_loss": 0.00020744586072396487, "global_step": 63211, "epoch": 531, "lr": 3.254870978360519e-06} +{"train_loss": 0.00021290563745424151, "global_step": 63212, "epoch": 531, "lr": 3.2540847300350563e-06} +{"train_loss": 0.000492407416459173, "global_step": 63213, "epoch": 531, "lr": 3.25329857349021e-06} +{"train_loss": 0.00015532830730080605, "global_step": 63214, "epoch": 531, "lr": 3.252512508727512e-06} +{"train_loss": 0.0005350552964955568, "global_step": 63215, "epoch": 531, "lr": 3.251726535748517e-06} +{"train_loss": 0.00026609186897985637, "global_step": 63216, "epoch": 531, "lr": 3.250940654554757e-06} +{"train_loss": 0.0004274762759450823, "global_step": 63217, "epoch": 531, "lr": 3.2501548651477864e-06} +{"train_loss": 0.0003778116952162236, "global_step": 63218, "epoch": 531, "lr": 3.249369167529148e-06} +{"train_loss": 0.0004947085399180651, "global_step": 63219, "epoch": 531, "lr": 3.2485835617003634e-06} +{"train_loss": 0.0002973681839648634, "global_step": 63220, "epoch": 531, "lr": 3.247798047663003e-06} +{"train_loss": 0.0001915330794872716, "global_step": 63221, "epoch": 531, "lr": 3.2470126254185884e-06} +{"train_loss": 0.00024062246666289866, "global_step": 63222, "epoch": 531, "lr": 3.2462272949686733e-06} +{"train_loss": 0.00029412301955744624, "global_step": 63223, "epoch": 531, "lr": 3.2454420563148015e-06} +{"train_loss": 0.00015191914280876517, "global_step": 63224, "epoch": 531, "lr": 3.244656909458499e-06} +{"train_loss": 0.00030633245478384197, "global_step": 63225, "epoch": 531, "lr": 3.24387185440132e-06} +{"train_loss": 0.00041401234921067953, "global_step": 63226, "epoch": 531, "lr": 3.243086891144803e-06} +{"train_loss": 0.0006636215839534998, "global_step": 63227, "epoch": 531, "lr": 3.2423020196904963e-06} +{"train_loss": 0.0004145696002524346, "global_step": 63228, "epoch": 531, "lr": 3.2415172400399262e-06} +{"train_loss": 0.00026510778116062284, "global_step": 63229, "epoch": 531, "lr": 3.2407325521946474e-06} +{"train_loss": 0.0008201639866456389, "global_step": 63230, "epoch": 531, "lr": 3.239947956156186e-06} +{"train_loss": 0.00018554877897258848, "global_step": 63231, "epoch": 531, "lr": 3.239163451926097e-06} +{"train_loss": 0.0002747096586972475, "global_step": 63232, "epoch": 531, "lr": 3.2383790395059176e-06} +{"train_loss": 0.0004883802030235529, "global_step": 63233, "epoch": 531, "lr": 3.23759471889718e-06} +{"train_loss": 0.00037114645238034427, "global_step": 63234, "epoch": 531, "lr": 3.236810490101433e-06} +{"train_loss": 0.0005253354320302606, "global_step": 63235, "epoch": 531, "lr": 3.2360263531202086e-06} +{"train_loss": 0.0004714074602816254, "global_step": 63236, "epoch": 531, "lr": 3.2352423079550553e-06} +{"train_loss": 0.00037894080742262304, "global_step": 63237, "epoch": 531, "lr": 3.2344583546075115e-06} +{"train_loss": 0.000268648931523785, "global_step": 63238, "epoch": 531, "lr": 3.233674493079103e-06} +{"train_loss": 0.0002650069654919207, "global_step": 63239, "epoch": 531, "lr": 3.23289072337139e-06} +{"train_loss": 0.00019041119958274066, "global_step": 63240, "epoch": 531, "lr": 3.232107045485888e-06} +{"train_loss": 0.00041043743840418756, "global_step": 63241, "epoch": 531, "lr": 3.2313234594241513e-06} +{"train_loss": 0.0003522046026773751, "global_step": 63242, "epoch": 531, "lr": 3.230539965187723e-06} +{"train_loss": 0.00024974497500807047, "global_step": 63243, "epoch": 531, "lr": 3.229756562778119e-06} +{"train_loss": 0.00040653476025909185, "global_step": 63244, "epoch": 531, "lr": 3.2289732521968986e-06} +{"train_loss": 0.00015864633314777166, "global_step": 63245, "epoch": 531, "lr": 3.2281900334455885e-06} +{"train_loss": 0.0003092226688750088, "global_step": 63246, "epoch": 531, "lr": 3.2274069065257373e-06} +{"train_loss": 0.0002577183477114886, "global_step": 63247, "epoch": 531, "lr": 3.2266238714388664e-06} +{"train_loss": 0.00035038363421335816, "global_step": 63248, "epoch": 531, "lr": 3.2258409281865297e-06} +{"train_loss": 0.0003408921475056559, "global_step": 63249, "epoch": 531, "lr": 3.22505807677026e-06} +{"train_loss": 0.000263658759649843, "global_step": 63250, "epoch": 531, "lr": 3.224275317191583e-06} +{"train_loss": 0.0005305691156536341, "global_step": 63251, "epoch": 531, "lr": 3.2234926494520535e-06} +{"train_loss": 0.0002811321464832872, "global_step": 63252, "epoch": 531, "lr": 3.2227100735531867e-06} +{"train_loss": 0.00018897322297561914, "global_step": 63253, "epoch": 531, "lr": 3.221927589496543e-06} +{"train_loss": 0.00034691428299993277, "global_step": 63254, "epoch": 531, "lr": 3.2211451972836424e-06} +{"train_loss": 0.00046667689457535744, "global_step": 63255, "epoch": 531, "lr": 3.220362896916024e-06} +{"train_loss": 0.00026278369477950037, "global_step": 63256, "epoch": 531, "lr": 3.2195806883952297e-06} +{"train_loss": 0.0003394833183847368, "global_step": 63257, "epoch": 531, "lr": 3.218798571722781e-06} +{"train_loss": 0.00022986228577792645, "global_step": 63258, "epoch": 531, "lr": 3.2180165469002377e-06} +{"train_loss": 0.00023482329561375082, "global_step": 63259, "epoch": 531, "lr": 3.21723461392911e-06} +{"train_loss": 0.00014058341912459582, "global_step": 63260, "epoch": 531, "lr": 3.216452772810946e-06} +{"train_loss": 0.00022941056522540748, "global_step": 63261, "epoch": 531, "lr": 3.2156710235472786e-06} +{"train_loss": 0.0002505739394109696, "global_step": 63262, "epoch": 531, "lr": 3.214889366139651e-06} +{"train_loss": 0.0002352589217480272, "global_step": 63263, "epoch": 531, "lr": 3.2141078005895775e-06} +{"train_loss": 0.00045021134428679943, "global_step": 63264, "epoch": 531, "lr": 3.2133263268986137e-06} +{"train_loss": 0.0003595707530621439, "global_step": 63265, "epoch": 531, "lr": 3.2125449450682798e-06} +{"train_loss": 0.00014558502880390733, "global_step": 63266, "epoch": 531, "lr": 3.211763655100114e-06} +{"train_loss": 0.0004172641201876104, "global_step": 63267, "epoch": 531, "lr": 3.2109824569956594e-06} +{"train_loss": 0.0002179656585212797, "global_step": 63268, "epoch": 531, "lr": 3.210201350756442e-06} +{"train_loss": 0.0003020290459971875, "global_step": 63269, "epoch": 531, "lr": 3.209420336383989e-06} +{"train_loss": 0.00018718655337579548, "global_step": 63270, "epoch": 531, "lr": 3.208639413879844e-06} +{"train_loss": 0.00014564958109986037, "global_step": 63271, "epoch": 531, "lr": 3.207858583245532e-06} +{"train_loss": 0.0002701298799365759, "global_step": 63272, "epoch": 531, "lr": 3.2070778444826032e-06} +{"train_loss": 0.0003055215929634869, "global_step": 63273, "epoch": 531, "lr": 3.206297197592573e-06} +{"train_loss": 0.0002726847887970507, "global_step": 63274, "epoch": 531, "lr": 3.2055166425769667e-06} +{"train_loss": 0.00018898410780820996, "global_step": 63275, "epoch": 531, "lr": 3.204736179437345e-06} +{"train_loss": 0.00034912966657429934, "global_step": 63276, "epoch": 531, "lr": 3.203955808175213e-06} +{"train_loss": 0.00023678150319028646, "global_step": 63277, "epoch": 531, "lr": 3.203175528792124e-06} +{"train_loss": 0.00013595027849078178, "global_step": 63278, "epoch": 531, "lr": 3.202395341289588e-06} +{"train_loss": 0.00021033408120274544, "global_step": 63279, "epoch": 531, "lr": 3.2016152456691595e-06} +{"train_loss": 0.00020908591977786273, "global_step": 63280, "epoch": 531, "lr": 3.200835241932365e-06} +{"train_loss": 0.0003324643475934863, "global_step": 63281, "epoch": 531, "lr": 3.2000553300807146e-06} +{"train_loss": 0.00019845842325594276, "global_step": 63282, "epoch": 531, "lr": 3.1992755101157677e-06} +{"train_loss": 0.0001829816319514066, "global_step": 63283, "epoch": 531, "lr": 3.1984957820390348e-06} +{"train_loss": 0.00031393254175782204, "global_step": 63284, "epoch": 531, "lr": 3.1977161458520642e-06} +{"train_loss": 0.0003259192162659019, "global_step": 63285, "epoch": 531, "lr": 3.196936601556372e-06} +{"train_loss": 0.00019485857046674937, "global_step": 63286, "epoch": 531, "lr": 3.1961571491535005e-06} +{"train_loss": 0.00020941394905094057, "global_step": 63287, "epoch": 531, "lr": 3.195377788644971e-06} +{"train_loss": 0.00022183448891155422, "global_step": 63288, "epoch": 531, "lr": 3.1945985200323105e-06} +{"train_loss": 0.000281621643807739, "global_step": 63289, "epoch": 531, "lr": 3.193819343317067e-06} +{"train_loss": 0.00018578725575935096, "global_step": 63290, "epoch": 531, "lr": 3.193040258500746e-06} +{"train_loss": 0.00022966678079683334, "global_step": 63291, "epoch": 531, "lr": 3.1922612655849003e-06} +{"train_loss": 0.00014821012155152857, "global_step": 63292, "epoch": 531, "lr": 3.1914823645710466e-06} +{"train_loss": 0.0005360161303542554, "global_step": 63293, "epoch": 531, "lr": 3.190703555460711e-06} +{"train_loss": 0.00041472347220405936, "global_step": 63294, "epoch": 531, "lr": 3.1899248382554315e-06} +{"train_loss": 0.0001709676143946126, "global_step": 63295, "epoch": 531, "lr": 3.189146212956734e-06} +{"train_loss": 0.0001822977210395038, "global_step": 63296, "epoch": 531, "lr": 3.1883676795661454e-06} +{"train_loss": 0.0002909268660005182, "global_step": 63297, "epoch": 531, "lr": 3.187589238085198e-06} +{"train_loss": 0.0008149421191774309, "global_step": 63298, "epoch": 531, "lr": 3.186810888515418e-06} +{"train_loss": 0.00038609153125435114, "global_step": 63299, "epoch": 531, "lr": 3.186032630858332e-06} +{"train_loss": 0.0004790054226759821, "global_step": 63300, "epoch": 531, "lr": 3.185254465115467e-06} +{"train_loss": 0.0003741910040844232, "global_step": 63301, "epoch": 531, "lr": 3.1844763912883603e-06} +{"train_loss": 0.0004442275094334036, "global_step": 63302, "epoch": 531, "lr": 3.1836984093785273e-06} +{"train_loss": 0.00021032222139183432, "global_step": 63303, "epoch": 531, "lr": 3.1829205193875058e-06} +{"train_loss": 0.000634192896541208, "global_step": 63304, "epoch": 531, "lr": 3.182142721316811e-06} +{"train_loss": 0.00014778813056182116, "global_step": 63305, "epoch": 531, "lr": 3.1813650151679865e-06} +{"train_loss": 0.00027629159740172327, "global_step": 63306, "epoch": 531, "lr": 3.1805874009425475e-06} +{"train_loss": 0.000321038653452865, "global_step": 63307, "epoch": 531, "lr": 3.179809878642015e-06, "val_loss": 0.012427584268152714} +{"train_loss": 0.0007744634058326483, "global_step": 63308, "epoch": 532, "lr": 3.179032448267938e-06} +{"train_loss": 0.0002170986554119736, "global_step": 63309, "epoch": 532, "lr": 3.178255109821815e-06} +{"train_loss": 0.0003890210937242955, "global_step": 63310, "epoch": 532, "lr": 3.1774778633051948e-06} +{"train_loss": 0.00017820126959122717, "global_step": 63311, "epoch": 532, "lr": 3.176700708719593e-06} +{"train_loss": 0.00025546213146299124, "global_step": 63312, "epoch": 532, "lr": 3.175923646066531e-06} +{"train_loss": 0.0002011303004110232, "global_step": 63313, "epoch": 532, "lr": 3.1751466753475456e-06} +{"train_loss": 0.00027128751389682293, "global_step": 63314, "epoch": 532, "lr": 3.174369796564153e-06} +{"train_loss": 0.0004962502280250192, "global_step": 63315, "epoch": 532, "lr": 3.17359300971789e-06} +{"train_loss": 0.00015433429507538676, "global_step": 63316, "epoch": 532, "lr": 3.1728163148102675e-06} +{"train_loss": 0.0003699469962157309, "global_step": 63317, "epoch": 532, "lr": 3.1720397118428224e-06} +{"train_loss": 0.0001656011154409498, "global_step": 63318, "epoch": 532, "lr": 3.1712632008170763e-06} +{"train_loss": 0.0002670828253030777, "global_step": 63319, "epoch": 532, "lr": 3.170486781734544e-06} +{"train_loss": 0.00034076449810527265, "global_step": 63320, "epoch": 532, "lr": 3.169710454596764e-06} +{"train_loss": 0.00032128611928783357, "global_step": 63321, "epoch": 532, "lr": 3.1689342194052506e-06} +{"train_loss": 0.0003703230177052319, "global_step": 63322, "epoch": 532, "lr": 3.168158076161537e-06} +{"train_loss": 0.0001614395878277719, "global_step": 63323, "epoch": 532, "lr": 3.1673820248671436e-06} +{"train_loss": 0.0001334396074526012, "global_step": 63324, "epoch": 532, "lr": 3.166606065523581e-06} +{"train_loss": 0.0002771841536741704, "global_step": 63325, "epoch": 532, "lr": 3.165830198132391e-06} +{"train_loss": 0.00028876704163849354, "global_step": 63326, "epoch": 532, "lr": 3.165054422695085e-06} +{"train_loss": 0.0003731267643161118, "global_step": 63327, "epoch": 532, "lr": 3.1642787392132e-06} +{"train_loss": 0.0005422563408501446, "global_step": 63328, "epoch": 532, "lr": 3.1635031476882405e-06} +{"train_loss": 0.0003230397996958345, "global_step": 63329, "epoch": 532, "lr": 3.1627276481217383e-06} +{"train_loss": 0.00022428776719607413, "global_step": 63330, "epoch": 532, "lr": 3.161952240515226e-06} +{"train_loss": 0.00024123789626173675, "global_step": 63331, "epoch": 532, "lr": 3.1611769248702074e-06} +{"train_loss": 0.00029064726550132036, "global_step": 63332, "epoch": 532, "lr": 3.1604017011882204e-06} +{"train_loss": 0.0003458805149421096, "global_step": 63333, "epoch": 532, "lr": 3.159626569470775e-06} +{"train_loss": 0.00029255275148898363, "global_step": 63334, "epoch": 532, "lr": 3.158851529719409e-06} +{"train_loss": 0.0006433942471630871, "global_step": 63335, "epoch": 532, "lr": 3.1580765819356207e-06} +{"train_loss": 0.00013271298666950315, "global_step": 63336, "epoch": 532, "lr": 3.1573017261209537e-06} +{"train_loss": 0.00032189107150770724, "global_step": 63337, "epoch": 532, "lr": 3.1565269622769234e-06} +{"train_loss": 0.00017746543744578958, "global_step": 63338, "epoch": 532, "lr": 3.1557522904050396e-06} +{"train_loss": 0.00043843433377332985, "global_step": 63339, "epoch": 532, "lr": 3.1549777105068346e-06} +{"train_loss": 0.0002151947992388159, "global_step": 63340, "epoch": 532, "lr": 3.1542032225838237e-06} +{"train_loss": 0.000385826948331669, "global_step": 63341, "epoch": 532, "lr": 3.1534288266375387e-06} +{"train_loss": 0.0002960547572001815, "global_step": 63342, "epoch": 532, "lr": 3.152654522669485e-06} +{"train_loss": 0.00022523372899740934, "global_step": 63343, "epoch": 532, "lr": 3.151880310681188e-06} +{"train_loss": 0.00035908978316001594, "global_step": 63344, "epoch": 532, "lr": 3.1511061906741747e-06} +{"train_loss": 0.00021719071082770824, "global_step": 63345, "epoch": 532, "lr": 3.1503321626499493e-06} +{"train_loss": 0.0002819487708620727, "global_step": 63346, "epoch": 532, "lr": 3.14955822661005e-06} +{"train_loss": 0.0001989280863199383, "global_step": 63347, "epoch": 532, "lr": 3.1487843825559803e-06} +{"train_loss": 0.00019115918257739395, "global_step": 63348, "epoch": 532, "lr": 3.1480106304892733e-06} +{"train_loss": 0.0001794218405848369, "global_step": 63349, "epoch": 532, "lr": 3.147236970411449e-06} +{"train_loss": 0.0004062499210704118, "global_step": 63350, "epoch": 532, "lr": 3.146463402324007e-06} +{"train_loss": 0.0012014498934149742, "global_step": 63351, "epoch": 532, "lr": 3.1456899262284845e-06} +{"train_loss": 0.0002600050938781351, "global_step": 63352, "epoch": 532, "lr": 3.144916542126386e-06} +{"train_loss": 0.00032528315205127, "global_step": 63353, "epoch": 532, "lr": 3.1441432500192493e-06} +{"train_loss": 0.00019588139548432082, "global_step": 63354, "epoch": 532, "lr": 3.1433700499085728e-06} +{"train_loss": 0.00017429680156055838, "global_step": 63355, "epoch": 532, "lr": 3.142596941795889e-06} +{"train_loss": 0.00046124530490487814, "global_step": 63356, "epoch": 532, "lr": 3.1418239256827132e-06} +{"train_loss": 0.0002938415855169296, "global_step": 63357, "epoch": 532, "lr": 3.14105100157055e-06} +{"train_loss": 0.0002641841128934175, "global_step": 63358, "epoch": 532, "lr": 3.1402781694609364e-06} +{"train_loss": 0.00020952496561221778, "global_step": 63359, "epoch": 532, "lr": 3.1395054293553717e-06} +{"train_loss": 0.0012703934917226434, "global_step": 63360, "epoch": 532, "lr": 3.138732781255388e-06} +{"train_loss": 0.00023844932729844004, "global_step": 63361, "epoch": 532, "lr": 3.137960225162495e-06} +{"train_loss": 0.00021329091396182775, "global_step": 63362, "epoch": 532, "lr": 3.1371877610782084e-06} +{"train_loss": 0.00023402899387292564, "global_step": 63363, "epoch": 532, "lr": 3.1364153890040492e-06} +{"train_loss": 0.00043963795178569853, "global_step": 63364, "epoch": 532, "lr": 3.1356431089415273e-06} +{"train_loss": 0.0002528813201934099, "global_step": 63365, "epoch": 532, "lr": 3.134870920892169e-06} +{"train_loss": 0.0003461874439381063, "global_step": 63366, "epoch": 532, "lr": 3.1340988248574787e-06} +{"train_loss": 0.00016391022654715925, "global_step": 63367, "epoch": 532, "lr": 3.1333268208389887e-06} +{"train_loss": 0.0004871714045293629, "global_step": 63368, "epoch": 532, "lr": 3.1325549088381978e-06} +{"train_loss": 0.000425929029006511, "global_step": 63369, "epoch": 532, "lr": 3.1317830888566267e-06} +{"train_loss": 0.0005439221276901662, "global_step": 63370, "epoch": 532, "lr": 3.131011360895797e-06} +{"train_loss": 0.0004658173129428178, "global_step": 63371, "epoch": 532, "lr": 3.1302397249572122e-06} +{"train_loss": 0.0003545036306604743, "global_step": 63372, "epoch": 532, "lr": 3.1294681810424054e-06} +{"train_loss": 0.0003471540112514049, "global_step": 63373, "epoch": 532, "lr": 3.1286967291528802e-06} +{"train_loss": 0.0004665384767577052, "global_step": 63374, "epoch": 532, "lr": 3.127925369290141e-06} +{"train_loss": 0.00039941060822457075, "global_step": 63375, "epoch": 532, "lr": 3.1271541014557204e-06} +{"train_loss": 0.00032299599843099713, "global_step": 63376, "epoch": 532, "lr": 3.126382925651117e-06} +{"train_loss": 0.00040293767233379185, "global_step": 63377, "epoch": 532, "lr": 3.1256118418778622e-06} +{"train_loss": 0.00021967917564325035, "global_step": 63378, "epoch": 532, "lr": 3.1248408501374505e-06} +{"train_loss": 0.00017489344463683665, "global_step": 63379, "epoch": 532, "lr": 3.1240699504314188e-06} +{"train_loss": 0.0003513165866024792, "global_step": 63380, "epoch": 532, "lr": 3.1232991427612657e-06} +{"train_loss": 0.0008038777741603553, "global_step": 63381, "epoch": 532, "lr": 3.1225284271284962e-06} +{"train_loss": 0.00024817799567244947, "global_step": 63382, "epoch": 532, "lr": 3.121757803534642e-06} +{"train_loss": 0.00024787563597783446, "global_step": 63383, "epoch": 532, "lr": 3.1209872719812016e-06} +{"train_loss": 0.0004631956689991057, "global_step": 63384, "epoch": 532, "lr": 3.1202168324697025e-06} +{"train_loss": 0.00013638313976116478, "global_step": 63385, "epoch": 532, "lr": 3.1194464850016425e-06} +{"train_loss": 0.0001626268494874239, "global_step": 63386, "epoch": 532, "lr": 3.118676229578549e-06} +{"train_loss": 0.0008411958697251976, "global_step": 63387, "epoch": 532, "lr": 3.1179060662019255e-06} +{"train_loss": 0.00024191170814447105, "global_step": 63388, "epoch": 532, "lr": 3.117135994873277e-06} +{"train_loss": 0.0003556292213033885, "global_step": 63389, "epoch": 532, "lr": 3.11636601559413e-06} +{"train_loss": 0.00016644489369355142, "global_step": 63390, "epoch": 532, "lr": 3.115596128365983e-06} +{"train_loss": 0.00041704802424646914, "global_step": 63391, "epoch": 532, "lr": 3.1148263331903625e-06} +{"train_loss": 0.0003228148852940649, "global_step": 63392, "epoch": 532, "lr": 3.1140566300687625e-06} +{"train_loss": 0.00028227141592651606, "global_step": 63393, "epoch": 532, "lr": 3.1132870190027087e-06} +{"train_loss": 0.0003516020951792598, "global_step": 63394, "epoch": 532, "lr": 3.1125174999937e-06} +{"train_loss": 0.0002535358944442123, "global_step": 63395, "epoch": 532, "lr": 3.1117480730432635e-06} +{"train_loss": 0.0004387276712805033, "global_step": 63396, "epoch": 532, "lr": 3.110978738152892e-06} +{"train_loss": 0.000367092143278569, "global_step": 63397, "epoch": 532, "lr": 3.110209495324112e-06} +{"train_loss": 0.000262536748778075, "global_step": 63398, "epoch": 532, "lr": 3.109440344558423e-06} +{"train_loss": 0.0002700054319575429, "global_step": 63399, "epoch": 532, "lr": 3.1086712858573395e-06} +{"train_loss": 0.0003255483170505613, "global_step": 63400, "epoch": 532, "lr": 3.1079023192223664e-06} +{"train_loss": 0.000843841175083071, "global_step": 63401, "epoch": 532, "lr": 3.107133444655025e-06} +{"train_loss": 0.000245536066358909, "global_step": 63402, "epoch": 532, "lr": 3.1063646621568078e-06} +{"train_loss": 0.00031947006937116385, "global_step": 63403, "epoch": 532, "lr": 3.1055959717292414e-06} +{"train_loss": 0.0003070938400924206, "global_step": 63404, "epoch": 532, "lr": 3.1048273733738198e-06} +{"train_loss": 0.0002624901244416833, "global_step": 63405, "epoch": 532, "lr": 3.104058867092069e-06} +{"train_loss": 0.0005617084680125117, "global_step": 63406, "epoch": 532, "lr": 3.103290452885488e-06} +{"train_loss": 0.00020206140470691025, "global_step": 63407, "epoch": 532, "lr": 3.1025221307555754e-06} +{"train_loss": 0.00032830433337949216, "global_step": 63408, "epoch": 532, "lr": 3.1017539007038574e-06} +{"train_loss": 0.000430007727118209, "global_step": 63409, "epoch": 532, "lr": 3.1009857627318338e-06} +{"train_loss": 0.0005243723280727863, "global_step": 63410, "epoch": 532, "lr": 3.1002177168410197e-06} +{"train_loss": 0.000229284429224208, "global_step": 63411, "epoch": 532, "lr": 3.0994497630329133e-06} +{"train_loss": 0.0004510934231802821, "global_step": 63412, "epoch": 532, "lr": 3.098681901309025e-06} +{"train_loss": 0.0002538556873332709, "global_step": 63413, "epoch": 532, "lr": 3.0979141316708706e-06} +{"train_loss": 0.0005491594201885164, "global_step": 63414, "epoch": 532, "lr": 3.097146454119937e-06} +{"train_loss": 0.0002517544198781252, "global_step": 63415, "epoch": 532, "lr": 3.0963788686577623e-06} +{"train_loss": 0.0007234985241666436, "global_step": 63416, "epoch": 532, "lr": 3.0956113752858227e-06} +{"train_loss": 0.00021919122082181275, "global_step": 63417, "epoch": 532, "lr": 3.094843974005651e-06} +{"train_loss": 0.00019025981600861996, "global_step": 63418, "epoch": 532, "lr": 3.09407666481874e-06} +{"train_loss": 0.00040654881740920246, "global_step": 63419, "epoch": 532, "lr": 3.093309447726589e-06} +{"train_loss": 0.00018335301137994975, "global_step": 63420, "epoch": 532, "lr": 3.092542322730724e-06} +{"train_loss": 0.0002999157295562327, "global_step": 63421, "epoch": 532, "lr": 3.0917752898326324e-06} +{"train_loss": 0.000552212237380445, "global_step": 63422, "epoch": 532, "lr": 3.091008349033836e-06} +{"train_loss": 0.0002602233143988997, "global_step": 63423, "epoch": 532, "lr": 3.090241500335822e-06} +{"train_loss": 0.0003547605883795768, "global_step": 63424, "epoch": 532, "lr": 3.0894747437401228e-06} +{"train_loss": 0.00021240887872409075, "global_step": 63425, "epoch": 532, "lr": 3.0887080792482204e-06} +{"train_loss": 0.00034295757970784424, "global_step": 63426, "epoch": 532, "lr": 3.0879415068616245e-06, "val_loss": 0.02246401645243168} +{"train_loss": 0.00022575868933927268, "global_step": 63427, "epoch": 533, "lr": 3.0871750265818457e-06} +{"train_loss": 0.0003965083451475948, "global_step": 63428, "epoch": 533, "lr": 3.086408638410393e-06} +{"train_loss": 0.00023405866522807628, "global_step": 63429, "epoch": 533, "lr": 3.0856423423487546e-06} +{"train_loss": 0.00038372669951058924, "global_step": 63430, "epoch": 533, "lr": 3.0848761383984514e-06} +{"train_loss": 0.0002867731964215636, "global_step": 63431, "epoch": 533, "lr": 3.0841100265609768e-06} +{"train_loss": 0.0002981268335133791, "global_step": 63432, "epoch": 533, "lr": 3.0833440068378515e-06} +{"train_loss": 0.0008072786731645465, "global_step": 63433, "epoch": 533, "lr": 3.0825780792305583e-06} +{"train_loss": 0.00034243782283738256, "global_step": 63434, "epoch": 533, "lr": 3.081812243740617e-06} +{"train_loss": 0.00037544494261965156, "global_step": 63435, "epoch": 533, "lr": 3.0810465003695168e-06} +{"train_loss": 0.0004028373514302075, "global_step": 63436, "epoch": 533, "lr": 3.080280849118777e-06} +{"train_loss": 0.0002369541471125558, "global_step": 63437, "epoch": 533, "lr": 3.079515289989893e-06} +{"train_loss": 0.00026696029817685485, "global_step": 63438, "epoch": 533, "lr": 3.0787498229843615e-06} +{"train_loss": 0.0002671356778591871, "global_step": 63439, "epoch": 533, "lr": 3.077984448103699e-06} +{"train_loss": 0.0003167225222568959, "global_step": 63440, "epoch": 533, "lr": 3.077219165349393e-06} +{"train_loss": 0.00026778699248097837, "global_step": 63441, "epoch": 533, "lr": 3.0764539747229594e-06} +{"train_loss": 0.0002946861204691231, "global_step": 63442, "epoch": 533, "lr": 3.075688876225896e-06} +{"train_loss": 0.0003227703273296356, "global_step": 63443, "epoch": 533, "lr": 3.0749238698597025e-06} +{"train_loss": 0.00027412071358412504, "global_step": 63444, "epoch": 533, "lr": 3.0741589556258832e-06} +{"train_loss": 0.0004944831016473472, "global_step": 63445, "epoch": 533, "lr": 3.0733941335259366e-06} +{"train_loss": 0.00020048867736477405, "global_step": 63446, "epoch": 533, "lr": 3.072629403561378e-06} +{"train_loss": 0.00022326858015730977, "global_step": 63447, "epoch": 533, "lr": 3.071864765733684e-06} +{"train_loss": 0.00017330906121060252, "global_step": 63448, "epoch": 533, "lr": 3.0711002200443816e-06} +{"train_loss": 0.00023058704391587526, "global_step": 63449, "epoch": 533, "lr": 3.070335766494958e-06} +{"train_loss": 0.0005356361507438123, "global_step": 63450, "epoch": 533, "lr": 3.0695714050869074e-06} +{"train_loss": 0.0003107003285549581, "global_step": 63451, "epoch": 533, "lr": 3.0688071358217498e-06} +{"train_loss": 0.00024970248341560364, "global_step": 63452, "epoch": 533, "lr": 3.0680429587009675e-06} +{"train_loss": 0.0002658779267221689, "global_step": 63453, "epoch": 533, "lr": 3.067278873726076e-06} +{"train_loss": 0.00019441301992628723, "global_step": 63454, "epoch": 533, "lr": 3.066514880898558e-06} +{"train_loss": 0.00018356897635385394, "global_step": 63455, "epoch": 533, "lr": 3.0657509802199393e-06} +{"train_loss": 0.0005519697442650795, "global_step": 63456, "epoch": 533, "lr": 3.064987171691697e-06} +{"train_loss": 0.00030637855525128543, "global_step": 63457, "epoch": 533, "lr": 3.064223455315335e-06} +{"train_loss": 0.00019858585437759757, "global_step": 63458, "epoch": 533, "lr": 3.063459831092358e-06} +{"train_loss": 0.00016404416237492114, "global_step": 63459, "epoch": 533, "lr": 3.062696299024259e-06} +{"train_loss": 0.00019938050536438823, "global_step": 63460, "epoch": 533, "lr": 3.061932859112554e-06} +{"train_loss": 0.00041443409281782806, "global_step": 63461, "epoch": 533, "lr": 3.0611695113587134e-06} +{"train_loss": 0.00023439254437107593, "global_step": 63462, "epoch": 533, "lr": 3.060406255764253e-06} +{"train_loss": 0.00028728676261380315, "global_step": 63463, "epoch": 533, "lr": 3.059643092330683e-06} +{"train_loss": 0.00031293212668970227, "global_step": 63464, "epoch": 533, "lr": 3.0588800210594794e-06} +{"train_loss": 0.00029501403332687914, "global_step": 63465, "epoch": 533, "lr": 3.0581170419521577e-06} +{"train_loss": 0.00026842611259780824, "global_step": 63466, "epoch": 533, "lr": 3.057354155010195e-06} +{"train_loss": 0.0003739497915375978, "global_step": 63467, "epoch": 533, "lr": 3.056591360235117e-06} +{"train_loss": 0.00021653712610714138, "global_step": 63468, "epoch": 533, "lr": 3.055828657628401e-06} +{"train_loss": 0.0003659857320599258, "global_step": 63469, "epoch": 533, "lr": 3.055066047191546e-06} +{"train_loss": 0.0004498372145462781, "global_step": 63470, "epoch": 533, "lr": 3.0543035289260613e-06} +{"train_loss": 0.0005388407735154033, "global_step": 63471, "epoch": 533, "lr": 3.0535411028334295e-06} +{"train_loss": 0.0002595872210804373, "global_step": 63472, "epoch": 533, "lr": 3.05277876891516e-06} +{"train_loss": 0.00017507877782918513, "global_step": 63473, "epoch": 533, "lr": 3.052016527172735e-06} +{"train_loss": 0.0002815825864672661, "global_step": 63474, "epoch": 533, "lr": 3.0512543776076707e-06} +{"train_loss": 0.00022735593665856868, "global_step": 63475, "epoch": 533, "lr": 3.0504923202214487e-06} +{"train_loss": 0.00021588560775853693, "global_step": 63476, "epoch": 533, "lr": 3.0497303550155675e-06} +{"train_loss": 0.00022008686210028827, "global_step": 63477, "epoch": 533, "lr": 3.0489684819915265e-06} +{"train_loss": 0.00024681357899680734, "global_step": 63478, "epoch": 533, "lr": 3.048206701150813e-06} +{"train_loss": 0.0003067132201977074, "global_step": 63479, "epoch": 533, "lr": 3.0474450124949426e-06} +{"train_loss": 0.0003667855344247073, "global_step": 63480, "epoch": 533, "lr": 3.046683416025392e-06} +{"train_loss": 0.0003393813385628164, "global_step": 63481, "epoch": 533, "lr": 3.04592191174366e-06} +{"train_loss": 0.0004188369493931532, "global_step": 63482, "epoch": 533, "lr": 3.045160499651245e-06} +{"train_loss": 0.00039952920633368194, "global_step": 63483, "epoch": 533, "lr": 3.0443991797496353e-06} +{"train_loss": 0.00017646461492404342, "global_step": 63484, "epoch": 533, "lr": 3.0436379520403404e-06} +{"train_loss": 0.0003010001964867115, "global_step": 63485, "epoch": 533, "lr": 3.0428768165248422e-06} +{"train_loss": 0.00033700827043503523, "global_step": 63486, "epoch": 533, "lr": 3.04211577320464e-06} +{"train_loss": 0.0001971303572645411, "global_step": 63487, "epoch": 533, "lr": 3.0413548220812326e-06} +{"train_loss": 0.000326188892358914, "global_step": 63488, "epoch": 533, "lr": 3.0405939631560963e-06} +{"train_loss": 0.00044116334174759686, "global_step": 63489, "epoch": 533, "lr": 3.0398331964307415e-06} +{"train_loss": 0.0002827608841471374, "global_step": 63490, "epoch": 533, "lr": 3.039072521906655e-06} +{"train_loss": 0.0003724182315636426, "global_step": 63491, "epoch": 533, "lr": 3.0383119395853366e-06} +{"train_loss": 0.00038732271059416234, "global_step": 63492, "epoch": 533, "lr": 3.037551449468273e-06} +{"train_loss": 0.00029425337561406195, "global_step": 63493, "epoch": 533, "lr": 3.036791051556964e-06} +{"train_loss": 0.00030835127108730376, "global_step": 63494, "epoch": 533, "lr": 3.0360307458528913e-06} +{"train_loss": 0.00022268007160164416, "global_step": 63495, "epoch": 533, "lr": 3.0352705323575646e-06} +{"train_loss": 0.0002508146862965077, "global_step": 63496, "epoch": 533, "lr": 3.0345104110724553e-06} +{"train_loss": 0.0001827957312343642, "global_step": 63497, "epoch": 533, "lr": 3.0337503819990677e-06} +{"train_loss": 0.00020865927217528224, "global_step": 63498, "epoch": 533, "lr": 3.0329904451389058e-06} +{"train_loss": 0.00024304648104589432, "global_step": 63499, "epoch": 533, "lr": 3.0322306004934462e-06} +{"train_loss": 0.0003164942318107933, "global_step": 63500, "epoch": 533, "lr": 3.0314708480641774e-06} +{"train_loss": 0.00014303372881840914, "global_step": 63501, "epoch": 533, "lr": 3.0307111878526027e-06} +{"train_loss": 0.0005054858047515154, "global_step": 63502, "epoch": 533, "lr": 3.0299516198602053e-06} +{"train_loss": 0.00028274834039621055, "global_step": 63503, "epoch": 533, "lr": 3.0291921440884828e-06} +{"train_loss": 0.00028620933881029487, "global_step": 63504, "epoch": 533, "lr": 3.0284327605389183e-06} +{"train_loss": 0.0003688128781504929, "global_step": 63505, "epoch": 533, "lr": 3.027673469213016e-06} +{"train_loss": 0.0001475625904276967, "global_step": 63506, "epoch": 533, "lr": 3.0269142701122578e-06} +{"train_loss": 0.00033810330205596983, "global_step": 63507, "epoch": 533, "lr": 3.026155163238126e-06} +{"train_loss": 0.0003444723261054605, "global_step": 63508, "epoch": 533, "lr": 3.02539614859213e-06} +{"train_loss": 0.00029881694354116917, "global_step": 63509, "epoch": 533, "lr": 3.0246372261757415e-06} +{"train_loss": 0.0002327763504581526, "global_step": 63510, "epoch": 533, "lr": 3.0238783959904704e-06} +{"train_loss": 0.00037005526246502995, "global_step": 63511, "epoch": 533, "lr": 3.0231196580377873e-06} +{"train_loss": 0.00026520155370235443, "global_step": 63512, "epoch": 533, "lr": 3.0223610123191913e-06} +{"train_loss": 0.0003572214627638459, "global_step": 63513, "epoch": 533, "lr": 3.0216024588361704e-06} +{"train_loss": 0.000340268830768764, "global_step": 63514, "epoch": 533, "lr": 3.0208439975902115e-06} +{"train_loss": 0.0003358476096764207, "global_step": 63515, "epoch": 533, "lr": 3.0200856285828138e-06} +{"train_loss": 0.0001924401003634557, "global_step": 63516, "epoch": 533, "lr": 3.0193273518154486e-06} +{"train_loss": 0.00031694918288849294, "global_step": 63517, "epoch": 533, "lr": 3.0185691672896254e-06} +{"train_loss": 0.00020245180348865688, "global_step": 63518, "epoch": 533, "lr": 3.0178110750068213e-06} +{"train_loss": 0.00027464012964628637, "global_step": 63519, "epoch": 533, "lr": 3.017053074968518e-06} +{"train_loss": 0.0001765060587786138, "global_step": 63520, "epoch": 533, "lr": 3.0162951671762195e-06} +{"train_loss": 0.0002533268416300416, "global_step": 63521, "epoch": 533, "lr": 3.015537351631403e-06} +{"train_loss": 0.0003386808675713837, "global_step": 63522, "epoch": 533, "lr": 3.0147796283355624e-06} +{"train_loss": 0.000498700188472867, "global_step": 63523, "epoch": 533, "lr": 3.014021997290173e-06} +{"train_loss": 0.0003828149929177016, "global_step": 63524, "epoch": 533, "lr": 3.0132644584967396e-06} +{"train_loss": 0.00023222449817694724, "global_step": 63525, "epoch": 533, "lr": 3.012507011956739e-06} +{"train_loss": 0.0006895101978443563, "global_step": 63526, "epoch": 533, "lr": 3.011749657671664e-06} +{"train_loss": 0.0003302825498394668, "global_step": 63527, "epoch": 533, "lr": 3.010992395642992e-06} +{"train_loss": 0.0003895111149176955, "global_step": 63528, "epoch": 533, "lr": 3.010235225872221e-06} +{"train_loss": 0.0002461944241076708, "global_step": 63529, "epoch": 533, "lr": 3.0094781483608336e-06} +{"train_loss": 0.00026994390645995736, "global_step": 63530, "epoch": 533, "lr": 3.0087211631103175e-06} +{"train_loss": 0.0004351281386334449, "global_step": 63531, "epoch": 533, "lr": 3.007964270122149e-06} +{"train_loss": 0.00019801215967163444, "global_step": 63532, "epoch": 533, "lr": 3.0072074693978324e-06} +{"train_loss": 0.00025415487471036613, "global_step": 63533, "epoch": 533, "lr": 3.0064507609388336e-06} +{"train_loss": 0.0003675175248645246, "global_step": 63534, "epoch": 533, "lr": 3.005694144746657e-06} +{"train_loss": 0.00032678418210707605, "global_step": 63535, "epoch": 533, "lr": 3.004937620822773e-06} +{"train_loss": 0.0001756916899466887, "global_step": 63536, "epoch": 533, "lr": 3.0041811891686754e-06} +{"train_loss": 0.00031055277213454247, "global_step": 63537, "epoch": 533, "lr": 3.003424849785852e-06} +{"train_loss": 0.00035113489138893783, "global_step": 63538, "epoch": 533, "lr": 3.002668602675779e-06} +{"train_loss": 0.00016738817794248462, "global_step": 63539, "epoch": 533, "lr": 3.001912447839944e-06} +{"train_loss": 0.00019463086209725589, "global_step": 63540, "epoch": 533, "lr": 3.00115638527983e-06} +{"train_loss": 0.00046351554919965565, "global_step": 63541, "epoch": 533, "lr": 3.0004004149969346e-06} +{"train_loss": 0.00020580536511261016, "global_step": 63542, "epoch": 533, "lr": 2.9996445369927186e-06} +{"train_loss": 0.0004270477802492678, "global_step": 63543, "epoch": 533, "lr": 2.9988887512686913e-06} +{"train_loss": 0.00033545171027071774, "global_step": 63544, "epoch": 533, "lr": 2.9981330578263244e-06} +{"train_loss": 0.0003066595960232359, "global_step": 63545, "epoch": 533, "lr": 2.997377456667094e-06, "val_loss": 0.020044784992933273} +{"train_loss": 0.00034698101808317006, "global_step": 63546, "epoch": 534, "lr": 2.9966219477924996e-06} +{"train_loss": 0.0009397227549925447, "global_step": 63547, "epoch": 534, "lr": 2.9958665312040056e-06} +{"train_loss": 0.00022411264944821596, "global_step": 63548, "epoch": 534, "lr": 2.9951112069031117e-06} +{"train_loss": 0.00022013770649209619, "global_step": 63549, "epoch": 534, "lr": 2.9943559748912996e-06} +{"train_loss": 0.00035495631163939834, "global_step": 63550, "epoch": 534, "lr": 2.9936008351700408e-06} +{"train_loss": 0.00032468524295836687, "global_step": 63551, "epoch": 534, "lr": 2.9928457877408334e-06} +{"train_loss": 0.00021920959989074618, "global_step": 63552, "epoch": 534, "lr": 2.9920908326051376e-06} +{"train_loss": 0.0004066348192282021, "global_step": 63553, "epoch": 534, "lr": 2.9913359697644637e-06} +{"train_loss": 0.0007476165774278343, "global_step": 63554, "epoch": 534, "lr": 2.9905811992202657e-06} +{"train_loss": 0.00048029818572103977, "global_step": 63555, "epoch": 534, "lr": 2.989826520974054e-06} +{"train_loss": 0.000353515351889655, "global_step": 63556, "epoch": 534, "lr": 2.989071935027288e-06} +{"train_loss": 0.0002356237091589719, "global_step": 63557, "epoch": 534, "lr": 2.9883174413814552e-06} +{"train_loss": 0.0006424267194233835, "global_step": 63558, "epoch": 534, "lr": 2.987563040038044e-06} +{"train_loss": 0.000270308752078563, "global_step": 63559, "epoch": 534, "lr": 2.986808730998525e-06} +{"train_loss": 0.00041540773236192763, "global_step": 63560, "epoch": 534, "lr": 2.98605451426438e-06} +{"train_loss": 0.0001986936549656093, "global_step": 63561, "epoch": 534, "lr": 2.9853003898371037e-06} +{"train_loss": 0.00047609108150936663, "global_step": 63562, "epoch": 534, "lr": 2.9845463577181597e-06} +{"train_loss": 0.00021378824021667242, "global_step": 63563, "epoch": 534, "lr": 2.9837924179090426e-06} +{"train_loss": 0.00018653985171113163, "global_step": 63564, "epoch": 534, "lr": 2.983038570411223e-06} +{"train_loss": 0.00029641896253451705, "global_step": 63565, "epoch": 534, "lr": 2.9822848152261886e-06} +{"train_loss": 0.00046039195149205625, "global_step": 63566, "epoch": 534, "lr": 2.9815311523554045e-06} +{"train_loss": 0.0002609499206300825, "global_step": 63567, "epoch": 534, "lr": 2.9807775818003756e-06} +{"train_loss": 0.00022193351469468325, "global_step": 63568, "epoch": 534, "lr": 2.980024103562562e-06} +{"train_loss": 0.00042418111115694046, "global_step": 63569, "epoch": 534, "lr": 2.9792707176434397e-06} +{"train_loss": 0.0003131854464299977, "global_step": 63570, "epoch": 534, "lr": 2.9785174240445023e-06} +{"train_loss": 0.0002314703306183219, "global_step": 63571, "epoch": 534, "lr": 2.977764222767221e-06} +{"train_loss": 0.00016457930905744433, "global_step": 63572, "epoch": 534, "lr": 2.9770111138130775e-06} +{"train_loss": 0.0002961623831652105, "global_step": 63573, "epoch": 534, "lr": 2.976258097183543e-06} +{"train_loss": 0.00031132830190472305, "global_step": 63574, "epoch": 534, "lr": 2.9755051728801107e-06} +{"train_loss": 0.0002775154425762594, "global_step": 63575, "epoch": 534, "lr": 2.9747523409042464e-06} +{"train_loss": 0.00035597255919128656, "global_step": 63576, "epoch": 534, "lr": 2.973999601257427e-06} +{"train_loss": 0.0006421397556550801, "global_step": 63577, "epoch": 534, "lr": 2.9732469539411444e-06} +{"train_loss": 0.00026909896405413747, "global_step": 63578, "epoch": 534, "lr": 2.97249439895686e-06} +{"train_loss": 0.00039553086389787495, "global_step": 63579, "epoch": 534, "lr": 2.971741936306066e-06} +{"train_loss": 0.00016586383571848273, "global_step": 63580, "epoch": 534, "lr": 2.9709895659902287e-06} +{"train_loss": 0.00022750980861019343, "global_step": 63581, "epoch": 534, "lr": 2.9702372880108243e-06} +{"train_loss": 0.0003146589733660221, "global_step": 63582, "epoch": 534, "lr": 2.969485102369346e-06} +{"train_loss": 0.00034300738479942083, "global_step": 63583, "epoch": 534, "lr": 2.9687330090672483e-06} +{"train_loss": 0.0002260937326354906, "global_step": 63584, "epoch": 534, "lr": 2.9679810081060243e-06} +{"train_loss": 0.0002185899647884071, "global_step": 63585, "epoch": 534, "lr": 2.96722909948714e-06} +{"train_loss": 0.00017804988601710647, "global_step": 63586, "epoch": 534, "lr": 2.9664772832120824e-06} +{"train_loss": 0.00031203264370560646, "global_step": 63587, "epoch": 534, "lr": 2.965725559282323e-06} +{"train_loss": 0.0005616601556539536, "global_step": 63588, "epoch": 534, "lr": 2.9649739276993273e-06} +{"train_loss": 0.0005929285543970764, "global_step": 63589, "epoch": 534, "lr": 2.964222388464588e-06} +{"train_loss": 0.00029514648485928774, "global_step": 63590, "epoch": 534, "lr": 2.963470941579566e-06} +{"train_loss": 0.0005071776686236262, "global_step": 63591, "epoch": 534, "lr": 2.962719587045754e-06} +{"train_loss": 0.00022746319882571697, "global_step": 63592, "epoch": 534, "lr": 2.9619683248646055e-06} +{"train_loss": 0.00035512252361513674, "global_step": 63593, "epoch": 534, "lr": 2.9612171550376157e-06} +{"train_loss": 0.00014814699534326792, "global_step": 63594, "epoch": 534, "lr": 2.9604660775662487e-06} +{"train_loss": 0.00025680565158836544, "global_step": 63595, "epoch": 534, "lr": 2.959715092451976e-06} +{"train_loss": 0.0002512035134714097, "global_step": 63596, "epoch": 534, "lr": 2.9589641996962846e-06} +{"train_loss": 0.0003047542995773256, "global_step": 63597, "epoch": 534, "lr": 2.95821339930063e-06} +{"train_loss": 0.00019057410827372223, "global_step": 63598, "epoch": 534, "lr": 2.9574626912665104e-06} +{"train_loss": 0.00021734311303589493, "global_step": 63599, "epoch": 534, "lr": 2.9567120755953857e-06} +{"train_loss": 0.00035623324220068753, "global_step": 63600, "epoch": 534, "lr": 2.9559615522887273e-06} +{"train_loss": 0.0004977735225111246, "global_step": 63601, "epoch": 534, "lr": 2.955211121348017e-06} +{"train_loss": 0.00021556475257966667, "global_step": 63602, "epoch": 534, "lr": 2.954460782774715e-06} +{"train_loss": 0.0002886238507926464, "global_step": 63603, "epoch": 534, "lr": 2.953710536570309e-06} +{"train_loss": 0.0003775462682824582, "global_step": 63604, "epoch": 534, "lr": 2.952960382736264e-06} +{"train_loss": 0.00021554929844569415, "global_step": 63605, "epoch": 534, "lr": 2.952210321274057e-06} +{"train_loss": 0.00034992193104699254, "global_step": 63606, "epoch": 534, "lr": 2.951460352185159e-06} +{"train_loss": 0.0001578985684318468, "global_step": 63607, "epoch": 534, "lr": 2.9507104754710413e-06} +{"train_loss": 0.000317523255944252, "global_step": 63608, "epoch": 534, "lr": 2.94996069113318e-06} +{"train_loss": 0.00028198532527312636, "global_step": 63609, "epoch": 534, "lr": 2.9492109991730355e-06} +{"train_loss": 0.0005481262924149632, "global_step": 63610, "epoch": 534, "lr": 2.9484613995921007e-06} +{"train_loss": 0.0004120056109968573, "global_step": 63611, "epoch": 534, "lr": 2.9477118923918244e-06} +{"train_loss": 0.00019292494107503444, "global_step": 63612, "epoch": 534, "lr": 2.9469624775736946e-06} +{"train_loss": 0.0007899999036453664, "global_step": 63613, "epoch": 534, "lr": 2.946213155139177e-06} +{"train_loss": 0.00017837890482041985, "global_step": 63614, "epoch": 534, "lr": 2.945463925089742e-06} +{"train_loss": 0.00022064914810471237, "global_step": 63615, "epoch": 534, "lr": 2.944714787426861e-06} +{"train_loss": 0.00031621914240531623, "global_step": 63616, "epoch": 534, "lr": 2.943965742152005e-06} +{"train_loss": 0.0004434462753124535, "global_step": 63617, "epoch": 534, "lr": 2.9432167892666505e-06} +{"train_loss": 0.0005146870389580727, "global_step": 63618, "epoch": 534, "lr": 2.942467928772258e-06} +{"train_loss": 0.00030828395392745733, "global_step": 63619, "epoch": 534, "lr": 2.9417191606702976e-06} +{"train_loss": 0.00023357449390459806, "global_step": 63620, "epoch": 534, "lr": 2.9409704849622523e-06} +{"train_loss": 0.00039614515844732523, "global_step": 63621, "epoch": 534, "lr": 2.940221901649576e-06} +{"train_loss": 0.00026891095330938697, "global_step": 63622, "epoch": 534, "lr": 2.939473410733756e-06} +{"train_loss": 0.0002579286228865385, "global_step": 63623, "epoch": 534, "lr": 2.9387250122162424e-06} +{"train_loss": 0.00023051189782563597, "global_step": 63624, "epoch": 534, "lr": 2.937976706098522e-06} +{"train_loss": 0.0004152804031036794, "global_step": 63625, "epoch": 534, "lr": 2.937228492382049e-06} +{"train_loss": 0.0003152645076625049, "global_step": 63626, "epoch": 534, "lr": 2.936480371068312e-06} +{"train_loss": 0.00030345292179845273, "global_step": 63627, "epoch": 534, "lr": 2.9357323421587534e-06} +{"train_loss": 0.0004208291065879166, "global_step": 63628, "epoch": 534, "lr": 2.934984405654867e-06} +{"train_loss": 0.00027767400024458766, "global_step": 63629, "epoch": 534, "lr": 2.934236561558107e-06} +{"train_loss": 0.0003316011861898005, "global_step": 63630, "epoch": 534, "lr": 2.9334888098699442e-06} +{"train_loss": 0.0002611689269542694, "global_step": 63631, "epoch": 534, "lr": 2.9327411505918447e-06} +{"train_loss": 0.00032541286782361567, "global_step": 63632, "epoch": 534, "lr": 2.93199358372529e-06} +{"train_loss": 0.0003430597425904125, "global_step": 63633, "epoch": 534, "lr": 2.9312461092717293e-06} +{"train_loss": 0.0002582992019597441, "global_step": 63634, "epoch": 534, "lr": 2.930498727232639e-06} +{"train_loss": 0.00018030010687652975, "global_step": 63635, "epoch": 534, "lr": 2.929751437609485e-06} +{"train_loss": 0.00039548586937598884, "global_step": 63636, "epoch": 534, "lr": 2.929004240403738e-06} +{"train_loss": 0.0002268546522827819, "global_step": 63637, "epoch": 534, "lr": 2.9282571356168687e-06} +{"train_loss": 0.00030426663579419255, "global_step": 63638, "epoch": 534, "lr": 2.9275101232503265e-06} +{"train_loss": 0.00025772530352696776, "global_step": 63639, "epoch": 534, "lr": 2.9267632033055935e-06} +{"train_loss": 0.0002680459583643824, "global_step": 63640, "epoch": 534, "lr": 2.9260163757841296e-06} +{"train_loss": 0.0003227158449590206, "global_step": 63641, "epoch": 534, "lr": 2.9252696406874114e-06} +{"train_loss": 0.0006258238572627306, "global_step": 63642, "epoch": 534, "lr": 2.9245229980168876e-06} +{"train_loss": 0.00017853776807896793, "global_step": 63643, "epoch": 534, "lr": 2.9237764477740404e-06} +{"train_loss": 0.00024845849839039147, "global_step": 63644, "epoch": 534, "lr": 2.923029989960324e-06} +{"train_loss": 0.00025506442761979997, "global_step": 63645, "epoch": 534, "lr": 2.92228362457721e-06} +{"train_loss": 0.0004250801866874099, "global_step": 63646, "epoch": 534, "lr": 2.9215373516261636e-06} +{"train_loss": 0.00020350218983367085, "global_step": 63647, "epoch": 534, "lr": 2.9207911711086446e-06} +{"train_loss": 0.00031987385591492057, "global_step": 63648, "epoch": 534, "lr": 2.9200450830261294e-06} +{"train_loss": 0.00023220464936457574, "global_step": 63649, "epoch": 534, "lr": 2.9192990873800784e-06} +{"train_loss": 0.0003136908635497093, "global_step": 63650, "epoch": 534, "lr": 2.918553184171946e-06} +{"train_loss": 0.000289568561129272, "global_step": 63651, "epoch": 534, "lr": 2.9178073734032086e-06} +{"train_loss": 0.0004857097228523344, "global_step": 63652, "epoch": 534, "lr": 2.9170616550753206e-06} +{"train_loss": 0.0003122398629784584, "global_step": 63653, "epoch": 534, "lr": 2.9163160291897586e-06} +{"train_loss": 0.0005454084603115916, "global_step": 63654, "epoch": 534, "lr": 2.915570495747971e-06} +{"train_loss": 0.0002379173383815214, "global_step": 63655, "epoch": 534, "lr": 2.914825054751441e-06} +{"train_loss": 0.0005739277112297714, "global_step": 63656, "epoch": 534, "lr": 2.9140797062016168e-06} +{"train_loss": 0.000569015508517623, "global_step": 63657, "epoch": 534, "lr": 2.9133344500999693e-06} +{"train_loss": 0.00024268710694741458, "global_step": 63658, "epoch": 534, "lr": 2.912589286447953e-06} +{"train_loss": 0.0003464028413873166, "global_step": 63659, "epoch": 534, "lr": 2.911844215247045e-06} +{"train_loss": 0.0005568914930336177, "global_step": 63660, "epoch": 534, "lr": 2.9110992364986933e-06} +{"train_loss": 0.0006204285891726613, "global_step": 63661, "epoch": 534, "lr": 2.910354350204375e-06} +{"train_loss": 0.00034351981594227254, "global_step": 63662, "epoch": 534, "lr": 2.9096095563655333e-06} +{"train_loss": 0.0002993951493408531, "global_step": 63663, "epoch": 534, "lr": 2.908864854983656e-06} +{"train_loss": 0.0003374979102215143, "global_step": 63664, "epoch": 534, "lr": 2.908120246060181e-06, "val_loss": 0.04478009045124054} +{"train_loss": 0.000289342540781945, "global_step": 63665, "epoch": 535, "lr": 2.9073757295965897e-06} +{"train_loss": 0.000689586391672492, "global_step": 63666, "epoch": 535, "lr": 2.9066313055943264e-06} +{"train_loss": 0.00029819668270647526, "global_step": 63667, "epoch": 535, "lr": 2.9058869740548665e-06} +{"train_loss": 0.00035850232234224677, "global_step": 63668, "epoch": 535, "lr": 2.9051427349796713e-06} +{"train_loss": 0.00021537163411267102, "global_step": 63669, "epoch": 535, "lr": 2.9043985883701886e-06} +{"train_loss": 0.00016314124513883144, "global_step": 63670, "epoch": 535, "lr": 2.90365453422789e-06} +{"train_loss": 0.0001919812784763053, "global_step": 63671, "epoch": 535, "lr": 2.902910572554235e-06} +{"train_loss": 0.0003922651812899858, "global_step": 63672, "epoch": 535, "lr": 2.902166703350684e-06} +{"train_loss": 0.00026007011183537543, "global_step": 63673, "epoch": 535, "lr": 2.901422926618691e-06} +{"train_loss": 0.00021454272791743279, "global_step": 63674, "epoch": 535, "lr": 2.9006792423597327e-06} +{"train_loss": 0.00015901910956017673, "global_step": 63675, "epoch": 535, "lr": 2.8999356505752585e-06} +{"train_loss": 0.0007452938589267433, "global_step": 63676, "epoch": 535, "lr": 2.8991921512667164e-06} +{"train_loss": 0.0002753031440079212, "global_step": 63677, "epoch": 535, "lr": 2.898448744435589e-06} +{"train_loss": 0.00018844290752895176, "global_step": 63678, "epoch": 535, "lr": 2.8977054300833195e-06} +{"train_loss": 0.00019509022240526974, "global_step": 63679, "epoch": 535, "lr": 2.896962208211379e-06} +{"train_loss": 0.00032592102070339024, "global_step": 63680, "epoch": 535, "lr": 2.8962190788212216e-06} +{"train_loss": 0.00025515659945085645, "global_step": 63681, "epoch": 535, "lr": 2.8954760419143025e-06} +{"train_loss": 0.00016970407159533352, "global_step": 63682, "epoch": 535, "lr": 2.894733097492086e-06} +{"train_loss": 0.00015438863192684948, "global_step": 63683, "epoch": 535, "lr": 2.893990245556022e-06} +{"train_loss": 0.00047386891674250364, "global_step": 63684, "epoch": 535, "lr": 2.893247486107581e-06} +{"train_loss": 0.00017451756866648793, "global_step": 63685, "epoch": 535, "lr": 2.8925048191482118e-06} +{"train_loss": 0.0003916295536328107, "global_step": 63686, "epoch": 535, "lr": 2.891762244679386e-06} +{"train_loss": 0.0004673252406064421, "global_step": 63687, "epoch": 535, "lr": 2.891019762702546e-06} +{"train_loss": 0.00024412517086602747, "global_step": 63688, "epoch": 535, "lr": 2.8902773732191525e-06} +{"train_loss": 0.000205283155082725, "global_step": 63689, "epoch": 535, "lr": 2.889535076230676e-06} +{"train_loss": 0.0003598056791815907, "global_step": 63690, "epoch": 535, "lr": 2.888792871738555e-06} +{"train_loss": 0.0004282319569028914, "global_step": 63691, "epoch": 535, "lr": 2.888050759744254e-06} +{"train_loss": 0.0003102784976363182, "global_step": 63692, "epoch": 535, "lr": 2.8873087402492393e-06} +{"train_loss": 0.000879927072674036, "global_step": 63693, "epoch": 535, "lr": 2.8865668132549538e-06} +{"train_loss": 0.0001864254445536062, "global_step": 63694, "epoch": 535, "lr": 2.885824978762869e-06} +{"train_loss": 0.00046058493899181485, "global_step": 63695, "epoch": 535, "lr": 2.8850832367744273e-06} +{"train_loss": 0.0002295150188729167, "global_step": 63696, "epoch": 535, "lr": 2.8843415872911005e-06} +{"train_loss": 0.000297735066851601, "global_step": 63697, "epoch": 535, "lr": 2.8836000303143264e-06} +{"train_loss": 0.0004857926396653056, "global_step": 63698, "epoch": 535, "lr": 2.8828585658455755e-06} +{"train_loss": 0.0005988593329675496, "global_step": 63699, "epoch": 535, "lr": 2.8821171938862966e-06} +{"train_loss": 0.00023685164342168719, "global_step": 63700, "epoch": 535, "lr": 2.881375914437945e-06} +{"train_loss": 0.0004734403919428587, "global_step": 63701, "epoch": 535, "lr": 2.8806347275019795e-06} +{"train_loss": 0.0002613744291011244, "global_step": 63702, "epoch": 535, "lr": 2.8798936330798496e-06} +{"train_loss": 0.00018227101827505976, "global_step": 63703, "epoch": 535, "lr": 2.879152631173021e-06} +{"train_loss": 0.0005231931572780013, "global_step": 63704, "epoch": 535, "lr": 2.8784117217829366e-06} +{"train_loss": 0.00032879228820092976, "global_step": 63705, "epoch": 535, "lr": 2.8776709049110618e-06} +{"train_loss": 0.00030616644653491676, "global_step": 63706, "epoch": 535, "lr": 2.8769301805588454e-06} +{"train_loss": 0.0005200302693992853, "global_step": 63707, "epoch": 535, "lr": 2.8761895487277367e-06} +{"train_loss": 0.00043000237201340497, "global_step": 63708, "epoch": 535, "lr": 2.875449009419201e-06} +{"train_loss": 0.0001558312214910984, "global_step": 63709, "epoch": 535, "lr": 2.8747085626346815e-06} +{"train_loss": 0.0001473829906899482, "global_step": 63710, "epoch": 535, "lr": 2.873968208375638e-06} +{"train_loss": 0.0003933726984541863, "global_step": 63711, "epoch": 535, "lr": 2.873227946643525e-06} +{"train_loss": 0.000298883649520576, "global_step": 63712, "epoch": 535, "lr": 2.8724877774397973e-06} +{"train_loss": 0.0003029104263987392, "global_step": 63713, "epoch": 535, "lr": 2.871747700765903e-06} +{"train_loss": 0.0005787324625998735, "global_step": 63714, "epoch": 535, "lr": 2.871007716623292e-06} +{"train_loss": 0.00040848509524948895, "global_step": 63715, "epoch": 535, "lr": 2.8702678250134284e-06} +{"train_loss": 0.00021123157057445496, "global_step": 63716, "epoch": 535, "lr": 2.8695280259377567e-06} +{"train_loss": 0.0004131323075853288, "global_step": 63717, "epoch": 535, "lr": 2.8687883193977362e-06} +{"train_loss": 0.00016566930571570992, "global_step": 63718, "epoch": 535, "lr": 2.8680487053948104e-06} +{"train_loss": 0.00026248666108585894, "global_step": 63719, "epoch": 535, "lr": 2.8673091839304335e-06} +{"train_loss": 0.00029207635088823736, "global_step": 63720, "epoch": 535, "lr": 2.8665697550060655e-06} +{"train_loss": 0.0002631680981721729, "global_step": 63721, "epoch": 535, "lr": 2.8658304186231445e-06} +{"train_loss": 0.00021309313888195902, "global_step": 63722, "epoch": 535, "lr": 2.8650911747831356e-06} +{"train_loss": 0.00034952446003444493, "global_step": 63723, "epoch": 535, "lr": 2.8643520234874765e-06} +{"train_loss": 0.0002970593923237175, "global_step": 63724, "epoch": 535, "lr": 2.8636129647376387e-06} +{"train_loss": 0.0004698947013821453, "global_step": 63725, "epoch": 535, "lr": 2.8628739985350483e-06} +{"train_loss": 0.0002270691329613328, "global_step": 63726, "epoch": 535, "lr": 2.8621351248811824e-06} +{"train_loss": 0.0002568696509115398, "global_step": 63727, "epoch": 535, "lr": 2.861396343777467e-06} +{"train_loss": 0.0002818772045429796, "global_step": 63728, "epoch": 535, "lr": 2.8606576552253627e-06} +{"train_loss": 0.00037511761183850467, "global_step": 63729, "epoch": 535, "lr": 2.859919059226329e-06} +{"train_loss": 0.00020605410099960864, "global_step": 63730, "epoch": 535, "lr": 2.859180555781804e-06} +{"train_loss": 0.00024617198505438864, "global_step": 63731, "epoch": 535, "lr": 2.8584421448932475e-06} +{"train_loss": 0.00025596815976314247, "global_step": 63732, "epoch": 535, "lr": 2.8577038265621024e-06} +{"train_loss": 0.00016780980513431132, "global_step": 63733, "epoch": 535, "lr": 2.8569656007898126e-06} +{"train_loss": 0.00029282638570293784, "global_step": 63734, "epoch": 535, "lr": 2.8562274675778434e-06} +{"train_loss": 0.00015353744674939662, "global_step": 63735, "epoch": 535, "lr": 2.855489426927627e-06} +{"train_loss": 0.00039038361865095794, "global_step": 63736, "epoch": 535, "lr": 2.8547514788406227e-06} +{"train_loss": 0.0002909734903369099, "global_step": 63737, "epoch": 535, "lr": 2.8540136233182803e-06} +{"train_loss": 0.0006595815066248178, "global_step": 63738, "epoch": 535, "lr": 2.8532758603620426e-06} +{"train_loss": 0.00023713379050605, "global_step": 63739, "epoch": 535, "lr": 2.852538189973364e-06} +{"train_loss": 0.00022479324252344668, "global_step": 63740, "epoch": 535, "lr": 2.8518006121536823e-06} +{"train_loss": 0.00041204836452379823, "global_step": 63741, "epoch": 535, "lr": 2.851063126904463e-06} +{"train_loss": 0.00030122286989353597, "global_step": 63742, "epoch": 535, "lr": 2.8503257342271327e-06} +{"train_loss": 0.00041218343540094793, "global_step": 63743, "epoch": 535, "lr": 2.8495884341231573e-06} +{"train_loss": 0.00019078330660704523, "global_step": 63744, "epoch": 535, "lr": 2.8488512265939847e-06} +{"train_loss": 0.00020173015946056694, "global_step": 63745, "epoch": 535, "lr": 2.8481141116410425e-06} +{"train_loss": 0.00038051482988521457, "global_step": 63746, "epoch": 535, "lr": 2.847377089265796e-06} +{"train_loss": 0.000193557541933842, "global_step": 63747, "epoch": 535, "lr": 2.846640159469688e-06} +{"train_loss": 0.00037525055813603103, "global_step": 63748, "epoch": 535, "lr": 2.845903322254162e-06} +{"train_loss": 0.00036917621036991477, "global_step": 63749, "epoch": 535, "lr": 2.845166577620673e-06} +{"train_loss": 0.00023493837215937674, "global_step": 63750, "epoch": 535, "lr": 2.8444299255706574e-06} +{"train_loss": 0.0005821032682433724, "global_step": 63751, "epoch": 535, "lr": 2.8436933661055656e-06} +{"train_loss": 0.00019799872825387865, "global_step": 63752, "epoch": 535, "lr": 2.8429568992268394e-06} +{"train_loss": 0.0006483899778686464, "global_step": 63753, "epoch": 535, "lr": 2.84222052493594e-06} +{"train_loss": 0.0003191886644344777, "global_step": 63754, "epoch": 535, "lr": 2.8414842432342935e-06} +{"train_loss": 0.00025816739071160555, "global_step": 63755, "epoch": 535, "lr": 2.84074805412336e-06} +{"train_loss": 0.00029840946081094444, "global_step": 63756, "epoch": 535, "lr": 2.8400119576045714e-06} +{"train_loss": 0.00014435993216466159, "global_step": 63757, "epoch": 535, "lr": 2.8392759536793932e-06} +{"train_loss": 0.00025551943690516055, "global_step": 63758, "epoch": 535, "lr": 2.838540042349247e-06} +{"train_loss": 0.00014813218149356544, "global_step": 63759, "epoch": 535, "lr": 2.8378042236155976e-06} +{"train_loss": 0.00016274204244837165, "global_step": 63760, "epoch": 535, "lr": 2.8370684974798724e-06} +{"train_loss": 0.0002536180545575917, "global_step": 63761, "epoch": 535, "lr": 2.8363328639435305e-06} +{"train_loss": 0.00027001972193829715, "global_step": 63762, "epoch": 535, "lr": 2.8355973230080046e-06} +{"train_loss": 0.00022980128414928913, "global_step": 63763, "epoch": 535, "lr": 2.8348618746747546e-06} +{"train_loss": 0.0003404894086997956, "global_step": 63764, "epoch": 535, "lr": 2.834126518945207e-06} +{"train_loss": 0.00026608718326315284, "global_step": 63765, "epoch": 535, "lr": 2.8333912558208164e-06} +{"train_loss": 0.0002603317843750119, "global_step": 63766, "epoch": 535, "lr": 2.8326560853030204e-06} +{"train_loss": 0.00017602216394152492, "global_step": 63767, "epoch": 535, "lr": 2.8319210073932677e-06} +{"train_loss": 0.00022929035185370594, "global_step": 63768, "epoch": 535, "lr": 2.831186022093002e-06} +{"train_loss": 0.00023160189448390156, "global_step": 63769, "epoch": 535, "lr": 2.830451129403655e-06} +{"train_loss": 0.0003379920672159642, "global_step": 63770, "epoch": 535, "lr": 2.829716329326687e-06} +{"train_loss": 0.0003768819151446223, "global_step": 63771, "epoch": 535, "lr": 2.828981621863519e-06} +{"train_loss": 0.00047007776447571814, "global_step": 63772, "epoch": 535, "lr": 2.8282470070156166e-06} +{"train_loss": 0.000135684764245525, "global_step": 63773, "epoch": 535, "lr": 2.827512484784406e-06} +{"train_loss": 0.0002704801445361227, "global_step": 63774, "epoch": 535, "lr": 2.826778055171342e-06} +{"train_loss": 0.00025353473029099405, "global_step": 63775, "epoch": 535, "lr": 2.8260437181778567e-06} +{"train_loss": 0.0002396240597590804, "global_step": 63776, "epoch": 535, "lr": 2.825309473805393e-06} +{"train_loss": 0.00025937645114026964, "global_step": 63777, "epoch": 535, "lr": 2.824575322055395e-06} +{"train_loss": 0.00018046765762846917, "global_step": 63778, "epoch": 535, "lr": 2.8238412629292997e-06} +{"train_loss": 0.00015589245595037937, "global_step": 63779, "epoch": 535, "lr": 2.8231072964285567e-06} +{"train_loss": 0.00027490421780385077, "global_step": 63780, "epoch": 535, "lr": 2.822373422554597e-06} +{"train_loss": 0.00033576422720216215, "global_step": 63781, "epoch": 535, "lr": 2.8216396413088764e-06} +{"train_loss": 0.0002456969232298434, "global_step": 63782, "epoch": 535, "lr": 2.820905952692826e-06} +{"train_loss": 0.00030832829923826824, "global_step": 63783, "epoch": 535, "lr": 2.820172356707873e-06, "val_loss": 0.037245672196149826, "train_action_mse_error": 5.338222763384692e-06} +{"train_loss": 0.0002642391191329807, "global_step": 63784, "epoch": 536, "lr": 2.8194388533554826e-06} +{"train_loss": 0.00042529311031103134, "global_step": 63785, "epoch": 536, "lr": 2.818705442637076e-06} +{"train_loss": 0.00018477901176083833, "global_step": 63786, "epoch": 536, "lr": 2.817972124554108e-06} +{"train_loss": 0.0002703079953789711, "global_step": 63787, "epoch": 536, "lr": 2.817238899108016e-06} +{"train_loss": 0.0002321566134924069, "global_step": 63788, "epoch": 536, "lr": 2.8165057663002202e-06} +{"train_loss": 0.00019719285774044693, "global_step": 63789, "epoch": 536, "lr": 2.8157727261321763e-06} +{"train_loss": 0.0002910960465669632, "global_step": 63790, "epoch": 536, "lr": 2.8150397786053328e-06} +{"train_loss": 0.00023665785556659102, "global_step": 63791, "epoch": 536, "lr": 2.814306923721105e-06} +{"train_loss": 0.0002851312165148556, "global_step": 63792, "epoch": 536, "lr": 2.813574161480953e-06} +{"train_loss": 0.0003050318919122219, "global_step": 63793, "epoch": 536, "lr": 2.8128414918863033e-06} +{"train_loss": 0.0002213844854850322, "global_step": 63794, "epoch": 536, "lr": 2.8121089149385994e-06} +{"train_loss": 0.0004491860745474696, "global_step": 63795, "epoch": 536, "lr": 2.8113764306392788e-06} +{"train_loss": 0.0003052616957575083, "global_step": 63796, "epoch": 536, "lr": 2.8106440389897793e-06} +{"train_loss": 0.0006254892796278, "global_step": 63797, "epoch": 536, "lr": 2.8099117399915388e-06} +{"train_loss": 0.0003708553849719465, "global_step": 63798, "epoch": 536, "lr": 2.8091795336459947e-06} +{"train_loss": 0.0004823849303647876, "global_step": 63799, "epoch": 536, "lr": 2.8084474199545907e-06} +{"train_loss": 0.00020681046589743346, "global_step": 63800, "epoch": 536, "lr": 2.807715398918748e-06} +{"train_loss": 0.00029711518436670303, "global_step": 63801, "epoch": 536, "lr": 2.80698347053992e-06} +{"train_loss": 0.00020686360949184746, "global_step": 63802, "epoch": 536, "lr": 2.8062516348195343e-06} +{"train_loss": 0.00022597071074414998, "global_step": 63803, "epoch": 536, "lr": 2.8055198917590397e-06} +{"train_loss": 0.0002621236490085721, "global_step": 63804, "epoch": 536, "lr": 2.804788241359857e-06} +{"train_loss": 0.00020483146363403648, "global_step": 63805, "epoch": 536, "lr": 2.804056683623435e-06} +{"train_loss": 0.00033125668414868414, "global_step": 63806, "epoch": 536, "lr": 2.803325218551206e-06} +{"train_loss": 0.0005073040956631303, "global_step": 63807, "epoch": 536, "lr": 2.802593846144602e-06} +{"train_loss": 0.00019185671408195049, "global_step": 63808, "epoch": 536, "lr": 2.801862566405067e-06} +{"train_loss": 0.00025315850507467985, "global_step": 63809, "epoch": 536, "lr": 2.8011313793340268e-06} +{"train_loss": 0.00047989096492528915, "global_step": 63810, "epoch": 536, "lr": 2.8004002849329247e-06} +{"train_loss": 0.0002003862027777359, "global_step": 63811, "epoch": 536, "lr": 2.7996692832031936e-06} +{"train_loss": 0.00021911552175879478, "global_step": 63812, "epoch": 536, "lr": 2.798938374146276e-06} +{"train_loss": 0.00027808264712803066, "global_step": 63813, "epoch": 536, "lr": 2.7982075577635934e-06} +{"train_loss": 0.00025577223277650774, "global_step": 63814, "epoch": 536, "lr": 2.7974768340565894e-06} +{"train_loss": 0.00033372422331012785, "global_step": 63815, "epoch": 536, "lr": 2.7967462030266953e-06} +{"train_loss": 0.0004694423114415258, "global_step": 63816, "epoch": 536, "lr": 2.7960156646753445e-06} +{"train_loss": 0.00024930768995545805, "global_step": 63817, "epoch": 536, "lr": 2.7952852190039844e-06} +{"train_loss": 0.00023127923486754298, "global_step": 63818, "epoch": 536, "lr": 2.794554866014032e-06} +{"train_loss": 0.00036898039979860187, "global_step": 63819, "epoch": 536, "lr": 2.793824605706924e-06} +{"train_loss": 0.00034775727544911206, "global_step": 63820, "epoch": 536, "lr": 2.7930944380841095e-06} +{"train_loss": 0.0004513124586082995, "global_step": 63821, "epoch": 536, "lr": 2.7923643631469985e-06} +{"train_loss": 0.00030807158327661455, "global_step": 63822, "epoch": 536, "lr": 2.791634380897046e-06} +{"train_loss": 0.0004292292578611523, "global_step": 63823, "epoch": 536, "lr": 2.790904491335666e-06} +{"train_loss": 0.00023664190666750073, "global_step": 63824, "epoch": 536, "lr": 2.7901746944643035e-06} +{"train_loss": 0.00022085751697886735, "global_step": 63825, "epoch": 536, "lr": 2.7894449902843954e-06} +{"train_loss": 0.0003566499217413366, "global_step": 63826, "epoch": 536, "lr": 2.788715378797363e-06} +{"train_loss": 0.00035110017051920295, "global_step": 63827, "epoch": 536, "lr": 2.787985860004649e-06} +{"train_loss": 0.00026920344680547714, "global_step": 63828, "epoch": 536, "lr": 2.7872564339076757e-06} +{"train_loss": 0.0003634396125562489, "global_step": 63829, "epoch": 536, "lr": 2.786527100507885e-06} +{"train_loss": 0.0003538002783898264, "global_step": 63830, "epoch": 536, "lr": 2.785797859806699e-06} +{"train_loss": 0.0003677470958791673, "global_step": 63831, "epoch": 536, "lr": 2.785068711805561e-06} +{"train_loss": 0.0002705463266465813, "global_step": 63832, "epoch": 536, "lr": 2.7843396565058964e-06} +{"train_loss": 0.0003376641543582082, "global_step": 63833, "epoch": 536, "lr": 2.7836106939091332e-06} +{"train_loss": 0.0005183881148695946, "global_step": 63834, "epoch": 536, "lr": 2.7828818240167088e-06} +{"train_loss": 0.00029775031725876033, "global_step": 63835, "epoch": 536, "lr": 2.782153046830044e-06} +{"train_loss": 0.0005458301166072488, "global_step": 63836, "epoch": 536, "lr": 2.7814243623505876e-06} +{"train_loss": 0.0003188952978234738, "global_step": 63837, "epoch": 536, "lr": 2.780695770579761e-06} +{"train_loss": 0.00020377934561111033, "global_step": 63838, "epoch": 536, "lr": 2.779967271518985e-06} +{"train_loss": 0.00046148934052325785, "global_step": 63839, "epoch": 536, "lr": 2.7792388651697033e-06} +{"train_loss": 0.0002911763440351933, "global_step": 63840, "epoch": 536, "lr": 2.7785105515333364e-06} +{"train_loss": 0.00020380117348395288, "global_step": 63841, "epoch": 536, "lr": 2.7777823306113227e-06} +{"train_loss": 0.0003118072054348886, "global_step": 63842, "epoch": 536, "lr": 2.777054202405088e-06} +{"train_loss": 0.00018304870172869414, "global_step": 63843, "epoch": 536, "lr": 2.7763261669160655e-06} +{"train_loss": 0.0001374111307086423, "global_step": 63844, "epoch": 536, "lr": 2.7755982241456813e-06} +{"train_loss": 0.00028235846548341215, "global_step": 63845, "epoch": 536, "lr": 2.7748703740953562e-06} +{"train_loss": 0.0006281214882619679, "global_step": 63846, "epoch": 536, "lr": 2.774142616766534e-06} +{"train_loss": 0.00031143700471147895, "global_step": 63847, "epoch": 536, "lr": 2.7734149521606356e-06} +{"train_loss": 0.00047737424029037356, "global_step": 63848, "epoch": 536, "lr": 2.7726873802790987e-06} +{"train_loss": 0.00023022138339001685, "global_step": 63849, "epoch": 536, "lr": 2.771959901123333e-06} +{"train_loss": 0.00014835396723356098, "global_step": 63850, "epoch": 536, "lr": 2.7712325146947883e-06} +{"train_loss": 0.00015820421685930341, "global_step": 63851, "epoch": 536, "lr": 2.770505220994879e-06} +{"train_loss": 0.000544874812476337, "global_step": 63852, "epoch": 536, "lr": 2.7697780200250324e-06} +{"train_loss": 0.00026860105572268367, "global_step": 63853, "epoch": 536, "lr": 2.7690509117866914e-06} +{"train_loss": 0.0004696012765634805, "global_step": 63854, "epoch": 536, "lr": 2.7683238962812608e-06} +{"train_loss": 0.0006280698580667377, "global_step": 63855, "epoch": 536, "lr": 2.767596973510189e-06} +{"train_loss": 0.0006941345636732876, "global_step": 63856, "epoch": 536, "lr": 2.7668701434748923e-06} +{"train_loss": 0.0003358151006978005, "global_step": 63857, "epoch": 536, "lr": 2.7661434061768022e-06} +{"train_loss": 0.00020584480080287904, "global_step": 63858, "epoch": 536, "lr": 2.7654167616173345e-06} +{"train_loss": 0.0001925047836266458, "global_step": 63859, "epoch": 536, "lr": 2.7646902097979266e-06} +{"train_loss": 0.0005343439406715333, "global_step": 63860, "epoch": 536, "lr": 2.763963750720011e-06} +{"train_loss": 0.0003590764827094972, "global_step": 63861, "epoch": 536, "lr": 2.763237384384998e-06} +{"train_loss": 0.00025554324383847415, "global_step": 63862, "epoch": 536, "lr": 2.7625111107943302e-06} +{"train_loss": 0.0005252209375612438, "global_step": 63863, "epoch": 536, "lr": 2.7617849299494293e-06} +{"train_loss": 0.0002180835435865447, "global_step": 63864, "epoch": 536, "lr": 2.7610588418517046e-06} +{"train_loss": 0.0004045036039315164, "global_step": 63865, "epoch": 536, "lr": 2.7603328465026e-06} +{"train_loss": 0.0003916741698049009, "global_step": 63866, "epoch": 536, "lr": 2.759606943903531e-06} +{"train_loss": 0.0006709884619340301, "global_step": 63867, "epoch": 536, "lr": 2.7588811340559295e-06} +{"train_loss": 0.0002032395132118836, "global_step": 63868, "epoch": 536, "lr": 2.758155416961222e-06} +{"train_loss": 0.0002440164826111868, "global_step": 63869, "epoch": 536, "lr": 2.757429792620825e-06} +{"train_loss": 0.0003053293330594897, "global_step": 63870, "epoch": 536, "lr": 2.7567042610361695e-06} +{"train_loss": 0.0002907730813603848, "global_step": 63871, "epoch": 536, "lr": 2.7559788222086712e-06} +{"train_loss": 0.0002136463299393654, "global_step": 63872, "epoch": 536, "lr": 2.7552534761397684e-06} +{"train_loss": 0.00025679817190393806, "global_step": 63873, "epoch": 536, "lr": 2.754528222830877e-06} +{"train_loss": 0.00027915945975109935, "global_step": 63874, "epoch": 536, "lr": 2.753803062283422e-06} +{"train_loss": 0.0002294298610650003, "global_step": 63875, "epoch": 536, "lr": 2.7530779944988316e-06} +{"train_loss": 0.00015606090892106295, "global_step": 63876, "epoch": 536, "lr": 2.7523530194785152e-06} +{"train_loss": 0.00025492708664387465, "global_step": 63877, "epoch": 536, "lr": 2.7516281372239106e-06} +{"train_loss": 0.00023439554206561297, "global_step": 63878, "epoch": 536, "lr": 2.750903347736433e-06} +{"train_loss": 0.00022330746287479997, "global_step": 63879, "epoch": 536, "lr": 2.7501786510175155e-06} +{"train_loss": 0.00030287622939795256, "global_step": 63880, "epoch": 536, "lr": 2.749454047068567e-06} +{"train_loss": 0.00019913018331862986, "global_step": 63881, "epoch": 536, "lr": 2.748729535891026e-06} +{"train_loss": 0.0002892346237786114, "global_step": 63882, "epoch": 536, "lr": 2.748005117486302e-06} +{"train_loss": 0.0003099247987847775, "global_step": 63883, "epoch": 536, "lr": 2.747280791855822e-06} +{"train_loss": 0.00022015318972989917, "global_step": 63884, "epoch": 536, "lr": 2.746556559001007e-06} +{"train_loss": 0.00020243322069291025, "global_step": 63885, "epoch": 536, "lr": 2.7458324189232775e-06} +{"train_loss": 0.0003568606625776738, "global_step": 63886, "epoch": 536, "lr": 2.7451083716240665e-06} +{"train_loss": 0.0008072241325862706, "global_step": 63887, "epoch": 536, "lr": 2.7443844171047784e-06} +{"train_loss": 0.0003764111315831542, "global_step": 63888, "epoch": 536, "lr": 2.7436605553668447e-06} +{"train_loss": 0.0002333511656615883, "global_step": 63889, "epoch": 536, "lr": 2.7429367864116816e-06} +{"train_loss": 0.0004755138361360878, "global_step": 63890, "epoch": 536, "lr": 2.742213110240721e-06} +{"train_loss": 0.00013991069863550365, "global_step": 63891, "epoch": 536, "lr": 2.741489526855373e-06} +{"train_loss": 0.0002704226935748011, "global_step": 63892, "epoch": 536, "lr": 2.740766036257064e-06} +{"train_loss": 0.00029463949613273144, "global_step": 63893, "epoch": 536, "lr": 2.7400426384472045e-06} +{"train_loss": 0.00016141320520546287, "global_step": 63894, "epoch": 536, "lr": 2.7393193334272315e-06} +{"train_loss": 0.0004773886175826192, "global_step": 63895, "epoch": 536, "lr": 2.7385961211985447e-06} +{"train_loss": 0.00027857019449584186, "global_step": 63896, "epoch": 536, "lr": 2.7378730017625866e-06} +{"train_loss": 0.00017662238678894937, "global_step": 63897, "epoch": 536, "lr": 2.737149975120756e-06} +{"train_loss": 0.0002130100765498355, "global_step": 63898, "epoch": 536, "lr": 2.736427041274492e-06} +{"train_loss": 0.0002746742684394121, "global_step": 63899, "epoch": 536, "lr": 2.7357042002251976e-06} +{"train_loss": 0.00048784600221551955, "global_step": 63900, "epoch": 536, "lr": 2.7349814519743e-06} +{"train_loss": 0.00020319357281550765, "global_step": 63901, "epoch": 536, "lr": 2.73425879652322e-06} +{"train_loss": 0.00031845680581789245, "global_step": 63902, "epoch": 536, "lr": 2.7335362338733683e-06, "val_loss": 0.01910228654742241} +{"train_loss": 0.00028541425126604736, "global_step": 63903, "epoch": 537, "lr": 2.7328137640261706e-06} +{"train_loss": 0.0001628917525522411, "global_step": 63904, "epoch": 537, "lr": 2.7320913869830435e-06} +{"train_loss": 0.0004226084565743804, "global_step": 63905, "epoch": 537, "lr": 2.731369102745407e-06} +{"train_loss": 0.00015620345948264003, "global_step": 63906, "epoch": 537, "lr": 2.730646911314677e-06} +{"train_loss": 0.00040596970939077437, "global_step": 63907, "epoch": 537, "lr": 2.7299248126922696e-06} +{"train_loss": 0.00020985558512620628, "global_step": 63908, "epoch": 537, "lr": 2.729202806879605e-06} +{"train_loss": 0.00035001771175302565, "global_step": 63909, "epoch": 537, "lr": 2.7284808938780994e-06} +{"train_loss": 0.0001904169184854254, "global_step": 63910, "epoch": 537, "lr": 2.7277590736891736e-06} +{"train_loss": 0.00034435681300237775, "global_step": 63911, "epoch": 537, "lr": 2.7270373463142374e-06} +{"train_loss": 0.0008336812607012689, "global_step": 63912, "epoch": 537, "lr": 2.7263157117547233e-06} +{"train_loss": 0.00042339536594226956, "global_step": 63913, "epoch": 537, "lr": 2.725594170012036e-06} +{"train_loss": 0.0003870339714922011, "global_step": 63914, "epoch": 537, "lr": 2.7248727210875845e-06} +{"train_loss": 0.00031196713098324835, "global_step": 63915, "epoch": 537, "lr": 2.724151364982802e-06} +{"train_loss": 0.0003636236651800573, "global_step": 63916, "epoch": 537, "lr": 2.7234301016990926e-06} +{"train_loss": 0.0004777227877639234, "global_step": 63917, "epoch": 537, "lr": 2.722708931237883e-06} +{"train_loss": 0.00018964274204336107, "global_step": 63918, "epoch": 537, "lr": 2.721987853600577e-06} +{"train_loss": 0.00032927829306572676, "global_step": 63919, "epoch": 537, "lr": 2.7212668687886078e-06} +{"train_loss": 0.0005234130658209324, "global_step": 63920, "epoch": 537, "lr": 2.7205459768033734e-06} +{"train_loss": 0.00042880032560788095, "global_step": 63921, "epoch": 537, "lr": 2.719825177646296e-06} +{"train_loss": 0.00020580002455972135, "global_step": 63922, "epoch": 537, "lr": 2.719104471318784e-06} +{"train_loss": 0.0002182406751671806, "global_step": 63923, "epoch": 537, "lr": 2.718383857822271e-06} +{"train_loss": 0.0003809356421697885, "global_step": 63924, "epoch": 537, "lr": 2.7176633371581497e-06} +{"train_loss": 0.0003004959726240486, "global_step": 63925, "epoch": 537, "lr": 2.7169429093278575e-06} +{"train_loss": 0.0002532461076043546, "global_step": 63926, "epoch": 537, "lr": 2.716222574332783e-06} +{"train_loss": 0.0002176087291445583, "global_step": 63927, "epoch": 537, "lr": 2.7155023321743635e-06} +{"train_loss": 0.0003343425632920116, "global_step": 63928, "epoch": 537, "lr": 2.7147821828539975e-06} +{"train_loss": 0.0003064243937842548, "global_step": 63929, "epoch": 537, "lr": 2.714062126373107e-06} +{"train_loss": 0.00031415262492373586, "global_step": 63930, "epoch": 537, "lr": 2.7133421627331013e-06} +{"train_loss": 0.00016962134395726025, "global_step": 63931, "epoch": 537, "lr": 2.712622291935407e-06} +{"train_loss": 0.0003046715573873371, "global_step": 63932, "epoch": 537, "lr": 2.711902513981418e-06} +{"train_loss": 0.00021611103147733957, "global_step": 63933, "epoch": 537, "lr": 2.711182828872555e-06} +{"train_loss": 0.0001661921269260347, "global_step": 63934, "epoch": 537, "lr": 2.710463236610239e-06} +{"train_loss": 0.00033495083334855735, "global_step": 63935, "epoch": 537, "lr": 2.709743737195869e-06} +{"train_loss": 0.0002810780133586377, "global_step": 63936, "epoch": 537, "lr": 2.7090243306308716e-06} +{"train_loss": 0.0002559598069638014, "global_step": 63937, "epoch": 537, "lr": 2.708305016916657e-06} +{"train_loss": 0.00044523068936541677, "global_step": 63938, "epoch": 537, "lr": 2.7075857960546182e-06} +{"train_loss": 0.00032613970688544214, "global_step": 63939, "epoch": 537, "lr": 2.706866668046193e-06} +{"train_loss": 0.00026820425409823656, "global_step": 63940, "epoch": 537, "lr": 2.7061476328927746e-06} +{"train_loss": 0.00016364658949896693, "global_step": 63941, "epoch": 537, "lr": 2.705428690595796e-06} +{"train_loss": 0.00014738566824235022, "global_step": 63942, "epoch": 537, "lr": 2.7047098411566386e-06} +{"train_loss": 0.0003226072294637561, "global_step": 63943, "epoch": 537, "lr": 2.7039910845767457e-06} +{"train_loss": 0.0001904811360873282, "global_step": 63944, "epoch": 537, "lr": 2.703272420857511e-06} +{"train_loss": 0.0004977862699888647, "global_step": 63945, "epoch": 537, "lr": 2.702553850000339e-06} +{"train_loss": 0.00031073775608092546, "global_step": 63946, "epoch": 537, "lr": 2.7018353720066557e-06} +{"train_loss": 0.0004656527889892459, "global_step": 63947, "epoch": 537, "lr": 2.7011169868778606e-06} +{"train_loss": 0.0002950020134449005, "global_step": 63948, "epoch": 537, "lr": 2.7003986946153747e-06} +{"train_loss": 0.000502955459523946, "global_step": 63949, "epoch": 537, "lr": 2.699680495220597e-06} +{"train_loss": 0.00021585171634797007, "global_step": 63950, "epoch": 537, "lr": 2.6989623886949535e-06} +{"train_loss": 0.00034851563395932317, "global_step": 63951, "epoch": 537, "lr": 2.6982443750398376e-06} +{"train_loss": 0.0002692638954613358, "global_step": 63952, "epoch": 537, "lr": 2.697526454256666e-06} +{"train_loss": 0.0002278746251249686, "global_step": 63953, "epoch": 537, "lr": 2.696808626346847e-06} +{"train_loss": 0.00018708055722527206, "global_step": 63954, "epoch": 537, "lr": 2.6960908913117865e-06} +{"train_loss": 0.00025276668020524085, "global_step": 63955, "epoch": 537, "lr": 2.695373249152905e-06} +{"train_loss": 0.000370440015103668, "global_step": 63956, "epoch": 537, "lr": 2.694655699871601e-06} +{"train_loss": 0.0002682810300029814, "global_step": 63957, "epoch": 537, "lr": 2.693938243469285e-06} +{"train_loss": 0.0002757552720140666, "global_step": 63958, "epoch": 537, "lr": 2.6932208799473724e-06} +{"train_loss": 0.0003031099622603506, "global_step": 63959, "epoch": 537, "lr": 2.6925036093072565e-06} +{"train_loss": 0.0003327948215883225, "global_step": 63960, "epoch": 537, "lr": 2.691786431550369e-06} +{"train_loss": 0.0002212182298535481, "global_step": 63961, "epoch": 537, "lr": 2.6910693466780934e-06} +{"train_loss": 0.00033953090314753354, "global_step": 63962, "epoch": 537, "lr": 2.690352354691855e-06} +{"train_loss": 0.00020576122915372252, "global_step": 63963, "epoch": 537, "lr": 2.689635455593059e-06} +{"train_loss": 0.0001920077920658514, "global_step": 63964, "epoch": 537, "lr": 2.688918649383104e-06} +{"train_loss": 0.0005423991242423654, "global_step": 63965, "epoch": 537, "lr": 2.6882019360634057e-06} +{"train_loss": 0.00026556907687336206, "global_step": 63966, "epoch": 537, "lr": 2.687485315635363e-06} +{"train_loss": 0.0002872580080293119, "global_step": 63967, "epoch": 537, "lr": 2.686768788100397e-06} +{"train_loss": 0.0001789258240023628, "global_step": 63968, "epoch": 537, "lr": 2.6860523534598947e-06} +{"train_loss": 0.0002656341530382633, "global_step": 63969, "epoch": 537, "lr": 2.6853360117152836e-06} +{"train_loss": 0.0003151592391077429, "global_step": 63970, "epoch": 537, "lr": 2.6846197628679627e-06} +{"train_loss": 0.00022232969058677554, "global_step": 63971, "epoch": 537, "lr": 2.6839036069193247e-06} +{"train_loss": 0.0002711950510274619, "global_step": 63972, "epoch": 537, "lr": 2.6831875438707967e-06} +{"train_loss": 0.0001738748833304271, "global_step": 63973, "epoch": 537, "lr": 2.682471573723766e-06} +{"train_loss": 0.00040311162592843175, "global_step": 63974, "epoch": 537, "lr": 2.681755696479654e-06} +{"train_loss": 0.0004091676673851907, "global_step": 63975, "epoch": 537, "lr": 2.68103991213986e-06} +{"train_loss": 0.00021838782413396984, "global_step": 63976, "epoch": 537, "lr": 2.6803242207057823e-06} +{"train_loss": 0.000327347923303023, "global_step": 63977, "epoch": 537, "lr": 2.679608622178842e-06} +{"train_loss": 0.0002928691101260483, "global_step": 63978, "epoch": 537, "lr": 2.6788931165604215e-06} +{"train_loss": 0.00018338876543566585, "global_step": 63979, "epoch": 537, "lr": 2.6781777038519527e-06} +{"train_loss": 0.00020116627274546772, "global_step": 63980, "epoch": 537, "lr": 2.677462384054813e-06} +{"train_loss": 0.00020542947459034622, "global_step": 63981, "epoch": 537, "lr": 2.676747157170434e-06} +{"train_loss": 0.0004934316384606063, "global_step": 63982, "epoch": 537, "lr": 2.6760320232002035e-06} +{"train_loss": 0.00016422857879661024, "global_step": 63983, "epoch": 537, "lr": 2.6753169821455203e-06} +{"train_loss": 0.0002105839957948774, "global_step": 63984, "epoch": 537, "lr": 2.6746020340078005e-06} +{"train_loss": 0.0002441435353830457, "global_step": 63985, "epoch": 537, "lr": 2.673887178788442e-06} +{"train_loss": 0.000401280471123755, "global_step": 63986, "epoch": 537, "lr": 2.6731724164888506e-06} +{"train_loss": 0.00018039932183455676, "global_step": 63987, "epoch": 537, "lr": 2.6724577471104293e-06} +{"train_loss": 0.00019935259479098022, "global_step": 63988, "epoch": 537, "lr": 2.6717431706545835e-06} +{"train_loss": 0.0004631923511624336, "global_step": 63989, "epoch": 537, "lr": 2.671028687122706e-06} +{"train_loss": 0.0002396955678705126, "global_step": 63990, "epoch": 537, "lr": 2.6703142965162186e-06} +{"train_loss": 0.0002642534382175654, "global_step": 63991, "epoch": 537, "lr": 2.6695999988365027e-06} +{"train_loss": 0.00038747943472117186, "global_step": 63992, "epoch": 537, "lr": 2.6688857940849742e-06} +{"train_loss": 0.0006333644269034266, "global_step": 63993, "epoch": 537, "lr": 2.6681716822630322e-06} +{"train_loss": 0.0003821567224804312, "global_step": 63994, "epoch": 537, "lr": 2.667457663372086e-06} +{"train_loss": 0.00018754768825601786, "global_step": 63995, "epoch": 537, "lr": 2.6667437374135185e-06} +{"train_loss": 0.00013587498688139021, "global_step": 63996, "epoch": 537, "lr": 2.6660299043887505e-06} +{"train_loss": 0.00021763143013231456, "global_step": 63997, "epoch": 537, "lr": 2.66531616429917e-06} +{"train_loss": 0.0003213009040337056, "global_step": 63998, "epoch": 537, "lr": 2.6646025171461864e-06} +{"train_loss": 0.00015864947636146098, "global_step": 63999, "epoch": 537, "lr": 2.6638889629311992e-06} +{"train_loss": 0.0005007384461350739, "global_step": 64000, "epoch": 537, "lr": 2.6631755016556125e-06} +{"train_loss": 0.0005792611627839506, "global_step": 64001, "epoch": 537, "lr": 2.6624621333208198e-06} +{"train_loss": 0.0002316055615665391, "global_step": 64002, "epoch": 537, "lr": 2.6617488579282257e-06} +{"train_loss": 0.00028232246404513717, "global_step": 64003, "epoch": 537, "lr": 2.6610356754792342e-06} +{"train_loss": 0.0002543575537856668, "global_step": 64004, "epoch": 537, "lr": 2.6603225859752333e-06} +{"train_loss": 0.00030779014923609793, "global_step": 64005, "epoch": 537, "lr": 2.6596095894176388e-06} +{"train_loss": 0.00023051475000102073, "global_step": 64006, "epoch": 537, "lr": 2.6588966858078435e-06} +{"train_loss": 0.00026300171157345176, "global_step": 64007, "epoch": 537, "lr": 2.658183875147241e-06} +{"train_loss": 0.0004946325207129121, "global_step": 64008, "epoch": 537, "lr": 2.6574711574372412e-06} +{"train_loss": 0.0004806455981452018, "global_step": 64009, "epoch": 537, "lr": 2.656758532679232e-06} +{"train_loss": 0.0002907568705268204, "global_step": 64010, "epoch": 537, "lr": 2.656046000874629e-06} +{"train_loss": 0.0002492810017429292, "global_step": 64011, "epoch": 537, "lr": 2.6553335620248145e-06} +{"train_loss": 0.0003309686726424843, "global_step": 64012, "epoch": 537, "lr": 2.6546212161312036e-06} +{"train_loss": 0.00023086709552444518, "global_step": 64013, "epoch": 537, "lr": 2.6539089631951785e-06} +{"train_loss": 0.0003267092979513109, "global_step": 64014, "epoch": 537, "lr": 2.6531968032181442e-06} +{"train_loss": 0.00033176896977238357, "global_step": 64015, "epoch": 537, "lr": 2.652484736201505e-06} +{"train_loss": 0.00038625329034402966, "global_step": 64016, "epoch": 537, "lr": 2.6517727621466483e-06} +{"train_loss": 0.00019143159443046898, "global_step": 64017, "epoch": 537, "lr": 2.651060881054984e-06} +{"train_loss": 0.00022679675021208823, "global_step": 64018, "epoch": 537, "lr": 2.650349092927895e-06} +{"train_loss": 0.00039708820986561477, "global_step": 64019, "epoch": 537, "lr": 2.649637397766791e-06} +{"train_loss": 0.00018050028302241117, "global_step": 64020, "epoch": 537, "lr": 2.648925795573065e-06} +{"train_loss": 0.00030299181538289647, "global_step": 64021, "epoch": 537, "lr": 2.6482142863481164e-06, "val_loss": 0.02959534339606762} +{"train_loss": 0.00020011485321447253, "global_step": 64022, "epoch": 538, "lr": 2.6475028700933325e-06} +{"train_loss": 0.00046133744763210416, "global_step": 64023, "epoch": 538, "lr": 2.646791546810129e-06} +{"train_loss": 0.00023518799571320415, "global_step": 64024, "epoch": 538, "lr": 2.6460803164998826e-06} +{"train_loss": 0.0005045526195317507, "global_step": 64025, "epoch": 538, "lr": 2.6453691791640036e-06} +{"train_loss": 0.00022468194947578013, "global_step": 64026, "epoch": 538, "lr": 2.644658134803879e-06} +{"train_loss": 0.0002630834642332047, "global_step": 64027, "epoch": 538, "lr": 2.643947183420914e-06} +{"train_loss": 0.00027078803395852447, "global_step": 64028, "epoch": 538, "lr": 2.643236325016496e-06} +{"train_loss": 0.00022171322780195624, "global_step": 64029, "epoch": 538, "lr": 2.6425255595920296e-06} +{"train_loss": 0.0002484493888914585, "global_step": 64030, "epoch": 538, "lr": 2.6418148871488967e-06} +{"train_loss": 0.0002709731343202293, "global_step": 64031, "epoch": 538, "lr": 2.641104307688508e-06} +{"train_loss": 0.00032147299498319626, "global_step": 64032, "epoch": 538, "lr": 2.6403938212122505e-06} +{"train_loss": 0.0003111810947302729, "global_step": 64033, "epoch": 538, "lr": 2.639683427721512e-06} +{"train_loss": 0.00029524078126996756, "global_step": 64034, "epoch": 538, "lr": 2.6389731272177032e-06} +{"train_loss": 0.0005032114568166435, "global_step": 64035, "epoch": 538, "lr": 2.6382629197022056e-06} +{"train_loss": 0.0002186003839597106, "global_step": 64036, "epoch": 538, "lr": 2.6375528051764244e-06} +{"train_loss": 0.00032310374081134796, "global_step": 64037, "epoch": 538, "lr": 2.6368427836417462e-06} +{"train_loss": 0.000284568959614262, "global_step": 64038, "epoch": 538, "lr": 2.636132855099571e-06} +{"train_loss": 0.00020424593822099268, "global_step": 64039, "epoch": 538, "lr": 2.6354230195512863e-06} +{"train_loss": 0.0002510305494070053, "global_step": 64040, "epoch": 538, "lr": 2.63471327699828e-06} +{"train_loss": 0.0002643442712724209, "global_step": 64041, "epoch": 538, "lr": 2.6340036274419668e-06} +{"train_loss": 0.00027405074797570705, "global_step": 64042, "epoch": 538, "lr": 2.6332940708837185e-06} +{"train_loss": 0.0005077640525996685, "global_step": 64043, "epoch": 538, "lr": 2.6325846073249394e-06} +{"train_loss": 0.0003054373664781451, "global_step": 64044, "epoch": 538, "lr": 2.631875236767023e-06} +{"train_loss": 0.0005743139190599322, "global_step": 64045, "epoch": 538, "lr": 2.631165959211357e-06} +{"train_loss": 0.00017184649186674505, "global_step": 64046, "epoch": 538, "lr": 2.6304567746593344e-06} +{"train_loss": 0.00025113640003837645, "global_step": 64047, "epoch": 538, "lr": 2.629747683112349e-06} +{"train_loss": 0.0001601070980541408, "global_step": 64048, "epoch": 538, "lr": 2.629038684571794e-06} +{"train_loss": 0.0004712739901151508, "global_step": 64049, "epoch": 538, "lr": 2.628329779039057e-06} +{"train_loss": 0.0004119630320928991, "global_step": 64050, "epoch": 538, "lr": 2.627620966515543e-06} +{"train_loss": 0.0003501644532661885, "global_step": 64051, "epoch": 538, "lr": 2.626912247002633e-06} +{"train_loss": 0.00012057254934916273, "global_step": 64052, "epoch": 538, "lr": 2.6262036205017103e-06} +{"train_loss": 0.00041391811100766063, "global_step": 64053, "epoch": 538, "lr": 2.6254950870141846e-06} +{"train_loss": 0.00019719764532055706, "global_step": 64054, "epoch": 538, "lr": 2.6247866465414327e-06} +{"train_loss": 0.00042156450217589736, "global_step": 64055, "epoch": 538, "lr": 2.624078299084848e-06} +{"train_loss": 0.00043726610601879656, "global_step": 64056, "epoch": 538, "lr": 2.6233700446458287e-06} +{"train_loss": 0.0002597644052002579, "global_step": 64057, "epoch": 538, "lr": 2.622661883225758e-06} +{"train_loss": 0.0004896455793641508, "global_step": 64058, "epoch": 538, "lr": 2.6219538148260392e-06} +{"train_loss": 0.00030765251722186804, "global_step": 64059, "epoch": 538, "lr": 2.621245839448039e-06} +{"train_loss": 0.00044954416807740927, "global_step": 64060, "epoch": 538, "lr": 2.620537957093172e-06} +{"train_loss": 0.0003958767338190228, "global_step": 64061, "epoch": 538, "lr": 2.6198301677628046e-06} +{"train_loss": 0.00017176414257846773, "global_step": 64062, "epoch": 538, "lr": 2.619122471458352e-06} +{"train_loss": 0.0002953285293187946, "global_step": 64063, "epoch": 538, "lr": 2.6184148681811904e-06} +{"train_loss": 0.00018431527132634073, "global_step": 64064, "epoch": 538, "lr": 2.617707357932697e-06} +{"train_loss": 0.00035101830144412816, "global_step": 64065, "epoch": 538, "lr": 2.616999940714282e-06} +{"train_loss": 0.00030971376691013575, "global_step": 64066, "epoch": 538, "lr": 2.6162926165273218e-06} +{"train_loss": 0.00027508108178153634, "global_step": 64067, "epoch": 538, "lr": 2.615585385373215e-06} +{"train_loss": 0.00039102829759940505, "global_step": 64068, "epoch": 538, "lr": 2.614878247253333e-06} +{"train_loss": 0.00034080303157679737, "global_step": 64069, "epoch": 538, "lr": 2.614171202169086e-06} +{"train_loss": 0.00035165779991075397, "global_step": 64070, "epoch": 538, "lr": 2.6134642501218497e-06} +{"train_loss": 0.00018265904509462416, "global_step": 64071, "epoch": 538, "lr": 2.6127573911130077e-06} +{"train_loss": 0.000204363779630512, "global_step": 64072, "epoch": 538, "lr": 2.6120506251439637e-06} +{"train_loss": 0.00020294662681408226, "global_step": 64073, "epoch": 538, "lr": 2.6113439522160833e-06} +{"train_loss": 0.00037332388455979526, "global_step": 64074, "epoch": 538, "lr": 2.6106373723307766e-06} +{"train_loss": 0.0003916893037967384, "global_step": 64075, "epoch": 538, "lr": 2.60993088548942e-06} +{"train_loss": 0.0004954042378813028, "global_step": 64076, "epoch": 538, "lr": 2.609224491693396e-06} +{"train_loss": 0.00029646919574588537, "global_step": 64077, "epoch": 538, "lr": 2.608518190944098e-06} +{"train_loss": 0.0001849403779488057, "global_step": 64078, "epoch": 538, "lr": 2.607811983242908e-06} +{"train_loss": 0.00021394772920757532, "global_step": 64079, "epoch": 538, "lr": 2.6071058685912253e-06} +{"train_loss": 0.00036472026840783656, "global_step": 64080, "epoch": 538, "lr": 2.6063998469904206e-06} +{"train_loss": 0.0001717903360258788, "global_step": 64081, "epoch": 538, "lr": 2.605693918441887e-06} +{"train_loss": 0.00019820388115476817, "global_step": 64082, "epoch": 538, "lr": 2.604988082947013e-06} +{"train_loss": 0.00033454730873927474, "global_step": 64083, "epoch": 538, "lr": 2.60428234050718e-06} +{"train_loss": 0.0003541730693541467, "global_step": 64084, "epoch": 538, "lr": 2.6035766911237767e-06} +{"train_loss": 0.0003589297120925039, "global_step": 64085, "epoch": 538, "lr": 2.6028711347981793e-06} +{"train_loss": 0.0005186088383197784, "global_step": 64086, "epoch": 538, "lr": 2.602165671531792e-06} +{"train_loss": 0.00016315958055201918, "global_step": 64087, "epoch": 538, "lr": 2.6014603013259754e-06} +{"train_loss": 0.0002969400957226753, "global_step": 64088, "epoch": 538, "lr": 2.600755024182139e-06} +{"train_loss": 0.00032602125429548323, "global_step": 64089, "epoch": 538, "lr": 2.6000498401016482e-06} +{"train_loss": 0.0003189963463228196, "global_step": 64090, "epoch": 538, "lr": 2.599344749085897e-06} +{"train_loss": 0.0001736005360726267, "global_step": 64091, "epoch": 538, "lr": 2.598639751136278e-06} +{"train_loss": 0.0002920899714808911, "global_step": 64092, "epoch": 538, "lr": 2.597934846254152e-06} +{"train_loss": 0.00020462019892875105, "global_step": 64093, "epoch": 538, "lr": 2.5972300344409283e-06} +{"train_loss": 0.00017527582531329244, "global_step": 64094, "epoch": 538, "lr": 2.5965253156979785e-06} +{"train_loss": 0.00023283148766495287, "global_step": 64095, "epoch": 538, "lr": 2.595820690026679e-06} +{"train_loss": 0.00017852376913651824, "global_step": 64096, "epoch": 538, "lr": 2.595116157428429e-06} +{"train_loss": 0.00026605004677549005, "global_step": 64097, "epoch": 538, "lr": 2.5944117179045936e-06} +{"train_loss": 0.00021549507800955325, "global_step": 64098, "epoch": 538, "lr": 2.5937073714565774e-06} +{"train_loss": 0.00045875500654801726, "global_step": 64099, "epoch": 538, "lr": 2.593003118085746e-06} +{"train_loss": 0.00017752642452251166, "global_step": 64100, "epoch": 538, "lr": 2.592298957793493e-06} +{"train_loss": 0.00025791540974751115, "global_step": 64101, "epoch": 538, "lr": 2.591594890581195e-06} +{"train_loss": 0.0004097239871043712, "global_step": 64102, "epoch": 538, "lr": 2.590890916450228e-06} +{"train_loss": 0.00025583268143236637, "global_step": 64103, "epoch": 538, "lr": 2.590187035401992e-06} +{"train_loss": 0.0005739282350987196, "global_step": 64104, "epoch": 538, "lr": 2.5894832474378515e-06} +{"train_loss": 0.00032862144871614873, "global_step": 64105, "epoch": 538, "lr": 2.5887795525592006e-06} +{"train_loss": 0.00032765226205810905, "global_step": 64106, "epoch": 538, "lr": 2.5880759507674157e-06} +{"train_loss": 0.00045065689482726157, "global_step": 64107, "epoch": 538, "lr": 2.5873724420638733e-06} +{"train_loss": 0.00033471581991761923, "global_step": 64108, "epoch": 538, "lr": 2.586669026449967e-06} +{"train_loss": 0.000236635678447783, "global_step": 64109, "epoch": 538, "lr": 2.5859657039270624e-06} +{"train_loss": 0.0001699864660622552, "global_step": 64110, "epoch": 538, "lr": 2.5852624744965583e-06} +{"train_loss": 0.0003929204831365496, "global_step": 64111, "epoch": 538, "lr": 2.5845593381598142e-06} +{"train_loss": 0.0008374334429390728, "global_step": 64112, "epoch": 538, "lr": 2.5838562949182354e-06} +{"train_loss": 0.0001894214074127376, "global_step": 64113, "epoch": 538, "lr": 2.5831533447731817e-06} +{"train_loss": 0.0002856557257473469, "global_step": 64114, "epoch": 538, "lr": 2.58245048772604e-06} +{"train_loss": 0.000336355937179178, "global_step": 64115, "epoch": 538, "lr": 2.581747723778194e-06} +{"train_loss": 0.00020895370107609779, "global_step": 64116, "epoch": 538, "lr": 2.5810450529310136e-06} +{"train_loss": 0.000297865248285234, "global_step": 64117, "epoch": 538, "lr": 2.580342475185893e-06} +{"train_loss": 0.0003470925730653107, "global_step": 64118, "epoch": 538, "lr": 2.5796399905442024e-06} +{"train_loss": 0.0003933410334866494, "global_step": 64119, "epoch": 538, "lr": 2.5789375990073193e-06} +{"train_loss": 0.0004191290936432779, "global_step": 64120, "epoch": 538, "lr": 2.5782353005766256e-06} +{"train_loss": 0.0002368621208006516, "global_step": 64121, "epoch": 538, "lr": 2.577533095253509e-06} +{"train_loss": 0.00029853242449462414, "global_step": 64122, "epoch": 538, "lr": 2.57683098303933e-06} +{"train_loss": 0.00040868681389838457, "global_step": 64123, "epoch": 538, "lr": 2.5761289639354813e-06} +{"train_loss": 0.0003563862992450595, "global_step": 64124, "epoch": 538, "lr": 2.5754270379433343e-06} +{"train_loss": 0.00018887298938352615, "global_step": 64125, "epoch": 538, "lr": 2.5747252050642766e-06} +{"train_loss": 0.00020313453569542617, "global_step": 64126, "epoch": 538, "lr": 2.5740234652996685e-06} +{"train_loss": 0.0004990032175555825, "global_step": 64127, "epoch": 538, "lr": 2.573321818650909e-06} +{"train_loss": 0.00023019767832010984, "global_step": 64128, "epoch": 538, "lr": 2.572620265119358e-06} +{"train_loss": 0.0002638041914906353, "global_step": 64129, "epoch": 538, "lr": 2.571918804706408e-06} +{"train_loss": 0.00027255568420514464, "global_step": 64130, "epoch": 538, "lr": 2.5712174374134144e-06} +{"train_loss": 0.0003368206671439111, "global_step": 64131, "epoch": 538, "lr": 2.570516163241782e-06} +{"train_loss": 0.000514532788656652, "global_step": 64132, "epoch": 538, "lr": 2.569814982192875e-06} +{"train_loss": 0.00021400985133368522, "global_step": 64133, "epoch": 538, "lr": 2.5691138942680604e-06} +{"train_loss": 0.00021164958889130503, "global_step": 64134, "epoch": 538, "lr": 2.568412899468731e-06} +{"train_loss": 0.0005137372645549476, "global_step": 64135, "epoch": 538, "lr": 2.567711997796246e-06} +{"train_loss": 0.0003479455772321671, "global_step": 64136, "epoch": 538, "lr": 2.567011189252e-06} +{"train_loss": 0.00017631596710998565, "global_step": 64137, "epoch": 538, "lr": 2.5663104738373523e-06} +{"train_loss": 0.0002926528104580939, "global_step": 64138, "epoch": 538, "lr": 2.5656098515536964e-06} +{"train_loss": 0.0002631422830745578, "global_step": 64139, "epoch": 538, "lr": 2.5649093224023923e-06} +{"train_loss": 0.0003114437390076771, "global_step": 64140, "epoch": 538, "lr": 2.564208886384817e-06, "val_loss": 0.022205442190170288} +{"train_loss": 0.00019253541540820152, "global_step": 64141, "epoch": 539, "lr": 2.5635085435023577e-06} +{"train_loss": 0.00035497036878950894, "global_step": 64142, "epoch": 539, "lr": 2.5628082937563748e-06} +{"train_loss": 0.00023508603044319898, "global_step": 64143, "epoch": 539, "lr": 2.562108137148256e-06} +{"train_loss": 0.0002693587448447943, "global_step": 64144, "epoch": 539, "lr": 2.5614080736793667e-06} +{"train_loss": 0.0003061900788452476, "global_step": 64145, "epoch": 539, "lr": 2.560708103351084e-06} +{"train_loss": 0.0003225863038096577, "global_step": 64146, "epoch": 539, "lr": 2.560008226164784e-06} +{"train_loss": 0.000214352214243263, "global_step": 64147, "epoch": 539, "lr": 2.559308442121838e-06} +{"train_loss": 0.00027574202977120876, "global_step": 64148, "epoch": 539, "lr": 2.5586087512236235e-06} +{"train_loss": 0.00018933744286186993, "global_step": 64149, "epoch": 539, "lr": 2.5579091534715104e-06} +{"train_loss": 0.000267566938418895, "global_step": 64150, "epoch": 539, "lr": 2.557209648866876e-06} +{"train_loss": 0.00016348519420716912, "global_step": 64151, "epoch": 539, "lr": 2.556510237411086e-06} +{"train_loss": 0.0002925931476056576, "global_step": 64152, "epoch": 539, "lr": 2.555810919105528e-06} +{"train_loss": 0.0003289021260570735, "global_step": 64153, "epoch": 539, "lr": 2.5551116939515618e-06} +{"train_loss": 0.00035095986095257103, "global_step": 64154, "epoch": 539, "lr": 2.55441256195057e-06} +{"train_loss": 0.0002643708139657974, "global_step": 64155, "epoch": 539, "lr": 2.553713523103912e-06} +{"train_loss": 0.00037064452772028744, "global_step": 64156, "epoch": 539, "lr": 2.5530145774129766e-06} +{"train_loss": 0.00047069982974790037, "global_step": 64157, "epoch": 539, "lr": 2.5523157248791228e-06} +{"train_loss": 0.0005019519594497979, "global_step": 64158, "epoch": 539, "lr": 2.5516169655037338e-06} +{"train_loss": 0.00021913848468102515, "global_step": 64159, "epoch": 539, "lr": 2.5509182992881687e-06} +{"train_loss": 0.00020148187468294054, "global_step": 64160, "epoch": 539, "lr": 2.5502197262338103e-06} +{"train_loss": 0.00024424277944490314, "global_step": 64161, "epoch": 539, "lr": 2.5495212463420235e-06} +{"train_loss": 0.0008653359254822135, "global_step": 64162, "epoch": 539, "lr": 2.548822859614186e-06} +{"train_loss": 0.0004052403965033591, "global_step": 64163, "epoch": 539, "lr": 2.5481245660516683e-06} +{"train_loss": 0.0002260079054394737, "global_step": 64164, "epoch": 539, "lr": 2.5474263656558307e-06} +{"train_loss": 0.00021337057114578784, "global_step": 64165, "epoch": 539, "lr": 2.5467282584280603e-06} +{"train_loss": 0.0005551449721679091, "global_step": 64166, "epoch": 539, "lr": 2.546030244369707e-06} +{"train_loss": 0.00018750716117210686, "global_step": 64167, "epoch": 539, "lr": 2.5453323234821634e-06} +{"train_loss": 0.00017239958106074482, "global_step": 64168, "epoch": 539, "lr": 2.5446344957667847e-06} +{"train_loss": 0.0003205246466677636, "global_step": 64169, "epoch": 539, "lr": 2.543936761224952e-06} +{"train_loss": 0.0003359953116159886, "global_step": 64170, "epoch": 539, "lr": 2.543239119858032e-06} +{"train_loss": 0.0002430054300930351, "global_step": 64171, "epoch": 539, "lr": 2.542541571667384e-06} +{"train_loss": 0.00024207140086218715, "global_step": 64172, "epoch": 539, "lr": 2.5418441166543904e-06} +{"train_loss": 0.0003790265182033181, "global_step": 64173, "epoch": 539, "lr": 2.5411467548204116e-06} +{"train_loss": 0.0005285551305860281, "global_step": 64174, "epoch": 539, "lr": 2.5404494861668236e-06} +{"train_loss": 0.00040706314030103385, "global_step": 64175, "epoch": 539, "lr": 2.5397523106949984e-06} +{"train_loss": 0.00016668868192937225, "global_step": 64176, "epoch": 539, "lr": 2.539055228406284e-06} +{"train_loss": 0.0003765850269701332, "global_step": 64177, "epoch": 539, "lr": 2.53835823930208e-06} +{"train_loss": 0.00020298868184909225, "global_step": 64178, "epoch": 539, "lr": 2.537661343383729e-06} +{"train_loss": 0.00028127949917688966, "global_step": 64179, "epoch": 539, "lr": 2.5369645406526145e-06} +{"train_loss": 0.0004229515325278044, "global_step": 64180, "epoch": 539, "lr": 2.5362678311100953e-06} +{"train_loss": 0.00025947540416382253, "global_step": 64181, "epoch": 539, "lr": 2.5355712147575485e-06} +{"train_loss": 0.00022418332810048014, "global_step": 64182, "epoch": 539, "lr": 2.534874691596334e-06} +{"train_loss": 0.00022505743254441768, "global_step": 64183, "epoch": 539, "lr": 2.5341782616278175e-06} +{"train_loss": 0.0002070781629299745, "global_step": 64184, "epoch": 539, "lr": 2.5334819248533815e-06} +{"train_loss": 0.0002835035847965628, "global_step": 64185, "epoch": 539, "lr": 2.532785681274369e-06} +{"train_loss": 0.0003007905324921012, "global_step": 64186, "epoch": 539, "lr": 2.5320895308921732e-06} +{"train_loss": 0.00043366034515202045, "global_step": 64187, "epoch": 539, "lr": 2.531393473708138e-06} +{"train_loss": 0.0002767359255813062, "global_step": 64188, "epoch": 539, "lr": 2.530697509723645e-06} +{"train_loss": 0.0003752137126866728, "global_step": 64189, "epoch": 539, "lr": 2.5300016389400606e-06} +{"train_loss": 0.00031328326440416276, "global_step": 64190, "epoch": 539, "lr": 2.5293058613587384e-06} +{"train_loss": 0.00016704454901628196, "global_step": 64191, "epoch": 539, "lr": 2.528610176981061e-06} +{"train_loss": 0.0004339269653428346, "global_step": 64192, "epoch": 539, "lr": 2.5279145858083776e-06} +{"train_loss": 0.0002543070004321635, "global_step": 64193, "epoch": 539, "lr": 2.5272190878420698e-06} +{"train_loss": 0.00035118585219606757, "global_step": 64194, "epoch": 539, "lr": 2.5265236830834983e-06} +{"train_loss": 0.000323609565384686, "global_step": 64195, "epoch": 539, "lr": 2.525828371534017e-06} +{"train_loss": 0.0005979276611469686, "global_step": 64196, "epoch": 539, "lr": 2.5251331531950027e-06} +{"train_loss": 0.00021823676070198417, "global_step": 64197, "epoch": 539, "lr": 2.524438028067816e-06} +{"train_loss": 0.00033025050652213395, "global_step": 64198, "epoch": 539, "lr": 2.5237429961538273e-06} +{"train_loss": 0.00015009223716333508, "global_step": 64199, "epoch": 539, "lr": 2.5230480574543912e-06} +{"train_loss": 0.00016680575208738446, "global_step": 64200, "epoch": 539, "lr": 2.522353211970885e-06} +{"train_loss": 0.000343398074619472, "global_step": 64201, "epoch": 539, "lr": 2.5216584597046676e-06} +{"train_loss": 0.0002231758990092203, "global_step": 64202, "epoch": 539, "lr": 2.520963800657089e-06} +{"train_loss": 0.00021647009998559952, "global_step": 64203, "epoch": 539, "lr": 2.5202692348295365e-06} +{"train_loss": 0.0002610756200738251, "global_step": 64204, "epoch": 539, "lr": 2.519574762223359e-06} +{"train_loss": 0.0003172515134792775, "global_step": 64205, "epoch": 539, "lr": 2.5188803828399275e-06} +{"train_loss": 0.0004233783402014524, "global_step": 64206, "epoch": 539, "lr": 2.518186096680597e-06} +{"train_loss": 0.0002672518021427095, "global_step": 64207, "epoch": 539, "lr": 2.5174919037467383e-06} +{"train_loss": 0.00023432821035385132, "global_step": 64208, "epoch": 539, "lr": 2.5167978040397113e-06} +{"train_loss": 0.0004099773068446666, "global_step": 64209, "epoch": 539, "lr": 2.516103797560876e-06} +{"train_loss": 0.0003106851945631206, "global_step": 64210, "epoch": 539, "lr": 2.5154098843116035e-06} +{"train_loss": 0.0005371749866753817, "global_step": 64211, "epoch": 539, "lr": 2.5147160642932433e-06} +{"train_loss": 0.0004575836064759642, "global_step": 64212, "epoch": 539, "lr": 2.5140223375071716e-06} +{"train_loss": 0.0008086459129117429, "global_step": 64213, "epoch": 539, "lr": 2.513328703954748e-06} +{"train_loss": 0.00021399831166490912, "global_step": 64214, "epoch": 539, "lr": 2.512635163637317e-06} +{"train_loss": 0.00021020908025093377, "global_step": 64215, "epoch": 539, "lr": 2.5119417165562653e-06} +{"train_loss": 0.00027907430194318295, "global_step": 64216, "epoch": 539, "lr": 2.511248362712931e-06} +{"train_loss": 0.00017602146544959396, "global_step": 64217, "epoch": 539, "lr": 2.510555102108697e-06} +{"train_loss": 0.0003394882078282535, "global_step": 64218, "epoch": 539, "lr": 2.5098619347449114e-06} +{"train_loss": 0.00023234142281580716, "global_step": 64219, "epoch": 539, "lr": 2.5091688606229404e-06} +{"train_loss": 0.00036576701677404344, "global_step": 64220, "epoch": 539, "lr": 2.5084758797441376e-06} +{"train_loss": 0.00040132328285835683, "global_step": 64221, "epoch": 539, "lr": 2.507782992109875e-06} +{"train_loss": 0.00023530173348262906, "global_step": 64222, "epoch": 539, "lr": 2.5070901977214955e-06} +{"train_loss": 0.0002509860787540674, "global_step": 64223, "epoch": 539, "lr": 2.506397496580376e-06} +{"train_loss": 0.00027008558390662074, "global_step": 64224, "epoch": 539, "lr": 2.5057048886878762e-06} +{"train_loss": 0.0004978991346433759, "global_step": 64225, "epoch": 539, "lr": 2.505012374045346e-06} +{"train_loss": 0.00020844937535002828, "global_step": 64226, "epoch": 539, "lr": 2.504319952654155e-06} +{"train_loss": 0.0003849337517749518, "global_step": 64227, "epoch": 539, "lr": 2.5036276245156587e-06} +{"train_loss": 0.00043311461922712624, "global_step": 64228, "epoch": 539, "lr": 2.5029353896312057e-06} +{"train_loss": 0.0006119285826571286, "global_step": 64229, "epoch": 539, "lr": 2.5022432480021728e-06} +{"train_loss": 0.0008215598063543439, "global_step": 64230, "epoch": 539, "lr": 2.5015511996299037e-06} +{"train_loss": 0.000365390966180712, "global_step": 64231, "epoch": 539, "lr": 2.500859244515774e-06} +{"train_loss": 0.0001501808874309063, "global_step": 64232, "epoch": 539, "lr": 2.500167382661128e-06} +{"train_loss": 0.0002588402130641043, "global_step": 64233, "epoch": 539, "lr": 2.499475614067326e-06} +{"train_loss": 0.0008236231515184045, "global_step": 64234, "epoch": 539, "lr": 2.498783938735738e-06} +{"train_loss": 0.00026639073621481657, "global_step": 64235, "epoch": 539, "lr": 2.498092356667697e-06} +{"train_loss": 0.00022651268227491528, "global_step": 64236, "epoch": 539, "lr": 2.497400867864591e-06} +{"train_loss": 0.00044818141032010317, "global_step": 64237, "epoch": 539, "lr": 2.4967094723277575e-06} +{"train_loss": 0.0003028545470442623, "global_step": 64238, "epoch": 539, "lr": 2.4960181700585617e-06} +{"train_loss": 0.00017479780944995582, "global_step": 64239, "epoch": 539, "lr": 2.495326961058364e-06} +{"train_loss": 0.00026259024161845446, "global_step": 64240, "epoch": 539, "lr": 2.494635845328508e-06} +{"train_loss": 0.000302774365991354, "global_step": 64241, "epoch": 539, "lr": 2.493944822870364e-06} +{"train_loss": 0.0003782252606470138, "global_step": 64242, "epoch": 539, "lr": 2.4932538936852766e-06} +{"train_loss": 0.00022959992929827422, "global_step": 64243, "epoch": 539, "lr": 2.4925630577746216e-06} +{"train_loss": 0.0002637965080793947, "global_step": 64244, "epoch": 539, "lr": 2.491872315139743e-06} +{"train_loss": 0.00013359871809370816, "global_step": 64245, "epoch": 539, "lr": 2.4911816657819887e-06} +{"train_loss": 0.00015904821339063346, "global_step": 64246, "epoch": 539, "lr": 2.4904911097027307e-06} +{"train_loss": 0.0003548178938217461, "global_step": 64247, "epoch": 539, "lr": 2.4898006469033063e-06} +{"train_loss": 0.00022407140932045877, "global_step": 64248, "epoch": 539, "lr": 2.4891102773850984e-06} +{"train_loss": 0.0005117086111567914, "global_step": 64249, "epoch": 539, "lr": 2.488420001149433e-06} +{"train_loss": 0.00039269874105229974, "global_step": 64250, "epoch": 539, "lr": 2.487729818197687e-06} +{"train_loss": 0.0006206209072843194, "global_step": 64251, "epoch": 539, "lr": 2.487039728531204e-06} +{"train_loss": 0.00023944901477079839, "global_step": 64252, "epoch": 539, "lr": 2.486349732151344e-06} +{"train_loss": 0.00021636001474689692, "global_step": 64253, "epoch": 539, "lr": 2.4856598290594613e-06} +{"train_loss": 0.000172532643773593, "global_step": 64254, "epoch": 539, "lr": 2.4849700192569103e-06} +{"train_loss": 0.00026061790413223207, "global_step": 64255, "epoch": 539, "lr": 2.48428030274504e-06} +{"train_loss": 0.0004219192487653345, "global_step": 64256, "epoch": 539, "lr": 2.483590679525211e-06} +{"train_loss": 0.000138503237394616, "global_step": 64257, "epoch": 539, "lr": 2.4829011495987763e-06} +{"train_loss": 0.0002923867432400584, "global_step": 64258, "epoch": 539, "lr": 2.482211712967086e-06} +{"train_loss": 0.00031913555850384426, "global_step": 64259, "epoch": 539, "lr": 2.4815223696315004e-06, "val_loss": 0.02940376102924347} +{"train_loss": 0.00020181265426799655, "global_step": 64260, "epoch": 540, "lr": 2.4808331195933678e-06} +{"train_loss": 0.00023149829939939082, "global_step": 64261, "epoch": 540, "lr": 2.480143962854037e-06} +{"train_loss": 0.0005607267958112061, "global_step": 64262, "epoch": 540, "lr": 2.479454899414879e-06} +{"train_loss": 0.00019704055739566684, "global_step": 64263, "epoch": 540, "lr": 2.478765929277227e-06} +{"train_loss": 0.00025642450782470405, "global_step": 64264, "epoch": 540, "lr": 2.4780770524424403e-06} +{"train_loss": 0.0005876783980056643, "global_step": 64265, "epoch": 540, "lr": 2.477388268911879e-06} +{"train_loss": 0.0004345137276686728, "global_step": 64266, "epoch": 540, "lr": 2.476699578686875e-06} +{"train_loss": 0.0004583677218761295, "global_step": 64267, "epoch": 540, "lr": 2.4760109817688116e-06} +{"train_loss": 0.00016776435950305313, "global_step": 64268, "epoch": 540, "lr": 2.475322478159009e-06} +{"train_loss": 0.00035195230157114565, "global_step": 64269, "epoch": 540, "lr": 2.4746340678588444e-06} +{"train_loss": 0.0007284219609573483, "global_step": 64270, "epoch": 540, "lr": 2.473945750869655e-06} +{"train_loss": 0.00017243002366740257, "global_step": 64271, "epoch": 540, "lr": 2.4732575271927905e-06} +{"train_loss": 0.00026133196661248803, "global_step": 64272, "epoch": 540, "lr": 2.4725693968296105e-06} +{"train_loss": 0.00040078311576507986, "global_step": 64273, "epoch": 540, "lr": 2.471881359781464e-06} +{"train_loss": 0.00015827285824343562, "global_step": 64274, "epoch": 540, "lr": 2.4711934160496997e-06} +{"train_loss": 0.0002184051991207525, "global_step": 64275, "epoch": 540, "lr": 2.470505565635667e-06} +{"train_loss": 0.00024789918097667396, "global_step": 64276, "epoch": 540, "lr": 2.4698178085407254e-06} +{"train_loss": 0.0002538041735533625, "global_step": 64277, "epoch": 540, "lr": 2.4691301447662187e-06} +{"train_loss": 0.00034387019695714116, "global_step": 64278, "epoch": 540, "lr": 2.46844257431349e-06} +{"train_loss": 0.00017621443839743733, "global_step": 64279, "epoch": 540, "lr": 2.4677550971838993e-06} +{"train_loss": 0.0002942965365946293, "global_step": 64280, "epoch": 540, "lr": 2.46706771337879e-06} +{"train_loss": 0.0002398458746029064, "global_step": 64281, "epoch": 540, "lr": 2.4663804228995224e-06} +{"train_loss": 0.00016928029072005302, "global_step": 64282, "epoch": 540, "lr": 2.4656932257474395e-06} +{"train_loss": 0.0003355085209477693, "global_step": 64283, "epoch": 540, "lr": 2.4650061219238798e-06} +{"train_loss": 0.000429427542258054, "global_step": 64284, "epoch": 540, "lr": 2.464319111430208e-06} +{"train_loss": 0.00013678314280696213, "global_step": 64285, "epoch": 540, "lr": 2.4636321942677676e-06} +{"train_loss": 0.0001584212586749345, "global_step": 64286, "epoch": 540, "lr": 2.4629453704379023e-06} +{"train_loss": 0.0003291113825980574, "global_step": 64287, "epoch": 540, "lr": 2.4622586399419723e-06} +{"train_loss": 0.0002854498161468655, "global_step": 64288, "epoch": 540, "lr": 2.4615720027813093e-06} +{"train_loss": 0.0005423026159405708, "global_step": 64289, "epoch": 540, "lr": 2.4608854589572794e-06} +{"train_loss": 0.00026633369270712137, "global_step": 64290, "epoch": 540, "lr": 2.46019900847122e-06} +{"train_loss": 0.0005662687472067773, "global_step": 64291, "epoch": 540, "lr": 2.4595126513244803e-06} +{"train_loss": 0.000246991723543033, "global_step": 64292, "epoch": 540, "lr": 2.4588263875184093e-06} +{"train_loss": 0.00016899863840080798, "global_step": 64293, "epoch": 540, "lr": 2.4581402170543557e-06} +{"train_loss": 0.0004073188465554267, "global_step": 64294, "epoch": 540, "lr": 2.4574541399336628e-06} +{"train_loss": 0.0003263893595431, "global_step": 64295, "epoch": 540, "lr": 2.4567681561576794e-06} +{"train_loss": 0.0003689372097142041, "global_step": 64296, "epoch": 540, "lr": 2.456082265727755e-06} +{"train_loss": 0.0002395837364019826, "global_step": 64297, "epoch": 540, "lr": 2.455396468645227e-06} +{"train_loss": 0.00048403878463432193, "global_step": 64298, "epoch": 540, "lr": 2.4547107649114554e-06} +{"train_loss": 0.0002929832262452692, "global_step": 64299, "epoch": 540, "lr": 2.454025154527773e-06} +{"train_loss": 0.0002360733924433589, "global_step": 64300, "epoch": 540, "lr": 2.453339637495539e-06} +{"train_loss": 0.0006779790273867548, "global_step": 64301, "epoch": 540, "lr": 2.4526542138160913e-06} +{"train_loss": 0.0003414524835534394, "global_step": 64302, "epoch": 540, "lr": 2.4519688834907737e-06} +{"train_loss": 0.0002936628588940948, "global_step": 64303, "epoch": 540, "lr": 2.451283646520941e-06} +{"train_loss": 0.0010041685309261084, "global_step": 64304, "epoch": 540, "lr": 2.4505985029079305e-06} +{"train_loss": 0.00029552282649092376, "global_step": 64305, "epoch": 540, "lr": 2.449913452653091e-06} +{"train_loss": 0.00019627265282906592, "global_step": 64306, "epoch": 540, "lr": 2.4492284957577607e-06} +{"train_loss": 0.00028929050313308835, "global_step": 64307, "epoch": 540, "lr": 2.448543632223299e-06} +{"train_loss": 0.00039054302033036947, "global_step": 64308, "epoch": 540, "lr": 2.447858862051039e-06} +{"train_loss": 0.00024988496443256736, "global_step": 64309, "epoch": 540, "lr": 2.4471741852423237e-06} +{"train_loss": 0.0003528925299178809, "global_step": 64310, "epoch": 540, "lr": 2.4464896017985074e-06} +{"train_loss": 0.00048403738765046, "global_step": 64311, "epoch": 540, "lr": 2.4458051117209224e-06} +{"train_loss": 0.0001972313766600564, "global_step": 64312, "epoch": 540, "lr": 2.4451207150109233e-06} +{"train_loss": 0.0002000056701945141, "global_step": 64313, "epoch": 540, "lr": 2.444436411669854e-06} +{"train_loss": 0.0002628267393447459, "global_step": 64314, "epoch": 540, "lr": 2.44375220169904e-06} +{"train_loss": 0.0003022535820491612, "global_step": 64315, "epoch": 540, "lr": 2.443068085099848e-06} +{"train_loss": 0.0002752500004135072, "global_step": 64316, "epoch": 540, "lr": 2.4423840618736037e-06} +{"train_loss": 0.0003587974060792476, "global_step": 64317, "epoch": 540, "lr": 2.4417001320216628e-06} +{"train_loss": 0.0001696596445981413, "global_step": 64318, "epoch": 540, "lr": 2.441016295545362e-06} +{"train_loss": 0.00032389274565503, "global_step": 64319, "epoch": 540, "lr": 2.4403325524460396e-06} +{"train_loss": 0.0003186253015883267, "global_step": 64320, "epoch": 540, "lr": 2.43964890272505e-06} +{"train_loss": 0.00020698098524007946, "global_step": 64321, "epoch": 540, "lr": 2.438965346383726e-06} +{"train_loss": 0.00030246013193391263, "global_step": 64322, "epoch": 540, "lr": 2.4382818834234157e-06} +{"train_loss": 0.00043723886483348906, "global_step": 64323, "epoch": 540, "lr": 2.4375985138454517e-06} +{"train_loss": 0.0002049990725936368, "global_step": 64324, "epoch": 540, "lr": 2.4369152376511884e-06} +{"train_loss": 0.0003856270923279226, "global_step": 64325, "epoch": 540, "lr": 2.4362320548419525e-06} +{"train_loss": 0.0004310796794015914, "global_step": 64326, "epoch": 540, "lr": 2.4355489654190986e-06} +{"train_loss": 0.00019886130758095533, "global_step": 64327, "epoch": 540, "lr": 2.434865969383965e-06} +{"train_loss": 0.00022224607528187335, "global_step": 64328, "epoch": 540, "lr": 2.4341830667378886e-06} +{"train_loss": 0.00023448684078175575, "global_step": 64329, "epoch": 540, "lr": 2.433500257482213e-06} +{"train_loss": 0.00031732115894556046, "global_step": 64330, "epoch": 540, "lr": 2.4328175416182708e-06} +{"train_loss": 0.00031895676511339843, "global_step": 64331, "epoch": 540, "lr": 2.432134919147422e-06} +{"train_loss": 0.00042798047070391476, "global_step": 64332, "epoch": 540, "lr": 2.4314523900709875e-06} +{"train_loss": 0.0002797160414047539, "global_step": 64333, "epoch": 540, "lr": 2.430769954390311e-06} +{"train_loss": 0.00025583000387996435, "global_step": 64334, "epoch": 540, "lr": 2.4300876121067463e-06} +{"train_loss": 0.0005060411640442908, "global_step": 64335, "epoch": 540, "lr": 2.4294053632216097e-06} +{"train_loss": 0.0002877761726267636, "global_step": 64336, "epoch": 540, "lr": 2.428723207736261e-06} +{"train_loss": 0.0001910687715280801, "global_step": 64337, "epoch": 540, "lr": 2.428041145652027e-06} +{"train_loss": 0.0003816003736574203, "global_step": 64338, "epoch": 540, "lr": 2.4273591769702563e-06} +{"train_loss": 0.00026364150107838213, "global_step": 64339, "epoch": 540, "lr": 2.4266773016922874e-06} +{"train_loss": 0.00038834690349176526, "global_step": 64340, "epoch": 540, "lr": 2.425995519819446e-06} +{"train_loss": 0.0003341201809234917, "global_step": 64341, "epoch": 540, "lr": 2.4253138313530876e-06} +{"train_loss": 0.0004291613004170358, "global_step": 64342, "epoch": 540, "lr": 2.424632236294533e-06} +{"train_loss": 0.00016221849364228547, "global_step": 64343, "epoch": 540, "lr": 2.4239507346451416e-06} +{"train_loss": 0.00043294590432196856, "global_step": 64344, "epoch": 540, "lr": 2.42326932640623e-06} +{"train_loss": 0.0006568828830495477, "global_step": 64345, "epoch": 540, "lr": 2.4225880115791576e-06} +{"train_loss": 0.00019576224440243095, "global_step": 64346, "epoch": 540, "lr": 2.421906790165246e-06} +{"train_loss": 0.00040271796751767397, "global_step": 64347, "epoch": 540, "lr": 2.4212256621658325e-06} +{"train_loss": 0.0002444420533720404, "global_step": 64348, "epoch": 540, "lr": 2.4205446275822663e-06} +{"train_loss": 0.0002380403020652011, "global_step": 64349, "epoch": 540, "lr": 2.4198636864158687e-06} +{"train_loss": 0.00025725807063281536, "global_step": 64350, "epoch": 540, "lr": 2.4191828386679938e-06} +{"train_loss": 0.00015851735952310264, "global_step": 64351, "epoch": 540, "lr": 2.418502084339963e-06} +{"train_loss": 0.00014835683396086097, "global_step": 64352, "epoch": 540, "lr": 2.417821423433131e-06} +{"train_loss": 0.00038026546826586127, "global_step": 64353, "epoch": 540, "lr": 2.4171408559488075e-06} +{"train_loss": 0.00019549389253370464, "global_step": 64354, "epoch": 540, "lr": 2.4164603818883523e-06} +{"train_loss": 0.0003182559448760003, "global_step": 64355, "epoch": 540, "lr": 2.4157800012530985e-06} +{"train_loss": 0.00016293708176817745, "global_step": 64356, "epoch": 540, "lr": 2.4150997140443667e-06} +{"train_loss": 0.00030480336863547564, "global_step": 64357, "epoch": 540, "lr": 2.414419520263517e-06} +{"train_loss": 0.00029619724955409765, "global_step": 64358, "epoch": 540, "lr": 2.4137394199118647e-06} +{"train_loss": 0.00027034772210754454, "global_step": 64359, "epoch": 540, "lr": 2.413059412990748e-06} +{"train_loss": 0.00024770930758677423, "global_step": 64360, "epoch": 540, "lr": 2.4123794995015103e-06} +{"train_loss": 0.0001897908077808097, "global_step": 64361, "epoch": 540, "lr": 2.4116996794454728e-06} +{"train_loss": 0.00024701980873942375, "global_step": 64362, "epoch": 540, "lr": 2.411019952823984e-06} +{"train_loss": 0.00018969950906466693, "global_step": 64363, "epoch": 540, "lr": 2.410340319638377e-06} +{"train_loss": 0.000238446329603903, "global_step": 64364, "epoch": 540, "lr": 2.4096607798899772e-06} +{"train_loss": 0.00037416789564304054, "global_step": 64365, "epoch": 540, "lr": 2.408981333580129e-06} +{"train_loss": 0.0006251148879528046, "global_step": 64366, "epoch": 540, "lr": 2.4083019807101536e-06} +{"train_loss": 0.00015397438255604357, "global_step": 64367, "epoch": 540, "lr": 2.4076227212814053e-06} +{"train_loss": 0.0002921735867857933, "global_step": 64368, "epoch": 540, "lr": 2.4069435552951934e-06} +{"train_loss": 0.0002102040743920952, "global_step": 64369, "epoch": 540, "lr": 2.406264482752868e-06} +{"train_loss": 0.0002705479273572564, "global_step": 64370, "epoch": 540, "lr": 2.4055855036557605e-06} +{"train_loss": 0.00021125042985659093, "global_step": 64371, "epoch": 540, "lr": 2.4049066180051984e-06} +{"train_loss": 0.00022213628108147532, "global_step": 64372, "epoch": 540, "lr": 2.4042278258025186e-06} +{"train_loss": 0.00046292002662084997, "global_step": 64373, "epoch": 540, "lr": 2.4035491270490482e-06} +{"train_loss": 0.00029302394250407815, "global_step": 64374, "epoch": 540, "lr": 2.402870521746131e-06} +{"train_loss": 0.00020763651991728693, "global_step": 64375, "epoch": 540, "lr": 2.4021920098950823e-06} +{"train_loss": 0.0002481237752363086, "global_step": 64376, "epoch": 540, "lr": 2.4015135914972563e-06} +{"train_loss": 0.0003294041089247912, "global_step": 64377, "epoch": 540, "lr": 2.400835266553969e-06} +{"train_loss": 0.0003115550459346914, "global_step": 64378, "epoch": 540, "lr": 2.4001570350665527e-06, "val_loss": 0.026161327958106995, "train_action_mse_error": 3.2723942240409087e-06} +{"train_loss": 0.0005715707666240633, "global_step": 64379, "epoch": 541, "lr": 2.39947889703635e-06} +{"train_loss": 0.00023642333690077066, "global_step": 64380, "epoch": 541, "lr": 2.3988008524646775e-06} +{"train_loss": 0.00026743178023025393, "global_step": 64381, "epoch": 541, "lr": 2.3981229013528785e-06} +{"train_loss": 0.00035538311931304634, "global_step": 64382, "epoch": 541, "lr": 2.3974450437022735e-06} +{"train_loss": 0.00023531398619525135, "global_step": 64383, "epoch": 541, "lr": 2.396767279514206e-06} +{"train_loss": 0.00031904454226605594, "global_step": 64384, "epoch": 541, "lr": 2.3960896087899974e-06} +{"train_loss": 0.00030838241218589246, "global_step": 64385, "epoch": 541, "lr": 2.395412031530986e-06} +{"train_loss": 0.0003494851407594979, "global_step": 64386, "epoch": 541, "lr": 2.3947345477384863e-06} +{"train_loss": 0.0002714501169975847, "global_step": 64387, "epoch": 541, "lr": 2.3940571574138535e-06} +{"train_loss": 0.00022382351744454354, "global_step": 64388, "epoch": 541, "lr": 2.3933798605583925e-06} +{"train_loss": 0.00023953741765581071, "global_step": 64389, "epoch": 541, "lr": 2.3927026571734514e-06} +{"train_loss": 0.00022077703033573925, "global_step": 64390, "epoch": 541, "lr": 2.392025547260346e-06} +{"train_loss": 0.0002435917704133317, "global_step": 64391, "epoch": 541, "lr": 2.39134853082042e-06} +{"train_loss": 0.00018926247139461339, "global_step": 64392, "epoch": 541, "lr": 2.390671607854983e-06} +{"train_loss": 0.0005128970369696617, "global_step": 64393, "epoch": 541, "lr": 2.3899947783653896e-06} +{"train_loss": 0.00013453263090923429, "global_step": 64394, "epoch": 541, "lr": 2.389318042352945e-06} +{"train_loss": 0.0006611786084249616, "global_step": 64395, "epoch": 541, "lr": 2.3886413998189972e-06} +{"train_loss": 0.00014753158029634506, "global_step": 64396, "epoch": 541, "lr": 2.3879648507648623e-06} +{"train_loss": 0.0005355663015507162, "global_step": 64397, "epoch": 541, "lr": 2.387288395191867e-06} +{"train_loss": 0.00022852855909150094, "global_step": 64398, "epoch": 541, "lr": 2.3866120331013484e-06} +{"train_loss": 0.0004799042653758079, "global_step": 64399, "epoch": 541, "lr": 2.3859357644946232e-06} +{"train_loss": 0.00020489357120823115, "global_step": 64400, "epoch": 541, "lr": 2.38525958937304e-06} +{"train_loss": 0.00034002374741248786, "global_step": 64401, "epoch": 541, "lr": 2.384583507737903e-06} +{"train_loss": 0.00031061546178534627, "global_step": 64402, "epoch": 541, "lr": 2.38390751959055e-06} +{"train_loss": 0.00022579719370696694, "global_step": 64403, "epoch": 541, "lr": 2.3832316249323138e-06} +{"train_loss": 0.0003023502940777689, "global_step": 64404, "epoch": 541, "lr": 2.382555823764504e-06} +{"train_loss": 0.00018496272969059646, "global_step": 64405, "epoch": 541, "lr": 2.3818801160884695e-06} +{"train_loss": 0.00014409562572836876, "global_step": 64406, "epoch": 541, "lr": 2.381204501905515e-06} +{"train_loss": 0.00019604546832852066, "global_step": 64407, "epoch": 541, "lr": 2.3805289812169894e-06} +{"train_loss": 0.00032487473799847066, "global_step": 64408, "epoch": 541, "lr": 2.3798535540242084e-06} +{"train_loss": 0.00031166558619588614, "global_step": 64409, "epoch": 541, "lr": 2.3791782203284872e-06} +{"train_loss": 0.00020943876006640494, "global_step": 64410, "epoch": 541, "lr": 2.37850298013117e-06} +{"train_loss": 0.00018362294940743595, "global_step": 64411, "epoch": 541, "lr": 2.3778278334335657e-06} +{"train_loss": 0.00022198143415153027, "global_step": 64412, "epoch": 541, "lr": 2.3771527802370186e-06} +{"train_loss": 0.0005817558849230409, "global_step": 64413, "epoch": 541, "lr": 2.3764778205428385e-06} +{"train_loss": 0.00016105384565889835, "global_step": 64414, "epoch": 541, "lr": 2.375802954352363e-06} +{"train_loss": 0.00037840483128093183, "global_step": 64415, "epoch": 541, "lr": 2.375128181666908e-06} +{"train_loss": 0.0005167970666661859, "global_step": 64416, "epoch": 541, "lr": 2.3744535024877944e-06} +{"train_loss": 0.0001768395450199023, "global_step": 64417, "epoch": 541, "lr": 2.373778916816355e-06} +{"train_loss": 0.0002102875296259299, "global_step": 64418, "epoch": 541, "lr": 2.373104424653916e-06} +{"train_loss": 0.00033191530383192003, "global_step": 64419, "epoch": 541, "lr": 2.372430026001793e-06} +{"train_loss": 0.00017632385424803942, "global_step": 64420, "epoch": 541, "lr": 2.371755720861324e-06} +{"train_loss": 0.0002511010388843715, "global_step": 64421, "epoch": 541, "lr": 2.3710815092338135e-06} +{"train_loss": 0.00020841682271566242, "global_step": 64422, "epoch": 541, "lr": 2.370407391120605e-06} +{"train_loss": 0.00019371746748220176, "global_step": 64423, "epoch": 541, "lr": 2.369733366523008e-06} +{"train_loss": 0.00019088518456555903, "global_step": 64424, "epoch": 541, "lr": 2.3690594354423556e-06} +{"train_loss": 0.0003201062500011176, "global_step": 64425, "epoch": 541, "lr": 2.368385597879963e-06} +{"train_loss": 0.00024639751063659787, "global_step": 64426, "epoch": 541, "lr": 2.3677118538371624e-06} +{"train_loss": 0.00035257224226370454, "global_step": 64427, "epoch": 541, "lr": 2.367038203315269e-06} +{"train_loss": 0.0003908718645107001, "global_step": 64428, "epoch": 541, "lr": 2.3663646463155996e-06} +{"train_loss": 0.00022056516900192946, "global_step": 64429, "epoch": 541, "lr": 2.365691182839491e-06} +{"train_loss": 0.00018910536891780794, "global_step": 64430, "epoch": 541, "lr": 2.365017812888254e-06} +{"train_loss": 0.0004209835024084896, "global_step": 64431, "epoch": 541, "lr": 2.3643445364632255e-06} +{"train_loss": 0.00016157676873262972, "global_step": 64432, "epoch": 541, "lr": 2.3636713535657105e-06} +{"train_loss": 0.0002506445161998272, "global_step": 64433, "epoch": 541, "lr": 2.362998264197036e-06} +{"train_loss": 0.0004189946048427373, "global_step": 64434, "epoch": 541, "lr": 2.3623252683585283e-06} +{"train_loss": 0.00030135444831103086, "global_step": 64435, "epoch": 541, "lr": 2.3616523660515034e-06} +{"train_loss": 0.00024929051869548857, "global_step": 64436, "epoch": 541, "lr": 2.3609795572772874e-06} +{"train_loss": 0.0002844136906787753, "global_step": 64437, "epoch": 541, "lr": 2.360306842037191e-06} +{"train_loss": 0.00020658245193772018, "global_step": 64438, "epoch": 541, "lr": 2.3596342203325518e-06} +{"train_loss": 0.00055936339776963, "global_step": 64439, "epoch": 541, "lr": 2.3589616921646794e-06} +{"train_loss": 0.00024943496100604534, "global_step": 64440, "epoch": 541, "lr": 2.35828925753489e-06} +{"train_loss": 0.0003886467020493001, "global_step": 64441, "epoch": 541, "lr": 2.357616916444516e-06} +{"train_loss": 0.0002033789933193475, "global_step": 64442, "epoch": 541, "lr": 2.356944668894867e-06} +{"train_loss": 0.00037737013190053403, "global_step": 64443, "epoch": 541, "lr": 2.3562725148872757e-06} +{"train_loss": 0.00023403746308758855, "global_step": 64444, "epoch": 541, "lr": 2.35560045442304e-06} +{"train_loss": 0.00019670921028591692, "global_step": 64445, "epoch": 541, "lr": 2.354928487503505e-06} +{"train_loss": 0.00019419660384301096, "global_step": 64446, "epoch": 541, "lr": 2.354256614129974e-06} +{"train_loss": 0.00019778015848714858, "global_step": 64447, "epoch": 541, "lr": 2.353584834303768e-06} +{"train_loss": 0.0005566290928982198, "global_step": 64448, "epoch": 541, "lr": 2.352913148026209e-06} +{"train_loss": 0.00036608788650482893, "global_step": 64449, "epoch": 541, "lr": 2.352241555298612e-06} +{"train_loss": 0.000268045550910756, "global_step": 64450, "epoch": 541, "lr": 2.3515700561223042e-06} +{"train_loss": 0.0002074349467875436, "global_step": 64451, "epoch": 541, "lr": 2.3508986504985896e-06} +{"train_loss": 0.00036476447712630033, "global_step": 64452, "epoch": 541, "lr": 2.3502273384287954e-06} +{"train_loss": 0.00037953892024233937, "global_step": 64453, "epoch": 541, "lr": 2.349556119914248e-06} +{"train_loss": 0.0003275782219134271, "global_step": 64454, "epoch": 541, "lr": 2.3488849949562465e-06} +{"train_loss": 0.0001837491145124659, "global_step": 64455, "epoch": 541, "lr": 2.3482139635561285e-06} +{"train_loss": 0.0005109001067467034, "global_step": 64456, "epoch": 541, "lr": 2.347543025715193e-06} +{"train_loss": 0.00017029960872605443, "global_step": 64457, "epoch": 541, "lr": 2.346872181434773e-06} +{"train_loss": 0.00023534342471975833, "global_step": 64458, "epoch": 541, "lr": 2.3462014307161773e-06} +{"train_loss": 0.0003786342276725918, "global_step": 64459, "epoch": 541, "lr": 2.3455307735607222e-06} +{"train_loss": 0.00020117878739256412, "global_step": 64460, "epoch": 541, "lr": 2.3448602099697292e-06} +{"train_loss": 0.0002918723621405661, "global_step": 64461, "epoch": 541, "lr": 2.3441897399445024e-06} +{"train_loss": 0.0002785138785839081, "global_step": 64462, "epoch": 541, "lr": 2.3435193634863796e-06} +{"train_loss": 0.0002449716266710311, "global_step": 64463, "epoch": 541, "lr": 2.3428490805966542e-06} +{"train_loss": 0.0002864162379410118, "global_step": 64464, "epoch": 541, "lr": 2.342178891276664e-06} +{"train_loss": 0.0003004884347319603, "global_step": 64465, "epoch": 541, "lr": 2.3415087955277136e-06} +{"train_loss": 0.00037149203126318753, "global_step": 64466, "epoch": 541, "lr": 2.340838793351108e-06} +{"train_loss": 0.00024394552747253329, "global_step": 64467, "epoch": 541, "lr": 2.340168884748184e-06} +{"train_loss": 0.00022755726240575314, "global_step": 64468, "epoch": 541, "lr": 2.339499069720241e-06} +{"train_loss": 0.0002637138532008976, "global_step": 64469, "epoch": 541, "lr": 2.3388293482686065e-06} +{"train_loss": 0.00039228933746926486, "global_step": 64470, "epoch": 541, "lr": 2.338159720394584e-06} +{"train_loss": 0.00020869109721388668, "global_step": 64471, "epoch": 541, "lr": 2.337490186099489e-06} +{"train_loss": 0.00018438781262375414, "global_step": 64472, "epoch": 541, "lr": 2.336820745384649e-06} +{"train_loss": 0.00023125007282942533, "global_step": 64473, "epoch": 541, "lr": 2.336151398251363e-06} +{"train_loss": 0.000449611950898543, "global_step": 64474, "epoch": 541, "lr": 2.3354821447009566e-06} +{"train_loss": 0.0003118898894172162, "global_step": 64475, "epoch": 541, "lr": 2.33481298473473e-06} +{"train_loss": 0.00019958407210651785, "global_step": 64476, "epoch": 541, "lr": 2.334143918354015e-06} +{"train_loss": 0.00019205984426662326, "global_step": 64477, "epoch": 541, "lr": 2.3334749455601156e-06} +{"train_loss": 0.00044982077088207006, "global_step": 64478, "epoch": 541, "lr": 2.3328060663543373e-06} +{"train_loss": 0.00019775066175498068, "global_step": 64479, "epoch": 541, "lr": 2.3321372807380116e-06} +{"train_loss": 0.00016815034905448556, "global_step": 64480, "epoch": 541, "lr": 2.3314685887124322e-06} +{"train_loss": 0.0002733097644522786, "global_step": 64481, "epoch": 541, "lr": 2.3307999902789313e-06} +{"train_loss": 0.00016374464030377567, "global_step": 64482, "epoch": 541, "lr": 2.330131485438802e-06} +{"train_loss": 0.0002762430813163519, "global_step": 64483, "epoch": 541, "lr": 2.329463074193372e-06} +{"train_loss": 0.0003557907184585929, "global_step": 64484, "epoch": 541, "lr": 2.328794756543945e-06} +{"train_loss": 0.00020700796449091285, "global_step": 64485, "epoch": 541, "lr": 2.3281265324918478e-06} +{"train_loss": 0.00032537608058191836, "global_step": 64486, "epoch": 541, "lr": 2.3274584020383683e-06} +{"train_loss": 0.0001788899680832401, "global_step": 64487, "epoch": 541, "lr": 2.326790365184833e-06} +{"train_loss": 0.0003499227750580758, "global_step": 64488, "epoch": 541, "lr": 2.3261224219325583e-06} +{"train_loss": 0.00040536755113862455, "global_step": 64489, "epoch": 541, "lr": 2.325454572282848e-06} +{"train_loss": 0.0002523189759813249, "global_step": 64490, "epoch": 541, "lr": 2.324786816237007e-06} +{"train_loss": 0.00023385185340885073, "global_step": 64491, "epoch": 541, "lr": 2.3241191537963616e-06} +{"train_loss": 0.0002840063243638724, "global_step": 64492, "epoch": 541, "lr": 2.3234515849622053e-06} +{"train_loss": 0.00019729761697817594, "global_step": 64493, "epoch": 541, "lr": 2.3227841097358703e-06} +{"train_loss": 0.00022251445625443012, "global_step": 64494, "epoch": 541, "lr": 2.322116728118645e-06} +{"train_loss": 0.00019904537475667894, "global_step": 64495, "epoch": 541, "lr": 2.321449440111856e-06} +{"train_loss": 0.00025235721841454506, "global_step": 64496, "epoch": 541, "lr": 2.320782245716813e-06} +{"train_loss": 0.0002856331181853321, "global_step": 64497, "epoch": 541, "lr": 2.320115144934809e-06, "val_loss": 0.03658907487988472} +{"train_loss": 0.00020225705520715564, "global_step": 64498, "epoch": 542, "lr": 2.319448137767172e-06} +{"train_loss": 0.0002758128975983709, "global_step": 64499, "epoch": 542, "lr": 2.3187812242151995e-06} +{"train_loss": 0.00031566937104798853, "global_step": 64500, "epoch": 542, "lr": 2.3181144042802083e-06} +{"train_loss": 0.00021513050887733698, "global_step": 64501, "epoch": 542, "lr": 2.317447677963508e-06} +{"train_loss": 0.0002869389718398452, "global_step": 64502, "epoch": 542, "lr": 2.316781045266403e-06} +{"train_loss": 0.00017424013640265912, "global_step": 64503, "epoch": 542, "lr": 2.3161145061902034e-06} +{"train_loss": 0.00034828431671485305, "global_step": 64504, "epoch": 542, "lr": 2.3154480607362196e-06} +{"train_loss": 0.00027230047271586955, "global_step": 64505, "epoch": 542, "lr": 2.314781708905761e-06} +{"train_loss": 0.00019498422625474632, "global_step": 64506, "epoch": 542, "lr": 2.3141154507001273e-06} +{"train_loss": 0.00037584148230962455, "global_step": 64507, "epoch": 542, "lr": 2.313449286120639e-06} +{"train_loss": 0.0006796859088353813, "global_step": 64508, "epoch": 542, "lr": 2.3127832151686014e-06} +{"train_loss": 0.0003688590368255973, "global_step": 64509, "epoch": 542, "lr": 2.3121172378453126e-06} +{"train_loss": 0.0003140409826301038, "global_step": 64510, "epoch": 542, "lr": 2.3114513541520942e-06} +{"train_loss": 0.00017125604790635407, "global_step": 64511, "epoch": 542, "lr": 2.310785564090234e-06} +{"train_loss": 0.0001278839772567153, "global_step": 64512, "epoch": 542, "lr": 2.3101198676610646e-06} +{"train_loss": 0.00022139122302178293, "global_step": 64513, "epoch": 542, "lr": 2.3094542648658678e-06} +{"train_loss": 0.00017194105021189898, "global_step": 64514, "epoch": 542, "lr": 2.3087887557059763e-06} +{"train_loss": 0.00024384706921409816, "global_step": 64515, "epoch": 542, "lr": 2.308123340182672e-06} +{"train_loss": 0.0006453021196648479, "global_step": 64516, "epoch": 542, "lr": 2.307458018297276e-06} +{"train_loss": 0.00022685900330543518, "global_step": 64517, "epoch": 542, "lr": 2.306792790051088e-06} +{"train_loss": 0.00019107360276393592, "global_step": 64518, "epoch": 542, "lr": 2.3061276554454282e-06} +{"train_loss": 0.00016381798195652664, "global_step": 64519, "epoch": 542, "lr": 2.305462614481579e-06} +{"train_loss": 0.00025890531833283603, "global_step": 64520, "epoch": 542, "lr": 2.304797667160863e-06} +{"train_loss": 0.00044045704999007285, "global_step": 64521, "epoch": 542, "lr": 2.304132813484583e-06} +{"train_loss": 0.0001747545029502362, "global_step": 64522, "epoch": 542, "lr": 2.303468053454044e-06} +{"train_loss": 0.00026508368318900466, "global_step": 64523, "epoch": 542, "lr": 2.30280338707054e-06} +{"train_loss": 0.0004222863935865462, "global_step": 64524, "epoch": 542, "lr": 2.3021388143353974e-06} +{"train_loss": 0.0007374720880761743, "global_step": 64525, "epoch": 542, "lr": 2.3014743352499036e-06} +{"train_loss": 0.00016125888214446604, "global_step": 64526, "epoch": 542, "lr": 2.300809949815369e-06} +{"train_loss": 0.0002711036941036582, "global_step": 64527, "epoch": 542, "lr": 2.3001456580331038e-06} +{"train_loss": 0.00022457474551629275, "global_step": 64528, "epoch": 542, "lr": 2.299481459904401e-06} +{"train_loss": 0.00034311701892875135, "global_step": 64529, "epoch": 542, "lr": 2.2988173554305713e-06} +{"train_loss": 0.00029916284256614745, "global_step": 64530, "epoch": 542, "lr": 2.298153344612919e-06} +{"train_loss": 0.000580536900088191, "global_step": 64531, "epoch": 542, "lr": 2.297489427452748e-06} +{"train_loss": 0.00021364640269894153, "global_step": 64532, "epoch": 542, "lr": 2.2968256039513527e-06} +{"train_loss": 0.00028601367375813425, "global_step": 64533, "epoch": 542, "lr": 2.2961618741100534e-06} +{"train_loss": 0.00022778534912504256, "global_step": 64534, "epoch": 542, "lr": 2.2954982379301435e-06} +{"train_loss": 0.00019636045908555388, "global_step": 64535, "epoch": 542, "lr": 2.2948346954129173e-06} +{"train_loss": 0.00019679282559081912, "global_step": 64536, "epoch": 542, "lr": 2.2941712465596953e-06} +{"train_loss": 0.0004498831112869084, "global_step": 64537, "epoch": 542, "lr": 2.2935078913717654e-06} +{"train_loss": 0.00026246588095091283, "global_step": 64538, "epoch": 542, "lr": 2.292844629850438e-06} +{"train_loss": 0.00019758258713409305, "global_step": 64539, "epoch": 542, "lr": 2.2921814619970173e-06} +{"train_loss": 0.0010871472768485546, "global_step": 64540, "epoch": 542, "lr": 2.2915183878127966e-06} +{"train_loss": 0.0002710944099817425, "global_step": 64541, "epoch": 542, "lr": 2.290855407299086e-06} +{"train_loss": 0.00048592849634587765, "global_step": 64542, "epoch": 542, "lr": 2.2901925204571793e-06} +{"train_loss": 0.0002920422120951116, "global_step": 64543, "epoch": 542, "lr": 2.2895297272883866e-06} +{"train_loss": 0.0002795153995975852, "global_step": 64544, "epoch": 542, "lr": 2.2888670277940004e-06} +{"train_loss": 0.0001569204468978569, "global_step": 64545, "epoch": 542, "lr": 2.288204421975332e-06} +{"train_loss": 0.00028407256468199193, "global_step": 64546, "epoch": 542, "lr": 2.287541909833679e-06} +{"train_loss": 0.00027442420832812786, "global_step": 64547, "epoch": 542, "lr": 2.2868794913703308e-06} +{"train_loss": 0.0002789455757010728, "global_step": 64548, "epoch": 542, "lr": 2.286217166586607e-06} +{"train_loss": 0.0001313209068030119, "global_step": 64549, "epoch": 542, "lr": 2.2855549354837912e-06} +{"train_loss": 0.00015496234118472785, "global_step": 64550, "epoch": 542, "lr": 2.2848927980631872e-06} +{"train_loss": 0.00032237518462352455, "global_step": 64551, "epoch": 542, "lr": 2.284230754326111e-06} +{"train_loss": 0.0001244375598616898, "global_step": 64552, "epoch": 542, "lr": 2.283568804273839e-06} +{"train_loss": 0.00027156894793733954, "global_step": 64553, "epoch": 542, "lr": 2.2829069479076925e-06} +{"train_loss": 0.0002633130643516779, "global_step": 64554, "epoch": 542, "lr": 2.282245185228948e-06} +{"train_loss": 0.00018131341494154185, "global_step": 64555, "epoch": 542, "lr": 2.2815835162389275e-06} +{"train_loss": 0.0003290509048383683, "global_step": 64556, "epoch": 542, "lr": 2.2809219409389127e-06} +{"train_loss": 0.00026856950717046857, "global_step": 64557, "epoch": 542, "lr": 2.280260459330219e-06} +{"train_loss": 0.0002947064640466124, "global_step": 64558, "epoch": 542, "lr": 2.279599071414129e-06} +{"train_loss": 0.00016604211123194546, "global_step": 64559, "epoch": 542, "lr": 2.2789377771919474e-06} +{"train_loss": 0.0007233492215164006, "global_step": 64560, "epoch": 542, "lr": 2.2782765766649785e-06} +{"train_loss": 0.0004284101305529475, "global_step": 64561, "epoch": 542, "lr": 2.2776154698345097e-06} +{"train_loss": 0.0003813797084148973, "global_step": 64562, "epoch": 542, "lr": 2.2769544567018463e-06} +{"train_loss": 0.0002183247997891158, "global_step": 64563, "epoch": 542, "lr": 2.2762935372682815e-06} +{"train_loss": 0.0004936742479912937, "global_step": 64564, "epoch": 542, "lr": 2.2756327115351195e-06} +{"train_loss": 0.0002197971334680915, "global_step": 64565, "epoch": 542, "lr": 2.2749719795036597e-06} +{"train_loss": 0.0003979741013608873, "global_step": 64566, "epoch": 542, "lr": 2.2743113411751837e-06} +{"train_loss": 0.0002807762648444623, "global_step": 64567, "epoch": 542, "lr": 2.2736507965510023e-06} +{"train_loss": 0.00022998852364253253, "global_step": 64568, "epoch": 542, "lr": 2.2729903456324085e-06} +{"train_loss": 0.0001202348867082037, "global_step": 64569, "epoch": 542, "lr": 2.2723299884207015e-06} +{"train_loss": 0.00021559880406130105, "global_step": 64570, "epoch": 542, "lr": 2.271669724917175e-06} +{"train_loss": 0.0002082066930597648, "global_step": 64571, "epoch": 542, "lr": 2.2710095551231213e-06} +{"train_loss": 0.00016449743998236954, "global_step": 64572, "epoch": 542, "lr": 2.2703494790398462e-06} +{"train_loss": 0.0003077338042203337, "global_step": 64573, "epoch": 542, "lr": 2.2696894966686364e-06} +{"train_loss": 0.00029881764203310013, "global_step": 64574, "epoch": 542, "lr": 2.2690296080107976e-06} +{"train_loss": 0.0003575723385438323, "global_step": 64575, "epoch": 542, "lr": 2.2683698130676168e-06} +{"train_loss": 0.00020880045485682786, "global_step": 64576, "epoch": 542, "lr": 2.2677101118403933e-06} +{"train_loss": 0.00024390907492488623, "global_step": 64577, "epoch": 542, "lr": 2.2670505043304257e-06} +{"train_loss": 0.00047324306797236204, "global_step": 64578, "epoch": 542, "lr": 2.266390990538997e-06} +{"train_loss": 0.00025709293549880385, "global_step": 64579, "epoch": 542, "lr": 2.2657315704674166e-06} +{"train_loss": 0.00019616438657976687, "global_step": 64580, "epoch": 542, "lr": 2.2650722441169615e-06} +{"train_loss": 0.000275025813607499, "global_step": 64581, "epoch": 542, "lr": 2.264413011488953e-06} +{"train_loss": 0.0005720503395423293, "global_step": 64582, "epoch": 542, "lr": 2.2637538725846562e-06} +{"train_loss": 0.00025807571364566684, "global_step": 64583, "epoch": 542, "lr": 2.2630948274053874e-06} +{"train_loss": 0.00025577371707186103, "global_step": 64584, "epoch": 542, "lr": 2.2624358759524233e-06} +{"train_loss": 0.00026022334350273013, "global_step": 64585, "epoch": 542, "lr": 2.2617770182270683e-06} +{"train_loss": 0.0003196464094799012, "global_step": 64586, "epoch": 542, "lr": 2.261118254230621e-06} +{"train_loss": 0.0003449897048994899, "global_step": 64587, "epoch": 542, "lr": 2.2604595839643638e-06} +{"train_loss": 0.00022397663269657642, "global_step": 64588, "epoch": 542, "lr": 2.259801007429596e-06} +{"train_loss": 0.0003752511984203011, "global_step": 64589, "epoch": 542, "lr": 2.259142524627611e-06} +{"train_loss": 0.0001856817107181996, "global_step": 64590, "epoch": 542, "lr": 2.2584841355596908e-06} +{"train_loss": 0.000178095098817721, "global_step": 64591, "epoch": 542, "lr": 2.257825840227146e-06} +{"train_loss": 0.0003159863408654928, "global_step": 64592, "epoch": 542, "lr": 2.2571676386312525e-06} +{"train_loss": 0.0004966906271874905, "global_step": 64593, "epoch": 542, "lr": 2.256509530773315e-06} +{"train_loss": 0.0002716204326134175, "global_step": 64594, "epoch": 542, "lr": 2.2558515166546114e-06} +{"train_loss": 0.00019747050828300416, "global_step": 64595, "epoch": 542, "lr": 2.255193596276456e-06} +{"train_loss": 0.0003630689752753824, "global_step": 64596, "epoch": 542, "lr": 2.2545357696401204e-06} +{"train_loss": 0.00032948271837085485, "global_step": 64597, "epoch": 542, "lr": 2.253878036746898e-06} +{"train_loss": 0.00029368625837378204, "global_step": 64598, "epoch": 542, "lr": 2.253220397598094e-06} +{"train_loss": 0.00020307695376686752, "global_step": 64599, "epoch": 542, "lr": 2.2525628521949838e-06} +{"train_loss": 0.0003360102709848434, "global_step": 64600, "epoch": 542, "lr": 2.2519054005388727e-06} +{"train_loss": 0.0003175098972860724, "global_step": 64601, "epoch": 542, "lr": 2.2512480426310435e-06} +{"train_loss": 0.00018495302356313914, "global_step": 64602, "epoch": 542, "lr": 2.2505907784727777e-06} +{"train_loss": 0.00024355496861971915, "global_step": 64603, "epoch": 542, "lr": 2.2499336080653856e-06} +{"train_loss": 0.00017755264707375318, "global_step": 64604, "epoch": 542, "lr": 2.2492765314101383e-06} +{"train_loss": 0.00023429853899870068, "global_step": 64605, "epoch": 542, "lr": 2.248619548508346e-06} +{"train_loss": 0.00020550793851725757, "global_step": 64606, "epoch": 542, "lr": 2.24796265936128e-06} +{"train_loss": 0.00013747144839726388, "global_step": 64607, "epoch": 542, "lr": 2.2473058639702392e-06} +{"train_loss": 0.0002547101175878197, "global_step": 64608, "epoch": 542, "lr": 2.246649162336517e-06} +{"train_loss": 0.00044487405102699995, "global_step": 64609, "epoch": 542, "lr": 2.2459925544613903e-06} +{"train_loss": 0.0009769655298441648, "global_step": 64610, "epoch": 542, "lr": 2.245336040346163e-06} +{"train_loss": 0.0002769347629509866, "global_step": 64611, "epoch": 542, "lr": 2.244679619992107e-06} +{"train_loss": 0.00043213542085140944, "global_step": 64612, "epoch": 542, "lr": 2.244023293400527e-06} +{"train_loss": 0.00025499408366158605, "global_step": 64613, "epoch": 542, "lr": 2.243367060572699e-06} +{"train_loss": 0.00020489249436650425, "global_step": 64614, "epoch": 542, "lr": 2.2427109215099272e-06} +{"train_loss": 0.00018967378127854317, "global_step": 64615, "epoch": 542, "lr": 2.242054876213484e-06} +{"train_loss": 0.00030023772021248825, "global_step": 64616, "epoch": 542, "lr": 2.241398924684668e-06, "val_loss": 0.06810726225376129} +{"train_loss": 0.0005086843157187104, "global_step": 64617, "epoch": 543, "lr": 2.240743066924755e-06} +{"train_loss": 0.00034151243744418025, "global_step": 64618, "epoch": 543, "lr": 2.240087302935051e-06} +{"train_loss": 0.0003715134516824037, "global_step": 64619, "epoch": 543, "lr": 2.2394316327168208e-06} +{"train_loss": 0.0006014819373376667, "global_step": 64620, "epoch": 543, "lr": 2.23877605627138e-06} +{"train_loss": 0.00035395327722653747, "global_step": 64621, "epoch": 543, "lr": 2.2381205735999833e-06} +{"train_loss": 0.000424415833549574, "global_step": 64622, "epoch": 543, "lr": 2.2374651847039463e-06} +{"train_loss": 0.0003677161002997309, "global_step": 64623, "epoch": 543, "lr": 2.2368098895845346e-06} +{"train_loss": 0.0003192239673808217, "global_step": 64624, "epoch": 543, "lr": 2.236154688243053e-06} +{"train_loss": 0.00019325919856783003, "global_step": 64625, "epoch": 543, "lr": 2.235499580680772e-06} +{"train_loss": 0.0002971711801365018, "global_step": 64626, "epoch": 543, "lr": 2.2348445668989915e-06} +{"train_loss": 0.0007645510486327112, "global_step": 64627, "epoch": 543, "lr": 2.234189646898993e-06} +{"train_loss": 0.0007722055306658149, "global_step": 64628, "epoch": 543, "lr": 2.2335348206820483e-06} +{"train_loss": 0.0001593292545294389, "global_step": 64629, "epoch": 543, "lr": 2.2328800882494614e-06} +{"train_loss": 0.00027975731063634157, "global_step": 64630, "epoch": 543, "lr": 2.2322254496025097e-06} +{"train_loss": 0.00047339327284134924, "global_step": 64631, "epoch": 543, "lr": 2.231570904742486e-06} +{"train_loss": 0.00019180212984792888, "global_step": 64632, "epoch": 543, "lr": 2.230916453670656e-06} +{"train_loss": 0.0007190589676611125, "global_step": 64633, "epoch": 543, "lr": 2.23026209638833e-06} +{"train_loss": 0.00044049409916624427, "global_step": 64634, "epoch": 543, "lr": 2.229607832896785e-06} +{"train_loss": 0.00045092665823176503, "global_step": 64635, "epoch": 543, "lr": 2.228953663197286e-06} +{"train_loss": 0.0002547441690694541, "global_step": 64636, "epoch": 543, "lr": 2.2282995872911436e-06} +{"train_loss": 0.0003442168526817113, "global_step": 64637, "epoch": 543, "lr": 2.2276456051796292e-06} +{"train_loss": 0.00033271528081968427, "global_step": 64638, "epoch": 543, "lr": 2.2269917168640296e-06} +{"train_loss": 0.00041175182559527457, "global_step": 64639, "epoch": 543, "lr": 2.2263379223456283e-06} +{"train_loss": 0.00035425028181634843, "global_step": 64640, "epoch": 543, "lr": 2.2256842216257066e-06} +{"train_loss": 0.00020302976190578192, "global_step": 64641, "epoch": 543, "lr": 2.225030614705553e-06} +{"train_loss": 0.00025872685364447534, "global_step": 64642, "epoch": 543, "lr": 2.224377101586439e-06} +{"train_loss": 0.00020452114404179156, "global_step": 64643, "epoch": 543, "lr": 2.2237236822696683e-06} +{"train_loss": 0.00019912909192498773, "global_step": 64644, "epoch": 543, "lr": 2.2230703567565016e-06} +{"train_loss": 0.0002749759005382657, "global_step": 64645, "epoch": 543, "lr": 2.222417125048243e-06} +{"train_loss": 0.0003735495556611568, "global_step": 64646, "epoch": 543, "lr": 2.221763987146158e-06} +{"train_loss": 0.00019002131011802703, "global_step": 64647, "epoch": 543, "lr": 2.22111094305153e-06} +{"train_loss": 0.0006658196216449142, "global_step": 64648, "epoch": 543, "lr": 2.220457992765651e-06} +{"train_loss": 0.0002813534811139107, "global_step": 64649, "epoch": 543, "lr": 2.2198051362897987e-06} +{"train_loss": 0.0004131845780648291, "global_step": 64650, "epoch": 543, "lr": 2.219152373625255e-06} +{"train_loss": 0.0002908030874095857, "global_step": 64651, "epoch": 543, "lr": 2.2184997047733023e-06} +{"train_loss": 0.0001936428452609107, "global_step": 64652, "epoch": 543, "lr": 2.2178471297352122e-06} +{"train_loss": 0.0004230798513162881, "global_step": 64653, "epoch": 543, "lr": 2.217194648512283e-06} +{"train_loss": 0.0003695093037094921, "global_step": 64654, "epoch": 543, "lr": 2.216542261105786e-06} +{"train_loss": 0.0003741465916391462, "global_step": 64655, "epoch": 543, "lr": 2.2158899675170043e-06} +{"train_loss": 0.00021460145944729447, "global_step": 64656, "epoch": 543, "lr": 2.215237767747214e-06} +{"train_loss": 0.0001553056645207107, "global_step": 64657, "epoch": 543, "lr": 2.2145856617977025e-06} +{"train_loss": 0.00040701794205233455, "global_step": 64658, "epoch": 543, "lr": 2.2139336496697473e-06} +{"train_loss": 0.0004981079837307334, "global_step": 64659, "epoch": 543, "lr": 2.2132817313646248e-06} +{"train_loss": 0.0003991240228060633, "global_step": 64660, "epoch": 543, "lr": 2.212629906883623e-06} +{"train_loss": 0.00026031502056866884, "global_step": 64661, "epoch": 543, "lr": 2.211978176228008e-06} +{"train_loss": 0.00022453303972724825, "global_step": 64662, "epoch": 543, "lr": 2.211326539399078e-06} +{"train_loss": 0.00018448963237460703, "global_step": 64663, "epoch": 543, "lr": 2.210674996398099e-06} +{"train_loss": 0.00037803553277626634, "global_step": 64664, "epoch": 543, "lr": 2.2100235472263585e-06} +{"train_loss": 0.00040020656888373196, "global_step": 64665, "epoch": 543, "lr": 2.2093721918851283e-06} +{"train_loss": 0.00029000334325246513, "global_step": 64666, "epoch": 543, "lr": 2.208720930375685e-06} +{"train_loss": 0.00033477661781944335, "global_step": 64667, "epoch": 543, "lr": 2.2080697626993217e-06} +{"train_loss": 0.00021681231737602502, "global_step": 64668, "epoch": 543, "lr": 2.207418688857299e-06} +{"train_loss": 0.0002564449096098542, "global_step": 64669, "epoch": 543, "lr": 2.2067677088509098e-06} +{"train_loss": 0.0007098487694747746, "global_step": 64670, "epoch": 543, "lr": 2.2061168226814255e-06} +{"train_loss": 0.00030369844171218574, "global_step": 64671, "epoch": 543, "lr": 2.2054660303501174e-06} +{"train_loss": 0.0003234108444303274, "global_step": 64672, "epoch": 543, "lr": 2.2048153318582844e-06} +{"train_loss": 0.0002885236172005534, "global_step": 64673, "epoch": 543, "lr": 2.2041647272071754e-06} +{"train_loss": 0.0002377846249146387, "global_step": 64674, "epoch": 543, "lr": 2.203514216398095e-06} +{"train_loss": 0.0004386940854601562, "global_step": 64675, "epoch": 543, "lr": 2.2028637994322974e-06} +{"train_loss": 0.0003499306330922991, "global_step": 64676, "epoch": 543, "lr": 2.2022134763110767e-06} +{"train_loss": 0.00025594979524612427, "global_step": 64677, "epoch": 543, "lr": 2.2015632470357096e-06} +{"train_loss": 0.00036866526352241635, "global_step": 64678, "epoch": 543, "lr": 2.2009131116074554e-06} +{"train_loss": 0.00047687868936918676, "global_step": 64679, "epoch": 543, "lr": 2.200263070027608e-06} +{"train_loss": 0.00025928474497050047, "global_step": 64680, "epoch": 543, "lr": 2.199613122297428e-06} +{"train_loss": 0.0002682201156858355, "global_step": 64681, "epoch": 543, "lr": 2.198963268418214e-06} +{"train_loss": 0.000367977365385741, "global_step": 64682, "epoch": 543, "lr": 2.19831350839122e-06} +{"train_loss": 0.0004606545844580978, "global_step": 64683, "epoch": 543, "lr": 2.1976638422177286e-06} +{"train_loss": 0.00027439792756922543, "global_step": 64684, "epoch": 543, "lr": 2.1970142698990224e-06} +{"train_loss": 0.0002175252157030627, "global_step": 64685, "epoch": 543, "lr": 2.196364791436373e-06} +{"train_loss": 0.00049541553016752, "global_step": 64686, "epoch": 543, "lr": 2.1957154068310505e-06} +{"train_loss": 0.00041329284431412816, "global_step": 64687, "epoch": 543, "lr": 2.195066116084332e-06} +{"train_loss": 0.0004119492368772626, "global_step": 64688, "epoch": 543, "lr": 2.1944169191975007e-06} +{"train_loss": 0.0002917919773608446, "global_step": 64689, "epoch": 543, "lr": 2.1937678161718268e-06} +{"train_loss": 0.0002623718464747071, "global_step": 64690, "epoch": 543, "lr": 2.193118807008576e-06} +{"train_loss": 0.0002289859257871285, "global_step": 64691, "epoch": 543, "lr": 2.1924698917090313e-06} +{"train_loss": 0.00020185348694212735, "global_step": 64692, "epoch": 543, "lr": 2.191821070274458e-06} +{"train_loss": 0.00044498531497083604, "global_step": 64693, "epoch": 543, "lr": 2.191172342706149e-06} +{"train_loss": 0.0001984415139304474, "global_step": 64694, "epoch": 543, "lr": 2.1905237090053545e-06} +{"train_loss": 0.00020630542712751776, "global_step": 64695, "epoch": 543, "lr": 2.189875169173361e-06} +{"train_loss": 0.0001998451625695452, "global_step": 64696, "epoch": 543, "lr": 2.189226723211446e-06} +{"train_loss": 0.00026284411433152854, "global_step": 64697, "epoch": 543, "lr": 2.1885783711208696e-06} +{"train_loss": 0.00033367465948686004, "global_step": 64698, "epoch": 543, "lr": 2.1879301129029196e-06} +{"train_loss": 0.00023649950162507594, "global_step": 64699, "epoch": 543, "lr": 2.1872819485588503e-06} +{"train_loss": 0.00023921382671687752, "global_step": 64700, "epoch": 543, "lr": 2.186633878089955e-06} +{"train_loss": 0.00021509914950001985, "global_step": 64701, "epoch": 543, "lr": 2.1859859014974835e-06} +{"train_loss": 0.0002953711082227528, "global_step": 64702, "epoch": 543, "lr": 2.1853380187827344e-06} +{"train_loss": 0.00029723599436692894, "global_step": 64703, "epoch": 543, "lr": 2.1846902299469617e-06} +{"train_loss": 0.00032376052695326507, "global_step": 64704, "epoch": 543, "lr": 2.1840425349914373e-06} +{"train_loss": 0.00029351614648476243, "global_step": 64705, "epoch": 543, "lr": 2.1833949339174373e-06} +{"train_loss": 0.00016999557556118816, "global_step": 64706, "epoch": 543, "lr": 2.182747426726234e-06} +{"train_loss": 0.00045872447662986815, "global_step": 64707, "epoch": 543, "lr": 2.1821000134191028e-06} +{"train_loss": 0.00019162354874424636, "global_step": 64708, "epoch": 543, "lr": 2.1814526939973047e-06} +{"train_loss": 0.000581390515435487, "global_step": 64709, "epoch": 543, "lr": 2.180805468462116e-06} +{"train_loss": 0.0002970312489196658, "global_step": 64710, "epoch": 543, "lr": 2.1801583368148084e-06} +{"train_loss": 0.0002114139642799273, "global_step": 64711, "epoch": 543, "lr": 2.1795112990566467e-06} +{"train_loss": 0.0004330261144787073, "global_step": 64712, "epoch": 543, "lr": 2.1788643551889087e-06} +{"train_loss": 0.00022467343660537153, "global_step": 64713, "epoch": 543, "lr": 2.1782175052128594e-06} +{"train_loss": 0.00018650986021384597, "global_step": 64714, "epoch": 543, "lr": 2.177570749129776e-06} +{"train_loss": 0.0003087376826442778, "global_step": 64715, "epoch": 543, "lr": 2.176924086940918e-06} +{"train_loss": 0.00022025052749086171, "global_step": 64716, "epoch": 543, "lr": 2.1762775186475624e-06} +{"train_loss": 0.0005684159696102142, "global_step": 64717, "epoch": 543, "lr": 2.1756310442509754e-06} +{"train_loss": 0.0003104734350927174, "global_step": 64718, "epoch": 543, "lr": 2.1749846637524273e-06} +{"train_loss": 0.00020677101565524936, "global_step": 64719, "epoch": 543, "lr": 2.17433837715319e-06} +{"train_loss": 0.0008960776613093913, "global_step": 64720, "epoch": 543, "lr": 2.173692184454529e-06} +{"train_loss": 0.00025144219398498535, "global_step": 64721, "epoch": 543, "lr": 2.173046085657715e-06} +{"train_loss": 0.00026427878765389323, "global_step": 64722, "epoch": 543, "lr": 2.17240008076402e-06} +{"train_loss": 0.0002336938923690468, "global_step": 64723, "epoch": 543, "lr": 2.171754169774698e-06} +{"train_loss": 0.0001864754012785852, "global_step": 64724, "epoch": 543, "lr": 2.171108352691037e-06} +{"train_loss": 0.00040716261719353497, "global_step": 64725, "epoch": 543, "lr": 2.170462629514286e-06} +{"train_loss": 0.00014826515689492226, "global_step": 64726, "epoch": 543, "lr": 2.1698170002457274e-06} +{"train_loss": 0.00019798087305389345, "global_step": 64727, "epoch": 543, "lr": 2.1691714648866213e-06} +{"train_loss": 0.00016053863510023803, "global_step": 64728, "epoch": 543, "lr": 2.1685260234382334e-06} +{"train_loss": 0.0001904263044707477, "global_step": 64729, "epoch": 543, "lr": 2.16788067590184e-06} +{"train_loss": 0.00026701739989221096, "global_step": 64730, "epoch": 543, "lr": 2.1672354222787015e-06} +{"train_loss": 0.00036529891076497734, "global_step": 64731, "epoch": 543, "lr": 2.166590262570084e-06} +{"train_loss": 0.0006101857288740575, "global_step": 64732, "epoch": 543, "lr": 2.165945196777258e-06} +{"train_loss": 0.00017559895059093833, "global_step": 64733, "epoch": 543, "lr": 2.1653002249014898e-06} +{"train_loss": 0.00022303906735032797, "global_step": 64734, "epoch": 543, "lr": 2.1646553469440443e-06} +{"train_loss": 0.00033043590550381344, "global_step": 64735, "epoch": 543, "lr": 2.1640105629061825e-06, "val_loss": 0.011231629177927971} +{"train_loss": 0.00020629270875360817, "global_step": 64736, "epoch": 544, "lr": 2.1633658727891804e-06} +{"train_loss": 0.00023262031027115881, "global_step": 64737, "epoch": 544, "lr": 2.1627212765942984e-06} +{"train_loss": 0.00022670724138151854, "global_step": 64738, "epoch": 544, "lr": 2.162076774322802e-06} +{"train_loss": 0.00019524862000253052, "global_step": 64739, "epoch": 544, "lr": 2.161432365975957e-06} +{"train_loss": 0.0003707737778313458, "global_step": 64740, "epoch": 544, "lr": 2.160788051555024e-06} +{"train_loss": 0.00022068926773499697, "global_step": 64741, "epoch": 544, "lr": 2.1601438310612843e-06} +{"train_loss": 0.00012777437223121524, "global_step": 64742, "epoch": 544, "lr": 2.1594997044959763e-06} +{"train_loss": 0.0002625164343044162, "global_step": 64743, "epoch": 544, "lr": 2.1588556718603936e-06} +{"train_loss": 0.0005188305513001978, "global_step": 64744, "epoch": 544, "lr": 2.158211733155774e-06} +{"train_loss": 0.00024536921409890056, "global_step": 64745, "epoch": 544, "lr": 2.157567888383405e-06} +{"train_loss": 0.00024672175641171634, "global_step": 64746, "epoch": 544, "lr": 2.15692413754453e-06} +{"train_loss": 0.0003466122143436223, "global_step": 64747, "epoch": 544, "lr": 2.1562804806404322e-06} +{"train_loss": 0.0004784519551321864, "global_step": 64748, "epoch": 544, "lr": 2.15563691767236e-06} +{"train_loss": 0.0002083217550534755, "global_step": 64749, "epoch": 544, "lr": 2.1549934486415903e-06} +{"train_loss": 0.0003224745742045343, "global_step": 64750, "epoch": 544, "lr": 2.1543500735493717e-06} +{"train_loss": 0.00037509322282858193, "global_step": 64751, "epoch": 544, "lr": 2.153706792396987e-06} +{"train_loss": 0.0001514488540124148, "global_step": 64752, "epoch": 544, "lr": 2.153063605185673e-06} +{"train_loss": 0.000258850835962221, "global_step": 64753, "epoch": 544, "lr": 2.1524205119167195e-06} +{"train_loss": 0.00027631461853161454, "global_step": 64754, "epoch": 544, "lr": 2.151777512591363e-06} +{"train_loss": 0.0003641593793872744, "global_step": 64755, "epoch": 544, "lr": 2.1511346072108916e-06} +{"train_loss": 0.00015002880536485463, "global_step": 64756, "epoch": 544, "lr": 2.150491795776549e-06} +{"train_loss": 0.0003083802876062691, "global_step": 64757, "epoch": 544, "lr": 2.149849078289606e-06} +{"train_loss": 0.0003419087443035096, "global_step": 64758, "epoch": 544, "lr": 2.1492064547513292e-06} +{"train_loss": 0.0005236136494204402, "global_step": 64759, "epoch": 544, "lr": 2.1485639251629606e-06} +{"train_loss": 0.00038312820834107697, "global_step": 64760, "epoch": 544, "lr": 2.1479214895257836e-06} +{"train_loss": 0.0002961926511488855, "global_step": 64761, "epoch": 544, "lr": 2.1472791478410415e-06} +{"train_loss": 0.0002471102343406528, "global_step": 64762, "epoch": 544, "lr": 2.146636900110016e-06} +{"train_loss": 0.00017334478616248816, "global_step": 64763, "epoch": 544, "lr": 2.1459947463339458e-06} +{"train_loss": 0.00022416679712478071, "global_step": 64764, "epoch": 544, "lr": 2.1453526865141125e-06} +{"train_loss": 0.00031012052204459906, "global_step": 64765, "epoch": 544, "lr": 2.144710720651766e-06} +{"train_loss": 0.0001518295321147889, "global_step": 64766, "epoch": 544, "lr": 2.1440688487481596e-06} +{"train_loss": 0.00019983974925708026, "global_step": 64767, "epoch": 544, "lr": 2.1434270708045655e-06} +{"train_loss": 0.0004107592103537172, "global_step": 64768, "epoch": 544, "lr": 2.1427853868222324e-06} +{"train_loss": 0.00021583960915450007, "global_step": 64769, "epoch": 544, "lr": 2.1421437968024373e-06} +{"train_loss": 0.00016425045032519847, "global_step": 64770, "epoch": 544, "lr": 2.141502300746423e-06} +{"train_loss": 0.00022810710652265698, "global_step": 64771, "epoch": 544, "lr": 2.1408608986554666e-06} +{"train_loss": 0.0001693710801191628, "global_step": 64772, "epoch": 544, "lr": 2.140219590530812e-06} +{"train_loss": 0.00030963157769292593, "global_step": 64773, "epoch": 544, "lr": 2.1395783763737187e-06} +{"train_loss": 0.0003851077926810831, "global_step": 64774, "epoch": 544, "lr": 2.138937256185453e-06} +{"train_loss": 0.0003660490328911692, "global_step": 64775, "epoch": 544, "lr": 2.138296229967268e-06} +{"train_loss": 0.0002472414926160127, "global_step": 64776, "epoch": 544, "lr": 2.137655297720431e-06} +{"train_loss": 0.00042437773663550615, "global_step": 64777, "epoch": 544, "lr": 2.1370144594461904e-06} +{"train_loss": 0.00030476352549158037, "global_step": 64778, "epoch": 544, "lr": 2.136373715145806e-06} +{"train_loss": 0.0002716053859330714, "global_step": 64779, "epoch": 544, "lr": 2.135733064820539e-06} +{"train_loss": 0.00013048943947069347, "global_step": 64780, "epoch": 544, "lr": 2.1350925084716534e-06} +{"train_loss": 0.00024866126477718353, "global_step": 64781, "epoch": 544, "lr": 2.1344520461003937e-06} +{"train_loss": 0.00027322719688527286, "global_step": 64782, "epoch": 544, "lr": 2.1338116777080252e-06} +{"train_loss": 0.00030224359943531454, "global_step": 64783, "epoch": 544, "lr": 2.133171403295803e-06} +{"train_loss": 0.00029223773162811995, "global_step": 64784, "epoch": 544, "lr": 2.132531222864986e-06} +{"train_loss": 0.00047864147927612066, "global_step": 64785, "epoch": 544, "lr": 2.1318911364168303e-06} +{"train_loss": 0.00020562249119393528, "global_step": 64786, "epoch": 544, "lr": 2.131251143952595e-06} +{"train_loss": 0.0005962533177807927, "global_step": 64787, "epoch": 544, "lr": 2.130611245473524e-06} +{"train_loss": 0.00031973555451259017, "global_step": 64788, "epoch": 544, "lr": 2.1299714409808935e-06} +{"train_loss": 0.0002521425485610962, "global_step": 64789, "epoch": 544, "lr": 2.129331730475953e-06} +{"train_loss": 0.00038065476110205054, "global_step": 64790, "epoch": 544, "lr": 2.128692113959946e-06} +{"train_loss": 0.00015752404578961432, "global_step": 64791, "epoch": 544, "lr": 2.128052591434143e-06} +{"train_loss": 0.00040842677117325366, "global_step": 64792, "epoch": 544, "lr": 2.1274131628997885e-06} +{"train_loss": 0.0002838532964233309, "global_step": 64793, "epoch": 544, "lr": 2.1267738283581527e-06} +{"train_loss": 0.00020495579519774765, "global_step": 64794, "epoch": 544, "lr": 2.1261345878104742e-06} +{"train_loss": 0.00027103559114038944, "global_step": 64795, "epoch": 544, "lr": 2.125495441258024e-06} +{"train_loss": 0.00029013724997639656, "global_step": 64796, "epoch": 544, "lr": 2.1248563887020454e-06} +{"train_loss": 0.00034828358911909163, "global_step": 64797, "epoch": 544, "lr": 2.1242174301437934e-06} +{"train_loss": 0.00043139205081388354, "global_step": 64798, "epoch": 544, "lr": 2.1235785655845276e-06} +{"train_loss": 0.0005455365753732622, "global_step": 64799, "epoch": 544, "lr": 2.122939795025497e-06} +{"train_loss": 0.0004142209654673934, "global_step": 64800, "epoch": 544, "lr": 2.1223011184679675e-06} +{"train_loss": 0.0004268553457222879, "global_step": 64801, "epoch": 544, "lr": 2.121662535913177e-06} +{"train_loss": 0.00027912884252145886, "global_step": 64802, "epoch": 544, "lr": 2.121024047362391e-06} +{"train_loss": 0.00028122635558247566, "global_step": 64803, "epoch": 544, "lr": 2.1203856528168643e-06} +{"train_loss": 0.00023266702191904187, "global_step": 64804, "epoch": 544, "lr": 2.1197473522778345e-06} +{"train_loss": 0.0001694866077741608, "global_step": 64805, "epoch": 544, "lr": 2.119109145746573e-06} +{"train_loss": 0.0004136312927585095, "global_step": 64806, "epoch": 544, "lr": 2.1184710332243176e-06} +{"train_loss": 0.0006371996132656932, "global_step": 64807, "epoch": 544, "lr": 2.117833014712334e-06} +{"train_loss": 0.00020126154413446784, "global_step": 64808, "epoch": 544, "lr": 2.1171950902118764e-06} +{"train_loss": 0.0002667604712769389, "global_step": 64809, "epoch": 544, "lr": 2.116557259724178e-06} +{"train_loss": 0.00032001902582123876, "global_step": 64810, "epoch": 544, "lr": 2.1159195232505148e-06} +{"train_loss": 0.0002145324251614511, "global_step": 64811, "epoch": 544, "lr": 2.115281880792119e-06} +{"train_loss": 0.0004677889228332788, "global_step": 64812, "epoch": 544, "lr": 2.1146443323502574e-06} +{"train_loss": 0.00022859453747514635, "global_step": 64813, "epoch": 544, "lr": 2.1140068779261724e-06} +{"train_loss": 0.00035399312037043273, "global_step": 64814, "epoch": 544, "lr": 2.1133695175211186e-06} +{"train_loss": 0.00016394136764574796, "global_step": 64815, "epoch": 544, "lr": 2.112732251136351e-06} +{"train_loss": 0.0002985040773637593, "global_step": 64816, "epoch": 544, "lr": 2.112095078773113e-06} +{"train_loss": 0.00014882902905810624, "global_step": 64817, "epoch": 544, "lr": 2.1114580004326646e-06} +{"train_loss": 0.00028006252250634134, "global_step": 64818, "epoch": 544, "lr": 2.110821016116249e-06} +{"train_loss": 0.00026061126845888793, "global_step": 64819, "epoch": 544, "lr": 2.110184125825121e-06} +{"train_loss": 0.0004951725713908672, "global_step": 64820, "epoch": 544, "lr": 2.1095473295605295e-06} +{"train_loss": 0.0005621786694973707, "global_step": 64821, "epoch": 544, "lr": 2.108910627323729e-06} +{"train_loss": 0.000270948454272002, "global_step": 64822, "epoch": 544, "lr": 2.108274019115969e-06} +{"train_loss": 0.00014359969645738602, "global_step": 64823, "epoch": 544, "lr": 2.1076375049384867e-06} +{"train_loss": 0.00017546357412356883, "global_step": 64824, "epoch": 544, "lr": 2.1070010847925535e-06} +{"train_loss": 0.0005996621330268681, "global_step": 64825, "epoch": 544, "lr": 2.1063647586793968e-06} +{"train_loss": 0.0002591099473647773, "global_step": 64826, "epoch": 544, "lr": 2.105728526600281e-06} +{"train_loss": 0.0002487074816599488, "global_step": 64827, "epoch": 544, "lr": 2.105092388556451e-06} +{"train_loss": 0.00024677219334989786, "global_step": 64828, "epoch": 544, "lr": 2.104456344549155e-06} +{"train_loss": 0.00021194313012529165, "global_step": 64829, "epoch": 544, "lr": 2.103820394579642e-06} +{"train_loss": 0.00014714371354784817, "global_step": 64830, "epoch": 544, "lr": 2.1031845386491555e-06} +{"train_loss": 0.0003040415176656097, "global_step": 64831, "epoch": 544, "lr": 2.1025487767589556e-06} +{"train_loss": 0.00016667527961544693, "global_step": 64832, "epoch": 544, "lr": 2.1019131089102807e-06} +{"train_loss": 0.0002975187380798161, "global_step": 64833, "epoch": 544, "lr": 2.1012775351043846e-06} +{"train_loss": 0.0002227046206826344, "global_step": 64834, "epoch": 544, "lr": 2.100642055342511e-06} +{"train_loss": 0.0002752765722107142, "global_step": 64835, "epoch": 544, "lr": 2.1000066696259092e-06} +{"train_loss": 0.0005189386429265141, "global_step": 64836, "epoch": 544, "lr": 2.0993713779558276e-06} +{"train_loss": 0.00016655617218930274, "global_step": 64837, "epoch": 544, "lr": 2.09873618033351e-06} +{"train_loss": 0.00018071343947667629, "global_step": 64838, "epoch": 544, "lr": 2.0981010767602116e-06} +{"train_loss": 0.00021792885672766715, "global_step": 64839, "epoch": 544, "lr": 2.0974660672371693e-06} +{"train_loss": 0.00017714561545290053, "global_step": 64840, "epoch": 544, "lr": 2.0968311517656437e-06} +{"train_loss": 0.00027976540150120854, "global_step": 64841, "epoch": 544, "lr": 2.0961963303468667e-06} +{"train_loss": 0.0005408694851212204, "global_step": 64842, "epoch": 544, "lr": 2.095561602982088e-06} +{"train_loss": 0.00029985932633280754, "global_step": 64843, "epoch": 544, "lr": 2.0949269696725615e-06} +{"train_loss": 0.00023659673752263188, "global_step": 64844, "epoch": 544, "lr": 2.09429243041952e-06} +{"train_loss": 0.00022108475968707353, "global_step": 64845, "epoch": 544, "lr": 2.093657985224223e-06} +{"train_loss": 0.00036028746399097145, "global_step": 64846, "epoch": 544, "lr": 2.0930236340879094e-06} +{"train_loss": 0.00019387886277399957, "global_step": 64847, "epoch": 544, "lr": 2.0923893770118275e-06} +{"train_loss": 0.0002696855808608234, "global_step": 64848, "epoch": 544, "lr": 2.0917552139972154e-06} +{"train_loss": 0.00028260439285077155, "global_step": 64849, "epoch": 544, "lr": 2.091121145045327e-06} +{"train_loss": 0.00031972385477274656, "global_step": 64850, "epoch": 544, "lr": 2.0904871701574016e-06} +{"train_loss": 0.00019786597113125026, "global_step": 64851, "epoch": 544, "lr": 2.089853289334687e-06} +{"train_loss": 0.00022808599169366062, "global_step": 64852, "epoch": 544, "lr": 2.089219502578432e-06} +{"train_loss": 0.00030258524930104613, "global_step": 64853, "epoch": 544, "lr": 2.0885858098898757e-06} +{"train_loss": 0.0002948791184853919, "global_step": 64854, "epoch": 544, "lr": 2.0879522112702553e-06, "val_loss": 0.008859606459736824} +{"train_loss": 0.00016346917254850268, "global_step": 64855, "epoch": 545, "lr": 2.087318706720831e-06} +{"train_loss": 0.00021461413416545838, "global_step": 64856, "epoch": 545, "lr": 2.0866852962428294e-06} +{"train_loss": 0.00028218142688274384, "global_step": 64857, "epoch": 545, "lr": 2.0860519798375112e-06} +{"train_loss": 0.0006443916354328394, "global_step": 64858, "epoch": 545, "lr": 2.085418757506108e-06} +{"train_loss": 0.000244037204538472, "global_step": 64859, "epoch": 545, "lr": 2.0847856292498635e-06} +{"train_loss": 0.0003003375604748726, "global_step": 64860, "epoch": 545, "lr": 2.0841525950700267e-06} +{"train_loss": 0.0002883790584746748, "global_step": 64861, "epoch": 545, "lr": 2.0835196549678304e-06} +{"train_loss": 0.00038757725269533694, "global_step": 64862, "epoch": 545, "lr": 2.0828868089445286e-06} +{"train_loss": 0.0002533821971155703, "global_step": 64863, "epoch": 545, "lr": 2.0822540570013595e-06} +{"train_loss": 0.0003052949905395508, "global_step": 64864, "epoch": 545, "lr": 2.081621399139566e-06} +{"train_loss": 0.00015261786757037044, "global_step": 64865, "epoch": 545, "lr": 2.0809888353603925e-06} +{"train_loss": 0.00031884326017461717, "global_step": 64866, "epoch": 545, "lr": 2.0803563656650704e-06} +{"train_loss": 0.0001670949422987178, "global_step": 64867, "epoch": 545, "lr": 2.079723990054855e-06} +{"train_loss": 0.0002320635539945215, "global_step": 64868, "epoch": 545, "lr": 2.079091708530978e-06} +{"train_loss": 0.00026682333555072546, "global_step": 64869, "epoch": 545, "lr": 2.078459521094689e-06} +{"train_loss": 0.00038940043305046856, "global_step": 64870, "epoch": 545, "lr": 2.0778274277472198e-06} +{"train_loss": 0.00031035993015393615, "global_step": 64871, "epoch": 545, "lr": 2.0771954284898253e-06} +{"train_loss": 0.0005284318467602134, "global_step": 64872, "epoch": 545, "lr": 2.0765635233237323e-06} +{"train_loss": 0.00022254166833590716, "global_step": 64873, "epoch": 545, "lr": 2.075931712250184e-06} +{"train_loss": 0.00024732580641284585, "global_step": 64874, "epoch": 545, "lr": 2.07529999527043e-06} +{"train_loss": 0.0002049651084234938, "global_step": 64875, "epoch": 545, "lr": 2.0746683723856963e-06} +{"train_loss": 0.0003846950421575457, "global_step": 64876, "epoch": 545, "lr": 2.0740368435972377e-06} +{"train_loss": 0.00022918469039723277, "global_step": 64877, "epoch": 545, "lr": 2.073405408906287e-06} +{"train_loss": 0.00020607888291124254, "global_step": 64878, "epoch": 545, "lr": 2.0727740683140873e-06} +{"train_loss": 0.00028269007452763617, "global_step": 64879, "epoch": 545, "lr": 2.0721428218218653e-06} +{"train_loss": 0.00024123929324559867, "global_step": 64880, "epoch": 545, "lr": 2.0715116694308813e-06} +{"train_loss": 0.00026953048654831946, "global_step": 64881, "epoch": 545, "lr": 2.070880611142356e-06} +{"train_loss": 0.00028412704705260694, "global_step": 64882, "epoch": 545, "lr": 2.070249646957545e-06} +{"train_loss": 0.0002709034306462854, "global_step": 64883, "epoch": 545, "lr": 2.069618776877669e-06} +{"train_loss": 0.0003895767731592059, "global_step": 64884, "epoch": 545, "lr": 2.068988000903982e-06} +{"train_loss": 0.0003093052073381841, "global_step": 64885, "epoch": 545, "lr": 2.0683573190377114e-06} +{"train_loss": 0.0002928110188804567, "global_step": 64886, "epoch": 545, "lr": 2.0677267312801064e-06} +{"train_loss": 0.00015096559945959598, "global_step": 64887, "epoch": 545, "lr": 2.067096237632388e-06} +{"train_loss": 0.00023930591123644263, "global_step": 64888, "epoch": 545, "lr": 2.0664658380958214e-06} +{"train_loss": 0.0006207709666341543, "global_step": 64889, "epoch": 545, "lr": 2.0658355326716115e-06} +{"train_loss": 0.0002769693674053997, "global_step": 64890, "epoch": 545, "lr": 2.0652053213610244e-06} +{"train_loss": 0.0005993600934743881, "global_step": 64891, "epoch": 545, "lr": 2.0645752041652866e-06} +{"train_loss": 0.00013907042739447206, "global_step": 64892, "epoch": 545, "lr": 2.0639451810856246e-06} +{"train_loss": 0.00022432993864640594, "global_step": 64893, "epoch": 545, "lr": 2.0633152521232933e-06} +{"train_loss": 0.0003847353800665587, "global_step": 64894, "epoch": 545, "lr": 2.0626854172795197e-06} +{"train_loss": 0.00043021663441322744, "global_step": 64895, "epoch": 545, "lr": 2.062055676555541e-06} +{"train_loss": 0.0006317157531157136, "global_step": 64896, "epoch": 545, "lr": 2.0614260299525954e-06} +{"train_loss": 0.00018824647122528404, "global_step": 64897, "epoch": 545, "lr": 2.0607964774719156e-06} +{"train_loss": 0.00028252051561139524, "global_step": 64898, "epoch": 545, "lr": 2.0601670191147447e-06} +{"train_loss": 0.00015771955077070743, "global_step": 64899, "epoch": 545, "lr": 2.0595376548823097e-06} +{"train_loss": 0.0005150004290044308, "global_step": 64900, "epoch": 545, "lr": 2.058908384775854e-06} +{"train_loss": 0.0001632517814869061, "global_step": 64901, "epoch": 545, "lr": 2.0582792087966042e-06} +{"train_loss": 0.0003968955425079912, "global_step": 64902, "epoch": 545, "lr": 2.057650126945809e-06} +{"train_loss": 0.00020029536972288042, "global_step": 64903, "epoch": 545, "lr": 2.0570211392246963e-06} +{"train_loss": 0.0004338210273999721, "global_step": 64904, "epoch": 545, "lr": 2.056392245634492e-06} +{"train_loss": 0.00022890295076649636, "global_step": 64905, "epoch": 545, "lr": 2.055763446176445e-06} +{"train_loss": 0.0001882896904135123, "global_step": 64906, "epoch": 545, "lr": 2.055134740851783e-06} +{"train_loss": 0.0003202009538654238, "global_step": 64907, "epoch": 545, "lr": 2.054506129661743e-06} +{"train_loss": 0.00033788118162192404, "global_step": 64908, "epoch": 545, "lr": 2.0538776126075632e-06} +{"train_loss": 0.0002387801359873265, "global_step": 64909, "epoch": 545, "lr": 2.0532491896904595e-06} +{"train_loss": 0.0001818947639549151, "global_step": 64910, "epoch": 545, "lr": 2.0526208609116915e-06} +{"train_loss": 0.000220812507905066, "global_step": 64911, "epoch": 545, "lr": 2.05199262627247e-06} +{"train_loss": 0.00027971892268396914, "global_step": 64912, "epoch": 545, "lr": 2.0513644857740375e-06} +{"train_loss": 0.00029305406496860087, "global_step": 64913, "epoch": 545, "lr": 2.0507364394176388e-06} +{"train_loss": 0.0002708390820771456, "global_step": 64914, "epoch": 545, "lr": 2.0501084872044886e-06} +{"train_loss": 0.0004272392834536731, "global_step": 64915, "epoch": 545, "lr": 2.0494806291358306e-06} +{"train_loss": 0.00015693956811446697, "global_step": 64916, "epoch": 545, "lr": 2.048852865212891e-06} +{"train_loss": 0.00026477835490368307, "global_step": 64917, "epoch": 545, "lr": 2.0482251954369146e-06} +{"train_loss": 0.00019907143723685294, "global_step": 64918, "epoch": 545, "lr": 2.0475976198091164e-06} +{"train_loss": 0.0005364150274544954, "global_step": 64919, "epoch": 545, "lr": 2.0469701383307447e-06} +{"train_loss": 0.00022083423391450197, "global_step": 64920, "epoch": 545, "lr": 2.0463427510030163e-06} +{"train_loss": 0.0002694599097594619, "global_step": 64921, "epoch": 545, "lr": 2.045715457827174e-06} +{"train_loss": 0.00036984545295126736, "global_step": 64922, "epoch": 545, "lr": 2.0450882588044506e-06} +{"train_loss": 0.0003594151057768613, "global_step": 64923, "epoch": 545, "lr": 2.0444611539360668e-06} +{"train_loss": 0.0004626289301086217, "global_step": 64924, "epoch": 545, "lr": 2.0438341432232666e-06} +{"train_loss": 0.00024293700698763132, "global_step": 64925, "epoch": 545, "lr": 2.0432072266672654e-06} +{"train_loss": 0.0003433647798374295, "global_step": 64926, "epoch": 545, "lr": 2.042580404269312e-06} +{"train_loss": 0.00048777792835608125, "global_step": 64927, "epoch": 545, "lr": 2.0419536760306336e-06} +{"train_loss": 0.00030069416970945895, "global_step": 64928, "epoch": 545, "lr": 2.04132704195244e-06} +{"train_loss": 0.0001702584995655343, "global_step": 64929, "epoch": 545, "lr": 2.0407005020359914e-06} +{"train_loss": 0.0003054834087379277, "global_step": 64930, "epoch": 545, "lr": 2.0400740562824928e-06} +{"train_loss": 0.00022383248142432421, "global_step": 64931, "epoch": 545, "lr": 2.0394477046931924e-06} +{"train_loss": 0.00039620159077458084, "global_step": 64932, "epoch": 545, "lr": 2.0388214472693013e-06} +{"train_loss": 0.00036133237881585956, "global_step": 64933, "epoch": 545, "lr": 2.0381952840120733e-06} +{"train_loss": 0.0002684415958356112, "global_step": 64934, "epoch": 545, "lr": 2.0375692149227243e-06} +{"train_loss": 0.0003314776695333421, "global_step": 64935, "epoch": 545, "lr": 2.0369432400024755e-06} +{"train_loss": 0.00030803121626377106, "global_step": 64936, "epoch": 545, "lr": 2.0363173592525707e-06} +{"train_loss": 0.00014619965804740787, "global_step": 64937, "epoch": 545, "lr": 2.0356915726742308e-06} +{"train_loss": 0.00023425584367942065, "global_step": 64938, "epoch": 545, "lr": 2.0350658802686883e-06} +{"train_loss": 0.00021647725952789187, "global_step": 64939, "epoch": 545, "lr": 2.0344402820371646e-06} +{"train_loss": 0.0003370091144461185, "global_step": 64940, "epoch": 545, "lr": 2.033814777980897e-06} +{"train_loss": 0.0002659967285580933, "global_step": 64941, "epoch": 545, "lr": 2.0331893681011127e-06} +{"train_loss": 0.00026202338631264865, "global_step": 64942, "epoch": 545, "lr": 2.0325640523990273e-06} +{"train_loss": 0.0003015943511854857, "global_step": 64943, "epoch": 545, "lr": 2.0319388308758846e-06} +{"train_loss": 0.00025446011568419635, "global_step": 64944, "epoch": 545, "lr": 2.0313137035329e-06} +{"train_loss": 0.0003039860166609287, "global_step": 64945, "epoch": 545, "lr": 2.030688670371317e-06} +{"train_loss": 0.0006284074042923748, "global_step": 64946, "epoch": 545, "lr": 2.03006373139234e-06} +{"train_loss": 0.00015670459833927453, "global_step": 64947, "epoch": 545, "lr": 2.0294388865972127e-06} +{"train_loss": 0.00038427303661592305, "global_step": 64948, "epoch": 545, "lr": 2.028814135987156e-06} +{"train_loss": 0.0002369727153563872, "global_step": 64949, "epoch": 545, "lr": 2.028189479563397e-06} +{"train_loss": 0.00016850276733748615, "global_step": 64950, "epoch": 545, "lr": 2.027564917327168e-06} +{"train_loss": 0.0004769404768012464, "global_step": 64951, "epoch": 545, "lr": 2.026940449279685e-06} +{"train_loss": 0.0002551190846133977, "global_step": 64952, "epoch": 545, "lr": 2.0263160754221853e-06} +{"train_loss": 0.00021852186182513833, "global_step": 64953, "epoch": 545, "lr": 2.025691795755891e-06} +{"train_loss": 0.00028888435917906463, "global_step": 64954, "epoch": 545, "lr": 2.025067610282011e-06} +{"train_loss": 0.00034816915285773575, "global_step": 64955, "epoch": 545, "lr": 2.024443519001801e-06} +{"train_loss": 0.0003443589375820011, "global_step": 64956, "epoch": 545, "lr": 2.023819521916459e-06} +{"train_loss": 0.0004006480739917606, "global_step": 64957, "epoch": 545, "lr": 2.0231956190272294e-06} +{"train_loss": 0.0003098839079029858, "global_step": 64958, "epoch": 545, "lr": 2.022571810335322e-06} +{"train_loss": 0.00023153505753725767, "global_step": 64959, "epoch": 545, "lr": 2.02194809584198e-06} +{"train_loss": 0.0002030159957939759, "global_step": 64960, "epoch": 545, "lr": 2.021324475548414e-06} +{"train_loss": 0.00025458354502916336, "global_step": 64961, "epoch": 545, "lr": 2.0207009494558447e-06} +{"train_loss": 0.0003313722263555974, "global_step": 64962, "epoch": 545, "lr": 2.0200775175655105e-06} +{"train_loss": 0.00020681957539636642, "global_step": 64963, "epoch": 545, "lr": 2.0194541798786216e-06} +{"train_loss": 0.0001891553110908717, "global_step": 64964, "epoch": 545, "lr": 2.0188309363964153e-06} +{"train_loss": 0.00016110396245494485, "global_step": 64965, "epoch": 545, "lr": 2.0182077871201076e-06} +{"train_loss": 0.00024976616259664297, "global_step": 64966, "epoch": 545, "lr": 2.01758473205092e-06} +{"train_loss": 0.00022169518342707306, "global_step": 64967, "epoch": 545, "lr": 2.016961771190079e-06} +{"train_loss": 0.00023170516942627728, "global_step": 64968, "epoch": 545, "lr": 2.016338904538806e-06} +{"train_loss": 0.0003267843567300588, "global_step": 64969, "epoch": 545, "lr": 2.0157161320983275e-06} +{"train_loss": 0.00025197883951477706, "global_step": 64970, "epoch": 545, "lr": 2.015093453869865e-06} +{"train_loss": 0.00033734290627762675, "global_step": 64971, "epoch": 545, "lr": 2.0144708698546398e-06} +{"train_loss": 0.00014994427328929305, "global_step": 64972, "epoch": 545, "lr": 2.0138483800538733e-06} +{"train_loss": 0.00029534880637324283, "global_step": 64973, "epoch": 545, "lr": 2.013225984468786e-06, "val_loss": 0.036688413470983505, "train_action_mse_error": 3.649112841230817e-06} +{"train_loss": 0.0003255708725191653, "global_step": 64974, "epoch": 546, "lr": 2.0126036831006113e-06} +{"train_loss": 0.00021438655676320195, "global_step": 64975, "epoch": 546, "lr": 2.011981475950553e-06} +{"train_loss": 0.00020873514586128294, "global_step": 64976, "epoch": 546, "lr": 2.011359363019849e-06} +{"train_loss": 0.00023344143119174987, "global_step": 64977, "epoch": 546, "lr": 2.0107373443097045e-06} +{"train_loss": 0.0002054496726486832, "global_step": 64978, "epoch": 546, "lr": 2.0101154198213625e-06} +{"train_loss": 0.0002330617280676961, "global_step": 64979, "epoch": 546, "lr": 2.009493589556022e-06} +{"train_loss": 0.0004021397908218205, "global_step": 64980, "epoch": 546, "lr": 2.008871853514921e-06} +{"train_loss": 0.00036698326584883034, "global_step": 64981, "epoch": 546, "lr": 2.0082502116992696e-06} +{"train_loss": 0.00023427788983099163, "global_step": 64982, "epoch": 546, "lr": 2.0076286641102895e-06} +{"train_loss": 0.0002293600409757346, "global_step": 64983, "epoch": 546, "lr": 2.0070072107492067e-06} +{"train_loss": 0.0002965228632092476, "global_step": 64984, "epoch": 546, "lr": 2.006385851617243e-06} +{"train_loss": 0.00033852498745545745, "global_step": 64985, "epoch": 546, "lr": 2.0057645867156027e-06} +{"train_loss": 0.00017255540296901017, "global_step": 64986, "epoch": 546, "lr": 2.0051434160455242e-06} +{"train_loss": 0.0002459055685903877, "global_step": 64987, "epoch": 546, "lr": 2.0045223396082114e-06} +{"train_loss": 0.0003093560226261616, "global_step": 64988, "epoch": 546, "lr": 2.003901357404897e-06} +{"train_loss": 0.0002930391929112375, "global_step": 64989, "epoch": 546, "lr": 2.0032804694367913e-06} +{"train_loss": 0.00027909569325856864, "global_step": 64990, "epoch": 546, "lr": 2.0026596757051264e-06} +{"train_loss": 0.0004959878278896213, "global_step": 64991, "epoch": 546, "lr": 2.002038976211107e-06} +{"train_loss": 0.00020483382104430348, "global_step": 64992, "epoch": 546, "lr": 2.0014183709559486e-06} +{"train_loss": 0.00018200030899606645, "global_step": 64993, "epoch": 546, "lr": 2.0007978599408837e-06} +{"train_loss": 0.0002655712887644768, "global_step": 64994, "epoch": 546, "lr": 2.000177443167123e-06} +{"train_loss": 0.0002130391076207161, "global_step": 64995, "epoch": 546, "lr": 1.9995571206358865e-06} +{"train_loss": 0.00044584693387150764, "global_step": 64996, "epoch": 546, "lr": 1.998936892348391e-06} +{"train_loss": 0.0001686899340711534, "global_step": 64997, "epoch": 546, "lr": 1.9983167583058513e-06} +{"train_loss": 0.00023199492716230452, "global_step": 64998, "epoch": 546, "lr": 1.997696718509495e-06} +{"train_loss": 0.000362295686500147, "global_step": 64999, "epoch": 546, "lr": 1.997076772960527e-06} +{"train_loss": 0.00016367630450986326, "global_step": 65000, "epoch": 546, "lr": 1.996456921660178e-06} +{"train_loss": 0.00018583182827569544, "global_step": 65001, "epoch": 546, "lr": 1.9958371646096487e-06} +{"train_loss": 0.00033026968594640493, "global_step": 65002, "epoch": 546, "lr": 1.9952175018101703e-06} +{"train_loss": 0.000461081275716424, "global_step": 65003, "epoch": 546, "lr": 1.9945979332629537e-06} +{"train_loss": 0.0003199419006705284, "global_step": 65004, "epoch": 546, "lr": 1.993978458969209e-06} +{"train_loss": 0.00026129442267119884, "global_step": 65005, "epoch": 546, "lr": 1.9933590789301682e-06} +{"train_loss": 0.0003222011437173933, "global_step": 65006, "epoch": 546, "lr": 1.9927397931470303e-06} +{"train_loss": 0.000460184586700052, "global_step": 65007, "epoch": 546, "lr": 1.9921206016210226e-06} +{"train_loss": 0.000155637098941952, "global_step": 65008, "epoch": 546, "lr": 1.991501504353355e-06} +{"train_loss": 0.0002511099446564913, "global_step": 65009, "epoch": 546, "lr": 1.9908825013452483e-06} +{"train_loss": 0.00038596728700213134, "global_step": 65010, "epoch": 546, "lr": 1.990263592597913e-06} +{"train_loss": 0.0004242075374349952, "global_step": 65011, "epoch": 546, "lr": 1.9896447781125647e-06} +{"train_loss": 0.00021754149929620326, "global_step": 65012, "epoch": 546, "lr": 1.9890260578904196e-06} +{"train_loss": 0.00018355440988671035, "global_step": 65013, "epoch": 546, "lr": 1.9884074319326983e-06} +{"train_loss": 0.00017064387793652713, "global_step": 65014, "epoch": 546, "lr": 1.9877889002406004e-06} +{"train_loss": 0.0001455505844205618, "global_step": 65015, "epoch": 546, "lr": 1.9871704628153577e-06} +{"train_loss": 0.0006707358988933265, "global_step": 65016, "epoch": 546, "lr": 1.986552119658175e-06} +{"train_loss": 0.00013010611291974783, "global_step": 65017, "epoch": 546, "lr": 1.9859338707702678e-06} +{"train_loss": 0.00020732864504680037, "global_step": 65018, "epoch": 546, "lr": 1.985315716152847e-06} +{"train_loss": 0.00020163373847026378, "global_step": 65019, "epoch": 546, "lr": 1.984697655807133e-06} +{"train_loss": 0.0002111667999997735, "global_step": 65020, "epoch": 546, "lr": 1.9840796897343307e-06} +{"train_loss": 0.0003000326396431774, "global_step": 65021, "epoch": 546, "lr": 1.9834618179356614e-06} +{"train_loss": 0.0004510570433922112, "global_step": 65022, "epoch": 546, "lr": 1.9828440404123348e-06} +{"train_loss": 0.00023284307098947465, "global_step": 65023, "epoch": 546, "lr": 1.982226357165562e-06} +{"train_loss": 0.00034538950421847403, "global_step": 65024, "epoch": 546, "lr": 1.9816087681965636e-06} +{"train_loss": 0.0004045938258059323, "global_step": 65025, "epoch": 546, "lr": 1.980991273506538e-06} +{"train_loss": 0.00018742137763183564, "global_step": 65026, "epoch": 546, "lr": 1.9803738730967135e-06} +{"train_loss": 0.0003322819829918444, "global_step": 65027, "epoch": 546, "lr": 1.979756566968288e-06} +{"train_loss": 0.0002354811440454796, "global_step": 65028, "epoch": 546, "lr": 1.9791393551224835e-06} +{"train_loss": 0.00029842203366570175, "global_step": 65029, "epoch": 546, "lr": 1.978522237560515e-06} +{"train_loss": 0.0001852264831541106, "global_step": 65030, "epoch": 546, "lr": 1.9779052142835763e-06} +{"train_loss": 0.00033542807796038687, "global_step": 65031, "epoch": 546, "lr": 1.9772882852928996e-06} +{"train_loss": 0.0001767432113410905, "global_step": 65032, "epoch": 546, "lr": 1.976671450589679e-06} +{"train_loss": 0.0002330001152586192, "global_step": 65033, "epoch": 546, "lr": 1.9760547101751404e-06} +{"train_loss": 0.0002780598297249526, "global_step": 65034, "epoch": 546, "lr": 1.975438064050489e-06} +{"train_loss": 0.00020308876992203295, "global_step": 65035, "epoch": 546, "lr": 1.9748215122169233e-06} +{"train_loss": 0.00011337412433931604, "global_step": 65036, "epoch": 546, "lr": 1.9742050546756765e-06} +{"train_loss": 0.00024264825333375484, "global_step": 65037, "epoch": 546, "lr": 1.9735886914279357e-06} +{"train_loss": 0.0002458901726640761, "global_step": 65038, "epoch": 546, "lr": 1.9729724224749336e-06} +{"train_loss": 0.00021744758123531938, "global_step": 65039, "epoch": 546, "lr": 1.972356247817864e-06} +{"train_loss": 0.00014126957103144377, "global_step": 65040, "epoch": 546, "lr": 1.971740167457942e-06} +{"train_loss": 0.00025398057186976075, "global_step": 65041, "epoch": 546, "lr": 1.971124181396383e-06} +{"train_loss": 0.0003488612419459969, "global_step": 65042, "epoch": 546, "lr": 1.970508289634382e-06} +{"train_loss": 0.00036532379454001784, "global_step": 65043, "epoch": 546, "lr": 1.9698924921731643e-06} +{"train_loss": 0.00020424836839083582, "global_step": 65044, "epoch": 546, "lr": 1.9692767890139243e-06} +{"train_loss": 0.0003540156758390367, "global_step": 65045, "epoch": 546, "lr": 1.968661180157877e-06} +{"train_loss": 0.00013736959954258054, "global_step": 65046, "epoch": 546, "lr": 1.9680456656062384e-06} +{"train_loss": 0.00029009795980527997, "global_step": 65047, "epoch": 546, "lr": 1.9674302453602024e-06} +{"train_loss": 0.00039750771247781813, "global_step": 65048, "epoch": 546, "lr": 1.9668149194209953e-06} +{"train_loss": 0.000320032995659858, "global_step": 65049, "epoch": 546, "lr": 1.9661996877898105e-06} +{"train_loss": 0.00044053251622244716, "global_step": 65050, "epoch": 546, "lr": 1.9655845504678637e-06} +{"train_loss": 0.0001529074797872454, "global_step": 65051, "epoch": 546, "lr": 1.9649695074563545e-06} +{"train_loss": 0.0009198124171234667, "global_step": 65052, "epoch": 546, "lr": 1.9643545587565037e-06} +{"train_loss": 0.0003029335930477828, "global_step": 65053, "epoch": 546, "lr": 1.9637397043695105e-06} +{"train_loss": 0.00018436313257552683, "global_step": 65054, "epoch": 546, "lr": 1.963124944296574e-06} +{"train_loss": 0.0006338444072753191, "global_step": 65055, "epoch": 546, "lr": 1.9625102785389205e-06} +{"train_loss": 0.0004261356370989233, "global_step": 65056, "epoch": 546, "lr": 1.9618957070977328e-06} +{"train_loss": 0.00042640595347620547, "global_step": 65057, "epoch": 546, "lr": 1.9612812299742435e-06} +{"train_loss": 0.00034253631019964814, "global_step": 65058, "epoch": 546, "lr": 1.9606668471696343e-06} +{"train_loss": 0.00045417039655148983, "global_step": 65059, "epoch": 546, "lr": 1.9600525586851325e-06} +{"train_loss": 0.0004173513734713197, "global_step": 65060, "epoch": 546, "lr": 1.959438364521937e-06} +{"train_loss": 0.0002864487178158015, "global_step": 65061, "epoch": 546, "lr": 1.958824264681247e-06} +{"train_loss": 0.0002518797409720719, "global_step": 65062, "epoch": 546, "lr": 1.9582102591642725e-06} +{"train_loss": 0.00022940013150218874, "global_step": 65063, "epoch": 546, "lr": 1.957596347972218e-06} +{"train_loss": 0.00020871599554084241, "global_step": 65064, "epoch": 546, "lr": 1.9569825311062996e-06} +{"train_loss": 0.00019506232638377696, "global_step": 65065, "epoch": 546, "lr": 1.9563688085677102e-06} +{"train_loss": 0.0002296700404258445, "global_step": 65066, "epoch": 546, "lr": 1.955755180357649e-06} +{"train_loss": 0.00026194658130407333, "global_step": 65067, "epoch": 546, "lr": 1.9551416464773376e-06} +{"train_loss": 0.0003189968119841069, "global_step": 65068, "epoch": 546, "lr": 1.954528206927969e-06} +{"train_loss": 0.0007676150999031961, "global_step": 65069, "epoch": 546, "lr": 1.9539148617107594e-06} +{"train_loss": 0.00032522191759198904, "global_step": 65070, "epoch": 546, "lr": 1.953301610826891e-06} +{"train_loss": 0.0001794087584130466, "global_step": 65071, "epoch": 546, "lr": 1.9526884542775958e-06} +{"train_loss": 0.00029417587211355567, "global_step": 65072, "epoch": 546, "lr": 1.9520753920640565e-06} +{"train_loss": 0.0002191324019804597, "global_step": 65073, "epoch": 546, "lr": 1.9514624241874835e-06} +{"train_loss": 0.00027315152692608535, "global_step": 65074, "epoch": 546, "lr": 1.9508495506490864e-06} +{"train_loss": 0.0012509083608165383, "global_step": 65075, "epoch": 546, "lr": 1.9502367714500537e-06} +{"train_loss": 0.0003400997957214713, "global_step": 65076, "epoch": 546, "lr": 1.949624086591606e-06} +{"train_loss": 0.0002572019584476948, "global_step": 65077, "epoch": 546, "lr": 1.9490114960749316e-06} +{"train_loss": 0.0002871495671570301, "global_step": 65078, "epoch": 546, "lr": 1.9483989999012466e-06} +{"train_loss": 0.0003800216654781252, "global_step": 65079, "epoch": 546, "lr": 1.947786598071738e-06} +{"train_loss": 0.0004360318125691265, "global_step": 65080, "epoch": 546, "lr": 1.947174290587622e-06} +{"train_loss": 0.0005970955826342106, "global_step": 65081, "epoch": 546, "lr": 1.946562077450098e-06} +{"train_loss": 0.00041073482134379447, "global_step": 65082, "epoch": 546, "lr": 1.945949958660359e-06} +{"train_loss": 0.0004143472178839147, "global_step": 65083, "epoch": 546, "lr": 1.945337934219621e-06} +{"train_loss": 0.0002741318312473595, "global_step": 65084, "epoch": 546, "lr": 1.9447260041290773e-06} +{"train_loss": 0.00015588865790050477, "global_step": 65085, "epoch": 546, "lr": 1.944114168389921e-06} +{"train_loss": 0.0005263724597170949, "global_step": 65086, "epoch": 546, "lr": 1.9435024270033743e-06} +{"train_loss": 0.0002742718788795173, "global_step": 65087, "epoch": 546, "lr": 1.9428907799706186e-06} +{"train_loss": 0.00023677713761571795, "global_step": 65088, "epoch": 546, "lr": 1.9422792272928648e-06} +{"train_loss": 0.00022098247427493334, "global_step": 65089, "epoch": 546, "lr": 1.9416677689713113e-06} +{"train_loss": 0.00017213910177815706, "global_step": 65090, "epoch": 546, "lr": 1.9410564050071634e-06} +{"train_loss": 0.000254573009442538, "global_step": 65091, "epoch": 546, "lr": 1.940445135401614e-06} +{"train_loss": 0.00030552490217906637, "global_step": 65092, "epoch": 546, "lr": 1.9398339601558625e-06, "val_loss": 0.038028258830308914} +{"train_loss": 0.00023883377434685826, "global_step": 65093, "epoch": 547, "lr": 1.939222879271119e-06} +{"train_loss": 0.00028960281633771956, "global_step": 65094, "epoch": 547, "lr": 1.9386118927485653e-06} +{"train_loss": 0.00017843955720309168, "global_step": 65095, "epoch": 547, "lr": 1.9380010005894233e-06} +{"train_loss": 0.00015535083366557956, "global_step": 65096, "epoch": 547, "lr": 1.937390202794881e-06} +{"train_loss": 0.00025633463519625366, "global_step": 65097, "epoch": 547, "lr": 1.936779499366137e-06} +{"train_loss": 0.00025119015481323004, "global_step": 65098, "epoch": 547, "lr": 1.936168890304391e-06} +{"train_loss": 0.0003752975317183882, "global_step": 65099, "epoch": 547, "lr": 1.935558375610841e-06} +{"train_loss": 0.0002412320172879845, "global_step": 65100, "epoch": 547, "lr": 1.9349479552866867e-06} +{"train_loss": 0.0004107857239432633, "global_step": 65101, "epoch": 547, "lr": 1.9343376293331273e-06} +{"train_loss": 0.0002721952914725989, "global_step": 65102, "epoch": 547, "lr": 1.933727397751367e-06} +{"train_loss": 0.00019988177518825978, "global_step": 65103, "epoch": 547, "lr": 1.933117260542594e-06} +{"train_loss": 0.00030029407935217023, "global_step": 65104, "epoch": 547, "lr": 1.9325072177080073e-06} +{"train_loss": 0.00022821230231784284, "global_step": 65105, "epoch": 547, "lr": 1.9318972692488115e-06} +{"train_loss": 0.00037540087942034006, "global_step": 65106, "epoch": 547, "lr": 1.931287415166194e-06} +{"train_loss": 0.00023171745124273002, "global_step": 65107, "epoch": 547, "lr": 1.930677655461366e-06} +{"train_loss": 0.0002837012871168554, "global_step": 65108, "epoch": 547, "lr": 1.930067990135509e-06} +{"train_loss": 0.0003484408080112189, "global_step": 65109, "epoch": 547, "lr": 1.9294584191898336e-06} +{"train_loss": 0.00021579016174655408, "global_step": 65110, "epoch": 547, "lr": 1.9288489426255274e-06} +{"train_loss": 0.0004206899320706725, "global_step": 65111, "epoch": 547, "lr": 1.9282395604437952e-06} +{"train_loss": 0.00018783989071380347, "global_step": 65112, "epoch": 547, "lr": 1.927630272645825e-06} +{"train_loss": 0.00014719073078595102, "global_step": 65113, "epoch": 547, "lr": 1.9270210792328212e-06} +{"train_loss": 0.0003052188258152455, "global_step": 65114, "epoch": 547, "lr": 1.926411980205967e-06} +{"train_loss": 0.00025450956309214234, "global_step": 65115, "epoch": 547, "lr": 1.9258029755664763e-06} +{"train_loss": 0.0006426401669159532, "global_step": 65116, "epoch": 547, "lr": 1.9251940653155276e-06} +{"train_loss": 0.0003461475425865501, "global_step": 65117, "epoch": 547, "lr": 1.924585249454336e-06} +{"train_loss": 0.00016222357226070017, "global_step": 65118, "epoch": 547, "lr": 1.9239765279840725e-06} +{"train_loss": 0.0002582323213573545, "global_step": 65119, "epoch": 547, "lr": 1.9233679009059535e-06} +{"train_loss": 0.0003819205448962748, "global_step": 65120, "epoch": 547, "lr": 1.9227593682211608e-06} +{"train_loss": 0.00037634011823683977, "global_step": 65121, "epoch": 547, "lr": 1.9221509299308936e-06} +{"train_loss": 0.00018567961524240673, "global_step": 65122, "epoch": 547, "lr": 1.921542586036351e-06} +{"train_loss": 0.00022100105707067996, "global_step": 65123, "epoch": 547, "lr": 1.920934336538721e-06} +{"train_loss": 0.00026175385573878884, "global_step": 65124, "epoch": 547, "lr": 1.9203261814392027e-06} +{"train_loss": 0.0006649267161265016, "global_step": 65125, "epoch": 547, "lr": 1.919718120738978e-06} +{"train_loss": 0.00024167758238036186, "global_step": 65126, "epoch": 547, "lr": 1.9191101544392575e-06} +{"train_loss": 0.0004066159890498966, "global_step": 65127, "epoch": 547, "lr": 1.9185022825412235e-06} +{"train_loss": 0.0002692266716621816, "global_step": 65128, "epoch": 547, "lr": 1.9178945050460805e-06} +{"train_loss": 0.00022609626466874033, "global_step": 65129, "epoch": 547, "lr": 1.9172868219550167e-06} +{"train_loss": 0.0002176412963308394, "global_step": 65130, "epoch": 547, "lr": 1.9166792332692084e-06} +{"train_loss": 0.000198720779735595, "global_step": 65131, "epoch": 547, "lr": 1.9160717389898774e-06} +{"train_loss": 0.0003361054405104369, "global_step": 65132, "epoch": 547, "lr": 1.9154643391181946e-06} +{"train_loss": 0.00032662859302945435, "global_step": 65133, "epoch": 547, "lr": 1.914857033655365e-06} +{"train_loss": 0.0003343589196447283, "global_step": 65134, "epoch": 547, "lr": 1.9142498226025817e-06} +{"train_loss": 0.00026588619221001863, "global_step": 65135, "epoch": 547, "lr": 1.913642705961016e-06} +{"train_loss": 0.00025459431344643235, "global_step": 65136, "epoch": 547, "lr": 1.9130356837318895e-06} +{"train_loss": 0.00021679920610040426, "global_step": 65137, "epoch": 547, "lr": 1.9124287559163735e-06} +{"train_loss": 0.0002575984108261764, "global_step": 65138, "epoch": 547, "lr": 1.911821922515672e-06} +{"train_loss": 0.0004343949258327484, "global_step": 65139, "epoch": 547, "lr": 1.9112151835309623e-06} +{"train_loss": 0.0004750022490043193, "global_step": 65140, "epoch": 547, "lr": 1.9106085389634485e-06} +{"train_loss": 0.00022280316625256091, "global_step": 65141, "epoch": 547, "lr": 1.9100019888143196e-06} +{"train_loss": 0.00031209990265779197, "global_step": 65142, "epoch": 547, "lr": 1.9093955330847567e-06} +{"train_loss": 0.0002683595521375537, "global_step": 65143, "epoch": 547, "lr": 1.9087891717759597e-06} +{"train_loss": 0.00038954205228947103, "global_step": 65144, "epoch": 547, "lr": 1.9081829048891276e-06} +{"train_loss": 0.00016524139209650457, "global_step": 65145, "epoch": 547, "lr": 1.9075767324254257e-06} +{"train_loss": 0.00029256759444251657, "global_step": 65146, "epoch": 547, "lr": 1.90697065438607e-06} +{"train_loss": 0.00021317369828466326, "global_step": 65147, "epoch": 547, "lr": 1.9063646707722315e-06} +{"train_loss": 0.0001237889373442158, "global_step": 65148, "epoch": 547, "lr": 1.9057587815851152e-06} +{"train_loss": 0.0009458850836381316, "global_step": 65149, "epoch": 547, "lr": 1.9051529868258977e-06} +{"train_loss": 0.00016176495410036296, "global_step": 65150, "epoch": 547, "lr": 1.9045472864957836e-06} +{"train_loss": 0.00028081642813049257, "global_step": 65151, "epoch": 547, "lr": 1.9039416805959386e-06} +{"train_loss": 0.0005997818661853671, "global_step": 65152, "epoch": 547, "lr": 1.9033361691275787e-06} +{"train_loss": 0.0002557383559178561, "global_step": 65153, "epoch": 547, "lr": 1.9027307520918747e-06} +{"train_loss": 0.0002163752942578867, "global_step": 65154, "epoch": 547, "lr": 1.9021254294900204e-06} +{"train_loss": 0.0001882393262349069, "global_step": 65155, "epoch": 547, "lr": 1.9015202013232037e-06} +{"train_loss": 0.000276459933957085, "global_step": 65156, "epoch": 547, "lr": 1.9009150675926124e-06} +{"train_loss": 0.00034421816235408187, "global_step": 65157, "epoch": 547, "lr": 1.9003100282994401e-06} +{"train_loss": 0.00016672776837367564, "global_step": 65158, "epoch": 547, "lr": 1.8997050834448637e-06} +{"train_loss": 0.00029359894688241184, "global_step": 65159, "epoch": 547, "lr": 1.8991002330300877e-06} +{"train_loss": 0.0003564660728443414, "global_step": 65160, "epoch": 547, "lr": 1.8984954770562836e-06} +{"train_loss": 0.0003655561013147235, "global_step": 65161, "epoch": 547, "lr": 1.897890815524639e-06} +{"train_loss": 0.00019402058387640864, "global_step": 65162, "epoch": 547, "lr": 1.8972862484363585e-06} +{"train_loss": 0.0002177284623030573, "global_step": 65163, "epoch": 547, "lr": 1.8966817757926082e-06} +{"train_loss": 0.00023491907631978393, "global_step": 65164, "epoch": 547, "lr": 1.8960773975945866e-06} +{"train_loss": 0.0002902522392105311, "global_step": 65165, "epoch": 547, "lr": 1.8954731138434823e-06} +{"train_loss": 0.00031082346686162055, "global_step": 65166, "epoch": 547, "lr": 1.8948689245404716e-06} +{"train_loss": 0.00043455915874801576, "global_step": 65167, "epoch": 547, "lr": 1.8942648296867483e-06} +{"train_loss": 0.00016639336536172777, "global_step": 65168, "epoch": 547, "lr": 1.8936608292834946e-06} +{"train_loss": 0.00023010713630355895, "global_step": 65169, "epoch": 547, "lr": 1.893056923331904e-06} +{"train_loss": 0.0004196859081275761, "global_step": 65170, "epoch": 547, "lr": 1.8924531118331534e-06} +{"train_loss": 0.0004003935609944165, "global_step": 65171, "epoch": 547, "lr": 1.8918493947884308e-06} +{"train_loss": 0.00022751629876438528, "global_step": 65172, "epoch": 547, "lr": 1.891245772198924e-06} +{"train_loss": 0.00028407954960130155, "global_step": 65173, "epoch": 547, "lr": 1.8906422440658156e-06} +{"train_loss": 0.00016198433877434582, "global_step": 65174, "epoch": 547, "lr": 1.8900388103902934e-06} +{"train_loss": 0.0002906274748966098, "global_step": 65175, "epoch": 547, "lr": 1.889435471173534e-06} +{"train_loss": 0.0003398989501874894, "global_step": 65176, "epoch": 547, "lr": 1.8888322264167369e-06} +{"train_loss": 0.0002593832032289356, "global_step": 65177, "epoch": 547, "lr": 1.8882290761210675e-06} +{"train_loss": 0.00021418806863948703, "global_step": 65178, "epoch": 547, "lr": 1.887626020287725e-06} +{"train_loss": 0.00020497074001468718, "global_step": 65179, "epoch": 547, "lr": 1.8870230589178916e-06} +{"train_loss": 0.00034905964275822043, "global_step": 65180, "epoch": 547, "lr": 1.8864201920127445e-06} +{"train_loss": 0.00036501380964182317, "global_step": 65181, "epoch": 547, "lr": 1.8858174195734769e-06} +{"train_loss": 0.000215872612898238, "global_step": 65182, "epoch": 547, "lr": 1.8852147416012544e-06} +{"train_loss": 0.0002068789763143286, "global_step": 65183, "epoch": 547, "lr": 1.8846121580972874e-06} +{"train_loss": 0.0002483423741068691, "global_step": 65184, "epoch": 547, "lr": 1.8840096690627418e-06} +{"train_loss": 0.0004808332596439868, "global_step": 65185, "epoch": 547, "lr": 1.8834072744987942e-06} +{"train_loss": 0.00021488411584869027, "global_step": 65186, "epoch": 547, "lr": 1.8828049744066434e-06} +{"train_loss": 0.0005318205221556127, "global_step": 65187, "epoch": 547, "lr": 1.8822027687874554e-06} +{"train_loss": 0.0003162759530823678, "global_step": 65188, "epoch": 547, "lr": 1.8816006576424295e-06} +{"train_loss": 0.0002037880040006712, "global_step": 65189, "epoch": 547, "lr": 1.8809986409727365e-06} +{"train_loss": 0.0002725796075537801, "global_step": 65190, "epoch": 547, "lr": 1.8803967187795646e-06} +{"train_loss": 0.0003350936167407781, "global_step": 65191, "epoch": 547, "lr": 1.879794891064096e-06} +{"train_loss": 0.00013899497571401298, "global_step": 65192, "epoch": 547, "lr": 1.8791931578275025e-06} +{"train_loss": 0.0002825126575771719, "global_step": 65193, "epoch": 547, "lr": 1.8785915190709769e-06} +{"train_loss": 0.0003985098737757653, "global_step": 65194, "epoch": 547, "lr": 1.8779899747956908e-06} +{"train_loss": 0.00019236752996221185, "global_step": 65195, "epoch": 547, "lr": 1.8773885250028378e-06} +{"train_loss": 0.00036679088952951133, "global_step": 65196, "epoch": 547, "lr": 1.876787169693578e-06} +{"train_loss": 0.00024058880808297545, "global_step": 65197, "epoch": 547, "lr": 1.8761859088691213e-06} +{"train_loss": 0.0002009486051974818, "global_step": 65198, "epoch": 547, "lr": 1.8755847425306282e-06} +{"train_loss": 0.00045688412501476705, "global_step": 65199, "epoch": 547, "lr": 1.8749836706792756e-06} +{"train_loss": 0.00035355554427951574, "global_step": 65200, "epoch": 547, "lr": 1.8743826933162567e-06} +{"train_loss": 0.00032950699096545577, "global_step": 65201, "epoch": 547, "lr": 1.8737818104427429e-06} +{"train_loss": 0.0002252821868751198, "global_step": 65202, "epoch": 547, "lr": 1.8731810220599222e-06} +{"train_loss": 0.0002800453803502023, "global_step": 65203, "epoch": 547, "lr": 1.8725803281689658e-06} +{"train_loss": 0.0001701911969576031, "global_step": 65204, "epoch": 547, "lr": 1.8719797287710562e-06} +{"train_loss": 0.00019671994959935546, "global_step": 65205, "epoch": 547, "lr": 1.8713792238673756e-06} +{"train_loss": 0.000214297222555615, "global_step": 65206, "epoch": 547, "lr": 1.8707788134590898e-06} +{"train_loss": 0.0005656989524140954, "global_step": 65207, "epoch": 547, "lr": 1.870178497547398e-06} +{"train_loss": 0.0001975017657969147, "global_step": 65208, "epoch": 547, "lr": 1.8695782761334657e-06} +{"train_loss": 0.0007524846005253494, "global_step": 65209, "epoch": 547, "lr": 1.8689781492184755e-06} +{"train_loss": 0.00042521749855950475, "global_step": 65210, "epoch": 547, "lr": 1.868378116803604e-06} +{"train_loss": 0.00029764708230358024, "global_step": 65211, "epoch": 547, "lr": 1.8677781788900283e-06, "val_loss": 0.022824738174676895} +{"train_loss": 0.00022685436124447733, "global_step": 65212, "epoch": 548, "lr": 1.8671783354789308e-06} +{"train_loss": 0.0001807907538022846, "global_step": 65213, "epoch": 548, "lr": 1.866578586571477e-06} +{"train_loss": 0.0003103524795733392, "global_step": 65214, "epoch": 548, "lr": 1.8659789321688658e-06} +{"train_loss": 0.00024076428962871432, "global_step": 65215, "epoch": 548, "lr": 1.8653793722722634e-06} +{"train_loss": 0.0005247661611065269, "global_step": 65216, "epoch": 548, "lr": 1.864779906882841e-06} +{"train_loss": 0.0003443924942985177, "global_step": 65217, "epoch": 548, "lr": 1.8641805360017805e-06} +{"train_loss": 0.00020125883747823536, "global_step": 65218, "epoch": 548, "lr": 1.8635812596302594e-06} +{"train_loss": 0.0006014270475134254, "global_step": 65219, "epoch": 548, "lr": 1.862982077769454e-06} +{"train_loss": 0.00015285800327546895, "global_step": 65220, "epoch": 548, "lr": 1.8623829904205413e-06} +{"train_loss": 0.00040664724656380713, "global_step": 65221, "epoch": 548, "lr": 1.8617839975846984e-06} +{"train_loss": 0.000654147588647902, "global_step": 65222, "epoch": 548, "lr": 1.861185099263102e-06} +{"train_loss": 0.00019887193047907203, "global_step": 65223, "epoch": 548, "lr": 1.8605862954569175e-06} +{"train_loss": 0.00021538622968364507, "global_step": 65224, "epoch": 548, "lr": 1.8599875861673333e-06} +{"train_loss": 0.00027645615045912564, "global_step": 65225, "epoch": 548, "lr": 1.8593889713955204e-06} +{"train_loss": 0.00029687891947105527, "global_step": 65226, "epoch": 548, "lr": 1.8587904511426557e-06} +{"train_loss": 0.0004308583738747984, "global_step": 65227, "epoch": 548, "lr": 1.858192025409905e-06} +{"train_loss": 0.00015382780111394823, "global_step": 65228, "epoch": 548, "lr": 1.8575936941984617e-06} +{"train_loss": 0.00023402684018947184, "global_step": 65229, "epoch": 548, "lr": 1.8569954575094862e-06} +{"train_loss": 0.00021740118972957134, "global_step": 65230, "epoch": 548, "lr": 1.856397315344155e-06} +{"train_loss": 0.0002939683326985687, "global_step": 65231, "epoch": 548, "lr": 1.8557992677036452e-06} +{"train_loss": 0.00027075555408373475, "global_step": 65232, "epoch": 548, "lr": 1.8552013145891279e-06} +{"train_loss": 0.00022855232236906886, "global_step": 65233, "epoch": 548, "lr": 1.8546034560017856e-06} +{"train_loss": 0.0002642898471094668, "global_step": 65234, "epoch": 548, "lr": 1.854005691942784e-06} +{"train_loss": 0.0005091638886369765, "global_step": 65235, "epoch": 548, "lr": 1.8534080224132943e-06} +{"train_loss": 0.000196635999600403, "global_step": 65236, "epoch": 548, "lr": 1.8528104474144991e-06} +{"train_loss": 0.00043440418085083365, "global_step": 65237, "epoch": 548, "lr": 1.8522129669475584e-06} +{"train_loss": 0.00043951824773103, "global_step": 65238, "epoch": 548, "lr": 1.8516155810136659e-06} +{"train_loss": 0.0005152227822691202, "global_step": 65239, "epoch": 548, "lr": 1.8510182896139705e-06} +{"train_loss": 0.0005246727378107607, "global_step": 65240, "epoch": 548, "lr": 1.8504210927496656e-06} +{"train_loss": 0.0003359023539815098, "global_step": 65241, "epoch": 548, "lr": 1.849823990421906e-06} +{"train_loss": 0.00044637679820880294, "global_step": 65242, "epoch": 548, "lr": 1.8492269826318854e-06} +{"train_loss": 0.00017899434897117317, "global_step": 65243, "epoch": 548, "lr": 1.8486300693807524e-06} +{"train_loss": 0.0003051568928640336, "global_step": 65244, "epoch": 548, "lr": 1.8480332506696952e-06} +{"train_loss": 0.00020877463975921273, "global_step": 65245, "epoch": 548, "lr": 1.8474365264998738e-06} +{"train_loss": 0.0003180726198479533, "global_step": 65246, "epoch": 548, "lr": 1.8468398968724765e-06} +{"train_loss": 0.000167238074936904, "global_step": 65247, "epoch": 548, "lr": 1.8462433617886576e-06} +{"train_loss": 0.00016457904712297022, "global_step": 65248, "epoch": 548, "lr": 1.8456469212495997e-06} +{"train_loss": 0.00028734811348840594, "global_step": 65249, "epoch": 548, "lr": 1.8450505752564628e-06} +{"train_loss": 0.00031679923995397985, "global_step": 65250, "epoch": 548, "lr": 1.844454323810435e-06} +{"train_loss": 0.00031574099557474256, "global_step": 65251, "epoch": 548, "lr": 1.8438581669126654e-06} +{"train_loss": 0.00020356343884486705, "global_step": 65252, "epoch": 548, "lr": 1.8432621045643416e-06} +{"train_loss": 0.0003125186776742339, "global_step": 65253, "epoch": 548, "lr": 1.8426661367666298e-06} +{"train_loss": 0.00018505750631447881, "global_step": 65254, "epoch": 548, "lr": 1.8420702635206954e-06} +{"train_loss": 0.0001435996382497251, "global_step": 65255, "epoch": 548, "lr": 1.8414744848277154e-06} +{"train_loss": 0.0003867889172397554, "global_step": 65256, "epoch": 548, "lr": 1.8408788006888445e-06} +{"train_loss": 0.00026518836966715753, "global_step": 65257, "epoch": 548, "lr": 1.840283211105276e-06} +{"train_loss": 0.0003950672107748687, "global_step": 65258, "epoch": 548, "lr": 1.8396877160781535e-06} +{"train_loss": 0.00020157211110927165, "global_step": 65259, "epoch": 548, "lr": 1.8390923156086703e-06} +{"train_loss": 0.00018966906645800918, "global_step": 65260, "epoch": 548, "lr": 1.8384970096979815e-06} +{"train_loss": 0.00019650773901958019, "global_step": 65261, "epoch": 548, "lr": 1.8379017983472524e-06} +{"train_loss": 0.0002980755816679448, "global_step": 65262, "epoch": 548, "lr": 1.8373066815576657e-06} +{"train_loss": 0.0001761471648933366, "global_step": 65263, "epoch": 548, "lr": 1.8367116593303756e-06} +{"train_loss": 0.00025523907970637083, "global_step": 65264, "epoch": 548, "lr": 1.8361167316665596e-06} +{"train_loss": 0.00015557731967419386, "global_step": 65265, "epoch": 548, "lr": 1.8355218985673773e-06} +{"train_loss": 0.0006599261541850865, "global_step": 65266, "epoch": 548, "lr": 1.8349271600340112e-06} +{"train_loss": 0.0002242462505819276, "global_step": 65267, "epoch": 548, "lr": 1.834332516067616e-06} +{"train_loss": 0.00018353793711867183, "global_step": 65268, "epoch": 548, "lr": 1.8337379666693633e-06} +{"train_loss": 0.0005585543694905937, "global_step": 65269, "epoch": 548, "lr": 1.8331435118404238e-06} +{"train_loss": 0.0001365470525342971, "global_step": 65270, "epoch": 548, "lr": 1.8325491515819526e-06} +{"train_loss": 0.0002295989979756996, "global_step": 65271, "epoch": 548, "lr": 1.8319548858951318e-06} +{"train_loss": 0.00029182175057940185, "global_step": 65272, "epoch": 548, "lr": 1.8313607147811219e-06} +{"train_loss": 0.0003816882090177387, "global_step": 65273, "epoch": 548, "lr": 1.8307666382410827e-06} +{"train_loss": 0.0003182203508913517, "global_step": 65274, "epoch": 548, "lr": 1.8301726562761967e-06} +{"train_loss": 0.0002701212069950998, "global_step": 65275, "epoch": 548, "lr": 1.8295787688876131e-06} +{"train_loss": 0.00019665622676257044, "global_step": 65276, "epoch": 548, "lr": 1.8289849760765033e-06} +{"train_loss": 0.00017942136037163436, "global_step": 65277, "epoch": 548, "lr": 1.8283912778440382e-06} +{"train_loss": 0.0003777264792006463, "global_step": 65278, "epoch": 548, "lr": 1.8277976741913783e-06} +{"train_loss": 0.0003329195606056601, "global_step": 65279, "epoch": 548, "lr": 1.8272041651197002e-06} +{"train_loss": 0.00019587358110584319, "global_step": 65280, "epoch": 548, "lr": 1.8266107506301477e-06} +{"train_loss": 0.0004198963288217783, "global_step": 65281, "epoch": 548, "lr": 1.8260174307239085e-06} +{"train_loss": 0.0002845442795660347, "global_step": 65282, "epoch": 548, "lr": 1.825424205402132e-06} +{"train_loss": 0.00041763726039789617, "global_step": 65283, "epoch": 548, "lr": 1.8248310746659946e-06} +{"train_loss": 0.00020235693955328315, "global_step": 65284, "epoch": 548, "lr": 1.8242380385166513e-06} +{"train_loss": 0.0004681013524532318, "global_step": 65285, "epoch": 548, "lr": 1.8236450969552676e-06} +{"train_loss": 0.00023900375526864082, "global_step": 65286, "epoch": 548, "lr": 1.8230522499830148e-06} +{"train_loss": 0.00029996305238455534, "global_step": 65287, "epoch": 548, "lr": 1.8224594976010424e-06} +{"train_loss": 0.0003859105345327407, "global_step": 65288, "epoch": 548, "lr": 1.8218668398105321e-06} +{"train_loss": 0.00021204243239481002, "global_step": 65289, "epoch": 548, "lr": 1.8212742766126334e-06} +{"train_loss": 0.00018964431365020573, "global_step": 65290, "epoch": 548, "lr": 1.8206818080085231e-06} +{"train_loss": 0.00038590209442190826, "global_step": 65291, "epoch": 548, "lr": 1.8200894339993558e-06} +{"train_loss": 0.00024301852681674063, "global_step": 65292, "epoch": 548, "lr": 1.8194971545862916e-06} +{"train_loss": 0.00027297623455524445, "global_step": 65293, "epoch": 548, "lr": 1.8189049697705018e-06} +{"train_loss": 0.00029213493689894676, "global_step": 65294, "epoch": 548, "lr": 1.8183128795531356e-06} +{"train_loss": 0.00044617944513447583, "global_step": 65295, "epoch": 548, "lr": 1.8177208839353753e-06} +{"train_loss": 0.000646972912363708, "global_step": 65296, "epoch": 548, "lr": 1.817128982918359e-06} +{"train_loss": 0.00036132437526248395, "global_step": 65297, "epoch": 548, "lr": 1.8165371765032746e-06} +{"train_loss": 0.00022370652004610747, "global_step": 65298, "epoch": 548, "lr": 1.815945464691271e-06} +{"train_loss": 0.00036405029823072255, "global_step": 65299, "epoch": 548, "lr": 1.8153538474835086e-06} +{"train_loss": 0.0002402173267910257, "global_step": 65300, "epoch": 548, "lr": 1.814762324881153e-06} +{"train_loss": 0.00024339332594536245, "global_step": 65301, "epoch": 548, "lr": 1.8141708968853532e-06} +{"train_loss": 0.0005131912766955793, "global_step": 65302, "epoch": 548, "lr": 1.813579563497292e-06} +{"train_loss": 0.00027585605857893825, "global_step": 65303, "epoch": 548, "lr": 1.8129883247181235e-06} +{"train_loss": 0.0002517091343179345, "global_step": 65304, "epoch": 548, "lr": 1.8123971805489914e-06} +{"train_loss": 0.00022874155547469854, "global_step": 65305, "epoch": 548, "lr": 1.8118061309910783e-06} +{"train_loss": 0.00023291466641239822, "global_step": 65306, "epoch": 548, "lr": 1.8112151760455275e-06} +{"train_loss": 0.0005077581736259162, "global_step": 65307, "epoch": 548, "lr": 1.810624315713516e-06} +{"train_loss": 0.000393727415939793, "global_step": 65308, "epoch": 548, "lr": 1.8100335499961873e-06} +{"train_loss": 0.0004102169186808169, "global_step": 65309, "epoch": 548, "lr": 1.8094428788947182e-06} +{"train_loss": 0.00034623840474523604, "global_step": 65310, "epoch": 548, "lr": 1.808852302410252e-06} +{"train_loss": 0.00038841625791974366, "global_step": 65311, "epoch": 548, "lr": 1.808261820543955e-06} +{"train_loss": 0.0001194505239254795, "global_step": 65312, "epoch": 548, "lr": 1.807671433296998e-06} +{"train_loss": 0.00033676219754852355, "global_step": 65313, "epoch": 548, "lr": 1.8070811406705191e-06} +{"train_loss": 0.00020391664293128997, "global_step": 65314, "epoch": 548, "lr": 1.806490942665695e-06} +{"train_loss": 0.0001900012866826728, "global_step": 65315, "epoch": 548, "lr": 1.8059008392836696e-06} +{"train_loss": 0.00012891454389318824, "global_step": 65316, "epoch": 548, "lr": 1.8053108305256138e-06} +{"train_loss": 0.00024704422685317695, "global_step": 65317, "epoch": 548, "lr": 1.8047209163926882e-06} +{"train_loss": 0.00022883506608195603, "global_step": 65318, "epoch": 548, "lr": 1.8041310968860303e-06} +{"train_loss": 0.00034386824700050056, "global_step": 65319, "epoch": 548, "lr": 1.8035413720068228e-06} +{"train_loss": 0.00030558131402358413, "global_step": 65320, "epoch": 548, "lr": 1.8029517417562036e-06} +{"train_loss": 0.0002146088081644848, "global_step": 65321, "epoch": 548, "lr": 1.8023622061353495e-06} +{"train_loss": 0.00021296535851433873, "global_step": 65322, "epoch": 548, "lr": 1.8017727651454043e-06} +{"train_loss": 0.0002633579424582422, "global_step": 65323, "epoch": 548, "lr": 1.8011834187875276e-06} +{"train_loss": 0.00028988427948206663, "global_step": 65324, "epoch": 548, "lr": 1.80059416706288e-06} +{"train_loss": 0.0003565738152246922, "global_step": 65325, "epoch": 548, "lr": 1.8000050099726106e-06} +{"train_loss": 0.0002462874981574714, "global_step": 65326, "epoch": 548, "lr": 1.7994159475178906e-06} +{"train_loss": 0.00013899458281230181, "global_step": 65327, "epoch": 548, "lr": 1.798826979699858e-06} +{"train_loss": 0.00022463880304712802, "global_step": 65328, "epoch": 548, "lr": 1.7982381065196896e-06} +{"train_loss": 0.0003194480377715081, "global_step": 65329, "epoch": 548, "lr": 1.797649327978529e-06} +{"train_loss": 0.00029755310181620286, "global_step": 65330, "epoch": 548, "lr": 1.797060644077525e-06, "val_loss": 0.030662626028060913} +{"train_loss": 0.0002022573462454602, "global_step": 65331, "epoch": 549, "lr": 1.796472054817855e-06} +{"train_loss": 0.00020805025997105986, "global_step": 65332, "epoch": 549, "lr": 1.7958835602006508e-06} +{"train_loss": 0.0002916470111813396, "global_step": 65333, "epoch": 549, "lr": 1.7952951602270895e-06} +{"train_loss": 0.0002041737170657143, "global_step": 65334, "epoch": 549, "lr": 1.7947068548983092e-06} +{"train_loss": 0.00022679641551803797, "global_step": 65335, "epoch": 549, "lr": 1.7941186442154756e-06} +{"train_loss": 0.00029895215993747115, "global_step": 65336, "epoch": 549, "lr": 1.7935305281797432e-06} +{"train_loss": 0.0006129152025096118, "global_step": 65337, "epoch": 549, "lr": 1.7929425067922556e-06} +{"train_loss": 0.0002804886025842279, "global_step": 65338, "epoch": 549, "lr": 1.7923545800541785e-06} +{"train_loss": 0.0003101724723819643, "global_step": 65339, "epoch": 549, "lr": 1.791766747966661e-06} +{"train_loss": 0.0002488122845534235, "global_step": 65340, "epoch": 549, "lr": 1.7911790105308635e-06} +{"train_loss": 0.0006470255902968347, "global_step": 65341, "epoch": 549, "lr": 1.7905913677479292e-06} +{"train_loss": 0.0005007351282984018, "global_step": 65342, "epoch": 549, "lr": 1.7900038196190295e-06} +{"train_loss": 0.00034976931056007743, "global_step": 65343, "epoch": 549, "lr": 1.7894163661452967e-06} +{"train_loss": 0.0002911037881858647, "global_step": 65344, "epoch": 549, "lr": 1.7888290073278968e-06} +{"train_loss": 0.0002820666995830834, "global_step": 65345, "epoch": 549, "lr": 1.7882417431679787e-06} +{"train_loss": 0.00020216057600919157, "global_step": 65346, "epoch": 549, "lr": 1.7876545736666972e-06} +{"train_loss": 0.00012767419684678316, "global_step": 65347, "epoch": 549, "lr": 1.7870674988252124e-06} +{"train_loss": 0.000568968418519944, "global_step": 65348, "epoch": 549, "lr": 1.7864805186446677e-06} +{"train_loss": 0.00035037717316299677, "global_step": 65349, "epoch": 549, "lr": 1.7858936331262122e-06} +{"train_loss": 0.0003013386740349233, "global_step": 65350, "epoch": 549, "lr": 1.7853068422710062e-06} +{"train_loss": 0.00020206136105116457, "global_step": 65351, "epoch": 549, "lr": 1.7847201460801988e-06} +{"train_loss": 0.00014668387302663177, "global_step": 65352, "epoch": 549, "lr": 1.7841335445549446e-06} +{"train_loss": 0.00026327912928536534, "global_step": 65353, "epoch": 549, "lr": 1.783547037696398e-06} +{"train_loss": 0.00021584867499768734, "global_step": 65354, "epoch": 549, "lr": 1.7829606255056974e-06} +{"train_loss": 0.0006699503865092993, "global_step": 65355, "epoch": 549, "lr": 1.7823743079840028e-06} +{"train_loss": 0.00024041146389208734, "global_step": 65356, "epoch": 549, "lr": 1.7817880851324632e-06} +{"train_loss": 0.0003103723283857107, "global_step": 65357, "epoch": 549, "lr": 1.7812019569522388e-06} +{"train_loss": 0.0002744774392340332, "global_step": 65358, "epoch": 549, "lr": 1.7806159234444674e-06} +{"train_loss": 0.0002664824132807553, "global_step": 65359, "epoch": 549, "lr": 1.7800299846103097e-06} +{"train_loss": 0.00018967616779264063, "global_step": 65360, "epoch": 549, "lr": 1.7794441404509088e-06} +{"train_loss": 0.0002517539251130074, "global_step": 65361, "epoch": 549, "lr": 1.778858390967414e-06} +{"train_loss": 0.00035135741927661, "global_step": 65362, "epoch": 549, "lr": 1.7782727361609851e-06} +{"train_loss": 0.0002530018682591617, "global_step": 65363, "epoch": 549, "lr": 1.7776871760327607e-06} +{"train_loss": 0.0002598875144030899, "global_step": 65364, "epoch": 549, "lr": 1.7771017105839004e-06} +{"train_loss": 0.00019433630222920328, "global_step": 65365, "epoch": 549, "lr": 1.7765163398155427e-06} +{"train_loss": 0.00019046044326387346, "global_step": 65366, "epoch": 549, "lr": 1.775931063728853e-06} +{"train_loss": 0.00023763476929161698, "global_step": 65367, "epoch": 549, "lr": 1.775345882324969e-06} +{"train_loss": 0.0002363335370318964, "global_step": 65368, "epoch": 549, "lr": 1.774760795605035e-06} +{"train_loss": 0.0002575540856923908, "global_step": 65369, "epoch": 549, "lr": 1.7741758035702106e-06} +{"train_loss": 0.0002845028939191252, "global_step": 65370, "epoch": 549, "lr": 1.7735909062216339e-06} +{"train_loss": 0.00035061241942457855, "global_step": 65371, "epoch": 549, "lr": 1.773006103560465e-06} +{"train_loss": 0.0004071044095326215, "global_step": 65372, "epoch": 549, "lr": 1.772421395587842e-06} +{"train_loss": 0.0003498271689750254, "global_step": 65373, "epoch": 549, "lr": 1.7718367823049197e-06} +{"train_loss": 0.00014371611177921295, "global_step": 65374, "epoch": 549, "lr": 1.7712522637128416e-06} +{"train_loss": 0.00013919491902925074, "global_step": 65375, "epoch": 549, "lr": 1.770667839812762e-06} +{"train_loss": 0.00040076495497487485, "global_step": 65376, "epoch": 549, "lr": 1.7700835106058188e-06} +{"train_loss": 0.00018499082943890244, "global_step": 65377, "epoch": 549, "lr": 1.7694992760931671e-06} +{"train_loss": 0.0005399399669840932, "global_step": 65378, "epoch": 549, "lr": 1.7689151362759449e-06} +{"train_loss": 0.00022245579748414457, "global_step": 65379, "epoch": 549, "lr": 1.7683310911553118e-06} +{"train_loss": 0.00047438699402846396, "global_step": 65380, "epoch": 549, "lr": 1.7677471407324065e-06} +{"train_loss": 0.00022106808319222182, "global_step": 65381, "epoch": 549, "lr": 1.7671632850083775e-06} +{"train_loss": 0.0002630584640428424, "global_step": 65382, "epoch": 549, "lr": 1.7665795239843686e-06} +{"train_loss": 0.00035704413312487304, "global_step": 65383, "epoch": 549, "lr": 1.7659958576615287e-06} +{"train_loss": 0.0001452706492273137, "global_step": 65384, "epoch": 549, "lr": 1.7654122860410016e-06} +{"train_loss": 0.00023118534591048956, "global_step": 65385, "epoch": 549, "lr": 1.7648288091239362e-06} +{"train_loss": 0.0002995668910443783, "global_step": 65386, "epoch": 549, "lr": 1.764245426911476e-06} +{"train_loss": 0.00027590504032559693, "global_step": 65387, "epoch": 549, "lr": 1.7636621394047648e-06} +{"train_loss": 0.0003185922687407583, "global_step": 65388, "epoch": 549, "lr": 1.7630789466049513e-06} +{"train_loss": 0.00036471334169618785, "global_step": 65389, "epoch": 549, "lr": 1.7624958485131792e-06} +{"train_loss": 0.0002031304029515013, "global_step": 65390, "epoch": 549, "lr": 1.7619128451305923e-06} +{"train_loss": 0.00015991248073987663, "global_step": 65391, "epoch": 549, "lr": 1.7613299364583392e-06} +{"train_loss": 0.00016700620471965522, "global_step": 65392, "epoch": 549, "lr": 1.760747122497558e-06} +{"train_loss": 0.0004292883677408099, "global_step": 65393, "epoch": 549, "lr": 1.760164403249398e-06} +{"train_loss": 0.000206826749490574, "global_step": 65394, "epoch": 549, "lr": 1.759581778714997e-06} +{"train_loss": 0.0004638835380319506, "global_step": 65395, "epoch": 549, "lr": 1.7589992488955097e-06} +{"train_loss": 0.00025310934870503843, "global_step": 65396, "epoch": 549, "lr": 1.7584168137920631e-06} +{"train_loss": 0.00045948970364406705, "global_step": 65397, "epoch": 549, "lr": 1.7578344734058227e-06} +{"train_loss": 0.000161287491209805, "global_step": 65398, "epoch": 549, "lr": 1.757252227737921e-06} +{"train_loss": 0.00023144151782616973, "global_step": 65399, "epoch": 549, "lr": 1.7566700767894905e-06} +{"train_loss": 0.00044109602458775043, "global_step": 65400, "epoch": 549, "lr": 1.7560880205616914e-06} +{"train_loss": 0.00023697852157056332, "global_step": 65401, "epoch": 549, "lr": 1.755506059055656e-06} +{"train_loss": 0.00013363672769628465, "global_step": 65402, "epoch": 549, "lr": 1.7549241922725335e-06} +{"train_loss": 0.00017447398568037897, "global_step": 65403, "epoch": 549, "lr": 1.7543424202134674e-06} +{"train_loss": 0.00017666998610366136, "global_step": 65404, "epoch": 549, "lr": 1.7537607428795844e-06} +{"train_loss": 0.0005267698434181511, "global_step": 65405, "epoch": 549, "lr": 1.753179160272045e-06} +{"train_loss": 0.00029513100162148476, "global_step": 65406, "epoch": 549, "lr": 1.7525976723919812e-06} +{"train_loss": 0.00025084917433559895, "global_step": 65407, "epoch": 549, "lr": 1.7520162792405315e-06} +{"train_loss": 0.0002792270970530808, "global_step": 65408, "epoch": 549, "lr": 1.7514349808188557e-06} +{"train_loss": 0.00023155796225182712, "global_step": 65409, "epoch": 549, "lr": 1.7508537771280754e-06} +{"train_loss": 0.00018564598576631397, "global_step": 65410, "epoch": 549, "lr": 1.7502726681693394e-06} +{"train_loss": 0.00019030352996196598, "global_step": 65411, "epoch": 549, "lr": 1.7496916539437858e-06} +{"train_loss": 0.00020749421673826873, "global_step": 65412, "epoch": 549, "lr": 1.7491107344525637e-06} +{"train_loss": 0.0003094134444836527, "global_step": 65413, "epoch": 549, "lr": 1.7485299096968056e-06} +{"train_loss": 0.00025913590798154473, "global_step": 65414, "epoch": 549, "lr": 1.7479491796776548e-06} +{"train_loss": 0.00016217640950344503, "global_step": 65415, "epoch": 549, "lr": 1.7473685443962494e-06} +{"train_loss": 0.00021277136693242937, "global_step": 65416, "epoch": 549, "lr": 1.7467880038537331e-06} +{"train_loss": 0.00016890121332835406, "global_step": 65417, "epoch": 549, "lr": 1.7462075580512438e-06} +{"train_loss": 0.00016207597218453884, "global_step": 65418, "epoch": 549, "lr": 1.7456272069899192e-06} +{"train_loss": 0.0002546020841691643, "global_step": 65419, "epoch": 549, "lr": 1.7450469506709033e-06} +{"train_loss": 0.00026713067200034857, "global_step": 65420, "epoch": 549, "lr": 1.7444667890953227e-06} +{"train_loss": 0.00023486645659431815, "global_step": 65421, "epoch": 549, "lr": 1.7438867222643374e-06} +{"train_loss": 0.00023309321841225028, "global_step": 65422, "epoch": 549, "lr": 1.7433067501790744e-06} +{"train_loss": 0.0003044139011763036, "global_step": 65423, "epoch": 549, "lr": 1.7427268728406666e-06} +{"train_loss": 0.0003636558831203729, "global_step": 65424, "epoch": 549, "lr": 1.7421470902502624e-06} +{"train_loss": 0.00020146546012256294, "global_step": 65425, "epoch": 549, "lr": 1.7415674024089946e-06} +{"train_loss": 0.00031507221865467727, "global_step": 65426, "epoch": 549, "lr": 1.7409878093180065e-06} +{"train_loss": 0.00024312816094607115, "global_step": 65427, "epoch": 549, "lr": 1.7404083109784253e-06} +{"train_loss": 0.0005522965220734477, "global_step": 65428, "epoch": 549, "lr": 1.7398289073914054e-06} +{"train_loss": 0.00030045336461625993, "global_step": 65429, "epoch": 549, "lr": 1.7392495985580792e-06} +{"train_loss": 0.0002738106995820999, "global_step": 65430, "epoch": 549, "lr": 1.7386703844795681e-06} +{"train_loss": 0.0004463415243662894, "global_step": 65431, "epoch": 549, "lr": 1.7380912651570324e-06} +{"train_loss": 0.00017989909974858165, "global_step": 65432, "epoch": 549, "lr": 1.7375122405915932e-06} +{"train_loss": 0.0002678879245650023, "global_step": 65433, "epoch": 549, "lr": 1.7369333107843944e-06} +{"train_loss": 0.0002519030822440982, "global_step": 65434, "epoch": 549, "lr": 1.736354475736568e-06} +{"train_loss": 0.00015807751333341002, "global_step": 65435, "epoch": 549, "lr": 1.7357757354492577e-06} +{"train_loss": 0.00012547842925414443, "global_step": 65436, "epoch": 549, "lr": 1.7351970899235959e-06} +{"train_loss": 0.0002713915309868753, "global_step": 65437, "epoch": 549, "lr": 1.734618539160715e-06} +{"train_loss": 0.0005610653315670788, "global_step": 65438, "epoch": 549, "lr": 1.734040083161753e-06} +{"train_loss": 0.0003836072573903948, "global_step": 65439, "epoch": 549, "lr": 1.733461721927848e-06} +{"train_loss": 0.00027043488807976246, "global_step": 65440, "epoch": 549, "lr": 1.7328834554601381e-06} +{"train_loss": 0.0006163910147733986, "global_step": 65441, "epoch": 549, "lr": 1.7323052837597497e-06} +{"train_loss": 0.00017547271272633225, "global_step": 65442, "epoch": 549, "lr": 1.7317272068278213e-06} +{"train_loss": 0.0001868491235654801, "global_step": 65443, "epoch": 549, "lr": 1.7311492246654959e-06} +{"train_loss": 0.00031214585760608315, "global_step": 65444, "epoch": 549, "lr": 1.7305713372738952e-06} +{"train_loss": 0.0001600228133611381, "global_step": 65445, "epoch": 549, "lr": 1.7299935446541682e-06} +{"train_loss": 0.00019164780678693205, "global_step": 65446, "epoch": 549, "lr": 1.7294158468074418e-06} +{"train_loss": 0.00020826021500397474, "global_step": 65447, "epoch": 549, "lr": 1.7288382437348483e-06} +{"train_loss": 0.0002144596364814788, "global_step": 65448, "epoch": 549, "lr": 1.7282607354375258e-06} +{"train_loss": 0.00028265428586526453, "global_step": 65449, "epoch": 549, "lr": 1.7276833219166012e-06, "val_loss": 0.03190485015511513} +{"train_loss": 0.00045459275133907795, "global_step": 65450, "epoch": 550, "lr": 1.7271060031732178e-06} +{"train_loss": 0.00016027649689931422, "global_step": 65451, "epoch": 550, "lr": 1.7265287792085027e-06} +{"train_loss": 0.00025492225540801883, "global_step": 65452, "epoch": 550, "lr": 1.725951650023594e-06} +{"train_loss": 0.00013354999828152359, "global_step": 65453, "epoch": 550, "lr": 1.7253746156196183e-06} +{"train_loss": 0.00028577467310242355, "global_step": 65454, "epoch": 550, "lr": 1.7247976759977137e-06} +{"train_loss": 0.0002773923333734274, "global_step": 65455, "epoch": 550, "lr": 1.7242208311590125e-06} +{"train_loss": 0.0003264537954237312, "global_step": 65456, "epoch": 550, "lr": 1.7236440811046416e-06} +{"train_loss": 0.0003005021426361054, "global_step": 65457, "epoch": 550, "lr": 1.723067425835745e-06} +{"train_loss": 0.00038150313775986433, "global_step": 65458, "epoch": 550, "lr": 1.7224908653534434e-06} +{"train_loss": 0.00020207800844218582, "global_step": 65459, "epoch": 550, "lr": 1.721914399658875e-06} +{"train_loss": 0.00023224360484164208, "global_step": 65460, "epoch": 550, "lr": 1.7213380287531722e-06} +{"train_loss": 0.000177264359081164, "global_step": 65461, "epoch": 550, "lr": 1.7207617526374565e-06} +{"train_loss": 0.0002556194958742708, "global_step": 65462, "epoch": 550, "lr": 1.7201855713128767e-06} +{"train_loss": 0.0001777662109816447, "global_step": 65463, "epoch": 550, "lr": 1.7196094847805433e-06} +{"train_loss": 0.000147202517837286, "global_step": 65464, "epoch": 550, "lr": 1.7190334930416107e-06} +{"train_loss": 0.00016973933088593185, "global_step": 65465, "epoch": 550, "lr": 1.7184575960971895e-06} +{"train_loss": 0.00016051104466896504, "global_step": 65466, "epoch": 550, "lr": 1.7178817939484226e-06} +{"train_loss": 0.000338854908477515, "global_step": 65467, "epoch": 550, "lr": 1.7173060865964375e-06} +{"train_loss": 0.0003130568074993789, "global_step": 65468, "epoch": 550, "lr": 1.7167304740423606e-06} +{"train_loss": 0.0003032577224075794, "global_step": 65469, "epoch": 550, "lr": 1.7161549562873246e-06} +{"train_loss": 0.0002279785112477839, "global_step": 65470, "epoch": 550, "lr": 1.715579533332462e-06} +{"train_loss": 0.00023487808357458562, "global_step": 65471, "epoch": 550, "lr": 1.7150042051788995e-06} +{"train_loss": 0.0002202327159466222, "global_step": 65472, "epoch": 550, "lr": 1.7144289718277695e-06} +{"train_loss": 0.0001278017443837598, "global_step": 65473, "epoch": 550, "lr": 1.713853833280199e-06} +{"train_loss": 0.00025223148986697197, "global_step": 65474, "epoch": 550, "lr": 1.7132787895373147e-06} +{"train_loss": 0.0003073512052651495, "global_step": 65475, "epoch": 550, "lr": 1.7127038406002549e-06} +{"train_loss": 0.0001982246176339686, "global_step": 65476, "epoch": 550, "lr": 1.712128986470135e-06} +{"train_loss": 0.00023007015988696367, "global_step": 65477, "epoch": 550, "lr": 1.711554227148099e-06} +{"train_loss": 0.00023281501489691436, "global_step": 65478, "epoch": 550, "lr": 1.7109795626352565e-06} +{"train_loss": 0.00022558349883183837, "global_step": 65479, "epoch": 550, "lr": 1.710404992932757e-06} +{"train_loss": 0.0003160014748573303, "global_step": 65480, "epoch": 550, "lr": 1.7098305180417107e-06} +{"train_loss": 0.0006023359601385891, "global_step": 65481, "epoch": 550, "lr": 1.709256137963261e-06} +{"train_loss": 0.0003165830858051777, "global_step": 65482, "epoch": 550, "lr": 1.7086818526985238e-06} +{"train_loss": 0.0002507561584934592, "global_step": 65483, "epoch": 550, "lr": 1.7081076622486313e-06} +{"train_loss": 0.00024365571152884513, "global_step": 65484, "epoch": 550, "lr": 1.7075335666147051e-06} +{"train_loss": 0.000495032116305083, "global_step": 65485, "epoch": 550, "lr": 1.7069595657978831e-06} +{"train_loss": 0.00034087043604813516, "global_step": 65486, "epoch": 550, "lr": 1.7063856597992923e-06} +{"train_loss": 0.0002431336761219427, "global_step": 65487, "epoch": 550, "lr": 1.7058118486200425e-06} +{"train_loss": 0.00022445320792030543, "global_step": 65488, "epoch": 550, "lr": 1.7052381322612775e-06} +{"train_loss": 0.00023654161486774683, "global_step": 65489, "epoch": 550, "lr": 1.7046645107241132e-06} +{"train_loss": 0.00019017890735995024, "global_step": 65490, "epoch": 550, "lr": 1.7040909840096875e-06} +{"train_loss": 0.000508515106048435, "global_step": 65491, "epoch": 550, "lr": 1.7035175521191216e-06} +{"train_loss": 0.0002498468093108386, "global_step": 65492, "epoch": 550, "lr": 1.7029442150535312e-06} +{"train_loss": 0.0002464074350427836, "global_step": 65493, "epoch": 550, "lr": 1.7023709728140547e-06} +{"train_loss": 0.00018664830713532865, "global_step": 65494, "epoch": 550, "lr": 1.7017978254018074e-06} +{"train_loss": 0.00019425229402258992, "global_step": 65495, "epoch": 550, "lr": 1.701224772817922e-06} +{"train_loss": 0.000156607071403414, "global_step": 65496, "epoch": 550, "lr": 1.7006518150635252e-06} +{"train_loss": 0.00020895969646517187, "global_step": 65497, "epoch": 550, "lr": 1.7000789521397388e-06} +{"train_loss": 0.00035638452391140163, "global_step": 65498, "epoch": 550, "lr": 1.6995061840476833e-06} +{"train_loss": 0.00020015894551761448, "global_step": 65499, "epoch": 550, "lr": 1.6989335107884862e-06} +{"train_loss": 0.00015475667896680534, "global_step": 65500, "epoch": 550, "lr": 1.6983609323632798e-06} +{"train_loss": 0.0002105503372149542, "global_step": 65501, "epoch": 550, "lr": 1.6977884487731743e-06} +{"train_loss": 0.00019708143372554332, "global_step": 65502, "epoch": 550, "lr": 1.6972160600193077e-06} +{"train_loss": 0.0001949962752405554, "global_step": 65503, "epoch": 550, "lr": 1.6966437661027901e-06} +{"train_loss": 0.0003467942005954683, "global_step": 65504, "epoch": 550, "lr": 1.6960715670247597e-06} +{"train_loss": 0.00031420309096574783, "global_step": 65505, "epoch": 550, "lr": 1.6954994627863264e-06} +{"train_loss": 0.0003423144808039069, "global_step": 65506, "epoch": 550, "lr": 1.6949274533886228e-06} +{"train_loss": 0.00015031812654342502, "global_step": 65507, "epoch": 550, "lr": 1.6943555388327593e-06} +{"train_loss": 0.0002132386580342427, "global_step": 65508, "epoch": 550, "lr": 1.693783719119879e-06} +{"train_loss": 0.00012947246432304382, "global_step": 65509, "epoch": 550, "lr": 1.693211994251087e-06} +{"train_loss": 0.00015979573072399944, "global_step": 65510, "epoch": 550, "lr": 1.6926403642275158e-06} +{"train_loss": 0.00021482480224221945, "global_step": 65511, "epoch": 550, "lr": 1.6920688290502807e-06} +{"train_loss": 0.00012073357356712222, "global_step": 65512, "epoch": 550, "lr": 1.6914973887205143e-06} +{"train_loss": 0.00021819469111505896, "global_step": 65513, "epoch": 550, "lr": 1.690926043239327e-06} +{"train_loss": 0.0002745617530308664, "global_step": 65514, "epoch": 550, "lr": 1.6903547926078455e-06} +{"train_loss": 0.0003038542054127902, "global_step": 65515, "epoch": 550, "lr": 1.6897836368271912e-06} +{"train_loss": 0.0002697413437999785, "global_step": 65516, "epoch": 550, "lr": 1.689212575898491e-06} +{"train_loss": 0.00024839083198457956, "global_step": 65517, "epoch": 550, "lr": 1.6886416098228553e-06} +{"train_loss": 0.00018743163673207164, "global_step": 65518, "epoch": 550, "lr": 1.6880707386014105e-06} +{"train_loss": 0.00037675106432288885, "global_step": 65519, "epoch": 550, "lr": 1.6874999622352782e-06} +{"train_loss": 0.00029132768395356834, "global_step": 65520, "epoch": 550, "lr": 1.6869292807255799e-06} +{"train_loss": 0.00017785611271392554, "global_step": 65521, "epoch": 550, "lr": 1.6863586940734311e-06} +{"train_loss": 0.0005605453625321388, "global_step": 65522, "epoch": 550, "lr": 1.6857882022799643e-06} +{"train_loss": 0.00037451667594723403, "global_step": 65523, "epoch": 550, "lr": 1.6852178053462786e-06} +{"train_loss": 0.0001637377281440422, "global_step": 65524, "epoch": 550, "lr": 1.684647503273512e-06} +{"train_loss": 0.0003563737263903022, "global_step": 65525, "epoch": 550, "lr": 1.6840772960627748e-06} +{"train_loss": 0.0002815313055180013, "global_step": 65526, "epoch": 550, "lr": 1.6835071837151994e-06} +{"train_loss": 0.00013953108282294124, "global_step": 65527, "epoch": 550, "lr": 1.682937166231885e-06} +{"train_loss": 0.00025974807795137167, "global_step": 65528, "epoch": 550, "lr": 1.6823672436139693e-06} +{"train_loss": 0.00028720797854475677, "global_step": 65529, "epoch": 550, "lr": 1.6817974158625626e-06} +{"train_loss": 0.0003008860512636602, "global_step": 65530, "epoch": 550, "lr": 1.6812276829787755e-06} +{"train_loss": 0.000256138329859823, "global_step": 65531, "epoch": 550, "lr": 1.6806580449637455e-06} +{"train_loss": 0.00014175250544212759, "global_step": 65532, "epoch": 550, "lr": 1.6800885018185774e-06} +{"train_loss": 0.00029669483774341643, "global_step": 65533, "epoch": 550, "lr": 1.6795190535443927e-06} +{"train_loss": 0.00016786919150035828, "global_step": 65534, "epoch": 550, "lr": 1.678949700142307e-06} +{"train_loss": 0.00026299571618437767, "global_step": 65535, "epoch": 550, "lr": 1.678380441613453e-06} +{"train_loss": 0.0001628838654141873, "global_step": 65536, "epoch": 550, "lr": 1.6778112779589294e-06} +{"train_loss": 0.00022931124840397388, "global_step": 65537, "epoch": 550, "lr": 1.6772422091798578e-06} +{"train_loss": 0.00014118418039288372, "global_step": 65538, "epoch": 550, "lr": 1.6766732352773651e-06} +{"train_loss": 0.0003162849461659789, "global_step": 65539, "epoch": 550, "lr": 1.6761043562525558e-06} +{"train_loss": 0.00027306360425427556, "global_step": 65540, "epoch": 550, "lr": 1.6755355721065514e-06} +{"train_loss": 0.0003269124135840684, "global_step": 65541, "epoch": 550, "lr": 1.674966882840473e-06} +{"train_loss": 0.0002623313048388809, "global_step": 65542, "epoch": 550, "lr": 1.6743982884554366e-06} +{"train_loss": 0.0001427117531420663, "global_step": 65543, "epoch": 550, "lr": 1.6738297889525578e-06} +{"train_loss": 0.00034361082362011075, "global_step": 65544, "epoch": 550, "lr": 1.6732613843329414e-06} +{"train_loss": 0.00023548428725916892, "global_step": 65545, "epoch": 550, "lr": 1.6726930745977255e-06} +{"train_loss": 0.00021466643374878913, "global_step": 65546, "epoch": 550, "lr": 1.6721248597480033e-06} +{"train_loss": 0.00036481916322372854, "global_step": 65547, "epoch": 550, "lr": 1.671556739784913e-06} +{"train_loss": 0.00022696320957038552, "global_step": 65548, "epoch": 550, "lr": 1.6709887147095537e-06} +{"train_loss": 0.00016974321624729782, "global_step": 65549, "epoch": 550, "lr": 1.6704207845230358e-06} +{"train_loss": 0.00026326667284592986, "global_step": 65550, "epoch": 550, "lr": 1.669852949226497e-06} +{"train_loss": 0.00034474304993636906, "global_step": 65551, "epoch": 550, "lr": 1.6692852088210254e-06} +{"train_loss": 0.00032569459290243685, "global_step": 65552, "epoch": 550, "lr": 1.668717563307759e-06} +{"train_loss": 0.00044777654693461955, "global_step": 65553, "epoch": 550, "lr": 1.668150012687797e-06} +{"train_loss": 0.0002206119243055582, "global_step": 65554, "epoch": 550, "lr": 1.6675825569622605e-06} +{"train_loss": 0.0004011490091215819, "global_step": 65555, "epoch": 550, "lr": 1.6670151961322656e-06} +{"train_loss": 0.0003308845916762948, "global_step": 65556, "epoch": 550, "lr": 1.6664479301989166e-06} +{"train_loss": 0.00023288119700737298, "global_step": 65557, "epoch": 550, "lr": 1.6658807591633408e-06} +{"train_loss": 0.00029870515572838485, "global_step": 65558, "epoch": 550, "lr": 1.6653136830266313e-06} +{"train_loss": 0.0004737021226901561, "global_step": 65559, "epoch": 550, "lr": 1.6647467017899264e-06} +{"train_loss": 0.0002577702689450234, "global_step": 65560, "epoch": 550, "lr": 1.664179815454331e-06} +{"train_loss": 0.0002895751385949552, "global_step": 65561, "epoch": 550, "lr": 1.6636130240209436e-06} +{"train_loss": 0.0003021267184522003, "global_step": 65562, "epoch": 550, "lr": 1.6630463274908914e-06} +{"train_loss": 0.00022134851315058768, "global_step": 65563, "epoch": 550, "lr": 1.6624797258652846e-06} +{"train_loss": 0.0002405658015049994, "global_step": 65564, "epoch": 550, "lr": 1.6619132191452337e-06} +{"train_loss": 0.00020801789651159197, "global_step": 65565, "epoch": 550, "lr": 1.661346807331854e-06} +{"train_loss": 0.0002642939507495612, "global_step": 65566, "epoch": 550, "lr": 1.6607804904262558e-06} +{"train_loss": 0.00036309362621977925, "global_step": 65567, "epoch": 550, "lr": 1.6602142684295496e-06} +{"train_loss": 0.00026433133254093785, "global_step": 65568, "epoch": 550, "lr": 1.6596481413428455e-06, "val_loss": 0.028734587132930756, "train_action_mse_error": 3.2251473385258578e-06} +{"train_loss": 0.0001771537063177675, "global_step": 65569, "epoch": 551, "lr": 1.6590821091672648e-06} +{"train_loss": 0.00017421846860088408, "global_step": 65570, "epoch": 551, "lr": 1.658516171903901e-06} +{"train_loss": 0.0001925696269609034, "global_step": 65571, "epoch": 551, "lr": 1.6579503295538867e-06} +{"train_loss": 0.00027075022808276117, "global_step": 65572, "epoch": 551, "lr": 1.6573845821183154e-06} +{"train_loss": 0.00022078004258219153, "global_step": 65573, "epoch": 551, "lr": 1.656818929598314e-06} +{"train_loss": 0.00025869597448036075, "global_step": 65574, "epoch": 551, "lr": 1.6562533719949703e-06} +{"train_loss": 0.00039682743954472244, "global_step": 65575, "epoch": 551, "lr": 1.6556879093094169e-06} +{"train_loss": 0.00019983964739367366, "global_step": 65576, "epoch": 551, "lr": 1.6551225415427528e-06} +{"train_loss": 0.00023981646518222988, "global_step": 65577, "epoch": 551, "lr": 1.6545572686960887e-06} +{"train_loss": 0.00031546104582957923, "global_step": 65578, "epoch": 551, "lr": 1.6539920907705453e-06} +{"train_loss": 0.000265319220488891, "global_step": 65579, "epoch": 551, "lr": 1.653427007767222e-06} +{"train_loss": 0.0001095855695893988, "global_step": 65580, "epoch": 551, "lr": 1.6528620196872235e-06} +{"train_loss": 0.0003597323957365006, "global_step": 65581, "epoch": 551, "lr": 1.6522971265316656e-06} +{"train_loss": 0.0002781699295155704, "global_step": 65582, "epoch": 551, "lr": 1.6517323283016585e-06} +{"train_loss": 0.00014249395462684333, "global_step": 65583, "epoch": 551, "lr": 1.6511676249983122e-06} +{"train_loss": 0.0005119381239637733, "global_step": 65584, "epoch": 551, "lr": 1.6506030166227315e-06} +{"train_loss": 0.0002911576011683792, "global_step": 65585, "epoch": 551, "lr": 1.6500385031760269e-06} +{"train_loss": 0.0002813819737639278, "global_step": 65586, "epoch": 551, "lr": 1.6494740846593083e-06} +{"train_loss": 0.00013629536260850728, "global_step": 65587, "epoch": 551, "lr": 1.6489097610736749e-06} +{"train_loss": 0.00036206471850164235, "global_step": 65588, "epoch": 551, "lr": 1.648345532420248e-06} +{"train_loss": 0.000209969628485851, "global_step": 65589, "epoch": 551, "lr": 1.6477813987001267e-06} +{"train_loss": 0.00020379254419822246, "global_step": 65590, "epoch": 551, "lr": 1.6472173599144215e-06} +{"train_loss": 0.00014118045510258526, "global_step": 65591, "epoch": 551, "lr": 1.6466534160642422e-06} +{"train_loss": 0.00019882744527421892, "global_step": 65592, "epoch": 551, "lr": 1.6460895671506827e-06} +{"train_loss": 0.00019893846183549613, "global_step": 65593, "epoch": 551, "lr": 1.6455258131748751e-06} +{"train_loss": 0.0002679428434930742, "global_step": 65594, "epoch": 551, "lr": 1.6449621541378968e-06} +{"train_loss": 0.0001971810415852815, "global_step": 65595, "epoch": 551, "lr": 1.6443985900408798e-06} +{"train_loss": 0.000381710211513564, "global_step": 65596, "epoch": 551, "lr": 1.6438351208849122e-06} +{"train_loss": 0.00017777044558897614, "global_step": 65597, "epoch": 551, "lr": 1.6432717466711156e-06} +{"train_loss": 0.0005122201982885599, "global_step": 65598, "epoch": 551, "lr": 1.6427084674005888e-06} +{"train_loss": 0.00017464757547713816, "global_step": 65599, "epoch": 551, "lr": 1.6421452830744366e-06} +{"train_loss": 0.00036505053867585957, "global_step": 65600, "epoch": 551, "lr": 1.6415821936937636e-06} +{"train_loss": 0.0006122320774011314, "global_step": 65601, "epoch": 551, "lr": 1.6410191992596746e-06} +{"train_loss": 0.0002158390561817214, "global_step": 65602, "epoch": 551, "lr": 1.6404562997732854e-06} +{"train_loss": 0.00024361519899684936, "global_step": 65603, "epoch": 551, "lr": 1.6398934952356892e-06} +{"train_loss": 0.00022799034195486456, "global_step": 65604, "epoch": 551, "lr": 1.6393307856479966e-06} +{"train_loss": 0.0003688140131998807, "global_step": 65605, "epoch": 551, "lr": 1.6387681710113068e-06} +{"train_loss": 0.0002546736504882574, "global_step": 65606, "epoch": 551, "lr": 1.6382056513267407e-06} +{"train_loss": 0.000211849735933356, "global_step": 65607, "epoch": 551, "lr": 1.6376432265953813e-06} +{"train_loss": 0.0002236896543763578, "global_step": 65608, "epoch": 551, "lr": 1.6370808968183438e-06} +{"train_loss": 0.00014816310431342572, "global_step": 65609, "epoch": 551, "lr": 1.6365186619967333e-06} +{"train_loss": 0.00041127667645923793, "global_step": 65610, "epoch": 551, "lr": 1.6359565221316543e-06} +{"train_loss": 0.00026662542950361967, "global_step": 65611, "epoch": 551, "lr": 1.6353944772242003e-06} +{"train_loss": 0.0002406557323411107, "global_step": 65612, "epoch": 551, "lr": 1.6348325272754872e-06} +{"train_loss": 0.0006018769345246255, "global_step": 65613, "epoch": 551, "lr": 1.6342706722866085e-06} +{"train_loss": 0.00012899913417641073, "global_step": 65614, "epoch": 551, "lr": 1.6337089122586801e-06} +{"train_loss": 0.00028447105432860553, "global_step": 65615, "epoch": 551, "lr": 1.63314724719279e-06} +{"train_loss": 0.0002195273118559271, "global_step": 65616, "epoch": 551, "lr": 1.6325856770900539e-06} +{"train_loss": 0.0001966645213542506, "global_step": 65617, "epoch": 551, "lr": 1.6320242019515708e-06} +{"train_loss": 0.0001647206663619727, "global_step": 65618, "epoch": 551, "lr": 1.6314628217784289e-06} +{"train_loss": 0.000522718473803252, "global_step": 65619, "epoch": 551, "lr": 1.630901536571755e-06} +{"train_loss": 0.00031268977909348905, "global_step": 65620, "epoch": 551, "lr": 1.6303403463326261e-06} +{"train_loss": 0.00013734924141317606, "global_step": 65621, "epoch": 551, "lr": 1.629779251062169e-06} +{"train_loss": 0.00031991503783501685, "global_step": 65622, "epoch": 551, "lr": 1.6292182507614605e-06} +{"train_loss": 0.00018893966625910252, "global_step": 65623, "epoch": 551, "lr": 1.6286573454316223e-06} +{"train_loss": 0.0002570867945905775, "global_step": 65624, "epoch": 551, "lr": 1.6280965350737532e-06} +{"train_loss": 0.0002979193814098835, "global_step": 65625, "epoch": 551, "lr": 1.6275358196889356e-06} +{"train_loss": 0.00039370733429677784, "global_step": 65626, "epoch": 551, "lr": 1.6269751992782912e-06} +{"train_loss": 0.00018406087474431843, "global_step": 65627, "epoch": 551, "lr": 1.6264146738429077e-06} +{"train_loss": 0.0002217294240836054, "global_step": 65628, "epoch": 551, "lr": 1.6258542433839009e-06} +{"train_loss": 0.0003067778015974909, "global_step": 65629, "epoch": 551, "lr": 1.6252939079023588e-06} +{"train_loss": 0.00021108199143782258, "global_step": 65630, "epoch": 551, "lr": 1.6247336673993751e-06} +{"train_loss": 0.00016674664220772684, "global_step": 65631, "epoch": 551, "lr": 1.6241735218760657e-06} +{"train_loss": 0.00025834585539996624, "global_step": 65632, "epoch": 551, "lr": 1.6236134713335182e-06} +{"train_loss": 0.00037783742300234735, "global_step": 65633, "epoch": 551, "lr": 1.6230535157728432e-06} +{"train_loss": 0.0003426139010116458, "global_step": 65634, "epoch": 551, "lr": 1.6224936551951285e-06} +{"train_loss": 0.00015015286044217646, "global_step": 65635, "epoch": 551, "lr": 1.6219338896014903e-06} +{"train_loss": 0.0004501879739109427, "global_step": 65636, "epoch": 551, "lr": 1.6213742189930103e-06} +{"train_loss": 0.00041469812276773155, "global_step": 65637, "epoch": 551, "lr": 1.6208146433707883e-06} +{"train_loss": 0.0006221348303370178, "global_step": 65638, "epoch": 551, "lr": 1.6202551627359286e-06} +{"train_loss": 0.0002063518768409267, "global_step": 65639, "epoch": 551, "lr": 1.619695777089536e-06} +{"train_loss": 0.00030012978822924197, "global_step": 65640, "epoch": 551, "lr": 1.619136486432693e-06} +{"train_loss": 0.0003890903026331216, "global_step": 65641, "epoch": 551, "lr": 1.6185772907665153e-06} +{"train_loss": 0.0001802369370125234, "global_step": 65642, "epoch": 551, "lr": 1.6180181900920855e-06} +{"train_loss": 0.00021511992963496596, "global_step": 65643, "epoch": 551, "lr": 1.6174591844105191e-06} +{"train_loss": 0.0006277915090322495, "global_step": 65644, "epoch": 551, "lr": 1.6169002737228877e-06} +{"train_loss": 0.0002616426791064441, "global_step": 65645, "epoch": 551, "lr": 1.6163414580303182e-06} +{"train_loss": 0.00018806323350872844, "global_step": 65646, "epoch": 551, "lr": 1.6157827373338818e-06} +{"train_loss": 0.0005409105215221643, "global_step": 65647, "epoch": 551, "lr": 1.6152241116346944e-06} +{"train_loss": 0.0003523645573295653, "global_step": 65648, "epoch": 551, "lr": 1.614665580933844e-06} +{"train_loss": 0.0003426730399951339, "global_step": 65649, "epoch": 551, "lr": 1.614107145232424e-06} +{"train_loss": 0.0003178661863785237, "global_step": 65650, "epoch": 551, "lr": 1.613548804531545e-06} +{"train_loss": 0.00018388248281553388, "global_step": 65651, "epoch": 551, "lr": 1.6129905588322835e-06} +{"train_loss": 0.00026560944388620555, "global_step": 65652, "epoch": 551, "lr": 1.61243240813575e-06} +{"train_loss": 0.0003068030928261578, "global_step": 65653, "epoch": 551, "lr": 1.6118743524430324e-06} +{"train_loss": 0.000252458150498569, "global_step": 65654, "epoch": 551, "lr": 1.6113163917552353e-06} +{"train_loss": 0.0002213745901826769, "global_step": 65655, "epoch": 551, "lr": 1.610758526073447e-06} +{"train_loss": 0.00038225323078222573, "global_step": 65656, "epoch": 551, "lr": 1.6102007553987608e-06} +{"train_loss": 0.00014946794544812292, "global_step": 65657, "epoch": 551, "lr": 1.6096430797322815e-06} +{"train_loss": 0.00021494258544407785, "global_step": 65658, "epoch": 551, "lr": 1.6090854990750969e-06} +{"train_loss": 0.0002934994117822498, "global_step": 65659, "epoch": 551, "lr": 1.608528013428301e-06} +{"train_loss": 0.00010781850141938776, "global_step": 65660, "epoch": 551, "lr": 1.607970622792998e-06} +{"train_loss": 0.00020378251792863011, "global_step": 65661, "epoch": 551, "lr": 1.607413327170265e-06} +{"train_loss": 0.00047373250708915293, "global_step": 65662, "epoch": 551, "lr": 1.606856126561207e-06} +{"train_loss": 0.00018012704094871879, "global_step": 65663, "epoch": 551, "lr": 1.6062990209669171e-06} +{"train_loss": 0.0002783063391689211, "global_step": 65664, "epoch": 551, "lr": 1.6057420103884945e-06} +{"train_loss": 0.00042778291390277445, "global_step": 65665, "epoch": 551, "lr": 1.605185094827022e-06} +{"train_loss": 0.00035483032115735114, "global_step": 65666, "epoch": 551, "lr": 1.604628274283604e-06} +{"train_loss": 0.0002504279837012291, "global_step": 65667, "epoch": 551, "lr": 1.6040715487593228e-06} +{"train_loss": 0.00021532661048695445, "global_step": 65668, "epoch": 551, "lr": 1.6035149182552778e-06} +{"train_loss": 0.000492663006298244, "global_step": 65669, "epoch": 551, "lr": 1.6029583827725624e-06} +{"train_loss": 0.0001506244734628126, "global_step": 65670, "epoch": 551, "lr": 1.602401942312265e-06} +{"train_loss": 0.0003024264005944133, "global_step": 65671, "epoch": 551, "lr": 1.6018455968754842e-06} +{"train_loss": 0.0001509441644884646, "global_step": 65672, "epoch": 551, "lr": 1.6012893464633028e-06} +{"train_loss": 0.0003054403350688517, "global_step": 65673, "epoch": 551, "lr": 1.6007331910768252e-06} +{"train_loss": 0.00018815651128534228, "global_step": 65674, "epoch": 551, "lr": 1.6001771307171343e-06} +{"train_loss": 0.00021610541443806142, "global_step": 65675, "epoch": 551, "lr": 1.5996211653853232e-06} +{"train_loss": 0.00022315514797810465, "global_step": 65676, "epoch": 551, "lr": 1.5990652950824913e-06} +{"train_loss": 0.00027150040841661394, "global_step": 65677, "epoch": 551, "lr": 1.598509519809721e-06} +{"train_loss": 0.00019516890461090952, "global_step": 65678, "epoch": 551, "lr": 1.597953839568106e-06} +{"train_loss": 0.00019086894462816417, "global_step": 65679, "epoch": 551, "lr": 1.5973982543587396e-06} +{"train_loss": 0.00019019121828023344, "global_step": 65680, "epoch": 551, "lr": 1.5968427641827044e-06} +{"train_loss": 0.00017127390310633928, "global_step": 65681, "epoch": 551, "lr": 1.5962873690411051e-06} +{"train_loss": 0.0003587533428799361, "global_step": 65682, "epoch": 551, "lr": 1.5957320689350186e-06} +{"train_loss": 0.00037658115616068244, "global_step": 65683, "epoch": 551, "lr": 1.5951768638655495e-06} +{"train_loss": 0.00020687827782239765, "global_step": 65684, "epoch": 551, "lr": 1.5946217538337692e-06} +{"train_loss": 0.00020076261716894805, "global_step": 65685, "epoch": 551, "lr": 1.5940667388407826e-06} +{"train_loss": 0.00034385002800263464, "global_step": 65686, "epoch": 551, "lr": 1.5935118188876774e-06} +{"train_loss": 0.00027553949083452026, "global_step": 65687, "epoch": 551, "lr": 1.5929569939755306e-06, "val_loss": 0.04680512845516205} +{"train_loss": 0.00019012243137694895, "global_step": 65688, "epoch": 552, "lr": 1.5924022641054526e-06} +{"train_loss": 0.00030214019352570176, "global_step": 65689, "epoch": 552, "lr": 1.591847629278509e-06} +{"train_loss": 0.0003050139348488301, "global_step": 65690, "epoch": 552, "lr": 1.59129308949581e-06} +{"train_loss": 0.0003086378565058112, "global_step": 65691, "epoch": 552, "lr": 1.5907386447584327e-06} +{"train_loss": 0.00010966052650474012, "global_step": 65692, "epoch": 552, "lr": 1.5901842950674705e-06} +{"train_loss": 0.00024731626035645604, "global_step": 65693, "epoch": 552, "lr": 1.5896300404240117e-06} +{"train_loss": 0.0001573561312397942, "global_step": 65694, "epoch": 552, "lr": 1.589075880829133e-06} +{"train_loss": 0.00018400886619929224, "global_step": 65695, "epoch": 552, "lr": 1.5885218162839388e-06} +{"train_loss": 0.0003131479606963694, "global_step": 65696, "epoch": 552, "lr": 1.5879678467895064e-06} +{"train_loss": 0.0004096826014574617, "global_step": 65697, "epoch": 552, "lr": 1.587413972346935e-06} +{"train_loss": 0.0003065618802793324, "global_step": 65698, "epoch": 552, "lr": 1.5868601929572957e-06} +{"train_loss": 0.00018173469288740307, "global_step": 65699, "epoch": 552, "lr": 1.5863065086216877e-06} +{"train_loss": 0.00016888139361981302, "global_step": 65700, "epoch": 552, "lr": 1.5857529193411935e-06} +{"train_loss": 0.0005130028584972024, "global_step": 65701, "epoch": 552, "lr": 1.5851994251169011e-06} +{"train_loss": 0.00017174793174490333, "global_step": 65702, "epoch": 552, "lr": 1.5846460259498986e-06} +{"train_loss": 0.00029200915014371276, "global_step": 65703, "epoch": 552, "lr": 1.5840927218412682e-06} +{"train_loss": 0.0002548321208450943, "global_step": 65704, "epoch": 552, "lr": 1.5835395127921038e-06} +{"train_loss": 0.00025237860972993076, "global_step": 65705, "epoch": 552, "lr": 1.582986398803482e-06} +{"train_loss": 0.0001993279147427529, "global_step": 65706, "epoch": 552, "lr": 1.5824333798764967e-06} +{"train_loss": 0.00022778772108722478, "global_step": 65707, "epoch": 552, "lr": 1.5818804560122247e-06} +{"train_loss": 0.0002160887379432097, "global_step": 65708, "epoch": 552, "lr": 1.581327627211765e-06} +{"train_loss": 0.0001795437274267897, "global_step": 65709, "epoch": 552, "lr": 1.5807748934761946e-06} +{"train_loss": 0.00019612129835877568, "global_step": 65710, "epoch": 552, "lr": 1.5802222548066015e-06} +{"train_loss": 0.00020732611301355064, "global_step": 65711, "epoch": 552, "lr": 1.5796697112040625e-06} +{"train_loss": 0.00027047941694036126, "global_step": 65712, "epoch": 552, "lr": 1.5791172626696772e-06} +{"train_loss": 0.0003006091865245253, "global_step": 65713, "epoch": 552, "lr": 1.5785649092045162e-06} +{"train_loss": 0.0003396034589968622, "global_step": 65714, "epoch": 552, "lr": 1.5780126508096738e-06} +{"train_loss": 0.00027966074412688613, "global_step": 65715, "epoch": 552, "lr": 1.5774604874862264e-06} +{"train_loss": 0.00025301246205344796, "global_step": 65716, "epoch": 552, "lr": 1.5769084192352679e-06} +{"train_loss": 0.0002309788396814838, "global_step": 65717, "epoch": 552, "lr": 1.576356446057875e-06} +{"train_loss": 0.00029052249738015234, "global_step": 65718, "epoch": 552, "lr": 1.5758045679551304e-06} +{"train_loss": 0.00023496050562243909, "global_step": 65719, "epoch": 552, "lr": 1.5752527849281218e-06} +{"train_loss": 0.00034956910531036556, "global_step": 65720, "epoch": 552, "lr": 1.5747010969779263e-06} +{"train_loss": 0.00023824346135370433, "global_step": 65721, "epoch": 552, "lr": 1.5741495041056376e-06} +{"train_loss": 0.00025185910635627806, "global_step": 65722, "epoch": 552, "lr": 1.5735980063123267e-06} +{"train_loss": 0.0001800384052330628, "global_step": 65723, "epoch": 552, "lr": 1.5730466035990875e-06} +{"train_loss": 0.00034273831988684833, "global_step": 65724, "epoch": 552, "lr": 1.5724952959670024e-06} +{"train_loss": 0.0002019617095356807, "global_step": 65725, "epoch": 552, "lr": 1.5719440834171373e-06} +{"train_loss": 0.0002733917208388448, "global_step": 65726, "epoch": 552, "lr": 1.5713929659505966e-06} +{"train_loss": 0.0002600227890070528, "global_step": 65727, "epoch": 552, "lr": 1.5708419435684462e-06} +{"train_loss": 0.00014690562966279685, "global_step": 65728, "epoch": 552, "lr": 1.5702910162717744e-06} +{"train_loss": 0.000254310347372666, "global_step": 65729, "epoch": 552, "lr": 1.5697401840616687e-06} +{"train_loss": 0.0002561392611823976, "global_step": 65730, "epoch": 552, "lr": 1.5691894469391954e-06} +{"train_loss": 0.0002492977073416114, "global_step": 65731, "epoch": 552, "lr": 1.568638804905448e-06} +{"train_loss": 0.00019875714497175068, "global_step": 65732, "epoch": 552, "lr": 1.568088257961503e-06} +{"train_loss": 0.00018981909670401365, "global_step": 65733, "epoch": 552, "lr": 1.5675378061084435e-06} +{"train_loss": 0.00037179741775617003, "global_step": 65734, "epoch": 552, "lr": 1.5669874493473459e-06} +{"train_loss": 0.00021434130030684173, "global_step": 65735, "epoch": 552, "lr": 1.5664371876792982e-06} +{"train_loss": 0.0003088323283009231, "global_step": 65736, "epoch": 552, "lr": 1.5658870211053723e-06} +{"train_loss": 0.0001853986905189231, "global_step": 65737, "epoch": 552, "lr": 1.5653369496266612e-06} +{"train_loss": 0.00018689448188524693, "global_step": 65738, "epoch": 552, "lr": 1.5647869732442255e-06} +{"train_loss": 0.0001465990935685113, "global_step": 65739, "epoch": 552, "lr": 1.5642370919591642e-06} +{"train_loss": 0.00032566607114858925, "global_step": 65740, "epoch": 552, "lr": 1.5636873057725486e-06} +{"train_loss": 0.00018249031563755125, "global_step": 65741, "epoch": 552, "lr": 1.5631376146854559e-06} +{"train_loss": 0.0001616496592760086, "global_step": 65742, "epoch": 552, "lr": 1.5625880186989682e-06} +{"train_loss": 0.00020107936870772392, "global_step": 65743, "epoch": 552, "lr": 1.5620385178141627e-06} +{"train_loss": 0.0001970368466572836, "global_step": 65744, "epoch": 552, "lr": 1.5614891120321217e-06} +{"train_loss": 0.00015177243039943278, "global_step": 65745, "epoch": 552, "lr": 1.5609398013539224e-06} +{"train_loss": 0.00021672312868759036, "global_step": 65746, "epoch": 552, "lr": 1.5603905857806412e-06} +{"train_loss": 0.00018779253878165036, "global_step": 65747, "epoch": 552, "lr": 1.559841465313361e-06} +{"train_loss": 0.0004689634370151907, "global_step": 65748, "epoch": 552, "lr": 1.5592924399531529e-06} +{"train_loss": 0.00019144501129630953, "global_step": 65749, "epoch": 552, "lr": 1.5587435097010993e-06} +{"train_loss": 0.00018315434863325208, "global_step": 65750, "epoch": 552, "lr": 1.5581946745582831e-06} +{"train_loss": 0.00035747859510593116, "global_step": 65751, "epoch": 552, "lr": 1.55764593452577e-06} +{"train_loss": 0.00023174946545623243, "global_step": 65752, "epoch": 552, "lr": 1.5570972896046476e-06} +{"train_loss": 0.00036697537871077657, "global_step": 65753, "epoch": 552, "lr": 1.5565487397959877e-06} +{"train_loss": 0.0006700422381982207, "global_step": 65754, "epoch": 552, "lr": 1.556000285100867e-06} +{"train_loss": 0.00015678969793953001, "global_step": 65755, "epoch": 552, "lr": 1.5554519255203736e-06} +{"train_loss": 0.00042504200246185064, "global_step": 65756, "epoch": 552, "lr": 1.5549036610555624e-06} +{"train_loss": 0.00026349950348958373, "global_step": 65757, "epoch": 552, "lr": 1.554355491707532e-06} +{"train_loss": 0.00016573845641687512, "global_step": 65758, "epoch": 552, "lr": 1.5538074174773375e-06} +{"train_loss": 0.0002474747016094625, "global_step": 65759, "epoch": 552, "lr": 1.5532594383660782e-06} +{"train_loss": 0.00022436183644458652, "global_step": 65760, "epoch": 552, "lr": 1.5527115543748082e-06} +{"train_loss": 0.00015600855113007128, "global_step": 65761, "epoch": 552, "lr": 1.5521637655046217e-06} +{"train_loss": 0.00023701997997704893, "global_step": 65762, "epoch": 552, "lr": 1.5516160717565843e-06} +{"train_loss": 0.0003510428359732032, "global_step": 65763, "epoch": 552, "lr": 1.5510684731317726e-06} +{"train_loss": 0.0001360907917842269, "global_step": 65764, "epoch": 552, "lr": 1.5505209696312585e-06} +{"train_loss": 0.00030357969808392227, "global_step": 65765, "epoch": 552, "lr": 1.5499735612561238e-06} +{"train_loss": 0.0005218590376898646, "global_step": 65766, "epoch": 552, "lr": 1.5494262480074406e-06} +{"train_loss": 0.00014571075735148042, "global_step": 65767, "epoch": 552, "lr": 1.54887902988628e-06} +{"train_loss": 0.00024358097289223224, "global_step": 65768, "epoch": 552, "lr": 1.5483319068937186e-06} +{"train_loss": 0.000281581305898726, "global_step": 65769, "epoch": 552, "lr": 1.5477848790308336e-06} +{"train_loss": 0.0002661332837305963, "global_step": 65770, "epoch": 552, "lr": 1.5472379462986907e-06} +{"train_loss": 0.00023348831746261567, "global_step": 65771, "epoch": 552, "lr": 1.5466911086983726e-06} +{"train_loss": 0.00019773675012402236, "global_step": 65772, "epoch": 552, "lr": 1.5461443662309561e-06} +{"train_loss": 0.00016060513735283166, "global_step": 65773, "epoch": 552, "lr": 1.5455977188975013e-06} +{"train_loss": 0.00028732226928696036, "global_step": 65774, "epoch": 552, "lr": 1.5450511666990907e-06} +{"train_loss": 0.0001401959452778101, "global_step": 65775, "epoch": 552, "lr": 1.544504709636796e-06} +{"train_loss": 0.0001865864178398624, "global_step": 65776, "epoch": 552, "lr": 1.5439583477116938e-06} +{"train_loss": 0.0003160982159897685, "global_step": 65777, "epoch": 552, "lr": 1.5434120809248443e-06} +{"train_loss": 0.0002563358866609633, "global_step": 65778, "epoch": 552, "lr": 1.5428659092773357e-06} +{"train_loss": 0.0005120692658238113, "global_step": 65779, "epoch": 552, "lr": 1.5423198327702337e-06} +{"train_loss": 0.00020319133182056248, "global_step": 65780, "epoch": 552, "lr": 1.5417738514046043e-06} +{"train_loss": 0.00032706858473829925, "global_step": 65781, "epoch": 552, "lr": 1.5412279651815298e-06} +{"train_loss": 0.00015235572936944664, "global_step": 65782, "epoch": 552, "lr": 1.5406821741020705e-06} +{"train_loss": 0.00027872962527908385, "global_step": 65783, "epoch": 552, "lr": 1.540136478167309e-06} +{"train_loss": 0.00029829138657078147, "global_step": 65784, "epoch": 552, "lr": 1.5395908773783108e-06} +{"train_loss": 0.0002739228948485106, "global_step": 65785, "epoch": 552, "lr": 1.539045371736153e-06} +{"train_loss": 0.0003500036254990846, "global_step": 65786, "epoch": 552, "lr": 1.5384999612419015e-06} +{"train_loss": 0.0003283109108451754, "global_step": 65787, "epoch": 552, "lr": 1.5379546458966221e-06} +{"train_loss": 0.00022444117348641157, "global_step": 65788, "epoch": 552, "lr": 1.5374094257013972e-06} +{"train_loss": 0.00021789925813209265, "global_step": 65789, "epoch": 552, "lr": 1.536864300657287e-06} +{"train_loss": 0.0001276936091016978, "global_step": 65790, "epoch": 552, "lr": 1.5363192707653684e-06} +{"train_loss": 0.0001834394788602367, "global_step": 65791, "epoch": 552, "lr": 1.5357743360267074e-06} +{"train_loss": 0.00023967528250068426, "global_step": 65792, "epoch": 552, "lr": 1.5352294964423807e-06} +{"train_loss": 0.00034320290433242917, "global_step": 65793, "epoch": 552, "lr": 1.5346847520134543e-06} +{"train_loss": 0.0002524301817175001, "global_step": 65794, "epoch": 552, "lr": 1.5341401027409885e-06} +{"train_loss": 0.00023502654221374542, "global_step": 65795, "epoch": 552, "lr": 1.5335955486260655e-06} +{"train_loss": 0.00017077938537113369, "global_step": 65796, "epoch": 552, "lr": 1.5330510896697459e-06} +{"train_loss": 0.00032538259983994067, "global_step": 65797, "epoch": 552, "lr": 1.5325067258731062e-06} +{"train_loss": 0.0003090778482146561, "global_step": 65798, "epoch": 552, "lr": 1.5319624572372181e-06} +{"train_loss": 0.00016314124513883144, "global_step": 65799, "epoch": 552, "lr": 1.5314182837631307e-06} +{"train_loss": 0.00016574452456552535, "global_step": 65800, "epoch": 552, "lr": 1.5308742054519376e-06} +{"train_loss": 0.00027510663494467735, "global_step": 65801, "epoch": 552, "lr": 1.5303302223046823e-06} +{"train_loss": 0.000278423132840544, "global_step": 65802, "epoch": 552, "lr": 1.5297863343224529e-06} +{"train_loss": 0.00028435615240596235, "global_step": 65803, "epoch": 552, "lr": 1.5292425415063095e-06} +{"train_loss": 0.0006137611344456673, "global_step": 65804, "epoch": 552, "lr": 1.528698843857318e-06} +{"train_loss": 0.000283299305010587, "global_step": 65805, "epoch": 552, "lr": 1.52815524137655e-06} +{"train_loss": 0.00025734702783574136, "global_step": 65806, "epoch": 552, "lr": 1.5276117340650653e-06, "val_loss": 0.014320136979222298} +{"train_loss": 0.0008857332286424935, "global_step": 65807, "epoch": 553, "lr": 1.5270683219239411e-06} +{"train_loss": 0.00042262059287168086, "global_step": 65808, "epoch": 553, "lr": 1.5265250049542379e-06} +{"train_loss": 0.0003671148733701557, "global_step": 65809, "epoch": 553, "lr": 1.5259817831570267e-06} +{"train_loss": 0.00026532597257755697, "global_step": 65810, "epoch": 553, "lr": 1.5254386565333678e-06} +{"train_loss": 0.0006311399047262967, "global_step": 65811, "epoch": 553, "lr": 1.5248956250843383e-06} +{"train_loss": 0.0003458032151684165, "global_step": 65812, "epoch": 553, "lr": 1.5243526888109926e-06} +{"train_loss": 0.0003244592226110399, "global_step": 65813, "epoch": 553, "lr": 1.5238098477144026e-06} +{"train_loss": 0.000500551366712898, "global_step": 65814, "epoch": 553, "lr": 1.5232671017956334e-06} +{"train_loss": 0.00017900178499985486, "global_step": 65815, "epoch": 553, "lr": 1.522724451055746e-06} +{"train_loss": 0.0001667997712502256, "global_step": 65816, "epoch": 553, "lr": 1.5221818954958168e-06} +{"train_loss": 0.0004172273329459131, "global_step": 65817, "epoch": 553, "lr": 1.5216394351169062e-06} +{"train_loss": 0.00020103779388591647, "global_step": 65818, "epoch": 553, "lr": 1.5210970699200688e-06} +{"train_loss": 0.0004170504689682275, "global_step": 65819, "epoch": 553, "lr": 1.520554799906382e-06} +{"train_loss": 0.00020987322204746306, "global_step": 65820, "epoch": 553, "lr": 1.5200126250769053e-06} +{"train_loss": 0.00020921594114042819, "global_step": 65821, "epoch": 553, "lr": 1.519470545432705e-06} +{"train_loss": 0.0005832732422277331, "global_step": 65822, "epoch": 553, "lr": 1.518928560974847e-06} +{"train_loss": 0.0002592502860352397, "global_step": 65823, "epoch": 553, "lr": 1.5183866717043915e-06} +{"train_loss": 0.00019865174544975162, "global_step": 65824, "epoch": 553, "lr": 1.5178448776224097e-06} +{"train_loss": 0.00027780505479313433, "global_step": 65825, "epoch": 553, "lr": 1.5173031787299507e-06} +{"train_loss": 0.00014058095985092223, "global_step": 65826, "epoch": 553, "lr": 1.5167615750280917e-06} +{"train_loss": 0.0003833681985270232, "global_step": 65827, "epoch": 553, "lr": 1.516220066517887e-06} +{"train_loss": 0.00030504161259159446, "global_step": 65828, "epoch": 553, "lr": 1.515678653200414e-06} +{"train_loss": 0.00019958960183430463, "global_step": 65829, "epoch": 553, "lr": 1.5151373350767161e-06} +{"train_loss": 0.0001922582450788468, "global_step": 65830, "epoch": 553, "lr": 1.5145961121478758e-06} +{"train_loss": 0.0003342501586303115, "global_step": 65831, "epoch": 553, "lr": 1.5140549844149422e-06} +{"train_loss": 0.00031924282666295767, "global_step": 65832, "epoch": 553, "lr": 1.513513951878981e-06} +{"train_loss": 0.00015681942750234157, "global_step": 65833, "epoch": 553, "lr": 1.5129730145410526e-06} +{"train_loss": 0.0004871354321949184, "global_step": 65834, "epoch": 553, "lr": 1.5124321724022228e-06} +{"train_loss": 0.00017280140309594572, "global_step": 65835, "epoch": 553, "lr": 1.5118914254635574e-06} +{"train_loss": 0.0001539737277198583, "global_step": 65836, "epoch": 553, "lr": 1.5113507737261057e-06} +{"train_loss": 0.0002202371833845973, "global_step": 65837, "epoch": 553, "lr": 1.5108102171909444e-06} +{"train_loss": 0.0007029063417576253, "global_step": 65838, "epoch": 553, "lr": 1.5102697558591172e-06} +{"train_loss": 0.000354029587469995, "global_step": 65839, "epoch": 553, "lr": 1.509729389731701e-06} +{"train_loss": 0.00042874147766269743, "global_step": 65840, "epoch": 553, "lr": 1.5091891188097506e-06} +{"train_loss": 0.000252085505053401, "global_step": 65841, "epoch": 553, "lr": 1.5086489430943207e-06} +{"train_loss": 0.00018454495875630528, "global_step": 65842, "epoch": 553, "lr": 1.5081088625864881e-06} +{"train_loss": 0.0002039870450971648, "global_step": 65843, "epoch": 553, "lr": 1.507568877287302e-06} +{"train_loss": 0.00017693314293865114, "global_step": 65844, "epoch": 553, "lr": 1.507028987197817e-06} +{"train_loss": 0.00027626307564787567, "global_step": 65845, "epoch": 553, "lr": 1.506489192319105e-06} +{"train_loss": 0.0006185509264469147, "global_step": 65846, "epoch": 553, "lr": 1.5059494926522143e-06} +{"train_loss": 0.00016691979544702917, "global_step": 65847, "epoch": 553, "lr": 1.505409888198217e-06} +{"train_loss": 0.00017925837892107666, "global_step": 65848, "epoch": 553, "lr": 1.5048703789581676e-06} +{"train_loss": 0.00024197313177864999, "global_step": 65849, "epoch": 553, "lr": 1.5043309649331205e-06} +{"train_loss": 0.00028606405248865485, "global_step": 65850, "epoch": 553, "lr": 1.5037916461241419e-06} +{"train_loss": 0.000291567703243345, "global_step": 65851, "epoch": 553, "lr": 1.5032524225322809e-06} +{"train_loss": 0.0004134635382797569, "global_step": 65852, "epoch": 553, "lr": 1.5027132941586086e-06} +{"train_loss": 0.0001560735545353964, "global_step": 65853, "epoch": 553, "lr": 1.5021742610041745e-06} +{"train_loss": 0.0008901681285351515, "global_step": 65854, "epoch": 553, "lr": 1.5016353230700442e-06} +{"train_loss": 0.00018424073641654104, "global_step": 65855, "epoch": 553, "lr": 1.5010964803572724e-06} +{"train_loss": 0.00035368313547223806, "global_step": 65856, "epoch": 553, "lr": 1.5005577328669084e-06} +{"train_loss": 0.0002607755595818162, "global_step": 65857, "epoch": 553, "lr": 1.5000190806000293e-06} +{"train_loss": 0.00040420691948384047, "global_step": 65858, "epoch": 553, "lr": 1.499480523557667e-06} +{"train_loss": 0.00011878648365382105, "global_step": 65859, "epoch": 553, "lr": 1.4989420617409045e-06} +{"train_loss": 0.00017365155508741736, "global_step": 65860, "epoch": 553, "lr": 1.4984036951507796e-06} +{"train_loss": 0.0001359531015623361, "global_step": 65861, "epoch": 553, "lr": 1.4978654237883638e-06} +{"train_loss": 0.00022516038734465837, "global_step": 65862, "epoch": 553, "lr": 1.4973272476547117e-06} +{"train_loss": 0.0003013511304743588, "global_step": 65863, "epoch": 553, "lr": 1.4967891667508616e-06} +{"train_loss": 0.00021814364299643785, "global_step": 65864, "epoch": 553, "lr": 1.4962511810778957e-06} +{"train_loss": 0.0005166445043869317, "global_step": 65865, "epoch": 553, "lr": 1.4957132906368522e-06} +{"train_loss": 0.0003026471531484276, "global_step": 65866, "epoch": 553, "lr": 1.4951754954288022e-06} +{"train_loss": 0.00024976133136078715, "global_step": 65867, "epoch": 553, "lr": 1.494637795454784e-06} +{"train_loss": 0.00019688732572831213, "global_step": 65868, "epoch": 553, "lr": 1.4941001907158691e-06} +{"train_loss": 0.00013415017747320235, "global_step": 65869, "epoch": 553, "lr": 1.4935626812130953e-06} +{"train_loss": 0.00020510811009444296, "global_step": 65870, "epoch": 553, "lr": 1.4930252669475397e-06} +{"train_loss": 0.00014873914187774062, "global_step": 65871, "epoch": 553, "lr": 1.4924879479202457e-06} +{"train_loss": 0.0003427428309805691, "global_step": 65872, "epoch": 553, "lr": 1.4919507241322683e-06} +{"train_loss": 0.00020790513372048736, "global_step": 65873, "epoch": 553, "lr": 1.4914135955846563e-06} +{"train_loss": 0.00032320176251232624, "global_step": 65874, "epoch": 553, "lr": 1.4908765622784814e-06} +{"train_loss": 0.0001532492315163836, "global_step": 65875, "epoch": 553, "lr": 1.4903396242147816e-06} +{"train_loss": 0.0002571391814853996, "global_step": 65876, "epoch": 553, "lr": 1.4898027813946224e-06} +{"train_loss": 0.00036402029218152165, "global_step": 65877, "epoch": 553, "lr": 1.4892660338190478e-06} +{"train_loss": 0.00022188856382854283, "global_step": 65878, "epoch": 553, "lr": 1.4887293814891234e-06} +{"train_loss": 0.0003152243443764746, "global_step": 65879, "epoch": 553, "lr": 1.4881928244058874e-06} +{"train_loss": 0.0002021918335231021, "global_step": 65880, "epoch": 553, "lr": 1.4876563625704109e-06} +{"train_loss": 0.0002773439628072083, "global_step": 65881, "epoch": 553, "lr": 1.4871199959837378e-06} +{"train_loss": 0.000498589884955436, "global_step": 65882, "epoch": 553, "lr": 1.486583724646917e-06} +{"train_loss": 0.00022763216111343354, "global_step": 65883, "epoch": 553, "lr": 1.4860475485610093e-06} +{"train_loss": 0.00022268539760261774, "global_step": 65884, "epoch": 553, "lr": 1.4855114677270577e-06} +{"train_loss": 0.00023245108604896814, "global_step": 65885, "epoch": 553, "lr": 1.4849754821461282e-06} +{"train_loss": 0.0001796792639652267, "global_step": 65886, "epoch": 553, "lr": 1.48443959181927e-06} +{"train_loss": 0.0005137281841598451, "global_step": 65887, "epoch": 553, "lr": 1.483903796747521e-06} +{"train_loss": 0.00020383998344186693, "global_step": 65888, "epoch": 553, "lr": 1.483368096931953e-06} +{"train_loss": 0.0003124222857877612, "global_step": 65889, "epoch": 553, "lr": 1.4828324923735982e-06} +{"train_loss": 0.00022779652499593794, "global_step": 65890, "epoch": 553, "lr": 1.482296983073528e-06} +{"train_loss": 0.00027914479142054915, "global_step": 65891, "epoch": 553, "lr": 1.4817615690327746e-06} +{"train_loss": 0.00030665742815472186, "global_step": 65892, "epoch": 553, "lr": 1.48122625025241e-06} +{"train_loss": 0.0001892369327833876, "global_step": 65893, "epoch": 553, "lr": 1.4806910267334718e-06} +{"train_loss": 0.00020910584134981036, "global_step": 65894, "epoch": 553, "lr": 1.4801558984770093e-06} +{"train_loss": 0.00021854197257198393, "global_step": 65895, "epoch": 553, "lr": 1.4796208654840772e-06} +{"train_loss": 0.0003326949954498559, "global_step": 65896, "epoch": 553, "lr": 1.4790859277557245e-06} +{"train_loss": 0.00017727745580486953, "global_step": 65897, "epoch": 553, "lr": 1.4785510852930118e-06} +{"train_loss": 0.0002236841683043167, "global_step": 65898, "epoch": 553, "lr": 1.4780163380969713e-06} +{"train_loss": 0.0003778640821110457, "global_step": 65899, "epoch": 553, "lr": 1.4774816861686636e-06} +{"train_loss": 0.000432825880125165, "global_step": 65900, "epoch": 553, "lr": 1.476947129509143e-06} +{"train_loss": 0.00041252488153986633, "global_step": 65901, "epoch": 553, "lr": 1.4764126681194424e-06} +{"train_loss": 0.00018625202937982976, "global_step": 65902, "epoch": 553, "lr": 1.4758783020006272e-06} +{"train_loss": 0.00023293145932257175, "global_step": 65903, "epoch": 553, "lr": 1.4753440311537414e-06} +{"train_loss": 0.00015001717838458717, "global_step": 65904, "epoch": 553, "lr": 1.4748098555798285e-06} +{"train_loss": 0.00017977833340410143, "global_step": 65905, "epoch": 553, "lr": 1.4742757752799485e-06} +{"train_loss": 0.0002410791057627648, "global_step": 65906, "epoch": 553, "lr": 1.4737417902551398e-06} +{"train_loss": 0.00014981537242420018, "global_step": 65907, "epoch": 553, "lr": 1.4732079005064569e-06} +{"train_loss": 0.00023349672846961766, "global_step": 65908, "epoch": 553, "lr": 1.4726741060349437e-06} +{"train_loss": 0.00019727936887647957, "global_step": 65909, "epoch": 553, "lr": 1.4721404068416544e-06} +{"train_loss": 0.0002265776856802404, "global_step": 65910, "epoch": 553, "lr": 1.4716068029276276e-06} +{"train_loss": 0.0005746973911300302, "global_step": 65911, "epoch": 553, "lr": 1.471073294293923e-06} +{"train_loss": 0.000362422491889447, "global_step": 65912, "epoch": 553, "lr": 1.4705398809415794e-06} +{"train_loss": 0.000160449359100312, "global_step": 65913, "epoch": 553, "lr": 1.4700065628716454e-06} +{"train_loss": 0.00027072729426436126, "global_step": 65914, "epoch": 553, "lr": 1.4694733400851702e-06} +{"train_loss": 0.0001582505356054753, "global_step": 65915, "epoch": 553, "lr": 1.468940212583192e-06} +{"train_loss": 0.0001809115638025105, "global_step": 65916, "epoch": 553, "lr": 1.4684071803667765e-06} +{"train_loss": 0.0002576785918790847, "global_step": 65917, "epoch": 553, "lr": 1.4678742434369509e-06} +{"train_loss": 0.0007300113793462515, "global_step": 65918, "epoch": 553, "lr": 1.4673414017947696e-06} +{"train_loss": 0.00014849880244582891, "global_step": 65919, "epoch": 553, "lr": 1.466808655441282e-06} +{"train_loss": 0.00020269591186661273, "global_step": 65920, "epoch": 553, "lr": 1.4662760043775258e-06} +{"train_loss": 0.0002509126497898251, "global_step": 65921, "epoch": 553, "lr": 1.4657434486045563e-06} +{"train_loss": 0.0002571225631982088, "global_step": 65922, "epoch": 553, "lr": 1.465210988123411e-06} +{"train_loss": 0.0002377797063672915, "global_step": 65923, "epoch": 553, "lr": 1.464678622935145e-06} +{"train_loss": 0.00018284650286659598, "global_step": 65924, "epoch": 553, "lr": 1.4641463530407906e-06} +{"train_loss": 0.0002896018696072347, "global_step": 65925, "epoch": 553, "lr": 1.4636141784414027e-06, "val_loss": 0.05583711713552475} +{"train_loss": 0.00046752189518883824, "global_step": 65926, "epoch": 554, "lr": 1.4630820991380244e-06} +{"train_loss": 0.0002519392583053559, "global_step": 65927, "epoch": 554, "lr": 1.462550115131689e-06} +{"train_loss": 0.0002180948358727619, "global_step": 65928, "epoch": 554, "lr": 1.4620182264234616e-06} +{"train_loss": 0.00022334919776767492, "global_step": 65929, "epoch": 554, "lr": 1.4614864330143696e-06} +{"train_loss": 0.00023292971309274435, "global_step": 65930, "epoch": 554, "lr": 1.4609547349054676e-06} +{"train_loss": 0.0003445713082328439, "global_step": 65931, "epoch": 554, "lr": 1.460423132097799e-06} +{"train_loss": 0.00015860487474128604, "global_step": 65932, "epoch": 554, "lr": 1.4598916245923965e-06} +{"train_loss": 0.00023986866290215403, "global_step": 65933, "epoch": 554, "lr": 1.459360212390315e-06} +{"train_loss": 0.0002341417857678607, "global_step": 65934, "epoch": 554, "lr": 1.4588288954925922e-06} +{"train_loss": 0.0003134296857751906, "global_step": 65935, "epoch": 554, "lr": 1.458297673900272e-06} +{"train_loss": 0.00017603739979676902, "global_step": 65936, "epoch": 554, "lr": 1.4577665476143976e-06} +{"train_loss": 0.00020652437524404377, "global_step": 65937, "epoch": 554, "lr": 1.4572355166360185e-06} +{"train_loss": 0.00018037181871477515, "global_step": 65938, "epoch": 554, "lr": 1.4567045809661673e-06} +{"train_loss": 0.0002818938810378313, "global_step": 65939, "epoch": 554, "lr": 1.4561737406058873e-06} +{"train_loss": 0.00014940481923986226, "global_step": 65940, "epoch": 554, "lr": 1.4556429955562278e-06} +{"train_loss": 0.0003222092054784298, "global_step": 65941, "epoch": 554, "lr": 1.4551123458182269e-06} +{"train_loss": 0.0002492305065970868, "global_step": 65942, "epoch": 554, "lr": 1.4545817913929283e-06} +{"train_loss": 0.0002714180154725909, "global_step": 65943, "epoch": 554, "lr": 1.4540513322813698e-06} +{"train_loss": 0.0002589348005130887, "global_step": 65944, "epoch": 554, "lr": 1.4535209684845951e-06} +{"train_loss": 0.00021590532560367137, "global_step": 65945, "epoch": 554, "lr": 1.452990700003648e-06} +{"train_loss": 0.0001314888650085777, "global_step": 65946, "epoch": 554, "lr": 1.4524605268395664e-06} +{"train_loss": 0.0002639777376316488, "global_step": 65947, "epoch": 554, "lr": 1.4519304489933883e-06} +{"train_loss": 0.000325726781738922, "global_step": 65948, "epoch": 554, "lr": 1.4514004664661629e-06} +{"train_loss": 0.00017888502043206245, "global_step": 65949, "epoch": 554, "lr": 1.4508705792589228e-06} +{"train_loss": 0.0002981575671583414, "global_step": 65950, "epoch": 554, "lr": 1.450340787372717e-06} +{"train_loss": 0.0002455140929669142, "global_step": 65951, "epoch": 554, "lr": 1.4498110908085726e-06} +{"train_loss": 0.00018610450206324458, "global_step": 65952, "epoch": 554, "lr": 1.4492814895675444e-06} +{"train_loss": 0.00018298673967365175, "global_step": 65953, "epoch": 554, "lr": 1.4487519836506592e-06} +{"train_loss": 0.00034303806023672223, "global_step": 65954, "epoch": 554, "lr": 1.448222573058966e-06} +{"train_loss": 0.00032413905137218535, "global_step": 65955, "epoch": 554, "lr": 1.4476932577935031e-06} +{"train_loss": 0.0004476978210732341, "global_step": 65956, "epoch": 554, "lr": 1.4471640378553031e-06} +{"train_loss": 0.0001828622043831274, "global_step": 65957, "epoch": 554, "lr": 1.4466349132454093e-06} +{"train_loss": 0.0004451690474525094, "global_step": 65958, "epoch": 554, "lr": 1.44610588396486e-06} +{"train_loss": 0.00022571044974029064, "global_step": 65959, "epoch": 554, "lr": 1.4455769500146988e-06} +{"train_loss": 0.00019610600429587066, "global_step": 65960, "epoch": 554, "lr": 1.4450481113959524e-06} +{"train_loss": 0.00021604001813102514, "global_step": 65961, "epoch": 554, "lr": 1.4445193681096758e-06} +{"train_loss": 0.0002146381011698395, "global_step": 65962, "epoch": 554, "lr": 1.4439907201568958e-06} +{"train_loss": 0.00023928230802994221, "global_step": 65963, "epoch": 554, "lr": 1.4434621675386506e-06} +{"train_loss": 0.00025104411179199815, "global_step": 65964, "epoch": 554, "lr": 1.442933710255978e-06} +{"train_loss": 0.0004846666706725955, "global_step": 65965, "epoch": 554, "lr": 1.442405348309922e-06} +{"train_loss": 0.0002833351609297097, "global_step": 65966, "epoch": 554, "lr": 1.441877081701515e-06} +{"train_loss": 0.00022466499649453908, "global_step": 65967, "epoch": 554, "lr": 1.441348910431789e-06} +{"train_loss": 0.00012295505439396948, "global_step": 65968, "epoch": 554, "lr": 1.4408208345017938e-06} +{"train_loss": 0.00018765278218779713, "global_step": 65969, "epoch": 554, "lr": 1.4402928539125503e-06} +{"train_loss": 0.00017609081987757236, "global_step": 65970, "epoch": 554, "lr": 1.4397649686651137e-06} +{"train_loss": 0.0002975579700432718, "global_step": 65971, "epoch": 554, "lr": 1.4392371787605052e-06} +{"train_loss": 0.00037691285251639783, "global_step": 65972, "epoch": 554, "lr": 1.4387094841997685e-06} +{"train_loss": 0.00019923951185774058, "global_step": 65973, "epoch": 554, "lr": 1.4381818849839357e-06} +{"train_loss": 0.00016781987505964935, "global_step": 65974, "epoch": 554, "lr": 1.4376543811140452e-06} +{"train_loss": 0.00025745495804585516, "global_step": 65975, "epoch": 554, "lr": 1.4371269725911297e-06} +{"train_loss": 0.00022472828277386725, "global_step": 65976, "epoch": 554, "lr": 1.4365996594162323e-06} +{"train_loss": 0.0005225908244028687, "global_step": 65977, "epoch": 554, "lr": 1.4360724415903803e-06} +{"train_loss": 0.00046896992716938257, "global_step": 65978, "epoch": 554, "lr": 1.4355453191146173e-06} +{"train_loss": 0.00018303978140465915, "global_step": 65979, "epoch": 554, "lr": 1.4350182919899647e-06} +{"train_loss": 0.00016802844766061753, "global_step": 65980, "epoch": 554, "lr": 1.4344913602174715e-06} +{"train_loss": 0.00037961441557854414, "global_step": 65981, "epoch": 554, "lr": 1.4339645237981648e-06} +{"train_loss": 0.000298582628602162, "global_step": 65982, "epoch": 554, "lr": 1.433437782733077e-06} +{"train_loss": 0.0001503111852798611, "global_step": 65983, "epoch": 554, "lr": 1.4329111370232461e-06} +{"train_loss": 0.0003121148911304772, "global_step": 65984, "epoch": 554, "lr": 1.432384586669705e-06} +{"train_loss": 0.00023018353385850787, "global_step": 65985, "epoch": 554, "lr": 1.4318581316734914e-06} +{"train_loss": 0.00018510555673856288, "global_step": 65986, "epoch": 554, "lr": 1.4313317720356379e-06} +{"train_loss": 0.00021239632042124867, "global_step": 65987, "epoch": 554, "lr": 1.4308055077571713e-06} +{"train_loss": 0.00021567575458902866, "global_step": 65988, "epoch": 554, "lr": 1.43027933883913e-06} +{"train_loss": 0.000166812285897322, "global_step": 65989, "epoch": 554, "lr": 1.4297532652825463e-06} +{"train_loss": 0.00017065618885681033, "global_step": 65990, "epoch": 554, "lr": 1.4292272870884527e-06} +{"train_loss": 0.00020075040811207145, "global_step": 65991, "epoch": 554, "lr": 1.4287014042578817e-06} +{"train_loss": 0.000489325902890414, "global_step": 65992, "epoch": 554, "lr": 1.4281756167918714e-06} +{"train_loss": 0.00028436110005714, "global_step": 65993, "epoch": 554, "lr": 1.4276499246914433e-06} +{"train_loss": 0.00020927081641275436, "global_step": 65994, "epoch": 554, "lr": 1.4271243279576352e-06} +{"train_loss": 0.00023605965543538332, "global_step": 65995, "epoch": 554, "lr": 1.4265988265914854e-06} +{"train_loss": 0.00012511902605183423, "global_step": 65996, "epoch": 554, "lr": 1.4260734205940095e-06} +{"train_loss": 0.00020781201601494104, "global_step": 65997, "epoch": 554, "lr": 1.4255481099662571e-06} +{"train_loss": 0.00024181007756851614, "global_step": 65998, "epoch": 554, "lr": 1.4250228947092492e-06} +{"train_loss": 0.0002507807221263647, "global_step": 65999, "epoch": 554, "lr": 1.424497774824024e-06} +{"train_loss": 0.00034819598658941686, "global_step": 66000, "epoch": 554, "lr": 1.4239727503115975e-06} +{"train_loss": 0.00023038999643176794, "global_step": 66001, "epoch": 554, "lr": 1.4234478211730185e-06} +{"train_loss": 0.0003612172731664032, "global_step": 66002, "epoch": 554, "lr": 1.4229229874093086e-06} +{"train_loss": 0.00022455120051745325, "global_step": 66003, "epoch": 554, "lr": 1.4223982490215005e-06} +{"train_loss": 0.00023325470101553947, "global_step": 66004, "epoch": 554, "lr": 1.4218736060106208e-06} +{"train_loss": 0.0003446860355325043, "global_step": 66005, "epoch": 554, "lr": 1.4213490583777078e-06} +{"train_loss": 0.00027856670203618705, "global_step": 66006, "epoch": 554, "lr": 1.4208246061237773e-06} +{"train_loss": 0.0001210380214615725, "global_step": 66007, "epoch": 554, "lr": 1.420300249249873e-06} +{"train_loss": 0.0004010100965388119, "global_step": 66008, "epoch": 554, "lr": 1.4197759877570215e-06} +{"train_loss": 0.000188355304999277, "global_step": 66009, "epoch": 554, "lr": 1.4192518216462448e-06} +{"train_loss": 0.0002753163571469486, "global_step": 66010, "epoch": 554, "lr": 1.4187277509185803e-06} +{"train_loss": 0.00018261998775415123, "global_step": 66011, "epoch": 554, "lr": 1.4182037755750554e-06} +{"train_loss": 0.00030437257373705506, "global_step": 66012, "epoch": 554, "lr": 1.417679895616697e-06} +{"train_loss": 0.00025428456137888134, "global_step": 66013, "epoch": 554, "lr": 1.4171561110445263e-06} +{"train_loss": 0.00026061723474413157, "global_step": 66014, "epoch": 554, "lr": 1.4166324218595871e-06} +{"train_loss": 0.00023780608898960054, "global_step": 66015, "epoch": 554, "lr": 1.4161088280628953e-06} +{"train_loss": 0.0002562752924859524, "global_step": 66016, "epoch": 554, "lr": 1.4155853296554888e-06} +{"train_loss": 0.00016004801727831364, "global_step": 66017, "epoch": 554, "lr": 1.415061926638389e-06} +{"train_loss": 0.00046362035209313035, "global_step": 66018, "epoch": 554, "lr": 1.414538619012623e-06} +{"train_loss": 0.0003625192621257156, "global_step": 66019, "epoch": 554, "lr": 1.4140154067792177e-06} +{"train_loss": 0.00012989219976589084, "global_step": 66020, "epoch": 554, "lr": 1.4134922899392056e-06} +{"train_loss": 0.0007407349185086787, "global_step": 66021, "epoch": 554, "lr": 1.412969268493608e-06} +{"train_loss": 0.0005670961108990014, "global_step": 66022, "epoch": 554, "lr": 1.412446342443452e-06} +{"train_loss": 0.00033917365362867713, "global_step": 66023, "epoch": 554, "lr": 1.4119235117897755e-06} +{"train_loss": 0.0003045474295504391, "global_step": 66024, "epoch": 554, "lr": 1.4114007765335946e-06} +{"train_loss": 0.00033943666494451463, "global_step": 66025, "epoch": 554, "lr": 1.4108781366759304e-06} +{"train_loss": 0.00015203567454591393, "global_step": 66026, "epoch": 554, "lr": 1.4103555922178212e-06} +{"train_loss": 0.0006159296608529985, "global_step": 66027, "epoch": 554, "lr": 1.4098331431602829e-06} +{"train_loss": 0.00014435380580835044, "global_step": 66028, "epoch": 554, "lr": 1.4093107895043533e-06} +{"train_loss": 0.0004925545654259622, "global_step": 66029, "epoch": 554, "lr": 1.408788531251043e-06} +{"train_loss": 0.00013554848555941135, "global_step": 66030, "epoch": 554, "lr": 1.4082663684013898e-06} +{"train_loss": 0.00033370667370036244, "global_step": 66031, "epoch": 554, "lr": 1.407744300956415e-06} +{"train_loss": 0.00027918105479329824, "global_step": 66032, "epoch": 554, "lr": 1.4072223289171405e-06} +{"train_loss": 0.00017100303375627846, "global_step": 66033, "epoch": 554, "lr": 1.4067004522845984e-06} +{"train_loss": 0.00015622966748196632, "global_step": 66034, "epoch": 554, "lr": 1.406178671059799e-06} +{"train_loss": 0.00026280409656465054, "global_step": 66035, "epoch": 554, "lr": 1.4056569852437806e-06} +{"train_loss": 0.00012548049562610686, "global_step": 66036, "epoch": 554, "lr": 1.40513539483757e-06} +{"train_loss": 0.00038250323268584907, "global_step": 66037, "epoch": 554, "lr": 1.404613899842172e-06} +{"train_loss": 0.00019695956143550575, "global_step": 66038, "epoch": 554, "lr": 1.4040925002586357e-06} +{"train_loss": 0.0004071157018188387, "global_step": 66039, "epoch": 554, "lr": 1.4035711960879605e-06} +{"train_loss": 0.00025229339371435344, "global_step": 66040, "epoch": 554, "lr": 1.4030499873311898e-06} +{"train_loss": 0.0002982028527185321, "global_step": 66041, "epoch": 554, "lr": 1.4025288739893338e-06} +{"train_loss": 0.0001412096607964486, "global_step": 66042, "epoch": 554, "lr": 1.4020078560634254e-06} +{"train_loss": 0.0002971089561469853, "global_step": 66043, "epoch": 554, "lr": 1.4014869335544855e-06} +{"train_loss": 0.00026797490594800984, "global_step": 66044, "epoch": 554, "lr": 1.400966106463525e-06, "val_loss": 0.021062558516860008} +{"train_loss": 0.00019096041796728969, "global_step": 66045, "epoch": 555, "lr": 1.4004453747915813e-06} +{"train_loss": 0.00013789611693937331, "global_step": 66046, "epoch": 555, "lr": 1.3999247385396651e-06} +{"train_loss": 0.00019630664610303938, "global_step": 66047, "epoch": 555, "lr": 1.399404197708809e-06} +{"train_loss": 0.00018936532433144748, "global_step": 66048, "epoch": 555, "lr": 1.3988837523000286e-06} +{"train_loss": 0.0001667371834628284, "global_step": 66049, "epoch": 555, "lr": 1.3983634023143511e-06} +{"train_loss": 0.00017673576076049358, "global_step": 66050, "epoch": 555, "lr": 1.3978431477527975e-06} +{"train_loss": 0.00027265551034361124, "global_step": 66051, "epoch": 555, "lr": 1.3973229886163786e-06} +{"train_loss": 0.00025840685702860355, "global_step": 66052, "epoch": 555, "lr": 1.3968029249061266e-06} +{"train_loss": 0.00044244882883504033, "global_step": 66053, "epoch": 555, "lr": 1.3962829566230574e-06} +{"train_loss": 0.000244140945142135, "global_step": 66054, "epoch": 555, "lr": 1.395763083768198e-06} +{"train_loss": 0.0002647853398229927, "global_step": 66055, "epoch": 555, "lr": 1.3952433063425695e-06} +{"train_loss": 0.00036159800947643816, "global_step": 66056, "epoch": 555, "lr": 1.3947236243471773e-06} +{"train_loss": 0.00079637102317065, "global_step": 66057, "epoch": 555, "lr": 1.394204037783059e-06} +{"train_loss": 0.00036589711089618504, "global_step": 66058, "epoch": 555, "lr": 1.393684546651225e-06} +{"train_loss": 0.00016253298963420093, "global_step": 66059, "epoch": 555, "lr": 1.393165150952702e-06} +{"train_loss": 0.00015133453416638076, "global_step": 66060, "epoch": 555, "lr": 1.3926458506885009e-06} +{"train_loss": 0.00013656378723680973, "global_step": 66061, "epoch": 555, "lr": 1.3921266458596537e-06} +{"train_loss": 0.00037336625973694026, "global_step": 66062, "epoch": 555, "lr": 1.391607536467171e-06} +{"train_loss": 0.00024635219597257674, "global_step": 66063, "epoch": 555, "lr": 1.3910885225120685e-06} +{"train_loss": 0.0002563054149504751, "global_step": 66064, "epoch": 555, "lr": 1.3905696039953785e-06} +{"train_loss": 0.0002756132453214377, "global_step": 66065, "epoch": 555, "lr": 1.3900507809181062e-06} +{"train_loss": 0.00026731437537819147, "global_step": 66066, "epoch": 555, "lr": 1.3895320532812784e-06} +{"train_loss": 0.0003953363047912717, "global_step": 66067, "epoch": 555, "lr": 1.389013421085905e-06} +{"train_loss": 0.00025856203865259886, "global_step": 66068, "epoch": 555, "lr": 1.3884948843330193e-06} +{"train_loss": 0.00022925740631762892, "global_step": 66069, "epoch": 555, "lr": 1.3879764430236253e-06} +{"train_loss": 0.00021826410375069827, "global_step": 66070, "epoch": 555, "lr": 1.3874580971587448e-06} +{"train_loss": 0.00039233436109498143, "global_step": 66071, "epoch": 555, "lr": 1.3869398467394046e-06} +{"train_loss": 0.00023669099027756602, "global_step": 66072, "epoch": 555, "lr": 1.386421691766604e-06} +{"train_loss": 0.0002521082933526486, "global_step": 66073, "epoch": 555, "lr": 1.385903632241381e-06} +{"train_loss": 0.00026078580413013697, "global_step": 66074, "epoch": 555, "lr": 1.3853856681647403e-06} +{"train_loss": 0.00026194623205810785, "global_step": 66075, "epoch": 555, "lr": 1.384867799537698e-06} +{"train_loss": 0.0002621884341351688, "global_step": 66076, "epoch": 555, "lr": 1.3843500263612752e-06} +{"train_loss": 0.000244857365032658, "global_step": 66077, "epoch": 555, "lr": 1.3838323486364824e-06} +{"train_loss": 0.0002164078614441678, "global_step": 66078, "epoch": 555, "lr": 1.383314766364352e-06} +{"train_loss": 0.00035455511533655226, "global_step": 66079, "epoch": 555, "lr": 1.3827972795458777e-06} +{"train_loss": 0.0004581164103001356, "global_step": 66080, "epoch": 555, "lr": 1.3822798881820975e-06} +{"train_loss": 0.0003623031952884048, "global_step": 66081, "epoch": 555, "lr": 1.3817625922740108e-06} +{"train_loss": 0.00023574595979880542, "global_step": 66082, "epoch": 555, "lr": 1.3812453918226386e-06} +{"train_loss": 0.00015864898159634322, "global_step": 66083, "epoch": 555, "lr": 1.3807282868289972e-06} +{"train_loss": 0.000268452160526067, "global_step": 66084, "epoch": 555, "lr": 1.3802112772941022e-06} +{"train_loss": 0.00028371921507641673, "global_step": 66085, "epoch": 555, "lr": 1.3796943632189695e-06} +{"train_loss": 0.00019788046483881772, "global_step": 66086, "epoch": 555, "lr": 1.3791775446046152e-06} +{"train_loss": 0.0001698185078566894, "global_step": 66087, "epoch": 555, "lr": 1.3786608214520436e-06} +{"train_loss": 0.0004938565543852746, "global_step": 66088, "epoch": 555, "lr": 1.378144193762282e-06} +{"train_loss": 0.00036546195042319596, "global_step": 66089, "epoch": 555, "lr": 1.3776276615363347e-06} +{"train_loss": 0.00033636094303801656, "global_step": 66090, "epoch": 555, "lr": 1.3771112247752293e-06} +{"train_loss": 0.00018828414613381028, "global_step": 66091, "epoch": 555, "lr": 1.3765948834799647e-06} +{"train_loss": 0.00023778552713338286, "global_step": 66092, "epoch": 555, "lr": 1.3760786376515678e-06} +{"train_loss": 0.00017189295613206923, "global_step": 66093, "epoch": 555, "lr": 1.3755624872910433e-06} +{"train_loss": 0.00024818064412102103, "global_step": 66094, "epoch": 555, "lr": 1.3750464323994017e-06} +{"train_loss": 0.00018973246915265918, "global_step": 66095, "epoch": 555, "lr": 1.3745304729776697e-06} +{"train_loss": 0.0001429953845217824, "global_step": 66096, "epoch": 555, "lr": 1.374014609026847e-06} +{"train_loss": 0.00035725077032111585, "global_step": 66097, "epoch": 555, "lr": 1.3734988405479544e-06} +{"train_loss": 0.00026068027364090085, "global_step": 66098, "epoch": 555, "lr": 1.3729831675419967e-06} +{"train_loss": 0.00019453579443506896, "global_step": 66099, "epoch": 555, "lr": 1.372467590009996e-06} +{"train_loss": 0.00022212343174032867, "global_step": 66100, "epoch": 555, "lr": 1.3719521079529563e-06} +{"train_loss": 0.00016848788072820753, "global_step": 66101, "epoch": 555, "lr": 1.3714367213718994e-06} +{"train_loss": 0.00034457704168744385, "global_step": 66102, "epoch": 555, "lr": 1.370921430267824e-06} +{"train_loss": 0.00023356146994046867, "global_step": 66103, "epoch": 555, "lr": 1.370406234641758e-06} +{"train_loss": 0.00016841714386828244, "global_step": 66104, "epoch": 555, "lr": 1.3698911344946942e-06} +{"train_loss": 0.00030621467158198357, "global_step": 66105, "epoch": 555, "lr": 1.3693761298276652e-06} +{"train_loss": 0.0001855177542893216, "global_step": 66106, "epoch": 555, "lr": 1.3688612206416595e-06} +{"train_loss": 0.00019034148135688156, "global_step": 66107, "epoch": 555, "lr": 1.3683464069377094e-06} +{"train_loss": 0.00025147502310574055, "global_step": 66108, "epoch": 555, "lr": 1.367831688716803e-06} +{"train_loss": 0.00019136913761030883, "global_step": 66109, "epoch": 555, "lr": 1.3673170659799784e-06} +{"train_loss": 0.00032504682894796133, "global_step": 66110, "epoch": 555, "lr": 1.366802538728218e-06} +{"train_loss": 0.00024326487618964165, "global_step": 66111, "epoch": 555, "lr": 1.3662881069625545e-06} +{"train_loss": 0.00016697512182872742, "global_step": 66112, "epoch": 555, "lr": 1.3657737706839868e-06} +{"train_loss": 0.00034059019526466727, "global_step": 66113, "epoch": 555, "lr": 1.36525952989352e-06} +{"train_loss": 0.00026100577088072896, "global_step": 66114, "epoch": 555, "lr": 1.364745384592181e-06} +{"train_loss": 0.00022888134117238224, "global_step": 66115, "epoch": 555, "lr": 1.3642313347809578e-06} +{"train_loss": 0.00026609134511090815, "global_step": 66116, "epoch": 555, "lr": 1.363717380460877e-06} +{"train_loss": 0.00029186467872932553, "global_step": 66117, "epoch": 555, "lr": 1.3632035216329387e-06} +{"train_loss": 0.00041478528873994946, "global_step": 66118, "epoch": 555, "lr": 1.362689758298158e-06} +{"train_loss": 0.00023255434643942863, "global_step": 66119, "epoch": 555, "lr": 1.3621760904575343e-06} +{"train_loss": 0.00036750189610756934, "global_step": 66120, "epoch": 555, "lr": 1.3616625181120834e-06} +{"train_loss": 0.0002824607363436371, "global_step": 66121, "epoch": 555, "lr": 1.3611490412628158e-06} +{"train_loss": 0.0002449599269311875, "global_step": 66122, "epoch": 555, "lr": 1.3606356599107307e-06} +{"train_loss": 0.00020870790467597544, "global_step": 66123, "epoch": 555, "lr": 1.3601223740568437e-06} +{"train_loss": 0.0004173912457190454, "global_step": 66124, "epoch": 555, "lr": 1.3596091837021596e-06} +{"train_loss": 0.0002179119037464261, "global_step": 66125, "epoch": 555, "lr": 1.3590960888476833e-06} +{"train_loss": 0.00032462808303534985, "global_step": 66126, "epoch": 555, "lr": 1.3585830894944307e-06} +{"train_loss": 0.00021104284678585827, "global_step": 66127, "epoch": 555, "lr": 1.3580701856434008e-06} +{"train_loss": 0.00018853979418054223, "global_step": 66128, "epoch": 555, "lr": 1.3575573772956041e-06} +{"train_loss": 0.0001459061895729974, "global_step": 66129, "epoch": 555, "lr": 1.357044664452045e-06} +{"train_loss": 0.00017830934666562825, "global_step": 66130, "epoch": 555, "lr": 1.3565320471137344e-06} +{"train_loss": 0.0002750186249613762, "global_step": 66131, "epoch": 555, "lr": 1.3560195252816766e-06} +{"train_loss": 0.0005317089962773025, "global_step": 66132, "epoch": 555, "lr": 1.3555070989568708e-06} +{"train_loss": 0.00030202229390852153, "global_step": 66133, "epoch": 555, "lr": 1.354994768140333e-06} +{"train_loss": 0.0002054559881798923, "global_step": 66134, "epoch": 555, "lr": 1.3544825328330735e-06} +{"train_loss": 0.00019559921929612756, "global_step": 66135, "epoch": 555, "lr": 1.3539703930360804e-06} +{"train_loss": 0.00024114883854053915, "global_step": 66136, "epoch": 555, "lr": 1.3534583487503805e-06} +{"train_loss": 0.00015892687952145934, "global_step": 66137, "epoch": 555, "lr": 1.3529463999769564e-06} +{"train_loss": 0.00027471163775771856, "global_step": 66138, "epoch": 555, "lr": 1.3524345467168354e-06} +{"train_loss": 0.00037558082840405405, "global_step": 66139, "epoch": 555, "lr": 1.3519227889709996e-06} +{"train_loss": 0.00019974705355707556, "global_step": 66140, "epoch": 555, "lr": 1.351411126740476e-06} +{"train_loss": 0.00015768592129461467, "global_step": 66141, "epoch": 555, "lr": 1.350899560026253e-06} +{"train_loss": 0.00036958957207389176, "global_step": 66142, "epoch": 555, "lr": 1.3503880888293518e-06} +{"train_loss": 0.00021545993513427675, "global_step": 66143, "epoch": 555, "lr": 1.3498767131507605e-06} +{"train_loss": 0.00030244895606301725, "global_step": 66144, "epoch": 555, "lr": 1.349365432991484e-06} +{"train_loss": 0.00023971518385224044, "global_step": 66145, "epoch": 555, "lr": 1.3488542483525378e-06} +{"train_loss": 0.00032923443359322846, "global_step": 66146, "epoch": 555, "lr": 1.3483431592349104e-06} +{"train_loss": 0.0002575302205514163, "global_step": 66147, "epoch": 555, "lr": 1.347832165639623e-06} +{"train_loss": 0.00022640431416220963, "global_step": 66148, "epoch": 555, "lr": 1.3473212675676639e-06} +{"train_loss": 0.00019111405708827078, "global_step": 66149, "epoch": 555, "lr": 1.346810465020043e-06} +{"train_loss": 0.00026907710707746446, "global_step": 66150, "epoch": 555, "lr": 1.3462997579977654e-06} +{"train_loss": 0.00037171138683333993, "global_step": 66151, "epoch": 555, "lr": 1.3457891465018246e-06} +{"train_loss": 0.0003031972737517208, "global_step": 66152, "epoch": 555, "lr": 1.345278630533231e-06} +{"train_loss": 0.0001915083557832986, "global_step": 66153, "epoch": 555, "lr": 1.3447682100929838e-06} +{"train_loss": 0.0002285414666403085, "global_step": 66154, "epoch": 555, "lr": 1.3442578851820875e-06} +{"train_loss": 0.0003044883778784424, "global_step": 66155, "epoch": 555, "lr": 1.3437476558015472e-06} +{"train_loss": 0.0002593069220893085, "global_step": 66156, "epoch": 555, "lr": 1.3432375219523507e-06} +{"train_loss": 0.00024596008006483316, "global_step": 66157, "epoch": 555, "lr": 1.3427274836355141e-06} +{"train_loss": 0.000590211886446923, "global_step": 66158, "epoch": 555, "lr": 1.342217540852031e-06} +{"train_loss": 0.0001553123875055462, "global_step": 66159, "epoch": 555, "lr": 1.3417076936029116e-06} +{"train_loss": 0.00028724479489028454, "global_step": 66160, "epoch": 555, "lr": 1.341197941889144e-06} +{"train_loss": 0.0004971043090336025, "global_step": 66161, "epoch": 555, "lr": 1.3406882857117443e-06} +{"train_loss": 0.0002037316735368222, "global_step": 66162, "epoch": 555, "lr": 1.3401787250717002e-06} +{"train_loss": 0.00026847628050898553, "global_step": 66163, "epoch": 555, "lr": 1.3396692599700112e-06, "val_loss": 0.0196169912815094, "train_action_mse_error": 3.4182060062448727e-06} +{"train_loss": 0.000402971199946478, "global_step": 66164, "epoch": 556, "lr": 1.339159890407693e-06} +{"train_loss": 0.0003087875375058502, "global_step": 66165, "epoch": 556, "lr": 1.3386506163857227e-06} +{"train_loss": 0.0007051604334264994, "global_step": 66166, "epoch": 556, "lr": 1.3381414379051271e-06} +{"train_loss": 0.0004607253649737686, "global_step": 66167, "epoch": 556, "lr": 1.3376323549668834e-06} +{"train_loss": 0.0002090174675686285, "global_step": 66168, "epoch": 556, "lr": 1.3371233675719963e-06} +{"train_loss": 0.00025620832457207143, "global_step": 66169, "epoch": 556, "lr": 1.3366144757214761e-06} +{"train_loss": 0.00031540446798317134, "global_step": 66170, "epoch": 556, "lr": 1.3361056794163107e-06} +{"train_loss": 0.0003048291546292603, "global_step": 66171, "epoch": 556, "lr": 1.3355969786575106e-06} +{"train_loss": 0.00022857461590319872, "global_step": 66172, "epoch": 556, "lr": 1.3350883734460583e-06} +{"train_loss": 0.0005657841684296727, "global_step": 66173, "epoch": 556, "lr": 1.3345798637829642e-06} +{"train_loss": 0.00025370786897838116, "global_step": 66174, "epoch": 556, "lr": 1.3340714496692275e-06} +{"train_loss": 0.00017305795336142182, "global_step": 66175, "epoch": 556, "lr": 1.3335631311058304e-06} +{"train_loss": 0.00016199176025111228, "global_step": 66176, "epoch": 556, "lr": 1.3330549080937948e-06} +{"train_loss": 0.00029546284349635243, "global_step": 66177, "epoch": 556, "lr": 1.3325467806340974e-06} +{"train_loss": 0.00026310948305763304, "global_step": 66178, "epoch": 556, "lr": 1.332038748727754e-06} +{"train_loss": 0.00039676512824371457, "global_step": 66179, "epoch": 556, "lr": 1.3315308123757475e-06} +{"train_loss": 0.00023530614271294326, "global_step": 66180, "epoch": 556, "lr": 1.3310229715790824e-06} +{"train_loss": 0.00018442443979438394, "global_step": 66181, "epoch": 556, "lr": 1.3305152263387577e-06} +{"train_loss": 0.00015271053416654468, "global_step": 66182, "epoch": 556, "lr": 1.3300075766557563e-06} +{"train_loss": 0.00024945460609160364, "global_step": 66183, "epoch": 556, "lr": 1.329500022531094e-06} +{"train_loss": 0.00012736275675706565, "global_step": 66184, "epoch": 556, "lr": 1.3289925639657585e-06} +{"train_loss": 0.00037857407005503774, "global_step": 66185, "epoch": 556, "lr": 1.3284852009607441e-06} +{"train_loss": 0.00036077250842936337, "global_step": 66186, "epoch": 556, "lr": 1.3279779335170494e-06} +{"train_loss": 0.0002488593745511025, "global_step": 66187, "epoch": 556, "lr": 1.3274707616356685e-06} +{"train_loss": 0.00039522830047644675, "global_step": 66188, "epoch": 556, "lr": 1.3269636853176058e-06} +{"train_loss": 0.00013627827866002917, "global_step": 66189, "epoch": 556, "lr": 1.3264567045638442e-06} +{"train_loss": 0.00024894948001019657, "global_step": 66190, "epoch": 556, "lr": 1.3259498193753883e-06} +{"train_loss": 0.0001580666721565649, "global_step": 66191, "epoch": 556, "lr": 1.3254430297532206e-06} +{"train_loss": 0.00029958595405332744, "global_step": 66192, "epoch": 556, "lr": 1.3249363356983569e-06} +{"train_loss": 0.00015691084263380617, "global_step": 66193, "epoch": 556, "lr": 1.3244297372117798e-06} +{"train_loss": 0.00026213552337139845, "global_step": 66194, "epoch": 556, "lr": 1.3239232342944773e-06} +{"train_loss": 0.0004692163784056902, "global_step": 66195, "epoch": 556, "lr": 1.3234168269474546e-06} +{"train_loss": 0.00043717300286516547, "global_step": 66196, "epoch": 556, "lr": 1.322910515171699e-06} +{"train_loss": 0.0004084166430402547, "global_step": 66197, "epoch": 556, "lr": 1.3224042989682162e-06} +{"train_loss": 0.00015797508240211755, "global_step": 66198, "epoch": 556, "lr": 1.3218981783379824e-06} +{"train_loss": 0.00019045552471652627, "global_step": 66199, "epoch": 556, "lr": 1.3213921532820084e-06} +{"train_loss": 0.00036698035546578467, "global_step": 66200, "epoch": 556, "lr": 1.3208862238012765e-06} +{"train_loss": 0.0001821945479605347, "global_step": 66201, "epoch": 556, "lr": 1.3203803898967915e-06} +{"train_loss": 0.00025786765036173165, "global_step": 66202, "epoch": 556, "lr": 1.3198746515695305e-06} +{"train_loss": 0.0003589619300328195, "global_step": 66203, "epoch": 556, "lr": 1.3193690088204925e-06} +{"train_loss": 0.0003229225694667548, "global_step": 66204, "epoch": 556, "lr": 1.3188634616506823e-06} +{"train_loss": 0.00016902704373933375, "global_step": 66205, "epoch": 556, "lr": 1.318358010061077e-06} +{"train_loss": 0.00034122884972020984, "global_step": 66206, "epoch": 556, "lr": 1.3178526540526758e-06} +{"train_loss": 0.0002631915849633515, "global_step": 66207, "epoch": 556, "lr": 1.3173473936264725e-06} +{"train_loss": 0.00016165860870387405, "global_step": 66208, "epoch": 556, "lr": 1.3168422287834493e-06} +{"train_loss": 0.00033428616006858647, "global_step": 66209, "epoch": 556, "lr": 1.3163371595246166e-06} +{"train_loss": 0.0002507592143956572, "global_step": 66210, "epoch": 556, "lr": 1.315832185850946e-06} +{"train_loss": 0.00017935568757820874, "global_step": 66211, "epoch": 556, "lr": 1.315327307763442e-06} +{"train_loss": 0.0004206153389532119, "global_step": 66212, "epoch": 556, "lr": 1.314822525263093e-06} +{"train_loss": 0.00022698020620737225, "global_step": 66213, "epoch": 556, "lr": 1.3143178383508815e-06} +{"train_loss": 0.00024361327814403921, "global_step": 66214, "epoch": 556, "lr": 1.313813247027812e-06} +{"train_loss": 0.0002557982224971056, "global_step": 66215, "epoch": 556, "lr": 1.3133087512948673e-06} +{"train_loss": 0.00026609410997480154, "global_step": 66216, "epoch": 556, "lr": 1.3128043511530408e-06} +{"train_loss": 0.0002037868252955377, "global_step": 66217, "epoch": 556, "lr": 1.3123000466033154e-06} +{"train_loss": 0.00025391619419679046, "global_step": 66218, "epoch": 556, "lr": 1.3117958376466954e-06} +{"train_loss": 0.00019296925165690482, "global_step": 66219, "epoch": 556, "lr": 1.3112917242841583e-06} +{"train_loss": 0.0002450703759677708, "global_step": 66220, "epoch": 556, "lr": 1.3107877065166974e-06} +{"train_loss": 0.000216332045965828, "global_step": 66221, "epoch": 556, "lr": 1.3102837843453063e-06} +{"train_loss": 0.00016665934526827186, "global_step": 66222, "epoch": 556, "lr": 1.3097799577709679e-06} +{"train_loss": 0.00014994545199442655, "global_step": 66223, "epoch": 556, "lr": 1.3092762267946813e-06} +{"train_loss": 0.00040169694693759084, "global_step": 66224, "epoch": 556, "lr": 1.3087725914174232e-06} +{"train_loss": 0.000570078962482512, "global_step": 66225, "epoch": 556, "lr": 1.3082690516401874e-06} +{"train_loss": 0.00037806102773174644, "global_step": 66226, "epoch": 556, "lr": 1.3077656074639677e-06} +{"train_loss": 0.0002819871297106147, "global_step": 66227, "epoch": 556, "lr": 1.307262258889741e-06} +{"train_loss": 0.0003427404153626412, "global_step": 66228, "epoch": 556, "lr": 1.306759005918512e-06} +{"train_loss": 0.000296647718641907, "global_step": 66229, "epoch": 556, "lr": 1.3062558485512522e-06} +{"train_loss": 0.00031217941432259977, "global_step": 66230, "epoch": 556, "lr": 1.3057527867889607e-06} +{"train_loss": 0.00016872206469997764, "global_step": 66231, "epoch": 556, "lr": 1.3052498206326202e-06} +{"train_loss": 0.0001737195416353643, "global_step": 66232, "epoch": 556, "lr": 1.3047469500832187e-06} +{"train_loss": 0.00022945620003156364, "global_step": 66233, "epoch": 556, "lr": 1.3042441751417444e-06} +{"train_loss": 0.0002202631876571104, "global_step": 66234, "epoch": 556, "lr": 1.3037414958091909e-06} +{"train_loss": 0.00016475995653308928, "global_step": 66235, "epoch": 556, "lr": 1.3032389120865297e-06} +{"train_loss": 0.00022622400138061494, "global_step": 66236, "epoch": 556, "lr": 1.3027364239747597e-06} +{"train_loss": 0.00014000669762026519, "global_step": 66237, "epoch": 556, "lr": 1.3022340314748637e-06} +{"train_loss": 0.0001381038164254278, "global_step": 66238, "epoch": 556, "lr": 1.30173173458783e-06} +{"train_loss": 0.00045943516306579113, "global_step": 66239, "epoch": 556, "lr": 1.3012295333146408e-06} +{"train_loss": 0.0002854156191460788, "global_step": 66240, "epoch": 556, "lr": 1.3007274276562843e-06} +{"train_loss": 0.0006382090505212545, "global_step": 66241, "epoch": 556, "lr": 1.3002254176137485e-06} +{"train_loss": 0.00014686914801131934, "global_step": 66242, "epoch": 556, "lr": 1.2997235031880217e-06} +{"train_loss": 0.00024854199727997184, "global_step": 66243, "epoch": 556, "lr": 1.299221684380081e-06} +{"train_loss": 0.0004097376368008554, "global_step": 66244, "epoch": 556, "lr": 1.298719961190914e-06} +{"train_loss": 0.00023473873443435878, "global_step": 66245, "epoch": 556, "lr": 1.2982183336215092e-06} +{"train_loss": 0.0001734336547087878, "global_step": 66246, "epoch": 556, "lr": 1.2977168016728492e-06} +{"train_loss": 0.00024121349269989878, "global_step": 66247, "epoch": 556, "lr": 1.2972153653459162e-06} +{"train_loss": 0.0001637314271647483, "global_step": 66248, "epoch": 556, "lr": 1.2967140246416987e-06} +{"train_loss": 0.00021280960936564952, "global_step": 66249, "epoch": 556, "lr": 1.2962127795611844e-06} +{"train_loss": 0.00020506858709268272, "global_step": 66250, "epoch": 556, "lr": 1.2957116301053563e-06} +{"train_loss": 0.0001412884594174102, "global_step": 66251, "epoch": 556, "lr": 1.2952105762751855e-06} +{"train_loss": 0.00027169223176315427, "global_step": 66252, "epoch": 556, "lr": 1.294709618071671e-06} +{"train_loss": 0.00017522956477478147, "global_step": 66253, "epoch": 556, "lr": 1.2942087554957848e-06} +{"train_loss": 0.00024644803488627076, "global_step": 66254, "epoch": 556, "lr": 1.293707988548526e-06} +{"train_loss": 0.00018052580708172172, "global_step": 66255, "epoch": 556, "lr": 1.29320731723086e-06} +{"train_loss": 0.00028555619064718485, "global_step": 66256, "epoch": 556, "lr": 1.292706741543781e-06} +{"train_loss": 0.0003322541306260973, "global_step": 66257, "epoch": 556, "lr": 1.2922062614882713e-06} +{"train_loss": 0.00016307066834997386, "global_step": 66258, "epoch": 556, "lr": 1.2917058770653078e-06} +{"train_loss": 0.00019250538025517017, "global_step": 66259, "epoch": 556, "lr": 1.2912055882758788e-06} +{"train_loss": 0.0001600699033588171, "global_step": 66260, "epoch": 556, "lr": 1.2907053951209558e-06} +{"train_loss": 0.00039172900142148137, "global_step": 66261, "epoch": 556, "lr": 1.2902052976015378e-06} +{"train_loss": 0.00015261798398569226, "global_step": 66262, "epoch": 556, "lr": 1.2897052957185962e-06} +{"train_loss": 0.00017000027582980692, "global_step": 66263, "epoch": 556, "lr": 1.2892053894731082e-06} +{"train_loss": 0.0002695296425372362, "global_step": 66264, "epoch": 556, "lr": 1.2887055788660674e-06} +{"train_loss": 0.00036088351043872535, "global_step": 66265, "epoch": 556, "lr": 1.288205863898445e-06} +{"train_loss": 0.00023232332023326308, "global_step": 66266, "epoch": 556, "lr": 1.2877062445712297e-06} +{"train_loss": 0.00040523309144191444, "global_step": 66267, "epoch": 556, "lr": 1.2872067208853978e-06} +{"train_loss": 0.00025564408861100674, "global_step": 66268, "epoch": 556, "lr": 1.2867072928419322e-06} +{"train_loss": 0.0002049748582066968, "global_step": 66269, "epoch": 556, "lr": 1.2862079604418153e-06} +{"train_loss": 0.00039661271148361266, "global_step": 66270, "epoch": 556, "lr": 1.2857087236860188e-06} +{"train_loss": 0.0002771932340692729, "global_step": 66271, "epoch": 556, "lr": 1.2852095825755305e-06} +{"train_loss": 0.00021411797206383198, "global_step": 66272, "epoch": 556, "lr": 1.2847105371113276e-06} +{"train_loss": 0.001171368989162147, "global_step": 66273, "epoch": 556, "lr": 1.2842115872943983e-06} +{"train_loss": 0.0002148751518689096, "global_step": 66274, "epoch": 556, "lr": 1.2837127331257082e-06} +{"train_loss": 0.0003515864082146436, "global_step": 66275, "epoch": 556, "lr": 1.2832139746062455e-06} +{"train_loss": 0.00016950207646004856, "global_step": 66276, "epoch": 556, "lr": 1.2827153117369872e-06} +{"train_loss": 0.0002917987294495106, "global_step": 66277, "epoch": 556, "lr": 1.2822167445189103e-06} +{"train_loss": 0.0003588166437111795, "global_step": 66278, "epoch": 556, "lr": 1.281718272953003e-06} +{"train_loss": 0.0001488171110395342, "global_step": 66279, "epoch": 556, "lr": 1.281219897040231e-06} +{"train_loss": 0.0002472625346854329, "global_step": 66280, "epoch": 556, "lr": 1.2807216167815829e-06} +{"train_loss": 0.00016960484208539128, "global_step": 66281, "epoch": 556, "lr": 1.2802234321780348e-06} +{"train_loss": 0.00027694217415581295, "global_step": 66282, "epoch": 556, "lr": 1.2797253432305534e-06, "val_loss": 0.013596741482615471} +{"train_loss": 0.00022768117196392268, "global_step": 66283, "epoch": 557, "lr": 1.2792273499401375e-06} +{"train_loss": 0.0002648451772984117, "global_step": 66284, "epoch": 557, "lr": 1.278729452307742e-06} +{"train_loss": 0.00027900224085897207, "global_step": 66285, "epoch": 557, "lr": 1.2782316503343662e-06} +{"train_loss": 0.0005331204738467932, "global_step": 66286, "epoch": 557, "lr": 1.2777339440209702e-06} +{"train_loss": 0.0002918925310950726, "global_step": 66287, "epoch": 557, "lr": 1.2772363333685479e-06} +{"train_loss": 0.0001699805579846725, "global_step": 66288, "epoch": 557, "lr": 1.2767388183780594e-06} +{"train_loss": 0.00032318150624632835, "global_step": 66289, "epoch": 557, "lr": 1.2762413990504873e-06} +{"train_loss": 0.0001759554579621181, "global_step": 66290, "epoch": 557, "lr": 1.2757440753868143e-06} +{"train_loss": 0.0001681003050180152, "global_step": 66291, "epoch": 557, "lr": 1.275246847388012e-06} +{"train_loss": 0.00021139999444130808, "global_step": 66292, "epoch": 557, "lr": 1.274749715055057e-06} +{"train_loss": 0.0003754350764211267, "global_step": 66293, "epoch": 557, "lr": 1.2742526783889263e-06} +{"train_loss": 0.000308709975797683, "global_step": 66294, "epoch": 557, "lr": 1.2737557373905917e-06} +{"train_loss": 0.00021673965966328979, "global_step": 66295, "epoch": 557, "lr": 1.2732588920610356e-06} +{"train_loss": 0.0002716676681302488, "global_step": 66296, "epoch": 557, "lr": 1.2727621424012236e-06} +{"train_loss": 0.00042988796485587955, "global_step": 66297, "epoch": 557, "lr": 1.2722654884121442e-06} +{"train_loss": 0.00012594320287462324, "global_step": 66298, "epoch": 557, "lr": 1.2717689300947578e-06} +{"train_loss": 0.00021941069280728698, "global_step": 66299, "epoch": 557, "lr": 1.2712724674500576e-06} +{"train_loss": 0.0001775489072315395, "global_step": 66300, "epoch": 557, "lr": 1.2707761004789987e-06} +{"train_loss": 0.00013726386532653123, "global_step": 66301, "epoch": 557, "lr": 1.270279829182569e-06} +{"train_loss": 0.0001445174275431782, "global_step": 66302, "epoch": 557, "lr": 1.2697836535617402e-06} +{"train_loss": 0.000218728935578838, "global_step": 66303, "epoch": 557, "lr": 1.2692875736174781e-06} +{"train_loss": 0.00020364875672385097, "global_step": 66304, "epoch": 557, "lr": 1.2687915893507762e-06} +{"train_loss": 0.00029818512848578393, "global_step": 66305, "epoch": 557, "lr": 1.268295700762584e-06} +{"train_loss": 0.00019676507508847862, "global_step": 66306, "epoch": 557, "lr": 1.267799907853895e-06} +{"train_loss": 0.0003800680278800428, "global_step": 66307, "epoch": 557, "lr": 1.267304210625675e-06} +{"train_loss": 0.00030979429720900953, "global_step": 66308, "epoch": 557, "lr": 1.26680860907889e-06} +{"train_loss": 0.00025608541909605265, "global_step": 66309, "epoch": 557, "lr": 1.2663131032145226e-06} +{"train_loss": 0.00016522435180377215, "global_step": 66310, "epoch": 557, "lr": 1.2658176930335441e-06} +{"train_loss": 0.00023047324793878943, "global_step": 66311, "epoch": 557, "lr": 1.2653223785369262e-06} +{"train_loss": 0.0002734943409450352, "global_step": 66312, "epoch": 557, "lr": 1.2648271597256456e-06} +{"train_loss": 0.0002171978703700006, "global_step": 66313, "epoch": 557, "lr": 1.264332036600663e-06} +{"train_loss": 0.00029885218827985227, "global_step": 66314, "epoch": 557, "lr": 1.2638370091629604e-06} +{"train_loss": 0.0003777621896006167, "global_step": 66315, "epoch": 557, "lr": 1.263342077413504e-06} +{"train_loss": 0.0006339221727102995, "global_step": 66316, "epoch": 557, "lr": 1.2628472413532766e-06} +{"train_loss": 0.0004236262757331133, "global_step": 66317, "epoch": 557, "lr": 1.2623525009832327e-06} +{"train_loss": 0.00016882769705262035, "global_step": 66318, "epoch": 557, "lr": 1.2618578563043603e-06} +{"train_loss": 0.00019267226161900908, "global_step": 66319, "epoch": 557, "lr": 1.2613633073176256e-06} +{"train_loss": 0.00025729386834427714, "global_step": 66320, "epoch": 557, "lr": 1.2608688540239888e-06} +{"train_loss": 0.0002316530590178445, "global_step": 66321, "epoch": 557, "lr": 1.2603744964244324e-06} +{"train_loss": 0.00045240321196615696, "global_step": 66322, "epoch": 557, "lr": 1.2598802345199222e-06} +{"train_loss": 0.00040015505510382354, "global_step": 66323, "epoch": 557, "lr": 1.2593860683114301e-06} +{"train_loss": 0.00023647821217309684, "global_step": 66324, "epoch": 557, "lr": 1.2588919977999324e-06} +{"train_loss": 0.00034039089223369956, "global_step": 66325, "epoch": 557, "lr": 1.2583980229863846e-06} +{"train_loss": 0.0002857479848898947, "global_step": 66326, "epoch": 557, "lr": 1.2579041438717686e-06} +{"train_loss": 0.00020251513342373073, "global_step": 66327, "epoch": 557, "lr": 1.2574103604570453e-06} +{"train_loss": 0.0005494605866260827, "global_step": 66328, "epoch": 557, "lr": 1.256916672743197e-06} +{"train_loss": 0.00019624580454546958, "global_step": 66329, "epoch": 557, "lr": 1.2564230807311783e-06} +{"train_loss": 0.0002511808997951448, "global_step": 66330, "epoch": 557, "lr": 1.255929584421972e-06} +{"train_loss": 0.0003512219700496644, "global_step": 66331, "epoch": 557, "lr": 1.2554361838165384e-06} +{"train_loss": 0.00027239436167292297, "global_step": 66332, "epoch": 557, "lr": 1.254942878915849e-06} +{"train_loss": 0.0003980762558057904, "global_step": 66333, "epoch": 557, "lr": 1.2544496697208696e-06} +{"train_loss": 0.00018226885003969073, "global_step": 66334, "epoch": 557, "lr": 1.2539565562325717e-06} +{"train_loss": 0.00020649695943575352, "global_step": 66335, "epoch": 557, "lr": 1.2534635384519211e-06} +{"train_loss": 0.0003113020211458206, "global_step": 66336, "epoch": 557, "lr": 1.2529706163798837e-06} +{"train_loss": 0.00015438481932505965, "global_step": 66337, "epoch": 557, "lr": 1.2524777900174368e-06} +{"train_loss": 0.00026795000303536654, "global_step": 66338, "epoch": 557, "lr": 1.2519850593655402e-06} +{"train_loss": 0.0002571656950749457, "global_step": 66339, "epoch": 557, "lr": 1.2514924244251602e-06} +{"train_loss": 0.0002475449291523546, "global_step": 66340, "epoch": 557, "lr": 1.2509998851972738e-06} +{"train_loss": 0.00038176143425516784, "global_step": 66341, "epoch": 557, "lr": 1.2505074416828355e-06} +{"train_loss": 0.0002241596084786579, "global_step": 66342, "epoch": 557, "lr": 1.2500150938828225e-06} +{"train_loss": 0.00024899569689296186, "global_step": 66343, "epoch": 557, "lr": 1.2495228417981952e-06} +{"train_loss": 0.00020497225341387093, "global_step": 66344, "epoch": 557, "lr": 1.249030685429914e-06} +{"train_loss": 0.000213011764572002, "global_step": 66345, "epoch": 557, "lr": 1.248538624778961e-06} +{"train_loss": 0.0003963678900618106, "global_step": 66346, "epoch": 557, "lr": 1.2480466598462915e-06} +{"train_loss": 0.00023184966994449496, "global_step": 66347, "epoch": 557, "lr": 1.247554790632871e-06} +{"train_loss": 0.0006747196894139051, "global_step": 66348, "epoch": 557, "lr": 1.2470630171396714e-06} +{"train_loss": 0.0004772055835928768, "global_step": 66349, "epoch": 557, "lr": 1.2465713393676582e-06} +{"train_loss": 0.00017110511544160545, "global_step": 66350, "epoch": 557, "lr": 1.246079757317792e-06} +{"train_loss": 0.0005811758455820382, "global_step": 66351, "epoch": 557, "lr": 1.2455882709910328e-06} +{"train_loss": 0.00020809893612749875, "global_step": 66352, "epoch": 557, "lr": 1.2450968803883579e-06} +{"train_loss": 0.00023845682153478265, "global_step": 66353, "epoch": 557, "lr": 1.2446055855107276e-06} +{"train_loss": 0.00024709486751817167, "global_step": 66354, "epoch": 557, "lr": 1.2441143863591021e-06} +{"train_loss": 0.0004986628191545606, "global_step": 66355, "epoch": 557, "lr": 1.243623282934453e-06} +{"train_loss": 0.0002811098820529878, "global_step": 66356, "epoch": 557, "lr": 1.2431322752377406e-06} +{"train_loss": 0.0003745981666725129, "global_step": 66357, "epoch": 557, "lr": 1.2426413632699252e-06} +{"train_loss": 0.00023894020705483854, "global_step": 66358, "epoch": 557, "lr": 1.2421505470319783e-06} +{"train_loss": 0.00017833437595982105, "global_step": 66359, "epoch": 557, "lr": 1.2416598265248602e-06} +{"train_loss": 0.0002953247167170048, "global_step": 66360, "epoch": 557, "lr": 1.2411692017495257e-06} +{"train_loss": 0.0002445644640829414, "global_step": 66361, "epoch": 557, "lr": 1.2406786727069574e-06} +{"train_loss": 0.00022661803814116865, "global_step": 66362, "epoch": 557, "lr": 1.2401882393981046e-06} +{"train_loss": 0.00018258120690006763, "global_step": 66363, "epoch": 557, "lr": 1.2396979018239274e-06} +{"train_loss": 0.00021091432427056134, "global_step": 66364, "epoch": 557, "lr": 1.2392076599853975e-06} +{"train_loss": 0.0002901871339417994, "global_step": 66365, "epoch": 557, "lr": 1.238717513883475e-06} +{"train_loss": 0.0004907287075184286, "global_step": 66366, "epoch": 557, "lr": 1.238227463519115e-06} +{"train_loss": 0.0002651605464052409, "global_step": 66367, "epoch": 557, "lr": 1.237737508893294e-06} +{"train_loss": 0.0002119320706697181, "global_step": 66368, "epoch": 557, "lr": 1.2372476500069618e-06} +{"train_loss": 0.0002725662779994309, "global_step": 66369, "epoch": 557, "lr": 1.2367578868610895e-06} +{"train_loss": 0.00022276706295087934, "global_step": 66370, "epoch": 557, "lr": 1.2362682194566267e-06} +{"train_loss": 0.0002201785973738879, "global_step": 66371, "epoch": 557, "lr": 1.2357786477945443e-06} +{"train_loss": 0.00021778402151539922, "global_step": 66372, "epoch": 557, "lr": 1.2352891718757976e-06} +{"train_loss": 0.0008489239262416959, "global_step": 66373, "epoch": 557, "lr": 1.2347997917013577e-06} +{"train_loss": 0.00024459423730149865, "global_step": 66374, "epoch": 557, "lr": 1.2343105072721738e-06} +{"train_loss": 0.00032122136326506734, "global_step": 66375, "epoch": 557, "lr": 1.2338213185892122e-06} +{"train_loss": 0.00037929622340016067, "global_step": 66376, "epoch": 557, "lr": 1.2333322256534385e-06} +{"train_loss": 0.00013530229625757784, "global_step": 66377, "epoch": 557, "lr": 1.2328432284657965e-06} +{"train_loss": 0.0002677170850802213, "global_step": 66378, "epoch": 557, "lr": 1.2323543270272686e-06} +{"train_loss": 0.00020500605751294643, "global_step": 66379, "epoch": 557, "lr": 1.231865521338793e-06} +{"train_loss": 0.00028217863291502, "global_step": 66380, "epoch": 557, "lr": 1.2313768114013414e-06} +{"train_loss": 0.00022825611813459545, "global_step": 66381, "epoch": 557, "lr": 1.2308881972158793e-06} +{"train_loss": 0.00021242645743768662, "global_step": 66382, "epoch": 557, "lr": 1.230399678783345e-06} +{"train_loss": 0.00035408008261583745, "global_step": 66383, "epoch": 557, "lr": 1.229911256104721e-06} +{"train_loss": 0.0006558698951266706, "global_step": 66384, "epoch": 557, "lr": 1.2294229291809511e-06} +{"train_loss": 0.00013898839824832976, "global_step": 66385, "epoch": 557, "lr": 1.2289346980130012e-06} +{"train_loss": 0.000244714057771489, "global_step": 66386, "epoch": 557, "lr": 1.2284465626018204e-06} +{"train_loss": 0.0003987274831160903, "global_step": 66387, "epoch": 557, "lr": 1.227958522948386e-06} +{"train_loss": 0.0005291884299367666, "global_step": 66388, "epoch": 557, "lr": 1.2274705790536411e-06} +{"train_loss": 0.00019833851547446102, "global_step": 66389, "epoch": 557, "lr": 1.226982730918541e-06} +{"train_loss": 0.00016920342750381678, "global_step": 66390, "epoch": 557, "lr": 1.2264949785440571e-06} +{"train_loss": 0.0004817499138880521, "global_step": 66391, "epoch": 557, "lr": 1.226007321931133e-06} +{"train_loss": 0.0003620924544520676, "global_step": 66392, "epoch": 557, "lr": 1.2255197610807345e-06} +{"train_loss": 0.00017376019968651235, "global_step": 66393, "epoch": 557, "lr": 1.2250322959938221e-06} +{"train_loss": 0.00014115664816927165, "global_step": 66394, "epoch": 557, "lr": 1.2245449266713393e-06} +{"train_loss": 0.00023842127120587975, "global_step": 66395, "epoch": 557, "lr": 1.2240576531142633e-06} +{"train_loss": 0.0003528852539602667, "global_step": 66396, "epoch": 557, "lr": 1.2235704753235267e-06} +{"train_loss": 0.0004847879463341087, "global_step": 66397, "epoch": 557, "lr": 1.2230833933001063e-06} +{"train_loss": 0.00029458742938004434, "global_step": 66398, "epoch": 557, "lr": 1.2225964070449458e-06} +{"train_loss": 0.00016255905211437494, "global_step": 66399, "epoch": 557, "lr": 1.2221095165590057e-06} +{"train_loss": 0.00019206183787900954, "global_step": 66400, "epoch": 557, "lr": 1.2216227218432463e-06} +{"train_loss": 0.0002874674246413633, "global_step": 66401, "epoch": 557, "lr": 1.2211360228986169e-06, "val_loss": 0.01628539152443409} +{"train_loss": 0.00011392822489142418, "global_step": 66402, "epoch": 558, "lr": 1.2206494197260832e-06} +{"train_loss": 0.00036722823278978467, "global_step": 66403, "epoch": 558, "lr": 1.2201629123265834e-06} +{"train_loss": 0.00030552304815500975, "global_step": 66404, "epoch": 558, "lr": 1.219676500701089e-06} +{"train_loss": 0.0002705182123463601, "global_step": 66405, "epoch": 558, "lr": 1.2191901848505438e-06} +{"train_loss": 0.0002804220712278038, "global_step": 66406, "epoch": 558, "lr": 1.218703964775908e-06} +{"train_loss": 0.00017431561718694866, "global_step": 66407, "epoch": 558, "lr": 1.218217840478142e-06} +{"train_loss": 0.0003911461099050939, "global_step": 66408, "epoch": 558, "lr": 1.2177318119581837e-06} +{"train_loss": 0.0003407546610105783, "global_step": 66409, "epoch": 558, "lr": 1.217245879217005e-06} +{"train_loss": 0.0005012537585571408, "global_step": 66410, "epoch": 558, "lr": 1.2167600422555435e-06} +{"train_loss": 0.0003689273144118488, "global_step": 66411, "epoch": 558, "lr": 1.2162743010747712e-06} +{"train_loss": 0.00032969258609227836, "global_step": 66412, "epoch": 558, "lr": 1.2157886556756315e-06} +{"train_loss": 0.00022485258523374796, "global_step": 66413, "epoch": 558, "lr": 1.2153031060590736e-06} +{"train_loss": 0.00033881457056850195, "global_step": 66414, "epoch": 558, "lr": 1.2148176522260634e-06} +{"train_loss": 0.0002748396364040673, "global_step": 66415, "epoch": 558, "lr": 1.2143322941775392e-06} +{"train_loss": 0.0003828431072179228, "global_step": 66416, "epoch": 558, "lr": 1.2138470319144669e-06} +{"train_loss": 0.00031509282416664064, "global_step": 66417, "epoch": 558, "lr": 1.2133618654377898e-06} +{"train_loss": 0.00045217794831842184, "global_step": 66418, "epoch": 558, "lr": 1.2128767947484688e-06} +{"train_loss": 0.0001554911577841267, "global_step": 66419, "epoch": 558, "lr": 1.2123918198474525e-06} +{"train_loss": 0.00019515369785949588, "global_step": 66420, "epoch": 558, "lr": 1.2119069407356854e-06} +{"train_loss": 0.0003558332391548902, "global_step": 66421, "epoch": 558, "lr": 1.2114221574141326e-06} +{"train_loss": 0.00029207946499809623, "global_step": 66422, "epoch": 558, "lr": 1.2109374698837383e-06} +{"train_loss": 0.0007017567986622453, "global_step": 66423, "epoch": 558, "lr": 1.2104528781454572e-06} +{"train_loss": 0.0001335837150691077, "global_step": 66424, "epoch": 558, "lr": 1.2099683822002383e-06} +{"train_loss": 0.0001632965140743181, "global_step": 66425, "epoch": 558, "lr": 1.2094839820490366e-06} +{"train_loss": 0.0006383129511959851, "global_step": 66426, "epoch": 558, "lr": 1.2089996776928014e-06} +{"train_loss": 0.00036999385338276625, "global_step": 66427, "epoch": 558, "lr": 1.2085154691324762e-06} +{"train_loss": 0.0005893050110898912, "global_step": 66428, "epoch": 558, "lr": 1.2080313563690215e-06} +{"train_loss": 0.00012105494533898309, "global_step": 66429, "epoch": 558, "lr": 1.2075473394033865e-06} +{"train_loss": 0.00022569450084120035, "global_step": 66430, "epoch": 558, "lr": 1.2070634182365203e-06} +{"train_loss": 0.0002166640479117632, "global_step": 66431, "epoch": 558, "lr": 1.2065795928693668e-06} +{"train_loss": 0.0003023727040272206, "global_step": 66432, "epoch": 558, "lr": 1.2060958633028862e-06} +{"train_loss": 0.00018775401986204088, "global_step": 66433, "epoch": 558, "lr": 1.2056122295380224e-06} +{"train_loss": 0.00048424035776406527, "global_step": 66434, "epoch": 558, "lr": 1.2051286915757187e-06} +{"train_loss": 0.00021694751922041178, "global_step": 66435, "epoch": 558, "lr": 1.2046452494169414e-06} +{"train_loss": 0.0003737851220648736, "global_step": 66436, "epoch": 558, "lr": 1.2041619030626284e-06} +{"train_loss": 0.0002387340209679678, "global_step": 66437, "epoch": 558, "lr": 1.203678652513729e-06} +{"train_loss": 0.00012246074038557708, "global_step": 66438, "epoch": 558, "lr": 1.203195497771198e-06} +{"train_loss": 0.0001655334490351379, "global_step": 66439, "epoch": 558, "lr": 1.2027124388359734e-06} +{"train_loss": 0.00014944102440495044, "global_step": 66440, "epoch": 558, "lr": 1.2022294757090157e-06} +{"train_loss": 0.0002291011915076524, "global_step": 66441, "epoch": 558, "lr": 1.2017466083912576e-06} +{"train_loss": 0.00028386746998876333, "global_step": 66442, "epoch": 558, "lr": 1.201263836883665e-06} +{"train_loss": 0.000327141082379967, "global_step": 66443, "epoch": 558, "lr": 1.2007811611871756e-06} +{"train_loss": 0.0002903769491240382, "global_step": 66444, "epoch": 558, "lr": 1.200298581302739e-06} +{"train_loss": 0.0003362550924066454, "global_step": 66445, "epoch": 558, "lr": 1.1998160972313044e-06} +{"train_loss": 0.00024079538707155734, "global_step": 66446, "epoch": 558, "lr": 1.1993337089738156e-06} +{"train_loss": 0.00013508653501048684, "global_step": 66447, "epoch": 558, "lr": 1.1988514165312214e-06} +{"train_loss": 0.0002312319411430508, "global_step": 66448, "epoch": 558, "lr": 1.198369219904466e-06} +{"train_loss": 0.0003267516731284559, "global_step": 66449, "epoch": 558, "lr": 1.197887119094504e-06} +{"train_loss": 0.0005337002803571522, "global_step": 66450, "epoch": 558, "lr": 1.1974051141022736e-06} +{"train_loss": 0.00017477832443546504, "global_step": 66451, "epoch": 558, "lr": 1.1969232049287238e-06} +{"train_loss": 0.000191097758943215, "global_step": 66452, "epoch": 558, "lr": 1.196441391574804e-06} +{"train_loss": 0.0003932789259124547, "global_step": 66453, "epoch": 558, "lr": 1.1959596740414524e-06} +{"train_loss": 0.0003750744799617678, "global_step": 66454, "epoch": 558, "lr": 1.1954780523296295e-06} +{"train_loss": 0.0007001072517596185, "global_step": 66455, "epoch": 558, "lr": 1.1949965264402618e-06} +{"train_loss": 0.00026350258849561214, "global_step": 66456, "epoch": 558, "lr": 1.19451509637431e-06} +{"train_loss": 0.00032065968844108284, "global_step": 66457, "epoch": 558, "lr": 1.194033762132718e-06} +{"train_loss": 0.00014744765940122306, "global_step": 66458, "epoch": 558, "lr": 1.193552523716418e-06} +{"train_loss": 0.00018099603767041117, "global_step": 66459, "epoch": 558, "lr": 1.193071381126365e-06} +{"train_loss": 0.00015312028699554503, "global_step": 66460, "epoch": 558, "lr": 1.1925903343635026e-06} +{"train_loss": 0.0003889384097419679, "global_step": 66461, "epoch": 558, "lr": 1.1921093834287745e-06} +{"train_loss": 0.0004372842377051711, "global_step": 66462, "epoch": 558, "lr": 1.1916285283231243e-06} +{"train_loss": 0.00026419773348607123, "global_step": 66463, "epoch": 558, "lr": 1.1911477690475015e-06} +{"train_loss": 0.0005345383542589843, "global_step": 66464, "epoch": 558, "lr": 1.190667105602844e-06} +{"train_loss": 0.00018292473396286368, "global_step": 66465, "epoch": 558, "lr": 1.1901865379900956e-06} +{"train_loss": 0.0007440109620802104, "global_step": 66466, "epoch": 558, "lr": 1.1897060662102e-06} +{"train_loss": 0.0005808858550153673, "global_step": 66467, "epoch": 558, "lr": 1.1892256902641064e-06} +{"train_loss": 0.00018409505719318986, "global_step": 66468, "epoch": 558, "lr": 1.1887454101527473e-06} +{"train_loss": 0.00020962422422599047, "global_step": 66469, "epoch": 558, "lr": 1.1882652258770777e-06} +{"train_loss": 0.00034200071240775287, "global_step": 66470, "epoch": 558, "lr": 1.18778513743803e-06} +{"train_loss": 0.0002489119942765683, "global_step": 66471, "epoch": 558, "lr": 1.187305144836559e-06} +{"train_loss": 0.0003296046343166381, "global_step": 66472, "epoch": 558, "lr": 1.186825248073592e-06} +{"train_loss": 0.00017966298037208617, "global_step": 66473, "epoch": 558, "lr": 1.1863454471500834e-06} +{"train_loss": 0.00022353068925440311, "global_step": 66474, "epoch": 558, "lr": 1.1858657420669605e-06} +{"train_loss": 0.00014758433098904788, "global_step": 66475, "epoch": 558, "lr": 1.1853861328251892e-06} +{"train_loss": 0.00022208296286407858, "global_step": 66476, "epoch": 558, "lr": 1.1849066194256909e-06} +{"train_loss": 0.00031148031121119857, "global_step": 66477, "epoch": 558, "lr": 1.1844272018694092e-06} +{"train_loss": 0.00021805890719406307, "global_step": 66478, "epoch": 558, "lr": 1.183947880157299e-06} +{"train_loss": 0.0003127289528492838, "global_step": 66479, "epoch": 558, "lr": 1.1834686542902818e-06} +{"train_loss": 0.00022736757819075137, "global_step": 66480, "epoch": 558, "lr": 1.1829895242693178e-06} +{"train_loss": 0.00032081655808724463, "global_step": 66481, "epoch": 558, "lr": 1.1825104900953342e-06} +{"train_loss": 0.00042041586129926145, "global_step": 66482, "epoch": 558, "lr": 1.1820315517692748e-06} +{"train_loss": 0.00031344540184363723, "global_step": 66483, "epoch": 558, "lr": 1.1815527092920831e-06} +{"train_loss": 0.00043496291618794203, "global_step": 66484, "epoch": 558, "lr": 1.1810739626646915e-06} +{"train_loss": 0.0003394553787074983, "global_step": 66485, "epoch": 558, "lr": 1.1805953118880552e-06} +{"train_loss": 0.00015582946070935577, "global_step": 66486, "epoch": 558, "lr": 1.1801167569630955e-06} +{"train_loss": 0.00026048565632663667, "global_step": 66487, "epoch": 558, "lr": 1.1796382978907672e-06} +{"train_loss": 0.00024307258718181401, "global_step": 66488, "epoch": 558, "lr": 1.179159934672003e-06} +{"train_loss": 0.00020601952564902604, "global_step": 66489, "epoch": 558, "lr": 1.1786816673077405e-06} +{"train_loss": 0.0002595595142338425, "global_step": 66490, "epoch": 558, "lr": 1.1782034957989186e-06} +{"train_loss": 0.0002552747610025108, "global_step": 66491, "epoch": 558, "lr": 1.1777254201464804e-06} +{"train_loss": 0.0006364687578752637, "global_step": 66492, "epoch": 558, "lr": 1.1772474403513644e-06} +{"train_loss": 0.0002123474987456575, "global_step": 66493, "epoch": 558, "lr": 1.1767695564145032e-06} +{"train_loss": 0.0002428310108371079, "global_step": 66494, "epoch": 558, "lr": 1.17629176833684e-06} +{"train_loss": 0.00030215061269700527, "global_step": 66495, "epoch": 558, "lr": 1.1758140761193138e-06} +{"train_loss": 0.0001324439508607611, "global_step": 66496, "epoch": 558, "lr": 1.1753364797628619e-06} +{"train_loss": 0.0005668022204190493, "global_step": 66497, "epoch": 558, "lr": 1.1748589792684173e-06} +{"train_loss": 0.0006226504920050502, "global_step": 66498, "epoch": 558, "lr": 1.1743815746369235e-06} +{"train_loss": 0.00033864466240629554, "global_step": 66499, "epoch": 558, "lr": 1.1739042658693078e-06} +{"train_loss": 0.0004044566594529897, "global_step": 66500, "epoch": 558, "lr": 1.1734270529665247e-06} +{"train_loss": 0.00024377451336476952, "global_step": 66501, "epoch": 558, "lr": 1.172949935929496e-06} +{"train_loss": 0.0002514583757147193, "global_step": 66502, "epoch": 558, "lr": 1.1724729147591651e-06} +{"train_loss": 0.00024923670571297407, "global_step": 66503, "epoch": 558, "lr": 1.1719959894564647e-06} +{"train_loss": 0.00031892090919427574, "global_step": 66504, "epoch": 558, "lr": 1.1715191600223386e-06} +{"train_loss": 0.00018059261492453516, "global_step": 66505, "epoch": 558, "lr": 1.1710424264577136e-06} +{"train_loss": 0.00040747266029939055, "global_step": 66506, "epoch": 558, "lr": 1.1705657887635336e-06} +{"train_loss": 0.00021008186740800738, "global_step": 66507, "epoch": 558, "lr": 1.1700892469407309e-06} +{"train_loss": 0.0002027408336289227, "global_step": 66508, "epoch": 558, "lr": 1.1696128009902385e-06} +{"train_loss": 0.00032361585181206465, "global_step": 66509, "epoch": 558, "lr": 1.169136450913e-06} +{"train_loss": 0.0003462883469182998, "global_step": 66510, "epoch": 558, "lr": 1.1686601967099364e-06} +{"train_loss": 0.00020774434960912913, "global_step": 66511, "epoch": 558, "lr": 1.1681840383819975e-06} +{"train_loss": 0.00035862938966602087, "global_step": 66512, "epoch": 558, "lr": 1.1677079759301157e-06} +{"train_loss": 0.00014575458772014827, "global_step": 66513, "epoch": 558, "lr": 1.1672320093552126e-06} +{"train_loss": 0.0002786926634144038, "global_step": 66514, "epoch": 558, "lr": 1.1667561386582426e-06} +{"train_loss": 0.00022051919950172305, "global_step": 66515, "epoch": 558, "lr": 1.166280363840122e-06} +{"train_loss": 0.00030889222398400307, "global_step": 66516, "epoch": 558, "lr": 1.1658046849017944e-06} +{"train_loss": 0.00022808935318607837, "global_step": 66517, "epoch": 558, "lr": 1.1653291018441925e-06} +{"train_loss": 0.00020239719015080482, "global_step": 66518, "epoch": 558, "lr": 1.1648536146682543e-06} +{"train_loss": 0.00029665237525478005, "global_step": 66519, "epoch": 558, "lr": 1.1643782233749069e-06} +{"train_loss": 0.00030222919970377104, "global_step": 66520, "epoch": 558, "lr": 1.1639029279650826e-06, "val_loss": 0.04512300714850426} +{"train_loss": 0.00029373200959526, "global_step": 66521, "epoch": 559, "lr": 1.16342772843972e-06} +{"train_loss": 0.0003738072991836816, "global_step": 66522, "epoch": 559, "lr": 1.1629526247997459e-06} +{"train_loss": 0.00016873890126589686, "global_step": 66523, "epoch": 559, "lr": 1.1624776170460982e-06} +{"train_loss": 0.0001848341489676386, "global_step": 66524, "epoch": 559, "lr": 1.16200270517971e-06} +{"train_loss": 0.00030418424285016954, "global_step": 66525, "epoch": 559, "lr": 1.1615278892015137e-06} +{"train_loss": 0.00015128031373023987, "global_step": 66526, "epoch": 559, "lr": 1.161053169112436e-06} +{"train_loss": 0.00019569910364225507, "global_step": 66527, "epoch": 559, "lr": 1.1605785449134154e-06} +{"train_loss": 0.00012359675019979477, "global_step": 66528, "epoch": 559, "lr": 1.160104016605379e-06} +{"train_loss": 0.0001940068614203483, "global_step": 66529, "epoch": 559, "lr": 1.159629584189259e-06} +{"train_loss": 0.000268529518507421, "global_step": 66530, "epoch": 559, "lr": 1.1591552476659884e-06} +{"train_loss": 0.00020340706396382302, "global_step": 66531, "epoch": 559, "lr": 1.158681007036505e-06} +{"train_loss": 0.0002813282480929047, "global_step": 66532, "epoch": 559, "lr": 1.158206862301725e-06} +{"train_loss": 0.0002509193727746606, "global_step": 66533, "epoch": 559, "lr": 1.1577328134625976e-06} +{"train_loss": 0.0003210255817975849, "global_step": 66534, "epoch": 559, "lr": 1.1572588605200329e-06} +{"train_loss": 0.00029866417753510177, "global_step": 66535, "epoch": 559, "lr": 1.1567850034749805e-06} +{"train_loss": 0.0002393467875663191, "global_step": 66536, "epoch": 559, "lr": 1.156311242328356e-06} +{"train_loss": 0.0003472914395388216, "global_step": 66537, "epoch": 559, "lr": 1.1558375770811037e-06} +{"train_loss": 0.00017211968952324241, "global_step": 66538, "epoch": 559, "lr": 1.1553640077341444e-06} +{"train_loss": 0.00030924880411475897, "global_step": 66539, "epoch": 559, "lr": 1.1548905342884053e-06} +{"train_loss": 0.00047296262346208096, "global_step": 66540, "epoch": 559, "lr": 1.1544171567448248e-06} +{"train_loss": 0.000187667494174093, "global_step": 66541, "epoch": 559, "lr": 1.153943875104324e-06} +{"train_loss": 0.00026344109210185707, "global_step": 66542, "epoch": 559, "lr": 1.1534706893678416e-06} +{"train_loss": 0.0003490273957140744, "global_step": 66543, "epoch": 559, "lr": 1.1529975995362929e-06} +{"train_loss": 0.00025390787050127983, "global_step": 66544, "epoch": 559, "lr": 1.152524605610622e-06} +{"train_loss": 0.0001899196213344112, "global_step": 66545, "epoch": 559, "lr": 1.1520517075917503e-06} +{"train_loss": 0.00040814068051986396, "global_step": 66546, "epoch": 559, "lr": 1.1515789054806047e-06} +{"train_loss": 0.00030853983480483294, "global_step": 66547, "epoch": 559, "lr": 1.1511061992781125e-06} +{"train_loss": 0.00013455137377604842, "global_step": 66548, "epoch": 559, "lr": 1.150633588985206e-06} +{"train_loss": 0.0002393282193224877, "global_step": 66549, "epoch": 559, "lr": 1.1501610746028124e-06} +{"train_loss": 0.00029000811628066003, "global_step": 66550, "epoch": 559, "lr": 1.1496886561318643e-06} +{"train_loss": 0.00017567574104759842, "global_step": 66551, "epoch": 559, "lr": 1.149216333573272e-06} +{"train_loss": 0.0001914206222863868, "global_step": 66552, "epoch": 559, "lr": 1.1487441069279848e-06} +{"train_loss": 0.00032373005524277687, "global_step": 66553, "epoch": 559, "lr": 1.148271976196913e-06} +{"train_loss": 0.00020135620434302837, "global_step": 66554, "epoch": 559, "lr": 1.1477999413809947e-06} +{"train_loss": 0.0002796234330162406, "global_step": 66555, "epoch": 559, "lr": 1.1473280024811462e-06} +{"train_loss": 0.00018257259216625243, "global_step": 66556, "epoch": 559, "lr": 1.1468561594983051e-06} +{"train_loss": 0.00020437415514606982, "global_step": 66557, "epoch": 559, "lr": 1.1463844124333932e-06} +{"train_loss": 0.00012819364201277494, "global_step": 66558, "epoch": 559, "lr": 1.1459127612873321e-06} +{"train_loss": 0.0002660800237208605, "global_step": 66559, "epoch": 559, "lr": 1.1454412060610542e-06} +{"train_loss": 0.00028248291346244514, "global_step": 66560, "epoch": 559, "lr": 1.144969746755481e-06} +{"train_loss": 0.00017079814278986305, "global_step": 66561, "epoch": 559, "lr": 1.144498383371545e-06} +{"train_loss": 0.00022642272233497351, "global_step": 66562, "epoch": 559, "lr": 1.1440271159101623e-06} +{"train_loss": 0.000525378156453371, "global_step": 66563, "epoch": 559, "lr": 1.1435559443722655e-06} +{"train_loss": 0.00022360586444847286, "global_step": 66564, "epoch": 559, "lr": 1.1430848687587758e-06} +{"train_loss": 0.0004322118475101888, "global_step": 66565, "epoch": 559, "lr": 1.1426138890706207e-06} +{"train_loss": 0.0001881361531559378, "global_step": 66566, "epoch": 559, "lr": 1.1421430053087211e-06} +{"train_loss": 0.0003247177228331566, "global_step": 66567, "epoch": 559, "lr": 1.1416722174740046e-06} +{"train_loss": 0.00018051026563625783, "global_step": 66568, "epoch": 559, "lr": 1.141201525567398e-06} +{"train_loss": 0.0001653678045840934, "global_step": 66569, "epoch": 559, "lr": 1.1407309295898227e-06} +{"train_loss": 0.00013469580153468996, "global_step": 66570, "epoch": 559, "lr": 1.1402604295421947e-06} +{"train_loss": 0.0004132884496357292, "global_step": 66571, "epoch": 559, "lr": 1.1397900254254524e-06} +{"train_loss": 0.0004304028698243201, "global_step": 66572, "epoch": 559, "lr": 1.1393197172405113e-06} +{"train_loss": 0.0003450511139817536, "global_step": 66573, "epoch": 559, "lr": 1.1388495049882986e-06} +{"train_loss": 0.00030480758869089186, "global_step": 66574, "epoch": 559, "lr": 1.1383793886697303e-06} +{"train_loss": 0.00022438139421865344, "global_step": 66575, "epoch": 559, "lr": 1.1379093682857333e-06} +{"train_loss": 0.0003281085519120097, "global_step": 66576, "epoch": 559, "lr": 1.1374394438372348e-06} +{"train_loss": 0.00018472454394213855, "global_step": 66577, "epoch": 559, "lr": 1.1369696153251508e-06} +{"train_loss": 0.0002056188095593825, "global_step": 66578, "epoch": 559, "lr": 1.1364998827504136e-06} +{"train_loss": 0.00026354307192377746, "global_step": 66579, "epoch": 559, "lr": 1.1360302461139283e-06} +{"train_loss": 0.0001983049587579444, "global_step": 66580, "epoch": 559, "lr": 1.135560705416633e-06} +{"train_loss": 0.00019294740923214704, "global_step": 66581, "epoch": 559, "lr": 1.1350912606594488e-06} +{"train_loss": 0.0003079249581787735, "global_step": 66582, "epoch": 559, "lr": 1.134621911843281e-06} +{"train_loss": 0.0002452742774039507, "global_step": 66583, "epoch": 559, "lr": 1.1341526589690731e-06} +{"train_loss": 0.00022587549756281078, "global_step": 66584, "epoch": 559, "lr": 1.1336835020377302e-06} +{"train_loss": 0.00021753863256890327, "global_step": 66585, "epoch": 559, "lr": 1.1332144410501789e-06} +{"train_loss": 0.00012288660218473524, "global_step": 66586, "epoch": 559, "lr": 1.1327454760073408e-06} +{"train_loss": 0.00018904995522461832, "global_step": 66587, "epoch": 559, "lr": 1.1322766069101375e-06} +{"train_loss": 0.00022073471336625516, "global_step": 66588, "epoch": 559, "lr": 1.1318078337594907e-06} +{"train_loss": 0.0002600513107609004, "global_step": 66589, "epoch": 559, "lr": 1.1313391565563158e-06} +{"train_loss": 0.00017838469648268074, "global_step": 66590, "epoch": 559, "lr": 1.1308705753015348e-06} +{"train_loss": 0.00025723999715410173, "global_step": 66591, "epoch": 559, "lr": 1.1304020899960687e-06} +{"train_loss": 0.0001958283392013982, "global_step": 66592, "epoch": 559, "lr": 1.1299337006408395e-06} +{"train_loss": 0.0002224050840595737, "global_step": 66593, "epoch": 559, "lr": 1.1294654072367573e-06} +{"train_loss": 0.0002616135752759874, "global_step": 66594, "epoch": 559, "lr": 1.1289972097847545e-06} +{"train_loss": 0.00036001999978907406, "global_step": 66595, "epoch": 559, "lr": 1.128529108285742e-06} +{"train_loss": 0.0003672685124911368, "global_step": 66596, "epoch": 559, "lr": 1.1280611027406462e-06} +{"train_loss": 0.00026452713063918054, "global_step": 66597, "epoch": 559, "lr": 1.127593193150378e-06} +{"train_loss": 0.000529909273609519, "global_step": 66598, "epoch": 559, "lr": 1.1271253795158643e-06} +{"train_loss": 0.0001487819099565968, "global_step": 66599, "epoch": 559, "lr": 1.1266576618380097e-06} +{"train_loss": 0.00027853422216139734, "global_step": 66600, "epoch": 559, "lr": 1.1261900401177473e-06} +{"train_loss": 0.00022594362962991, "global_step": 66601, "epoch": 559, "lr": 1.1257225143559868e-06} +{"train_loss": 0.0002806248376145959, "global_step": 66602, "epoch": 559, "lr": 1.1252550845536503e-06} +{"train_loss": 0.00031469890382140875, "global_step": 66603, "epoch": 559, "lr": 1.1247877507116534e-06} +{"train_loss": 0.00016977205814328045, "global_step": 66604, "epoch": 559, "lr": 1.124320512830912e-06} +{"train_loss": 0.0004528563003987074, "global_step": 66605, "epoch": 559, "lr": 1.1238533709123479e-06} +{"train_loss": 0.00021593752899207175, "global_step": 66606, "epoch": 559, "lr": 1.1233863249568767e-06} +{"train_loss": 0.00018378418462816626, "global_step": 66607, "epoch": 559, "lr": 1.1229193749654198e-06} +{"train_loss": 0.000363565661245957, "global_step": 66608, "epoch": 559, "lr": 1.122452520938877e-06} +{"train_loss": 0.00020460515224840492, "global_step": 66609, "epoch": 559, "lr": 1.121985762878186e-06} +{"train_loss": 0.00025675888173282146, "global_step": 66610, "epoch": 559, "lr": 1.1215191007842517e-06} +{"train_loss": 0.0003551099798642099, "global_step": 66611, "epoch": 559, "lr": 1.1210525346579904e-06} +{"train_loss": 0.0002996003022417426, "global_step": 66612, "epoch": 559, "lr": 1.120586064500323e-06} +{"train_loss": 0.00022503403306473047, "global_step": 66613, "epoch": 559, "lr": 1.1201196903121659e-06} +{"train_loss": 0.00017165057943202555, "global_step": 66614, "epoch": 559, "lr": 1.1196534120944292e-06} +{"train_loss": 0.00019851633987855166, "global_step": 66615, "epoch": 559, "lr": 1.1191872298480288e-06} +{"train_loss": 0.0002936881501227617, "global_step": 66616, "epoch": 559, "lr": 1.1187211435738808e-06} +{"train_loss": 0.00023563721333630383, "global_step": 66617, "epoch": 559, "lr": 1.1182551532729013e-06} +{"train_loss": 0.00024466292234137654, "global_step": 66618, "epoch": 559, "lr": 1.1177892589460114e-06} +{"train_loss": 0.00021024666784796864, "global_step": 66619, "epoch": 559, "lr": 1.1173234605941219e-06} +{"train_loss": 0.00019850280659738928, "global_step": 66620, "epoch": 559, "lr": 1.1168577582181372e-06} +{"train_loss": 0.0002059977559838444, "global_step": 66621, "epoch": 559, "lr": 1.1163921518189845e-06} +{"train_loss": 0.0003616815956775099, "global_step": 66622, "epoch": 559, "lr": 1.1159266413975688e-06} +{"train_loss": 0.00019234330102335662, "global_step": 66623, "epoch": 559, "lr": 1.115461226954817e-06} +{"train_loss": 0.000292527605779469, "global_step": 66624, "epoch": 559, "lr": 1.114995908491623e-06} +{"train_loss": 0.00029942247783765197, "global_step": 66625, "epoch": 559, "lr": 1.1145306860089244e-06} +{"train_loss": 0.0002778845082502812, "global_step": 66626, "epoch": 559, "lr": 1.1140655595076156e-06} +{"train_loss": 0.0004038412298541516, "global_step": 66627, "epoch": 559, "lr": 1.1136005289886175e-06} +{"train_loss": 0.0001319031580351293, "global_step": 66628, "epoch": 559, "lr": 1.1131355944528354e-06} +{"train_loss": 0.00012024404713883996, "global_step": 66629, "epoch": 559, "lr": 1.1126707559011961e-06} +{"train_loss": 0.00019797883578576148, "global_step": 66630, "epoch": 559, "lr": 1.1122060133346047e-06} +{"train_loss": 0.0001819191820686683, "global_step": 66631, "epoch": 559, "lr": 1.1117413667539711e-06} +{"train_loss": 0.0002379432989982888, "global_step": 66632, "epoch": 559, "lr": 1.1112768161602116e-06} +{"train_loss": 0.0003489019873086363, "global_step": 66633, "epoch": 559, "lr": 1.1108123615542421e-06} +{"train_loss": 0.00031381743610836565, "global_step": 66634, "epoch": 559, "lr": 1.1103480029369616e-06} +{"train_loss": 0.00023470574524253607, "global_step": 66635, "epoch": 559, "lr": 1.109883740309292e-06} +{"train_loss": 0.0002680992183741182, "global_step": 66636, "epoch": 559, "lr": 1.1094195736721436e-06} +{"train_loss": 0.0003208335256204009, "global_step": 66637, "epoch": 559, "lr": 1.1089555030264265e-06} +{"train_loss": 0.0002480727853253484, "global_step": 66638, "epoch": 559, "lr": 1.1084915283730568e-06} +{"train_loss": 0.0002587935560776171, "global_step": 66639, "epoch": 559, "lr": 1.108027649712934e-06, "val_loss": 0.024305211380124092} +{"train_loss": 0.000731303240172565, "global_step": 66640, "epoch": 560, "lr": 1.107563867046979e-06} +{"train_loss": 0.00024150192621164024, "global_step": 66641, "epoch": 560, "lr": 1.1071001803760972e-06} +{"train_loss": 0.0002917543170042336, "global_step": 66642, "epoch": 560, "lr": 1.1066365897012043e-06} +{"train_loss": 0.000177139911102131, "global_step": 66643, "epoch": 560, "lr": 1.1061730950231996e-06} +{"train_loss": 0.00023685839551035315, "global_step": 66644, "epoch": 560, "lr": 1.1057096963430048e-06} +{"train_loss": 0.0004033333680126816, "global_step": 66645, "epoch": 560, "lr": 1.1052463936615298e-06} +{"train_loss": 0.0003539907920639962, "global_step": 66646, "epoch": 560, "lr": 1.1047831869796743e-06} +{"train_loss": 0.00020416799816302955, "global_step": 66647, "epoch": 560, "lr": 1.1043200762983542e-06} +{"train_loss": 0.0001667379547143355, "global_step": 66648, "epoch": 560, "lr": 1.103857061618474e-06} +{"train_loss": 0.0003657677152659744, "global_step": 66649, "epoch": 560, "lr": 1.1033941429409556e-06} +{"train_loss": 0.00032526665017940104, "global_step": 66650, "epoch": 560, "lr": 1.102931320266698e-06} +{"train_loss": 0.0002039381506619975, "global_step": 66651, "epoch": 560, "lr": 1.1024685935966006e-06} +{"train_loss": 0.00017348697292618454, "global_step": 66652, "epoch": 560, "lr": 1.1020059629315904e-06} +{"train_loss": 0.00027307658456265926, "global_step": 66653, "epoch": 560, "lr": 1.1015434282725667e-06} +{"train_loss": 0.0001900516072055325, "global_step": 66654, "epoch": 560, "lr": 1.1010809896204399e-06} +{"train_loss": 0.00035866734106093645, "global_step": 66655, "epoch": 560, "lr": 1.1006186469761093e-06} +{"train_loss": 0.00021230248967185616, "global_step": 66656, "epoch": 560, "lr": 1.1001564003404963e-06} +{"train_loss": 0.000317828671541065, "global_step": 66657, "epoch": 560, "lr": 1.0996942497145058e-06} +{"train_loss": 0.00015415824600495398, "global_step": 66658, "epoch": 560, "lr": 1.0992321950990315e-06} +{"train_loss": 0.0001885544479591772, "global_step": 66659, "epoch": 560, "lr": 1.0987702364950003e-06} +{"train_loss": 0.0004706059698946774, "global_step": 66660, "epoch": 560, "lr": 1.0983083739033006e-06} +{"train_loss": 0.00028799226856790483, "global_step": 66661, "epoch": 560, "lr": 1.097846607324854e-06} +{"train_loss": 0.00014906068099662662, "global_step": 66662, "epoch": 560, "lr": 1.0973849367605537e-06} +{"train_loss": 0.00023944351414684206, "global_step": 66663, "epoch": 560, "lr": 1.0969233622113162e-06} +{"train_loss": 0.0001758396247169003, "global_step": 66664, "epoch": 560, "lr": 1.0964618836780517e-06} +{"train_loss": 0.0006008982891216874, "global_step": 66665, "epoch": 560, "lr": 1.0960005011616537e-06} +{"train_loss": 0.00018795460346154869, "global_step": 66666, "epoch": 560, "lr": 1.0955392146630384e-06} +{"train_loss": 0.00021429189655464143, "global_step": 66667, "epoch": 560, "lr": 1.0950780241830993e-06} +{"train_loss": 0.00032793713035061955, "global_step": 66668, "epoch": 560, "lr": 1.0946169297227581e-06} +{"train_loss": 0.0002573078963905573, "global_step": 66669, "epoch": 560, "lr": 1.0941559312829143e-06} +{"train_loss": 0.0001866058591986075, "global_step": 66670, "epoch": 560, "lr": 1.093695028864461e-06} +{"train_loss": 0.00020184445020277053, "global_step": 66671, "epoch": 560, "lr": 1.09323422246832e-06} +{"train_loss": 0.0005407704738900065, "global_step": 66672, "epoch": 560, "lr": 1.0927735120953797e-06} +{"train_loss": 0.0001946192787727341, "global_step": 66673, "epoch": 560, "lr": 1.0923128977465613e-06} +{"train_loss": 0.0002061204140773043, "global_step": 66674, "epoch": 560, "lr": 1.0918523794227586e-06} +{"train_loss": 0.00040740641998127103, "global_step": 66675, "epoch": 560, "lr": 1.091391957124882e-06} +{"train_loss": 0.0004133755574002862, "global_step": 66676, "epoch": 560, "lr": 1.0909316308538308e-06} +{"train_loss": 0.0002829158620443195, "global_step": 66677, "epoch": 560, "lr": 1.09047140061051e-06} +{"train_loss": 0.00016437165322713554, "global_step": 66678, "epoch": 560, "lr": 1.090011266395824e-06} +{"train_loss": 0.0002249383833259344, "global_step": 66679, "epoch": 560, "lr": 1.0895512282106724e-06} +{"train_loss": 0.00014200917212292552, "global_step": 66680, "epoch": 560, "lr": 1.0890912860559654e-06} +{"train_loss": 0.0002953190996777266, "global_step": 66681, "epoch": 560, "lr": 1.0886314399325969e-06} +{"train_loss": 0.00022829628142062575, "global_step": 66682, "epoch": 560, "lr": 1.0881716898414829e-06} +{"train_loss": 0.00028698021196760237, "global_step": 66683, "epoch": 560, "lr": 1.0877120357835168e-06} +{"train_loss": 0.00021170999389141798, "global_step": 66684, "epoch": 560, "lr": 1.0872524777595927e-06} +{"train_loss": 0.0004967313725501299, "global_step": 66685, "epoch": 560, "lr": 1.086793015770632e-06} +{"train_loss": 0.00014294919674284756, "global_step": 66686, "epoch": 560, "lr": 1.086333649817528e-06} +{"train_loss": 0.000212488419492729, "global_step": 66687, "epoch": 560, "lr": 1.0858743799011806e-06} +{"train_loss": 0.00021170356194488704, "global_step": 66688, "epoch": 560, "lr": 1.0854152060224944e-06} +{"train_loss": 0.0002892289194278419, "global_step": 66689, "epoch": 560, "lr": 1.0849561281823629e-06} +{"train_loss": 0.00022226490546017885, "global_step": 66690, "epoch": 560, "lr": 1.0844971463817022e-06} +{"train_loss": 0.00033457446261309087, "global_step": 66691, "epoch": 560, "lr": 1.0840382606214005e-06} +{"train_loss": 0.00021365503198467195, "global_step": 66692, "epoch": 560, "lr": 1.0835794709023683e-06} +{"train_loss": 0.00027983286418020725, "global_step": 66693, "epoch": 560, "lr": 1.0831207772254992e-06} +{"train_loss": 0.00018320602248422801, "global_step": 66694, "epoch": 560, "lr": 1.082662179591698e-06} +{"train_loss": 0.0005188944633118808, "global_step": 66695, "epoch": 560, "lr": 1.0822036780018586e-06} +{"train_loss": 0.00023972394410520792, "global_step": 66696, "epoch": 560, "lr": 1.0817452724568911e-06} +{"train_loss": 0.0001945212425198406, "global_step": 66697, "epoch": 560, "lr": 1.0812869629576839e-06} +{"train_loss": 0.00016390417295042425, "global_step": 66698, "epoch": 560, "lr": 1.0808287495051472e-06} +{"train_loss": 0.0002975350362248719, "global_step": 66699, "epoch": 560, "lr": 1.0803706321001805e-06} +{"train_loss": 0.00016548149869777262, "global_step": 66700, "epoch": 560, "lr": 1.079912610743683e-06} +{"train_loss": 0.00016502427752129734, "global_step": 66701, "epoch": 560, "lr": 1.0794546854365428e-06} +{"train_loss": 0.0003159420157317072, "global_step": 66702, "epoch": 560, "lr": 1.0789968561796703e-06} +{"train_loss": 0.00019167570280842483, "global_step": 66703, "epoch": 560, "lr": 1.0785391229739595e-06} +{"train_loss": 0.00019067399261984974, "global_step": 66704, "epoch": 560, "lr": 1.0780814858203147e-06} +{"train_loss": 0.00037053224514238536, "global_step": 66705, "epoch": 560, "lr": 1.0776239447196247e-06} +{"train_loss": 0.00025807012571021914, "global_step": 66706, "epoch": 560, "lr": 1.0771664996727938e-06} +{"train_loss": 0.00026873592287302017, "global_step": 66707, "epoch": 560, "lr": 1.076709150680727e-06} +{"train_loss": 0.0002797400811687112, "global_step": 66708, "epoch": 560, "lr": 1.076251897744307e-06} +{"train_loss": 0.0002348918205825612, "global_step": 66709, "epoch": 560, "lr": 1.0757947408644443e-06} +{"train_loss": 0.0002220096212113276, "global_step": 66710, "epoch": 560, "lr": 1.0753376800420268e-06} +{"train_loss": 0.0002926691377069801, "global_step": 66711, "epoch": 560, "lr": 1.074880715277965e-06} +{"train_loss": 0.0002377798082306981, "global_step": 66712, "epoch": 560, "lr": 1.0744238465731416e-06} +{"train_loss": 0.00026323896599933505, "global_step": 66713, "epoch": 560, "lr": 1.0739670739284613e-06} +{"train_loss": 0.00014117789396550506, "global_step": 66714, "epoch": 560, "lr": 1.0735103973448234e-06} +{"train_loss": 0.000306595116853714, "global_step": 66715, "epoch": 560, "lr": 1.0730538168231162e-06} +{"train_loss": 0.00015478026762139052, "global_step": 66716, "epoch": 560, "lr": 1.0725973323642447e-06} +{"train_loss": 0.00015443404845427722, "global_step": 66717, "epoch": 560, "lr": 1.0721409439690966e-06} +{"train_loss": 0.00025705352891236544, "global_step": 66718, "epoch": 560, "lr": 1.071684651638577e-06} +{"train_loss": 0.00023990028421394527, "global_step": 66719, "epoch": 560, "lr": 1.0712284553735796e-06} +{"train_loss": 0.00024708753335289657, "global_step": 66720, "epoch": 560, "lr": 1.070772355174987e-06} +{"train_loss": 0.00012116362631786615, "global_step": 66721, "epoch": 560, "lr": 1.0703163510437152e-06} +{"train_loss": 0.00041715489351190627, "global_step": 66722, "epoch": 560, "lr": 1.0698604429806469e-06} +{"train_loss": 0.0002635567798279226, "global_step": 66723, "epoch": 560, "lr": 1.0694046309866813e-06} +{"train_loss": 0.0002858032239601016, "global_step": 66724, "epoch": 560, "lr": 1.0689489150627064e-06} +{"train_loss": 0.00024126353673636913, "global_step": 66725, "epoch": 560, "lr": 1.0684932952096328e-06} +{"train_loss": 0.0003192921867594123, "global_step": 66726, "epoch": 560, "lr": 1.0680377714283375e-06} +{"train_loss": 0.0003392180078662932, "global_step": 66727, "epoch": 560, "lr": 1.0675823437197251e-06} +{"train_loss": 0.0002867578878067434, "global_step": 66728, "epoch": 560, "lr": 1.0671270120846843e-06} +{"train_loss": 0.0002035186334978789, "global_step": 66729, "epoch": 560, "lr": 1.0666717765241141e-06} +{"train_loss": 0.00025382626336067915, "global_step": 66730, "epoch": 560, "lr": 1.0662166370389082e-06} +{"train_loss": 0.00019317430269438773, "global_step": 66731, "epoch": 560, "lr": 1.0657615936299549e-06} +{"train_loss": 0.00032616581302136183, "global_step": 66732, "epoch": 560, "lr": 1.0653066462981532e-06} +{"train_loss": 0.00012436108954716474, "global_step": 66733, "epoch": 560, "lr": 1.0648517950443914e-06} +{"train_loss": 0.00023953232448548079, "global_step": 66734, "epoch": 560, "lr": 1.0643970398695635e-06} +{"train_loss": 0.00017620502330828458, "global_step": 66735, "epoch": 560, "lr": 1.0639423807745685e-06} +{"train_loss": 0.00015038391575217247, "global_step": 66736, "epoch": 560, "lr": 1.0634878177602947e-06} +{"train_loss": 0.00020627983030863106, "global_step": 66737, "epoch": 560, "lr": 1.0630333508276358e-06} +{"train_loss": 0.00014079349057283252, "global_step": 66738, "epoch": 560, "lr": 1.06257897997748e-06} +{"train_loss": 0.00024214923905674368, "global_step": 66739, "epoch": 560, "lr": 1.0621247052107207e-06} +{"train_loss": 0.00032072406611405313, "global_step": 66740, "epoch": 560, "lr": 1.0616705265282523e-06} +{"train_loss": 0.00040600408101454377, "global_step": 66741, "epoch": 560, "lr": 1.061216443930968e-06} +{"train_loss": 0.00018931836530100554, "global_step": 66742, "epoch": 560, "lr": 1.060762457419756e-06} +{"train_loss": 0.00021932809613645077, "global_step": 66743, "epoch": 560, "lr": 1.0603085669955049e-06} +{"train_loss": 0.0003723723639268428, "global_step": 66744, "epoch": 560, "lr": 1.0598547726591135e-06} +{"train_loss": 0.0002780072973109782, "global_step": 66745, "epoch": 560, "lr": 1.0594010744114702e-06} +{"train_loss": 0.000357082491973415, "global_step": 66746, "epoch": 560, "lr": 1.0589474722534576e-06} +{"train_loss": 0.0002208865189459175, "global_step": 66747, "epoch": 560, "lr": 1.0584939661859805e-06} +{"train_loss": 0.00023842269729357213, "global_step": 66748, "epoch": 560, "lr": 1.058040556209916e-06} +{"train_loss": 0.000287627219222486, "global_step": 66749, "epoch": 560, "lr": 1.0575872423261635e-06} +{"train_loss": 0.0003386797907296568, "global_step": 66750, "epoch": 560, "lr": 1.0571340245356054e-06} +{"train_loss": 0.0002561979927122593, "global_step": 66751, "epoch": 560, "lr": 1.056680902839141e-06} +{"train_loss": 0.0003067607176490128, "global_step": 66752, "epoch": 560, "lr": 1.0562278772376533e-06} +{"train_loss": 0.00019314953533466905, "global_step": 66753, "epoch": 560, "lr": 1.05577494773203e-06} +{"train_loss": 0.000253606413025409, "global_step": 66754, "epoch": 560, "lr": 1.0553221143231706e-06} +{"train_loss": 0.00025204007397405803, "global_step": 66755, "epoch": 560, "lr": 1.0548693770119523e-06} +{"train_loss": 0.0001990204182220623, "global_step": 66756, "epoch": 560, "lr": 1.0544167357992684e-06} +{"train_loss": 0.00018870689382310957, "global_step": 66757, "epoch": 560, "lr": 1.0539641906860132e-06} +{"train_loss": 0.0002604468178763172, "global_step": 66758, "epoch": 560, "lr": 1.0535117416730633e-06, "val_loss": 0.040251851081848145, "train_action_mse_error": 4.804956461157417e-06} +{"train_loss": 0.00020070135360583663, "global_step": 66759, "epoch": 561, "lr": 1.0530593887613238e-06} +{"train_loss": 0.00017048446170520037, "global_step": 66760, "epoch": 561, "lr": 1.0526071319516606e-06} +{"train_loss": 0.00027405694709159434, "global_step": 66761, "epoch": 561, "lr": 1.0521549712449785e-06} +{"train_loss": 0.00012670696014538407, "global_step": 66762, "epoch": 561, "lr": 1.0517029066421657e-06} +{"train_loss": 0.0001574650377733633, "global_step": 66763, "epoch": 561, "lr": 1.0512509381440993e-06} +{"train_loss": 0.0002350152935832739, "global_step": 66764, "epoch": 561, "lr": 1.050799065751673e-06} +{"train_loss": 0.0001885522942757234, "global_step": 66765, "epoch": 561, "lr": 1.050347289465775e-06} +{"train_loss": 0.00017059029778465629, "global_step": 66766, "epoch": 561, "lr": 1.0498956092872936e-06} +{"train_loss": 0.00032632608781568706, "global_step": 66767, "epoch": 561, "lr": 1.0494440252171056e-06} +{"train_loss": 0.00018029211787506938, "global_step": 66768, "epoch": 561, "lr": 1.0489925372561105e-06} +{"train_loss": 0.00022220093524083495, "global_step": 66769, "epoch": 561, "lr": 1.0485411454051908e-06} +{"train_loss": 0.0003119255125056952, "global_step": 66770, "epoch": 561, "lr": 1.0480898496652236e-06} +{"train_loss": 0.0003105479700025171, "global_step": 66771, "epoch": 561, "lr": 1.0476386500371083e-06} +{"train_loss": 0.0003168404509779066, "global_step": 66772, "epoch": 561, "lr": 1.0471875465217162e-06} +{"train_loss": 0.00026419860660098493, "global_step": 66773, "epoch": 561, "lr": 1.0467365391199523e-06} +{"train_loss": 0.0004526949778664857, "global_step": 66774, "epoch": 561, "lr": 1.0462856278326826e-06} +{"train_loss": 0.00021912115334998816, "global_step": 66775, "epoch": 561, "lr": 1.0458348126608065e-06} +{"train_loss": 0.0002637963043525815, "global_step": 66776, "epoch": 561, "lr": 1.045384093605206e-06} +{"train_loss": 0.0003156425373163074, "global_step": 66777, "epoch": 561, "lr": 1.0449334706667534e-06} +{"train_loss": 0.00021168706007301807, "global_step": 66778, "epoch": 561, "lr": 1.0444829438463532e-06} +{"train_loss": 0.0004521935188677162, "global_step": 66779, "epoch": 561, "lr": 1.044032513144877e-06} +{"train_loss": 0.00022057007299736142, "global_step": 66780, "epoch": 561, "lr": 1.0435821785632127e-06} +{"train_loss": 0.00020504494023043662, "global_step": 66781, "epoch": 561, "lr": 1.0431319401022433e-06} +{"train_loss": 0.00019379847799427807, "global_step": 66782, "epoch": 561, "lr": 1.0426817977628621e-06} +{"train_loss": 0.0001815831201383844, "global_step": 66783, "epoch": 561, "lr": 1.0422317515459411e-06} +{"train_loss": 0.00013712824147660285, "global_step": 66784, "epoch": 561, "lr": 1.0417818014523629e-06} +{"train_loss": 0.00027108326321467757, "global_step": 66785, "epoch": 561, "lr": 1.0413319474830208e-06} +{"train_loss": 0.0003304842102807015, "global_step": 66786, "epoch": 561, "lr": 1.0408821896387867e-06} +{"train_loss": 0.00032916435156948864, "global_step": 66787, "epoch": 561, "lr": 1.040432527920554e-06} +{"train_loss": 0.00022445071954280138, "global_step": 66788, "epoch": 561, "lr": 1.0399829623292057e-06} +{"train_loss": 0.00036985185579396784, "global_step": 66789, "epoch": 561, "lr": 1.0395334928656132e-06} +{"train_loss": 0.000233706712606363, "global_step": 66790, "epoch": 561, "lr": 1.03908411953067e-06} +{"train_loss": 0.00015769369201734662, "global_step": 66791, "epoch": 561, "lr": 1.0386348423252478e-06} +{"train_loss": 0.00022039341274648905, "global_step": 66792, "epoch": 561, "lr": 1.038185661250246e-06} +{"train_loss": 0.0002917543170042336, "global_step": 66793, "epoch": 561, "lr": 1.037736576306525e-06} +{"train_loss": 0.000458512018667534, "global_step": 66794, "epoch": 561, "lr": 1.0372875874949895e-06} +{"train_loss": 0.000314101082039997, "global_step": 66795, "epoch": 561, "lr": 1.0368386948164999e-06} +{"train_loss": 0.00046690544695593417, "global_step": 66796, "epoch": 561, "lr": 1.0363898982719445e-06} +{"train_loss": 0.00026424575480632484, "global_step": 66797, "epoch": 561, "lr": 1.0359411978622113e-06} +{"train_loss": 0.0003885953628923744, "global_step": 66798, "epoch": 561, "lr": 1.035492593588172e-06} +{"train_loss": 0.00018097828433383256, "global_step": 66799, "epoch": 561, "lr": 1.0350440854507204e-06} +{"train_loss": 0.0003261048113927245, "global_step": 66800, "epoch": 561, "lr": 1.0345956734507222e-06} +{"train_loss": 0.0002860755193978548, "global_step": 66801, "epoch": 561, "lr": 1.0341473575890658e-06} +{"train_loss": 0.00020920889801345766, "global_step": 66802, "epoch": 561, "lr": 1.0336991378666338e-06} +{"train_loss": 0.00040189133142121136, "global_step": 66803, "epoch": 561, "lr": 1.0332510142842978e-06} +{"train_loss": 0.00019958418852183968, "global_step": 66804, "epoch": 561, "lr": 1.0328029868429457e-06} +{"train_loss": 0.00020369167032185942, "global_step": 66805, "epoch": 561, "lr": 1.0323550555434491e-06} +{"train_loss": 0.0005661213654093444, "global_step": 66806, "epoch": 561, "lr": 1.0319072203866963e-06} +{"train_loss": 0.00026193566736765206, "global_step": 66807, "epoch": 561, "lr": 1.031459481373559e-06} +{"train_loss": 0.00013525127724278718, "global_step": 66808, "epoch": 561, "lr": 1.0310118385049194e-06} +{"train_loss": 0.00018090620869770646, "global_step": 66809, "epoch": 561, "lr": 1.0305642917816605e-06} +{"train_loss": 0.00022633183107245713, "global_step": 66810, "epoch": 561, "lr": 1.030116841204648e-06} +{"train_loss": 0.00032416792237199843, "global_step": 66811, "epoch": 561, "lr": 1.0296694867747759e-06} +{"train_loss": 0.00024291015870403498, "global_step": 66812, "epoch": 561, "lr": 1.0292222284929153e-06} +{"train_loss": 0.00020493178453762084, "global_step": 66813, "epoch": 561, "lr": 1.0287750663599494e-06} +{"train_loss": 0.00025858497247099876, "global_step": 66814, "epoch": 561, "lr": 1.0283280003767493e-06} +{"train_loss": 0.0001781722967280075, "global_step": 66815, "epoch": 561, "lr": 1.0278810305441921e-06} +{"train_loss": 0.00022555046598426998, "global_step": 66816, "epoch": 561, "lr": 1.0274341568631608e-06} +{"train_loss": 0.0002227146178483963, "global_step": 66817, "epoch": 561, "lr": 1.0269873793345263e-06} +{"train_loss": 0.00017685168131720275, "global_step": 66818, "epoch": 561, "lr": 1.0265406979591773e-06} +{"train_loss": 0.00030051107751205564, "global_step": 66819, "epoch": 561, "lr": 1.0260941127379798e-06} +{"train_loss": 0.00016667878662701696, "global_step": 66820, "epoch": 561, "lr": 1.0256476236718105e-06} +{"train_loss": 0.0002507710305508226, "global_step": 66821, "epoch": 561, "lr": 1.0252012307615578e-06} +{"train_loss": 0.00032834813464432955, "global_step": 66822, "epoch": 561, "lr": 1.0247549340080819e-06} +{"train_loss": 0.00016429153038188815, "global_step": 66823, "epoch": 561, "lr": 1.0243087334122769e-06} +{"train_loss": 0.00027950885123573244, "global_step": 66824, "epoch": 561, "lr": 1.0238626289750031e-06} +{"train_loss": 0.0003065304772462696, "global_step": 66825, "epoch": 561, "lr": 1.023416620697143e-06} +{"train_loss": 0.00027196214068681, "global_step": 66826, "epoch": 561, "lr": 1.0229707085795736e-06} +{"train_loss": 0.00023497751681134105, "global_step": 66827, "epoch": 561, "lr": 1.0225248926231723e-06} +{"train_loss": 0.0002587957715149969, "global_step": 66828, "epoch": 561, "lr": 1.0220791728287993e-06} +{"train_loss": 0.00032321931212209165, "global_step": 66829, "epoch": 561, "lr": 1.021633549197354e-06} +{"train_loss": 0.00041777538717724383, "global_step": 66830, "epoch": 561, "lr": 1.021188021729691e-06} +{"train_loss": 0.0003002024022862315, "global_step": 66831, "epoch": 561, "lr": 1.0207425904266932e-06} +{"train_loss": 0.00023356900783255696, "global_step": 66832, "epoch": 561, "lr": 1.0202972552892375e-06} +{"train_loss": 0.00021968403598293662, "global_step": 66833, "epoch": 561, "lr": 1.0198520163181957e-06} +{"train_loss": 0.00038244356983341277, "global_step": 66834, "epoch": 561, "lr": 1.019406873514439e-06} +{"train_loss": 0.00014645393821410835, "global_step": 66835, "epoch": 561, "lr": 1.0189618268788504e-06} +{"train_loss": 0.00024484089226461947, "global_step": 66836, "epoch": 561, "lr": 1.0185168764122898e-06} +{"train_loss": 0.000185763172339648, "global_step": 66837, "epoch": 561, "lr": 1.0180720221156403e-06} +{"train_loss": 0.00027639581821858883, "global_step": 66838, "epoch": 561, "lr": 1.0176272639897789e-06} +{"train_loss": 0.0001191251867567189, "global_step": 66839, "epoch": 561, "lr": 1.0171826020355656e-06} +{"train_loss": 0.00019080674974247813, "global_step": 66840, "epoch": 561, "lr": 1.0167380362538893e-06} +{"train_loss": 0.00038999892421998084, "global_step": 66841, "epoch": 561, "lr": 1.0162935666456041e-06} +{"train_loss": 0.00023675993725191802, "global_step": 66842, "epoch": 561, "lr": 1.0158491932116044e-06} +{"train_loss": 0.0002091077039949596, "global_step": 66843, "epoch": 561, "lr": 1.0154049159527446e-06} +{"train_loss": 0.0003123476344626397, "global_step": 66844, "epoch": 561, "lr": 1.0149607348699076e-06} +{"train_loss": 0.0002484138822183013, "global_step": 66845, "epoch": 561, "lr": 1.0145166499639647e-06} +{"train_loss": 0.00018390688637737185, "global_step": 66846, "epoch": 561, "lr": 1.0140726612357765e-06} +{"train_loss": 0.0002128331398125738, "global_step": 66847, "epoch": 561, "lr": 1.013628768686231e-06} +{"train_loss": 0.0003171701682731509, "global_step": 66848, "epoch": 561, "lr": 1.0131849723161834e-06} +{"train_loss": 0.00022855612041894346, "global_step": 66849, "epoch": 561, "lr": 1.0127412721265218e-06} +{"train_loss": 0.0001895359600894153, "global_step": 66850, "epoch": 561, "lr": 1.0122976681181006e-06} +{"train_loss": 0.00029087121947668493, "global_step": 66851, "epoch": 561, "lr": 1.0118541602918085e-06} +{"train_loss": 0.0002893985656555742, "global_step": 66852, "epoch": 561, "lr": 1.0114107486485058e-06} +{"train_loss": 0.0001561977987876162, "global_step": 66853, "epoch": 561, "lr": 1.0109674331890585e-06} +{"train_loss": 0.0003442791639827192, "global_step": 66854, "epoch": 561, "lr": 1.010524213914349e-06} +{"train_loss": 0.00025502778589725494, "global_step": 66855, "epoch": 561, "lr": 1.0100810908252378e-06} +{"train_loss": 0.00018270673172082752, "global_step": 66856, "epoch": 561, "lr": 1.0096380639226022e-06} +{"train_loss": 0.00017594594100955874, "global_step": 66857, "epoch": 561, "lr": 1.009195133207308e-06} +{"train_loss": 0.00017710079555399716, "global_step": 66858, "epoch": 561, "lr": 1.0087522986802212e-06} +{"train_loss": 0.00033765393891371787, "global_step": 66859, "epoch": 561, "lr": 1.0083095603422133e-06} +{"train_loss": 0.00029660662403330207, "global_step": 66860, "epoch": 561, "lr": 1.0078669181941613e-06} +{"train_loss": 0.0002073039358947426, "global_step": 66861, "epoch": 561, "lr": 1.007424372236926e-06} +{"train_loss": 0.0002326036774320528, "global_step": 66862, "epoch": 561, "lr": 1.006981922471384e-06} +{"train_loss": 0.0005836898344568908, "global_step": 66863, "epoch": 561, "lr": 1.0065395688983902e-06} +{"train_loss": 0.00024748590658418834, "global_step": 66864, "epoch": 561, "lr": 1.0060973115188277e-06} +{"train_loss": 0.00019575280020944774, "global_step": 66865, "epoch": 561, "lr": 1.0056551503335566e-06} +{"train_loss": 0.00046023615868762136, "global_step": 66866, "epoch": 561, "lr": 1.0052130853434482e-06} +{"train_loss": 0.00016985851107165217, "global_step": 66867, "epoch": 561, "lr": 1.004771116549369e-06} +{"train_loss": 0.00037327740574255586, "global_step": 66868, "epoch": 561, "lr": 1.0043292439521901e-06} +{"train_loss": 0.00029033637838438153, "global_step": 66869, "epoch": 561, "lr": 1.003887467552772e-06} +{"train_loss": 0.0001456783793400973, "global_step": 66870, "epoch": 561, "lr": 1.0034457873519864e-06} +{"train_loss": 0.0002921780978795141, "global_step": 66871, "epoch": 561, "lr": 1.0030042033507047e-06} +{"train_loss": 0.0001997489744098857, "global_step": 66872, "epoch": 561, "lr": 1.0025627155497874e-06} +{"train_loss": 0.00014890020247548819, "global_step": 66873, "epoch": 561, "lr": 1.002121323950106e-06} +{"train_loss": 0.00018067582277581096, "global_step": 66874, "epoch": 561, "lr": 1.0016800285525207e-06} +{"train_loss": 0.00032109260791912675, "global_step": 66875, "epoch": 561, "lr": 1.0012388293579034e-06} +{"train_loss": 0.0001792863622540608, "global_step": 66876, "epoch": 561, "lr": 1.0007977263671253e-06} +{"train_loss": 0.0002577564405290089, "global_step": 66877, "epoch": 561, "lr": 1.000356719581036e-06, "val_loss": 0.026135213673114777} +{"train_loss": 0.00030604959465563297, "global_step": 66878, "epoch": 562, "lr": 9.999158090005178e-07} +{"train_loss": 0.0002516698732506484, "global_step": 66879, "epoch": 562, "lr": 9.994749946264258e-07} +{"train_loss": 0.00015401732525788248, "global_step": 66880, "epoch": 562, "lr": 9.990342764596318e-07} +{"train_loss": 0.00028233457123860717, "global_step": 66881, "epoch": 562, "lr": 9.985936545009955e-07} +{"train_loss": 0.00016557073104195297, "global_step": 66882, "epoch": 562, "lr": 9.981531287513945e-07} +{"train_loss": 0.000252430239925161, "global_step": 66883, "epoch": 562, "lr": 9.977126992116782e-07} +{"train_loss": 0.00014433205069508404, "global_step": 66884, "epoch": 562, "lr": 9.972723658827176e-07} +{"train_loss": 0.0003311304608359933, "global_step": 66885, "epoch": 562, "lr": 9.968321287653792e-07} +{"train_loss": 0.00020946031145285815, "global_step": 66886, "epoch": 562, "lr": 9.963919878605232e-07} +{"train_loss": 0.00029843748779967427, "global_step": 66887, "epoch": 562, "lr": 9.959519431690211e-07} +{"train_loss": 0.00013635850336868316, "global_step": 66888, "epoch": 562, "lr": 9.955119946917334e-07} +{"train_loss": 0.00021152554836589843, "global_step": 66889, "epoch": 562, "lr": 9.950721424295151e-07} +{"train_loss": 0.0005401616217568517, "global_step": 66890, "epoch": 562, "lr": 9.94632386383243e-07} +{"train_loss": 0.00015824795991647989, "global_step": 66891, "epoch": 562, "lr": 9.941927265537664e-07} +{"train_loss": 0.0002769889251794666, "global_step": 66892, "epoch": 562, "lr": 9.937531629419682e-07} +{"train_loss": 0.00022192213509697467, "global_step": 66893, "epoch": 562, "lr": 9.933136955486922e-07} +{"train_loss": 0.0005167382187210023, "global_step": 66894, "epoch": 562, "lr": 9.928743243748096e-07} +{"train_loss": 0.00036091788206249475, "global_step": 66895, "epoch": 562, "lr": 9.924350494211865e-07} +{"train_loss": 0.0002288769610458985, "global_step": 66896, "epoch": 562, "lr": 9.919958706886779e-07} +{"train_loss": 0.00019572433666326106, "global_step": 66897, "epoch": 562, "lr": 9.915567881781496e-07} +{"train_loss": 0.0003090224927291274, "global_step": 66898, "epoch": 562, "lr": 9.911178018904678e-07} +{"train_loss": 0.0005154504324309528, "global_step": 66899, "epoch": 562, "lr": 9.90678911826487e-07} +{"train_loss": 0.00022812683891970664, "global_step": 66900, "epoch": 562, "lr": 9.902401179870735e-07} +{"train_loss": 0.0003729193704202771, "global_step": 66901, "epoch": 562, "lr": 9.898014203730876e-07} +{"train_loss": 0.0003971267433371395, "global_step": 66902, "epoch": 562, "lr": 9.893628189853954e-07} +{"train_loss": 0.00020204052270855755, "global_step": 66903, "epoch": 562, "lr": 9.889243138248462e-07} +{"train_loss": 0.00019912845164071769, "global_step": 66904, "epoch": 562, "lr": 9.884859048923111e-07} +{"train_loss": 0.000325753673678264, "global_step": 66905, "epoch": 562, "lr": 9.880475921886456e-07} +{"train_loss": 0.00023028967552818358, "global_step": 66906, "epoch": 562, "lr": 9.876093757147153e-07} +{"train_loss": 0.0004910397110506892, "global_step": 66907, "epoch": 562, "lr": 9.871712554713752e-07} +{"train_loss": 0.00038470144500024617, "global_step": 66908, "epoch": 562, "lr": 9.867332314594912e-07} +{"train_loss": 0.0005669877282343805, "global_step": 66909, "epoch": 562, "lr": 9.862953036799182e-07} +{"train_loss": 0.0003408986085560173, "global_step": 66910, "epoch": 562, "lr": 9.858574721335168e-07} +{"train_loss": 0.000178828981006518, "global_step": 66911, "epoch": 562, "lr": 9.854197368211526e-07} +{"train_loss": 0.00039081586874090135, "global_step": 66912, "epoch": 562, "lr": 9.849820977436753e-07} +{"train_loss": 0.00028478680178523064, "global_step": 66913, "epoch": 562, "lr": 9.845445549019504e-07} +{"train_loss": 0.000805546180345118, "global_step": 66914, "epoch": 562, "lr": 9.841071082968389e-07} +{"train_loss": 0.000385263585485518, "global_step": 66915, "epoch": 562, "lr": 9.836697579291897e-07} +{"train_loss": 0.00022001549950800836, "global_step": 66916, "epoch": 562, "lr": 9.832325037998746e-07} +{"train_loss": 0.00019326509209349751, "global_step": 66917, "epoch": 562, "lr": 9.827953459097427e-07} +{"train_loss": 0.00017148553160950541, "global_step": 66918, "epoch": 562, "lr": 9.8235828425966e-07} +{"train_loss": 0.00039969573845155537, "global_step": 66919, "epoch": 562, "lr": 9.819213188504705e-07} +{"train_loss": 0.000259440770605579, "global_step": 66920, "epoch": 562, "lr": 9.81484449683051e-07} +{"train_loss": 0.0001917262707138434, "global_step": 66921, "epoch": 562, "lr": 9.810476767582454e-07} +{"train_loss": 0.000384434504667297, "global_step": 66922, "epoch": 562, "lr": 9.806110000769198e-07} +{"train_loss": 0.0002998054551426321, "global_step": 66923, "epoch": 562, "lr": 9.801744196399232e-07} +{"train_loss": 0.00024890151689760387, "global_step": 66924, "epoch": 562, "lr": 9.797379354481162e-07} +{"train_loss": 0.00012378727842587978, "global_step": 66925, "epoch": 562, "lr": 9.793015475023647e-07} +{"train_loss": 0.0002620943123474717, "global_step": 66926, "epoch": 562, "lr": 9.788652558035072e-07} +{"train_loss": 0.00022761165746487677, "global_step": 66927, "epoch": 562, "lr": 9.784290603524148e-07} +{"train_loss": 0.00047256314428523183, "global_step": 66928, "epoch": 562, "lr": 9.779929611499428e-07} +{"train_loss": 0.00018546437786426395, "global_step": 66929, "epoch": 562, "lr": 9.775569581969346e-07} +{"train_loss": 0.00017359192133881152, "global_step": 66930, "epoch": 562, "lr": 9.771210514942674e-07} +{"train_loss": 0.00038332323310896754, "global_step": 66931, "epoch": 562, "lr": 9.766852410427797e-07} +{"train_loss": 0.00016244132712017745, "global_step": 66932, "epoch": 562, "lr": 9.762495268433369e-07} +{"train_loss": 0.0002950501802843064, "global_step": 66933, "epoch": 562, "lr": 9.758139088967888e-07} +{"train_loss": 0.000209788850042969, "global_step": 66934, "epoch": 562, "lr": 9.753783872039902e-07} +{"train_loss": 0.00031605002004653215, "global_step": 66935, "epoch": 562, "lr": 9.749429617658068e-07} +{"train_loss": 0.00022798232384957373, "global_step": 66936, "epoch": 562, "lr": 9.74507632583077e-07} +{"train_loss": 0.00025123177329078317, "global_step": 66937, "epoch": 562, "lr": 9.74072399656667e-07} +{"train_loss": 0.0002010043681366369, "global_step": 66938, "epoch": 562, "lr": 9.736372629874314e-07} +{"train_loss": 0.00033232694840990007, "global_step": 66939, "epoch": 562, "lr": 9.73202222576214e-07} +{"train_loss": 0.00014774641022086143, "global_step": 66940, "epoch": 562, "lr": 9.727672784238806e-07} +{"train_loss": 0.00024128730001393706, "global_step": 66941, "epoch": 562, "lr": 9.723324305312808e-07} +{"train_loss": 0.00022770000214222819, "global_step": 66942, "epoch": 562, "lr": 9.718976788992695e-07} +{"train_loss": 0.0003001840377692133, "global_step": 66943, "epoch": 562, "lr": 9.714630235286959e-07} +{"train_loss": 0.0002957279793918133, "global_step": 66944, "epoch": 562, "lr": 9.710284644204204e-07} +{"train_loss": 0.00033179481397382915, "global_step": 66945, "epoch": 562, "lr": 9.705940015752923e-07} +{"train_loss": 0.000278067629551515, "global_step": 66946, "epoch": 562, "lr": 9.70159634994161e-07} +{"train_loss": 0.000377259508240968, "global_step": 66947, "epoch": 562, "lr": 9.69725364677887e-07} +{"train_loss": 0.00015807474846951663, "global_step": 66948, "epoch": 562, "lr": 9.692911906273139e-07} +{"train_loss": 0.00022459652973338962, "global_step": 66949, "epoch": 562, "lr": 9.688571128433022e-07} +{"train_loss": 0.00019065623928327113, "global_step": 66950, "epoch": 562, "lr": 9.68423131326701e-07} +{"train_loss": 0.00029601636924780905, "global_step": 66951, "epoch": 562, "lr": 9.679892460783656e-07} +{"train_loss": 0.0003751321346499026, "global_step": 66952, "epoch": 562, "lr": 9.675554570991452e-07} +{"train_loss": 0.00021280643704812974, "global_step": 66953, "epoch": 562, "lr": 9.671217643898888e-07} +{"train_loss": 0.00027046652394346893, "global_step": 66954, "epoch": 562, "lr": 9.666881679514517e-07} +{"train_loss": 0.00014940739492885768, "global_step": 66955, "epoch": 562, "lr": 9.662546677846828e-07} +{"train_loss": 0.0003430389042478055, "global_step": 66956, "epoch": 562, "lr": 9.658212638904373e-07} +{"train_loss": 0.00038075901102274656, "global_step": 66957, "epoch": 562, "lr": 9.65387956269559e-07} +{"train_loss": 0.000266825663857162, "global_step": 66958, "epoch": 562, "lr": 9.649547449229023e-07} +{"train_loss": 0.0002560793946031481, "global_step": 66959, "epoch": 562, "lr": 9.645216298513226e-07} +{"train_loss": 0.00018338683003094047, "global_step": 66960, "epoch": 562, "lr": 9.640886110556635e-07} +{"train_loss": 0.0001606243458809331, "global_step": 66961, "epoch": 562, "lr": 9.636556885367743e-07} +{"train_loss": 0.00020444330584723502, "global_step": 66962, "epoch": 562, "lr": 9.632228622955153e-07} +{"train_loss": 0.0004578759544529021, "global_step": 66963, "epoch": 562, "lr": 9.627901323327248e-07} +{"train_loss": 0.0005402854876592755, "global_step": 66964, "epoch": 562, "lr": 9.623574986492633e-07} +{"train_loss": 0.00033453310607001185, "global_step": 66965, "epoch": 562, "lr": 9.619249612459636e-07} +{"train_loss": 0.00017881586973089725, "global_step": 66966, "epoch": 562, "lr": 9.614925201236969e-07} +{"train_loss": 0.000312647083774209, "global_step": 66967, "epoch": 562, "lr": 9.610601752832904e-07} +{"train_loss": 0.0002363382518524304, "global_step": 66968, "epoch": 562, "lr": 9.606279267256102e-07} +{"train_loss": 0.00040998609620146453, "global_step": 66969, "epoch": 562, "lr": 9.60195774451489e-07} +{"train_loss": 0.00019554971368052065, "global_step": 66970, "epoch": 562, "lr": 9.597637184617924e-07} +{"train_loss": 0.0004289564967621118, "global_step": 66971, "epoch": 562, "lr": 9.593317587573646e-07} +{"train_loss": 0.0003029010258615017, "global_step": 66972, "epoch": 562, "lr": 9.588998953390383e-07} +{"train_loss": 0.00022229223395697773, "global_step": 66973, "epoch": 562, "lr": 9.584681282076847e-07} +{"train_loss": 0.0002595119585748762, "global_step": 66974, "epoch": 562, "lr": 9.58036457364131e-07} +{"train_loss": 0.00016622099792584777, "global_step": 66975, "epoch": 562, "lr": 9.576048828092376e-07} +{"train_loss": 0.00047888842527754605, "global_step": 66976, "epoch": 562, "lr": 9.57173404543843e-07} +{"train_loss": 0.00019639298261608928, "global_step": 66977, "epoch": 562, "lr": 9.567420225688017e-07} +{"train_loss": 0.0003186065296176821, "global_step": 66978, "epoch": 562, "lr": 9.563107368849578e-07} +{"train_loss": 0.00040969401015900075, "global_step": 66979, "epoch": 562, "lr": 9.558795474931547e-07} +{"train_loss": 0.0003968864621128887, "global_step": 66980, "epoch": 562, "lr": 9.554484543942532e-07} +{"train_loss": 0.00018845680460799485, "global_step": 66981, "epoch": 562, "lr": 9.550174575890746e-07} +{"train_loss": 0.000241927380557172, "global_step": 66982, "epoch": 562, "lr": 9.545865570784907e-07} +{"train_loss": 0.00020142158609814942, "global_step": 66983, "epoch": 562, "lr": 9.541557528633338e-07} +{"train_loss": 0.00025107141118496656, "global_step": 66984, "epoch": 562, "lr": 9.53725044944448e-07} +{"train_loss": 0.0001209491238114424, "global_step": 66985, "epoch": 562, "lr": 9.532944333226879e-07} +{"train_loss": 0.0002805010590236634, "global_step": 66986, "epoch": 562, "lr": 9.528639179988919e-07} +{"train_loss": 0.00015603064093738794, "global_step": 66987, "epoch": 562, "lr": 9.524334989739092e-07} +{"train_loss": 0.0002949357149191201, "global_step": 66988, "epoch": 562, "lr": 9.520031762485837e-07} +{"train_loss": 0.00021338110673241317, "global_step": 66989, "epoch": 562, "lr": 9.515729498237591e-07} +{"train_loss": 0.00022418532171286643, "global_step": 66990, "epoch": 562, "lr": 9.511428197002847e-07} +{"train_loss": 0.00018038458074443042, "global_step": 66991, "epoch": 562, "lr": 9.507127858789933e-07} +{"train_loss": 0.0004301680310163647, "global_step": 66992, "epoch": 562, "lr": 9.502828483607395e-07} +{"train_loss": 0.0003036647103726864, "global_step": 66993, "epoch": 562, "lr": 9.498530071463674e-07} +{"train_loss": 0.00022652701591141522, "global_step": 66994, "epoch": 562, "lr": 9.49423262236715e-07} +{"train_loss": 0.00019266424351371825, "global_step": 66995, "epoch": 562, "lr": 9.489936136326372e-07} +{"train_loss": 0.0002827560433119089, "global_step": 66996, "epoch": 562, "lr": 9.485640613349612e-07, "val_loss": 0.02789705991744995} +{"train_loss": 0.00019614097254816443, "global_step": 66997, "epoch": 563, "lr": 9.481346053445472e-07} +{"train_loss": 0.0003622022341005504, "global_step": 66998, "epoch": 563, "lr": 9.477052456622227e-07} +{"train_loss": 0.00035167986061424017, "global_step": 66999, "epoch": 563, "lr": 9.472759822888477e-07} +{"train_loss": 0.0002872347249649465, "global_step": 67000, "epoch": 563, "lr": 9.468468152252496e-07} +{"train_loss": 0.0003201626241207123, "global_step": 67001, "epoch": 563, "lr": 9.464177444722777e-07} +{"train_loss": 0.00022742836154066026, "global_step": 67002, "epoch": 563, "lr": 9.459887700307757e-07} +{"train_loss": 0.00020717702864203602, "global_step": 67003, "epoch": 563, "lr": 9.455598919015817e-07} +{"train_loss": 0.00031501773628406227, "global_step": 67004, "epoch": 563, "lr": 9.451311100855453e-07} +{"train_loss": 0.00015001824067439884, "global_step": 67005, "epoch": 563, "lr": 9.44702424583499e-07} +{"train_loss": 0.0003280236560385674, "global_step": 67006, "epoch": 563, "lr": 9.442738353962865e-07} +{"train_loss": 0.00016500464698765427, "global_step": 67007, "epoch": 563, "lr": 9.438453425247574e-07} +{"train_loss": 0.00033874125801958144, "global_step": 67008, "epoch": 563, "lr": 9.43416945969744e-07} +{"train_loss": 0.00039737403858453035, "global_step": 67009, "epoch": 563, "lr": 9.429886457320903e-07} +{"train_loss": 0.00040572191937826574, "global_step": 67010, "epoch": 563, "lr": 9.425604418126344e-07} +{"train_loss": 0.0007097974303178489, "global_step": 67011, "epoch": 563, "lr": 9.421323342122257e-07} +{"train_loss": 0.00022703951981384307, "global_step": 67012, "epoch": 563, "lr": 9.417043229316969e-07} +{"train_loss": 0.00021828107128385454, "global_step": 67013, "epoch": 563, "lr": 9.412764079718916e-07} +{"train_loss": 0.00033491605427116156, "global_step": 67014, "epoch": 563, "lr": 9.408485893336483e-07} +{"train_loss": 0.00034637219505384564, "global_step": 67015, "epoch": 563, "lr": 9.40420867017805e-07} +{"train_loss": 0.000307130569126457, "global_step": 67016, "epoch": 563, "lr": 9.39993241025211e-07} +{"train_loss": 0.0004054898163303733, "global_step": 67017, "epoch": 563, "lr": 9.39565711356688e-07} +{"train_loss": 0.00021122448379173875, "global_step": 67018, "epoch": 563, "lr": 9.391382780130964e-07} +{"train_loss": 0.0005814533215016127, "global_step": 67019, "epoch": 563, "lr": 9.387109409952577e-07} +{"train_loss": 0.00018455827375873923, "global_step": 67020, "epoch": 563, "lr": 9.382837003040268e-07} +{"train_loss": 0.00024153286358341575, "global_step": 67021, "epoch": 563, "lr": 9.378565559402308e-07} +{"train_loss": 0.0002679124881979078, "global_step": 67022, "epoch": 563, "lr": 9.37429507904708e-07} +{"train_loss": 0.0003418580745346844, "global_step": 67023, "epoch": 563, "lr": 9.370025561983076e-07} +{"train_loss": 0.0004735066322609782, "global_step": 67024, "epoch": 563, "lr": 9.365757008218567e-07} +{"train_loss": 0.00020308401144575328, "global_step": 67025, "epoch": 563, "lr": 9.361489417761993e-07} +{"train_loss": 0.00034668564330786467, "global_step": 67026, "epoch": 563, "lr": 9.357222790621678e-07} +{"train_loss": 0.0003206591645721346, "global_step": 67027, "epoch": 563, "lr": 9.352957126806061e-07} +{"train_loss": 0.00013759586727246642, "global_step": 67028, "epoch": 563, "lr": 9.348692426323524e-07} +{"train_loss": 0.0007845804211683571, "global_step": 67029, "epoch": 563, "lr": 9.344428689182339e-07} +{"train_loss": 0.00038656379911117256, "global_step": 67030, "epoch": 563, "lr": 9.340165915390997e-07} +{"train_loss": 0.00023747843806631863, "global_step": 67031, "epoch": 563, "lr": 9.335904104957827e-07} +{"train_loss": 0.0001709974167170003, "global_step": 67032, "epoch": 563, "lr": 9.33164325789121e-07} +{"train_loss": 0.00022491721028927714, "global_step": 67033, "epoch": 563, "lr": 9.327383374199472e-07} +{"train_loss": 0.0007784009794704616, "global_step": 67034, "epoch": 563, "lr": 9.323124453890997e-07} +{"train_loss": 0.00019139946380164474, "global_step": 67035, "epoch": 563, "lr": 9.318866496974165e-07} +{"train_loss": 0.0003468459763098508, "global_step": 67036, "epoch": 563, "lr": 9.31460950345725e-07} +{"train_loss": 0.0001647362660150975, "global_step": 67037, "epoch": 563, "lr": 9.310353473348743e-07} +{"train_loss": 0.00015008293848950416, "global_step": 67038, "epoch": 563, "lr": 9.30609840665686e-07} +{"train_loss": 0.00032878771889954805, "global_step": 67039, "epoch": 563, "lr": 9.30184430339015e-07} +{"train_loss": 0.00019433762645348907, "global_step": 67040, "epoch": 563, "lr": 9.297591163556774e-07} +{"train_loss": 0.00039688742253929377, "global_step": 67041, "epoch": 563, "lr": 9.293338987165112e-07} +{"train_loss": 0.0001995539787458256, "global_step": 67042, "epoch": 563, "lr": 9.28908777422366e-07} +{"train_loss": 0.0004294376412872225, "global_step": 67043, "epoch": 563, "lr": 9.284837524740575e-07} +{"train_loss": 0.0005156445549800992, "global_step": 67044, "epoch": 563, "lr": 9.280588238724297e-07} +{"train_loss": 0.0004053459269925952, "global_step": 67045, "epoch": 563, "lr": 9.276339916183208e-07} +{"train_loss": 0.00019309596973471344, "global_step": 67046, "epoch": 563, "lr": 9.272092557125523e-07} +{"train_loss": 0.00013167335418984294, "global_step": 67047, "epoch": 563, "lr": 9.267846161559734e-07} +{"train_loss": 0.00044850181438960135, "global_step": 67048, "epoch": 563, "lr": 9.263600729494059e-07} +{"train_loss": 0.00046836017281748354, "global_step": 67049, "epoch": 563, "lr": 9.25935626093688e-07} +{"train_loss": 0.00014726152585353702, "global_step": 67050, "epoch": 563, "lr": 9.255112755896522e-07} +{"train_loss": 0.00013790823868475854, "global_step": 67051, "epoch": 563, "lr": 9.250870214381313e-07} +{"train_loss": 0.0003094507264904678, "global_step": 67052, "epoch": 563, "lr": 9.246628636399634e-07} +{"train_loss": 0.000513117469381541, "global_step": 67053, "epoch": 563, "lr": 9.242388021959758e-07} +{"train_loss": 0.0002367132401559502, "global_step": 67054, "epoch": 563, "lr": 9.23814837107001e-07} +{"train_loss": 0.00029629701748490334, "global_step": 67055, "epoch": 563, "lr": 9.233909683738717e-07} +{"train_loss": 0.00026036534109152853, "global_step": 67056, "epoch": 563, "lr": 9.229671959974207e-07} +{"train_loss": 0.00023948019952513278, "global_step": 67057, "epoch": 563, "lr": 9.225435199784805e-07} +{"train_loss": 0.00026358896866440773, "global_step": 67058, "epoch": 563, "lr": 9.221199403178893e-07} +{"train_loss": 0.00015432151849381626, "global_step": 67059, "epoch": 563, "lr": 9.216964570164632e-07} +{"train_loss": 0.0002659890742506832, "global_step": 67060, "epoch": 563, "lr": 9.212730700750516e-07} +{"train_loss": 0.00018104739137925208, "global_step": 67061, "epoch": 563, "lr": 9.208497794944704e-07} +{"train_loss": 0.00020368023251648992, "global_step": 67062, "epoch": 563, "lr": 9.204265852755578e-07} +{"train_loss": 0.00013761462469119579, "global_step": 67063, "epoch": 563, "lr": 9.200034874191466e-07} +{"train_loss": 0.0003056755813304335, "global_step": 67064, "epoch": 563, "lr": 9.195804859260638e-07} +{"train_loss": 0.0003850635257549584, "global_step": 67065, "epoch": 563, "lr": 9.19157580797142e-07} +{"train_loss": 0.00019392847025301307, "global_step": 67066, "epoch": 563, "lr": 9.18734772033214e-07} +{"train_loss": 0.0003553146671038121, "global_step": 67067, "epoch": 563, "lr": 9.183120596351014e-07} +{"train_loss": 0.00028497978928498924, "global_step": 67068, "epoch": 563, "lr": 9.178894436036422e-07} +{"train_loss": 0.0002869316376745701, "global_step": 67069, "epoch": 563, "lr": 9.174669239396583e-07} +{"train_loss": 0.0006152440328150988, "global_step": 67070, "epoch": 563, "lr": 9.170445006439931e-07} +{"train_loss": 0.0001870219421107322, "global_step": 67071, "epoch": 563, "lr": 9.16622173717463e-07} +{"train_loss": 0.00023897446226328611, "global_step": 67072, "epoch": 563, "lr": 9.161999431609003e-07} +{"train_loss": 0.00022673903731629252, "global_step": 67073, "epoch": 563, "lr": 9.157778089751378e-07} +{"train_loss": 0.0002372947201365605, "global_step": 67074, "epoch": 563, "lr": 9.153557711609973e-07} +{"train_loss": 0.00031285773729905486, "global_step": 67075, "epoch": 563, "lr": 9.149338297193166e-07} +{"train_loss": 0.00022302808065433055, "global_step": 67076, "epoch": 563, "lr": 9.145119846509232e-07} +{"train_loss": 0.000366274849511683, "global_step": 67077, "epoch": 563, "lr": 9.140902359566328e-07} +{"train_loss": 0.0003036905254703015, "global_step": 67078, "epoch": 563, "lr": 9.136685836372838e-07} +{"train_loss": 0.00018993523553945124, "global_step": 67079, "epoch": 563, "lr": 9.132470276937033e-07} +{"train_loss": 0.00016039081674534827, "global_step": 67080, "epoch": 563, "lr": 9.128255681267184e-07} +{"train_loss": 0.0003468781360425055, "global_step": 67081, "epoch": 563, "lr": 9.124042049371561e-07} +{"train_loss": 0.000316089135594666, "global_step": 67082, "epoch": 563, "lr": 9.119829381258494e-07} +{"train_loss": 0.00028118619229644537, "global_step": 67083, "epoch": 563, "lr": 9.115617676936139e-07} +{"train_loss": 0.0003410334757063538, "global_step": 67084, "epoch": 563, "lr": 9.111406936412825e-07} +{"train_loss": 0.000302240252494812, "global_step": 67085, "epoch": 563, "lr": 9.107197159696823e-07} +{"train_loss": 0.0002918924728874117, "global_step": 67086, "epoch": 563, "lr": 9.102988346796404e-07} +{"train_loss": 0.00016217754455283284, "global_step": 67087, "epoch": 563, "lr": 9.098780497719839e-07} +{"train_loss": 0.0001210509508382529, "global_step": 67088, "epoch": 563, "lr": 9.094573612475343e-07} +{"train_loss": 0.00023107550805434585, "global_step": 67089, "epoch": 563, "lr": 9.090367691071244e-07} +{"train_loss": 0.00024583807680755854, "global_step": 67090, "epoch": 563, "lr": 9.086162733515702e-07} +{"train_loss": 0.0003197953919880092, "global_step": 67091, "epoch": 563, "lr": 9.081958739817098e-07} +{"train_loss": 0.0002940312842838466, "global_step": 67092, "epoch": 563, "lr": 9.077755709983537e-07} +{"train_loss": 0.00027210472035221756, "global_step": 67093, "epoch": 563, "lr": 9.073553644023458e-07} +{"train_loss": 0.00019299998530186713, "global_step": 67094, "epoch": 563, "lr": 9.069352541944909e-07} +{"train_loss": 0.000259772757999599, "global_step": 67095, "epoch": 563, "lr": 9.065152403756328e-07} +{"train_loss": 0.00043140019988641143, "global_step": 67096, "epoch": 563, "lr": 9.060953229465818e-07} +{"train_loss": 0.00045332525041885674, "global_step": 67097, "epoch": 563, "lr": 9.056755019081709e-07} +{"train_loss": 0.00022808463836554438, "global_step": 67098, "epoch": 563, "lr": 9.052557772612158e-07} +{"train_loss": 0.00023899381631053984, "global_step": 67099, "epoch": 563, "lr": 9.048361490065549e-07} +{"train_loss": 0.0002505062730051577, "global_step": 67100, "epoch": 563, "lr": 9.04416617144993e-07} +{"train_loss": 0.0002839961089193821, "global_step": 67101, "epoch": 563, "lr": 9.03997181677374e-07} +{"train_loss": 0.00023881603556219488, "global_step": 67102, "epoch": 563, "lr": 9.035778426045083e-07} +{"train_loss": 0.00020484028209466487, "global_step": 67103, "epoch": 563, "lr": 9.031585999272174e-07} +{"train_loss": 0.00014042369730304927, "global_step": 67104, "epoch": 563, "lr": 9.02739453646334e-07} +{"train_loss": 0.00036163523327559233, "global_step": 67105, "epoch": 563, "lr": 9.023204037626687e-07} +{"train_loss": 0.00024300141376443207, "global_step": 67106, "epoch": 563, "lr": 9.019014502770596e-07} +{"train_loss": 0.0003209422284271568, "global_step": 67107, "epoch": 563, "lr": 9.014825931903226e-07} +{"train_loss": 0.00025984825333580375, "global_step": 67108, "epoch": 563, "lr": 9.010638325032739e-07} +{"train_loss": 0.00018264558457303792, "global_step": 67109, "epoch": 563, "lr": 9.00645168216746e-07} +{"train_loss": 0.00025422527687624097, "global_step": 67110, "epoch": 563, "lr": 9.002266003315552e-07} +{"train_loss": 0.00018589157843962312, "global_step": 67111, "epoch": 563, "lr": 8.998081288485228e-07} +{"train_loss": 0.0002376189368078485, "global_step": 67112, "epoch": 563, "lr": 8.993897537684703e-07} +{"train_loss": 0.00018731328600551933, "global_step": 67113, "epoch": 563, "lr": 8.989714750922196e-07} +{"train_loss": 0.0002425810816930607, "global_step": 67114, "epoch": 563, "lr": 8.985532928205975e-07} +{"train_loss": 0.0002901446791571181, "global_step": 67115, "epoch": 563, "lr": 8.981352069544146e-07, "val_loss": 0.026968616992235184} +{"train_loss": 0.00031051013502292335, "global_step": 67116, "epoch": 564, "lr": 8.977172174945036e-07} +{"train_loss": 0.00022234332573134452, "global_step": 67117, "epoch": 564, "lr": 8.972993244416694e-07} +{"train_loss": 0.00015847408212721348, "global_step": 67118, "epoch": 564, "lr": 8.968815277967502e-07} +{"train_loss": 0.00017504306742921472, "global_step": 67119, "epoch": 564, "lr": 8.964638275605563e-07} +{"train_loss": 0.00021284696413204074, "global_step": 67120, "epoch": 564, "lr": 8.960462237339095e-07} +{"train_loss": 0.00013925340317655355, "global_step": 67121, "epoch": 564, "lr": 8.956287163176314e-07} +{"train_loss": 0.0005093950894661248, "global_step": 67122, "epoch": 564, "lr": 8.952113053125377e-07} +{"train_loss": 0.00014471373287960887, "global_step": 67123, "epoch": 564, "lr": 8.947939907194502e-07} +{"train_loss": 0.0001648055185796693, "global_step": 67124, "epoch": 564, "lr": 8.943767725391905e-07} +{"train_loss": 0.00029958991217426956, "global_step": 67125, "epoch": 564, "lr": 8.939596507725745e-07} +{"train_loss": 0.00021860662673134357, "global_step": 67126, "epoch": 564, "lr": 8.935426254204238e-07} +{"train_loss": 0.00016906342352740467, "global_step": 67127, "epoch": 564, "lr": 8.931256964835544e-07} +{"train_loss": 0.0003183024819009006, "global_step": 67128, "epoch": 564, "lr": 8.927088639627878e-07} +{"train_loss": 0.00017048198787961155, "global_step": 67129, "epoch": 564, "lr": 8.922921278589403e-07} +{"train_loss": 0.00017859718354884535, "global_step": 67130, "epoch": 564, "lr": 8.918754881728331e-07} +{"train_loss": 0.00011809411807917058, "global_step": 67131, "epoch": 564, "lr": 8.914589449052768e-07} +{"train_loss": 0.0001541988312965259, "global_step": 67132, "epoch": 564, "lr": 8.910424980570986e-07} +{"train_loss": 0.00018795633513946086, "global_step": 67133, "epoch": 564, "lr": 8.906261476291144e-07} +{"train_loss": 0.0002552375372033566, "global_step": 67134, "epoch": 564, "lr": 8.902098936221349e-07} +{"train_loss": 0.0002191998646594584, "global_step": 67135, "epoch": 564, "lr": 8.897937360369812e-07} +{"train_loss": 0.00022732400975655764, "global_step": 67136, "epoch": 564, "lr": 8.893776748744697e-07} +{"train_loss": 0.00016253345529548824, "global_step": 67137, "epoch": 564, "lr": 8.889617101354219e-07} +{"train_loss": 0.00014872393512632698, "global_step": 67138, "epoch": 564, "lr": 8.885458418206483e-07} +{"train_loss": 0.00019337676349096, "global_step": 67139, "epoch": 564, "lr": 8.881300699309759e-07} +{"train_loss": 0.0002538174157962203, "global_step": 67140, "epoch": 564, "lr": 8.877143944672095e-07} +{"train_loss": 0.0001441322674509138, "global_step": 67141, "epoch": 564, "lr": 8.872988154301598e-07} +{"train_loss": 0.00013314625539351255, "global_step": 67142, "epoch": 564, "lr": 8.868833328206649e-07} +{"train_loss": 0.00022151721350383013, "global_step": 67143, "epoch": 564, "lr": 8.864679466395188e-07} +{"train_loss": 0.00014344493683893234, "global_step": 67144, "epoch": 564, "lr": 8.860526568875482e-07} +{"train_loss": 0.00023463628895115107, "global_step": 67145, "epoch": 564, "lr": 8.856374635655695e-07} +{"train_loss": 0.00018801780242938548, "global_step": 67146, "epoch": 564, "lr": 8.852223666743876e-07} +{"train_loss": 0.00021301128435879946, "global_step": 67147, "epoch": 564, "lr": 8.848073662148349e-07} +{"train_loss": 0.00015163507487159222, "global_step": 67148, "epoch": 564, "lr": 8.843924621877053e-07} +{"train_loss": 0.0002690156106837094, "global_step": 67149, "epoch": 564, "lr": 8.839776545938317e-07} +{"train_loss": 0.0001268508640350774, "global_step": 67150, "epoch": 564, "lr": 8.835629434340132e-07} +{"train_loss": 0.00018708115385379642, "global_step": 67151, "epoch": 564, "lr": 8.831483287090769e-07} +{"train_loss": 0.00027692975709214807, "global_step": 67152, "epoch": 564, "lr": 8.827338104198335e-07} +{"train_loss": 0.00015942273603286594, "global_step": 67153, "epoch": 564, "lr": 8.823193885670877e-07} +{"train_loss": 0.0002178241848014295, "global_step": 67154, "epoch": 564, "lr": 8.819050631516668e-07} +{"train_loss": 0.00012902633170597255, "global_step": 67155, "epoch": 564, "lr": 8.814908341743699e-07} +{"train_loss": 0.00042724175727926195, "global_step": 67156, "epoch": 564, "lr": 8.810767016360244e-07} +{"train_loss": 0.00046022384776733816, "global_step": 67157, "epoch": 564, "lr": 8.806626655374351e-07} +{"train_loss": 0.0001612713822396472, "global_step": 67158, "epoch": 564, "lr": 8.802487258794179e-07} +{"train_loss": 0.00019811400852631778, "global_step": 67159, "epoch": 564, "lr": 8.798348826627833e-07} +{"train_loss": 0.0003480352752376348, "global_step": 67160, "epoch": 564, "lr": 8.794211358883475e-07} +{"train_loss": 0.0001855979789979756, "global_step": 67161, "epoch": 564, "lr": 8.790074855569208e-07} +{"train_loss": 0.00020558830874506384, "global_step": 67162, "epoch": 564, "lr": 8.785939316693137e-07} +{"train_loss": 0.0004065735556650907, "global_step": 67163, "epoch": 564, "lr": 8.781804742263366e-07} +{"train_loss": 0.0004358259029686451, "global_step": 67164, "epoch": 564, "lr": 8.777671132288112e-07} +{"train_loss": 0.0002916937810368836, "global_step": 67165, "epoch": 564, "lr": 8.773538486775368e-07} +{"train_loss": 0.0001462857035221532, "global_step": 67166, "epoch": 564, "lr": 8.769406805733349e-07} +{"train_loss": 0.0001924501993926242, "global_step": 67167, "epoch": 564, "lr": 8.765276089170049e-07} +{"train_loss": 0.00017723981000017375, "global_step": 67168, "epoch": 564, "lr": 8.761146337093684e-07} +{"train_loss": 0.00020576755923684686, "global_step": 67169, "epoch": 564, "lr": 8.757017549512358e-07} +{"train_loss": 0.0003694807237479836, "global_step": 67170, "epoch": 564, "lr": 8.752889726434122e-07} +{"train_loss": 0.00013485830277204514, "global_step": 67171, "epoch": 564, "lr": 8.748762867867133e-07} +{"train_loss": 0.00037791923386976123, "global_step": 67172, "epoch": 564, "lr": 8.744636973819387e-07} +{"train_loss": 0.0002708549436647445, "global_step": 67173, "epoch": 564, "lr": 8.740512044299154e-07} +{"train_loss": 0.00029272763640619814, "global_step": 67174, "epoch": 564, "lr": 8.736388079314373e-07} +{"train_loss": 0.0005138504202477634, "global_step": 67175, "epoch": 564, "lr": 8.732265078873259e-07} +{"train_loss": 0.00023170854547061026, "global_step": 67176, "epoch": 564, "lr": 8.728143042983805e-07} +{"train_loss": 0.00015482233720831573, "global_step": 67177, "epoch": 564, "lr": 8.724021971654173e-07} +{"train_loss": 0.0002978051779791713, "global_step": 67178, "epoch": 564, "lr": 8.719901864892521e-07} +{"train_loss": 0.00040674570482224226, "global_step": 67179, "epoch": 564, "lr": 8.715782722706733e-07} +{"train_loss": 0.000182760224561207, "global_step": 67180, "epoch": 564, "lr": 8.71166454510508e-07} +{"train_loss": 0.0002175044792238623, "global_step": 67181, "epoch": 564, "lr": 8.707547332095611e-07} +{"train_loss": 0.00015578747843392193, "global_step": 67182, "epoch": 564, "lr": 8.703431083686376e-07} +{"train_loss": 0.0004376260912977159, "global_step": 67183, "epoch": 564, "lr": 8.699315799885421e-07} +{"train_loss": 0.00012371031334623694, "global_step": 67184, "epoch": 564, "lr": 8.695201480700909e-07} +{"train_loss": 0.00018146642833016813, "global_step": 67185, "epoch": 564, "lr": 8.691088126140889e-07} +{"train_loss": 0.0002473150088917464, "global_step": 67186, "epoch": 564, "lr": 8.686975736213409e-07} +{"train_loss": 0.00034491479163989425, "global_step": 67187, "epoch": 564, "lr": 8.682864310926575e-07} +{"train_loss": 0.00020397342450451106, "global_step": 67188, "epoch": 564, "lr": 8.678753850288379e-07} +{"train_loss": 0.00037471341784112155, "global_step": 67189, "epoch": 564, "lr": 8.674644354307038e-07} +{"train_loss": 0.00021921754523646086, "global_step": 67190, "epoch": 564, "lr": 8.670535822990544e-07} +{"train_loss": 0.00031912201666273177, "global_step": 67191, "epoch": 564, "lr": 8.666428256346948e-07} +{"train_loss": 0.0002720485790632665, "global_step": 67192, "epoch": 564, "lr": 8.662321654384298e-07} +{"train_loss": 0.00023113613133318722, "global_step": 67193, "epoch": 564, "lr": 8.658216017110698e-07} +{"train_loss": 0.00025818016729317605, "global_step": 67194, "epoch": 564, "lr": 8.6541113445342e-07} +{"train_loss": 0.0003051246458198875, "global_step": 67195, "epoch": 564, "lr": 8.650007636662905e-07} +{"train_loss": 0.00023108275490812957, "global_step": 67196, "epoch": 564, "lr": 8.645904893504753e-07} +{"train_loss": 0.0006489574443548918, "global_step": 67197, "epoch": 564, "lr": 8.641803115067959e-07} +{"train_loss": 0.00029187914333306253, "global_step": 67198, "epoch": 564, "lr": 8.637702301360406e-07} +{"train_loss": 0.0003884162870235741, "global_step": 67199, "epoch": 564, "lr": 8.633602452390311e-07} +{"train_loss": 0.00030514737591147423, "global_step": 67200, "epoch": 564, "lr": 8.629503568165554e-07} +{"train_loss": 0.0003705799172166735, "global_step": 67201, "epoch": 564, "lr": 8.625405648694351e-07} +{"train_loss": 0.00026900292141363025, "global_step": 67202, "epoch": 564, "lr": 8.621308693984697e-07} +{"train_loss": 0.00025690995971672237, "global_step": 67203, "epoch": 564, "lr": 8.617212704044531e-07} +{"train_loss": 0.0001918275811476633, "global_step": 67204, "epoch": 564, "lr": 8.613117678881955e-07} +{"train_loss": 0.0002996076946146786, "global_step": 67205, "epoch": 564, "lr": 8.609023618505075e-07} +{"train_loss": 0.0004199373070150614, "global_step": 67206, "epoch": 564, "lr": 8.604930522921883e-07} +{"train_loss": 0.0001836260053096339, "global_step": 67207, "epoch": 564, "lr": 8.600838392140376e-07} +{"train_loss": 0.0002660284808371216, "global_step": 67208, "epoch": 564, "lr": 8.596747226168655e-07} +{"train_loss": 0.0003847979533020407, "global_step": 67209, "epoch": 564, "lr": 8.592657025014716e-07} +{"train_loss": 0.00023323504137806594, "global_step": 67210, "epoch": 564, "lr": 8.588567788686552e-07} +{"train_loss": 0.0005012866458855569, "global_step": 67211, "epoch": 564, "lr": 8.584479517192323e-07} +{"train_loss": 0.00021906739857513458, "global_step": 67212, "epoch": 564, "lr": 8.580392210539911e-07} +{"train_loss": 0.0004726740880869329, "global_step": 67213, "epoch": 564, "lr": 8.576305868737422e-07} +{"train_loss": 0.0002491686900611967, "global_step": 67214, "epoch": 564, "lr": 8.572220491792849e-07} +{"train_loss": 0.00039934201049618423, "global_step": 67215, "epoch": 564, "lr": 8.568136079714184e-07} +{"train_loss": 0.0003472477837931365, "global_step": 67216, "epoch": 564, "lr": 8.564052632509534e-07} +{"train_loss": 0.00030978303402662277, "global_step": 67217, "epoch": 564, "lr": 8.55997015018678e-07} +{"train_loss": 0.00020465585112106055, "global_step": 67218, "epoch": 564, "lr": 8.555888632754139e-07} +{"train_loss": 0.00027160224271938205, "global_step": 67219, "epoch": 564, "lr": 8.551808080219381e-07} +{"train_loss": 0.00013813770783599466, "global_step": 67220, "epoch": 564, "lr": 8.547728492590779e-07} +{"train_loss": 0.0003805918386206031, "global_step": 67221, "epoch": 564, "lr": 8.543649869876102e-07} +{"train_loss": 0.0002059697435470298, "global_step": 67222, "epoch": 564, "lr": 8.539572212083513e-07} +{"train_loss": 0.0002571847289800644, "global_step": 67223, "epoch": 564, "lr": 8.535495519220948e-07} +{"train_loss": 0.00020734305144287646, "global_step": 67224, "epoch": 564, "lr": 8.531419791296458e-07} +{"train_loss": 0.00020168948685750365, "global_step": 67225, "epoch": 564, "lr": 8.527345028317979e-07} +{"train_loss": 0.00022839210578240454, "global_step": 67226, "epoch": 564, "lr": 8.523271230293617e-07} +{"train_loss": 0.0003208428679499775, "global_step": 67227, "epoch": 564, "lr": 8.519198397231254e-07} +{"train_loss": 0.00017394722090102732, "global_step": 67228, "epoch": 564, "lr": 8.515126529138939e-07} +{"train_loss": 0.0003800858976319432, "global_step": 67229, "epoch": 564, "lr": 8.511055626024666e-07} +{"train_loss": 0.00015421994612552226, "global_step": 67230, "epoch": 564, "lr": 8.506985687896485e-07} +{"train_loss": 0.0004672121722251177, "global_step": 67231, "epoch": 564, "lr": 8.502916714762221e-07} +{"train_loss": 0.0003440521832089871, "global_step": 67232, "epoch": 564, "lr": 8.498848706630092e-07} +{"train_loss": 0.00020130458869971335, "global_step": 67233, "epoch": 564, "lr": 8.494781663507922e-07} +{"train_loss": 0.00025945580444599995, "global_step": 67234, "epoch": 564, "lr": 8.490715585403652e-07, "val_loss": 0.0256974995136261} +{"train_loss": 0.0002885143621824682, "global_step": 67235, "epoch": 565, "lr": 8.486650472325442e-07} +{"train_loss": 0.00036769130383618176, "global_step": 67236, "epoch": 565, "lr": 8.482586324281172e-07} +{"train_loss": 0.00019026230438612401, "global_step": 67237, "epoch": 565, "lr": 8.478523141278838e-07} +{"train_loss": 0.0004193591885268688, "global_step": 67238, "epoch": 565, "lr": 8.474460923326377e-07} +{"train_loss": 0.00019831271492876112, "global_step": 67239, "epoch": 565, "lr": 8.470399670431839e-07} +{"train_loss": 0.00016583323304075748, "global_step": 67240, "epoch": 565, "lr": 8.466339382603161e-07} +{"train_loss": 0.0002263039059471339, "global_step": 67241, "epoch": 565, "lr": 8.462280059848283e-07} +{"train_loss": 0.000867938157171011, "global_step": 67242, "epoch": 565, "lr": 8.458221702175251e-07} +{"train_loss": 0.00016463738575112075, "global_step": 67243, "epoch": 565, "lr": 8.454164309591894e-07} +{"train_loss": 0.00035340749309398234, "global_step": 67244, "epoch": 565, "lr": 8.450107882106373e-07} +{"train_loss": 0.00017435444169677794, "global_step": 67245, "epoch": 565, "lr": 8.446052419726513e-07} +{"train_loss": 0.000304122397210449, "global_step": 67246, "epoch": 565, "lr": 8.44199792246031e-07} +{"train_loss": 0.00021228447440080345, "global_step": 67247, "epoch": 565, "lr": 8.437944390315755e-07} +{"train_loss": 0.00021483587624970824, "global_step": 67248, "epoch": 565, "lr": 8.433891823300733e-07} +{"train_loss": 0.00028222231776453555, "global_step": 67249, "epoch": 565, "lr": 8.429840221423235e-07} +{"train_loss": 0.0003210743307135999, "global_step": 67250, "epoch": 565, "lr": 8.425789584691257e-07} +{"train_loss": 0.00040442057070322335, "global_step": 67251, "epoch": 565, "lr": 8.421739913112737e-07} +{"train_loss": 0.00031548069091513753, "global_step": 67252, "epoch": 565, "lr": 8.417691206695666e-07} +{"train_loss": 0.0005197509890422225, "global_step": 67253, "epoch": 565, "lr": 8.413643465447818e-07} +{"train_loss": 0.00017828328418545425, "global_step": 67254, "epoch": 565, "lr": 8.409596689377352e-07} +{"train_loss": 0.00016071624122560024, "global_step": 67255, "epoch": 565, "lr": 8.405550878492097e-07} +{"train_loss": 0.00015111538232304156, "global_step": 67256, "epoch": 565, "lr": 8.401506032799988e-07} +{"train_loss": 0.00017729881801642478, "global_step": 67257, "epoch": 565, "lr": 8.397462152309077e-07} +{"train_loss": 0.00026500181411392987, "global_step": 67258, "epoch": 565, "lr": 8.393419237027133e-07} +{"train_loss": 0.00021998301963321865, "global_step": 67259, "epoch": 565, "lr": 8.389377286962318e-07} +{"train_loss": 0.0001389921671943739, "global_step": 67260, "epoch": 565, "lr": 8.385336302122348e-07} +{"train_loss": 0.0003862805024255067, "global_step": 67261, "epoch": 565, "lr": 8.381296282515272e-07} +{"train_loss": 0.00021890518837608397, "global_step": 67262, "epoch": 565, "lr": 8.377257228148971e-07} +{"train_loss": 0.00044713239185512066, "global_step": 67263, "epoch": 565, "lr": 8.373219139031441e-07} +{"train_loss": 0.0003256131603848189, "global_step": 67264, "epoch": 565, "lr": 8.369182015170563e-07} +{"train_loss": 0.0002206522913184017, "global_step": 67265, "epoch": 565, "lr": 8.365145856574275e-07} +{"train_loss": 0.00033203416387550533, "global_step": 67266, "epoch": 565, "lr": 8.361110663250516e-07} +{"train_loss": 0.00022816566342953593, "global_step": 67267, "epoch": 565, "lr": 8.357076435207168e-07} +{"train_loss": 0.0004390842223074287, "global_step": 67268, "epoch": 565, "lr": 8.353043172452168e-07} +{"train_loss": 0.00032837578328326344, "global_step": 67269, "epoch": 565, "lr": 8.349010874993457e-07} +{"train_loss": 0.0002774439053609967, "global_step": 67270, "epoch": 565, "lr": 8.344979542838971e-07} +{"train_loss": 0.000154047243995592, "global_step": 67271, "epoch": 565, "lr": 8.340949175996538e-07} +{"train_loss": 0.0002522532595321536, "global_step": 67272, "epoch": 565, "lr": 8.33691977447415e-07} +{"train_loss": 0.00031237758230417967, "global_step": 67273, "epoch": 565, "lr": 8.332891338279691e-07} +{"train_loss": 0.00021748582366853952, "global_step": 67274, "epoch": 565, "lr": 8.328863867421044e-07} +{"train_loss": 0.00014973928045947105, "global_step": 67275, "epoch": 565, "lr": 8.324837361906202e-07} +{"train_loss": 0.00020283329649828374, "global_step": 67276, "epoch": 565, "lr": 8.320811821742935e-07} +{"train_loss": 0.00014011608436703682, "global_step": 67277, "epoch": 565, "lr": 8.316787246939295e-07} +{"train_loss": 0.00041279676952399313, "global_step": 67278, "epoch": 565, "lr": 8.312763637503163e-07} +{"train_loss": 0.0003622517688199878, "global_step": 67279, "epoch": 565, "lr": 8.308740993442254e-07} +{"train_loss": 0.00013302708975970745, "global_step": 67280, "epoch": 565, "lr": 8.30471931476473e-07} +{"train_loss": 0.00028112955624237657, "global_step": 67281, "epoch": 565, "lr": 8.300698601478252e-07} +{"train_loss": 0.00031204530387185514, "global_step": 67282, "epoch": 565, "lr": 8.296678853590923e-07} +{"train_loss": 0.00017861790547613055, "global_step": 67283, "epoch": 565, "lr": 8.292660071110459e-07} +{"train_loss": 0.0004346968198660761, "global_step": 67284, "epoch": 565, "lr": 8.288642254044854e-07} +{"train_loss": 0.00023678733850829303, "global_step": 67285, "epoch": 565, "lr": 8.284625402401991e-07} +{"train_loss": 0.00025883811758831143, "global_step": 67286, "epoch": 565, "lr": 8.280609516189641e-07} +{"train_loss": 0.0004058523045387119, "global_step": 67287, "epoch": 565, "lr": 8.27659459541591e-07} +{"train_loss": 0.00016439550381619483, "global_step": 67288, "epoch": 565, "lr": 8.272580640088456e-07} +{"train_loss": 0.00038107633008621633, "global_step": 67289, "epoch": 565, "lr": 8.268567650215275e-07} +{"train_loss": 0.0001580696552991867, "global_step": 67290, "epoch": 565, "lr": 8.264555625804249e-07} +{"train_loss": 0.0002567150804679841, "global_step": 67291, "epoch": 565, "lr": 8.260544566863204e-07} +{"train_loss": 0.0001398894819431007, "global_step": 67292, "epoch": 565, "lr": 8.256534473400079e-07} +{"train_loss": 0.00018664805975276977, "global_step": 67293, "epoch": 565, "lr": 8.252525345422701e-07} +{"train_loss": 0.00012988712114747614, "global_step": 67294, "epoch": 565, "lr": 8.248517182938952e-07} +{"train_loss": 0.00023901788517832756, "global_step": 67295, "epoch": 565, "lr": 8.244509985956716e-07} +{"train_loss": 0.00027582081384025514, "global_step": 67296, "epoch": 565, "lr": 8.240503754483819e-07} +{"train_loss": 0.00018259903299622238, "global_step": 67297, "epoch": 565, "lr": 8.236498488528199e-07} +{"train_loss": 0.0002301307104062289, "global_step": 67298, "epoch": 565, "lr": 8.232494188097628e-07} +{"train_loss": 0.00032749533420428634, "global_step": 67299, "epoch": 565, "lr": 8.2284908532001e-07} +{"train_loss": 0.0003037899441551417, "global_step": 67300, "epoch": 565, "lr": 8.224488483843328e-07} +{"train_loss": 0.00018763543630484492, "global_step": 67301, "epoch": 565, "lr": 8.220487080035255e-07} +{"train_loss": 0.00021469885541591793, "global_step": 67302, "epoch": 565, "lr": 8.216486641783704e-07} +{"train_loss": 0.0001580378011567518, "global_step": 67303, "epoch": 565, "lr": 8.212487169096506e-07} +{"train_loss": 0.00035468919668346643, "global_step": 67304, "epoch": 565, "lr": 8.208488661981595e-07} +{"train_loss": 0.00028245546855032444, "global_step": 67305, "epoch": 565, "lr": 8.204491120446745e-07} +{"train_loss": 0.0005030684405937791, "global_step": 67306, "epoch": 565, "lr": 8.200494544499892e-07} +{"train_loss": 0.00019428759696893394, "global_step": 67307, "epoch": 565, "lr": 8.196498934148756e-07} +{"train_loss": 0.00019149186846334487, "global_step": 67308, "epoch": 565, "lr": 8.192504289401326e-07} +{"train_loss": 0.00020600609423127025, "global_step": 67309, "epoch": 565, "lr": 8.188510610265377e-07} +{"train_loss": 0.00028155167819932103, "global_step": 67310, "epoch": 565, "lr": 8.184517896748678e-07} +{"train_loss": 0.00017958601529244334, "global_step": 67311, "epoch": 565, "lr": 8.180526148859168e-07} +{"train_loss": 0.0002530212514102459, "global_step": 67312, "epoch": 565, "lr": 8.176535366604621e-07} +{"train_loss": 0.000295671314233914, "global_step": 67313, "epoch": 565, "lr": 8.172545549992972e-07} +{"train_loss": 0.0003469412913545966, "global_step": 67314, "epoch": 565, "lr": 8.168556699031938e-07} +{"train_loss": 0.0003118080203421414, "global_step": 67315, "epoch": 565, "lr": 8.1645688137294e-07} +{"train_loss": 0.0002329656999791041, "global_step": 67316, "epoch": 565, "lr": 8.160581894093189e-07} +{"train_loss": 0.00032914301846176386, "global_step": 67317, "epoch": 565, "lr": 8.156595940131129e-07} +{"train_loss": 0.00025476934388279915, "global_step": 67318, "epoch": 565, "lr": 8.152610951851047e-07} +{"train_loss": 0.00033745597465895116, "global_step": 67319, "epoch": 565, "lr": 8.148626929260772e-07} +{"train_loss": 0.00018317383364774287, "global_step": 67320, "epoch": 565, "lr": 8.144643872368129e-07} +{"train_loss": 0.0004706301260739565, "global_step": 67321, "epoch": 565, "lr": 8.140661781180892e-07} +{"train_loss": 0.000155651054228656, "global_step": 67322, "epoch": 565, "lr": 8.136680655706941e-07} +{"train_loss": 0.0004108435823582113, "global_step": 67323, "epoch": 565, "lr": 8.132700495954049e-07} +{"train_loss": 0.0002447766892146319, "global_step": 67324, "epoch": 565, "lr": 8.128721301930098e-07} +{"train_loss": 0.00021309434669092298, "global_step": 67325, "epoch": 565, "lr": 8.124743073642804e-07} +{"train_loss": 0.00022740193526260555, "global_step": 67326, "epoch": 565, "lr": 8.120765811100051e-07} +{"train_loss": 0.00019164128752890974, "global_step": 67327, "epoch": 565, "lr": 8.116789514309664e-07} +{"train_loss": 0.0005130149656906724, "global_step": 67328, "epoch": 565, "lr": 8.11281418327936e-07} +{"train_loss": 0.000286141294054687, "global_step": 67329, "epoch": 565, "lr": 8.108839818017022e-07} +{"train_loss": 0.0002824993571266532, "global_step": 67330, "epoch": 565, "lr": 8.104866418530422e-07} +{"train_loss": 0.00024515073164366186, "global_step": 67331, "epoch": 565, "lr": 8.100893984827329e-07} +{"train_loss": 0.0002141989825759083, "global_step": 67332, "epoch": 565, "lr": 8.096922516915628e-07} +{"train_loss": 0.00015591322153341025, "global_step": 67333, "epoch": 565, "lr": 8.092952014803091e-07} +{"train_loss": 0.0006360599654726684, "global_step": 67334, "epoch": 565, "lr": 8.088982478497431e-07} +{"train_loss": 0.00019146503473166376, "global_step": 67335, "epoch": 565, "lr": 8.085013908006534e-07} +{"train_loss": 0.0003517236327752471, "global_step": 67336, "epoch": 565, "lr": 8.081046303338113e-07} +{"train_loss": 0.00024570204550400376, "global_step": 67337, "epoch": 565, "lr": 8.077079664500053e-07} +{"train_loss": 0.0001437448663637042, "global_step": 67338, "epoch": 565, "lr": 8.073113991500069e-07} +{"train_loss": 0.00023931142641231418, "global_step": 67339, "epoch": 565, "lr": 8.069149284345989e-07} +{"train_loss": 0.000334147218381986, "global_step": 67340, "epoch": 565, "lr": 8.065185543045583e-07} +{"train_loss": 0.00019252031052019447, "global_step": 67341, "epoch": 565, "lr": 8.061222767606569e-07} +{"train_loss": 0.0004478215123526752, "global_step": 67342, "epoch": 565, "lr": 8.057260958036827e-07} +{"train_loss": 0.0004320983134675771, "global_step": 67343, "epoch": 565, "lr": 8.053300114344131e-07} +{"train_loss": 0.00043961461051367223, "global_step": 67344, "epoch": 565, "lr": 8.049340236536196e-07} +{"train_loss": 0.0001826016086852178, "global_step": 67345, "epoch": 565, "lr": 8.045381324620793e-07} +{"train_loss": 0.00023153520305640996, "global_step": 67346, "epoch": 565, "lr": 8.04142337860575e-07} +{"train_loss": 0.00018703793466556817, "global_step": 67347, "epoch": 565, "lr": 8.037466398498839e-07} +{"train_loss": 0.00022284565784502774, "global_step": 67348, "epoch": 565, "lr": 8.033510384307774e-07} +{"train_loss": 0.00020157323160674423, "global_step": 67349, "epoch": 565, "lr": 8.029555336040384e-07} +{"train_loss": 0.00015485193580389023, "global_step": 67350, "epoch": 565, "lr": 8.025601253704385e-07} +{"train_loss": 0.00022367699421010911, "global_step": 67351, "epoch": 565, "lr": 8.021648137307547e-07} +{"train_loss": 0.00038891242002137005, "global_step": 67352, "epoch": 565, "lr": 8.017695986857699e-07} +{"train_loss": 0.0002740767873440157, "global_step": 67353, "epoch": 565, "lr": 8.013744802362444e-07, "val_loss": 0.02537049911916256, "train_action_mse_error": 3.7419154068629723e-06} +{"train_loss": 0.00023790205887053162, "global_step": 67354, "epoch": 566, "lr": 8.009794583829666e-07} +{"train_loss": 0.0002670690882951021, "global_step": 67355, "epoch": 566, "lr": 8.005845331267137e-07} +{"train_loss": 0.00026748195523396134, "global_step": 67356, "epoch": 566, "lr": 8.001897044682572e-07} +{"train_loss": 0.0002530292549636215, "global_step": 67357, "epoch": 566, "lr": 7.997949724083687e-07} +{"train_loss": 0.0001804997882572934, "global_step": 67358, "epoch": 566, "lr": 7.994003369478254e-07} +{"train_loss": 0.0004516707267612219, "global_step": 67359, "epoch": 566, "lr": 7.990057980874099e-07} +{"train_loss": 0.0005444613634608686, "global_step": 67360, "epoch": 566, "lr": 7.98611355827883e-07} +{"train_loss": 0.000465763034299016, "global_step": 67361, "epoch": 566, "lr": 7.982170101700326e-07} +{"train_loss": 0.00024594232672825456, "global_step": 67362, "epoch": 566, "lr": 7.978227611146194e-07} +{"train_loss": 0.0002532679063733667, "global_step": 67363, "epoch": 566, "lr": 7.974286086624316e-07} +{"train_loss": 0.00018027100304607302, "global_step": 67364, "epoch": 566, "lr": 7.970345528142298e-07} +{"train_loss": 0.00026875047478824854, "global_step": 67365, "epoch": 566, "lr": 7.966405935708022e-07} +{"train_loss": 0.0003324537829030305, "global_step": 67366, "epoch": 566, "lr": 7.962467309329092e-07} +{"train_loss": 0.00014171322982292622, "global_step": 67367, "epoch": 566, "lr": 7.95852964901328e-07} +{"train_loss": 0.0002464198914822191, "global_step": 67368, "epoch": 566, "lr": 7.954592954768358e-07} +{"train_loss": 0.0003317795635666698, "global_step": 67369, "epoch": 566, "lr": 7.950657226601987e-07} +{"train_loss": 0.00037088870885781944, "global_step": 67370, "epoch": 566, "lr": 7.946722464521994e-07} +{"train_loss": 0.0001708915806375444, "global_step": 67371, "epoch": 566, "lr": 7.942788668536039e-07} +{"train_loss": 0.00015431649808306247, "global_step": 67372, "epoch": 566, "lr": 7.938855838651782e-07} +{"train_loss": 0.0003221596125513315, "global_step": 67373, "epoch": 566, "lr": 7.934923974877051e-07} +{"train_loss": 0.0001855384762166068, "global_step": 67374, "epoch": 566, "lr": 7.930993077219506e-07} +{"train_loss": 0.00016356195555999875, "global_step": 67375, "epoch": 566, "lr": 7.92706314568692e-07} +{"train_loss": 0.00027609188691712916, "global_step": 67376, "epoch": 566, "lr": 7.92313418028695e-07} +{"train_loss": 0.0002156491536879912, "global_step": 67377, "epoch": 566, "lr": 7.919206181027372e-07} +{"train_loss": 0.00039735838072374463, "global_step": 67378, "epoch": 566, "lr": 7.915279147915844e-07} +{"train_loss": 0.0004637463134713471, "global_step": 67379, "epoch": 566, "lr": 7.911353080960027e-07} +{"train_loss": 0.00029809068655595183, "global_step": 67380, "epoch": 566, "lr": 7.907427980167803e-07} +{"train_loss": 0.0002153828536393121, "global_step": 67381, "epoch": 566, "lr": 7.903503845546667e-07} +{"train_loss": 0.00030460822745226324, "global_step": 67382, "epoch": 566, "lr": 7.899580677104501e-07} +{"train_loss": 0.0003723558329511434, "global_step": 67383, "epoch": 566, "lr": 7.895658474848966e-07} +{"train_loss": 0.0002636340504977852, "global_step": 67384, "epoch": 566, "lr": 7.891737238787667e-07} +{"train_loss": 0.00019546192197594792, "global_step": 67385, "epoch": 566, "lr": 7.887816968928375e-07} +{"train_loss": 0.0006156868766993284, "global_step": 67386, "epoch": 566, "lr": 7.883897665278805e-07} +{"train_loss": 0.00018527811334934086, "global_step": 67387, "epoch": 566, "lr": 7.87997932784662e-07} +{"train_loss": 0.0002387349377386272, "global_step": 67388, "epoch": 566, "lr": 7.87606195663948e-07} +{"train_loss": 0.0003103085036855191, "global_step": 67389, "epoch": 566, "lr": 7.872145551665156e-07} +{"train_loss": 0.0008957522222772241, "global_step": 67390, "epoch": 566, "lr": 7.868230112931308e-07} +{"train_loss": 0.00027205643709748983, "global_step": 67391, "epoch": 566, "lr": 7.864315640445541e-07} +{"train_loss": 0.00024421754642389715, "global_step": 67392, "epoch": 566, "lr": 7.860402134215683e-07} +{"train_loss": 0.00021943324827589095, "global_step": 67393, "epoch": 566, "lr": 7.856489594249339e-07} +{"train_loss": 0.00015563468332402408, "global_step": 67394, "epoch": 566, "lr": 7.852578020554225e-07} +{"train_loss": 0.0003232391318306327, "global_step": 67395, "epoch": 566, "lr": 7.848667413137944e-07} +{"train_loss": 0.000116499031719286, "global_step": 67396, "epoch": 566, "lr": 7.844757772008215e-07} +{"train_loss": 0.0002500611008144915, "global_step": 67397, "epoch": 566, "lr": 7.840849097172809e-07} +{"train_loss": 0.00018594253924675286, "global_step": 67398, "epoch": 566, "lr": 7.836941388639219e-07} +{"train_loss": 0.00018984792404808104, "global_step": 67399, "epoch": 566, "lr": 7.833034646415271e-07} +{"train_loss": 0.00034467634395696223, "global_step": 67400, "epoch": 566, "lr": 7.829128870508573e-07} +{"train_loss": 0.0001865569211076945, "global_step": 67401, "epoch": 566, "lr": 7.825224060926839e-07} +{"train_loss": 0.00017034901247825474, "global_step": 67402, "epoch": 566, "lr": 7.821320217677619e-07} +{"train_loss": 0.0004050015704706311, "global_step": 67403, "epoch": 566, "lr": 7.817417340768685e-07} +{"train_loss": 0.0002754111192189157, "global_step": 67404, "epoch": 566, "lr": 7.813515430207696e-07} +{"train_loss": 0.0002089370391331613, "global_step": 67405, "epoch": 566, "lr": 7.809614486002259e-07} +{"train_loss": 0.0002460227406118065, "global_step": 67406, "epoch": 566, "lr": 7.805714508160089e-07} +{"train_loss": 0.00023862988746259362, "global_step": 67407, "epoch": 566, "lr": 7.801815496688736e-07} +{"train_loss": 0.00022203251137398183, "global_step": 67408, "epoch": 566, "lr": 7.797917451596027e-07} +{"train_loss": 0.00032687175553292036, "global_step": 67409, "epoch": 566, "lr": 7.79402037288951e-07} +{"train_loss": 0.0002554049133323133, "global_step": 67410, "epoch": 566, "lr": 7.790124260576792e-07} +{"train_loss": 0.00020279509772080928, "global_step": 67411, "epoch": 566, "lr": 7.786229114665644e-07} +{"train_loss": 0.00023041077656671405, "global_step": 67412, "epoch": 566, "lr": 7.782334935163615e-07} +{"train_loss": 0.00021269723947625607, "global_step": 67413, "epoch": 566, "lr": 7.778441722078422e-07} +{"train_loss": 0.00020390792633406818, "global_step": 67414, "epoch": 566, "lr": 7.774549475417614e-07} +{"train_loss": 0.00019600176892708987, "global_step": 67415, "epoch": 566, "lr": 7.770658195188907e-07} +{"train_loss": 0.0004209196486044675, "global_step": 67416, "epoch": 566, "lr": 7.766767881399961e-07} +{"train_loss": 0.0001582149852765724, "global_step": 67417, "epoch": 566, "lr": 7.762878534058382e-07} +{"train_loss": 0.0001887917605927214, "global_step": 67418, "epoch": 566, "lr": 7.758990153171775e-07} +{"train_loss": 0.00022359068680088967, "global_step": 67419, "epoch": 566, "lr": 7.7551027387478e-07} +{"train_loss": 0.0002525885938666761, "global_step": 67420, "epoch": 566, "lr": 7.751216290794117e-07} +{"train_loss": 0.000273947196546942, "global_step": 67421, "epoch": 566, "lr": 7.747330809318276e-07} +{"train_loss": 0.00014614569954574108, "global_step": 67422, "epoch": 566, "lr": 7.743446294327994e-07} +{"train_loss": 0.0001422171335434541, "global_step": 67423, "epoch": 566, "lr": 7.739562745830875e-07} +{"train_loss": 0.00016038375906646252, "global_step": 67424, "epoch": 566, "lr": 7.735680163834525e-07} +{"train_loss": 0.0001594049681443721, "global_step": 67425, "epoch": 566, "lr": 7.731798548346547e-07} +{"train_loss": 0.0002427215367788449, "global_step": 67426, "epoch": 566, "lr": 7.727917899374604e-07} +{"train_loss": 0.00020656890410464257, "global_step": 67427, "epoch": 566, "lr": 7.724038216926355e-07} +{"train_loss": 0.00017962997662834823, "global_step": 67428, "epoch": 566, "lr": 7.72015950100935e-07} +{"train_loss": 0.0001974147162400186, "global_step": 67429, "epoch": 566, "lr": 7.716281751631194e-07} +{"train_loss": 0.00011816091137006879, "global_step": 67430, "epoch": 566, "lr": 7.712404968799548e-07} +{"train_loss": 0.00019362369494047016, "global_step": 67431, "epoch": 566, "lr": 7.708529152521959e-07} +{"train_loss": 0.00020045024575665593, "global_step": 67432, "epoch": 566, "lr": 7.704654302806146e-07} +{"train_loss": 0.0005591466906480491, "global_step": 67433, "epoch": 566, "lr": 7.700780419659603e-07} +{"train_loss": 0.00020090796169824898, "global_step": 67434, "epoch": 566, "lr": 7.696907503089989e-07} +{"train_loss": 0.0002386501873843372, "global_step": 67435, "epoch": 566, "lr": 7.69303555310491e-07} +{"train_loss": 0.0003281830286141485, "global_step": 67436, "epoch": 566, "lr": 7.689164569711971e-07} +{"train_loss": 0.0002611922100186348, "global_step": 67437, "epoch": 566, "lr": 7.685294552918775e-07} +{"train_loss": 0.00037192265153862536, "global_step": 67438, "epoch": 566, "lr": 7.681425502732819e-07} +{"train_loss": 0.00017129701154772192, "global_step": 67439, "epoch": 566, "lr": 7.677557419161874e-07} +{"train_loss": 0.0005300728371366858, "global_step": 67440, "epoch": 566, "lr": 7.673690302213432e-07} +{"train_loss": 0.0002750452549662441, "global_step": 67441, "epoch": 566, "lr": 7.669824151895099e-07} +{"train_loss": 0.00023374386364594102, "global_step": 67442, "epoch": 566, "lr": 7.665958968214481e-07} +{"train_loss": 0.00030611082911491394, "global_step": 67443, "epoch": 566, "lr": 7.662094751179127e-07} +{"train_loss": 0.0002229156089015305, "global_step": 67444, "epoch": 566, "lr": 7.658231500796642e-07} +{"train_loss": 0.00021549283701460809, "global_step": 67445, "epoch": 566, "lr": 7.654369217074631e-07} +{"train_loss": 0.00030452938517555594, "global_step": 67446, "epoch": 566, "lr": 7.650507900020698e-07} +{"train_loss": 0.00021098372235428542, "global_step": 67447, "epoch": 566, "lr": 7.646647549642394e-07} +{"train_loss": 0.00032324803760275245, "global_step": 67448, "epoch": 566, "lr": 7.642788165947268e-07} +{"train_loss": 0.00014794617891311646, "global_step": 67449, "epoch": 566, "lr": 7.638929748942924e-07} +{"train_loss": 0.0002504938165657222, "global_step": 67450, "epoch": 566, "lr": 7.635072298636914e-07} +{"train_loss": 0.00012014267849735916, "global_step": 67451, "epoch": 566, "lr": 7.631215815036896e-07} +{"train_loss": 0.000221418755245395, "global_step": 67452, "epoch": 566, "lr": 7.627360298150365e-07} +{"train_loss": 0.0002304230583831668, "global_step": 67453, "epoch": 566, "lr": 7.623505747984927e-07} +{"train_loss": 0.00024629381368868053, "global_step": 67454, "epoch": 566, "lr": 7.619652164548075e-07} +{"train_loss": 0.0002458378439769149, "global_step": 67455, "epoch": 566, "lr": 7.615799547847469e-07} +{"train_loss": 0.0001300234580412507, "global_step": 67456, "epoch": 566, "lr": 7.611947897890604e-07} +{"train_loss": 0.0002563112648203969, "global_step": 67457, "epoch": 566, "lr": 7.608097214685139e-07} +{"train_loss": 0.00018305933917872608, "global_step": 67458, "epoch": 566, "lr": 7.604247498238515e-07} +{"train_loss": 0.000280647975159809, "global_step": 67459, "epoch": 566, "lr": 7.600398748558391e-07} +{"train_loss": 0.0002993604284711182, "global_step": 67460, "epoch": 566, "lr": 7.59655096565226e-07} +{"train_loss": 0.0001788504741853103, "global_step": 67461, "epoch": 566, "lr": 7.592704149527674e-07} +{"train_loss": 0.0002636332646943629, "global_step": 67462, "epoch": 566, "lr": 7.588858300192236e-07} +{"train_loss": 0.0002822823007591069, "global_step": 67463, "epoch": 566, "lr": 7.585013417653442e-07} +{"train_loss": 0.0002757023030426353, "global_step": 67464, "epoch": 566, "lr": 7.581169501918895e-07} +{"train_loss": 0.00038862202200107276, "global_step": 67465, "epoch": 566, "lr": 7.577326552996089e-07} +{"train_loss": 0.0001925867109093815, "global_step": 67466, "epoch": 566, "lr": 7.57348457089263e-07} +{"train_loss": 0.0003117932647000998, "global_step": 67467, "epoch": 566, "lr": 7.569643555616013e-07} +{"train_loss": 0.000116008821350988, "global_step": 67468, "epoch": 566, "lr": 7.565803507173785e-07} +{"train_loss": 0.0002722533536143601, "global_step": 67469, "epoch": 566, "lr": 7.561964425573498e-07} +{"train_loss": 0.0003079743473790586, "global_step": 67470, "epoch": 566, "lr": 7.5581263108227e-07} +{"train_loss": 0.000547465868294239, "global_step": 67471, "epoch": 566, "lr": 7.554289162928885e-07} +{"train_loss": 0.00026273722122051606, "global_step": 67472, "epoch": 566, "lr": 7.550452981899602e-07, "val_loss": 0.023302394896745682} +{"train_loss": 0.00020257409778423607, "global_step": 67473, "epoch": 567, "lr": 7.546617767742459e-07} +{"train_loss": 0.0007277908152900636, "global_step": 67474, "epoch": 567, "lr": 7.542783520464835e-07} +{"train_loss": 0.00029286730568856, "global_step": 67475, "epoch": 567, "lr": 7.538950240074394e-07} +{"train_loss": 0.000376431125914678, "global_step": 67476, "epoch": 567, "lr": 7.535117926578572e-07} +{"train_loss": 0.00017365541134495288, "global_step": 67477, "epoch": 567, "lr": 7.531286579984975e-07} +{"train_loss": 0.0003814231895375997, "global_step": 67478, "epoch": 567, "lr": 7.527456200301097e-07} +{"train_loss": 0.00012836570385843515, "global_step": 67479, "epoch": 567, "lr": 7.523626787534432e-07} +{"train_loss": 0.00019436435832176358, "global_step": 67480, "epoch": 567, "lr": 7.51979834169253e-07} +{"train_loss": 0.0003050153609365225, "global_step": 67481, "epoch": 567, "lr": 7.515970862782829e-07} +{"train_loss": 0.0001533164904685691, "global_step": 67482, "epoch": 567, "lr": 7.512144350812933e-07} +{"train_loss": 0.00046362963621504605, "global_step": 67483, "epoch": 567, "lr": 7.508318805790337e-07} +{"train_loss": 0.0002295918093295768, "global_step": 67484, "epoch": 567, "lr": 7.504494227722536e-07} +{"train_loss": 0.00015988011728040874, "global_step": 67485, "epoch": 567, "lr": 7.500670616617078e-07} +{"train_loss": 0.00015420872659888119, "global_step": 67486, "epoch": 567, "lr": 7.496847972481402e-07} +{"train_loss": 0.000183043084689416, "global_step": 67487, "epoch": 567, "lr": 7.493026295323003e-07} +{"train_loss": 0.00034845448681153357, "global_step": 67488, "epoch": 567, "lr": 7.489205585149484e-07} +{"train_loss": 0.0001896954490803182, "global_step": 67489, "epoch": 567, "lr": 7.485385841968284e-07} +{"train_loss": 0.00016023909847717732, "global_step": 67490, "epoch": 567, "lr": 7.481567065786954e-07} +{"train_loss": 0.00015538131992798299, "global_step": 67491, "epoch": 567, "lr": 7.477749256612876e-07} +{"train_loss": 0.0002165002515539527, "global_step": 67492, "epoch": 567, "lr": 7.473932414453655e-07} +{"train_loss": 0.0002952486393041909, "global_step": 67493, "epoch": 567, "lr": 7.47011653931673e-07} +{"train_loss": 0.0001962863461812958, "global_step": 67494, "epoch": 567, "lr": 7.466301631209649e-07} +{"train_loss": 0.00024455093080177903, "global_step": 67495, "epoch": 567, "lr": 7.462487690139852e-07} +{"train_loss": 0.0004247937467880547, "global_step": 67496, "epoch": 567, "lr": 7.458674716114833e-07} +{"train_loss": 0.00014286258374340832, "global_step": 67497, "epoch": 567, "lr": 7.45486270914214e-07} +{"train_loss": 0.0002980870194733143, "global_step": 67498, "epoch": 567, "lr": 7.451051669229103e-07} +{"train_loss": 0.00014568014012183994, "global_step": 67499, "epoch": 567, "lr": 7.447241596383381e-07} +{"train_loss": 0.0002389199216850102, "global_step": 67500, "epoch": 567, "lr": 7.443432490612301e-07} +{"train_loss": 0.0003108849923592061, "global_step": 67501, "epoch": 567, "lr": 7.439624351923524e-07} +{"train_loss": 0.0003542782797012478, "global_step": 67502, "epoch": 567, "lr": 7.435817180324378e-07} +{"train_loss": 0.0003008594794664532, "global_step": 67503, "epoch": 567, "lr": 7.432010975822356e-07} +{"train_loss": 0.00020904603297822177, "global_step": 67504, "epoch": 567, "lr": 7.428205738425009e-07} +{"train_loss": 0.00016720397979952395, "global_step": 67505, "epoch": 567, "lr": 7.424401468139664e-07} +{"train_loss": 0.00026561642880551517, "global_step": 67506, "epoch": 567, "lr": 7.42059816497398e-07} +{"train_loss": 0.00036357794306240976, "global_step": 67507, "epoch": 567, "lr": 7.416795828935231e-07} +{"train_loss": 0.00027835945365950465, "global_step": 67508, "epoch": 567, "lr": 7.412994460031076e-07} +{"train_loss": 0.00021952387760393322, "global_step": 67509, "epoch": 567, "lr": 7.409194058268842e-07} +{"train_loss": 0.00018080341396853328, "global_step": 67510, "epoch": 567, "lr": 7.405394623656025e-07} +{"train_loss": 0.00018452735093887895, "global_step": 67511, "epoch": 567, "lr": 7.401596156200119e-07} +{"train_loss": 0.0001653656509006396, "global_step": 67512, "epoch": 567, "lr": 7.397798655908506e-07} +{"train_loss": 0.00031266489531844854, "global_step": 67513, "epoch": 567, "lr": 7.394002122788734e-07} +{"train_loss": 0.00034468717058189213, "global_step": 67514, "epoch": 567, "lr": 7.390206556848133e-07} +{"train_loss": 0.0003201088111381978, "global_step": 67515, "epoch": 567, "lr": 7.386411958094308e-07} +{"train_loss": 0.0002765286772046238, "global_step": 67516, "epoch": 567, "lr": 7.38261832653464e-07} +{"train_loss": 0.00043250093585811555, "global_step": 67517, "epoch": 567, "lr": 7.378825662176514e-07} +{"train_loss": 0.0001714718237053603, "global_step": 67518, "epoch": 567, "lr": 7.375033965027478e-07} +{"train_loss": 0.0003529424429871142, "global_step": 67519, "epoch": 567, "lr": 7.371243235094915e-07} +{"train_loss": 0.00015361122495960444, "global_step": 67520, "epoch": 567, "lr": 7.367453472386321e-07} +{"train_loss": 0.000310930801788345, "global_step": 67521, "epoch": 567, "lr": 7.363664676909077e-07} +{"train_loss": 0.00024673412553966045, "global_step": 67522, "epoch": 567, "lr": 7.359876848670621e-07} +{"train_loss": 0.0002617734717205167, "global_step": 67523, "epoch": 567, "lr": 7.356089987678449e-07} +{"train_loss": 0.00034164797398261726, "global_step": 67524, "epoch": 567, "lr": 7.352304093939944e-07} +{"train_loss": 0.0002515648666303605, "global_step": 67525, "epoch": 567, "lr": 7.348519167462598e-07} +{"train_loss": 0.00013489657430909574, "global_step": 67526, "epoch": 567, "lr": 7.344735208253739e-07} +{"train_loss": 0.0005322244251146913, "global_step": 67527, "epoch": 567, "lr": 7.340952216320918e-07} +{"train_loss": 0.0005628478829748929, "global_step": 67528, "epoch": 567, "lr": 7.33717019167146e-07} +{"train_loss": 0.00041552219772711396, "global_step": 67529, "epoch": 567, "lr": 7.333389134312863e-07} +{"train_loss": 0.00035410368582233787, "global_step": 67530, "epoch": 567, "lr": 7.329609044252505e-07} +{"train_loss": 0.0002120838180417195, "global_step": 67531, "epoch": 567, "lr": 7.325829921497829e-07} +{"train_loss": 0.00015847961185500026, "global_step": 67532, "epoch": 567, "lr": 7.322051766056271e-07} +{"train_loss": 0.00039770451257936656, "global_step": 67533, "epoch": 567, "lr": 7.318274577935213e-07} +{"train_loss": 0.00035013764863833785, "global_step": 67534, "epoch": 567, "lr": 7.314498357142096e-07} +{"train_loss": 0.00014751518028788269, "global_step": 67535, "epoch": 567, "lr": 7.310723103684358e-07} +{"train_loss": 0.00020777554891537875, "global_step": 67536, "epoch": 567, "lr": 7.306948817569326e-07} +{"train_loss": 0.00013608056178782135, "global_step": 67537, "epoch": 567, "lr": 7.303175498804493e-07} +{"train_loss": 0.00025145916151814163, "global_step": 67538, "epoch": 567, "lr": 7.299403147397188e-07} +{"train_loss": 0.0002271150442538783, "global_step": 67539, "epoch": 567, "lr": 7.295631763354904e-07} +{"train_loss": 0.00014297290181275457, "global_step": 67540, "epoch": 567, "lr": 7.291861346685081e-07} +{"train_loss": 0.00017478778318036348, "global_step": 67541, "epoch": 567, "lr": 7.288091897394933e-07} +{"train_loss": 0.0003170459531247616, "global_step": 67542, "epoch": 567, "lr": 7.284323415492067e-07} +{"train_loss": 0.00024073143140412867, "global_step": 67543, "epoch": 567, "lr": 7.280555900983699e-07} +{"train_loss": 0.00013168921577744186, "global_step": 67544, "epoch": 567, "lr": 7.276789353877378e-07} +{"train_loss": 0.00042796097113750875, "global_step": 67545, "epoch": 567, "lr": 7.273023774180432e-07} +{"train_loss": 0.00048119068378582597, "global_step": 67546, "epoch": 567, "lr": 7.269259161900299e-07} +{"train_loss": 0.0001877540344139561, "global_step": 67547, "epoch": 567, "lr": 7.265495517044307e-07} +{"train_loss": 0.00016214180504903197, "global_step": 67548, "epoch": 567, "lr": 7.261732839619839e-07} +{"train_loss": 0.00025521600036881864, "global_step": 67549, "epoch": 567, "lr": 7.257971129634389e-07} +{"train_loss": 0.00022408908989746124, "global_step": 67550, "epoch": 567, "lr": 7.254210387095173e-07} +{"train_loss": 0.0002483536663930863, "global_step": 67551, "epoch": 567, "lr": 7.25045061200974e-07} +{"train_loss": 0.00024888754705898464, "global_step": 67552, "epoch": 567, "lr": 7.246691804385419e-07} +{"train_loss": 0.00013814886915497482, "global_step": 67553, "epoch": 567, "lr": 7.242933964229537e-07} +{"train_loss": 0.0002768939302768558, "global_step": 67554, "epoch": 567, "lr": 7.239177091549532e-07} +{"train_loss": 0.00035562648554332554, "global_step": 67555, "epoch": 567, "lr": 7.235421186352731e-07} +{"train_loss": 0.0003023357130587101, "global_step": 67556, "epoch": 567, "lr": 7.231666248646573e-07} +{"train_loss": 0.00018805332365445793, "global_step": 67557, "epoch": 567, "lr": 7.227912278438331e-07} +{"train_loss": 0.00025326680042780936, "global_step": 67558, "epoch": 567, "lr": 7.224159275735499e-07} +{"train_loss": 0.0007310541695915163, "global_step": 67559, "epoch": 567, "lr": 7.220407240545402e-07} +{"train_loss": 0.00018546934006735682, "global_step": 67560, "epoch": 567, "lr": 7.216656172875369e-07} +{"train_loss": 0.0002503562718629837, "global_step": 67561, "epoch": 567, "lr": 7.212906072732783e-07} +{"train_loss": 0.00019465196237433702, "global_step": 67562, "epoch": 567, "lr": 7.209156940124973e-07} +{"train_loss": 0.00030683615477755666, "global_step": 67563, "epoch": 567, "lr": 7.205408775059375e-07} +{"train_loss": 0.0003011516237165779, "global_step": 67564, "epoch": 567, "lr": 7.201661577543262e-07} +{"train_loss": 0.000301573978504166, "global_step": 67565, "epoch": 567, "lr": 7.197915347584127e-07} +{"train_loss": 0.0002602119348011911, "global_step": 67566, "epoch": 567, "lr": 7.194170085189189e-07} +{"train_loss": 0.0002788641140796244, "global_step": 67567, "epoch": 567, "lr": 7.190425790365829e-07} +{"train_loss": 0.00026225863257423043, "global_step": 67568, "epoch": 567, "lr": 7.18668246312143e-07} +{"train_loss": 0.00020641105948016047, "global_step": 67569, "epoch": 567, "lr": 7.18294010346332e-07} +{"train_loss": 0.00023057602811604738, "global_step": 67570, "epoch": 567, "lr": 7.179198711398883e-07} +{"train_loss": 0.00036669831024482846, "global_step": 67571, "epoch": 567, "lr": 7.1754582869355e-07} +{"train_loss": 0.00028332864167168736, "global_step": 67572, "epoch": 567, "lr": 7.171718830080332e-07} +{"train_loss": 0.00021530747471842915, "global_step": 67573, "epoch": 567, "lr": 7.167980340840929e-07} +{"train_loss": 0.0002019424136960879, "global_step": 67574, "epoch": 567, "lr": 7.164242819224509e-07} +{"train_loss": 0.0001780137390596792, "global_step": 67575, "epoch": 567, "lr": 7.160506265238454e-07} +{"train_loss": 0.0004096170305274427, "global_step": 67576, "epoch": 567, "lr": 7.156770678890034e-07} +{"train_loss": 0.0001933225867105648, "global_step": 67577, "epoch": 567, "lr": 7.153036060186747e-07} +{"train_loss": 0.00022619817173108459, "global_step": 67578, "epoch": 567, "lr": 7.149302409135749e-07} +{"train_loss": 0.00020271161338314414, "global_step": 67579, "epoch": 567, "lr": 7.145569725744483e-07} +{"train_loss": 0.0001338642614427954, "global_step": 67580, "epoch": 567, "lr": 7.141838010020218e-07} +{"train_loss": 0.0003482136526145041, "global_step": 67581, "epoch": 567, "lr": 7.138107261970283e-07} +{"train_loss": 0.0005104443989694118, "global_step": 67582, "epoch": 567, "lr": 7.134377481602062e-07} +{"train_loss": 0.00016126103582791984, "global_step": 67583, "epoch": 567, "lr": 7.130648668922768e-07} +{"train_loss": 0.00022954141604714096, "global_step": 67584, "epoch": 567, "lr": 7.126920823939842e-07} +{"train_loss": 0.00023153002257458866, "global_step": 67585, "epoch": 567, "lr": 7.123193946660556e-07} +{"train_loss": 0.00021715745970141143, "global_step": 67586, "epoch": 567, "lr": 7.119468037092236e-07} +{"train_loss": 0.0003383222210686654, "global_step": 67587, "epoch": 567, "lr": 7.1157430952421e-07} +{"train_loss": 0.0004936635377816856, "global_step": 67588, "epoch": 567, "lr": 7.112019121117641e-07} +{"train_loss": 0.00017205266340170056, "global_step": 67589, "epoch": 567, "lr": 7.108296114726021e-07} +{"train_loss": 0.00024455314269289374, "global_step": 67590, "epoch": 567, "lr": 7.104574076074622e-07} +{"train_loss": 0.0002694436764254571, "global_step": 67591, "epoch": 567, "lr": 7.100853005170716e-07, "val_loss": 0.01428942009806633} +{"train_loss": 0.00020112156926188618, "global_step": 67592, "epoch": 568, "lr": 7.097132902021685e-07} +{"train_loss": 0.00034191092709079385, "global_step": 67593, "epoch": 568, "lr": 7.093413766634694e-07} +{"train_loss": 0.00015748554142192006, "global_step": 67594, "epoch": 568, "lr": 7.089695599017176e-07} +{"train_loss": 0.0004176414804533124, "global_step": 67595, "epoch": 568, "lr": 7.085978399176351e-07} +{"train_loss": 0.00037683703703805804, "global_step": 67596, "epoch": 568, "lr": 7.082262167119547e-07} +{"train_loss": 0.00014220036973711103, "global_step": 67597, "epoch": 568, "lr": 7.078546902854144e-07} +{"train_loss": 0.0002954180527012795, "global_step": 67598, "epoch": 568, "lr": 7.074832606387249e-07} +{"train_loss": 0.00012009729107376188, "global_step": 67599, "epoch": 568, "lr": 7.071119277726301e-07} +{"train_loss": 0.0002920531842391938, "global_step": 67600, "epoch": 568, "lr": 7.067406916878516e-07} +{"train_loss": 0.00015420795534737408, "global_step": 67601, "epoch": 568, "lr": 7.063695523851277e-07} +{"train_loss": 0.00019003282068297267, "global_step": 67602, "epoch": 568, "lr": 7.059985098651745e-07} +{"train_loss": 0.00020986530580557883, "global_step": 67603, "epoch": 568, "lr": 7.056275641287358e-07} +{"train_loss": 0.0004467770049814135, "global_step": 67604, "epoch": 568, "lr": 7.052567151765221e-07} +{"train_loss": 0.0002682590566109866, "global_step": 67605, "epoch": 568, "lr": 7.048859630092719e-07} +{"train_loss": 0.00031713489443063736, "global_step": 67606, "epoch": 568, "lr": 7.045153076277177e-07} +{"train_loss": 0.0002033802738878876, "global_step": 67607, "epoch": 568, "lr": 7.041447490325759e-07} +{"train_loss": 0.00037670848541893065, "global_step": 67608, "epoch": 568, "lr": 7.03774287224579e-07} +{"train_loss": 0.0001702717418083921, "global_step": 67609, "epoch": 568, "lr": 7.034039222044597e-07} +{"train_loss": 0.00027248088736087084, "global_step": 67610, "epoch": 568, "lr": 7.030336539729343e-07} +{"train_loss": 0.0005746984388679266, "global_step": 67611, "epoch": 568, "lr": 7.026634825307409e-07} +{"train_loss": 0.00020510390459094197, "global_step": 67612, "epoch": 568, "lr": 7.022934078785959e-07} +{"train_loss": 0.00035723153268918395, "global_step": 67613, "epoch": 568, "lr": 7.019234300172373e-07} +{"train_loss": 0.0003149320837110281, "global_step": 67614, "epoch": 568, "lr": 7.015535489473757e-07} +{"train_loss": 0.00033274226007051766, "global_step": 67615, "epoch": 568, "lr": 7.01183764669755e-07} +{"train_loss": 0.00024053585366345942, "global_step": 67616, "epoch": 568, "lr": 7.008140771850969e-07} +{"train_loss": 0.00024722141097299755, "global_step": 67617, "epoch": 568, "lr": 7.004444864941118e-07} +{"train_loss": 0.00016657510423101485, "global_step": 67618, "epoch": 568, "lr": 7.000749925975436e-07} +{"train_loss": 0.00021021488646510988, "global_step": 67619, "epoch": 568, "lr": 6.99705595496114e-07} +{"train_loss": 0.0002984567254316062, "global_step": 67620, "epoch": 568, "lr": 6.993362951905391e-07} +{"train_loss": 0.00015161682676989585, "global_step": 67621, "epoch": 568, "lr": 6.989670916815516e-07} +{"train_loss": 0.0001685577299213037, "global_step": 67622, "epoch": 568, "lr": 6.985979849698787e-07} +{"train_loss": 0.00013561887317337096, "global_step": 67623, "epoch": 568, "lr": 6.98228975056242e-07} +{"train_loss": 0.0002408933505648747, "global_step": 67624, "epoch": 568, "lr": 6.978600619413578e-07} +{"train_loss": 0.00028961285715922713, "global_step": 67625, "epoch": 568, "lr": 6.974912456259697e-07} +{"train_loss": 0.00019876027363352478, "global_step": 67626, "epoch": 568, "lr": 6.971225261107827e-07} +{"train_loss": 0.000245811534114182, "global_step": 67627, "epoch": 568, "lr": 6.967539033965298e-07} +{"train_loss": 0.0002298572799190879, "global_step": 67628, "epoch": 568, "lr": 6.96385377483938e-07} +{"train_loss": 0.0002534861268941313, "global_step": 67629, "epoch": 568, "lr": 6.960169483737178e-07} +{"train_loss": 0.00018496968550607562, "global_step": 67630, "epoch": 568, "lr": 6.956486160666076e-07} +{"train_loss": 0.0002817431522998959, "global_step": 67631, "epoch": 568, "lr": 6.952803805633179e-07} +{"train_loss": 0.00013190093159209937, "global_step": 67632, "epoch": 568, "lr": 6.949122418645815e-07} +{"train_loss": 0.00024972320534288883, "global_step": 67633, "epoch": 568, "lr": 6.945441999711144e-07} +{"train_loss": 0.0001786987850209698, "global_step": 67634, "epoch": 568, "lr": 6.941762548836494e-07} +{"train_loss": 0.00015146652003750205, "global_step": 67635, "epoch": 568, "lr": 6.938084066028971e-07} +{"train_loss": 0.0006297461804933846, "global_step": 67636, "epoch": 568, "lr": 6.934406551295847e-07} +{"train_loss": 0.00045580428559333086, "global_step": 67637, "epoch": 568, "lr": 6.930730004644336e-07} +{"train_loss": 0.00027950998628512025, "global_step": 67638, "epoch": 568, "lr": 6.927054426081658e-07} +{"train_loss": 0.00038745030178688467, "global_step": 67639, "epoch": 568, "lr": 6.923379815615084e-07} +{"train_loss": 0.00035643819137476385, "global_step": 67640, "epoch": 568, "lr": 6.919706173251716e-07} +{"train_loss": 0.00023166922619566321, "global_step": 67641, "epoch": 568, "lr": 6.916033498998831e-07} +{"train_loss": 0.00011424499825807288, "global_step": 67642, "epoch": 568, "lr": 6.912361792863642e-07} +{"train_loss": 0.00021569253294728696, "global_step": 67643, "epoch": 568, "lr": 6.908691054853367e-07} +{"train_loss": 0.0003445748006924987, "global_step": 67644, "epoch": 568, "lr": 6.905021284975166e-07} +{"train_loss": 0.00017976727394852787, "global_step": 67645, "epoch": 568, "lr": 6.901352483236312e-07} +{"train_loss": 0.00021355124772526324, "global_step": 67646, "epoch": 568, "lr": 6.897684649643965e-07} +{"train_loss": 0.0002995251852553338, "global_step": 67647, "epoch": 568, "lr": 6.894017784205342e-07} +{"train_loss": 0.0001630433544050902, "global_step": 67648, "epoch": 568, "lr": 6.890351886927605e-07} +{"train_loss": 0.000239362838328816, "global_step": 67649, "epoch": 568, "lr": 6.886686957818022e-07} +{"train_loss": 0.00029634611564688385, "global_step": 67650, "epoch": 568, "lr": 6.883022996883704e-07} +{"train_loss": 0.00016029764083214104, "global_step": 67651, "epoch": 568, "lr": 6.879360004131918e-07} +{"train_loss": 0.00032827473478391767, "global_step": 67652, "epoch": 568, "lr": 6.875697979569773e-07} +{"train_loss": 0.0002487187448423356, "global_step": 67653, "epoch": 568, "lr": 6.872036923204595e-07} +{"train_loss": 0.00021084319450892508, "global_step": 67654, "epoch": 568, "lr": 6.868376835043433e-07} +{"train_loss": 0.0001410883414791897, "global_step": 67655, "epoch": 568, "lr": 6.864717715093504e-07} +{"train_loss": 0.000232110804063268, "global_step": 67656, "epoch": 568, "lr": 6.861059563362082e-07} +{"train_loss": 0.00021045652101747692, "global_step": 67657, "epoch": 568, "lr": 6.857402379856215e-07} +{"train_loss": 0.0003283125115558505, "global_step": 67658, "epoch": 568, "lr": 6.85374616458323e-07} +{"train_loss": 0.00025767215993255377, "global_step": 67659, "epoch": 568, "lr": 6.850090917550234e-07} +{"train_loss": 0.00031212077010422945, "global_step": 67660, "epoch": 568, "lr": 6.846436638764331e-07} +{"train_loss": 0.00045176123967394233, "global_step": 67661, "epoch": 568, "lr": 6.842783328232849e-07} +{"train_loss": 0.00022742195869795978, "global_step": 67662, "epoch": 568, "lr": 6.839130985962783e-07} +{"train_loss": 0.00030141929164528847, "global_step": 67663, "epoch": 568, "lr": 6.83547961196146e-07} +{"train_loss": 0.0003539668978191912, "global_step": 67664, "epoch": 568, "lr": 6.831829206235929e-07} +{"train_loss": 0.000337564735673368, "global_step": 67665, "epoch": 568, "lr": 6.828179768793463e-07} +{"train_loss": 0.00032052892493084073, "global_step": 67666, "epoch": 568, "lr": 6.824531299641224e-07} +{"train_loss": 0.00038062999374233186, "global_step": 67667, "epoch": 568, "lr": 6.820883798786204e-07} +{"train_loss": 0.00025174813345074654, "global_step": 67668, "epoch": 568, "lr": 6.817237266235787e-07} +{"train_loss": 0.0005778304766863585, "global_step": 67669, "epoch": 568, "lr": 6.813591701996969e-07} +{"train_loss": 0.00019054455333389342, "global_step": 67670, "epoch": 568, "lr": 6.809947106077075e-07} +{"train_loss": 0.00019965331011917442, "global_step": 67671, "epoch": 568, "lr": 6.806303478483045e-07} +{"train_loss": 0.00022842313046567142, "global_step": 67672, "epoch": 568, "lr": 6.802660819222206e-07} +{"train_loss": 0.00016565033001825213, "global_step": 67673, "epoch": 568, "lr": 6.799019128301665e-07} +{"train_loss": 0.00022493855794891715, "global_step": 67674, "epoch": 568, "lr": 6.795378405728526e-07} +{"train_loss": 0.0001612738415133208, "global_step": 67675, "epoch": 568, "lr": 6.791738651510004e-07} +{"train_loss": 0.0002415455674054101, "global_step": 67676, "epoch": 568, "lr": 6.788099865653208e-07} +{"train_loss": 0.00010481067874934524, "global_step": 67677, "epoch": 568, "lr": 6.784462048165241e-07} +{"train_loss": 0.0002664373896550387, "global_step": 67678, "epoch": 568, "lr": 6.780825199053375e-07} +{"train_loss": 0.00011987256584689021, "global_step": 67679, "epoch": 568, "lr": 6.777189318324606e-07} +{"train_loss": 0.00033551472006365657, "global_step": 67680, "epoch": 568, "lr": 6.773554405986149e-07} +{"train_loss": 0.00023579233675263822, "global_step": 67681, "epoch": 568, "lr": 6.769920462045054e-07} +{"train_loss": 0.0004819046298507601, "global_step": 67682, "epoch": 568, "lr": 6.766287486508649e-07} +{"train_loss": 0.00013035237498115748, "global_step": 67683, "epoch": 568, "lr": 6.762655479383817e-07} +{"train_loss": 0.00036587551585398614, "global_step": 67684, "epoch": 568, "lr": 6.759024440677941e-07} +{"train_loss": 0.00027943981694988906, "global_step": 67685, "epoch": 568, "lr": 6.755394370397905e-07} +{"train_loss": 0.00021868266048841178, "global_step": 67686, "epoch": 568, "lr": 6.751765268551036e-07} +{"train_loss": 0.00026742485351860523, "global_step": 67687, "epoch": 568, "lr": 6.748137135144328e-07} +{"train_loss": 0.0003183127846568823, "global_step": 67688, "epoch": 568, "lr": 6.744509970185053e-07} +{"train_loss": 0.00014269193343352526, "global_step": 67689, "epoch": 568, "lr": 6.740883773680151e-07} +{"train_loss": 0.00023947091540321708, "global_step": 67690, "epoch": 568, "lr": 6.737258545636838e-07} +{"train_loss": 0.00020526487787719816, "global_step": 67691, "epoch": 568, "lr": 6.733634286062218e-07} +{"train_loss": 0.0002027266164077446, "global_step": 67692, "epoch": 568, "lr": 6.730010994963453e-07} +{"train_loss": 0.0001377271837554872, "global_step": 67693, "epoch": 568, "lr": 6.726388672347539e-07} +{"train_loss": 0.00038770257378928363, "global_step": 67694, "epoch": 568, "lr": 6.722767318221745e-07} +{"train_loss": 0.00021481735166162252, "global_step": 67695, "epoch": 568, "lr": 6.719146932593013e-07} +{"train_loss": 0.0001725083711789921, "global_step": 67696, "epoch": 568, "lr": 6.715527515468612e-07} +{"train_loss": 0.00012961195898242295, "global_step": 67697, "epoch": 568, "lr": 6.711909066855537e-07} +{"train_loss": 0.0001781573664629832, "global_step": 67698, "epoch": 568, "lr": 6.708291586760951e-07} +{"train_loss": 0.0002608992508612573, "global_step": 67699, "epoch": 568, "lr": 6.704675075191902e-07} +{"train_loss": 0.0002804594114422798, "global_step": 67700, "epoch": 568, "lr": 6.701059532155551e-07} +{"train_loss": 0.0003081680042669177, "global_step": 67701, "epoch": 568, "lr": 6.697444957658949e-07} +{"train_loss": 0.0004090813745278865, "global_step": 67702, "epoch": 568, "lr": 6.693831351709202e-07} +{"train_loss": 0.00017776583263184875, "global_step": 67703, "epoch": 568, "lr": 6.690218714313468e-07} +{"train_loss": 0.0001203761639771983, "global_step": 67704, "epoch": 568, "lr": 6.686607045478744e-07} +{"train_loss": 0.00030127482023090124, "global_step": 67705, "epoch": 568, "lr": 6.682996345212189e-07} +{"train_loss": 0.00019797308777924627, "global_step": 67706, "epoch": 568, "lr": 6.679386613520855e-07} +{"train_loss": 0.00028650942840613425, "global_step": 67707, "epoch": 568, "lr": 6.675777850411791e-07} +{"train_loss": 0.00020483281696215272, "global_step": 67708, "epoch": 568, "lr": 6.672170055892213e-07} +{"train_loss": 0.0003183493099641055, "global_step": 67709, "epoch": 568, "lr": 6.668563229969116e-07} +{"train_loss": 0.00025760494775438147, "global_step": 67710, "epoch": 568, "lr": 6.66495737264955e-07, "val_loss": 0.03875361382961273} +{"train_loss": 0.0002407055872026831, "global_step": 67711, "epoch": 569, "lr": 6.661352483940675e-07} +{"train_loss": 0.00034211351885460317, "global_step": 67712, "epoch": 569, "lr": 6.657748563849486e-07} +{"train_loss": 0.00032062045647762716, "global_step": 67713, "epoch": 569, "lr": 6.654145612383089e-07} +{"train_loss": 0.00016047274402808398, "global_step": 67714, "epoch": 569, "lr": 6.650543629548589e-07} +{"train_loss": 0.00015067384811118245, "global_step": 67715, "epoch": 569, "lr": 6.646942615353092e-07} +{"train_loss": 0.00022750698553863913, "global_step": 67716, "epoch": 569, "lr": 6.643342569803535e-07} +{"train_loss": 0.00014316514716483653, "global_step": 67717, "epoch": 569, "lr": 6.639743492907136e-07} +{"train_loss": 0.000187529090908356, "global_step": 67718, "epoch": 569, "lr": 6.636145384670833e-07} +{"train_loss": 0.0002245619398308918, "global_step": 67719, "epoch": 569, "lr": 6.632548245101843e-07} +{"train_loss": 0.00013270732597447932, "global_step": 67720, "epoch": 569, "lr": 6.628952074207051e-07} +{"train_loss": 0.00021751553867943585, "global_step": 67721, "epoch": 569, "lr": 6.625356871993616e-07} +{"train_loss": 0.0002262403431814164, "global_step": 67722, "epoch": 569, "lr": 6.621762638468587e-07} +{"train_loss": 0.00034027561196126044, "global_step": 67723, "epoch": 569, "lr": 6.618169373639072e-07} +{"train_loss": 0.00015835060912650079, "global_step": 67724, "epoch": 569, "lr": 6.614577077512007e-07} +{"train_loss": 0.00020450088777579367, "global_step": 67725, "epoch": 569, "lr": 6.610985750094501e-07} +{"train_loss": 0.0007145552663132548, "global_step": 67726, "epoch": 569, "lr": 6.607395391393656e-07} +{"train_loss": 0.00033441188861615956, "global_step": 67727, "epoch": 569, "lr": 6.603806001416468e-07} +{"train_loss": 0.0006242815288715065, "global_step": 67728, "epoch": 569, "lr": 6.600217580169988e-07} +{"train_loss": 0.00020756285812240094, "global_step": 67729, "epoch": 569, "lr": 6.596630127661263e-07} +{"train_loss": 0.0003216122859157622, "global_step": 67730, "epoch": 569, "lr": 6.593043643897401e-07} +{"train_loss": 0.0005316491005942225, "global_step": 67731, "epoch": 569, "lr": 6.589458128885285e-07} +{"train_loss": 0.0002258796157548204, "global_step": 67732, "epoch": 569, "lr": 6.58587358263213e-07} +{"train_loss": 0.00020206408225931227, "global_step": 67733, "epoch": 569, "lr": 6.582290005144876e-07} +{"train_loss": 0.00045428634621202946, "global_step": 67734, "epoch": 569, "lr": 6.578707396430573e-07} +{"train_loss": 0.00015990223619155586, "global_step": 67735, "epoch": 569, "lr": 6.57512575649627e-07} +{"train_loss": 0.0002170746010961011, "global_step": 67736, "epoch": 569, "lr": 6.571545085348962e-07} +{"train_loss": 0.00015870465722400695, "global_step": 67737, "epoch": 569, "lr": 6.567965382995811e-07} +{"train_loss": 0.00024653729633428156, "global_step": 67738, "epoch": 569, "lr": 6.564386649443644e-07} +{"train_loss": 0.00015647793770767748, "global_step": 67739, "epoch": 569, "lr": 6.560808884699621e-07} +{"train_loss": 0.0003184436063747853, "global_step": 67740, "epoch": 569, "lr": 6.557232088770738e-07} +{"train_loss": 0.0002275365695822984, "global_step": 67741, "epoch": 569, "lr": 6.553656261663987e-07} +{"train_loss": 0.00026232836535200477, "global_step": 67742, "epoch": 569, "lr": 6.550081403386477e-07} +{"train_loss": 0.0003982751222793013, "global_step": 67743, "epoch": 569, "lr": 6.546507513945088e-07} +{"train_loss": 0.0002630247035995126, "global_step": 67744, "epoch": 569, "lr": 6.542934593346983e-07} +{"train_loss": 0.00019940642232540995, "global_step": 67745, "epoch": 569, "lr": 6.539362641599045e-07} +{"train_loss": 0.00015841722779441625, "global_step": 67746, "epoch": 569, "lr": 6.535791658708379e-07} +{"train_loss": 0.00016480313206557184, "global_step": 67747, "epoch": 569, "lr": 6.53222164468198e-07} +{"train_loss": 0.00015351982438005507, "global_step": 67748, "epoch": 569, "lr": 6.528652599526841e-07} +{"train_loss": 0.0002803517272695899, "global_step": 67749, "epoch": 569, "lr": 6.525084523249958e-07} +{"train_loss": 0.0004309132928028703, "global_step": 67750, "epoch": 569, "lr": 6.521517415858325e-07} +{"train_loss": 0.00025486148661002517, "global_step": 67751, "epoch": 569, "lr": 6.517951277358991e-07} +{"train_loss": 0.00012212990259286016, "global_step": 67752, "epoch": 569, "lr": 6.514386107758952e-07} +{"train_loss": 0.0002849264710675925, "global_step": 67753, "epoch": 569, "lr": 6.510821907065201e-07} +{"train_loss": 0.00021461641881614923, "global_step": 67754, "epoch": 569, "lr": 6.507258675284733e-07} +{"train_loss": 0.00039835815550759435, "global_step": 67755, "epoch": 569, "lr": 6.503696412424487e-07} +{"train_loss": 0.00022435882419813424, "global_step": 67756, "epoch": 569, "lr": 6.500135118491568e-07} +{"train_loss": 0.00014882496907375753, "global_step": 67757, "epoch": 569, "lr": 6.496574793492915e-07} +{"train_loss": 0.0003595353337004781, "global_step": 67758, "epoch": 569, "lr": 6.493015437435524e-07} +{"train_loss": 0.00015062496822793037, "global_step": 67759, "epoch": 569, "lr": 6.48945705032633e-07} +{"train_loss": 0.00040557171450927854, "global_step": 67760, "epoch": 569, "lr": 6.485899632172388e-07} +{"train_loss": 0.0001969305012607947, "global_step": 67761, "epoch": 569, "lr": 6.482343182980632e-07} +{"train_loss": 0.00023547033197246492, "global_step": 67762, "epoch": 569, "lr": 6.47878770275806e-07} +{"train_loss": 0.0002264829963678494, "global_step": 67763, "epoch": 569, "lr": 6.47523319151172e-07} +{"train_loss": 0.00023911792959552258, "global_step": 67764, "epoch": 569, "lr": 6.471679649248496e-07} +{"train_loss": 0.00013967625272925943, "global_step": 67765, "epoch": 569, "lr": 6.468127075975439e-07} +{"train_loss": 0.0003093341365456581, "global_step": 67766, "epoch": 569, "lr": 6.464575471699485e-07} +{"train_loss": 0.0004974559997208416, "global_step": 67767, "epoch": 569, "lr": 6.461024836427576e-07} +{"train_loss": 0.0002500462287571281, "global_step": 67768, "epoch": 569, "lr": 6.457475170166705e-07} +{"train_loss": 0.0002598721766844392, "global_step": 67769, "epoch": 569, "lr": 6.453926472923866e-07} +{"train_loss": 0.00027126111672259867, "global_step": 67770, "epoch": 569, "lr": 6.450378744706054e-07} +{"train_loss": 0.00015301632811315358, "global_step": 67771, "epoch": 569, "lr": 6.446831985520152e-07} +{"train_loss": 0.0002009206364164129, "global_step": 67772, "epoch": 569, "lr": 6.44328619537321e-07} +{"train_loss": 0.00023748454987071455, "global_step": 67773, "epoch": 569, "lr": 6.439741374272112e-07} +{"train_loss": 0.00021443155128508806, "global_step": 67774, "epoch": 569, "lr": 6.436197522223853e-07} +{"train_loss": 0.0002396261115791276, "global_step": 67775, "epoch": 569, "lr": 6.432654639235425e-07} +{"train_loss": 0.0004939711652696133, "global_step": 67776, "epoch": 569, "lr": 6.429112725313713e-07} +{"train_loss": 0.0001737710990710184, "global_step": 67777, "epoch": 569, "lr": 6.425571780465711e-07} +{"train_loss": 0.00023112462076824158, "global_step": 67778, "epoch": 569, "lr": 6.422031804698414e-07} +{"train_loss": 0.00014579037087969482, "global_step": 67779, "epoch": 569, "lr": 6.418492798018649e-07} +{"train_loss": 0.00023011042503640056, "global_step": 67780, "epoch": 569, "lr": 6.414954760433522e-07} +{"train_loss": 0.00019608804723247886, "global_step": 67781, "epoch": 569, "lr": 6.411417691949806e-07} +{"train_loss": 0.00037576566683128476, "global_step": 67782, "epoch": 569, "lr": 6.407881592574605e-07} +{"train_loss": 0.0003117375017609447, "global_step": 67783, "epoch": 569, "lr": 6.404346462314803e-07} +{"train_loss": 0.0002570810029283166, "global_step": 67784, "epoch": 569, "lr": 6.400812301177284e-07} +{"train_loss": 0.0002728135441429913, "global_step": 67785, "epoch": 569, "lr": 6.397279109169097e-07} +{"train_loss": 0.00022422017354983836, "global_step": 67786, "epoch": 569, "lr": 6.39374688629707e-07} +{"train_loss": 0.00015708734281361103, "global_step": 67787, "epoch": 569, "lr": 6.390215632568198e-07} +{"train_loss": 0.00031885234056971967, "global_step": 67788, "epoch": 569, "lr": 6.386685347989363e-07} +{"train_loss": 0.00014909081801306456, "global_step": 67789, "epoch": 569, "lr": 6.383156032567617e-07} +{"train_loss": 0.00016858053277246654, "global_step": 67790, "epoch": 569, "lr": 6.379627686309786e-07} +{"train_loss": 0.0001717259583529085, "global_step": 67791, "epoch": 569, "lr": 6.37610030922281e-07} +{"train_loss": 0.00021645573724526912, "global_step": 67792, "epoch": 569, "lr": 6.372573901313628e-07} +{"train_loss": 0.00024271654547192156, "global_step": 67793, "epoch": 569, "lr": 6.369048462589122e-07} +{"train_loss": 0.000304711633361876, "global_step": 67794, "epoch": 569, "lr": 6.365523993056344e-07} +{"train_loss": 0.00026344324578531086, "global_step": 67795, "epoch": 569, "lr": 6.362000492722009e-07} +{"train_loss": 0.0002529555931687355, "global_step": 67796, "epoch": 569, "lr": 6.358477961593223e-07} +{"train_loss": 0.0002726262027863413, "global_step": 67797, "epoch": 569, "lr": 6.35495639967687e-07} +{"train_loss": 0.000223823546548374, "global_step": 67798, "epoch": 569, "lr": 6.351435806979722e-07} +{"train_loss": 0.00022393028484657407, "global_step": 67799, "epoch": 569, "lr": 6.347916183508829e-07} +{"train_loss": 0.00033971297671087086, "global_step": 67800, "epoch": 569, "lr": 6.344397529271073e-07} +{"train_loss": 0.00029973938944749534, "global_step": 67801, "epoch": 569, "lr": 6.34087984427334e-07} +{"train_loss": 0.00021072491654194891, "global_step": 67802, "epoch": 569, "lr": 6.337363128522567e-07} +{"train_loss": 0.00027204008074477315, "global_step": 67803, "epoch": 569, "lr": 6.333847382025638e-07} +{"train_loss": 0.00018458963313605636, "global_step": 67804, "epoch": 569, "lr": 6.33033260478949e-07} +{"train_loss": 0.0003587817191146314, "global_step": 67805, "epoch": 569, "lr": 6.326818796820899e-07} +{"train_loss": 0.0002561331493780017, "global_step": 67806, "epoch": 569, "lr": 6.323305958126969e-07} +{"train_loss": 0.0002913340867962688, "global_step": 67807, "epoch": 569, "lr": 6.319794088714415e-07} +{"train_loss": 0.00018617081514094025, "global_step": 67808, "epoch": 569, "lr": 6.316283188590233e-07} +{"train_loss": 0.0003896731068380177, "global_step": 67809, "epoch": 569, "lr": 6.312773257761251e-07} +{"train_loss": 0.0002267785312142223, "global_step": 67810, "epoch": 569, "lr": 6.309264296234407e-07} +{"train_loss": 0.00021427571482490748, "global_step": 67811, "epoch": 569, "lr": 6.305756304016641e-07} +{"train_loss": 0.0004127905995119363, "global_step": 67812, "epoch": 569, "lr": 6.302249281114669e-07} +{"train_loss": 0.0002932508068624884, "global_step": 67813, "epoch": 569, "lr": 6.298743227535597e-07} +{"train_loss": 0.00047659844858571887, "global_step": 67814, "epoch": 569, "lr": 6.295238143286142e-07} +{"train_loss": 0.00025186649872921407, "global_step": 67815, "epoch": 569, "lr": 6.291734028373242e-07} +{"train_loss": 0.00025009579258039594, "global_step": 67816, "epoch": 569, "lr": 6.288230882803781e-07} +{"train_loss": 0.0003227110719308257, "global_step": 67817, "epoch": 569, "lr": 6.284728706584642e-07} +{"train_loss": 0.00018188125977758318, "global_step": 67818, "epoch": 569, "lr": 6.281227499722653e-07} +{"train_loss": 0.0003678908688016236, "global_step": 67819, "epoch": 569, "lr": 6.277727262224808e-07} +{"train_loss": 0.00024508312344551086, "global_step": 67820, "epoch": 569, "lr": 6.274227994097825e-07} +{"train_loss": 0.00035538533120416105, "global_step": 67821, "epoch": 569, "lr": 6.270729695348642e-07} +{"train_loss": 0.00011942999844904989, "global_step": 67822, "epoch": 569, "lr": 6.2672323659842e-07} +{"train_loss": 0.0001447783870389685, "global_step": 67823, "epoch": 569, "lr": 6.263736006011267e-07} +{"train_loss": 0.0001788838126230985, "global_step": 67824, "epoch": 569, "lr": 6.26024061543673e-07} +{"train_loss": 0.00029782691854052246, "global_step": 67825, "epoch": 569, "lr": 6.256746194267471e-07} +{"train_loss": 0.00028545467648655176, "global_step": 67826, "epoch": 569, "lr": 6.253252742510373e-07} +{"train_loss": 0.00022090779384598136, "global_step": 67827, "epoch": 569, "lr": 6.24976026017221e-07} +{"train_loss": 0.0003102564951404929, "global_step": 67828, "epoch": 569, "lr": 6.246268747259975e-07} +{"train_loss": 0.0002653437830212315, "global_step": 67829, "epoch": 569, "lr": 6.24277820378033e-07, "val_loss": 0.05408494919538498} +{"train_loss": 0.00041924291872419417, "global_step": 67830, "epoch": 570, "lr": 6.239288629740326e-07} +{"train_loss": 0.00020665772899519652, "global_step": 67831, "epoch": 570, "lr": 6.235800025146676e-07} +{"train_loss": 0.00032459726207889616, "global_step": 67832, "epoch": 570, "lr": 6.232312390006323e-07} +{"train_loss": 0.0001550849701743573, "global_step": 67833, "epoch": 570, "lr": 6.228825724326037e-07} +{"train_loss": 0.0002059405524050817, "global_step": 67834, "epoch": 570, "lr": 6.225340028112758e-07} +{"train_loss": 0.0001668466575210914, "global_step": 67835, "epoch": 570, "lr": 6.221855301373203e-07} +{"train_loss": 0.00032791256671771407, "global_step": 67836, "epoch": 570, "lr": 6.21837154411431e-07} +{"train_loss": 0.0005064245779067278, "global_step": 67837, "epoch": 570, "lr": 6.214888756342907e-07} +{"train_loss": 0.0003908812359441072, "global_step": 67838, "epoch": 570, "lr": 6.211406938065767e-07} +{"train_loss": 0.0003252224996685982, "global_step": 67839, "epoch": 570, "lr": 6.207926089289829e-07} +{"train_loss": 0.00024163447960745543, "global_step": 67840, "epoch": 570, "lr": 6.204446210021864e-07} +{"train_loss": 0.00017838823259808123, "global_step": 67841, "epoch": 570, "lr": 6.200967300268701e-07} +{"train_loss": 0.00019346764020156115, "global_step": 67842, "epoch": 570, "lr": 6.197489360037223e-07} +{"train_loss": 0.0004024926747661084, "global_step": 67843, "epoch": 570, "lr": 6.194012389334147e-07} +{"train_loss": 0.00021024627494625747, "global_step": 67844, "epoch": 570, "lr": 6.190536388166413e-07} +{"train_loss": 0.00025906090741045773, "global_step": 67845, "epoch": 570, "lr": 6.187061356540791e-07} +{"train_loss": 0.0004714154056273401, "global_step": 67846, "epoch": 570, "lr": 6.183587294464166e-07} +{"train_loss": 0.00013645274157170206, "global_step": 67847, "epoch": 570, "lr": 6.18011420194331e-07} +{"train_loss": 0.00025957555044442415, "global_step": 67848, "epoch": 570, "lr": 6.176642078984995e-07} +{"train_loss": 0.0002461289695929736, "global_step": 67849, "epoch": 570, "lr": 6.17317092559605e-07} +{"train_loss": 0.0002411922614555806, "global_step": 67850, "epoch": 570, "lr": 6.169700741783413e-07} +{"train_loss": 0.00034612356103025377, "global_step": 67851, "epoch": 570, "lr": 6.166231527553745e-07} +{"train_loss": 0.0003123413189314306, "global_step": 67852, "epoch": 570, "lr": 6.162763282913986e-07} +{"train_loss": 0.0002674408024176955, "global_step": 67853, "epoch": 570, "lr": 6.159296007870797e-07} +{"train_loss": 0.00022310917847789824, "global_step": 67854, "epoch": 570, "lr": 6.15582970243117e-07} +{"train_loss": 0.0002961919526569545, "global_step": 67855, "epoch": 570, "lr": 6.152364366601715e-07} +{"train_loss": 0.00041458936175331473, "global_step": 67856, "epoch": 570, "lr": 6.148900000389424e-07} +{"train_loss": 0.0002886264119297266, "global_step": 67857, "epoch": 570, "lr": 6.145436603800902e-07} +{"train_loss": 0.00027544793556444347, "global_step": 67858, "epoch": 570, "lr": 6.141974176843146e-07} +{"train_loss": 0.0003821533755399287, "global_step": 67859, "epoch": 570, "lr": 6.138512719522816e-07} +{"train_loss": 0.00021477990958373994, "global_step": 67860, "epoch": 570, "lr": 6.135052231846794e-07} +{"train_loss": 0.00036439692485146224, "global_step": 67861, "epoch": 570, "lr": 6.131592713821855e-07} +{"train_loss": 0.00023623471497558057, "global_step": 67862, "epoch": 570, "lr": 6.128134165454713e-07} +{"train_loss": 0.0003018129209522158, "global_step": 67863, "epoch": 570, "lr": 6.124676586752254e-07} +{"train_loss": 0.00027957986458204687, "global_step": 67864, "epoch": 570, "lr": 6.121219977721193e-07} +{"train_loss": 0.00036500615533441305, "global_step": 67865, "epoch": 570, "lr": 6.117764338368359e-07} +{"train_loss": 0.000307902431814, "global_step": 67866, "epoch": 570, "lr": 6.114309668700579e-07} +{"train_loss": 0.00016541147488169372, "global_step": 67867, "epoch": 570, "lr": 6.110855968724516e-07} +{"train_loss": 0.00023324816720560193, "global_step": 67868, "epoch": 570, "lr": 6.107403238447107e-07} +{"train_loss": 0.00018797606753651053, "global_step": 67869, "epoch": 570, "lr": 6.103951477874958e-07} +{"train_loss": 0.0005403456161729991, "global_step": 67870, "epoch": 570, "lr": 6.10050068701501e-07} +{"train_loss": 0.00026742913178168237, "global_step": 67871, "epoch": 570, "lr": 6.097050865873921e-07} +{"train_loss": 0.0002346210094401613, "global_step": 67872, "epoch": 570, "lr": 6.093602014458522e-07} +{"train_loss": 0.0001361402973998338, "global_step": 67873, "epoch": 570, "lr": 6.090154132775583e-07} +{"train_loss": 0.0001839139877120033, "global_step": 67874, "epoch": 570, "lr": 6.086707220831822e-07} +{"train_loss": 0.00041883447556756437, "global_step": 67875, "epoch": 570, "lr": 6.083261278634067e-07} +{"train_loss": 0.00046932214172556996, "global_step": 67876, "epoch": 570, "lr": 6.079816306189035e-07} +{"train_loss": 0.00022520864149555564, "global_step": 67877, "epoch": 570, "lr": 6.076372303503552e-07} +{"train_loss": 0.00030393473571166396, "global_step": 67878, "epoch": 570, "lr": 6.072929270584338e-07} +{"train_loss": 0.00021944340551272035, "global_step": 67879, "epoch": 570, "lr": 6.069487207438162e-07} +{"train_loss": 0.00031063833739608526, "global_step": 67880, "epoch": 570, "lr": 6.066046114071744e-07} +{"train_loss": 0.0002597161801531911, "global_step": 67881, "epoch": 570, "lr": 6.062605990491909e-07} +{"train_loss": 0.00025127417757175863, "global_step": 67882, "epoch": 570, "lr": 6.059166836705377e-07} +{"train_loss": 0.0004421475750859827, "global_step": 67883, "epoch": 570, "lr": 6.055728652718861e-07} +{"train_loss": 0.0003325837024021894, "global_step": 67884, "epoch": 570, "lr": 6.052291438539193e-07} +{"train_loss": 0.0003611407009884715, "global_step": 67885, "epoch": 570, "lr": 6.048855194173087e-07} +{"train_loss": 0.0002893870114348829, "global_step": 67886, "epoch": 570, "lr": 6.04541991962726e-07} +{"train_loss": 0.0001082711823983118, "global_step": 67887, "epoch": 570, "lr": 6.041985614908485e-07} +{"train_loss": 0.0006416414398699999, "global_step": 67888, "epoch": 570, "lr": 6.038552280023479e-07} +{"train_loss": 0.00030221231281757355, "global_step": 67889, "epoch": 570, "lr": 6.035119914979015e-07} +{"train_loss": 0.0002407780266366899, "global_step": 67890, "epoch": 570, "lr": 6.031688519781808e-07} +{"train_loss": 0.00030339183285832405, "global_step": 67891, "epoch": 570, "lr": 6.028258094438688e-07} +{"train_loss": 0.0002818330831360072, "global_step": 67892, "epoch": 570, "lr": 6.024828638956259e-07} +{"train_loss": 0.00026486447313800454, "global_step": 67893, "epoch": 570, "lr": 6.021400153341294e-07} +{"train_loss": 0.000307495123706758, "global_step": 67894, "epoch": 570, "lr": 6.017972637600567e-07} +{"train_loss": 0.00027082941960543394, "global_step": 67895, "epoch": 570, "lr": 6.01454609174068e-07} +{"train_loss": 0.00025955040473490953, "global_step": 67896, "epoch": 570, "lr": 6.011120515768575e-07} +{"train_loss": 0.00037295339279808104, "global_step": 67897, "epoch": 570, "lr": 6.007695909690803e-07} +{"train_loss": 0.00013194415078032762, "global_step": 67898, "epoch": 570, "lr": 6.004272273514133e-07} +{"train_loss": 0.0002376639167778194, "global_step": 67899, "epoch": 570, "lr": 6.00084960724534e-07} +{"train_loss": 0.00028156975167803466, "global_step": 67900, "epoch": 570, "lr": 5.997427910891085e-07} +{"train_loss": 0.0002115099923685193, "global_step": 67901, "epoch": 570, "lr": 5.994007184458139e-07} +{"train_loss": 0.00029813178116455674, "global_step": 67902, "epoch": 570, "lr": 5.99058742795311e-07} +{"train_loss": 0.0001679349661571905, "global_step": 67903, "epoch": 570, "lr": 5.987168641382823e-07} +{"train_loss": 0.00036789182922802866, "global_step": 67904, "epoch": 570, "lr": 5.983750824753998e-07} +{"train_loss": 0.00028972321888431907, "global_step": 67905, "epoch": 570, "lr": 5.980333978073238e-07} +{"train_loss": 0.00018284894758835435, "global_step": 67906, "epoch": 570, "lr": 5.976918101347318e-07} +{"train_loss": 0.00028308285982348025, "global_step": 67907, "epoch": 570, "lr": 5.973503194582952e-07} +{"train_loss": 0.00030797842191532254, "global_step": 67908, "epoch": 570, "lr": 5.970089257786859e-07} +{"train_loss": 0.00016804032202344388, "global_step": 67909, "epoch": 570, "lr": 5.966676290965644e-07} +{"train_loss": 0.00023696309654042125, "global_step": 67910, "epoch": 570, "lr": 5.963264294126136e-07} +{"train_loss": 0.0003747910668607801, "global_step": 67911, "epoch": 570, "lr": 5.959853267274995e-07} +{"train_loss": 0.00035705798654817045, "global_step": 67912, "epoch": 570, "lr": 5.956443210418882e-07} +{"train_loss": 0.00027435689116828144, "global_step": 67913, "epoch": 570, "lr": 5.953034123564516e-07} +{"train_loss": 0.00020215885888319463, "global_step": 67914, "epoch": 570, "lr": 5.949626006718556e-07} +{"train_loss": 0.00023886335839051753, "global_step": 67915, "epoch": 570, "lr": 5.946218859887775e-07} +{"train_loss": 0.00039259548066183925, "global_step": 67916, "epoch": 570, "lr": 5.94281268307878e-07} +{"train_loss": 0.00028582997038029134, "global_step": 67917, "epoch": 570, "lr": 5.939407476298287e-07} +{"train_loss": 0.0001609201281098649, "global_step": 67918, "epoch": 570, "lr": 5.936003239552956e-07} +{"train_loss": 0.00015359901590272784, "global_step": 67919, "epoch": 570, "lr": 5.932599972849506e-07} +{"train_loss": 0.00017805305833462626, "global_step": 67920, "epoch": 570, "lr": 5.929197676194654e-07} +{"train_loss": 0.0001802172337193042, "global_step": 67921, "epoch": 570, "lr": 5.925796349595003e-07} +{"train_loss": 0.0003034312976524234, "global_step": 67922, "epoch": 570, "lr": 5.922395993057328e-07} +{"train_loss": 0.00019563852401915938, "global_step": 67923, "epoch": 570, "lr": 5.918996606588234e-07} +{"train_loss": 0.00020841469813603908, "global_step": 67924, "epoch": 570, "lr": 5.915598190194326e-07} +{"train_loss": 0.0002985101891681552, "global_step": 67925, "epoch": 570, "lr": 5.912200743882434e-07} +{"train_loss": 0.00017497029330115765, "global_step": 67926, "epoch": 570, "lr": 5.908804267659107e-07} +{"train_loss": 0.00042441755067557096, "global_step": 67927, "epoch": 570, "lr": 5.905408761531117e-07} +{"train_loss": 0.00019747113401535898, "global_step": 67928, "epoch": 570, "lr": 5.902014225505015e-07} +{"train_loss": 0.0007594850612804294, "global_step": 67929, "epoch": 570, "lr": 5.898620659587517e-07} +{"train_loss": 0.000159761548275128, "global_step": 67930, "epoch": 570, "lr": 5.895228063785341e-07} +{"train_loss": 0.00016980308282654732, "global_step": 67931, "epoch": 570, "lr": 5.891836438105037e-07} +{"train_loss": 0.00017426539852749556, "global_step": 67932, "epoch": 570, "lr": 5.888445782553376e-07} +{"train_loss": 0.00016169369337148964, "global_step": 67933, "epoch": 570, "lr": 5.88505609713691e-07} +{"train_loss": 0.0001479058264521882, "global_step": 67934, "epoch": 570, "lr": 5.881667381862354e-07} +{"train_loss": 0.00023308803793042898, "global_step": 67935, "epoch": 570, "lr": 5.878279636736428e-07} +{"train_loss": 0.000268090283498168, "global_step": 67936, "epoch": 570, "lr": 5.874892861765624e-07} +{"train_loss": 0.00027254773885942996, "global_step": 67937, "epoch": 570, "lr": 5.871507056956715e-07} +{"train_loss": 0.00023116149532143027, "global_step": 67938, "epoch": 570, "lr": 5.868122222316308e-07} +{"train_loss": 0.00017778799519874156, "global_step": 67939, "epoch": 570, "lr": 5.864738357851062e-07} +{"train_loss": 0.00022393287508748472, "global_step": 67940, "epoch": 570, "lr": 5.861355463567586e-07} +{"train_loss": 0.000209578123758547, "global_step": 67941, "epoch": 570, "lr": 5.857973539472594e-07} +{"train_loss": 0.00018434524827171117, "global_step": 67942, "epoch": 570, "lr": 5.854592585572694e-07} +{"train_loss": 0.00022455463476944715, "global_step": 67943, "epoch": 570, "lr": 5.851212601874434e-07} +{"train_loss": 0.00018794597417581826, "global_step": 67944, "epoch": 570, "lr": 5.847833588384588e-07} +{"train_loss": 0.00024672894505783916, "global_step": 67945, "epoch": 570, "lr": 5.84445554510965e-07} +{"train_loss": 0.00014798916527070105, "global_step": 67946, "epoch": 570, "lr": 5.841078472056394e-07} +{"train_loss": 0.00026806906680576503, "global_step": 67947, "epoch": 570, "lr": 5.837702369231368e-07} +{"train_loss": 0.0002718342737414084, "global_step": 67948, "epoch": 570, "lr": 5.834327236641235e-07, "val_loss": 0.015977049246430397, "train_action_mse_error": 3.763377208088059e-06} +{"train_loss": 0.00034762462018989027, "global_step": 67949, "epoch": 571, "lr": 5.8309530742926e-07} +{"train_loss": 0.00033771415473893285, "global_step": 67950, "epoch": 571, "lr": 5.827579882192125e-07} +{"train_loss": 0.0004287342308089137, "global_step": 67951, "epoch": 571, "lr": 5.824207660346359e-07} +{"train_loss": 0.00024180166656151414, "global_step": 67952, "epoch": 571, "lr": 5.820836408761965e-07} +{"train_loss": 0.00022383910254575312, "global_step": 67953, "epoch": 571, "lr": 5.817466127445547e-07} +{"train_loss": 0.0004119693476241082, "global_step": 67954, "epoch": 571, "lr": 5.814096816403824e-07} +{"train_loss": 0.0003129631222691387, "global_step": 67955, "epoch": 571, "lr": 5.810728475643234e-07} +{"train_loss": 0.00023298230371437967, "global_step": 67956, "epoch": 571, "lr": 5.80736110517055e-07} +{"train_loss": 0.00011893819464603439, "global_step": 67957, "epoch": 571, "lr": 5.803994704992266e-07} +{"train_loss": 0.00018000969430431724, "global_step": 67958, "epoch": 571, "lr": 5.800629275115044e-07} +{"train_loss": 0.0003179799241479486, "global_step": 67959, "epoch": 571, "lr": 5.797264815545489e-07} +{"train_loss": 0.00017834997561294585, "global_step": 67960, "epoch": 571, "lr": 5.793901326290263e-07} +{"train_loss": 0.0002798911591526121, "global_step": 67961, "epoch": 571, "lr": 5.79053880735586e-07} +{"train_loss": 0.00013924673839937896, "global_step": 67962, "epoch": 571, "lr": 5.787177258748944e-07} +{"train_loss": 0.0001730113581288606, "global_step": 67963, "epoch": 571, "lr": 5.783816680476118e-07} +{"train_loss": 0.00015679767238907516, "global_step": 67964, "epoch": 571, "lr": 5.780457072543932e-07} +{"train_loss": 0.00023021706147119403, "global_step": 67965, "epoch": 571, "lr": 5.777098434959105e-07} +{"train_loss": 0.00044446150423027575, "global_step": 67966, "epoch": 571, "lr": 5.773740767728075e-07} +{"train_loss": 0.00022696415544487536, "global_step": 67967, "epoch": 571, "lr": 5.770384070857504e-07} +{"train_loss": 0.0003730733005795628, "global_step": 67968, "epoch": 571, "lr": 5.767028344353997e-07} +{"train_loss": 0.00030727178091183305, "global_step": 67969, "epoch": 571, "lr": 5.763673588224105e-07} +{"train_loss": 0.0003983542846981436, "global_step": 67970, "epoch": 571, "lr": 5.76031980247449e-07} +{"train_loss": 0.0002612622338347137, "global_step": 67971, "epoch": 571, "lr": 5.756966987111645e-07} +{"train_loss": 0.00014806041144765913, "global_step": 67972, "epoch": 571, "lr": 5.753615142142233e-07} +{"train_loss": 0.00029137390083633363, "global_step": 67973, "epoch": 571, "lr": 5.750264267572802e-07} +{"train_loss": 0.00023512958432547748, "global_step": 67974, "epoch": 571, "lr": 5.74691436340985e-07} +{"train_loss": 0.00017934033530764282, "global_step": 67975, "epoch": 571, "lr": 5.743565429660092e-07} +{"train_loss": 0.0003064619086217135, "global_step": 67976, "epoch": 571, "lr": 5.740217466329967e-07} +{"train_loss": 0.00031857413705438375, "global_step": 67977, "epoch": 571, "lr": 5.736870473426192e-07} +{"train_loss": 0.000175471359398216, "global_step": 67978, "epoch": 571, "lr": 5.733524450955263e-07} +{"train_loss": 0.0003405512834433466, "global_step": 67979, "epoch": 571, "lr": 5.730179398923729e-07} +{"train_loss": 0.0003093525010626763, "global_step": 67980, "epoch": 571, "lr": 5.726835317338197e-07} +{"train_loss": 0.00016087660333141685, "global_step": 67981, "epoch": 571, "lr": 5.723492206205217e-07} +{"train_loss": 0.0002584285684861243, "global_step": 67982, "epoch": 571, "lr": 5.720150065531338e-07} +{"train_loss": 0.0002641462779138237, "global_step": 67983, "epoch": 571, "lr": 5.716808895323167e-07} +{"train_loss": 0.0002073090145131573, "global_step": 67984, "epoch": 571, "lr": 5.713468695587199e-07} +{"train_loss": 0.00022889208048582077, "global_step": 67985, "epoch": 571, "lr": 5.710129466330039e-07} +{"train_loss": 0.00026403460651636124, "global_step": 67986, "epoch": 571, "lr": 5.706791207558238e-07} +{"train_loss": 0.00020222828607074916, "global_step": 67987, "epoch": 571, "lr": 5.703453919278401e-07} +{"train_loss": 0.0001984734699362889, "global_step": 67988, "epoch": 571, "lr": 5.700117601496913e-07} +{"train_loss": 0.00029940810054540634, "global_step": 67989, "epoch": 571, "lr": 5.696782254220545e-07} +{"train_loss": 0.0004296398547012359, "global_step": 67990, "epoch": 571, "lr": 5.693447877455627e-07} +{"train_loss": 0.0001797077857190743, "global_step": 67991, "epoch": 571, "lr": 5.69011447120893e-07} +{"train_loss": 0.0004676348762586713, "global_step": 67992, "epoch": 571, "lr": 5.686782035486838e-07} +{"train_loss": 0.0002110428613377735, "global_step": 67993, "epoch": 571, "lr": 5.6834505702959e-07} +{"train_loss": 0.000229170749662444, "global_step": 67994, "epoch": 571, "lr": 5.680120075642725e-07} +{"train_loss": 0.00027037024847231805, "global_step": 67995, "epoch": 571, "lr": 5.676790551533862e-07} +{"train_loss": 0.00017556817329023033, "global_step": 67996, "epoch": 571, "lr": 5.673461997975748e-07} +{"train_loss": 0.0003950090322177857, "global_step": 67997, "epoch": 571, "lr": 5.670134414975048e-07} +{"train_loss": 0.00017581558495294303, "global_step": 67998, "epoch": 571, "lr": 5.666807802538143e-07} +{"train_loss": 0.0001882927172118798, "global_step": 67999, "epoch": 571, "lr": 5.663482160671752e-07} +{"train_loss": 0.0001442980719730258, "global_step": 68000, "epoch": 571, "lr": 5.660157489382201e-07} +{"train_loss": 0.0003014341928064823, "global_step": 68001, "epoch": 571, "lr": 5.656833788676152e-07} +{"train_loss": 0.000145234793308191, "global_step": 68002, "epoch": 571, "lr": 5.653511058560101e-07} +{"train_loss": 0.0002701233606785536, "global_step": 68003, "epoch": 571, "lr": 5.650189299040598e-07} +{"train_loss": 0.0001987209980143234, "global_step": 68004, "epoch": 571, "lr": 5.646868510124137e-07} +{"train_loss": 0.00034272012999281287, "global_step": 68005, "epoch": 571, "lr": 5.643548691817158e-07} +{"train_loss": 0.00012762437108904123, "global_step": 68006, "epoch": 571, "lr": 5.640229844126322e-07} +{"train_loss": 0.00035524729173630476, "global_step": 68007, "epoch": 571, "lr": 5.636911967058068e-07} +{"train_loss": 0.0002726445673033595, "global_step": 68008, "epoch": 571, "lr": 5.633595060618945e-07} +{"train_loss": 0.0004215544031467289, "global_step": 68009, "epoch": 571, "lr": 5.630279124815396e-07} +{"train_loss": 0.0002759709022939205, "global_step": 68010, "epoch": 571, "lr": 5.626964159654025e-07} +{"train_loss": 0.00048423645785078406, "global_step": 68011, "epoch": 571, "lr": 5.62365016514127e-07} +{"train_loss": 0.00013746318290941417, "global_step": 68012, "epoch": 571, "lr": 5.620337141283627e-07} +{"train_loss": 0.00014389269927050918, "global_step": 68013, "epoch": 571, "lr": 5.617025088087702e-07} +{"train_loss": 0.0002202217874582857, "global_step": 68014, "epoch": 571, "lr": 5.613714005559878e-07} +{"train_loss": 0.0003386411408428103, "global_step": 68015, "epoch": 571, "lr": 5.610403893706761e-07} +{"train_loss": 0.0001564311678521335, "global_step": 68016, "epoch": 571, "lr": 5.607094752534736e-07} +{"train_loss": 0.0006406938191503286, "global_step": 68017, "epoch": 571, "lr": 5.603786582050352e-07} +{"train_loss": 0.00022417816217057407, "global_step": 68018, "epoch": 571, "lr": 5.600479382260215e-07} +{"train_loss": 0.00016957675688900054, "global_step": 68019, "epoch": 571, "lr": 5.597173153170598e-07} +{"train_loss": 0.0001602683769306168, "global_step": 68020, "epoch": 571, "lr": 5.593867894788218e-07} +{"train_loss": 0.00019558721396606416, "global_step": 68021, "epoch": 571, "lr": 5.590563607119404e-07} +{"train_loss": 0.0002615591511130333, "global_step": 68022, "epoch": 571, "lr": 5.587260290170704e-07} +{"train_loss": 0.0001960250228876248, "global_step": 68023, "epoch": 571, "lr": 5.583957943948615e-07} +{"train_loss": 0.00030578579753637314, "global_step": 68024, "epoch": 571, "lr": 5.580656568459575e-07} +{"train_loss": 0.0001270289212698117, "global_step": 68025, "epoch": 571, "lr": 5.577356163710134e-07} +{"train_loss": 0.0003594307345338166, "global_step": 68026, "epoch": 571, "lr": 5.574056729706678e-07} +{"train_loss": 0.00014690097304992378, "global_step": 68027, "epoch": 571, "lr": 5.570758266455811e-07} +{"train_loss": 0.000237217522226274, "global_step": 68028, "epoch": 571, "lr": 5.567460773963862e-07} +{"train_loss": 0.0002369943103985861, "global_step": 68029, "epoch": 571, "lr": 5.564164252237436e-07} +{"train_loss": 0.00016672977653797716, "global_step": 68030, "epoch": 571, "lr": 5.560868701282973e-07} +{"train_loss": 0.00021189081599004567, "global_step": 68031, "epoch": 571, "lr": 5.557574121106856e-07} +{"train_loss": 0.00023079598031472415, "global_step": 68032, "epoch": 571, "lr": 5.554280511715637e-07} +{"train_loss": 0.00029800503398291767, "global_step": 68033, "epoch": 571, "lr": 5.550987873115754e-07} +{"train_loss": 0.00015999288007151335, "global_step": 68034, "epoch": 571, "lr": 5.547696205313757e-07} +{"train_loss": 0.00017737496818881482, "global_step": 68035, "epoch": 571, "lr": 5.544405508315975e-07} +{"train_loss": 0.00016071266145445406, "global_step": 68036, "epoch": 571, "lr": 5.541115782128903e-07} +{"train_loss": 0.00019835628336295485, "global_step": 68037, "epoch": 571, "lr": 5.53782702675909e-07} +{"train_loss": 0.00020144252630416304, "global_step": 68038, "epoch": 571, "lr": 5.534539242212866e-07} +{"train_loss": 0.0002830678131431341, "global_step": 68039, "epoch": 571, "lr": 5.53125242849678e-07} +{"train_loss": 0.00016165076522156596, "global_step": 68040, "epoch": 571, "lr": 5.527966585617217e-07} +{"train_loss": 0.0004672509094234556, "global_step": 68041, "epoch": 571, "lr": 5.524681713580726e-07} +{"train_loss": 0.00020743247296195477, "global_step": 68042, "epoch": 571, "lr": 5.521397812393691e-07} +{"train_loss": 0.00019216253713238984, "global_step": 68043, "epoch": 571, "lr": 5.518114882062497e-07} +{"train_loss": 0.00019507210527081043, "global_step": 68044, "epoch": 571, "lr": 5.514832922593693e-07} +{"train_loss": 0.00015217659529298544, "global_step": 68045, "epoch": 571, "lr": 5.511551933993719e-07} +{"train_loss": 0.0003121321788057685, "global_step": 68046, "epoch": 571, "lr": 5.508271916268959e-07} +{"train_loss": 0.0002606308844406158, "global_step": 68047, "epoch": 571, "lr": 5.504992869425852e-07} +{"train_loss": 0.00017877640493679792, "global_step": 68048, "epoch": 571, "lr": 5.501714793470891e-07} +{"train_loss": 0.00017414109606761485, "global_step": 68049, "epoch": 571, "lr": 5.498437688410463e-07} +{"train_loss": 0.00022180643281899393, "global_step": 68050, "epoch": 571, "lr": 5.495161554251061e-07} +{"train_loss": 0.00014396064216271043, "global_step": 68051, "epoch": 571, "lr": 5.491886390999012e-07} +{"train_loss": 0.00028573564486578107, "global_step": 68052, "epoch": 571, "lr": 5.488612198660869e-07} +{"train_loss": 0.0003186382818967104, "global_step": 68053, "epoch": 571, "lr": 5.485338977243015e-07} +{"train_loss": 0.00018765495042316616, "global_step": 68054, "epoch": 571, "lr": 5.482066726751834e-07} +{"train_loss": 0.00022582993551623076, "global_step": 68055, "epoch": 571, "lr": 5.478795447193819e-07} +{"train_loss": 0.00024401539121754467, "global_step": 68056, "epoch": 571, "lr": 5.4755251385753e-07} +{"train_loss": 0.00027036466053687036, "global_step": 68057, "epoch": 571, "lr": 5.472255800902771e-07} +{"train_loss": 0.0004439526528585702, "global_step": 68058, "epoch": 571, "lr": 5.468987434182671e-07} +{"train_loss": 0.0005674892454408109, "global_step": 68059, "epoch": 571, "lr": 5.465720038421384e-07} +{"train_loss": 0.00019917445024475455, "global_step": 68060, "epoch": 571, "lr": 5.462453613625295e-07} +{"train_loss": 0.00034219553344883025, "global_step": 68061, "epoch": 571, "lr": 5.459188159800899e-07} +{"train_loss": 0.00014964932051952928, "global_step": 68062, "epoch": 571, "lr": 5.455923676954466e-07} +{"train_loss": 0.0002157165145035833, "global_step": 68063, "epoch": 571, "lr": 5.452660165092549e-07} +{"train_loss": 0.00027376465732231736, "global_step": 68064, "epoch": 571, "lr": 5.449397624221476e-07} +{"train_loss": 0.00012896486441604793, "global_step": 68065, "epoch": 571, "lr": 5.446136054347684e-07} +{"train_loss": 0.00012954715930391103, "global_step": 68066, "epoch": 571, "lr": 5.442875455477558e-07} +{"train_loss": 0.00025153836105048204, "global_step": 68067, "epoch": 571, "lr": 5.439615827617539e-07, "val_loss": 0.016698526218533516} +{"train_loss": 0.0005787136033177376, "global_step": 68068, "epoch": 572, "lr": 5.436357170774009e-07} +{"train_loss": 0.00018863941659219563, "global_step": 68069, "epoch": 572, "lr": 5.433099484953297e-07} +{"train_loss": 0.0003590910055208951, "global_step": 68070, "epoch": 572, "lr": 5.429842770161897e-07} +{"train_loss": 0.00019502924988046288, "global_step": 68071, "epoch": 572, "lr": 5.426587026406138e-07} +{"train_loss": 0.0003672686580102891, "global_step": 68072, "epoch": 572, "lr": 5.423332253692459e-07} +{"train_loss": 0.00022253874340094626, "global_step": 68073, "epoch": 572, "lr": 5.420078452027245e-07} +{"train_loss": 0.00018398341489955783, "global_step": 68074, "epoch": 572, "lr": 5.416825621416821e-07} +{"train_loss": 0.000193177824257873, "global_step": 68075, "epoch": 572, "lr": 5.413573761867685e-07} +{"train_loss": 0.00023119754041545093, "global_step": 68076, "epoch": 572, "lr": 5.410322873386108e-07} +{"train_loss": 0.0001538814976811409, "global_step": 68077, "epoch": 572, "lr": 5.407072955978532e-07} +{"train_loss": 0.0002685690997168422, "global_step": 68078, "epoch": 572, "lr": 5.403824009651281e-07} +{"train_loss": 0.0002202174800913781, "global_step": 68079, "epoch": 572, "lr": 5.400576034410854e-07} +{"train_loss": 0.00016361402231268585, "global_step": 68080, "epoch": 572, "lr": 5.397329030263521e-07} +{"train_loss": 0.00019592420721892267, "global_step": 68081, "epoch": 572, "lr": 5.394082997215721e-07} +{"train_loss": 0.0002367527486057952, "global_step": 68082, "epoch": 572, "lr": 5.390837935273785e-07} +{"train_loss": 0.0001605157449375838, "global_step": 68083, "epoch": 572, "lr": 5.387593844444095e-07} +{"train_loss": 0.0001684464659774676, "global_step": 68084, "epoch": 572, "lr": 5.384350724733033e-07} +{"train_loss": 0.00017678126459941268, "global_step": 68085, "epoch": 572, "lr": 5.381108576146932e-07} +{"train_loss": 0.00013946587569080293, "global_step": 68086, "epoch": 572, "lr": 5.377867398692171e-07} +{"train_loss": 0.00030310932197608054, "global_step": 68087, "epoch": 572, "lr": 5.374627192375193e-07} +{"train_loss": 0.0002633712429087609, "global_step": 68088, "epoch": 572, "lr": 5.371387957202212e-07} +{"train_loss": 0.00013002511695958674, "global_step": 68089, "epoch": 572, "lr": 5.368149693179724e-07} +{"train_loss": 0.0004819710156880319, "global_step": 68090, "epoch": 572, "lr": 5.364912400314004e-07} +{"train_loss": 0.00020981747366022319, "global_step": 68091, "epoch": 572, "lr": 5.361676078611488e-07} +{"train_loss": 0.00021150884276721627, "global_step": 68092, "epoch": 572, "lr": 5.358440728078396e-07} +{"train_loss": 0.0002148167259292677, "global_step": 68093, "epoch": 572, "lr": 5.355206348721221e-07} +{"train_loss": 0.0005955186788924038, "global_step": 68094, "epoch": 572, "lr": 5.351972940546235e-07} +{"train_loss": 0.0001294887624680996, "global_step": 68095, "epoch": 572, "lr": 5.348740503559769e-07} +{"train_loss": 0.0002500500704627484, "global_step": 68096, "epoch": 572, "lr": 5.345509037768259e-07} +{"train_loss": 0.0002516582317184657, "global_step": 68097, "epoch": 572, "lr": 5.342278543177925e-07} +{"train_loss": 0.0002065684529952705, "global_step": 68098, "epoch": 572, "lr": 5.339049019795261e-07} +{"train_loss": 0.00025486628874205053, "global_step": 68099, "epoch": 572, "lr": 5.335820467626484e-07} +{"train_loss": 0.00023253905237652361, "global_step": 68100, "epoch": 572, "lr": 5.332592886677979e-07} +{"train_loss": 0.00029301163158379495, "global_step": 68101, "epoch": 572, "lr": 5.329366276956127e-07} +{"train_loss": 0.00026238730060867965, "global_step": 68102, "epoch": 572, "lr": 5.326140638467148e-07} +{"train_loss": 0.0001452621800126508, "global_step": 68103, "epoch": 572, "lr": 5.322915971217479e-07} +{"train_loss": 0.0002343534433748573, "global_step": 68104, "epoch": 572, "lr": 5.31969227521345e-07} +{"train_loss": 0.0004111261514481157, "global_step": 68105, "epoch": 572, "lr": 5.316469550461278e-07} +{"train_loss": 0.00022683107818011194, "global_step": 68106, "epoch": 572, "lr": 5.313247796967402e-07} +{"train_loss": 0.00021300399384927005, "global_step": 68107, "epoch": 572, "lr": 5.31002701473815e-07} +{"train_loss": 0.0002769157290458679, "global_step": 68108, "epoch": 572, "lr": 5.306807203779796e-07} +{"train_loss": 0.00020190690702293068, "global_step": 68109, "epoch": 572, "lr": 5.30358836409861e-07} +{"train_loss": 0.0002567202318459749, "global_step": 68110, "epoch": 572, "lr": 5.300370495701035e-07} +{"train_loss": 0.00026503452681936324, "global_step": 68111, "epoch": 572, "lr": 5.297153598593341e-07} +{"train_loss": 0.00025860496680252254, "global_step": 68112, "epoch": 572, "lr": 5.293937672781801e-07} +{"train_loss": 0.00020303907513152808, "global_step": 68113, "epoch": 572, "lr": 5.290722718272801e-07} +{"train_loss": 0.0002985282917506993, "global_step": 68114, "epoch": 572, "lr": 5.287508735072555e-07} +{"train_loss": 0.0002405335835646838, "global_step": 68115, "epoch": 572, "lr": 5.284295723187449e-07} +{"train_loss": 0.000182215531822294, "global_step": 68116, "epoch": 572, "lr": 5.281083682623866e-07} +{"train_loss": 0.0003745501453522593, "global_step": 68117, "epoch": 572, "lr": 5.277872613387913e-07} +{"train_loss": 0.00037873658584430814, "global_step": 68118, "epoch": 572, "lr": 5.274662515486084e-07} +{"train_loss": 0.000220910893403925, "global_step": 68119, "epoch": 572, "lr": 5.271453388924541e-07} +{"train_loss": 0.00020196188415866345, "global_step": 68120, "epoch": 572, "lr": 5.268245233709668e-07} +{"train_loss": 0.0002901773841585964, "global_step": 68121, "epoch": 572, "lr": 5.265038049847737e-07} +{"train_loss": 0.00024251276045106351, "global_step": 68122, "epoch": 572, "lr": 5.261831837345021e-07} +{"train_loss": 0.0002799862122628838, "global_step": 68123, "epoch": 572, "lr": 5.258626596207905e-07} +{"train_loss": 0.0001497905032010749, "global_step": 68124, "epoch": 572, "lr": 5.255422326442605e-07} +{"train_loss": 0.0002962529833894223, "global_step": 68125, "epoch": 572, "lr": 5.252219028055393e-07} +{"train_loss": 0.00022159283980727196, "global_step": 68126, "epoch": 572, "lr": 5.2490167010526e-07} +{"train_loss": 0.00019923130457755178, "global_step": 68127, "epoch": 572, "lr": 5.245815345440553e-07} +{"train_loss": 0.0003814477240666747, "global_step": 68128, "epoch": 572, "lr": 5.242614961225412e-07} +{"train_loss": 0.00017361046047881246, "global_step": 68129, "epoch": 572, "lr": 5.239415548413618e-07} +{"train_loss": 0.00012291231541894376, "global_step": 68130, "epoch": 572, "lr": 5.236217107011331e-07} +{"train_loss": 0.0002985316386912018, "global_step": 68131, "epoch": 572, "lr": 5.233019637024883e-07} +{"train_loss": 0.00037918187445029616, "global_step": 68132, "epoch": 572, "lr": 5.229823138460543e-07} +{"train_loss": 0.0002684452338144183, "global_step": 68133, "epoch": 572, "lr": 5.226627611324586e-07} +{"train_loss": 0.00034259186941199005, "global_step": 68134, "epoch": 572, "lr": 5.223433055623284e-07} +{"train_loss": 0.0004629781760741025, "global_step": 68135, "epoch": 572, "lr": 5.220239471362965e-07} +{"train_loss": 0.00025972852017730474, "global_step": 68136, "epoch": 572, "lr": 5.21704685854979e-07} +{"train_loss": 0.0004599051899276674, "global_step": 68137, "epoch": 572, "lr": 5.213855217190089e-07} +{"train_loss": 0.0005885992432013154, "global_step": 68138, "epoch": 572, "lr": 5.210664547290078e-07} +{"train_loss": 0.00019730448548216373, "global_step": 68139, "epoch": 572, "lr": 5.207474848856142e-07} +{"train_loss": 0.00019243330461904407, "global_step": 68140, "epoch": 572, "lr": 5.204286121894442e-07} +{"train_loss": 0.0001649595214985311, "global_step": 68141, "epoch": 572, "lr": 5.20109836641125e-07} +{"train_loss": 0.0001548591535538435, "global_step": 68142, "epoch": 572, "lr": 5.197911582412895e-07} +{"train_loss": 0.00018296550842933357, "global_step": 68143, "epoch": 572, "lr": 5.19472576990554e-07} +{"train_loss": 0.00024219487386289984, "global_step": 68144, "epoch": 572, "lr": 5.191540928895455e-07} +{"train_loss": 0.00023034148034639657, "global_step": 68145, "epoch": 572, "lr": 5.188357059388915e-07} +{"train_loss": 0.00022617439390160143, "global_step": 68146, "epoch": 572, "lr": 5.185174161392248e-07} +{"train_loss": 0.00014055022620595992, "global_step": 68147, "epoch": 572, "lr": 5.181992234911559e-07} +{"train_loss": 0.00026232533855363727, "global_step": 68148, "epoch": 572, "lr": 5.178811279953177e-07} +{"train_loss": 0.0001614605134818703, "global_step": 68149, "epoch": 572, "lr": 5.175631296523321e-07} +{"train_loss": 0.00020469231822062284, "global_step": 68150, "epoch": 572, "lr": 5.17245228462826e-07} +{"train_loss": 0.00022619408264290541, "global_step": 68151, "epoch": 572, "lr": 5.169274244274269e-07} +{"train_loss": 0.00022763348533771932, "global_step": 68152, "epoch": 572, "lr": 5.166097175467455e-07} +{"train_loss": 0.0004877872415818274, "global_step": 68153, "epoch": 572, "lr": 5.1629210782142e-07} +{"train_loss": 0.00022743204317521304, "global_step": 68154, "epoch": 572, "lr": 5.159745952520722e-07} +{"train_loss": 0.00022184573754202574, "global_step": 68155, "epoch": 572, "lr": 5.156571798393129e-07} +{"train_loss": 0.0003272996691521257, "global_step": 68156, "epoch": 572, "lr": 5.153398615837801e-07} +{"train_loss": 0.00024321961973328143, "global_step": 68157, "epoch": 572, "lr": 5.150226404860903e-07} +{"train_loss": 0.00036062023718841374, "global_step": 68158, "epoch": 572, "lr": 5.14705516546865e-07} +{"train_loss": 0.00034056295407935977, "global_step": 68159, "epoch": 572, "lr": 5.143884897667317e-07} +{"train_loss": 0.00027043692534789443, "global_step": 68160, "epoch": 572, "lr": 5.140715601463065e-07} +{"train_loss": 0.00030231333221308887, "global_step": 68161, "epoch": 572, "lr": 5.137547276862165e-07} +{"train_loss": 0.00033769718720577657, "global_step": 68162, "epoch": 572, "lr": 5.134379923870836e-07} +{"train_loss": 0.00019188546866644174, "global_step": 68163, "epoch": 572, "lr": 5.131213542495294e-07} +{"train_loss": 0.000496279273647815, "global_step": 68164, "epoch": 572, "lr": 5.128048132741702e-07} +{"train_loss": 0.00015713265747763216, "global_step": 68165, "epoch": 572, "lr": 5.124883694616334e-07} +{"train_loss": 0.0002579431456979364, "global_step": 68166, "epoch": 572, "lr": 5.121720228125349e-07} +{"train_loss": 0.0002427803265163675, "global_step": 68167, "epoch": 572, "lr": 5.118557733275075e-07} +{"train_loss": 0.00019797116692643613, "global_step": 68168, "epoch": 572, "lr": 5.115396210071621e-07} +{"train_loss": 0.00020840062643401325, "global_step": 68169, "epoch": 572, "lr": 5.112235658521147e-07} +{"train_loss": 0.00012691240408457816, "global_step": 68170, "epoch": 572, "lr": 5.109076078630038e-07} +{"train_loss": 0.00025914734578691423, "global_step": 68171, "epoch": 572, "lr": 5.105917470404286e-07} +{"train_loss": 0.0001916574692586437, "global_step": 68172, "epoch": 572, "lr": 5.102759833850223e-07} +{"train_loss": 0.00011550549243111163, "global_step": 68173, "epoch": 572, "lr": 5.099603168974066e-07} +{"train_loss": 0.00048787816194817424, "global_step": 68174, "epoch": 572, "lr": 5.096447475781919e-07} +{"train_loss": 0.00013879382458981127, "global_step": 68175, "epoch": 572, "lr": 5.093292754280055e-07} +{"train_loss": 0.00010911349818343297, "global_step": 68176, "epoch": 572, "lr": 5.090139004474581e-07} +{"train_loss": 0.00025527473189868033, "global_step": 68177, "epoch": 572, "lr": 5.086986226371826e-07} +{"train_loss": 0.00021150030079297721, "global_step": 68178, "epoch": 572, "lr": 5.08383441997784e-07} +{"train_loss": 0.0003043784527108073, "global_step": 68179, "epoch": 572, "lr": 5.080683585298896e-07} +{"train_loss": 0.0004994496703147888, "global_step": 68180, "epoch": 572, "lr": 5.077533722341154e-07} +{"train_loss": 0.00020818038319703192, "global_step": 68181, "epoch": 572, "lr": 5.074384831110779e-07} +{"train_loss": 0.0003743595734704286, "global_step": 68182, "epoch": 572, "lr": 5.071236911613986e-07} +{"train_loss": 0.00017332220159005374, "global_step": 68183, "epoch": 572, "lr": 5.068089963856937e-07} +{"train_loss": 0.00026127533055841923, "global_step": 68184, "epoch": 572, "lr": 5.06494398784585e-07} +{"train_loss": 0.000374250317690894, "global_step": 68185, "epoch": 572, "lr": 5.061798983586829e-07} +{"train_loss": 0.0002577573790663986, "global_step": 68186, "epoch": 572, "lr": 5.058654951086095e-07, "val_loss": 0.023176422342658043} +{"train_loss": 0.0001250518107553944, "global_step": 68187, "epoch": 573, "lr": 5.055511890349862e-07} +{"train_loss": 0.00036342311068437994, "global_step": 68188, "epoch": 573, "lr": 5.052369801384183e-07} +{"train_loss": 0.0001877418690128252, "global_step": 68189, "epoch": 573, "lr": 5.049228684195384e-07} +{"train_loss": 0.0002661596518009901, "global_step": 68190, "epoch": 573, "lr": 5.046088538789462e-07} +{"train_loss": 0.0001451528223697096, "global_step": 68191, "epoch": 573, "lr": 5.042949365172689e-07} +{"train_loss": 0.0001354652486043051, "global_step": 68192, "epoch": 573, "lr": 5.039811163351282e-07} +{"train_loss": 0.0002103415463352576, "global_step": 68193, "epoch": 573, "lr": 5.036673933331237e-07} +{"train_loss": 0.0001909152342705056, "global_step": 68194, "epoch": 573, "lr": 5.033537675118827e-07} +{"train_loss": 0.00033226696541532874, "global_step": 68195, "epoch": 573, "lr": 5.030402388720212e-07} +{"train_loss": 0.00023555726511403918, "global_step": 68196, "epoch": 573, "lr": 5.0272680741415e-07} +{"train_loss": 0.00029917602660134435, "global_step": 68197, "epoch": 573, "lr": 5.024134731388852e-07} +{"train_loss": 0.0002292181015945971, "global_step": 68198, "epoch": 573, "lr": 5.021002360468485e-07} +{"train_loss": 0.00015561975305899978, "global_step": 68199, "epoch": 573, "lr": 5.017870961386451e-07} +{"train_loss": 0.000372506765415892, "global_step": 68200, "epoch": 573, "lr": 5.014740534148965e-07} +{"train_loss": 0.00023016025079414248, "global_step": 68201, "epoch": 573, "lr": 5.011611078762135e-07} +{"train_loss": 0.00024146951909642667, "global_step": 68202, "epoch": 573, "lr": 5.008482595232178e-07} +{"train_loss": 0.0005793941090814769, "global_step": 68203, "epoch": 573, "lr": 5.005355083565144e-07} +{"train_loss": 0.00020250698435120285, "global_step": 68204, "epoch": 573, "lr": 5.002228543767196e-07} +{"train_loss": 0.00016416709695477039, "global_step": 68205, "epoch": 573, "lr": 4.999102975844494e-07} +{"train_loss": 0.00018020263814833015, "global_step": 68206, "epoch": 573, "lr": 4.995978379803201e-07} +{"train_loss": 0.00014508466119877994, "global_step": 68207, "epoch": 573, "lr": 4.992854755649424e-07} +{"train_loss": 0.0001307654893025756, "global_step": 68208, "epoch": 573, "lr": 4.989732103389266e-07} +{"train_loss": 0.00035516321077011526, "global_step": 68209, "epoch": 573, "lr": 4.986610423028893e-07} +{"train_loss": 0.0002444703713990748, "global_step": 68210, "epoch": 573, "lr": 4.983489714574463e-07} +{"train_loss": 0.00022546586114913225, "global_step": 68211, "epoch": 573, "lr": 4.980369978031974e-07} +{"train_loss": 0.00011908057058462873, "global_step": 68212, "epoch": 573, "lr": 4.977251213407752e-07} +{"train_loss": 0.00022433513368014246, "global_step": 68213, "epoch": 573, "lr": 4.974133420707738e-07} +{"train_loss": 0.0002501753333490342, "global_step": 68214, "epoch": 573, "lr": 4.971016599938149e-07} +{"train_loss": 0.00012058534775860608, "global_step": 68215, "epoch": 573, "lr": 4.967900751105093e-07} +{"train_loss": 0.00022656831424683332, "global_step": 68216, "epoch": 573, "lr": 4.964785874214673e-07} +{"train_loss": 0.00026201456785202026, "global_step": 68217, "epoch": 573, "lr": 4.961671969272996e-07} +{"train_loss": 0.00021239550551399589, "global_step": 68218, "epoch": 573, "lr": 4.95855903628617e-07} +{"train_loss": 0.00018786810687743127, "global_step": 68219, "epoch": 573, "lr": 4.955447075260355e-07} +{"train_loss": 0.00027678892365656793, "global_step": 68220, "epoch": 573, "lr": 4.952336086201658e-07} +{"train_loss": 0.00016270892228931189, "global_step": 68221, "epoch": 573, "lr": 4.949226069116075e-07} +{"train_loss": 0.0013278801925480366, "global_step": 68222, "epoch": 573, "lr": 4.946117024009877e-07} +{"train_loss": 0.00025036477018147707, "global_step": 68223, "epoch": 573, "lr": 4.943008950889116e-07} +{"train_loss": 0.00041009418782778084, "global_step": 68224, "epoch": 573, "lr": 4.939901849759787e-07} +{"train_loss": 0.0005607742350548506, "global_step": 68225, "epoch": 573, "lr": 4.936795720628107e-07} +{"train_loss": 0.00029797054594382644, "global_step": 68226, "epoch": 573, "lr": 4.933690563500126e-07} +{"train_loss": 0.000610305170994252, "global_step": 68227, "epoch": 573, "lr": 4.930586378382007e-07} +{"train_loss": 0.00022423133486881852, "global_step": 68228, "epoch": 573, "lr": 4.92748316527969e-07} +{"train_loss": 0.00027719661011360586, "global_step": 68229, "epoch": 573, "lr": 4.924380924199446e-07} +{"train_loss": 0.0004985443083569407, "global_step": 68230, "epoch": 573, "lr": 4.921279655147326e-07} +{"train_loss": 0.0004321974120102823, "global_step": 68231, "epoch": 573, "lr": 4.918179358129271e-07} +{"train_loss": 0.0002763648226391524, "global_step": 68232, "epoch": 573, "lr": 4.915080033151553e-07} +{"train_loss": 0.00019463634816929698, "global_step": 68233, "epoch": 573, "lr": 4.911981680220168e-07} +{"train_loss": 0.00016396593127865344, "global_step": 68234, "epoch": 573, "lr": 4.908884299341221e-07} +{"train_loss": 0.0003395199601072818, "global_step": 68235, "epoch": 573, "lr": 4.905787890520764e-07} +{"train_loss": 0.0001696811814326793, "global_step": 68236, "epoch": 573, "lr": 4.902692453764901e-07} +{"train_loss": 0.0003236060729250312, "global_step": 68237, "epoch": 573, "lr": 4.89959798907974e-07} +{"train_loss": 0.0002669982786756009, "global_step": 68238, "epoch": 573, "lr": 4.896504496471276e-07} +{"train_loss": 0.0001774161064531654, "global_step": 68239, "epoch": 573, "lr": 4.893411975945672e-07} +{"train_loss": 0.00017572447541169822, "global_step": 68240, "epoch": 573, "lr": 4.890320427508976e-07} +{"train_loss": 0.0004658769757952541, "global_step": 68241, "epoch": 573, "lr": 4.887229851167185e-07} +{"train_loss": 0.0003211562871001661, "global_step": 68242, "epoch": 573, "lr": 4.884140246926517e-07} +{"train_loss": 0.0002039311802946031, "global_step": 68243, "epoch": 573, "lr": 4.881051614792854e-07} +{"train_loss": 0.00017906307766679674, "global_step": 68244, "epoch": 573, "lr": 4.877963954772358e-07} +{"train_loss": 0.00026627452461980283, "global_step": 68245, "epoch": 573, "lr": 4.874877266871081e-07} +{"train_loss": 0.00022192583128344268, "global_step": 68246, "epoch": 573, "lr": 4.871791551095128e-07} +{"train_loss": 0.00021216782624833286, "global_step": 68247, "epoch": 573, "lr": 4.868706807450496e-07} +{"train_loss": 0.00017824825772549957, "global_step": 68248, "epoch": 573, "lr": 4.865623035943234e-07} +{"train_loss": 0.0001421936322003603, "global_step": 68249, "epoch": 573, "lr": 4.862540236579449e-07} +{"train_loss": 0.00025485228979960084, "global_step": 68250, "epoch": 573, "lr": 4.859458409365136e-07} +{"train_loss": 0.000348609231878072, "global_step": 68251, "epoch": 573, "lr": 4.856377554306457e-07} +{"train_loss": 0.00015802890993654728, "global_step": 68252, "epoch": 573, "lr": 4.853297671409296e-07} +{"train_loss": 0.00019602212705649436, "global_step": 68253, "epoch": 573, "lr": 4.85021876067987e-07} +{"train_loss": 0.00036293084849603474, "global_step": 68254, "epoch": 573, "lr": 4.847140822124119e-07} +{"train_loss": 0.00012146164226578549, "global_step": 68255, "epoch": 573, "lr": 4.844063855748038e-07} +{"train_loss": 0.0003098060842603445, "global_step": 68256, "epoch": 573, "lr": 4.840987861557789e-07} +{"train_loss": 0.0001846401864895597, "global_step": 68257, "epoch": 573, "lr": 4.837912839559367e-07} +{"train_loss": 0.00032074222690425813, "global_step": 68258, "epoch": 573, "lr": 4.834838789758822e-07} +{"train_loss": 0.00027647288516163826, "global_step": 68259, "epoch": 573, "lr": 4.831765712162095e-07} +{"train_loss": 0.0002626492641866207, "global_step": 68260, "epoch": 573, "lr": 4.828693606775348e-07} +{"train_loss": 0.00038554941420443356, "global_step": 68261, "epoch": 573, "lr": 4.825622473604574e-07} +{"train_loss": 0.00013148848665878177, "global_step": 68262, "epoch": 573, "lr": 4.822552312655771e-07} +{"train_loss": 0.00013250118354335427, "global_step": 68263, "epoch": 573, "lr": 4.819483123934987e-07} +{"train_loss": 0.000235693107242696, "global_step": 68264, "epoch": 573, "lr": 4.816414907448219e-07} +{"train_loss": 0.00019346867338754237, "global_step": 68265, "epoch": 573, "lr": 4.813347663201572e-07} +{"train_loss": 0.00017527391901239753, "global_step": 68266, "epoch": 573, "lr": 4.810281391200932e-07} +{"train_loss": 0.0002713554713409394, "global_step": 68267, "epoch": 573, "lr": 4.80721609145246e-07} +{"train_loss": 0.0001501853985246271, "global_step": 68268, "epoch": 573, "lr": 4.80415176396215e-07} +{"train_loss": 0.00046789180487394333, "global_step": 68269, "epoch": 573, "lr": 4.801088408735888e-07} +{"train_loss": 0.00025445703067816794, "global_step": 68270, "epoch": 573, "lr": 4.798026025779889e-07} +{"train_loss": 0.00026329245883971453, "global_step": 68271, "epoch": 573, "lr": 4.794964615099984e-07} +{"train_loss": 0.00028320500859990716, "global_step": 68272, "epoch": 573, "lr": 4.791904176702278e-07} +{"train_loss": 0.00046324546565301716, "global_step": 68273, "epoch": 573, "lr": 4.788844710592766e-07} +{"train_loss": 0.00014683810877613723, "global_step": 68274, "epoch": 573, "lr": 4.785786216777443e-07} +{"train_loss": 0.00018266642291564494, "global_step": 68275, "epoch": 573, "lr": 4.782728695262361e-07} +{"train_loss": 0.0003748467715922743, "global_step": 68276, "epoch": 573, "lr": 4.77967214605346e-07} +{"train_loss": 0.00029807473765686154, "global_step": 68277, "epoch": 573, "lr": 4.776616569156789e-07} +{"train_loss": 0.00028146529803052545, "global_step": 68278, "epoch": 573, "lr": 4.773561964578288e-07} +{"train_loss": 0.0003029676154255867, "global_step": 68279, "epoch": 573, "lr": 4.770508332324009e-07} +{"train_loss": 0.0002063758292933926, "global_step": 68280, "epoch": 573, "lr": 4.76745567239989e-07} +{"train_loss": 0.00017384864622727036, "global_step": 68281, "epoch": 573, "lr": 4.764403984812038e-07} +{"train_loss": 0.00017191820370499045, "global_step": 68282, "epoch": 573, "lr": 4.761353269566282e-07} +{"train_loss": 0.0001626568118808791, "global_step": 68283, "epoch": 573, "lr": 4.7583035266687836e-07} +{"train_loss": 0.00014254983398132026, "global_step": 68284, "epoch": 573, "lr": 4.755254756125427e-07} +{"train_loss": 0.0002208110672654584, "global_step": 68285, "epoch": 573, "lr": 4.752206957942151e-07} +{"train_loss": 0.0001744057663017884, "global_step": 68286, "epoch": 573, "lr": 4.749160132125119e-07} +{"train_loss": 0.000269456475507468, "global_step": 68287, "epoch": 573, "lr": 4.7461142786801583e-07} +{"train_loss": 0.00030265841633081436, "global_step": 68288, "epoch": 573, "lr": 4.743069397613209e-07} +{"train_loss": 0.00017791116260923445, "global_step": 68289, "epoch": 573, "lr": 4.740025488930433e-07} +{"train_loss": 0.0002878379891626537, "global_step": 68290, "epoch": 573, "lr": 4.736982552637659e-07} +{"train_loss": 0.0004117429198231548, "global_step": 68291, "epoch": 573, "lr": 4.7339405887409373e-07} +{"train_loss": 0.00021682234364561737, "global_step": 68292, "epoch": 573, "lr": 4.7308995972462077e-07} +{"train_loss": 0.0002652248367667198, "global_step": 68293, "epoch": 573, "lr": 4.7278595781594105e-07} +{"train_loss": 0.00023322776542045176, "global_step": 68294, "epoch": 573, "lr": 4.7248205314865957e-07} +{"train_loss": 0.00018023481243290007, "global_step": 68295, "epoch": 573, "lr": 4.721782457233648e-07} +{"train_loss": 0.0002957526012323797, "global_step": 68296, "epoch": 573, "lr": 4.7187453554066175e-07} +{"train_loss": 0.00033093831734731793, "global_step": 68297, "epoch": 573, "lr": 4.715709226011389e-07} +{"train_loss": 0.0007863063947297633, "global_step": 68298, "epoch": 573, "lr": 4.712674069053957e-07} +{"train_loss": 0.00022580206859856844, "global_step": 68299, "epoch": 573, "lr": 4.709639884540262e-07} +{"train_loss": 0.0001687679614406079, "global_step": 68300, "epoch": 573, "lr": 4.7066066724762436e-07} +{"train_loss": 0.00014626933261752129, "global_step": 68301, "epoch": 573, "lr": 4.703574432867952e-07} +{"train_loss": 0.00018903489399235696, "global_step": 68302, "epoch": 573, "lr": 4.700543165721216e-07} +{"train_loss": 0.0002689619141165167, "global_step": 68303, "epoch": 573, "lr": 4.697512871042087e-07} +{"train_loss": 0.00036244720104150474, "global_step": 68304, "epoch": 573, "lr": 4.6944835488365036e-07} +{"train_loss": 0.0002655842126994746, "global_step": 68305, "epoch": 573, "lr": 4.6914551991103506e-07, "val_loss": 0.03262219950556755} +{"train_loss": 0.00035002556978724897, "global_step": 68306, "epoch": 574, "lr": 4.688427821869623e-07} +{"train_loss": 0.0005273642018437386, "global_step": 68307, "epoch": 574, "lr": 4.685401417120205e-07} +{"train_loss": 0.00034994762972928584, "global_step": 68308, "epoch": 574, "lr": 4.682375984868148e-07} +{"train_loss": 0.000403871905291453, "global_step": 68309, "epoch": 574, "lr": 4.67935152511928e-07} +{"train_loss": 0.0001929790450958535, "global_step": 68310, "epoch": 574, "lr": 4.676328037879596e-07} +{"train_loss": 0.0002589092473499477, "global_step": 68311, "epoch": 574, "lr": 4.673305523155036e-07} +{"train_loss": 0.00028211716562509537, "global_step": 68312, "epoch": 574, "lr": 4.6702839809515397e-07} +{"train_loss": 0.00017668325745034963, "global_step": 68313, "epoch": 574, "lr": 4.667263411274991e-07} +{"train_loss": 0.00014229472435545176, "global_step": 68314, "epoch": 574, "lr": 4.664243814131386e-07} +{"train_loss": 0.00012474793766159564, "global_step": 68315, "epoch": 574, "lr": 4.661225189526608e-07} +{"train_loss": 0.00024341924290638417, "global_step": 68316, "epoch": 574, "lr": 4.6582075374665965e-07} +{"train_loss": 0.00036532513331621885, "global_step": 68317, "epoch": 574, "lr": 4.655190857957237e-07} +{"train_loss": 0.00040664037805981934, "global_step": 68318, "epoch": 574, "lr": 4.652175151004523e-07} +{"train_loss": 0.00015496634296141565, "global_step": 68319, "epoch": 574, "lr": 4.64916041661434e-07} +{"train_loss": 0.0005683383205905557, "global_step": 68320, "epoch": 574, "lr": 4.646146654792627e-07} +{"train_loss": 0.0003911999228876084, "global_step": 68321, "epoch": 574, "lr": 4.643133865545213e-07} +{"train_loss": 0.00030628006788901985, "global_step": 68322, "epoch": 574, "lr": 4.640122048878204e-07} +{"train_loss": 0.00039448862662538886, "global_step": 68323, "epoch": 574, "lr": 4.637111204797318e-07} +{"train_loss": 0.00017015988123603165, "global_step": 68324, "epoch": 574, "lr": 4.6341013333085493e-07} +{"train_loss": 0.0005627226200886071, "global_step": 68325, "epoch": 574, "lr": 4.631092434417783e-07} +{"train_loss": 0.0001753085380187258, "global_step": 68326, "epoch": 574, "lr": 4.6280845081309587e-07} +{"train_loss": 0.00024101248709484935, "global_step": 68327, "epoch": 574, "lr": 4.6250775544540157e-07} +{"train_loss": 0.0001921222428791225, "global_step": 68328, "epoch": 574, "lr": 4.6220715733927277e-07} +{"train_loss": 0.00014090925105847418, "global_step": 68329, "epoch": 574, "lr": 4.619066564953145e-07} +{"train_loss": 0.00027706805849447846, "global_step": 68330, "epoch": 574, "lr": 4.616062529141096e-07} +{"train_loss": 0.0004188587481621653, "global_step": 68331, "epoch": 574, "lr": 4.613059465962466e-07} +{"train_loss": 0.00015605002408847213, "global_step": 68332, "epoch": 574, "lr": 4.610057375423138e-07} +{"train_loss": 0.00025216839276254177, "global_step": 68333, "epoch": 574, "lr": 4.607056257529052e-07} +{"train_loss": 0.000586862675845623, "global_step": 68334, "epoch": 574, "lr": 4.604056112286148e-07} +{"train_loss": 0.00013320725702214986, "global_step": 68335, "epoch": 574, "lr": 4.601056939700199e-07} +{"train_loss": 0.00020226264314260334, "global_step": 68336, "epoch": 574, "lr": 4.5980587397771446e-07} +{"train_loss": 0.0001396075531374663, "global_step": 68337, "epoch": 574, "lr": 4.5950615125229245e-07} +{"train_loss": 0.00025609589647501707, "global_step": 68338, "epoch": 574, "lr": 4.5920652579433123e-07} +{"train_loss": 0.00025939103215932846, "global_step": 68339, "epoch": 574, "lr": 4.5890699760443025e-07} +{"train_loss": 0.00016949299606494606, "global_step": 68340, "epoch": 574, "lr": 4.5860756668316687e-07} +{"train_loss": 0.00022418334265239537, "global_step": 68341, "epoch": 574, "lr": 4.5830823303114056e-07} +{"train_loss": 0.0001793514529708773, "global_step": 68342, "epoch": 574, "lr": 4.5800899664893425e-07} +{"train_loss": 0.0001837864692788571, "global_step": 68343, "epoch": 574, "lr": 4.577098575371308e-07} +{"train_loss": 0.0002486149896867573, "global_step": 68344, "epoch": 574, "lr": 4.574108156963186e-07} +{"train_loss": 0.00019854526908602566, "global_step": 68345, "epoch": 574, "lr": 4.5711187112709163e-07} +{"train_loss": 0.0002118674456141889, "global_step": 68346, "epoch": 574, "lr": 4.5681302383003276e-07} +{"train_loss": 0.00025466797524131835, "global_step": 68347, "epoch": 574, "lr": 4.565142738057249e-07} +{"train_loss": 0.00023435326875187457, "global_step": 68348, "epoch": 574, "lr": 4.562156210547619e-07} +{"train_loss": 0.00035446061519905925, "global_step": 68349, "epoch": 574, "lr": 4.559170655777267e-07} +{"train_loss": 0.00014265341451391578, "global_step": 68350, "epoch": 574, "lr": 4.556186073752022e-07} +{"train_loss": 0.0002610491355881095, "global_step": 68351, "epoch": 574, "lr": 4.5532024644778235e-07} +{"train_loss": 0.00017373081936966628, "global_step": 68352, "epoch": 574, "lr": 4.5502198279604447e-07} +{"train_loss": 0.0004217495152261108, "global_step": 68353, "epoch": 574, "lr": 4.547238164205769e-07} +{"train_loss": 0.0003171440912410617, "global_step": 68354, "epoch": 574, "lr": 4.5442574732197374e-07} +{"train_loss": 0.00018582891789264977, "global_step": 68355, "epoch": 574, "lr": 4.541277755008011e-07} +{"train_loss": 0.00027347839204594493, "global_step": 68356, "epoch": 574, "lr": 4.5382990095766407e-07} +{"train_loss": 0.0002189148945035413, "global_step": 68357, "epoch": 574, "lr": 4.5353212369313446e-07} +{"train_loss": 0.00020398326159920543, "global_step": 68358, "epoch": 574, "lr": 4.5323444370780065e-07} +{"train_loss": 0.0003509671369101852, "global_step": 68359, "epoch": 574, "lr": 4.5293686100225107e-07} +{"train_loss": 0.00024311544257216156, "global_step": 68360, "epoch": 574, "lr": 4.52639375577063e-07} +{"train_loss": 0.00021529843797907233, "global_step": 68361, "epoch": 574, "lr": 4.523419874328305e-07} +{"train_loss": 0.0002534851082600653, "global_step": 68362, "epoch": 574, "lr": 4.520446965701253e-07} +{"train_loss": 0.0004869055701419711, "global_step": 68363, "epoch": 574, "lr": 4.5174750298954126e-07} +{"train_loss": 0.0004163036064710468, "global_step": 68364, "epoch": 574, "lr": 4.514504066916503e-07} +{"train_loss": 0.0002230492391390726, "global_step": 68365, "epoch": 574, "lr": 4.5115340767705184e-07} +{"train_loss": 0.00036402526893652976, "global_step": 68366, "epoch": 574, "lr": 4.508565059463121e-07} +{"train_loss": 0.00021338700025808066, "global_step": 68367, "epoch": 574, "lr": 4.5055970150002515e-07} +{"train_loss": 0.0002564602764323354, "global_step": 68368, "epoch": 574, "lr": 4.502629943387737e-07} +{"train_loss": 0.00040334343793801963, "global_step": 68369, "epoch": 574, "lr": 4.4996638446313523e-07} +{"train_loss": 0.00014366916730068624, "global_step": 68370, "epoch": 574, "lr": 4.4966987187369245e-07} +{"train_loss": 0.00027293807943351567, "global_step": 68371, "epoch": 574, "lr": 4.4937345657102837e-07} +{"train_loss": 0.00018872885266318917, "global_step": 68372, "epoch": 574, "lr": 4.490771385557313e-07} +{"train_loss": 0.0003269535081926733, "global_step": 68373, "epoch": 574, "lr": 4.4878091782837304e-07} +{"train_loss": 0.0003008215280715376, "global_step": 68374, "epoch": 574, "lr": 4.4848479438954206e-07} +{"train_loss": 0.0002430073800496757, "global_step": 68375, "epoch": 574, "lr": 4.481887682398156e-07} +{"train_loss": 0.00018844674923457205, "global_step": 68376, "epoch": 574, "lr": 4.4789283937977654e-07} +{"train_loss": 0.00012423857697285712, "global_step": 68377, "epoch": 574, "lr": 4.475970078100078e-07} +{"train_loss": 0.00013767635391559452, "global_step": 68378, "epoch": 574, "lr": 4.4730127353108664e-07} +{"train_loss": 0.00035648568882606924, "global_step": 68379, "epoch": 574, "lr": 4.4700563654359597e-07} +{"train_loss": 0.00022487175010610372, "global_step": 68380, "epoch": 574, "lr": 4.4671009684811306e-07} +{"train_loss": 0.0002438211813569069, "global_step": 68381, "epoch": 574, "lr": 4.4641465444522633e-07} +{"train_loss": 0.000247262156335637, "global_step": 68382, "epoch": 574, "lr": 4.461193093355076e-07} +{"train_loss": 0.00019448870443738997, "global_step": 68383, "epoch": 574, "lr": 4.458240615195397e-07} +{"train_loss": 0.00025303667644038796, "global_step": 68384, "epoch": 574, "lr": 4.4552891099789995e-07} +{"train_loss": 0.00013743147428613156, "global_step": 68385, "epoch": 574, "lr": 4.4523385777117123e-07} +{"train_loss": 0.00019229504687245935, "global_step": 68386, "epoch": 574, "lr": 4.4493890183993634e-07} +{"train_loss": 0.0003193998127244413, "global_step": 68387, "epoch": 574, "lr": 4.4464404320476714e-07} +{"train_loss": 0.00028964655939489603, "global_step": 68388, "epoch": 574, "lr": 4.443492818662409e-07} +{"train_loss": 0.0005491580232046545, "global_step": 68389, "epoch": 574, "lr": 4.4405461782494606e-07} +{"train_loss": 0.00022816096316091716, "global_step": 68390, "epoch": 574, "lr": 4.437600510814488e-07} +{"train_loss": 0.00012952629185747355, "global_step": 68391, "epoch": 574, "lr": 4.4346558163634313e-07} +{"train_loss": 0.00015804541180841625, "global_step": 68392, "epoch": 574, "lr": 4.431712094901952e-07} +{"train_loss": 0.0002503147115930915, "global_step": 68393, "epoch": 574, "lr": 4.4287693464358236e-07} +{"train_loss": 0.00017248251242563128, "global_step": 68394, "epoch": 574, "lr": 4.425827570970931e-07} +{"train_loss": 0.00037944965879432857, "global_step": 68395, "epoch": 574, "lr": 4.422886768512935e-07} +{"train_loss": 0.0002963745500892401, "global_step": 68396, "epoch": 574, "lr": 4.419946939067665e-07} +{"train_loss": 0.00022585102124139667, "global_step": 68397, "epoch": 574, "lr": 4.417008082640894e-07} +{"train_loss": 0.0001975169579964131, "global_step": 68398, "epoch": 574, "lr": 4.41407019923834e-07} +{"train_loss": 0.0003788829199038446, "global_step": 68399, "epoch": 574, "lr": 4.4111332888658876e-07} +{"train_loss": 0.00021437153918668628, "global_step": 68400, "epoch": 574, "lr": 4.408197351529197e-07} +{"train_loss": 0.0002810435544233769, "global_step": 68401, "epoch": 574, "lr": 4.4052623872340436e-07} +{"train_loss": 0.00018883327720686793, "global_step": 68402, "epoch": 574, "lr": 4.4023283959861994e-07} +{"train_loss": 0.00027095217956230044, "global_step": 68403, "epoch": 574, "lr": 4.399395377791493e-07} +{"train_loss": 0.00034536237944848835, "global_step": 68404, "epoch": 574, "lr": 4.396463332655587e-07} +{"train_loss": 0.0006883979076519608, "global_step": 68405, "epoch": 574, "lr": 4.3935322605842545e-07} +{"train_loss": 0.0001573156623635441, "global_step": 68406, "epoch": 574, "lr": 4.390602161583324e-07} +{"train_loss": 0.00030256883474066854, "global_step": 68407, "epoch": 574, "lr": 4.387673035658457e-07} +{"train_loss": 0.00013282963482197374, "global_step": 68408, "epoch": 574, "lr": 4.3847448828154836e-07} +{"train_loss": 0.00020295589638408273, "global_step": 68409, "epoch": 574, "lr": 4.38181770306012e-07} +{"train_loss": 0.00039656751323491335, "global_step": 68410, "epoch": 574, "lr": 4.3788914963980856e-07} +{"train_loss": 0.0002301703643752262, "global_step": 68411, "epoch": 574, "lr": 4.3759662628351515e-07} +{"train_loss": 0.00039801871753297746, "global_step": 68412, "epoch": 574, "lr": 4.3730420023770367e-07} +{"train_loss": 0.0002714112342800945, "global_step": 68413, "epoch": 574, "lr": 4.370118715029514e-07} +{"train_loss": 0.00019813056860584766, "global_step": 68414, "epoch": 574, "lr": 4.3671964007983013e-07} +{"train_loss": 0.0002371448208577931, "global_step": 68415, "epoch": 574, "lr": 4.364275059689171e-07} +{"train_loss": 0.0002219151210738346, "global_step": 68416, "epoch": 574, "lr": 4.361354691707842e-07} +{"train_loss": 0.00016448795213364065, "global_step": 68417, "epoch": 574, "lr": 4.3584352968600304e-07} +{"train_loss": 0.0001276545226573944, "global_step": 68418, "epoch": 574, "lr": 4.355516875151511e-07} +{"train_loss": 0.00018667963740881532, "global_step": 68419, "epoch": 574, "lr": 4.3525994265879443e-07} +{"train_loss": 0.0002304519439348951, "global_step": 68420, "epoch": 574, "lr": 4.3496829511751046e-07} +{"train_loss": 0.00021091011876706034, "global_step": 68421, "epoch": 574, "lr": 4.346767448918709e-07} +{"train_loss": 0.00028277290402911603, "global_step": 68422, "epoch": 574, "lr": 4.343852919824476e-07} +{"train_loss": 0.00026127134333364666, "global_step": 68423, "epoch": 574, "lr": 4.3409393638981777e-07} +{"train_loss": 0.00026409827322433036, "global_step": 68424, "epoch": 574, "lr": 4.338026781145421e-07, "val_loss": 0.02070903405547142} +{"train_loss": 0.0006717328215017915, "global_step": 68425, "epoch": 575, "lr": 4.3351151715720907e-07} +{"train_loss": 0.0002698275784496218, "global_step": 68426, "epoch": 575, "lr": 4.332204535183737e-07} +{"train_loss": 0.00028993189334869385, "global_step": 68427, "epoch": 575, "lr": 4.329294871986134e-07} +{"train_loss": 0.000303968001389876, "global_step": 68428, "epoch": 575, "lr": 4.3263861819850535e-07} +{"train_loss": 0.00021329816081561148, "global_step": 68429, "epoch": 575, "lr": 4.3234784651861037e-07} +{"train_loss": 0.00025154848117381334, "global_step": 68430, "epoch": 575, "lr": 4.3205717215951126e-07} +{"train_loss": 0.00047029188135638833, "global_step": 68431, "epoch": 575, "lr": 4.3176659512176865e-07} +{"train_loss": 0.00020869319268967956, "global_step": 68432, "epoch": 575, "lr": 4.314761154059599e-07} +{"train_loss": 0.0002586502523627132, "global_step": 68433, "epoch": 575, "lr": 4.3118573301264564e-07} +{"train_loss": 0.0006584200309589505, "global_step": 68434, "epoch": 575, "lr": 4.308954479424088e-07} +{"train_loss": 0.00015538708248641342, "global_step": 68435, "epoch": 575, "lr": 4.3060526019580996e-07} +{"train_loss": 0.00022719339176546782, "global_step": 68436, "epoch": 575, "lr": 4.303151697734209e-07} +{"train_loss": 0.0001585840218467638, "global_step": 68437, "epoch": 575, "lr": 4.3002517667581346e-07} +{"train_loss": 0.0001305867190239951, "global_step": 68438, "epoch": 575, "lr": 4.297352809035593e-07} +{"train_loss": 0.00029714085394516587, "global_step": 68439, "epoch": 575, "lr": 4.2944548245721917e-07} +{"train_loss": 0.0004881858767475933, "global_step": 68440, "epoch": 575, "lr": 4.291557813373703e-07} +{"train_loss": 0.00015120622992981225, "global_step": 68441, "epoch": 575, "lr": 4.2886617754457903e-07} +{"train_loss": 0.00028022099286317825, "global_step": 68442, "epoch": 575, "lr": 4.2857667107940594e-07} +{"train_loss": 0.00012175292067695409, "global_step": 68443, "epoch": 575, "lr": 4.2828726194243384e-07} +{"train_loss": 0.0003137729363515973, "global_step": 68444, "epoch": 575, "lr": 4.279979501342179e-07} +{"train_loss": 0.0001707385090412572, "global_step": 68445, "epoch": 575, "lr": 4.277087356553411e-07} +{"train_loss": 0.00014458471559919417, "global_step": 68446, "epoch": 575, "lr": 4.274196185063528e-07} +{"train_loss": 0.0003363826253917068, "global_step": 68447, "epoch": 575, "lr": 4.27130598687836e-07} +{"train_loss": 0.0002898011589422822, "global_step": 68448, "epoch": 575, "lr": 4.2684167620034576e-07} +{"train_loss": 0.00016992884047795087, "global_step": 68449, "epoch": 575, "lr": 4.26552851044465e-07} +{"train_loss": 0.00023824030358809978, "global_step": 68450, "epoch": 575, "lr": 4.2626412322074317e-07} +{"train_loss": 0.0003329002356622368, "global_step": 68451, "epoch": 575, "lr": 4.259754927297632e-07} +{"train_loss": 0.0003931749379262328, "global_step": 68452, "epoch": 575, "lr": 4.256869595720747e-07} +{"train_loss": 0.00012705799599643797, "global_step": 68453, "epoch": 575, "lr": 4.253985237482605e-07} +{"train_loss": 0.00045549252536147833, "global_step": 68454, "epoch": 575, "lr": 4.2511018525888123e-07} +{"train_loss": 0.000181097726454027, "global_step": 68455, "epoch": 575, "lr": 4.248219441044976e-07} +{"train_loss": 0.00026643619639799, "global_step": 68456, "epoch": 575, "lr": 4.2453380028568137e-07} +{"train_loss": 0.00020092978957109153, "global_step": 68457, "epoch": 575, "lr": 4.2424575380299867e-07} +{"train_loss": 0.0001415275619365275, "global_step": 68458, "epoch": 575, "lr": 4.239578046570103e-07} +{"train_loss": 0.0002239934547105804, "global_step": 68459, "epoch": 575, "lr": 4.236699528482824e-07} +{"train_loss": 0.00023976652300916612, "global_step": 68460, "epoch": 575, "lr": 4.233821983773867e-07} +{"train_loss": 0.00034788731136359274, "global_step": 68461, "epoch": 575, "lr": 4.230945412448839e-07} +{"train_loss": 0.00016889124526642263, "global_step": 68462, "epoch": 575, "lr": 4.228069814513347e-07} +{"train_loss": 0.00016542986850254238, "global_step": 68463, "epoch": 575, "lr": 4.225195189973108e-07} +{"train_loss": 0.0003236363991163671, "global_step": 68464, "epoch": 575, "lr": 4.2223215388336734e-07} +{"train_loss": 0.00012335946667008102, "global_step": 68465, "epoch": 575, "lr": 4.2194488611008164e-07} +{"train_loss": 0.0003784078871831298, "global_step": 68466, "epoch": 575, "lr": 4.216577156780033e-07} +{"train_loss": 0.0006444918108172715, "global_step": 68467, "epoch": 575, "lr": 4.2137064258770954e-07} +{"train_loss": 0.00025574187748134136, "global_step": 68468, "epoch": 575, "lr": 4.210836668397611e-07} +{"train_loss": 0.000279477535514161, "global_step": 68469, "epoch": 575, "lr": 4.207967884347075e-07} +{"train_loss": 0.00022005946084391326, "global_step": 68470, "epoch": 575, "lr": 4.2051000737313164e-07} +{"train_loss": 0.00014487699081655592, "global_step": 68471, "epoch": 575, "lr": 4.2022332365558304e-07} +{"train_loss": 0.0005175615078769624, "global_step": 68472, "epoch": 575, "lr": 4.1993673728262796e-07} +{"train_loss": 0.0001893337903311476, "global_step": 68473, "epoch": 575, "lr": 4.196502482548326e-07} +{"train_loss": 0.00021363762789405882, "global_step": 68474, "epoch": 575, "lr": 4.1936385657275757e-07} +{"train_loss": 0.00031972595024853945, "global_step": 68475, "epoch": 575, "lr": 4.1907756223696357e-07} +{"train_loss": 0.00041341903852298856, "global_step": 68476, "epoch": 575, "lr": 4.1879136524801133e-07} +{"train_loss": 0.00024098969879560173, "global_step": 68477, "epoch": 575, "lr": 4.1850526560646694e-07} +{"train_loss": 0.0002059212129097432, "global_step": 68478, "epoch": 575, "lr": 4.1821926331289675e-07} +{"train_loss": 0.0003717221843544394, "global_step": 68479, "epoch": 575, "lr": 4.1793335836784464e-07} +{"train_loss": 0.00039627731894142926, "global_step": 68480, "epoch": 575, "lr": 4.1764755077189355e-07} +{"train_loss": 0.0002320317435078323, "global_step": 68481, "epoch": 575, "lr": 4.1736184052558747e-07} +{"train_loss": 0.00022459766478277743, "global_step": 68482, "epoch": 575, "lr": 4.1707622762949816e-07} +{"train_loss": 0.00041219606646336615, "global_step": 68483, "epoch": 575, "lr": 4.1679071208418073e-07} +{"train_loss": 0.00017453108739573509, "global_step": 68484, "epoch": 575, "lr": 4.1650529389020144e-07} +{"train_loss": 0.0002804292307700962, "global_step": 68485, "epoch": 575, "lr": 4.162199730481098e-07} +{"train_loss": 0.0002869260497391224, "global_step": 68486, "epoch": 575, "lr": 4.1593474955847753e-07} +{"train_loss": 0.00019926062668673694, "global_step": 68487, "epoch": 575, "lr": 4.156496234218654e-07} +{"train_loss": 0.00017687914078123868, "global_step": 68488, "epoch": 575, "lr": 4.153645946388174e-07} +{"train_loss": 0.00023491549654863775, "global_step": 68489, "epoch": 575, "lr": 4.150796632099108e-07} +{"train_loss": 0.0001220326084876433, "global_step": 68490, "epoch": 575, "lr": 4.147948291356951e-07} +{"train_loss": 0.00027735091862268746, "global_step": 68491, "epoch": 575, "lr": 4.145100924167311e-07} +{"train_loss": 0.00022193195763975382, "global_step": 68492, "epoch": 575, "lr": 4.1422545305358494e-07} +{"train_loss": 0.00028638727962970734, "global_step": 68493, "epoch": 575, "lr": 4.1394091104680067e-07} +{"train_loss": 0.0007092228042893112, "global_step": 68494, "epoch": 575, "lr": 4.1365646639695554e-07} +{"train_loss": 0.00016602090909145772, "global_step": 68495, "epoch": 575, "lr": 4.1337211910458804e-07} +{"train_loss": 0.0002023559354711324, "global_step": 68496, "epoch": 575, "lr": 4.1308786917027554e-07} +{"train_loss": 0.0003232377057429403, "global_step": 68497, "epoch": 575, "lr": 4.1280371659456194e-07} +{"train_loss": 0.00028982345247641206, "global_step": 68498, "epoch": 575, "lr": 4.125196613780136e-07} +{"train_loss": 0.00013662592391483486, "global_step": 68499, "epoch": 575, "lr": 4.122357035211855e-07} +{"train_loss": 0.00020213884999975562, "global_step": 68500, "epoch": 575, "lr": 4.119518430246327e-07} +{"train_loss": 0.00013543742534238845, "global_step": 68501, "epoch": 575, "lr": 4.116680798889161e-07} +{"train_loss": 0.0002583306923042983, "global_step": 68502, "epoch": 575, "lr": 4.1138441411459063e-07} +{"train_loss": 0.00026225371402688324, "global_step": 68503, "epoch": 575, "lr": 4.1110084570221696e-07} +{"train_loss": 0.00017580452549736947, "global_step": 68504, "epoch": 575, "lr": 4.108173746523447e-07} +{"train_loss": 0.00034110716660507023, "global_step": 68505, "epoch": 575, "lr": 4.1053400096554007e-07} +{"train_loss": 0.00017814860621001571, "global_step": 68506, "epoch": 575, "lr": 4.102507246423526e-07} +{"train_loss": 0.00013988977298140526, "global_step": 68507, "epoch": 575, "lr": 4.0996754568333737e-07} +{"train_loss": 0.00019552702724467963, "global_step": 68508, "epoch": 575, "lr": 4.0968446408905513e-07} +{"train_loss": 0.00017009662406053394, "global_step": 68509, "epoch": 575, "lr": 4.094014798600554e-07} +{"train_loss": 0.00016714751836843789, "global_step": 68510, "epoch": 575, "lr": 4.0911859299689883e-07} +{"train_loss": 0.00015562816406600177, "global_step": 68511, "epoch": 575, "lr": 4.088358035001405e-07} +{"train_loss": 0.00019386202620808035, "global_step": 68512, "epoch": 575, "lr": 4.0855311137033556e-07} +{"train_loss": 0.0002480406255926937, "global_step": 68513, "epoch": 575, "lr": 4.0827051660803917e-07} +{"train_loss": 0.0002458423550706357, "global_step": 68514, "epoch": 575, "lr": 4.0798801921380637e-07} +{"train_loss": 0.00019723543664440513, "global_step": 68515, "epoch": 575, "lr": 4.077056191881923e-07} +{"train_loss": 0.00018287470447830856, "global_step": 68516, "epoch": 575, "lr": 4.0742331653174647e-07} +{"train_loss": 0.00026385989622212946, "global_step": 68517, "epoch": 575, "lr": 4.071411112450296e-07} +{"train_loss": 0.00019356345001142472, "global_step": 68518, "epoch": 575, "lr": 4.068590033285913e-07} +{"train_loss": 0.00013574454351328313, "global_step": 68519, "epoch": 575, "lr": 4.0657699278298654e-07} +{"train_loss": 0.000267758994596079, "global_step": 68520, "epoch": 575, "lr": 4.0629507960877054e-07} +{"train_loss": 0.0003535413125064224, "global_step": 68521, "epoch": 575, "lr": 4.060132638064984e-07} +{"train_loss": 0.0003057665308006108, "global_step": 68522, "epoch": 575, "lr": 4.0573154537671966e-07} +{"train_loss": 0.00018383080896455795, "global_step": 68523, "epoch": 575, "lr": 4.0544992431998386e-07} +{"train_loss": 0.0002564308815635741, "global_step": 68524, "epoch": 575, "lr": 4.0516840063685166e-07} +{"train_loss": 0.00013891674461774528, "global_step": 68525, "epoch": 575, "lr": 4.0488697432787825e-07} +{"train_loss": 0.00014540707343257964, "global_step": 68526, "epoch": 575, "lr": 4.04605645393602e-07} +{"train_loss": 0.0005228142254054546, "global_step": 68527, "epoch": 575, "lr": 4.0432441383458916e-07} +{"train_loss": 0.00019241108384449035, "global_step": 68528, "epoch": 575, "lr": 4.040432796513838e-07} +{"train_loss": 0.000358429184416309, "global_step": 68529, "epoch": 575, "lr": 4.037622428445464e-07} +{"train_loss": 0.00017135617963504046, "global_step": 68530, "epoch": 575, "lr": 4.034813034146212e-07} +{"train_loss": 0.00026579873519949615, "global_step": 68531, "epoch": 575, "lr": 4.032004613621576e-07} +{"train_loss": 0.0002501075796317309, "global_step": 68532, "epoch": 575, "lr": 4.029197166877163e-07} +{"train_loss": 0.00018896169785875827, "global_step": 68533, "epoch": 575, "lr": 4.026390693918358e-07} +{"train_loss": 0.0002180107549065724, "global_step": 68534, "epoch": 575, "lr": 4.023585194750823e-07} +{"train_loss": 0.00018547213403508067, "global_step": 68535, "epoch": 575, "lr": 4.020780669379942e-07} +{"train_loss": 0.0002785127726383507, "global_step": 68536, "epoch": 575, "lr": 4.017977117811322e-07} +{"train_loss": 0.00021217514586169273, "global_step": 68537, "epoch": 575, "lr": 4.0151745400504036e-07} +{"train_loss": 0.00021674558229278773, "global_step": 68538, "epoch": 575, "lr": 4.0123729361026817e-07} +{"train_loss": 0.0002922642743214965, "global_step": 68539, "epoch": 575, "lr": 4.009572305973708e-07} +{"train_loss": 0.0002312661672476679, "global_step": 68540, "epoch": 575, "lr": 4.0067726496689217e-07} +{"train_loss": 0.0003182635409757495, "global_step": 68541, "epoch": 575, "lr": 4.0039739671938745e-07} +{"train_loss": 0.00012214969319757074, "global_step": 68542, "epoch": 575, "lr": 4.0011762585539515e-07} +{"train_loss": 0.0002571536164961661, "global_step": 68543, "epoch": 575, "lr": 3.998379523754814e-07, "val_loss": 0.018385956063866615, "train_action_mse_error": 2.831456185958814e-06} +{"train_loss": 0.0004417419550009072, "global_step": 68544, "epoch": 576, "lr": 3.995583762801847e-07} +{"train_loss": 0.00023399134806822985, "global_step": 68545, "epoch": 576, "lr": 3.992788975700601e-07} +{"train_loss": 0.0003691287129186094, "global_step": 68546, "epoch": 576, "lr": 3.989995162456461e-07} +{"train_loss": 0.00015050631191115826, "global_step": 68547, "epoch": 576, "lr": 3.987202323074979e-07} +{"train_loss": 0.0002150029904441908, "global_step": 68548, "epoch": 576, "lr": 3.9844104575616494e-07} +{"train_loss": 0.0002205346681876108, "global_step": 68549, "epoch": 576, "lr": 3.981619565921968e-07} +{"train_loss": 0.000347454275470227, "global_step": 68550, "epoch": 576, "lr": 3.97882964816132e-07} +{"train_loss": 0.0005201727035455406, "global_step": 68551, "epoch": 576, "lr": 3.976040704285311e-07} +{"train_loss": 0.00020800867059733719, "global_step": 68552, "epoch": 576, "lr": 3.973252734299326e-07} +{"train_loss": 0.000260339118540287, "global_step": 68553, "epoch": 576, "lr": 3.970465738208862e-07} +{"train_loss": 0.00014953099889680743, "global_step": 68554, "epoch": 576, "lr": 3.9676797160194123e-07} +{"train_loss": 0.0004295877006370574, "global_step": 68555, "epoch": 576, "lr": 3.964894667736418e-07} +{"train_loss": 0.00017323720385320485, "global_step": 68556, "epoch": 576, "lr": 3.962110593365376e-07} +{"train_loss": 0.0003049587248824537, "global_step": 68557, "epoch": 576, "lr": 3.959327492911724e-07} +{"train_loss": 0.0001591697073308751, "global_step": 68558, "epoch": 576, "lr": 3.9565453663809037e-07} +{"train_loss": 0.0002732969296630472, "global_step": 68559, "epoch": 576, "lr": 3.953764213778466e-07} +{"train_loss": 0.0004546859418042004, "global_step": 68560, "epoch": 576, "lr": 3.9509840351097947e-07} +{"train_loss": 0.00027007394237443805, "global_step": 68561, "epoch": 576, "lr": 3.9482048303803865e-07} +{"train_loss": 0.00017479537928011268, "global_step": 68562, "epoch": 576, "lr": 3.9454265995956254e-07} +{"train_loss": 0.00025698007084429264, "global_step": 68563, "epoch": 576, "lr": 3.9426493427611177e-07} +{"train_loss": 0.0002251633704872802, "global_step": 68564, "epoch": 576, "lr": 3.9398730598821377e-07} +{"train_loss": 0.0002522138529457152, "global_step": 68565, "epoch": 576, "lr": 3.9370977509642917e-07} +{"train_loss": 0.00015041530423332006, "global_step": 68566, "epoch": 576, "lr": 3.934323416012908e-07} +{"train_loss": 0.00020592597138602287, "global_step": 68567, "epoch": 576, "lr": 3.9315500550334837e-07} +{"train_loss": 0.00024175162252504379, "global_step": 68568, "epoch": 576, "lr": 3.9287776680315135e-07} +{"train_loss": 0.0002575647667981684, "global_step": 68569, "epoch": 576, "lr": 3.9260062550123265e-07} +{"train_loss": 0.00022693176288157701, "global_step": 68570, "epoch": 576, "lr": 3.9232358159814743e-07} +{"train_loss": 0.0001718664134386927, "global_step": 68571, "epoch": 576, "lr": 3.920466350944285e-07} +{"train_loss": 0.00028092687716707587, "global_step": 68572, "epoch": 576, "lr": 3.9176978599063106e-07} +{"train_loss": 0.00019799817528109998, "global_step": 68573, "epoch": 576, "lr": 3.914930342872936e-07} +{"train_loss": 0.0003826619067694992, "global_step": 68574, "epoch": 576, "lr": 3.9121637998495995e-07} +{"train_loss": 0.0003935581771656871, "global_step": 68575, "epoch": 576, "lr": 3.909398230841743e-07} +{"train_loss": 0.00017177994595840573, "global_step": 68576, "epoch": 576, "lr": 3.9066336358547505e-07} +{"train_loss": 0.00022825918858870864, "global_step": 68577, "epoch": 576, "lr": 3.903870014894118e-07} +{"train_loss": 0.00020191144722048193, "global_step": 68578, "epoch": 576, "lr": 3.901107367965229e-07} +{"train_loss": 0.00030947441700845957, "global_step": 68579, "epoch": 576, "lr": 3.898345695073469e-07} +{"train_loss": 0.0002660336613189429, "global_step": 68580, "epoch": 576, "lr": 3.8955849962243884e-07} +{"train_loss": 0.00019758024427574128, "global_step": 68581, "epoch": 576, "lr": 3.8928252714232616e-07} +{"train_loss": 0.0001973385806195438, "global_step": 68582, "epoch": 576, "lr": 3.890066520675584e-07} +{"train_loss": 0.0008433479815721512, "global_step": 68583, "epoch": 576, "lr": 3.8873087439867396e-07} +{"train_loss": 0.00033622642513364553, "global_step": 68584, "epoch": 576, "lr": 3.8845519413622244e-07} +{"train_loss": 0.00019345419423189014, "global_step": 68585, "epoch": 576, "lr": 3.881796112807312e-07} +{"train_loss": 0.00020805759413633496, "global_step": 68586, "epoch": 576, "lr": 3.8790412583275537e-07} +{"train_loss": 0.0002648687514010817, "global_step": 68587, "epoch": 576, "lr": 3.876287377928278e-07} +{"train_loss": 0.00036043921136297286, "global_step": 68588, "epoch": 576, "lr": 3.873534471614926e-07} +{"train_loss": 0.00017591133655514568, "global_step": 68589, "epoch": 576, "lr": 3.870782539392881e-07} +{"train_loss": 0.0003207131812814623, "global_step": 68590, "epoch": 576, "lr": 3.868031581267473e-07} +{"train_loss": 0.00022709464246872813, "global_step": 68591, "epoch": 576, "lr": 3.8652815972442525e-07} +{"train_loss": 0.00016589435108471662, "global_step": 68592, "epoch": 576, "lr": 3.862532587328549e-07} +{"train_loss": 0.00032093614572659135, "global_step": 68593, "epoch": 576, "lr": 3.859784551525747e-07} +{"train_loss": 0.0004034089797642082, "global_step": 68594, "epoch": 576, "lr": 3.8570374898412863e-07} +{"train_loss": 0.00016931451682467014, "global_step": 68595, "epoch": 576, "lr": 3.854291402280441e-07} +{"train_loss": 0.00012436007091309875, "global_step": 68596, "epoch": 576, "lr": 3.851546288848762e-07} +{"train_loss": 0.00022743549197912216, "global_step": 68597, "epoch": 576, "lr": 3.8488021495515223e-07} +{"train_loss": 0.0003315925714559853, "global_step": 68598, "epoch": 576, "lr": 3.8460589843942184e-07} +{"train_loss": 0.0002863082045223564, "global_step": 68599, "epoch": 576, "lr": 3.8433167933821237e-07} +{"train_loss": 0.00028471031691879034, "global_step": 68600, "epoch": 576, "lr": 3.8405755765206777e-07} +{"train_loss": 0.0001795165881048888, "global_step": 68601, "epoch": 576, "lr": 3.8378353338152653e-07} +{"train_loss": 0.00027597733424045146, "global_step": 68602, "epoch": 576, "lr": 3.8350960652712154e-07} +{"train_loss": 0.0002589500218164176, "global_step": 68603, "epoch": 576, "lr": 3.832357770894024e-07} +{"train_loss": 0.00022150254517327994, "global_step": 68604, "epoch": 576, "lr": 3.8296204506889087e-07} +{"train_loss": 0.00021396897500380874, "global_step": 68605, "epoch": 576, "lr": 3.826884104661366e-07} +{"train_loss": 0.00025086948880925775, "global_step": 68606, "epoch": 576, "lr": 3.824148732816724e-07} +{"train_loss": 0.00039250036934390664, "global_step": 68607, "epoch": 576, "lr": 3.821414335160367e-07} +{"train_loss": 0.0002480394614394754, "global_step": 68608, "epoch": 576, "lr": 3.8186809116976253e-07} +{"train_loss": 0.00026395669556222856, "global_step": 68609, "epoch": 576, "lr": 3.815948462433938e-07} +{"train_loss": 0.00015065373736433685, "global_step": 68610, "epoch": 576, "lr": 3.8132169873745795e-07} +{"train_loss": 0.0002904052962549031, "global_step": 68611, "epoch": 576, "lr": 3.810486486524989e-07} +{"train_loss": 0.00016554266039747745, "global_step": 68612, "epoch": 576, "lr": 3.8077569598904406e-07} +{"train_loss": 0.0002944173465948552, "global_step": 68613, "epoch": 576, "lr": 3.80502840747643e-07} +{"train_loss": 0.0002699407923500985, "global_step": 68614, "epoch": 576, "lr": 3.8023008292881746e-07} +{"train_loss": 0.00026290412642993033, "global_step": 68615, "epoch": 576, "lr": 3.7995742253311707e-07} +{"train_loss": 0.00021935917902737856, "global_step": 68616, "epoch": 576, "lr": 3.79684859561058e-07} +{"train_loss": 0.00015240442007780075, "global_step": 68617, "epoch": 576, "lr": 3.794123940131955e-07} +{"train_loss": 0.00019246838928665966, "global_step": 68618, "epoch": 576, "lr": 3.791400258900568e-07} +{"train_loss": 0.00018716893100645393, "global_step": 68619, "epoch": 576, "lr": 3.7886775519216934e-07} +{"train_loss": 0.00019985027029179037, "global_step": 68620, "epoch": 576, "lr": 3.7859558192007707e-07} +{"train_loss": 0.0002810595033224672, "global_step": 68621, "epoch": 576, "lr": 3.783235060743073e-07} +{"train_loss": 0.0002390304725850001, "global_step": 68622, "epoch": 576, "lr": 3.780515276554042e-07} +{"train_loss": 0.0002458931994624436, "global_step": 68623, "epoch": 576, "lr": 3.777796466638894e-07} +{"train_loss": 0.00022202933905646205, "global_step": 68624, "epoch": 576, "lr": 3.7750786310030705e-07} +{"train_loss": 0.00018238222401123494, "global_step": 68625, "epoch": 576, "lr": 3.772361769651844e-07} +{"train_loss": 0.0006235610926523805, "global_step": 68626, "epoch": 576, "lr": 3.7696458825906e-07} +{"train_loss": 0.0005460958345793188, "global_step": 68627, "epoch": 576, "lr": 3.7669309698246116e-07} +{"train_loss": 0.00017152298823930323, "global_step": 68628, "epoch": 576, "lr": 3.7642170313592075e-07} +{"train_loss": 0.0002495329827070236, "global_step": 68629, "epoch": 576, "lr": 3.761504067199828e-07} +{"train_loss": 0.0001964220282388851, "global_step": 68630, "epoch": 576, "lr": 3.7587920773516915e-07} +{"train_loss": 0.00033939964487217367, "global_step": 68631, "epoch": 576, "lr": 3.756081061820127e-07} +{"train_loss": 0.00014797326002735645, "global_step": 68632, "epoch": 576, "lr": 3.753371020610519e-07} +{"train_loss": 0.00041008091648109257, "global_step": 68633, "epoch": 576, "lr": 3.750661953728085e-07} +{"train_loss": 0.00016505963867530227, "global_step": 68634, "epoch": 576, "lr": 3.747953861178266e-07} +{"train_loss": 0.0006575759616680443, "global_step": 68635, "epoch": 576, "lr": 3.7452467429663354e-07} +{"train_loss": 0.00036288000410422683, "global_step": 68636, "epoch": 576, "lr": 3.742540599097566e-07} +{"train_loss": 0.00012099026935175061, "global_step": 68637, "epoch": 576, "lr": 3.7398354295772877e-07} +{"train_loss": 0.00016605205019004643, "global_step": 68638, "epoch": 576, "lr": 3.737131234410829e-07} +{"train_loss": 0.00023286184296011925, "global_step": 68639, "epoch": 576, "lr": 3.7344280136035194e-07} +{"train_loss": 0.00016933068400248885, "global_step": 68640, "epoch": 576, "lr": 3.731725767160632e-07} +{"train_loss": 0.00021749400184489787, "global_step": 68641, "epoch": 576, "lr": 3.7290244950874964e-07} +{"train_loss": 0.00013625173596665263, "global_step": 68642, "epoch": 576, "lr": 3.726324197389386e-07} +{"train_loss": 0.0002418290969217196, "global_step": 68643, "epoch": 576, "lr": 3.7236248740716297e-07} +{"train_loss": 0.00022429721138905734, "global_step": 68644, "epoch": 576, "lr": 3.720926525139501e-07} +{"train_loss": 0.00020055909408256412, "global_step": 68645, "epoch": 576, "lr": 3.7182291505982736e-07} +{"train_loss": 0.00017644559557083994, "global_step": 68646, "epoch": 576, "lr": 3.7155327504533324e-07} +{"train_loss": 0.0001826169027481228, "global_step": 68647, "epoch": 576, "lr": 3.71283732470995e-07} +{"train_loss": 0.0004234802327118814, "global_step": 68648, "epoch": 576, "lr": 3.7101428733733455e-07} +{"train_loss": 0.00018958233704324812, "global_step": 68649, "epoch": 576, "lr": 3.707449396448903e-07} +{"train_loss": 0.00023961954866535962, "global_step": 68650, "epoch": 576, "lr": 3.7047568939417853e-07} +{"train_loss": 0.00015241748769767582, "global_step": 68651, "epoch": 576, "lr": 3.702065365857432e-07} +{"train_loss": 0.00014235510025173426, "global_step": 68652, "epoch": 576, "lr": 3.699374812201006e-07} +{"train_loss": 0.00031308282632380724, "global_step": 68653, "epoch": 576, "lr": 3.696685232977837e-07} +{"train_loss": 0.0002446917351335287, "global_step": 68654, "epoch": 576, "lr": 3.6939966281932523e-07} +{"train_loss": 0.0003493050462566316, "global_step": 68655, "epoch": 576, "lr": 3.6913089978524163e-07} +{"train_loss": 0.00015805063594598323, "global_step": 68656, "epoch": 576, "lr": 3.688622341960712e-07} +{"train_loss": 0.00017058725643437356, "global_step": 68657, "epoch": 576, "lr": 3.685936660523359e-07} +{"train_loss": 0.00027764542028307915, "global_step": 68658, "epoch": 576, "lr": 3.683251953545686e-07} +{"train_loss": 0.00027975201373919845, "global_step": 68659, "epoch": 576, "lr": 3.680568221032854e-07} +{"train_loss": 0.0001788280060281977, "global_step": 68660, "epoch": 576, "lr": 3.677885462990249e-07} +{"train_loss": 0.00015013955999165773, "global_step": 68661, "epoch": 576, "lr": 3.6752036794231447e-07} +{"train_loss": 0.00025812229016862275, "global_step": 68662, "epoch": 576, "lr": 3.672522870336648e-07, "val_loss": 0.045195356011390686} +{"train_loss": 0.0002991118235513568, "global_step": 68663, "epoch": 577, "lr": 3.669843035736198e-07} +{"train_loss": 0.00018888359772972763, "global_step": 68664, "epoch": 577, "lr": 3.667164175626958e-07} +{"train_loss": 0.00012230702850501984, "global_step": 68665, "epoch": 577, "lr": 3.6644862900142016e-07} +{"train_loss": 0.00020207713532727212, "global_step": 68666, "epoch": 577, "lr": 3.6618093789032027e-07} +{"train_loss": 0.000262360175838694, "global_step": 68667, "epoch": 577, "lr": 3.659133442299234e-07} +{"train_loss": 0.00023845810210332274, "global_step": 68668, "epoch": 577, "lr": 3.65645848020757e-07} +{"train_loss": 0.0002127932821167633, "global_step": 68669, "epoch": 577, "lr": 3.6537844926333163e-07} +{"train_loss": 0.00025406116037629545, "global_step": 68670, "epoch": 577, "lr": 3.6511114795819146e-07} +{"train_loss": 0.0006338804960250854, "global_step": 68671, "epoch": 577, "lr": 3.6484394410585264e-07} +{"train_loss": 0.0002114602248184383, "global_step": 68672, "epoch": 577, "lr": 3.6457683770683704e-07} +{"train_loss": 0.0002639697049744427, "global_step": 68673, "epoch": 577, "lr": 3.6430982876167195e-07} +{"train_loss": 0.0003504752239678055, "global_step": 68674, "epoch": 577, "lr": 3.640429172708848e-07} +{"train_loss": 0.00027577896253205836, "global_step": 68675, "epoch": 577, "lr": 3.6377610323499176e-07} +{"train_loss": 0.00026489407173357904, "global_step": 68676, "epoch": 577, "lr": 3.635093866545258e-07} +{"train_loss": 0.00015837835962884128, "global_step": 68677, "epoch": 577, "lr": 3.6324276753000317e-07} +{"train_loss": 0.00015796285879332572, "global_step": 68678, "epoch": 577, "lr": 3.6297624586195123e-07} +{"train_loss": 0.0003622057556640357, "global_step": 68679, "epoch": 577, "lr": 3.6270982165089176e-07} +{"train_loss": 0.0003424375900067389, "global_step": 68680, "epoch": 577, "lr": 3.624434948973521e-07} +{"train_loss": 0.0002485040749888867, "global_step": 68681, "epoch": 577, "lr": 3.621772656018485e-07} +{"train_loss": 0.00028403583564795554, "global_step": 68682, "epoch": 577, "lr": 3.6191113376490836e-07} +{"train_loss": 0.00024182059860322624, "global_step": 68683, "epoch": 577, "lr": 3.616450993870535e-07} +{"train_loss": 0.00019624733249656856, "global_step": 68684, "epoch": 577, "lr": 3.6137916246880563e-07} +{"train_loss": 0.0003765618021134287, "global_step": 68685, "epoch": 577, "lr": 3.611133230106811e-07} +{"train_loss": 0.0007054713205434382, "global_step": 68686, "epoch": 577, "lr": 3.6084758101321283e-07} +{"train_loss": 0.0002573613601271063, "global_step": 68687, "epoch": 577, "lr": 3.60581936476917e-07} +{"train_loss": 0.00016614758351352066, "global_step": 68688, "epoch": 577, "lr": 3.6031638940231536e-07} +{"train_loss": 0.0002565170871093869, "global_step": 68689, "epoch": 577, "lr": 3.6005093978992987e-07} +{"train_loss": 0.00018029057537205517, "global_step": 68690, "epoch": 577, "lr": 3.597855876402767e-07} +{"train_loss": 0.00025473712594248354, "global_step": 68691, "epoch": 577, "lr": 3.595203329538832e-07} +{"train_loss": 0.00022899979376234114, "global_step": 68692, "epoch": 577, "lr": 3.592551757312712e-07} +{"train_loss": 0.0003144557704217732, "global_step": 68693, "epoch": 577, "lr": 3.5899011597295695e-07} +{"train_loss": 0.00012167834938736632, "global_step": 68694, "epoch": 577, "lr": 3.587251536794622e-07} +{"train_loss": 0.00022275617811828852, "global_step": 68695, "epoch": 577, "lr": 3.5846028885130335e-07} +{"train_loss": 0.0003536157018970698, "global_step": 68696, "epoch": 577, "lr": 3.581955214890076e-07} +{"train_loss": 0.00042224404751323164, "global_step": 68697, "epoch": 577, "lr": 3.5793085159309124e-07} +{"train_loss": 0.00047839092439971864, "global_step": 68698, "epoch": 577, "lr": 3.5766627916407616e-07} +{"train_loss": 0.00027553242398425937, "global_step": 68699, "epoch": 577, "lr": 3.574018042024785e-07} +{"train_loss": 0.00026330508990213275, "global_step": 68700, "epoch": 577, "lr": 3.5713742670881455e-07} +{"train_loss": 0.00034545609378255904, "global_step": 68701, "epoch": 577, "lr": 3.568731466836173e-07} +{"train_loss": 0.00037518885801546276, "global_step": 68702, "epoch": 577, "lr": 3.566089641273862e-07} +{"train_loss": 0.0001606071018613875, "global_step": 68703, "epoch": 577, "lr": 3.563448790406543e-07} +{"train_loss": 0.0003504643973428756, "global_step": 68704, "epoch": 577, "lr": 3.560808914239322e-07} +{"train_loss": 0.0001486188848502934, "global_step": 68705, "epoch": 577, "lr": 3.558170012777473e-07} +{"train_loss": 0.00026011999580077827, "global_step": 68706, "epoch": 577, "lr": 3.5555320860261034e-07} +{"train_loss": 0.0003180244530085474, "global_step": 68707, "epoch": 577, "lr": 3.5528951339903747e-07} +{"train_loss": 0.00014526359154842794, "global_step": 68708, "epoch": 577, "lr": 3.550259156675506e-07} +{"train_loss": 0.00017278772429563105, "global_step": 68709, "epoch": 577, "lr": 3.547624154086715e-07} +{"train_loss": 0.000392274116165936, "global_step": 68710, "epoch": 577, "lr": 3.544990126229053e-07} +{"train_loss": 0.0005644685006700456, "global_step": 68711, "epoch": 577, "lr": 3.5423570731078493e-07} +{"train_loss": 0.0003328270395286381, "global_step": 68712, "epoch": 577, "lr": 3.5397249947281e-07} +{"train_loss": 0.0002649032394401729, "global_step": 68713, "epoch": 577, "lr": 3.5370938910951333e-07} +{"train_loss": 0.00022753249504603446, "global_step": 68714, "epoch": 577, "lr": 3.534463762214002e-07} +{"train_loss": 0.0003443188325036317, "global_step": 68715, "epoch": 577, "lr": 3.531834608089923e-07} +{"train_loss": 0.0002143076271750033, "global_step": 68716, "epoch": 577, "lr": 3.52920642872806e-07} +{"train_loss": 0.00015043644816614687, "global_step": 68717, "epoch": 577, "lr": 3.526579224133575e-07} +{"train_loss": 0.0002513955987524241, "global_step": 68718, "epoch": 577, "lr": 3.5239529943115745e-07} +{"train_loss": 0.0002614717814140022, "global_step": 68719, "epoch": 577, "lr": 3.521327739267222e-07} +{"train_loss": 0.00025916873710229993, "global_step": 68720, "epoch": 577, "lr": 3.51870345900579e-07} +{"train_loss": 0.0005743782967329025, "global_step": 68721, "epoch": 577, "lr": 3.516080153532275e-07} +{"train_loss": 0.0002712077694013715, "global_step": 68722, "epoch": 577, "lr": 3.5134578228518957e-07} +{"train_loss": 0.0005541177815757692, "global_step": 68723, "epoch": 577, "lr": 3.5108364669698136e-07} +{"train_loss": 0.0003004599711857736, "global_step": 68724, "epoch": 577, "lr": 3.5082160858911917e-07} +{"train_loss": 0.0002383935498073697, "global_step": 68725, "epoch": 577, "lr": 3.505596679621137e-07} +{"train_loss": 0.00023173994850367308, "global_step": 68726, "epoch": 577, "lr": 3.5029782481647565e-07} +{"train_loss": 0.00017243452020920813, "global_step": 68727, "epoch": 577, "lr": 3.5003607915272686e-07} +{"train_loss": 0.00012802262790501118, "global_step": 68728, "epoch": 577, "lr": 3.49774430971378e-07} +{"train_loss": 0.0002849214361049235, "global_step": 68729, "epoch": 577, "lr": 3.495128802729453e-07} +{"train_loss": 0.0003955973079428077, "global_step": 68730, "epoch": 577, "lr": 3.492514270579339e-07} +{"train_loss": 0.00018171417468693107, "global_step": 68731, "epoch": 577, "lr": 3.4899007132686567e-07} +{"train_loss": 0.00022787479974795133, "global_step": 68732, "epoch": 577, "lr": 3.487288130802513e-07} +{"train_loss": 0.00014618277782574296, "global_step": 68733, "epoch": 577, "lr": 3.4846765231860144e-07} +{"train_loss": 0.00025972045841626823, "global_step": 68734, "epoch": 577, "lr": 3.482065890424324e-07} +{"train_loss": 0.00045205128844827414, "global_step": 68735, "epoch": 577, "lr": 3.479456232522549e-07} +{"train_loss": 0.00024131622922141105, "global_step": 68736, "epoch": 577, "lr": 3.476847549485851e-07} +{"train_loss": 0.0002191202947869897, "global_step": 68737, "epoch": 577, "lr": 3.474239841319282e-07} +{"train_loss": 0.00024367650621570647, "global_step": 68738, "epoch": 577, "lr": 3.471633108028005e-07} +{"train_loss": 0.00028819567523896694, "global_step": 68739, "epoch": 577, "lr": 3.4690273496171267e-07} +{"train_loss": 0.0006298224907368422, "global_step": 68740, "epoch": 577, "lr": 3.4664225660917537e-07} +{"train_loss": 0.00032139604445546865, "global_step": 68741, "epoch": 577, "lr": 3.463818757457049e-07} +{"train_loss": 0.00020551102352328598, "global_step": 68742, "epoch": 577, "lr": 3.4612159237180086e-07} +{"train_loss": 0.0001619544200366363, "global_step": 68743, "epoch": 577, "lr": 3.458614064879906e-07} +{"train_loss": 0.00017107442545238882, "global_step": 68744, "epoch": 577, "lr": 3.456013180947737e-07} +{"train_loss": 0.0003622205404099077, "global_step": 68745, "epoch": 577, "lr": 3.4534132719266086e-07} +{"train_loss": 0.00020471868629101664, "global_step": 68746, "epoch": 577, "lr": 3.4508143378217397e-07} +{"train_loss": 0.00021963527251500636, "global_step": 68747, "epoch": 577, "lr": 3.4482163786380695e-07} +{"train_loss": 0.0002661912585608661, "global_step": 68748, "epoch": 577, "lr": 3.445619394380817e-07} +{"train_loss": 0.00015729173901490867, "global_step": 68749, "epoch": 577, "lr": 3.443023385055033e-07} +{"train_loss": 0.00020468482398428023, "global_step": 68750, "epoch": 577, "lr": 3.440428350665825e-07} +{"train_loss": 0.00031214868067763746, "global_step": 68751, "epoch": 577, "lr": 3.437834291218245e-07} +{"train_loss": 0.00023789731494616717, "global_step": 68752, "epoch": 577, "lr": 3.435241206717454e-07} +{"train_loss": 0.00020329192921053618, "global_step": 68753, "epoch": 577, "lr": 3.432649097168561e-07} +{"train_loss": 0.00030739401699975133, "global_step": 68754, "epoch": 577, "lr": 3.4300579625765604e-07} +{"train_loss": 0.00027089350624009967, "global_step": 68755, "epoch": 577, "lr": 3.427467802946616e-07} +{"train_loss": 0.00014598725829273462, "global_step": 68756, "epoch": 577, "lr": 3.424878618283778e-07} +{"train_loss": 0.00012374403013382107, "global_step": 68757, "epoch": 577, "lr": 3.422290408593154e-07} +{"train_loss": 0.00022162105597089976, "global_step": 68758, "epoch": 577, "lr": 3.419703173879796e-07} +{"train_loss": 0.00023897715436760336, "global_step": 68759, "epoch": 577, "lr": 3.41711691414881e-07} +{"train_loss": 0.00020319194300100207, "global_step": 68760, "epoch": 577, "lr": 3.4145316294052486e-07} +{"train_loss": 0.00019445577345322818, "global_step": 68761, "epoch": 577, "lr": 3.4119473196542185e-07} +{"train_loss": 0.00010371689131716266, "global_step": 68762, "epoch": 577, "lr": 3.4093639849007705e-07} +{"train_loss": 0.0002419371739961207, "global_step": 68763, "epoch": 577, "lr": 3.406781625149957e-07} +{"train_loss": 0.00013506201503332704, "global_step": 68764, "epoch": 577, "lr": 3.404200240406885e-07} +{"train_loss": 0.0001451941061532125, "global_step": 68765, "epoch": 577, "lr": 3.401619830676661e-07} +{"train_loss": 0.0002563354792073369, "global_step": 68766, "epoch": 577, "lr": 3.399040395964226e-07} +{"train_loss": 0.00036591090611182153, "global_step": 68767, "epoch": 577, "lr": 3.3964619362747974e-07} +{"train_loss": 0.00020159452105872333, "global_step": 68768, "epoch": 577, "lr": 3.393884451613316e-07} +{"train_loss": 0.0003272511821705848, "global_step": 68769, "epoch": 577, "lr": 3.391307941984889e-07} +{"train_loss": 0.00021843281865585595, "global_step": 68770, "epoch": 577, "lr": 3.388732407394568e-07} +{"train_loss": 0.0001525516709079966, "global_step": 68771, "epoch": 577, "lr": 3.3861578478474596e-07} +{"train_loss": 0.00017623916210141033, "global_step": 68772, "epoch": 577, "lr": 3.3835842633485603e-07} +{"train_loss": 0.0002951304486487061, "global_step": 68773, "epoch": 577, "lr": 3.3810116539028656e-07} +{"train_loss": 0.00021545625349972397, "global_step": 68774, "epoch": 577, "lr": 3.3784400195155943e-07} +{"train_loss": 0.00022122880909591913, "global_step": 68775, "epoch": 577, "lr": 3.37586936019163e-07} +{"train_loss": 0.00026760841137729585, "global_step": 68776, "epoch": 577, "lr": 3.3732996759361366e-07} +{"train_loss": 0.0001954682229552418, "global_step": 68777, "epoch": 577, "lr": 3.37073096675411e-07} +{"train_loss": 0.00026318628806620836, "global_step": 68778, "epoch": 577, "lr": 3.368163232650545e-07} +{"train_loss": 0.0002626813657116145, "global_step": 68779, "epoch": 577, "lr": 3.3655964736306054e-07} +{"train_loss": 0.00019291041826363653, "global_step": 68780, "epoch": 577, "lr": 3.363030689699176e-07} +{"train_loss": 0.00026376749143814434, "global_step": 68781, "epoch": 577, "lr": 3.3604658808614744e-07, "val_loss": 0.012160795740783215} +{"train_loss": 0.000191854007425718, "global_step": 68782, "epoch": 578, "lr": 3.357902047122385e-07} +{"train_loss": 0.0001636151282582432, "global_step": 68783, "epoch": 578, "lr": 3.3553391884870167e-07} +{"train_loss": 0.0002940978156402707, "global_step": 68784, "epoch": 578, "lr": 3.352777304960364e-07} +{"train_loss": 0.00018458884733263403, "global_step": 68785, "epoch": 578, "lr": 3.3502163965474785e-07} +{"train_loss": 0.0004811456019524485, "global_step": 68786, "epoch": 578, "lr": 3.347656463253357e-07} +{"train_loss": 0.00025490246480330825, "global_step": 68787, "epoch": 578, "lr": 3.3450975050831055e-07} +{"train_loss": 0.00015278956561814994, "global_step": 68788, "epoch": 578, "lr": 3.3425395220416655e-07} +{"train_loss": 0.00022765525500290096, "global_step": 68789, "epoch": 578, "lr": 3.339982514134088e-07} +{"train_loss": 0.0001495469332439825, "global_step": 68790, "epoch": 578, "lr": 3.3374264813654245e-07} +{"train_loss": 0.00022210278257261962, "global_step": 68791, "epoch": 578, "lr": 3.334871423740615e-07} +{"train_loss": 0.00032753098639659584, "global_step": 68792, "epoch": 578, "lr": 3.332317341264768e-07} +{"train_loss": 0.00021792107145301998, "global_step": 68793, "epoch": 578, "lr": 3.3297642339428225e-07} +{"train_loss": 0.00019947973487433046, "global_step": 68794, "epoch": 578, "lr": 3.327212101779831e-07} +{"train_loss": 0.00029292641556821764, "global_step": 68795, "epoch": 578, "lr": 3.3246609447807887e-07} +{"train_loss": 0.0001631070044822991, "global_step": 68796, "epoch": 578, "lr": 3.3221107629507475e-07} +{"train_loss": 0.0001160769970738329, "global_step": 68797, "epoch": 578, "lr": 3.319561556294648e-07} +{"train_loss": 0.0002683458151295781, "global_step": 68798, "epoch": 578, "lr": 3.3170133248175417e-07} +{"train_loss": 0.00020854226022493094, "global_step": 68799, "epoch": 578, "lr": 3.3144660685244246e-07} +{"train_loss": 0.0003276253992225975, "global_step": 68800, "epoch": 578, "lr": 3.3119197874202926e-07} +{"train_loss": 0.00020875847258139402, "global_step": 68801, "epoch": 578, "lr": 3.3093744815101415e-07} +{"train_loss": 0.00013244987349025905, "global_step": 68802, "epoch": 578, "lr": 3.3068301507989117e-07} +{"train_loss": 0.00016918971959967166, "global_step": 68803, "epoch": 578, "lr": 3.3042867952917113e-07} +{"train_loss": 0.0003035542322322726, "global_step": 68804, "epoch": 578, "lr": 3.3017444149934796e-07} +{"train_loss": 0.00020239506557118148, "global_step": 68805, "epoch": 578, "lr": 3.299203009909213e-07} +{"train_loss": 0.00021256056788843125, "global_step": 68806, "epoch": 578, "lr": 3.2966625800438524e-07} +{"train_loss": 0.00028883034246973693, "global_step": 68807, "epoch": 578, "lr": 3.294123125402504e-07} +{"train_loss": 0.0003019530267920345, "global_step": 68808, "epoch": 578, "lr": 3.291584645989998e-07} +{"train_loss": 0.00028346723411232233, "global_step": 68809, "epoch": 578, "lr": 3.289047141811441e-07} +{"train_loss": 0.00017497055523563176, "global_step": 68810, "epoch": 578, "lr": 3.2865106128717737e-07} +{"train_loss": 0.00029417668702080846, "global_step": 68811, "epoch": 578, "lr": 3.283975059175992e-07} +{"train_loss": 0.0002522811701055616, "global_step": 68812, "epoch": 578, "lr": 3.2814404807290364e-07} +{"train_loss": 0.00015653614536859095, "global_step": 68813, "epoch": 578, "lr": 3.2789068775359035e-07} +{"train_loss": 0.00015992813860066235, "global_step": 68814, "epoch": 578, "lr": 3.276374249601588e-07} +{"train_loss": 0.00020775143639184535, "global_step": 68815, "epoch": 578, "lr": 3.2738425969310313e-07} +{"train_loss": 0.00012624735245481133, "global_step": 68816, "epoch": 578, "lr": 3.2713119195292294e-07} +{"train_loss": 0.0002614844706840813, "global_step": 68817, "epoch": 578, "lr": 3.268782217401123e-07} +{"train_loss": 0.00015800161054357886, "global_step": 68818, "epoch": 578, "lr": 3.266253490551707e-07} +{"train_loss": 0.00023725893697701395, "global_step": 68819, "epoch": 578, "lr": 3.263725738985923e-07} +{"train_loss": 0.00014315421867650002, "global_step": 68820, "epoch": 578, "lr": 3.261198962708767e-07} +{"train_loss": 0.0002966900065075606, "global_step": 68821, "epoch": 578, "lr": 3.2586731617251234e-07} +{"train_loss": 0.0003425416653044522, "global_step": 68822, "epoch": 578, "lr": 3.256148336040099e-07} +{"train_loss": 0.0002883162524085492, "global_step": 68823, "epoch": 578, "lr": 3.2536244856584684e-07} +{"train_loss": 0.00028477306477725506, "global_step": 68824, "epoch": 578, "lr": 3.251101610585339e-07} +{"train_loss": 0.0001624593569431454, "global_step": 68825, "epoch": 578, "lr": 3.2485797108255946e-07} +{"train_loss": 0.00014140631537884474, "global_step": 68826, "epoch": 578, "lr": 3.246058786384121e-07} +{"train_loss": 0.00014535468653775752, "global_step": 68827, "epoch": 578, "lr": 3.2435388372660246e-07} +{"train_loss": 0.00027506606420502067, "global_step": 68828, "epoch": 578, "lr": 3.241019863476136e-07} +{"train_loss": 0.00020873612083960325, "global_step": 68829, "epoch": 578, "lr": 3.2385018650194497e-07} +{"train_loss": 0.00017981846758630127, "global_step": 68830, "epoch": 578, "lr": 3.235984841900852e-07} +{"train_loss": 0.00014408817514777184, "global_step": 68831, "epoch": 578, "lr": 3.2334687941253385e-07} +{"train_loss": 0.00023248807701747864, "global_step": 68832, "epoch": 578, "lr": 3.230953721697905e-07} +{"train_loss": 0.0002255948056699708, "global_step": 68833, "epoch": 578, "lr": 3.228439624623325e-07} +{"train_loss": 0.00014965928858146071, "global_step": 68834, "epoch": 578, "lr": 3.2259265029067064e-07} +{"train_loss": 0.0003831689537037164, "global_step": 68835, "epoch": 578, "lr": 3.2234143565528785e-07} +{"train_loss": 0.00013151078019291162, "global_step": 68836, "epoch": 578, "lr": 3.2209031855667814e-07} +{"train_loss": 0.00019030981638934463, "global_step": 68837, "epoch": 578, "lr": 3.2183929899534113e-07} +{"train_loss": 0.0002774793829303235, "global_step": 68838, "epoch": 578, "lr": 3.2158837697176537e-07} +{"train_loss": 0.00039682252099737525, "global_step": 68839, "epoch": 578, "lr": 3.213375524864393e-07} +{"train_loss": 0.00027695068274624646, "global_step": 68840, "epoch": 578, "lr": 3.210868255398625e-07} +{"train_loss": 0.0002770057471934706, "global_step": 68841, "epoch": 578, "lr": 3.2083619613252346e-07} +{"train_loss": 0.0003882039454765618, "global_step": 68842, "epoch": 578, "lr": 3.205856642649163e-07} +{"train_loss": 0.00021146793733350933, "global_step": 68843, "epoch": 578, "lr": 3.203352299375295e-07} +{"train_loss": 0.00017861108062788844, "global_step": 68844, "epoch": 578, "lr": 3.200848931508571e-07} +{"train_loss": 0.00022451768745668232, "global_step": 68845, "epoch": 578, "lr": 3.198346539053876e-07} +{"train_loss": 0.00039268951513804495, "global_step": 68846, "epoch": 578, "lr": 3.1958451220162054e-07} +{"train_loss": 0.0004389180103316903, "global_step": 68847, "epoch": 578, "lr": 3.19334468040039e-07} +{"train_loss": 0.000262083689449355, "global_step": 68848, "epoch": 578, "lr": 3.190845214211424e-07} +{"train_loss": 0.00040814621024765074, "global_step": 68849, "epoch": 578, "lr": 3.188346723454083e-07} +{"train_loss": 0.0002889455354306847, "global_step": 68850, "epoch": 578, "lr": 3.185849208133362e-07} +{"train_loss": 0.0005619594012387097, "global_step": 68851, "epoch": 578, "lr": 3.183352668254203e-07} +{"train_loss": 0.000362071004929021, "global_step": 68852, "epoch": 578, "lr": 3.1808571038213776e-07} +{"train_loss": 0.00014665450726170093, "global_step": 68853, "epoch": 578, "lr": 3.178362514839939e-07} +{"train_loss": 0.0003349759499542415, "global_step": 68854, "epoch": 578, "lr": 3.1758689013146605e-07} +{"train_loss": 0.00024658552138134837, "global_step": 68855, "epoch": 578, "lr": 3.173376263250483e-07} +{"train_loss": 0.00014481291873380542, "global_step": 68856, "epoch": 578, "lr": 3.1708846006523463e-07} +{"train_loss": 0.0002610826923046261, "global_step": 68857, "epoch": 578, "lr": 3.168393913525025e-07} +{"train_loss": 0.00014920298417564481, "global_step": 68858, "epoch": 578, "lr": 3.165904201873515e-07} +{"train_loss": 0.0002133408997906372, "global_step": 68859, "epoch": 578, "lr": 3.1634154657027016e-07} +{"train_loss": 0.00016505066014360636, "global_step": 68860, "epoch": 578, "lr": 3.1609277050174135e-07} +{"train_loss": 0.0003349243779666722, "global_step": 68861, "epoch": 578, "lr": 3.158440919822592e-07} +{"train_loss": 0.0001660381822148338, "global_step": 68862, "epoch": 578, "lr": 3.1559551101230656e-07} +{"train_loss": 0.00040117473690770566, "global_step": 68863, "epoch": 578, "lr": 3.1534702759237756e-07} +{"train_loss": 0.0002751988358795643, "global_step": 68864, "epoch": 578, "lr": 3.1509864172294956e-07} +{"train_loss": 0.00026325316866859794, "global_step": 68865, "epoch": 578, "lr": 3.1485035340452774e-07} +{"train_loss": 0.00040416454430669546, "global_step": 68866, "epoch": 578, "lr": 3.1460216263757835e-07} +{"train_loss": 0.0003270288580097258, "global_step": 68867, "epoch": 578, "lr": 3.143540694226066e-07} +{"train_loss": 0.0002451891195960343, "global_step": 68868, "epoch": 578, "lr": 3.1410607376008983e-07} +{"train_loss": 0.0004543076502159238, "global_step": 68869, "epoch": 578, "lr": 3.1385817565051657e-07} +{"train_loss": 0.00017439780640415847, "global_step": 68870, "epoch": 578, "lr": 3.1361037509438086e-07} +{"train_loss": 0.00026880003861151636, "global_step": 68871, "epoch": 578, "lr": 3.1336267209215454e-07} +{"train_loss": 0.00020195644174236804, "global_step": 68872, "epoch": 578, "lr": 3.131150666443372e-07} +{"train_loss": 0.00018882137374021113, "global_step": 68873, "epoch": 578, "lr": 3.128675587514118e-07} +{"train_loss": 0.00020038135698996484, "global_step": 68874, "epoch": 578, "lr": 3.126201484138558e-07} +{"train_loss": 0.0001612019696040079, "global_step": 68875, "epoch": 578, "lr": 3.123728356321687e-07} +{"train_loss": 0.00020568240142893046, "global_step": 68876, "epoch": 578, "lr": 3.121256204068224e-07} +{"train_loss": 0.00016595896158833057, "global_step": 68877, "epoch": 578, "lr": 3.118785027383164e-07} +{"train_loss": 0.00032367988023906946, "global_step": 68878, "epoch": 578, "lr": 3.1163148262712273e-07} +{"train_loss": 0.00035206269240006804, "global_step": 68879, "epoch": 578, "lr": 3.113845600737353e-07} +{"train_loss": 0.00027872680220752954, "global_step": 68880, "epoch": 578, "lr": 3.1113773507863706e-07} +{"train_loss": 0.0002840623783413321, "global_step": 68881, "epoch": 578, "lr": 3.1089100764231107e-07} +{"train_loss": 0.0003319872485008091, "global_step": 68882, "epoch": 578, "lr": 3.1064437776524014e-07} +{"train_loss": 0.00025987240951508284, "global_step": 68883, "epoch": 578, "lr": 3.103978454479073e-07} +{"train_loss": 0.00035896440385840833, "global_step": 68884, "epoch": 578, "lr": 3.1015141069080655e-07} +{"train_loss": 0.0002349143906030804, "global_step": 68885, "epoch": 578, "lr": 3.0990507349440976e-07} +{"train_loss": 0.00016100269567687064, "global_step": 68886, "epoch": 578, "lr": 3.0965883385921104e-07} +{"train_loss": 0.00029584846924990416, "global_step": 68887, "epoch": 578, "lr": 3.094126917856877e-07} +{"train_loss": 0.000443010067101568, "global_step": 68888, "epoch": 578, "lr": 3.091666472743171e-07} +{"train_loss": 0.00034581913496367633, "global_step": 68889, "epoch": 578, "lr": 3.089207003255934e-07} +{"train_loss": 0.00021350753377191722, "global_step": 68890, "epoch": 578, "lr": 3.0867485093999946e-07} +{"train_loss": 0.0002536323736421764, "global_step": 68891, "epoch": 578, "lr": 3.0842909911800723e-07} +{"train_loss": 0.0002781339280772954, "global_step": 68892, "epoch": 578, "lr": 3.081834448601051e-07} +{"train_loss": 0.00019643068662844598, "global_step": 68893, "epoch": 578, "lr": 3.079378881667816e-07} +{"train_loss": 0.00021397923410404474, "global_step": 68894, "epoch": 578, "lr": 3.0769242903851416e-07} +{"train_loss": 0.000237947708228603, "global_step": 68895, "epoch": 578, "lr": 3.074470674757801e-07} +{"train_loss": 0.0003168435941915959, "global_step": 68896, "epoch": 578, "lr": 3.072018034790625e-07} +{"train_loss": 0.000288368493784219, "global_step": 68897, "epoch": 578, "lr": 3.069566370488497e-07} +{"train_loss": 0.0003394018276594579, "global_step": 68898, "epoch": 578, "lr": 3.0671156818561366e-07} +{"train_loss": 0.00022189279843587428, "global_step": 68899, "epoch": 578, "lr": 3.064665968898428e-07} +{"train_loss": 0.000254223973868403, "global_step": 68900, "epoch": 578, "lr": 3.0622172316202015e-07, "val_loss": 0.02258499339222908} +{"train_loss": 0.0003750486939679831, "global_step": 68901, "epoch": 579, "lr": 3.0597694700261747e-07} +{"train_loss": 0.0003968131204601377, "global_step": 68902, "epoch": 579, "lr": 3.0573226841212334e-07} +{"train_loss": 0.00032239063875749707, "global_step": 68903, "epoch": 579, "lr": 3.054876873910095e-07} +{"train_loss": 0.0004375852004159242, "global_step": 68904, "epoch": 579, "lr": 3.052432039397646e-07} +{"train_loss": 0.0003252003516536206, "global_step": 68905, "epoch": 579, "lr": 3.0499881805886587e-07} +{"train_loss": 0.00019227004668209702, "global_step": 68906, "epoch": 579, "lr": 3.0475452974879083e-07} +{"train_loss": 0.0002495210792403668, "global_step": 68907, "epoch": 579, "lr": 3.045103390100279e-07} +{"train_loss": 0.00019683779100887477, "global_step": 68908, "epoch": 579, "lr": 3.042662458430434e-07} +{"train_loss": 0.00029424435342662036, "global_step": 68909, "epoch": 579, "lr": 3.0402225024832587e-07} +{"train_loss": 0.00014315545558929443, "global_step": 68910, "epoch": 579, "lr": 3.037783522263471e-07} +{"train_loss": 0.0001991895551327616, "global_step": 68911, "epoch": 579, "lr": 3.0353455177759007e-07} +{"train_loss": 0.0007227588794194162, "global_step": 68912, "epoch": 579, "lr": 3.0329084890253766e-07} +{"train_loss": 0.00027552590472623706, "global_step": 68913, "epoch": 579, "lr": 3.0304724360166736e-07} +{"train_loss": 0.00022634353081230074, "global_step": 68914, "epoch": 579, "lr": 3.0280373587544543e-07} +{"train_loss": 0.00019105190585833043, "global_step": 68915, "epoch": 579, "lr": 3.025603257243659e-07} +{"train_loss": 0.00020532324560917914, "global_step": 68916, "epoch": 579, "lr": 3.0231701314889504e-07} +{"train_loss": 0.00035032787127420306, "global_step": 68917, "epoch": 579, "lr": 3.020737981495214e-07} +{"train_loss": 0.00022756142425350845, "global_step": 68918, "epoch": 579, "lr": 3.0183068072671126e-07} +{"train_loss": 0.0002905239525716752, "global_step": 68919, "epoch": 579, "lr": 3.015876608809476e-07} +{"train_loss": 0.00017183135787490755, "global_step": 68920, "epoch": 579, "lr": 3.013447386127133e-07} +{"train_loss": 0.00017138541443273425, "global_step": 68921, "epoch": 579, "lr": 3.0110191392246914e-07} +{"train_loss": 0.0001759369479259476, "global_step": 68922, "epoch": 579, "lr": 3.008591868107091e-07} +{"train_loss": 0.00017734381253831089, "global_step": 68923, "epoch": 579, "lr": 3.006165572778996e-07} +{"train_loss": 0.00013954541645944118, "global_step": 68924, "epoch": 579, "lr": 3.0037402532452355e-07} +{"train_loss": 0.00022192002506926656, "global_step": 68925, "epoch": 579, "lr": 3.001315909510527e-07} +{"train_loss": 0.00024032487999647856, "global_step": 68926, "epoch": 579, "lr": 2.99889254157959e-07} +{"train_loss": 0.0004681923892349005, "global_step": 68927, "epoch": 579, "lr": 2.9964701494572534e-07} +{"train_loss": 0.00029374691075645387, "global_step": 68928, "epoch": 579, "lr": 2.994048733148236e-07} +{"train_loss": 0.00027871766360476613, "global_step": 68929, "epoch": 579, "lr": 2.991628292657367e-07} +{"train_loss": 0.0002183079777751118, "global_step": 68930, "epoch": 579, "lr": 2.989208827989254e-07} +{"train_loss": 0.00026043326943181455, "global_step": 68931, "epoch": 579, "lr": 2.986790339148782e-07} +{"train_loss": 0.00031435448909178376, "global_step": 68932, "epoch": 579, "lr": 2.984372826140669e-07} +{"train_loss": 0.0001519872312201187, "global_step": 68933, "epoch": 579, "lr": 2.9819562889695784e-07} +{"train_loss": 0.00032672000816091895, "global_step": 68934, "epoch": 579, "lr": 2.9795407276403954e-07} +{"train_loss": 0.0002925895096268505, "global_step": 68935, "epoch": 579, "lr": 2.977126142157727e-07} +{"train_loss": 0.0002152075758203864, "global_step": 68936, "epoch": 579, "lr": 2.9747125325264025e-07} +{"train_loss": 0.00016633904306218028, "global_step": 68937, "epoch": 579, "lr": 2.972299898751085e-07} +{"train_loss": 0.00027910247445106506, "global_step": 68938, "epoch": 579, "lr": 2.969888240836605e-07} +{"train_loss": 0.00017017916252370924, "global_step": 68939, "epoch": 579, "lr": 2.9674775587876234e-07} +{"train_loss": 0.0002986099570989609, "global_step": 68940, "epoch": 579, "lr": 2.965067852608916e-07} +{"train_loss": 0.00018332109902985394, "global_step": 68941, "epoch": 579, "lr": 2.9626591223052e-07} +{"train_loss": 0.00021054770331829786, "global_step": 68942, "epoch": 579, "lr": 2.960251367881195e-07} +{"train_loss": 0.0004481748037505895, "global_step": 68943, "epoch": 579, "lr": 2.9578445893416187e-07} +{"train_loss": 0.00014632810780312866, "global_step": 68944, "epoch": 579, "lr": 2.9554387866912447e-07} +{"train_loss": 0.0003236000193282962, "global_step": 68945, "epoch": 579, "lr": 2.9530339599347365e-07} +{"train_loss": 0.0002056904777418822, "global_step": 68946, "epoch": 579, "lr": 2.9506301090768687e-07} +{"train_loss": 0.0002451263426337391, "global_step": 68947, "epoch": 579, "lr": 2.9482272341223026e-07} +{"train_loss": 0.00030581688042730093, "global_step": 68948, "epoch": 579, "lr": 2.945825335075814e-07} +{"train_loss": 0.0005960778216831386, "global_step": 68949, "epoch": 579, "lr": 2.943424411942064e-07} +{"train_loss": 0.00020056571520399302, "global_step": 68950, "epoch": 579, "lr": 2.9410244647258276e-07} +{"train_loss": 0.00021436512179207057, "global_step": 68951, "epoch": 579, "lr": 2.938625493431824e-07} +{"train_loss": 0.0001712312368908897, "global_step": 68952, "epoch": 579, "lr": 2.9362274980646586e-07} +{"train_loss": 0.0007208223105408251, "global_step": 68953, "epoch": 579, "lr": 2.933830478629163e-07} +{"train_loss": 0.0001776551071088761, "global_step": 68954, "epoch": 579, "lr": 2.9314344351299427e-07} +{"train_loss": 0.00014725509390700608, "global_step": 68955, "epoch": 579, "lr": 2.9290393675717733e-07} +{"train_loss": 0.00023268134100362659, "global_step": 68956, "epoch": 579, "lr": 2.926645275959372e-07} +{"train_loss": 0.00019858103769365698, "global_step": 68957, "epoch": 579, "lr": 2.9242521602972915e-07} +{"train_loss": 0.0002979871060233563, "global_step": 68958, "epoch": 579, "lr": 2.9218600205904166e-07} +{"train_loss": 0.000187191428267397, "global_step": 68959, "epoch": 579, "lr": 2.919468856843355e-07} +{"train_loss": 0.00018161608022637665, "global_step": 68960, "epoch": 579, "lr": 2.9170786690607686e-07} +{"train_loss": 0.00020445595146156847, "global_step": 68961, "epoch": 579, "lr": 2.9146894572474324e-07} +{"train_loss": 0.00019732193322852254, "global_step": 68962, "epoch": 579, "lr": 2.912301221408009e-07} +{"train_loss": 0.0002115387178491801, "global_step": 68963, "epoch": 579, "lr": 2.9099139615471615e-07} +{"train_loss": 0.0002563287562225014, "global_step": 68964, "epoch": 579, "lr": 2.9075276776695526e-07} +{"train_loss": 0.00018846002058126032, "global_step": 68965, "epoch": 579, "lr": 2.905142369779956e-07} +{"train_loss": 0.0003205831744708121, "global_step": 68966, "epoch": 579, "lr": 2.90275803788298e-07} +{"train_loss": 0.0002643185143824667, "global_step": 68967, "epoch": 579, "lr": 2.9003746819833424e-07} +{"train_loss": 0.0001519543002359569, "global_step": 68968, "epoch": 579, "lr": 2.897992302085761e-07} +{"train_loss": 0.00024540774757042527, "global_step": 68969, "epoch": 579, "lr": 2.8956108981947895e-07} +{"train_loss": 0.00018597148300614208, "global_step": 68970, "epoch": 579, "lr": 2.8932304703152004e-07} +{"train_loss": 0.0001556476199766621, "global_step": 68971, "epoch": 579, "lr": 2.890851018451657e-07} +{"train_loss": 0.0002407018473604694, "global_step": 68972, "epoch": 579, "lr": 2.8884725426087666e-07} +{"train_loss": 0.0004435263981577009, "global_step": 68973, "epoch": 579, "lr": 2.886095042791304e-07} +{"train_loss": 0.0001690869394224137, "global_step": 68974, "epoch": 579, "lr": 2.883718519003875e-07} +{"train_loss": 0.0001991112803807482, "global_step": 68975, "epoch": 579, "lr": 2.8813429712511444e-07} +{"train_loss": 0.000205894437385723, "global_step": 68976, "epoch": 579, "lr": 2.878968399537829e-07} +{"train_loss": 0.00028229079907760024, "global_step": 68977, "epoch": 579, "lr": 2.876594803868482e-07} +{"train_loss": 0.0004445524828042835, "global_step": 68978, "epoch": 579, "lr": 2.8742221842478767e-07} +{"train_loss": 0.00024196392041631043, "global_step": 68979, "epoch": 579, "lr": 2.871850540680621e-07} +{"train_loss": 0.00020244292682036757, "global_step": 68980, "epoch": 579, "lr": 2.869479873171377e-07} +{"train_loss": 0.00041443650843575597, "global_step": 68981, "epoch": 579, "lr": 2.867110181724808e-07} +{"train_loss": 0.0005637552822008729, "global_step": 68982, "epoch": 579, "lr": 2.8647414663455775e-07} +{"train_loss": 0.00017100988770835102, "global_step": 68983, "epoch": 579, "lr": 2.8623737270382365e-07} +{"train_loss": 0.0002356496697757393, "global_step": 68984, "epoch": 579, "lr": 2.86000696380756e-07} +{"train_loss": 0.0002043109998339787, "global_step": 68985, "epoch": 579, "lr": 2.857641176658155e-07} +{"train_loss": 0.0002620983577799052, "global_step": 68986, "epoch": 579, "lr": 2.855276365594683e-07} +{"train_loss": 0.00042586951167322695, "global_step": 68987, "epoch": 579, "lr": 2.852912530621754e-07} +{"train_loss": 0.00017573336663190275, "global_step": 68988, "epoch": 579, "lr": 2.850549671743974e-07} +{"train_loss": 0.00045503073488362134, "global_step": 68989, "epoch": 579, "lr": 2.848187788966061e-07} +{"train_loss": 0.00023568097094539553, "global_step": 68990, "epoch": 579, "lr": 2.845826882292568e-07} +{"train_loss": 0.0002165543264709413, "global_step": 68991, "epoch": 579, "lr": 2.8434669517282686e-07} +{"train_loss": 0.00016785346087999642, "global_step": 68992, "epoch": 579, "lr": 2.841107997277659e-07} +{"train_loss": 0.0001839613978518173, "global_step": 68993, "epoch": 579, "lr": 2.838750018945402e-07} +{"train_loss": 0.000169090781128034, "global_step": 68994, "epoch": 579, "lr": 2.8363930167361605e-07} +{"train_loss": 0.0005157779669389129, "global_step": 68995, "epoch": 579, "lr": 2.834036990654543e-07} +{"train_loss": 0.0001750103838276118, "global_step": 68996, "epoch": 579, "lr": 2.831681940705211e-07} +{"train_loss": 0.00023037548817228526, "global_step": 68997, "epoch": 579, "lr": 2.829327866892717e-07} +{"train_loss": 0.0002243471099063754, "global_step": 68998, "epoch": 579, "lr": 2.8269747692217796e-07} +{"train_loss": 0.0003473071556072682, "global_step": 68999, "epoch": 579, "lr": 2.8246226476968953e-07} +{"train_loss": 0.00030390892061404884, "global_step": 69000, "epoch": 579, "lr": 2.822271502322782e-07} +{"train_loss": 0.0001916082837851718, "global_step": 69001, "epoch": 579, "lr": 2.8199213331040476e-07} +{"train_loss": 0.0002543394220992923, "global_step": 69002, "epoch": 579, "lr": 2.817572140045244e-07} +{"train_loss": 0.00011235818965360522, "global_step": 69003, "epoch": 579, "lr": 2.8152239231510334e-07} +{"train_loss": 0.0001571820757817477, "global_step": 69004, "epoch": 579, "lr": 2.812876682426024e-07} +{"train_loss": 0.00016318142297677696, "global_step": 69005, "epoch": 579, "lr": 2.8105304178748236e-07} +{"train_loss": 0.00023021615925244987, "global_step": 69006, "epoch": 579, "lr": 2.8081851295019833e-07} +{"train_loss": 0.00021302432287484407, "global_step": 69007, "epoch": 579, "lr": 2.805840817312166e-07} +{"train_loss": 0.00016759759455453604, "global_step": 69008, "epoch": 579, "lr": 2.80349748130998e-07} +{"train_loss": 0.00022718236141372472, "global_step": 69009, "epoch": 579, "lr": 2.8011551214999765e-07} +{"train_loss": 0.0002755310561042279, "global_step": 69010, "epoch": 579, "lr": 2.7988137378868185e-07} +{"train_loss": 0.0005788530688732862, "global_step": 69011, "epoch": 579, "lr": 2.796473330475058e-07} +{"train_loss": 0.00022107061522547156, "global_step": 69012, "epoch": 579, "lr": 2.794133899269358e-07} +{"train_loss": 0.00019763570162467659, "global_step": 69013, "epoch": 579, "lr": 2.7917954442742143e-07} +{"train_loss": 0.00013979477807879448, "global_step": 69014, "epoch": 579, "lr": 2.7894579654942357e-07} +{"train_loss": 0.00025553005980327725, "global_step": 69015, "epoch": 579, "lr": 2.7871214629340834e-07} +{"train_loss": 0.0001725343317957595, "global_step": 69016, "epoch": 579, "lr": 2.7847859365982556e-07} +{"train_loss": 0.00021595352154690772, "global_step": 69017, "epoch": 579, "lr": 2.7824513864914137e-07} +{"train_loss": 0.00017583365843165666, "global_step": 69018, "epoch": 579, "lr": 2.7801178126181104e-07} +{"train_loss": 0.0002589081311324502, "global_step": 69019, "epoch": 579, "lr": 2.7777852149828976e-07, "val_loss": 0.01780928485095501} +{"train_loss": 0.00018948384968098253, "global_step": 69020, "epoch": 580, "lr": 2.775453593590438e-07} +{"train_loss": 0.0001713555830065161, "global_step": 69021, "epoch": 580, "lr": 2.7731229484451726e-07} +{"train_loss": 0.00027146731736138463, "global_step": 69022, "epoch": 580, "lr": 2.77079327955182e-07} +{"train_loss": 0.00022303653531707823, "global_step": 69023, "epoch": 580, "lr": 2.7684645869148764e-07} +{"train_loss": 0.0002660214377101511, "global_step": 69024, "epoch": 580, "lr": 2.766136870538949e-07} +{"train_loss": 0.00021480345458257943, "global_step": 69025, "epoch": 580, "lr": 2.7638101304285903e-07} +{"train_loss": 0.00024120297166518867, "global_step": 69026, "epoch": 580, "lr": 2.761484366588352e-07} +{"train_loss": 0.00021050225768703967, "global_step": 69027, "epoch": 580, "lr": 2.7591595790227855e-07} +{"train_loss": 0.0001700767024885863, "global_step": 69028, "epoch": 580, "lr": 2.7568357677364987e-07} +{"train_loss": 0.000127789840917103, "global_step": 69029, "epoch": 580, "lr": 2.7545129327340993e-07} +{"train_loss": 0.00012897291162516922, "global_step": 69030, "epoch": 580, "lr": 2.752191074020027e-07} +{"train_loss": 0.00017663145263213664, "global_step": 69031, "epoch": 580, "lr": 2.7498701915989466e-07} +{"train_loss": 0.00013059406774118543, "global_step": 69032, "epoch": 580, "lr": 2.747550285475353e-07} +{"train_loss": 0.0004759596777148545, "global_step": 69033, "epoch": 580, "lr": 2.7452313556538543e-07} +{"train_loss": 0.00030280594364739954, "global_step": 69034, "epoch": 580, "lr": 2.742913402138947e-07} +{"train_loss": 0.0002638797741383314, "global_step": 69035, "epoch": 580, "lr": 2.740596424935182e-07} +{"train_loss": 0.0002730301639530808, "global_step": 69036, "epoch": 580, "lr": 2.7382804240471684e-07} +{"train_loss": 0.00022088155674282461, "global_step": 69037, "epoch": 580, "lr": 2.7359653994793454e-07} +{"train_loss": 0.00030140846502035856, "global_step": 69038, "epoch": 580, "lr": 2.733651351236377e-07} +{"train_loss": 0.0002663354389369488, "global_step": 69039, "epoch": 580, "lr": 2.7313382793227593e-07} +{"train_loss": 0.00038790571852587163, "global_step": 69040, "epoch": 580, "lr": 2.729026183743044e-07} +{"train_loss": 0.00025383196771144867, "global_step": 69041, "epoch": 580, "lr": 2.7267150645017835e-07} +{"train_loss": 0.0002525115851312876, "global_step": 69042, "epoch": 580, "lr": 2.7244049216034186e-07} +{"train_loss": 0.00031214134651236236, "global_step": 69043, "epoch": 580, "lr": 2.7220957550526116e-07} +{"train_loss": 0.00013940637290943414, "global_step": 69044, "epoch": 580, "lr": 2.7197875648538595e-07} +{"train_loss": 0.00017338509496767074, "global_step": 69045, "epoch": 580, "lr": 2.717480351011603e-07} +{"train_loss": 0.00016030909318942577, "global_step": 69046, "epoch": 580, "lr": 2.7151741135305055e-07} +{"train_loss": 0.00029020116198807955, "global_step": 69047, "epoch": 580, "lr": 2.7128688524150626e-07} +{"train_loss": 0.0002328653063159436, "global_step": 69048, "epoch": 580, "lr": 2.7105645676697155e-07} +{"train_loss": 0.00013405020581558347, "global_step": 69049, "epoch": 580, "lr": 2.708261259299072e-07} +{"train_loss": 0.00020239946024958044, "global_step": 69050, "epoch": 580, "lr": 2.7059589273076283e-07} +{"train_loss": 0.00021597754675894976, "global_step": 69051, "epoch": 580, "lr": 2.7036575716999355e-07} +{"train_loss": 0.0002674431598279625, "global_step": 69052, "epoch": 580, "lr": 2.701357192480436e-07} +{"train_loss": 0.0003196526668034494, "global_step": 69053, "epoch": 580, "lr": 2.699057789653736e-07} +{"train_loss": 0.00017319356265943497, "global_step": 69054, "epoch": 580, "lr": 2.696759363224222e-07} +{"train_loss": 0.00019235095533076674, "global_step": 69055, "epoch": 580, "lr": 2.694461913196611e-07} +{"train_loss": 0.00022273774084169418, "global_step": 69056, "epoch": 580, "lr": 2.692165439575234e-07} +{"train_loss": 0.0002341352665098384, "global_step": 69057, "epoch": 580, "lr": 2.689869942364642e-07} +{"train_loss": 0.000135577138280496, "global_step": 69058, "epoch": 580, "lr": 2.687575421569388e-07} +{"train_loss": 0.0001409130491083488, "global_step": 69059, "epoch": 580, "lr": 2.6852818771939125e-07} +{"train_loss": 0.0002119477721862495, "global_step": 69060, "epoch": 580, "lr": 2.6829893092428227e-07} +{"train_loss": 0.0001805455394787714, "global_step": 69061, "epoch": 580, "lr": 2.6806977177205037e-07} +{"train_loss": 0.00015546628856100142, "global_step": 69062, "epoch": 580, "lr": 2.678407102631508e-07} +{"train_loss": 0.0003177816979587078, "global_step": 69063, "epoch": 580, "lr": 2.676117463980332e-07} +{"train_loss": 0.0001763909385772422, "global_step": 69064, "epoch": 580, "lr": 2.6738288017714717e-07} +{"train_loss": 0.00013467106327880174, "global_step": 69065, "epoch": 580, "lr": 2.671541116009424e-07} +{"train_loss": 0.0003204992972314358, "global_step": 69066, "epoch": 580, "lr": 2.669254406698685e-07} +{"train_loss": 0.0002885417197830975, "global_step": 69067, "epoch": 580, "lr": 2.666968673843695e-07} +{"train_loss": 0.0001699076674412936, "global_step": 69068, "epoch": 580, "lr": 2.664683917449007e-07} +{"train_loss": 0.0001975888735614717, "global_step": 69069, "epoch": 580, "lr": 2.662400137519061e-07} +{"train_loss": 0.00048136303666979074, "global_step": 69070, "epoch": 580, "lr": 2.660117334058354e-07} +{"train_loss": 0.000376138516003266, "global_step": 69071, "epoch": 580, "lr": 2.6578355070714376e-07} +{"train_loss": 0.00043375472887419164, "global_step": 69072, "epoch": 580, "lr": 2.655554656562642e-07} +{"train_loss": 0.00016089572454802692, "global_step": 69073, "epoch": 580, "lr": 2.6532747825365743e-07} +{"train_loss": 0.00018016729154624045, "global_step": 69074, "epoch": 580, "lr": 2.650995884997676e-07} +{"train_loss": 0.00030172703554853797, "global_step": 69075, "epoch": 580, "lr": 2.6487179639503866e-07} +{"train_loss": 0.00018452761287335306, "global_step": 69076, "epoch": 580, "lr": 2.646441019399204e-07} +{"train_loss": 0.00013068143744021654, "global_step": 69077, "epoch": 580, "lr": 2.6441650513486793e-07} +{"train_loss": 0.0005393742467276752, "global_step": 69078, "epoch": 580, "lr": 2.641890059803087e-07} +{"train_loss": 0.00021952108363620937, "global_step": 69079, "epoch": 580, "lr": 2.63961604476709e-07} +{"train_loss": 0.00022668359451927245, "global_step": 69080, "epoch": 580, "lr": 2.637343006245019e-07} +{"train_loss": 0.00027907660114578903, "global_step": 69081, "epoch": 580, "lr": 2.6350709442414243e-07} +{"train_loss": 0.00014234492846298963, "global_step": 69082, "epoch": 580, "lr": 2.632799858760748e-07} +{"train_loss": 0.00019544675888027996, "global_step": 69083, "epoch": 580, "lr": 2.630529749807376e-07} +{"train_loss": 0.00014966951857786626, "global_step": 69084, "epoch": 580, "lr": 2.628260617385858e-07} +{"train_loss": 0.000609385606367141, "global_step": 69085, "epoch": 580, "lr": 2.625992461500637e-07} +{"train_loss": 0.00025160174118354917, "global_step": 69086, "epoch": 580, "lr": 2.6237252821560975e-07} +{"train_loss": 0.00021793969790451229, "global_step": 69087, "epoch": 580, "lr": 2.621459079356736e-07} +{"train_loss": 0.0005229650414548814, "global_step": 69088, "epoch": 580, "lr": 2.619193853107049e-07} +{"train_loss": 0.00018590845866128802, "global_step": 69089, "epoch": 580, "lr": 2.616929603411422e-07} +{"train_loss": 0.0002841404639184475, "global_step": 69090, "epoch": 580, "lr": 2.6146663302742956e-07} +{"train_loss": 0.0003215642354916781, "global_step": 69091, "epoch": 580, "lr": 2.6124040337001666e-07} +{"train_loss": 0.000180130431544967, "global_step": 69092, "epoch": 580, "lr": 2.6101427136933645e-07} +{"train_loss": 0.0001813318522181362, "global_step": 69093, "epoch": 580, "lr": 2.6078823702584965e-07} +{"train_loss": 0.00025034937425516546, "global_step": 69094, "epoch": 580, "lr": 2.605623003399893e-07} +{"train_loss": 0.00016059656627476215, "global_step": 69095, "epoch": 580, "lr": 2.6033646131219944e-07} +{"train_loss": 0.0002191316307289526, "global_step": 69096, "epoch": 580, "lr": 2.6011071994292426e-07} +{"train_loss": 0.00034694408532232046, "global_step": 69097, "epoch": 580, "lr": 2.598850762326077e-07} +{"train_loss": 0.00020567368483170867, "global_step": 69098, "epoch": 580, "lr": 2.59659530181694e-07} +{"train_loss": 0.0004859748878516257, "global_step": 69099, "epoch": 580, "lr": 2.5943408179062714e-07} +{"train_loss": 0.00022854935377836227, "global_step": 69100, "epoch": 580, "lr": 2.592087310598457e-07} +{"train_loss": 0.000199267320567742, "global_step": 69101, "epoch": 580, "lr": 2.589834779897937e-07} +{"train_loss": 0.00035988405579701066, "global_step": 69102, "epoch": 580, "lr": 2.5875832258090983e-07} +{"train_loss": 0.000188725272892043, "global_step": 69103, "epoch": 580, "lr": 2.5853326483364915e-07} +{"train_loss": 0.00045214686542749405, "global_step": 69104, "epoch": 580, "lr": 2.583083047484336e-07} +{"train_loss": 0.00026468545547686517, "global_step": 69105, "epoch": 580, "lr": 2.5808344232571835e-07} +{"train_loss": 0.00012862859875895083, "global_step": 69106, "epoch": 580, "lr": 2.578586775659475e-07} +{"train_loss": 0.0003338585956953466, "global_step": 69107, "epoch": 580, "lr": 2.5763401046955404e-07} +{"train_loss": 0.0003025232581421733, "global_step": 69108, "epoch": 580, "lr": 2.5740944103698205e-07} +{"train_loss": 0.0002722219505812973, "global_step": 69109, "epoch": 580, "lr": 2.5718496926867007e-07} +{"train_loss": 0.00028180598746985197, "global_step": 69110, "epoch": 580, "lr": 2.569605951650622e-07} +{"train_loss": 0.0004475947062019259, "global_step": 69111, "epoch": 580, "lr": 2.5673631872660254e-07} +{"train_loss": 0.0001698841224424541, "global_step": 69112, "epoch": 580, "lr": 2.5651213995372404e-07} +{"train_loss": 0.00016538290947210044, "global_step": 69113, "epoch": 580, "lr": 2.5628805884686526e-07} +{"train_loss": 0.00024393960484303534, "global_step": 69114, "epoch": 580, "lr": 2.560640754064758e-07} +{"train_loss": 0.0002429356100037694, "global_step": 69115, "epoch": 580, "lr": 2.558401896329887e-07} +{"train_loss": 0.0002129262575181201, "global_step": 69116, "epoch": 580, "lr": 2.556164015268425e-07} +{"train_loss": 0.00020112133643124253, "global_step": 69117, "epoch": 580, "lr": 2.5539271108848127e-07} +{"train_loss": 0.00032790604745969176, "global_step": 69118, "epoch": 580, "lr": 2.551691183183436e-07} +{"train_loss": 0.0002487543097231537, "global_step": 69119, "epoch": 580, "lr": 2.549456232168679e-07} +{"train_loss": 0.00025808834470808506, "global_step": 69120, "epoch": 580, "lr": 2.5472222578448726e-07} +{"train_loss": 0.0003872521920129657, "global_step": 69121, "epoch": 580, "lr": 2.544989260216457e-07} +{"train_loss": 0.0002100566343870014, "global_step": 69122, "epoch": 580, "lr": 2.542757239287874e-07} +{"train_loss": 0.00040394312236458063, "global_step": 69123, "epoch": 580, "lr": 2.5405261950633417e-07} +{"train_loss": 0.00024140001914929599, "global_step": 69124, "epoch": 580, "lr": 2.5382961275474126e-07} +{"train_loss": 0.00025163142709061503, "global_step": 69125, "epoch": 580, "lr": 2.5360670367444163e-07} +{"train_loss": 0.000483353971503675, "global_step": 69126, "epoch": 580, "lr": 2.5338389226586267e-07} +{"train_loss": 0.00020857046183664352, "global_step": 69127, "epoch": 580, "lr": 2.531611785294541e-07} +{"train_loss": 0.0003609111299738288, "global_step": 69128, "epoch": 580, "lr": 2.5293856246564886e-07} +{"train_loss": 0.00022435981372836977, "global_step": 69129, "epoch": 580, "lr": 2.527160440748855e-07} +{"train_loss": 0.00029058693326078355, "global_step": 69130, "epoch": 580, "lr": 2.5249362335759695e-07} +{"train_loss": 0.00026734027778729796, "global_step": 69131, "epoch": 580, "lr": 2.522713003142219e-07} +{"train_loss": 0.0001299115247093141, "global_step": 69132, "epoch": 580, "lr": 2.520490749451987e-07} +{"train_loss": 0.0007371220272034407, "global_step": 69133, "epoch": 580, "lr": 2.5182694725096045e-07} +{"train_loss": 0.0009500503656454384, "global_step": 69134, "epoch": 580, "lr": 2.516049172319457e-07} +{"train_loss": 0.0003300213429611176, "global_step": 69135, "epoch": 580, "lr": 2.5138298488859293e-07} +{"train_loss": 0.00012001154391327873, "global_step": 69136, "epoch": 580, "lr": 2.5116115022133513e-07} +{"train_loss": 0.00017233104154001921, "global_step": 69137, "epoch": 580, "lr": 2.509394132305998e-07} +{"train_loss": 0.00026352727814321213, "global_step": 69138, "epoch": 580, "lr": 2.507177739168365e-07, "val_loss": 0.05224117264151573, "train_action_mse_error": 3.6360040667204885e-06} +{"train_loss": 0.0002961828140541911, "global_step": 69139, "epoch": 581, "lr": 2.504962322804727e-07} +{"train_loss": 0.00020788228721357882, "global_step": 69140, "epoch": 581, "lr": 2.5027478832194693e-07} +{"train_loss": 0.0002652019902598113, "global_step": 69141, "epoch": 581, "lr": 2.5005344204168666e-07} +{"train_loss": 0.00032621072023175657, "global_step": 69142, "epoch": 581, "lr": 2.4983219344013597e-07} +{"train_loss": 0.00034964369842782617, "global_step": 69143, "epoch": 581, "lr": 2.4961104251772225e-07} +{"train_loss": 0.0001476436445955187, "global_step": 69144, "epoch": 581, "lr": 2.493899892748841e-07} +{"train_loss": 0.00021431263303384185, "global_step": 69145, "epoch": 581, "lr": 2.491690337120489e-07} +{"train_loss": 0.00017459575610700995, "global_step": 69146, "epoch": 581, "lr": 2.489481758296608e-07} +{"train_loss": 0.00012447134940885007, "global_step": 69147, "epoch": 581, "lr": 2.4872741562814716e-07} +{"train_loss": 0.00018788369197864085, "global_step": 69148, "epoch": 581, "lr": 2.4850675310794103e-07} +{"train_loss": 0.00041882615187205374, "global_step": 69149, "epoch": 581, "lr": 2.482861882694754e-07} +{"train_loss": 0.0003067290526814759, "global_step": 69150, "epoch": 581, "lr": 2.480657211131887e-07} +{"train_loss": 0.0004530847363639623, "global_step": 69151, "epoch": 581, "lr": 2.4784535163950295e-07} +{"train_loss": 0.0003200970822945237, "global_step": 69152, "epoch": 581, "lr": 2.4762507984886216e-07} +{"train_loss": 0.00032632576767355204, "global_step": 69153, "epoch": 581, "lr": 2.474049057416938e-07} +{"train_loss": 0.0005827125278301537, "global_step": 69154, "epoch": 581, "lr": 2.471848293184309e-07} +{"train_loss": 0.00027810968458652496, "global_step": 69155, "epoch": 581, "lr": 2.469648505795064e-07} +{"train_loss": 0.00017017876962199807, "global_step": 69156, "epoch": 581, "lr": 2.4674496952534765e-07} +{"train_loss": 0.00019722087017726153, "global_step": 69157, "epoch": 581, "lr": 2.465251861563933e-07} +{"train_loss": 0.00021308660507202148, "global_step": 69158, "epoch": 581, "lr": 2.463055004730708e-07} +{"train_loss": 0.00041252735536545515, "global_step": 69159, "epoch": 581, "lr": 2.4608591247580747e-07} +{"train_loss": 0.0003643837117124349, "global_step": 69160, "epoch": 581, "lr": 2.458664221650475e-07} +{"train_loss": 0.0001915252214530483, "global_step": 69161, "epoch": 581, "lr": 2.4564702954120165e-07} +{"train_loss": 0.000337158766342327, "global_step": 69162, "epoch": 581, "lr": 2.454277346047251e-07} +{"train_loss": 0.00029882663511671126, "global_step": 69163, "epoch": 581, "lr": 2.4520853735602864e-07} +{"train_loss": 0.00042558563291095197, "global_step": 69164, "epoch": 581, "lr": 2.4498943779555086e-07} +{"train_loss": 0.0001934798783622682, "global_step": 69165, "epoch": 581, "lr": 2.4477043592371905e-07} +{"train_loss": 0.0001737030252115801, "global_step": 69166, "epoch": 581, "lr": 2.4455153174096637e-07} +{"train_loss": 0.0002905108267441392, "global_step": 69167, "epoch": 581, "lr": 2.443327252477201e-07} +{"train_loss": 0.0003423267335165292, "global_step": 69168, "epoch": 581, "lr": 2.4411401644441335e-07} +{"train_loss": 0.00027522590244188905, "global_step": 69169, "epoch": 581, "lr": 2.438954053314735e-07} +{"train_loss": 0.00017457014473620802, "global_step": 69170, "epoch": 581, "lr": 2.4367689190932795e-07} +{"train_loss": 0.00014184527390170842, "global_step": 69171, "epoch": 581, "lr": 2.434584761784042e-07} +{"train_loss": 0.00020713060803245753, "global_step": 69172, "epoch": 581, "lr": 2.4324015813913526e-07} +{"train_loss": 0.00021952914539724588, "global_step": 69173, "epoch": 581, "lr": 2.4302193779195405e-07} +{"train_loss": 0.00031361347646452487, "global_step": 69174, "epoch": 581, "lr": 2.428038151372769e-07} +{"train_loss": 0.0002261573390569538, "global_step": 69175, "epoch": 581, "lr": 2.4258579017554237e-07} +{"train_loss": 0.00022075281594879925, "global_step": 69176, "epoch": 581, "lr": 2.423678629071724e-07} +{"train_loss": 0.000244064605794847, "global_step": 69177, "epoch": 581, "lr": 2.4215003333259987e-07} +{"train_loss": 0.00016783172031864524, "global_step": 69178, "epoch": 581, "lr": 2.4193230145224675e-07} +{"train_loss": 0.00024405728618148714, "global_step": 69179, "epoch": 581, "lr": 2.41714667266546e-07} +{"train_loss": 0.00036910895141772926, "global_step": 69180, "epoch": 581, "lr": 2.4149713077592506e-07} +{"train_loss": 0.0003804243460763246, "global_step": 69181, "epoch": 581, "lr": 2.412796919808058e-07} +{"train_loss": 0.00020324456272646785, "global_step": 69182, "epoch": 581, "lr": 2.410623508816157e-07} +{"train_loss": 0.0003415732062421739, "global_step": 69183, "epoch": 581, "lr": 2.408451074787876e-07} +{"train_loss": 0.00014727041707374156, "global_step": 69184, "epoch": 581, "lr": 2.406279617727436e-07} +{"train_loss": 0.00022553784947376698, "global_step": 69185, "epoch": 581, "lr": 2.4041091376390545e-07} +{"train_loss": 0.00020885678532067686, "global_step": 69186, "epoch": 581, "lr": 2.401939634527117e-07} +{"train_loss": 0.00018540924065746367, "global_step": 69187, "epoch": 581, "lr": 2.3997711083957875e-07} +{"train_loss": 0.00025926437228918076, "global_step": 69188, "epoch": 581, "lr": 2.3976035592493397e-07} +{"train_loss": 0.0003604397352319211, "global_step": 69189, "epoch": 581, "lr": 2.395436987092048e-07} +{"train_loss": 0.0001288820058107376, "global_step": 69190, "epoch": 581, "lr": 2.3932713919281314e-07} +{"train_loss": 0.00023596521350555122, "global_step": 69191, "epoch": 581, "lr": 2.3911067737618644e-07} +{"train_loss": 0.00030399218667298555, "global_step": 69192, "epoch": 581, "lr": 2.388943132597521e-07} +{"train_loss": 0.00015348225133493543, "global_step": 69193, "epoch": 581, "lr": 2.3867804684393204e-07} +{"train_loss": 0.0001756996935000643, "global_step": 69194, "epoch": 581, "lr": 2.3846187812914813e-07} +{"train_loss": 0.00034880131715908647, "global_step": 69195, "epoch": 581, "lr": 2.3824580711583333e-07} +{"train_loss": 0.00024135885178111494, "global_step": 69196, "epoch": 581, "lr": 2.3802983380440403e-07} +{"train_loss": 0.0006573697319254279, "global_step": 69197, "epoch": 581, "lr": 2.3781395819528206e-07} +{"train_loss": 0.00020164409943390638, "global_step": 69198, "epoch": 581, "lr": 2.3759818028890602e-07} +{"train_loss": 0.0002729599073063582, "global_step": 69199, "epoch": 581, "lr": 2.3738250008568108e-07} +{"train_loss": 0.0002130247448803857, "global_step": 69200, "epoch": 581, "lr": 2.371669175860458e-07} +{"train_loss": 0.0002105466992361471, "global_step": 69201, "epoch": 581, "lr": 2.3695143279041099e-07} +{"train_loss": 0.00030640512704849243, "global_step": 69202, "epoch": 581, "lr": 2.367360456992096e-07} +{"train_loss": 0.0003740111133083701, "global_step": 69203, "epoch": 581, "lr": 2.3652075631285796e-07} +{"train_loss": 0.000196149674593471, "global_step": 69204, "epoch": 581, "lr": 2.3630556463178354e-07} +{"train_loss": 0.0003198697813786566, "global_step": 69205, "epoch": 581, "lr": 2.3609047065640265e-07} +{"train_loss": 0.0002282968198414892, "global_step": 69206, "epoch": 581, "lr": 2.358754743871483e-07} +{"train_loss": 0.00017217161075677723, "global_step": 69207, "epoch": 581, "lr": 2.3566057582443125e-07} +{"train_loss": 0.0001980147644644603, "global_step": 69208, "epoch": 581, "lr": 2.3544577496867893e-07} +{"train_loss": 0.00027762746321968734, "global_step": 69209, "epoch": 581, "lr": 2.3523107182031323e-07} +{"train_loss": 0.0002625800552777946, "global_step": 69210, "epoch": 581, "lr": 2.350164663797505e-07} +{"train_loss": 0.0005032981280237436, "global_step": 69211, "epoch": 581, "lr": 2.3480195864742372e-07} +{"train_loss": 0.00015557551523670554, "global_step": 69212, "epoch": 581, "lr": 2.3458754862374366e-07} +{"train_loss": 0.00012113288539694622, "global_step": 69213, "epoch": 581, "lr": 2.343732363091322e-07} +{"train_loss": 0.00013636378571391106, "global_step": 69214, "epoch": 581, "lr": 2.3415902170401127e-07} +{"train_loss": 0.00022396183339878917, "global_step": 69215, "epoch": 581, "lr": 2.3394490480880827e-07} +{"train_loss": 0.0001803176273824647, "global_step": 69216, "epoch": 581, "lr": 2.3373088562393397e-07} +{"train_loss": 0.00021461611322592944, "global_step": 69217, "epoch": 581, "lr": 2.3351696414981028e-07} +{"train_loss": 0.0002058387326542288, "global_step": 69218, "epoch": 581, "lr": 2.3330314038685907e-07} +{"train_loss": 0.00015784986317157745, "global_step": 69219, "epoch": 581, "lr": 2.330894143355078e-07} +{"train_loss": 0.00031408690847456455, "global_step": 69220, "epoch": 581, "lr": 2.3287578599616166e-07} +{"train_loss": 0.00018789473688229918, "global_step": 69221, "epoch": 581, "lr": 2.3266225536924813e-07} +{"train_loss": 0.00026522003463469446, "global_step": 69222, "epoch": 581, "lr": 2.3244882245518906e-07} +{"train_loss": 0.0004718707059510052, "global_step": 69223, "epoch": 581, "lr": 2.3223548725439526e-07} +{"train_loss": 0.00022270334011409432, "global_step": 69224, "epoch": 581, "lr": 2.3202224976729415e-07} +{"train_loss": 0.00035560684045776725, "global_step": 69225, "epoch": 581, "lr": 2.3180910999429651e-07} +{"train_loss": 0.0008943899301812053, "global_step": 69226, "epoch": 581, "lr": 2.3159606793582978e-07} +{"train_loss": 0.0001943055831361562, "global_step": 69227, "epoch": 581, "lr": 2.3138312359230475e-07} +{"train_loss": 0.00012596008309628814, "global_step": 69228, "epoch": 581, "lr": 2.3117027696413773e-07} +{"train_loss": 0.00013560921070165932, "global_step": 69229, "epoch": 581, "lr": 2.3095752805175618e-07} +{"train_loss": 0.00014458635996561497, "global_step": 69230, "epoch": 581, "lr": 2.307448768555709e-07} +{"train_loss": 0.0003117377054877579, "global_step": 69231, "epoch": 581, "lr": 2.3053232337599816e-07} +{"train_loss": 0.00015304698899853975, "global_step": 69232, "epoch": 581, "lr": 2.3031986761345991e-07} +{"train_loss": 0.00015457799599971622, "global_step": 69233, "epoch": 581, "lr": 2.3010750956837245e-07} +{"train_loss": 0.0002525426389183849, "global_step": 69234, "epoch": 581, "lr": 2.2989524924115214e-07} +{"train_loss": 0.00021372576884459704, "global_step": 69235, "epoch": 581, "lr": 2.2968308663221528e-07} +{"train_loss": 0.0002705940860323608, "global_step": 69236, "epoch": 581, "lr": 2.294710217419782e-07} +{"train_loss": 0.00041279307333752513, "global_step": 69237, "epoch": 581, "lr": 2.2925905457085728e-07} +{"train_loss": 0.00014605796604882926, "global_step": 69238, "epoch": 581, "lr": 2.290471851192688e-07} +{"train_loss": 0.000278649473330006, "global_step": 69239, "epoch": 581, "lr": 2.2883541338762916e-07} +{"train_loss": 0.00037590734427794814, "global_step": 69240, "epoch": 581, "lr": 2.286237393763546e-07} +{"train_loss": 0.00024931388907134533, "global_step": 69241, "epoch": 581, "lr": 2.28412163085856e-07} +{"train_loss": 0.00025680006365291774, "global_step": 69242, "epoch": 581, "lr": 2.282006845165552e-07} +{"train_loss": 0.0002488951140549034, "global_step": 69243, "epoch": 581, "lr": 2.279893036688685e-07} +{"train_loss": 0.0004775316047016531, "global_step": 69244, "epoch": 581, "lr": 2.2777802054320674e-07} +{"train_loss": 0.0001404639333486557, "global_step": 69245, "epoch": 581, "lr": 2.2756683513998066e-07} +{"train_loss": 0.00014118495164439082, "global_step": 69246, "epoch": 581, "lr": 2.2735574745961773e-07} +{"train_loss": 0.00022228668967727572, "global_step": 69247, "epoch": 581, "lr": 2.2714475750251763e-07} +{"train_loss": 0.0001909288257593289, "global_step": 69248, "epoch": 581, "lr": 2.269338652691022e-07} +{"train_loss": 0.000252593687037006, "global_step": 69249, "epoch": 581, "lr": 2.2672307075978228e-07} +{"train_loss": 0.0005861145327799022, "global_step": 69250, "epoch": 581, "lr": 2.265123739749797e-07} +{"train_loss": 0.0002567158662714064, "global_step": 69251, "epoch": 581, "lr": 2.2630177491509973e-07} +{"train_loss": 0.00016338351997546852, "global_step": 69252, "epoch": 581, "lr": 2.260912735805587e-07} +{"train_loss": 0.0001699506101431325, "global_step": 69253, "epoch": 581, "lr": 2.2588086997177293e-07} +{"train_loss": 0.0002112302026944235, "global_step": 69254, "epoch": 581, "lr": 2.2567056408914767e-07} +{"train_loss": 0.0007124554831534624, "global_step": 69255, "epoch": 581, "lr": 2.2546035593310478e-07} +{"train_loss": 0.00017966856830753386, "global_step": 69256, "epoch": 581, "lr": 2.252502455040495e-07} +{"train_loss": 0.0002672321401206784, "global_step": 69257, "epoch": 581, "lr": 2.250402328024037e-07, "val_loss": 0.019172346219420433} +{"train_loss": 0.000270760094281286, "global_step": 69258, "epoch": 582, "lr": 2.2483031782856712e-07} +{"train_loss": 0.00023760992917232215, "global_step": 69259, "epoch": 582, "lr": 2.2462050058296158e-07} +{"train_loss": 0.000135460591991432, "global_step": 69260, "epoch": 582, "lr": 2.2441078106599235e-07} +{"train_loss": 0.00023307297669816762, "global_step": 69261, "epoch": 582, "lr": 2.2420115927808127e-07} +{"train_loss": 0.00032796087907627225, "global_step": 69262, "epoch": 582, "lr": 2.2399163521962808e-07} +{"train_loss": 0.00013433142157737166, "global_step": 69263, "epoch": 582, "lr": 2.2378220889105462e-07} +{"train_loss": 0.00025615436607040465, "global_step": 69264, "epoch": 582, "lr": 2.2357288029276058e-07} +{"train_loss": 0.00017327094974461943, "global_step": 69265, "epoch": 582, "lr": 2.2336364942516786e-07} +{"train_loss": 0.00019718454859685153, "global_step": 69266, "epoch": 582, "lr": 2.2315451628868167e-07} +{"train_loss": 0.0002945655141957104, "global_step": 69267, "epoch": 582, "lr": 2.2294548088371282e-07} +{"train_loss": 0.0002267795061925426, "global_step": 69268, "epoch": 582, "lr": 2.2273654321067205e-07} +{"train_loss": 0.00018495024414733052, "global_step": 69269, "epoch": 582, "lr": 2.2252770326997018e-07} +{"train_loss": 0.000367092463420704, "global_step": 69270, "epoch": 582, "lr": 2.22318961062018e-07} +{"train_loss": 0.0002984048333019018, "global_step": 69271, "epoch": 582, "lr": 2.2211031658722624e-07} +{"train_loss": 0.0005693965358659625, "global_step": 69272, "epoch": 582, "lr": 2.219017698460002e-07} +{"train_loss": 0.00011252842523390427, "global_step": 69273, "epoch": 582, "lr": 2.216933208387506e-07} +{"train_loss": 0.00027915657847188413, "global_step": 69274, "epoch": 582, "lr": 2.214849695658938e-07} +{"train_loss": 0.00018955675477627665, "global_step": 69275, "epoch": 582, "lr": 2.212767160278295e-07} +{"train_loss": 0.00013522981316782534, "global_step": 69276, "epoch": 582, "lr": 2.2106856022496848e-07} +{"train_loss": 0.0002132340014213696, "global_step": 69277, "epoch": 582, "lr": 2.20860502157727e-07} +{"train_loss": 0.00017174897948279977, "global_step": 69278, "epoch": 582, "lr": 2.2065254182650485e-07} +{"train_loss": 0.0003200491482857615, "global_step": 69279, "epoch": 582, "lr": 2.2044467923171276e-07} +{"train_loss": 0.00022620413801632822, "global_step": 69280, "epoch": 582, "lr": 2.2023691437375593e-07} +{"train_loss": 0.00029032223392277956, "global_step": 69281, "epoch": 582, "lr": 2.2002924725305074e-07} +{"train_loss": 0.00034951980342157185, "global_step": 69282, "epoch": 582, "lr": 2.198216778700024e-07} +{"train_loss": 0.00019076208991464227, "global_step": 69283, "epoch": 582, "lr": 2.196142062250106e-07} +{"train_loss": 0.00012734773918054998, "global_step": 69284, "epoch": 582, "lr": 2.194068323184917e-07} +{"train_loss": 0.00021002624998800457, "global_step": 69285, "epoch": 582, "lr": 2.191995561508453e-07} +{"train_loss": 0.00021625208319164813, "global_step": 69286, "epoch": 582, "lr": 2.1899237772248226e-07} +{"train_loss": 0.00025402067694813013, "global_step": 69287, "epoch": 582, "lr": 2.1878529703381335e-07} +{"train_loss": 0.00022215886565390974, "global_step": 69288, "epoch": 582, "lr": 2.185783140852382e-07} +{"train_loss": 0.0002618319122120738, "global_step": 69289, "epoch": 582, "lr": 2.1837142887716766e-07} +{"train_loss": 0.0002915320510510355, "global_step": 69290, "epoch": 582, "lr": 2.1816464141000692e-07} +{"train_loss": 0.00033073575468733907, "global_step": 69291, "epoch": 582, "lr": 2.1795795168416122e-07} +{"train_loss": 0.00018224699306301773, "global_step": 69292, "epoch": 582, "lr": 2.1775135970003579e-07} +{"train_loss": 0.00022336095571517944, "global_step": 69293, "epoch": 582, "lr": 2.1754486545803587e-07} +{"train_loss": 0.00025331589858978987, "global_step": 69294, "epoch": 582, "lr": 2.1733846895857224e-07} +{"train_loss": 0.000252560421358794, "global_step": 69295, "epoch": 582, "lr": 2.1713217020203903e-07} +{"train_loss": 0.00023611157666891813, "global_step": 69296, "epoch": 582, "lr": 2.1692596918885255e-07} +{"train_loss": 0.00016550483996979892, "global_step": 69297, "epoch": 582, "lr": 2.167198659194125e-07} +{"train_loss": 0.00022627547150477767, "global_step": 69298, "epoch": 582, "lr": 2.165138603941297e-07} +{"train_loss": 0.0002700745826587081, "global_step": 69299, "epoch": 582, "lr": 2.163079526133982e-07} +{"train_loss": 0.00013761097216047347, "global_step": 69300, "epoch": 582, "lr": 2.1610214257762885e-07} +{"train_loss": 0.00022591406013816595, "global_step": 69301, "epoch": 582, "lr": 2.158964302872213e-07} +{"train_loss": 0.00021091278176754713, "global_step": 69302, "epoch": 582, "lr": 2.156908157425863e-07} +{"train_loss": 0.00022208094014786184, "global_step": 69303, "epoch": 582, "lr": 2.1548529894411806e-07} +{"train_loss": 0.00024741573724895716, "global_step": 69304, "epoch": 582, "lr": 2.1527987989223287e-07} +{"train_loss": 0.0002739291812758893, "global_step": 69305, "epoch": 582, "lr": 2.1507455858732483e-07} +{"train_loss": 0.00018111417011823505, "global_step": 69306, "epoch": 582, "lr": 2.1486933502979922e-07} +{"train_loss": 0.00021449224732350558, "global_step": 69307, "epoch": 582, "lr": 2.146642092200557e-07} +{"train_loss": 0.00014271566760726273, "global_step": 69308, "epoch": 582, "lr": 2.144591811584995e-07} +{"train_loss": 0.00021037393889855593, "global_step": 69309, "epoch": 582, "lr": 2.1425425084553586e-07} +{"train_loss": 0.00030454678926616907, "global_step": 69310, "epoch": 582, "lr": 2.1404941828157e-07} +{"train_loss": 0.00017081537225749344, "global_step": 69311, "epoch": 582, "lr": 2.1384468346699603e-07} +{"train_loss": 0.0002625182387419045, "global_step": 69312, "epoch": 582, "lr": 2.1364004640221924e-07} +{"train_loss": 0.00017669415683485568, "global_step": 69313, "epoch": 582, "lr": 2.1343550708763926e-07} +{"train_loss": 0.0001735140976961702, "global_step": 69314, "epoch": 582, "lr": 2.1323106552366135e-07} +{"train_loss": 0.00013478969049174339, "global_step": 69315, "epoch": 582, "lr": 2.1302672171068517e-07} +{"train_loss": 0.0004804314812645316, "global_step": 69316, "epoch": 582, "lr": 2.1282247564911039e-07} +{"train_loss": 0.00018648816330824047, "global_step": 69317, "epoch": 582, "lr": 2.1261832733934228e-07} +{"train_loss": 0.00015514995902776718, "global_step": 69318, "epoch": 582, "lr": 2.1241427678177494e-07} +{"train_loss": 0.0002548924821894616, "global_step": 69319, "epoch": 582, "lr": 2.1221032397681917e-07} +{"train_loss": 0.00024934334214776754, "global_step": 69320, "epoch": 582, "lr": 2.1200646892486908e-07} +{"train_loss": 0.00019766826881095767, "global_step": 69321, "epoch": 582, "lr": 2.118027116263188e-07} +{"train_loss": 0.0002732470748014748, "global_step": 69322, "epoch": 582, "lr": 2.1159905208157916e-07} +{"train_loss": 0.00011173597886227071, "global_step": 69323, "epoch": 582, "lr": 2.1139549029104423e-07} +{"train_loss": 0.00019001054170075804, "global_step": 69324, "epoch": 582, "lr": 2.1119202625511925e-07} +{"train_loss": 0.0002802055678330362, "global_step": 69325, "epoch": 582, "lr": 2.109886599741928e-07} +{"train_loss": 0.00026255715056322515, "global_step": 69326, "epoch": 582, "lr": 2.1078539144867571e-07} +{"train_loss": 0.00044457349576987326, "global_step": 69327, "epoch": 582, "lr": 2.1058222067896205e-07} +{"train_loss": 0.0001371091784676537, "global_step": 69328, "epoch": 582, "lr": 2.1037914766545151e-07} +{"train_loss": 0.0003674092295113951, "global_step": 69329, "epoch": 582, "lr": 2.1017617240854382e-07} +{"train_loss": 0.0002464975696057081, "global_step": 69330, "epoch": 582, "lr": 2.099732949086275e-07} +{"train_loss": 0.00017678273434285074, "global_step": 69331, "epoch": 582, "lr": 2.097705151661189e-07} +{"train_loss": 0.00032234902027994394, "global_step": 69332, "epoch": 582, "lr": 2.0956783318140104e-07} +{"train_loss": 0.0007800741586834192, "global_step": 69333, "epoch": 582, "lr": 2.093652489548792e-07} +{"train_loss": 0.00018824431754183024, "global_step": 69334, "epoch": 582, "lr": 2.0916276248694745e-07} +{"train_loss": 0.00032017240300774574, "global_step": 69335, "epoch": 582, "lr": 2.0896037377801103e-07} +{"train_loss": 0.0002787552948575467, "global_step": 69336, "epoch": 582, "lr": 2.08758082828453e-07} +{"train_loss": 0.00017870833107735962, "global_step": 69337, "epoch": 582, "lr": 2.085558896386841e-07} +{"train_loss": 0.0002497576060704887, "global_step": 69338, "epoch": 582, "lr": 2.0835379420909295e-07} +{"train_loss": 0.00012325898569542915, "global_step": 69339, "epoch": 582, "lr": 2.0815179654008478e-07} +{"train_loss": 0.0002878128143493086, "global_step": 69340, "epoch": 582, "lr": 2.0794989663204812e-07} +{"train_loss": 0.0003772048803512007, "global_step": 69341, "epoch": 582, "lr": 2.077480944853827e-07} +{"train_loss": 0.000156188674736768, "global_step": 69342, "epoch": 582, "lr": 2.075463901004826e-07} +{"train_loss": 0.00015643621736671776, "global_step": 69343, "epoch": 582, "lr": 2.073447834777531e-07} +{"train_loss": 0.00029104240820743144, "global_step": 69344, "epoch": 582, "lr": 2.071432746175772e-07} +{"train_loss": 0.00032576502417214215, "global_step": 69345, "epoch": 582, "lr": 2.069418635203546e-07} +{"train_loss": 0.0003410066128708422, "global_step": 69346, "epoch": 582, "lr": 2.0674055018648496e-07} +{"train_loss": 0.00037406591582112014, "global_step": 69347, "epoch": 582, "lr": 2.0653933461635688e-07} +{"train_loss": 0.00018156037549488246, "global_step": 69348, "epoch": 582, "lr": 2.0633821681037002e-07} +{"train_loss": 0.0002253335405839607, "global_step": 69349, "epoch": 582, "lr": 2.0613719676891852e-07} +{"train_loss": 0.0002481139963492751, "global_step": 69350, "epoch": 582, "lr": 2.059362744923965e-07} +{"train_loss": 0.0003042753378394991, "global_step": 69351, "epoch": 582, "lr": 2.0573544998120365e-07} +{"train_loss": 0.00019278163381386548, "global_step": 69352, "epoch": 582, "lr": 2.05534723235723e-07} +{"train_loss": 0.0002123104641214013, "global_step": 69353, "epoch": 582, "lr": 2.0533409425635974e-07} +{"train_loss": 0.00031369327916763723, "global_step": 69354, "epoch": 582, "lr": 2.0513356304350252e-07} +{"train_loss": 0.00017448146536480635, "global_step": 69355, "epoch": 582, "lr": 2.049331295975454e-07} +{"train_loss": 0.00039909101906232536, "global_step": 69356, "epoch": 582, "lr": 2.0473279391888257e-07} +{"train_loss": 0.00024329443112947047, "global_step": 69357, "epoch": 582, "lr": 2.045325560079081e-07} +{"train_loss": 0.00024243223015218973, "global_step": 69358, "epoch": 582, "lr": 2.0433241586501062e-07} +{"train_loss": 0.00020257901633158326, "global_step": 69359, "epoch": 582, "lr": 2.0413237349058978e-07} +{"train_loss": 0.00022856068972032517, "global_step": 69360, "epoch": 582, "lr": 2.0393242888503417e-07} +{"train_loss": 0.0001426736853318289, "global_step": 69361, "epoch": 582, "lr": 2.0373258204873235e-07} +{"train_loss": 0.00022683653514832258, "global_step": 69362, "epoch": 582, "lr": 2.0353283298208957e-07} +{"train_loss": 0.0003332036139909178, "global_step": 69363, "epoch": 582, "lr": 2.0333318168548887e-07} +{"train_loss": 0.00020514802599791437, "global_step": 69364, "epoch": 582, "lr": 2.031336281593188e-07} +{"train_loss": 0.00014584267046302557, "global_step": 69365, "epoch": 582, "lr": 2.0293417240397905e-07} +{"train_loss": 0.000199199712369591, "global_step": 69366, "epoch": 582, "lr": 2.027348144198582e-07} +{"train_loss": 0.00018660901696421206, "global_step": 69367, "epoch": 582, "lr": 2.0253555420734483e-07} +{"train_loss": 0.00021718503558076918, "global_step": 69368, "epoch": 582, "lr": 2.0233639176683304e-07} +{"train_loss": 0.00017030563321895897, "global_step": 69369, "epoch": 582, "lr": 2.0213732709871703e-07} +{"train_loss": 0.0002748091355897486, "global_step": 69370, "epoch": 582, "lr": 2.0193836020337976e-07} +{"train_loss": 0.00021156505681574345, "global_step": 69371, "epoch": 582, "lr": 2.0173949108122092e-07} +{"train_loss": 0.00033190532121807337, "global_step": 69372, "epoch": 582, "lr": 2.0154071973262355e-07} +{"train_loss": 0.0003228607529308647, "global_step": 69373, "epoch": 582, "lr": 2.013420461579818e-07} +{"train_loss": 0.00015092984540387988, "global_step": 69374, "epoch": 582, "lr": 2.0114347035768423e-07} +{"train_loss": 0.0006118576275184751, "global_step": 69375, "epoch": 582, "lr": 2.009449923321194e-07} +{"train_loss": 0.0002461069928381412, "global_step": 69376, "epoch": 582, "lr": 2.0074661208168144e-07, "val_loss": 0.014318462461233139} +{"train_loss": 0.00016751674411352724, "global_step": 69377, "epoch": 583, "lr": 2.0054832960675896e-07} +{"train_loss": 0.0001736921549309045, "global_step": 69378, "epoch": 583, "lr": 2.0035014490773496e-07} +{"train_loss": 0.0001606944133527577, "global_step": 69379, "epoch": 583, "lr": 2.0015205798500913e-07} +{"train_loss": 0.00012120164319640025, "global_step": 69380, "epoch": 583, "lr": 1.9995406883895895e-07} +{"train_loss": 0.0001601187977939844, "global_step": 69381, "epoch": 583, "lr": 1.997561774699841e-07} +{"train_loss": 0.00027058995328843594, "global_step": 69382, "epoch": 583, "lr": 1.9955838387846203e-07} +{"train_loss": 0.0001868485560407862, "global_step": 69383, "epoch": 583, "lr": 1.9936068806478692e-07} +{"train_loss": 0.00021050804934930056, "global_step": 69384, "epoch": 583, "lr": 1.9916309002935285e-07} +{"train_loss": 0.00018403521971777081, "global_step": 69385, "epoch": 583, "lr": 1.9896558977253733e-07} +{"train_loss": 0.00013810193922836334, "global_step": 69386, "epoch": 583, "lr": 1.987681872947289e-07} +{"train_loss": 0.0001772841060301289, "global_step": 69387, "epoch": 583, "lr": 1.9857088259632174e-07} +{"train_loss": 0.0002491869672667235, "global_step": 69388, "epoch": 583, "lr": 1.9837367567770438e-07} +{"train_loss": 0.00013893283903598785, "global_step": 69389, "epoch": 583, "lr": 1.9817656653925432e-07} +{"train_loss": 0.0004122363752685487, "global_step": 69390, "epoch": 583, "lr": 1.979795551813657e-07} +{"train_loss": 0.00013714306987822056, "global_step": 69391, "epoch": 583, "lr": 1.9778264160442705e-07} +{"train_loss": 0.0002649051311891526, "global_step": 69392, "epoch": 583, "lr": 1.975858258088159e-07} +{"train_loss": 0.0002787880948744714, "global_step": 69393, "epoch": 583, "lr": 1.9738910779492635e-07} +{"train_loss": 0.0002821314556058496, "global_step": 69394, "epoch": 583, "lr": 1.9719248756314147e-07} +{"train_loss": 0.0002010402240557596, "global_step": 69395, "epoch": 583, "lr": 1.9699596511384976e-07} +{"train_loss": 0.00023347247042693198, "global_step": 69396, "epoch": 583, "lr": 1.9679954044743987e-07} +{"train_loss": 0.0003465941990725696, "global_step": 69397, "epoch": 583, "lr": 1.9660321356428923e-07} +{"train_loss": 0.0005412533646449447, "global_step": 69398, "epoch": 583, "lr": 1.9640698446478645e-07} +{"train_loss": 0.00015999149763956666, "global_step": 69399, "epoch": 583, "lr": 1.9621085314932008e-07} +{"train_loss": 0.00031361725996248424, "global_step": 69400, "epoch": 583, "lr": 1.9601481961827317e-07} +{"train_loss": 0.00023983050778042525, "global_step": 69401, "epoch": 583, "lr": 1.9581888387202874e-07} +{"train_loss": 0.00019148961291648448, "global_step": 69402, "epoch": 583, "lr": 1.956230459109698e-07} +{"train_loss": 0.00023636792320758104, "global_step": 69403, "epoch": 583, "lr": 1.954273057354905e-07} +{"train_loss": 0.00013959255011286587, "global_step": 69404, "epoch": 583, "lr": 1.952316633459683e-07} +{"train_loss": 0.00041731848614290357, "global_step": 69405, "epoch": 583, "lr": 1.9503611874278072e-07} +{"train_loss": 0.000228074291953817, "global_step": 69406, "epoch": 583, "lr": 1.9484067192632737e-07} +{"train_loss": 0.00016210525063797832, "global_step": 69407, "epoch": 583, "lr": 1.9464532289698024e-07} +{"train_loss": 0.0002997579867951572, "global_step": 69408, "epoch": 583, "lr": 1.9445007165512786e-07} +{"train_loss": 0.0003997859894298017, "global_step": 69409, "epoch": 583, "lr": 1.9425491820114773e-07} +{"train_loss": 0.0002875541977118701, "global_step": 69410, "epoch": 583, "lr": 1.940598625354284e-07} +{"train_loss": 0.00021309120347723365, "global_step": 69411, "epoch": 583, "lr": 1.9386490465835294e-07} +{"train_loss": 0.0001718538987915963, "global_step": 69412, "epoch": 583, "lr": 1.9367004457030436e-07} +{"train_loss": 0.00031226599821820855, "global_step": 69413, "epoch": 583, "lr": 1.934752822716601e-07} +{"train_loss": 0.00035599604598246515, "global_step": 69414, "epoch": 583, "lr": 1.9328061776280882e-07} +{"train_loss": 0.00027038317057304084, "global_step": 69415, "epoch": 583, "lr": 1.9308605104412791e-07} +{"train_loss": 0.0002146526676369831, "global_step": 69416, "epoch": 583, "lr": 1.9289158211600044e-07} +{"train_loss": 0.00016016885638237, "global_step": 69417, "epoch": 583, "lr": 1.9269721097881498e-07} +{"train_loss": 0.00026910315500572324, "global_step": 69418, "epoch": 583, "lr": 1.9250293763294346e-07} +{"train_loss": 0.00031439511803910136, "global_step": 69419, "epoch": 583, "lr": 1.9230876207876892e-07} +{"train_loss": 0.00013856134319212288, "global_step": 69420, "epoch": 583, "lr": 1.921146843166799e-07} +{"train_loss": 0.00028318905970081687, "global_step": 69421, "epoch": 583, "lr": 1.9192070434704835e-07} +{"train_loss": 0.00012465083273127675, "global_step": 69422, "epoch": 583, "lr": 1.9172682217026283e-07} +{"train_loss": 0.0003703479014802724, "global_step": 69423, "epoch": 583, "lr": 1.915330377866953e-07} +{"train_loss": 0.00023834625608287752, "global_step": 69424, "epoch": 583, "lr": 1.9133935119673986e-07} +{"train_loss": 0.0001767767098499462, "global_step": 69425, "epoch": 583, "lr": 1.9114576240075733e-07} +{"train_loss": 0.00021431411732919514, "global_step": 69426, "epoch": 583, "lr": 1.909522713991474e-07} +{"train_loss": 0.00021777153597213328, "global_step": 69427, "epoch": 583, "lr": 1.9075887819228199e-07} +{"train_loss": 0.00020369789854157716, "global_step": 69428, "epoch": 583, "lr": 1.9056558278053306e-07} +{"train_loss": 0.0002287922106916085, "global_step": 69429, "epoch": 583, "lr": 1.9037238516429467e-07} +{"train_loss": 0.00013629916065838188, "global_step": 69430, "epoch": 583, "lr": 1.9017928534393325e-07} +{"train_loss": 0.00023706391220912337, "global_step": 69431, "epoch": 583, "lr": 1.8998628331983738e-07} +{"train_loss": 0.00011435189662734047, "global_step": 69432, "epoch": 583, "lr": 1.8979337909237893e-07} +{"train_loss": 0.00029356160666793585, "global_step": 69433, "epoch": 583, "lr": 1.89600572661941e-07} +{"train_loss": 0.00022872253612149507, "global_step": 69434, "epoch": 583, "lr": 1.8940786402889542e-07} +{"train_loss": 0.000280893815215677, "global_step": 69435, "epoch": 583, "lr": 1.8921525319363643e-07} +{"train_loss": 0.00033591690589673817, "global_step": 69436, "epoch": 583, "lr": 1.8902274015652477e-07} +{"train_loss": 0.00030111760133877397, "global_step": 69437, "epoch": 583, "lr": 1.8883032491794905e-07} +{"train_loss": 0.00018730513693299145, "global_step": 69438, "epoch": 583, "lr": 1.8863800747827564e-07} +{"train_loss": 0.0003065864439122379, "global_step": 69439, "epoch": 583, "lr": 1.884457878378987e-07} +{"train_loss": 0.00019054794393014163, "global_step": 69440, "epoch": 583, "lr": 1.8825366599718453e-07} +{"train_loss": 0.0001507830311311409, "global_step": 69441, "epoch": 583, "lr": 1.8806164195651066e-07} +{"train_loss": 0.0005482698325067759, "global_step": 69442, "epoch": 583, "lr": 1.878697157162601e-07} +{"train_loss": 0.0005256046424619853, "global_step": 69443, "epoch": 583, "lr": 1.876778872768048e-07} +{"train_loss": 0.00012812357454095036, "global_step": 69444, "epoch": 583, "lr": 1.8748615663851665e-07} +{"train_loss": 0.00029359792824834585, "global_step": 69445, "epoch": 583, "lr": 1.8729452380178426e-07} +{"train_loss": 0.0006470696534961462, "global_step": 69446, "epoch": 583, "lr": 1.8710298876697397e-07} +{"train_loss": 0.00021315223420970142, "global_step": 69447, "epoch": 583, "lr": 1.8691155153446883e-07} +{"train_loss": 0.0002820839872583747, "global_step": 69448, "epoch": 583, "lr": 1.867202121046352e-07} +{"train_loss": 0.00024043599842116237, "global_step": 69449, "epoch": 583, "lr": 1.8652897047786167e-07} +{"train_loss": 0.00018451796495355666, "global_step": 69450, "epoch": 583, "lr": 1.8633782665450904e-07} +{"train_loss": 0.0001550493179820478, "global_step": 69451, "epoch": 583, "lr": 1.8614678063496594e-07} +{"train_loss": 0.0002032898919424042, "global_step": 69452, "epoch": 583, "lr": 1.8595583241959868e-07} +{"train_loss": 0.0002822079695761204, "global_step": 69453, "epoch": 583, "lr": 1.8576498200879033e-07} +{"train_loss": 0.0004957820056006312, "global_step": 69454, "epoch": 583, "lr": 1.8557422940290726e-07} +{"train_loss": 0.0006368659669533372, "global_step": 69455, "epoch": 583, "lr": 1.853835746023269e-07} +{"train_loss": 0.00018969419761560857, "global_step": 69456, "epoch": 583, "lr": 1.8519301760742124e-07} +{"train_loss": 0.00016961412620730698, "global_step": 69457, "epoch": 583, "lr": 1.8500255841857329e-07} +{"train_loss": 0.00030125404009595513, "global_step": 69458, "epoch": 583, "lr": 1.8481219703614938e-07} +{"train_loss": 0.00028643838595598936, "global_step": 69459, "epoch": 583, "lr": 1.8462193346052148e-07} +{"train_loss": 0.0002387098502367735, "global_step": 69460, "epoch": 583, "lr": 1.8443176769206705e-07} +{"train_loss": 0.0003852308145724237, "global_step": 69461, "epoch": 583, "lr": 1.84241699731158e-07} +{"train_loss": 0.00036213017301633954, "global_step": 69462, "epoch": 583, "lr": 1.8405172957817186e-07} +{"train_loss": 0.00013294571544975042, "global_step": 69463, "epoch": 583, "lr": 1.838618572334805e-07} +{"train_loss": 0.0004161967081017792, "global_step": 69464, "epoch": 583, "lr": 1.8367208269744474e-07} +{"train_loss": 0.00039846828440204263, "global_step": 69465, "epoch": 583, "lr": 1.8348240597045318e-07} +{"train_loss": 0.00021218156325630844, "global_step": 69466, "epoch": 583, "lr": 1.832928270528722e-07} +{"train_loss": 0.00045579500147141516, "global_step": 69467, "epoch": 583, "lr": 1.8310334594506817e-07} +{"train_loss": 0.0005585385370068252, "global_step": 69468, "epoch": 583, "lr": 1.8291396264742411e-07} +{"train_loss": 0.00015677505871281028, "global_step": 69469, "epoch": 583, "lr": 1.827246771603064e-07} +{"train_loss": 0.00021588237723335624, "global_step": 69470, "epoch": 583, "lr": 1.8253548948408694e-07} +{"train_loss": 0.00023087371664587408, "global_step": 69471, "epoch": 583, "lr": 1.8234639961913214e-07} +{"train_loss": 0.00016708851035218686, "global_step": 69472, "epoch": 583, "lr": 1.8215740756581944e-07} +{"train_loss": 0.00021148312953300774, "global_step": 69473, "epoch": 583, "lr": 1.819685133245208e-07} +{"train_loss": 0.000306452508084476, "global_step": 69474, "epoch": 583, "lr": 1.817797168956026e-07} +{"train_loss": 0.0001557841314934194, "global_step": 69475, "epoch": 583, "lr": 1.8159101827944224e-07} +{"train_loss": 0.00023228235659189522, "global_step": 69476, "epoch": 583, "lr": 1.8140241747640063e-07} +{"train_loss": 0.00018261423974763602, "global_step": 69477, "epoch": 583, "lr": 1.8121391448685522e-07} +{"train_loss": 0.00030818881350569427, "global_step": 69478, "epoch": 583, "lr": 1.8102550931117234e-07} +{"train_loss": 0.00034932128619402647, "global_step": 69479, "epoch": 583, "lr": 1.8083720194972397e-07} +{"train_loss": 0.00021904219465795904, "global_step": 69480, "epoch": 583, "lr": 1.8064899240288203e-07} +{"train_loss": 0.000199939648155123, "global_step": 69481, "epoch": 583, "lr": 1.8046088067101286e-07} +{"train_loss": 0.0001828536478569731, "global_step": 69482, "epoch": 583, "lr": 1.8027286675448285e-07} +{"train_loss": 0.00022065520170144737, "global_step": 69483, "epoch": 583, "lr": 1.8008495065366392e-07} +{"train_loss": 0.0004157976363785565, "global_step": 69484, "epoch": 583, "lr": 1.7989713236892802e-07} +{"train_loss": 0.0005829971050843596, "global_step": 69485, "epoch": 583, "lr": 1.797094119006415e-07} +{"train_loss": 0.0004062013467773795, "global_step": 69486, "epoch": 583, "lr": 1.7952178924917627e-07} +{"train_loss": 0.00020641555602196604, "global_step": 69487, "epoch": 583, "lr": 1.7933426441489322e-07} +{"train_loss": 0.0002432164183119312, "global_step": 69488, "epoch": 583, "lr": 1.7914683739816417e-07} +{"train_loss": 0.00022374717809725553, "global_step": 69489, "epoch": 583, "lr": 1.7895950819936114e-07} +{"train_loss": 0.0004959343932569027, "global_step": 69490, "epoch": 583, "lr": 1.7877227681884488e-07} +{"train_loss": 0.0001390530087519437, "global_step": 69491, "epoch": 583, "lr": 1.7858514325699294e-07} +{"train_loss": 0.0002735418966040015, "global_step": 69492, "epoch": 583, "lr": 1.7839810751416054e-07} +{"train_loss": 0.0001551964960526675, "global_step": 69493, "epoch": 583, "lr": 1.7821116959072516e-07} +{"train_loss": 0.00024695321917533875, "global_step": 69494, "epoch": 583, "lr": 1.7802432948704207e-07} +{"train_loss": 0.00026247711551860917, "global_step": 69495, "epoch": 583, "lr": 1.778375872034943e-07, "val_loss": 0.022978078573942184} +{"train_loss": 0.0005524412845261395, "global_step": 69496, "epoch": 584, "lr": 1.7765094274043714e-07} +{"train_loss": 0.00019976192561443895, "global_step": 69497, "epoch": 584, "lr": 1.7746439609823696e-07} +{"train_loss": 0.0002913374628406018, "global_step": 69498, "epoch": 584, "lr": 1.7727794727726012e-07} +{"train_loss": 0.000205417672987096, "global_step": 69499, "epoch": 584, "lr": 1.7709159627787853e-07} +{"train_loss": 0.00031431668321602046, "global_step": 69500, "epoch": 584, "lr": 1.769053431004586e-07} +{"train_loss": 0.00021158946037758142, "global_step": 69501, "epoch": 584, "lr": 1.7671918774535556e-07} +{"train_loss": 0.00036826173891313374, "global_step": 69502, "epoch": 584, "lr": 1.7653313021294692e-07} +{"train_loss": 0.0005152244120836258, "global_step": 69503, "epoch": 584, "lr": 1.7634717050358795e-07} +{"train_loss": 0.00021147119696252048, "global_step": 69504, "epoch": 584, "lr": 1.7616130861765057e-07} +{"train_loss": 0.00023040077940095216, "global_step": 69505, "epoch": 584, "lr": 1.7597554455550115e-07} +{"train_loss": 0.00017674897389952093, "global_step": 69506, "epoch": 584, "lr": 1.7578987831749494e-07} +{"train_loss": 0.00031250796746462584, "global_step": 69507, "epoch": 584, "lr": 1.7560430990400944e-07} +{"train_loss": 0.00044213555520400405, "global_step": 69508, "epoch": 584, "lr": 1.7541883931539437e-07} +{"train_loss": 0.00020237339776940644, "global_step": 69509, "epoch": 584, "lr": 1.7523346655202722e-07} +{"train_loss": 0.00033965028706006706, "global_step": 69510, "epoch": 584, "lr": 1.7504819161426324e-07} +{"train_loss": 0.0003529242821969092, "global_step": 69511, "epoch": 584, "lr": 1.7486301450246878e-07} +{"train_loss": 0.00017840975488070399, "global_step": 69512, "epoch": 584, "lr": 1.7467793521701026e-07} +{"train_loss": 0.00021428025502245873, "global_step": 69513, "epoch": 584, "lr": 1.7449295375824292e-07} +{"train_loss": 0.00013035399024374783, "global_step": 69514, "epoch": 584, "lr": 1.7430807012654428e-07} +{"train_loss": 0.00017324666259810328, "global_step": 69515, "epoch": 584, "lr": 1.7412328432226398e-07} +{"train_loss": 0.0003351079358253628, "global_step": 69516, "epoch": 584, "lr": 1.7393859634576848e-07} +{"train_loss": 0.00015571614494547248, "global_step": 69517, "epoch": 584, "lr": 1.7375400619742411e-07} +{"train_loss": 0.00026868144050240517, "global_step": 69518, "epoch": 584, "lr": 1.7356951387758613e-07} +{"train_loss": 0.00032742306939326227, "global_step": 69519, "epoch": 584, "lr": 1.733851193866265e-07} +{"train_loss": 0.00027901428984478116, "global_step": 69520, "epoch": 584, "lr": 1.7320082272490046e-07} +{"train_loss": 0.0005221761530265212, "global_step": 69521, "epoch": 584, "lr": 1.7301662389276884e-07} +{"train_loss": 0.00020632323867175728, "global_step": 69522, "epoch": 584, "lr": 1.7283252289059803e-07} +{"train_loss": 0.0002643992193043232, "global_step": 69523, "epoch": 584, "lr": 1.726485197187433e-07} +{"train_loss": 0.00029213569359853864, "global_step": 69524, "epoch": 584, "lr": 1.7246461437757656e-07} +{"train_loss": 0.0001592528133187443, "global_step": 69525, "epoch": 584, "lr": 1.7228080686744752e-07} +{"train_loss": 0.00018349086167290807, "global_step": 69526, "epoch": 584, "lr": 1.7209709718872258e-07} +{"train_loss": 0.0001900676725199446, "global_step": 69527, "epoch": 584, "lr": 1.7191348534176255e-07} +{"train_loss": 0.00019808561773970723, "global_step": 69528, "epoch": 584, "lr": 1.7172997132692826e-07} +{"train_loss": 0.00027589438832364976, "global_step": 69529, "epoch": 584, "lr": 1.7154655514457497e-07} +{"train_loss": 0.0003519096062518656, "global_step": 69530, "epoch": 584, "lr": 1.7136323679506904e-07} +{"train_loss": 0.0001677950203884393, "global_step": 69531, "epoch": 584, "lr": 1.7118001627877133e-07} +{"train_loss": 0.00021653018484357744, "global_step": 69532, "epoch": 584, "lr": 1.7099689359603156e-07} +{"train_loss": 0.00022772687952965498, "global_step": 69533, "epoch": 584, "lr": 1.708138687472216e-07} +{"train_loss": 0.0002013129269471392, "global_step": 69534, "epoch": 584, "lr": 1.7063094173269124e-07} +{"train_loss": 0.00029987437301315367, "global_step": 69535, "epoch": 584, "lr": 1.704481125528068e-07} +{"train_loss": 0.00047097078640945256, "global_step": 69536, "epoch": 584, "lr": 1.7026538120791803e-07} +{"train_loss": 0.000339811755111441, "global_step": 69537, "epoch": 584, "lr": 1.7008274769839683e-07} +{"train_loss": 0.00021091540111228824, "global_step": 69538, "epoch": 584, "lr": 1.6990021202459295e-07} +{"train_loss": 0.00018321051902603358, "global_step": 69539, "epoch": 584, "lr": 1.6971777418686162e-07} +{"train_loss": 0.00026141759008169174, "global_step": 69540, "epoch": 584, "lr": 1.6953543418556928e-07} +{"train_loss": 0.00026752924895845354, "global_step": 69541, "epoch": 584, "lr": 1.6935319202107114e-07} +{"train_loss": 0.00012551034160424024, "global_step": 69542, "epoch": 584, "lr": 1.6917104769372248e-07} +{"train_loss": 0.00040009585791267455, "global_step": 69543, "epoch": 584, "lr": 1.689890012038897e-07} +{"train_loss": 0.0005619701696559787, "global_step": 69544, "epoch": 584, "lr": 1.6880705255191697e-07} +{"train_loss": 0.0002143072197213769, "global_step": 69545, "epoch": 584, "lr": 1.6862520173817064e-07} +{"train_loss": 0.00032987951999530196, "global_step": 69546, "epoch": 584, "lr": 1.6844344876300046e-07} +{"train_loss": 0.0002042554842773825, "global_step": 69547, "epoch": 584, "lr": 1.6826179362677274e-07} +{"train_loss": 0.0002106415486196056, "global_step": 69548, "epoch": 584, "lr": 1.6808023632983727e-07} +{"train_loss": 0.00018724187975749373, "global_step": 69549, "epoch": 584, "lr": 1.6789877687254928e-07} +{"train_loss": 0.00028363027377054095, "global_step": 69550, "epoch": 584, "lr": 1.6771741525527518e-07} +{"train_loss": 0.00028640241362154484, "global_step": 69551, "epoch": 584, "lr": 1.675361514783591e-07} +{"train_loss": 0.00023086318105924875, "global_step": 69552, "epoch": 584, "lr": 1.673549855421619e-07} +{"train_loss": 0.00015097037248779088, "global_step": 69553, "epoch": 584, "lr": 1.6717391744704435e-07} +{"train_loss": 0.00019113783491775393, "global_step": 69554, "epoch": 584, "lr": 1.669929471933507e-07} +{"train_loss": 0.0001570761378388852, "global_step": 69555, "epoch": 584, "lr": 1.6681207478144721e-07} +{"train_loss": 0.00031591998413205147, "global_step": 69556, "epoch": 584, "lr": 1.6663130021167817e-07} +{"train_loss": 0.00021708551503252238, "global_step": 69557, "epoch": 584, "lr": 1.6645062348440988e-07} +{"train_loss": 0.00023837428307160735, "global_step": 69558, "epoch": 584, "lr": 1.6627004459999208e-07} +{"train_loss": 0.0002008632436627522, "global_step": 69559, "epoch": 584, "lr": 1.6608956355878002e-07} +{"train_loss": 0.0003091758117079735, "global_step": 69560, "epoch": 584, "lr": 1.6590918036112347e-07} +{"train_loss": 0.00043225716217420995, "global_step": 69561, "epoch": 584, "lr": 1.6572889500737766e-07} +{"train_loss": 0.00017747913079801947, "global_step": 69562, "epoch": 584, "lr": 1.6554870749790896e-07} +{"train_loss": 0.0001556654169689864, "global_step": 69563, "epoch": 584, "lr": 1.6536861783305046e-07} +{"train_loss": 0.00012963083281647414, "global_step": 69564, "epoch": 584, "lr": 1.651886260131741e-07} +{"train_loss": 0.0003799166879616678, "global_step": 69565, "epoch": 584, "lr": 1.65008732038624e-07} +{"train_loss": 0.00028185005066916347, "global_step": 69566, "epoch": 584, "lr": 1.6482893590975545e-07} +{"train_loss": 0.0002904545108322054, "global_step": 69567, "epoch": 584, "lr": 1.646492376269182e-07} +{"train_loss": 0.00023497063375543803, "global_step": 69568, "epoch": 584, "lr": 1.6446963719047304e-07} +{"train_loss": 0.00019841166795231402, "global_step": 69569, "epoch": 584, "lr": 1.642901346007586e-07} +{"train_loss": 0.00046668335562571883, "global_step": 69570, "epoch": 584, "lr": 1.641107298581468e-07} +{"train_loss": 0.00022866942163091153, "global_step": 69571, "epoch": 584, "lr": 1.639314229629707e-07} +{"train_loss": 0.00013489331468008459, "global_step": 69572, "epoch": 584, "lr": 1.637522139155967e-07} +{"train_loss": 0.0003770309849642217, "global_step": 69573, "epoch": 584, "lr": 1.6357310271636893e-07} +{"train_loss": 0.0003978968015871942, "global_step": 69574, "epoch": 584, "lr": 1.633940893656427e-07} +{"train_loss": 0.0003955687570851296, "global_step": 69575, "epoch": 584, "lr": 1.632151738637677e-07} +{"train_loss": 0.00018480968719813973, "global_step": 69576, "epoch": 584, "lr": 1.630363562110937e-07} +{"train_loss": 0.00023373719886876643, "global_step": 69577, "epoch": 584, "lr": 1.628576364079759e-07} +{"train_loss": 0.00019709274056367576, "global_step": 69578, "epoch": 584, "lr": 1.6267901445476407e-07} +{"train_loss": 0.00022653135238215327, "global_step": 69579, "epoch": 584, "lr": 1.6250049035180236e-07} +{"train_loss": 0.000258113956078887, "global_step": 69580, "epoch": 584, "lr": 1.623220640994516e-07} +{"train_loss": 0.0002686067600734532, "global_step": 69581, "epoch": 584, "lr": 1.6214373569805596e-07} +{"train_loss": 0.00015023027663119137, "global_step": 69582, "epoch": 584, "lr": 1.6196550514796516e-07} +{"train_loss": 0.00013486311945598572, "global_step": 69583, "epoch": 584, "lr": 1.617873724495289e-07} +{"train_loss": 0.00017671652312856168, "global_step": 69584, "epoch": 584, "lr": 1.6160933760310247e-07} +{"train_loss": 0.00011705411452567205, "global_step": 69585, "epoch": 584, "lr": 1.6143140060903006e-07} +{"train_loss": 0.00027119662263430655, "global_step": 69586, "epoch": 584, "lr": 1.6125356146766136e-07} +{"train_loss": 0.00023053034965414554, "global_step": 69587, "epoch": 584, "lr": 1.6107582017935164e-07} +{"train_loss": 0.00027681878418661654, "global_step": 69588, "epoch": 584, "lr": 1.6089817674443952e-07} +{"train_loss": 0.0004041253705509007, "global_step": 69589, "epoch": 584, "lr": 1.6072063116328028e-07} +{"train_loss": 0.00016083820082712919, "global_step": 69590, "epoch": 584, "lr": 1.6054318343622365e-07} +{"train_loss": 0.00020444444089662284, "global_step": 69591, "epoch": 584, "lr": 1.603658335636138e-07} +{"train_loss": 0.0002285992231918499, "global_step": 69592, "epoch": 584, "lr": 1.6018858154580595e-07} +{"train_loss": 0.0003024743346031755, "global_step": 69593, "epoch": 584, "lr": 1.6001142738313879e-07} +{"train_loss": 0.00015798296954017133, "global_step": 69594, "epoch": 584, "lr": 1.59834371075962e-07} +{"train_loss": 0.00025243041454814374, "global_step": 69595, "epoch": 584, "lr": 1.5965741262463087e-07} +{"train_loss": 0.00023466507263947278, "global_step": 69596, "epoch": 584, "lr": 1.5948055202948952e-07} +{"train_loss": 0.00020426703849807382, "global_step": 69597, "epoch": 584, "lr": 1.5930378929087663e-07} +{"train_loss": 0.0002072626812150702, "global_step": 69598, "epoch": 584, "lr": 1.5912712440914745e-07} +{"train_loss": 0.0004393137351144105, "global_step": 69599, "epoch": 584, "lr": 1.589505573846517e-07} +{"train_loss": 0.00021292110614012927, "global_step": 69600, "epoch": 584, "lr": 1.5877408821772798e-07} +{"train_loss": 0.0002390562731307, "global_step": 69601, "epoch": 584, "lr": 1.5859771690872604e-07} +{"train_loss": 0.00014958389510866255, "global_step": 69602, "epoch": 584, "lr": 1.584214434579956e-07} +{"train_loss": 0.00016335913096554577, "global_step": 69603, "epoch": 584, "lr": 1.582452678658808e-07} +{"train_loss": 0.00032847721013240516, "global_step": 69604, "epoch": 584, "lr": 1.5806919013272025e-07} +{"train_loss": 0.00041209490154869854, "global_step": 69605, "epoch": 584, "lr": 1.5789321025887483e-07} +{"train_loss": 0.00026739505119621754, "global_step": 69606, "epoch": 584, "lr": 1.57717328244672e-07} +{"train_loss": 0.0001686521718511358, "global_step": 69607, "epoch": 584, "lr": 1.575415440904726e-07} +{"train_loss": 0.0003650264989119023, "global_step": 69608, "epoch": 584, "lr": 1.573658577966153e-07} +{"train_loss": 0.0002690402907319367, "global_step": 69609, "epoch": 584, "lr": 1.5719026936344417e-07} +{"train_loss": 0.00015820511907804757, "global_step": 69610, "epoch": 584, "lr": 1.57014778791309e-07} +{"train_loss": 0.00014019168156664819, "global_step": 69611, "epoch": 584, "lr": 1.5683938608054282e-07} +{"train_loss": 0.0002906896988861263, "global_step": 69612, "epoch": 584, "lr": 1.5666409123150095e-07} +{"train_loss": 0.0002956782409455627, "global_step": 69613, "epoch": 584, "lr": 1.5648889424452195e-07} +{"train_loss": 0.00025833009072323137, "global_step": 69614, "epoch": 584, "lr": 1.563137951199556e-07, "val_loss": 0.015410445630550385} +{"train_loss": 0.00017754847067408264, "global_step": 69615, "epoch": 585, "lr": 1.5613879385814044e-07} +{"train_loss": 0.00025964167434722185, "global_step": 69616, "epoch": 585, "lr": 1.5596389045942628e-07} +{"train_loss": 0.0001735537516651675, "global_step": 69617, "epoch": 585, "lr": 1.5578908492414612e-07} +{"train_loss": 0.00015390382031910121, "global_step": 69618, "epoch": 585, "lr": 1.556143772526497e-07} +{"train_loss": 0.00019083174993284047, "global_step": 69619, "epoch": 585, "lr": 1.5543976744528122e-07} +{"train_loss": 0.00012212670117150992, "global_step": 69620, "epoch": 585, "lr": 1.5526525550237924e-07} +{"train_loss": 0.00012757483636960387, "global_step": 69621, "epoch": 585, "lr": 1.5509084142429352e-07} +{"train_loss": 0.0001428134273737669, "global_step": 69622, "epoch": 585, "lr": 1.5491652521135712e-07} +{"train_loss": 0.00016703792789485306, "global_step": 69623, "epoch": 585, "lr": 1.5474230686391976e-07} +{"train_loss": 0.00013488534023053944, "global_step": 69624, "epoch": 585, "lr": 1.5456818638232007e-07} +{"train_loss": 0.0002455335343256593, "global_step": 69625, "epoch": 585, "lr": 1.5439416376689665e-07} +{"train_loss": 0.0004172208427917212, "global_step": 69626, "epoch": 585, "lr": 1.542202390179992e-07} +{"train_loss": 0.0002113191585522145, "global_step": 69627, "epoch": 585, "lr": 1.5404641213596638e-07} +{"train_loss": 0.00031809622305445373, "global_step": 69628, "epoch": 585, "lr": 1.5387268312113122e-07} +{"train_loss": 0.0004334599943831563, "global_step": 69629, "epoch": 585, "lr": 1.5369905197384903e-07} +{"train_loss": 0.00032696203561499715, "global_step": 69630, "epoch": 585, "lr": 1.5352551869445287e-07} +{"train_loss": 0.00029588452889584005, "global_step": 69631, "epoch": 585, "lr": 1.5335208328328132e-07} +{"train_loss": 0.00022404937772080302, "global_step": 69632, "epoch": 585, "lr": 1.531787457406786e-07} +{"train_loss": 0.000179339709575288, "global_step": 69633, "epoch": 585, "lr": 1.5300550606698328e-07} +{"train_loss": 0.0001449652190785855, "global_step": 69634, "epoch": 585, "lr": 1.52832364262534e-07} +{"train_loss": 0.00021043437300249934, "global_step": 69635, "epoch": 585, "lr": 1.5265932032767495e-07} +{"train_loss": 0.000486067176098004, "global_step": 69636, "epoch": 585, "lr": 1.524863742627447e-07} +{"train_loss": 0.0001318473950959742, "global_step": 69637, "epoch": 585, "lr": 1.523135260680819e-07} +{"train_loss": 0.00018276461923960596, "global_step": 69638, "epoch": 585, "lr": 1.5214077574403074e-07} +{"train_loss": 0.00021181489864829928, "global_step": 69639, "epoch": 585, "lr": 1.519681232909187e-07} +{"train_loss": 0.0002606989583000541, "global_step": 69640, "epoch": 585, "lr": 1.517955687090955e-07} +{"train_loss": 0.0002504893927834928, "global_step": 69641, "epoch": 585, "lr": 1.5162311199889424e-07} +{"train_loss": 0.00026361923664808273, "global_step": 69642, "epoch": 585, "lr": 1.5145075316065348e-07} +{"train_loss": 0.00043366110185161233, "global_step": 69643, "epoch": 585, "lr": 1.5127849219471747e-07} +{"train_loss": 0.00019116417388431728, "global_step": 69644, "epoch": 585, "lr": 1.511063291014192e-07} +{"train_loss": 0.00023094142670743167, "global_step": 69645, "epoch": 585, "lr": 1.5093426388110288e-07} +{"train_loss": 0.00029351693228818476, "global_step": 69646, "epoch": 585, "lr": 1.5076229653409601e-07} +{"train_loss": 0.0004799659363925457, "global_step": 69647, "epoch": 585, "lr": 1.5059042706074278e-07} +{"train_loss": 0.00045687879901379347, "global_step": 69648, "epoch": 585, "lr": 1.5041865546137624e-07} +{"train_loss": 0.00021720415679737926, "global_step": 69649, "epoch": 585, "lr": 1.5024698173634056e-07} +{"train_loss": 0.00020690009114332497, "global_step": 69650, "epoch": 585, "lr": 1.5007540588597435e-07} +{"train_loss": 0.00014273912529461086, "global_step": 69651, "epoch": 585, "lr": 1.4990392791059958e-07} +{"train_loss": 0.00020041629613842815, "global_step": 69652, "epoch": 585, "lr": 1.4973254781057155e-07} +{"train_loss": 0.0002864849811885506, "global_step": 69653, "epoch": 585, "lr": 1.4956126558621219e-07} +{"train_loss": 0.0001501485676271841, "global_step": 69654, "epoch": 585, "lr": 1.493900812378657e-07} +{"train_loss": 0.00023659307043999434, "global_step": 69655, "epoch": 585, "lr": 1.492189947658651e-07} +{"train_loss": 0.0002168799692299217, "global_step": 69656, "epoch": 585, "lr": 1.4904800617054905e-07} +{"train_loss": 0.00039300372009165585, "global_step": 69657, "epoch": 585, "lr": 1.488771154522506e-07} +{"train_loss": 0.00021260305948089808, "global_step": 69658, "epoch": 585, "lr": 1.487063226113028e-07} +{"train_loss": 0.00029126362642273307, "global_step": 69659, "epoch": 585, "lr": 1.4853562764804984e-07} +{"train_loss": 0.00027083620079793036, "global_step": 69660, "epoch": 585, "lr": 1.4836503056281924e-07} +{"train_loss": 0.0003067854850087315, "global_step": 69661, "epoch": 585, "lr": 1.4819453135594408e-07} +{"train_loss": 0.00039091522921808064, "global_step": 69662, "epoch": 585, "lr": 1.480241300277685e-07} +{"train_loss": 0.00017584316083230078, "global_step": 69663, "epoch": 585, "lr": 1.4785382657861445e-07} +{"train_loss": 0.00015964030171744525, "global_step": 69664, "epoch": 585, "lr": 1.476836210088317e-07} +{"train_loss": 0.00012997197336517274, "global_step": 69665, "epoch": 585, "lr": 1.475135133187422e-07} +{"train_loss": 0.00027485305326990783, "global_step": 69666, "epoch": 585, "lr": 1.4734350350868452e-07} +{"train_loss": 0.00020424698595888913, "global_step": 69667, "epoch": 585, "lr": 1.471735915789918e-07} +{"train_loss": 0.00024110983940772712, "global_step": 69668, "epoch": 585, "lr": 1.4700377752999706e-07} +{"train_loss": 0.00022337651171255857, "global_step": 69669, "epoch": 585, "lr": 1.4683406136203891e-07} +{"train_loss": 0.00018602467025630176, "global_step": 69670, "epoch": 585, "lr": 1.4666444307543936e-07} +{"train_loss": 0.00028671487234532833, "global_step": 69671, "epoch": 585, "lr": 1.4649492267054254e-07} +{"train_loss": 0.0002847198920790106, "global_step": 69672, "epoch": 585, "lr": 1.4632550014767598e-07} +{"train_loss": 0.00024394580395892262, "global_step": 69673, "epoch": 585, "lr": 1.4615617550717276e-07} +{"train_loss": 0.00018922999151982367, "global_step": 69674, "epoch": 585, "lr": 1.459869487493659e-07} +{"train_loss": 0.0004622158012352884, "global_step": 69675, "epoch": 585, "lr": 1.4581781987458854e-07} +{"train_loss": 0.0002400369558017701, "global_step": 69676, "epoch": 585, "lr": 1.4564878888316812e-07} +{"train_loss": 0.0003119461180176586, "global_step": 69677, "epoch": 585, "lr": 1.4547985577544888e-07} +{"train_loss": 0.000179369977558963, "global_step": 69678, "epoch": 585, "lr": 1.453110205517416e-07} +{"train_loss": 0.0002637421421241015, "global_step": 69679, "epoch": 585, "lr": 1.4514228321240165e-07} +{"train_loss": 0.00029657490085810423, "global_step": 69680, "epoch": 585, "lr": 1.449736437577398e-07} +{"train_loss": 0.0001620448165340349, "global_step": 69681, "epoch": 585, "lr": 1.448051021881003e-07} +{"train_loss": 0.0003857627452816814, "global_step": 69682, "epoch": 585, "lr": 1.4463665850380504e-07} +{"train_loss": 0.0001385488867526874, "global_step": 69683, "epoch": 585, "lr": 1.4446831270519822e-07} +{"train_loss": 0.00018644418742042035, "global_step": 69684, "epoch": 585, "lr": 1.4430006479259627e-07} +{"train_loss": 0.00016883226635400206, "global_step": 69685, "epoch": 585, "lr": 1.4413191476633224e-07} +{"train_loss": 0.00036312954034656286, "global_step": 69686, "epoch": 585, "lr": 1.4396386262674478e-07} +{"train_loss": 0.00015683060337323695, "global_step": 69687, "epoch": 585, "lr": 1.4379590837415024e-07} +{"train_loss": 0.0005898926756344736, "global_step": 69688, "epoch": 585, "lr": 1.4362805200889284e-07} +{"train_loss": 0.00022904030629433692, "global_step": 69689, "epoch": 585, "lr": 1.4346029353129453e-07} +{"train_loss": 0.0002687199739739299, "global_step": 69690, "epoch": 585, "lr": 1.4329263294168282e-07} +{"train_loss": 0.0002654602867551148, "global_step": 69691, "epoch": 585, "lr": 1.4312507024039078e-07} +{"train_loss": 0.00015997093578334898, "global_step": 69692, "epoch": 585, "lr": 1.4295760542774595e-07} +{"train_loss": 0.0003696848580148071, "global_step": 69693, "epoch": 585, "lr": 1.4279023850408136e-07} +{"train_loss": 0.0003234973701182753, "global_step": 69694, "epoch": 585, "lr": 1.4262296946971898e-07} +{"train_loss": 0.0004359849262982607, "global_step": 69695, "epoch": 585, "lr": 1.4245579832498634e-07} +{"train_loss": 0.00024217744066845626, "global_step": 69696, "epoch": 585, "lr": 1.4228872507022207e-07} +{"train_loss": 0.00021918145648669451, "global_step": 69697, "epoch": 585, "lr": 1.4212174970574255e-07} +{"train_loss": 0.00018210260896012187, "global_step": 69698, "epoch": 585, "lr": 1.4195487223188087e-07} +{"train_loss": 0.0001766319473972544, "global_step": 69699, "epoch": 585, "lr": 1.4178809264896452e-07} +{"train_loss": 0.00016326062905136496, "global_step": 69700, "epoch": 585, "lr": 1.4162141095732106e-07} +{"train_loss": 0.00012691866140812635, "global_step": 69701, "epoch": 585, "lr": 1.4145482715727798e-07} +{"train_loss": 0.00027629031683318317, "global_step": 69702, "epoch": 585, "lr": 1.4128834124915724e-07} +{"train_loss": 0.00017339669284410775, "global_step": 69703, "epoch": 585, "lr": 1.4112195323329746e-07} +{"train_loss": 0.0004834462015423924, "global_step": 69704, "epoch": 585, "lr": 1.4095566311000952e-07} +{"train_loss": 0.00013437672168947756, "global_step": 69705, "epoch": 585, "lr": 1.4078947087963756e-07} +{"train_loss": 0.0001868000690592453, "global_step": 69706, "epoch": 585, "lr": 1.4062337654249246e-07} +{"train_loss": 0.00030011445051059127, "global_step": 69707, "epoch": 585, "lr": 1.4045738009891286e-07} +{"train_loss": 0.00046016910346224904, "global_step": 69708, "epoch": 585, "lr": 1.4029148154921512e-07} +{"train_loss": 0.000201290866243653, "global_step": 69709, "epoch": 585, "lr": 1.401256808937268e-07} +{"train_loss": 0.0001957862259587273, "global_step": 69710, "epoch": 585, "lr": 1.399599781327754e-07} +{"train_loss": 0.0002875971549656242, "global_step": 69711, "epoch": 585, "lr": 1.397943732666829e-07} +{"train_loss": 0.0002074318181257695, "global_step": 69712, "epoch": 585, "lr": 1.3962886629578232e-07} +{"train_loss": 0.0003177206963300705, "global_step": 69713, "epoch": 585, "lr": 1.3946345722039567e-07} +{"train_loss": 0.00029222838929854333, "global_step": 69714, "epoch": 585, "lr": 1.3929814604083936e-07} +{"train_loss": 0.00033529807114973664, "global_step": 69715, "epoch": 585, "lr": 1.3913293275744643e-07} +{"train_loss": 0.00018662730872165412, "global_step": 69716, "epoch": 585, "lr": 1.3896781737054444e-07} +{"train_loss": 0.0002831855381373316, "global_step": 69717, "epoch": 585, "lr": 1.388027998804442e-07} +{"train_loss": 0.0003571888373699039, "global_step": 69718, "epoch": 585, "lr": 1.3863788028748437e-07} +{"train_loss": 0.00015966239152476192, "global_step": 69719, "epoch": 585, "lr": 1.3847305859197579e-07} +{"train_loss": 0.0001864098449004814, "global_step": 69720, "epoch": 585, "lr": 1.383083347942571e-07} +{"train_loss": 0.0004320452571846545, "global_step": 69721, "epoch": 585, "lr": 1.3814370889463357e-07} +{"train_loss": 0.00019066609092988074, "global_step": 69722, "epoch": 585, "lr": 1.3797918089344385e-07} +{"train_loss": 0.00023019332729745656, "global_step": 69723, "epoch": 585, "lr": 1.3781475079100438e-07} +{"train_loss": 0.0006093315314501524, "global_step": 69724, "epoch": 585, "lr": 1.3765041858763705e-07} +{"train_loss": 0.00018103423644788563, "global_step": 69725, "epoch": 585, "lr": 1.374861842836639e-07} +{"train_loss": 0.00019887342932634056, "global_step": 69726, "epoch": 585, "lr": 1.373220478794124e-07} +{"train_loss": 0.00021181657211855054, "global_step": 69727, "epoch": 585, "lr": 1.3715800937520452e-07} +{"train_loss": 0.00022448234085459262, "global_step": 69728, "epoch": 585, "lr": 1.3699406877135667e-07} +{"train_loss": 0.00018755423661787063, "global_step": 69729, "epoch": 585, "lr": 1.368302260681964e-07} +{"train_loss": 0.00023519134265370667, "global_step": 69730, "epoch": 585, "lr": 1.366664812660401e-07} +{"train_loss": 0.0002551059296820313, "global_step": 69731, "epoch": 585, "lr": 1.365028343652097e-07} +{"train_loss": 0.0003006933256983757, "global_step": 69732, "epoch": 585, "lr": 1.363392853660328e-07} +{"train_loss": 0.000255224435955106, "global_step": 69733, "epoch": 585, "lr": 1.3617583426882575e-07, "val_loss": 0.030438121408224106, "train_action_mse_error": 3.009522288266453e-06} +{"train_loss": 0.0004953224561177194, "global_step": 69734, "epoch": 586, "lr": 1.3601248107391052e-07} +{"train_loss": 0.00015642827202100307, "global_step": 69735, "epoch": 586, "lr": 1.3584922578160909e-07} +{"train_loss": 0.00025094443117268384, "global_step": 69736, "epoch": 586, "lr": 1.3568606839223785e-07} +{"train_loss": 0.00020048191072419286, "global_step": 69737, "epoch": 586, "lr": 1.355230089061188e-07} +{"train_loss": 0.0002150198124581948, "global_step": 69738, "epoch": 586, "lr": 1.3536004732357942e-07} +{"train_loss": 0.0001893035660032183, "global_step": 69739, "epoch": 586, "lr": 1.3519718364492505e-07} +{"train_loss": 0.0002996157272718847, "global_step": 69740, "epoch": 586, "lr": 1.3503441787048877e-07} +{"train_loss": 0.00017944401770364493, "global_step": 69741, "epoch": 586, "lr": 1.3487175000058693e-07} +{"train_loss": 0.0002862772380467504, "global_step": 69742, "epoch": 586, "lr": 1.3470918003553045e-07} +{"train_loss": 0.00027922220760956407, "global_step": 69743, "epoch": 586, "lr": 1.3454670797565238e-07} +{"train_loss": 0.00014349984121508896, "global_step": 69744, "epoch": 586, "lr": 1.3438433382125804e-07} +{"train_loss": 0.00018636666936799884, "global_step": 69745, "epoch": 586, "lr": 1.3422205757267492e-07} +{"train_loss": 0.00024777287035249174, "global_step": 69746, "epoch": 586, "lr": 1.34059879230225e-07} +{"train_loss": 0.00024184302310459316, "global_step": 69747, "epoch": 586, "lr": 1.338977987942136e-07} +{"train_loss": 0.00016805368068162352, "global_step": 69748, "epoch": 586, "lr": 1.3373581626496823e-07} +{"train_loss": 0.0002100140554830432, "global_step": 69749, "epoch": 586, "lr": 1.335739316428053e-07} +{"train_loss": 0.0002909411850851029, "global_step": 69750, "epoch": 586, "lr": 1.3341214492804677e-07} +{"train_loss": 0.00020927524019498378, "global_step": 69751, "epoch": 586, "lr": 1.3325045612100352e-07} +{"train_loss": 0.00018491395167075098, "global_step": 69752, "epoch": 586, "lr": 1.3308886522199192e-07} +{"train_loss": 0.00026359097682870924, "global_step": 69753, "epoch": 586, "lr": 1.3292737223133956e-07} +{"train_loss": 0.0005576508119702339, "global_step": 69754, "epoch": 586, "lr": 1.327659771493517e-07} +{"train_loss": 0.0003618905902840197, "global_step": 69755, "epoch": 586, "lr": 1.3260467997635028e-07} +{"train_loss": 0.00017854415636975318, "global_step": 69756, "epoch": 586, "lr": 1.324434807126518e-07} +{"train_loss": 0.0002325014938833192, "global_step": 69757, "epoch": 586, "lr": 1.3228237935857813e-07} +{"train_loss": 0.00014913744234945625, "global_step": 69758, "epoch": 586, "lr": 1.3212137591443462e-07} +{"train_loss": 0.00017392184236086905, "global_step": 69759, "epoch": 586, "lr": 1.3196047038054327e-07} +{"train_loss": 0.00021558176376856863, "global_step": 69760, "epoch": 586, "lr": 1.3179966275722598e-07} +{"train_loss": 0.00023576222884003073, "global_step": 69761, "epoch": 586, "lr": 1.3163895304478813e-07} +{"train_loss": 0.00022825358610134572, "global_step": 69762, "epoch": 586, "lr": 1.314783412435461e-07} +{"train_loss": 0.00024120687157846987, "global_step": 69763, "epoch": 586, "lr": 1.313178273538218e-07} +{"train_loss": 0.0002305753732798621, "global_step": 69764, "epoch": 586, "lr": 1.3115741137593175e-07} +{"train_loss": 0.00019494919979479164, "global_step": 69765, "epoch": 586, "lr": 1.3099709331018117e-07} +{"train_loss": 0.00042033090721815825, "global_step": 69766, "epoch": 586, "lr": 1.3083687315689209e-07} +{"train_loss": 0.00021532161918003112, "global_step": 69767, "epoch": 586, "lr": 1.3067675091637532e-07} +{"train_loss": 0.0005467490991577506, "global_step": 69768, "epoch": 586, "lr": 1.3051672658894732e-07} +{"train_loss": 0.0003040194569621235, "global_step": 69769, "epoch": 586, "lr": 1.3035680017492448e-07} +{"train_loss": 0.00012611152487806976, "global_step": 69770, "epoch": 586, "lr": 1.301969716746121e-07} +{"train_loss": 0.00016671961930114776, "global_step": 69771, "epoch": 586, "lr": 1.300372410883377e-07} +{"train_loss": 0.00015242894005496055, "global_step": 69772, "epoch": 586, "lr": 1.2987760841640105e-07} +{"train_loss": 0.0003873599926009774, "global_step": 69773, "epoch": 586, "lr": 1.2971807365912414e-07} +{"train_loss": 0.0002988180494867265, "global_step": 69774, "epoch": 586, "lr": 1.2955863681682334e-07} +{"train_loss": 0.00024428078904747963, "global_step": 69775, "epoch": 586, "lr": 1.2939929788979842e-07} +{"train_loss": 0.00020912877516821027, "global_step": 69776, "epoch": 586, "lr": 1.2924005687837693e-07} +{"train_loss": 0.0001716225960990414, "global_step": 69777, "epoch": 586, "lr": 1.2908091378285857e-07} +{"train_loss": 0.0002849835145752877, "global_step": 69778, "epoch": 586, "lr": 1.2892186860356536e-07} +{"train_loss": 0.0002728583640418947, "global_step": 69779, "epoch": 586, "lr": 1.2876292134080813e-07} +{"train_loss": 0.00024431649944745004, "global_step": 69780, "epoch": 586, "lr": 1.286040719948922e-07} +{"train_loss": 0.0002836048661265522, "global_step": 69781, "epoch": 586, "lr": 1.28445320566134e-07} +{"train_loss": 0.00034434112603776157, "global_step": 69782, "epoch": 586, "lr": 1.2828666705484994e-07} +{"train_loss": 0.00019647236331366003, "global_step": 69783, "epoch": 586, "lr": 1.2812811146134528e-07} +{"train_loss": 0.00020011058950331062, "global_step": 69784, "epoch": 586, "lr": 1.2796965378593097e-07} +{"train_loss": 0.0002926336310338229, "global_step": 69785, "epoch": 586, "lr": 1.2781129402892333e-07} +{"train_loss": 0.00018337256915401667, "global_step": 69786, "epoch": 586, "lr": 1.2765303219062775e-07} +{"train_loss": 0.00019057047029491514, "global_step": 69787, "epoch": 586, "lr": 1.2749486827135504e-07} +{"train_loss": 0.00017567523173056543, "global_step": 69788, "epoch": 586, "lr": 1.2733680227142164e-07} +{"train_loss": 0.00033966239425353706, "global_step": 69789, "epoch": 586, "lr": 1.2717883419113286e-07} +{"train_loss": 0.00012206629617139697, "global_step": 69790, "epoch": 586, "lr": 1.270209640308051e-07} +{"train_loss": 0.00015895566320978105, "global_step": 69791, "epoch": 586, "lr": 1.2686319179073813e-07} +{"train_loss": 0.0002660485915839672, "global_step": 69792, "epoch": 586, "lr": 1.2670551747124836e-07} +{"train_loss": 0.0001852145796874538, "global_step": 69793, "epoch": 586, "lr": 1.2654794107264668e-07} +{"train_loss": 0.00039373995969071984, "global_step": 69794, "epoch": 586, "lr": 1.263904625952328e-07} +{"train_loss": 0.00015566307411063462, "global_step": 69795, "epoch": 586, "lr": 1.2623308203932871e-07} +{"train_loss": 0.00037935833097435534, "global_step": 69796, "epoch": 586, "lr": 1.2607579940523973e-07} +{"train_loss": 0.0002833908365573734, "global_step": 69797, "epoch": 586, "lr": 1.2591861469327114e-07} +{"train_loss": 0.0001389000826748088, "global_step": 69798, "epoch": 586, "lr": 1.257615279037283e-07} +{"train_loss": 0.00013985816622152925, "global_step": 69799, "epoch": 586, "lr": 1.2560453903692758e-07} +{"train_loss": 0.00025078083854168653, "global_step": 69800, "epoch": 586, "lr": 1.2544764809317433e-07} +{"train_loss": 0.00035507799475453794, "global_step": 69801, "epoch": 586, "lr": 1.2529085507277938e-07} +{"train_loss": 0.00028783577727153897, "global_step": 69802, "epoch": 586, "lr": 1.251341599760425e-07} +{"train_loss": 0.00019001876353286207, "global_step": 69803, "epoch": 586, "lr": 1.249775628032801e-07} +{"train_loss": 0.0001861308846855536, "global_step": 69804, "epoch": 586, "lr": 1.2482106355479196e-07} +{"train_loss": 0.00017984544683713466, "global_step": 69805, "epoch": 586, "lr": 1.246646622308889e-07} +{"train_loss": 0.00040276715299114585, "global_step": 69806, "epoch": 586, "lr": 1.2450835883188182e-07} +{"train_loss": 0.0004316168779041618, "global_step": 69807, "epoch": 586, "lr": 1.2435215335807603e-07} +{"train_loss": 0.00030452327337116003, "global_step": 69808, "epoch": 586, "lr": 1.241960458097713e-07} +{"train_loss": 0.0005537696415558457, "global_step": 69809, "epoch": 586, "lr": 1.24040036187284e-07} +{"train_loss": 0.00018475032993592322, "global_step": 69810, "epoch": 586, "lr": 1.238841244909139e-07} +{"train_loss": 0.0003229253343306482, "global_step": 69811, "epoch": 586, "lr": 1.2372831072096635e-07} +{"train_loss": 0.00016840655007399619, "global_step": 69812, "epoch": 586, "lr": 1.2357259487775219e-07} +{"train_loss": 0.00017589607159607112, "global_step": 69813, "epoch": 586, "lr": 1.2341697696157117e-07} +{"train_loss": 0.00022377051936928183, "global_step": 69814, "epoch": 586, "lr": 1.2326145697273972e-07} +{"train_loss": 0.00018307128630112857, "global_step": 69815, "epoch": 586, "lr": 1.2310603491155204e-07} +{"train_loss": 0.0003173012228216976, "global_step": 69816, "epoch": 586, "lr": 1.2295071077831344e-07} +{"train_loss": 0.0011438499204814434, "global_step": 69817, "epoch": 586, "lr": 1.2279548457333478e-07} +{"train_loss": 0.0003214566968381405, "global_step": 69818, "epoch": 586, "lr": 1.2264035629692138e-07} +{"train_loss": 0.00031834442052058876, "global_step": 69819, "epoch": 586, "lr": 1.2248532594937302e-07} +{"train_loss": 0.00042229017708450556, "global_step": 69820, "epoch": 586, "lr": 1.2233039353099496e-07} +{"train_loss": 0.00017406010010745376, "global_step": 69821, "epoch": 586, "lr": 1.2217555904209254e-07} +{"train_loss": 0.00016526527178939432, "global_step": 69822, "epoch": 586, "lr": 1.2202082248297109e-07} +{"train_loss": 0.00018461418221704662, "global_step": 69823, "epoch": 586, "lr": 1.2186618385393588e-07} +{"train_loss": 0.0002843709662556648, "global_step": 69824, "epoch": 586, "lr": 1.2171164315528115e-07} +{"train_loss": 0.0001809722452890128, "global_step": 69825, "epoch": 586, "lr": 1.2155720038732333e-07} +{"train_loss": 0.00016420871543232352, "global_step": 69826, "epoch": 586, "lr": 1.2140285555035658e-07} +{"train_loss": 0.0002444243000354618, "global_step": 69827, "epoch": 586, "lr": 1.2124860864468624e-07} +{"train_loss": 0.0001710867218207568, "global_step": 69828, "epoch": 586, "lr": 1.2109445967061206e-07} +{"train_loss": 0.00023677796707488596, "global_step": 69829, "epoch": 586, "lr": 1.2094040862844492e-07} +{"train_loss": 0.0002845056005753577, "global_step": 69830, "epoch": 586, "lr": 1.2078645551848455e-07} +{"train_loss": 0.00018913947860710323, "global_step": 69831, "epoch": 586, "lr": 1.206326003410252e-07} +{"train_loss": 0.0001718479470582679, "global_step": 69832, "epoch": 586, "lr": 1.204788430963777e-07} +{"train_loss": 0.00019289387273602188, "global_step": 69833, "epoch": 586, "lr": 1.2032518378484182e-07} +{"train_loss": 0.0002545391325838864, "global_step": 69834, "epoch": 586, "lr": 1.201716224067173e-07} +{"train_loss": 0.0004462717042770237, "global_step": 69835, "epoch": 586, "lr": 1.2001815896230394e-07} +{"train_loss": 0.0002162924938602373, "global_step": 69836, "epoch": 586, "lr": 1.198647934519126e-07} +{"train_loss": 0.0002411074674455449, "global_step": 69837, "epoch": 586, "lr": 1.1971152587583189e-07} +{"train_loss": 0.00021898755221627653, "global_step": 69838, "epoch": 586, "lr": 1.1955835623437273e-07} +{"train_loss": 0.00016237300587818027, "global_step": 69839, "epoch": 586, "lr": 1.1940528452783483e-07} +{"train_loss": 0.0002855011261999607, "global_step": 69840, "epoch": 586, "lr": 1.1925231075650688e-07} +{"train_loss": 0.0001829855318646878, "global_step": 69841, "epoch": 586, "lr": 1.190994349207053e-07} +{"train_loss": 0.00019264404545538127, "global_step": 69842, "epoch": 586, "lr": 1.1894665702071872e-07} +{"train_loss": 0.00016550446162000299, "global_step": 69843, "epoch": 586, "lr": 1.1879397705685246e-07} +{"train_loss": 0.00014897427172400057, "global_step": 69844, "epoch": 586, "lr": 1.186413950294063e-07} +{"train_loss": 0.0003109157260041684, "global_step": 69845, "epoch": 586, "lr": 1.1848891093867998e-07} +{"train_loss": 0.00028489084797911346, "global_step": 69846, "epoch": 586, "lr": 1.1833652478496771e-07} +{"train_loss": 0.0002782472292892635, "global_step": 69847, "epoch": 586, "lr": 1.181842365685748e-07} +{"train_loss": 0.00014647209900431335, "global_step": 69848, "epoch": 586, "lr": 1.1803204628980102e-07} +{"train_loss": 0.0001716799451969564, "global_step": 69849, "epoch": 586, "lr": 1.1787995394893503e-07} +{"train_loss": 0.0001519247016403824, "global_step": 69850, "epoch": 586, "lr": 1.1772795954628768e-07} +{"train_loss": 0.00020821559883188456, "global_step": 69851, "epoch": 586, "lr": 1.1757606308215319e-07} +{"train_loss": 0.0002516271872250285, "global_step": 69852, "epoch": 586, "lr": 1.1742426455682576e-07, "val_loss": 0.04451392590999603} +{"train_loss": 0.00018824431754183024, "global_step": 69853, "epoch": 587, "lr": 1.1727256397061071e-07} +{"train_loss": 0.00013818623847328126, "global_step": 69854, "epoch": 587, "lr": 1.1712096132379669e-07} +{"train_loss": 0.00024407042656093836, "global_step": 69855, "epoch": 587, "lr": 1.1696945661668901e-07} +{"train_loss": 0.00035191202186979353, "global_step": 69856, "epoch": 587, "lr": 1.168180498495819e-07} +{"train_loss": 0.00037050675018690526, "global_step": 69857, "epoch": 587, "lr": 1.1666674102277508e-07} +{"train_loss": 0.0004106929409317672, "global_step": 69858, "epoch": 587, "lr": 1.165155301365628e-07} +{"train_loss": 0.0001471525029046461, "global_step": 69859, "epoch": 587, "lr": 1.1636441719123925e-07} +{"train_loss": 0.00020406508701853454, "global_step": 69860, "epoch": 587, "lr": 1.1621340218710975e-07} +{"train_loss": 0.00018783746054396033, "global_step": 69861, "epoch": 587, "lr": 1.1606248512446848e-07} +{"train_loss": 0.0001819457538658753, "global_step": 69862, "epoch": 587, "lr": 1.1591166600360414e-07} +{"train_loss": 0.00034212361788377166, "global_step": 69863, "epoch": 587, "lr": 1.1576094482481647e-07} +{"train_loss": 0.00022062970674596727, "global_step": 69864, "epoch": 587, "lr": 1.1561032158840524e-07} +{"train_loss": 0.0002444996207486838, "global_step": 69865, "epoch": 587, "lr": 1.1545979629466463e-07} +{"train_loss": 0.00031077125458978117, "global_step": 69866, "epoch": 587, "lr": 1.1530936894388889e-07} +{"train_loss": 0.0002570454671513289, "global_step": 69867, "epoch": 587, "lr": 1.151590395363722e-07} +{"train_loss": 0.00016178730584215373, "global_step": 69868, "epoch": 587, "lr": 1.1500880807241432e-07} +{"train_loss": 0.0002551780780777335, "global_step": 69869, "epoch": 587, "lr": 1.1485867455230392e-07} +{"train_loss": 0.00020895147463306785, "global_step": 69870, "epoch": 587, "lr": 1.1470863897634077e-07} +{"train_loss": 0.00018415988597553223, "global_step": 69871, "epoch": 587, "lr": 1.1455870134481905e-07} +{"train_loss": 0.00021306498092599213, "global_step": 69872, "epoch": 587, "lr": 1.1440886165803299e-07} +{"train_loss": 0.00027739573852159083, "global_step": 69873, "epoch": 587, "lr": 1.1425911991627125e-07} +{"train_loss": 0.0002634220873005688, "global_step": 69874, "epoch": 587, "lr": 1.1410947611983358e-07} +{"train_loss": 0.00028331272187642753, "global_step": 69875, "epoch": 587, "lr": 1.1395993026901419e-07} +{"train_loss": 0.00024278195633087307, "global_step": 69876, "epoch": 587, "lr": 1.1381048236410174e-07} +{"train_loss": 0.00012166219676146284, "global_step": 69877, "epoch": 587, "lr": 1.13661132405396e-07} +{"train_loss": 0.0004281196161173284, "global_step": 69878, "epoch": 587, "lr": 1.135118803931856e-07} +{"train_loss": 0.00021028469200246036, "global_step": 69879, "epoch": 587, "lr": 1.1336272632777034e-07} +{"train_loss": 0.00034167603007517755, "global_step": 69880, "epoch": 587, "lr": 1.1321367020942775e-07} +{"train_loss": 0.0003518804151099175, "global_step": 69881, "epoch": 587, "lr": 1.1306471203846869e-07} +{"train_loss": 0.0002195337729062885, "global_step": 69882, "epoch": 587, "lr": 1.1291585181517072e-07} +{"train_loss": 0.0001537949574412778, "global_step": 69883, "epoch": 587, "lr": 1.1276708953983916e-07} +{"train_loss": 0.00019936451280955225, "global_step": 69884, "epoch": 587, "lr": 1.1261842521275712e-07} +{"train_loss": 0.0002447996521368623, "global_step": 69885, "epoch": 587, "lr": 1.1246985883421878e-07} +{"train_loss": 0.00012816785601899028, "global_step": 69886, "epoch": 587, "lr": 1.1232139040451839e-07} +{"train_loss": 0.00028764104354195297, "global_step": 69887, "epoch": 587, "lr": 1.1217301992394458e-07} +{"train_loss": 0.0002548707998357713, "global_step": 69888, "epoch": 587, "lr": 1.1202474739278601e-07} +{"train_loss": 0.00028410361846908927, "global_step": 69889, "epoch": 587, "lr": 1.118765728113369e-07} +{"train_loss": 0.00045212465920485556, "global_step": 69890, "epoch": 587, "lr": 1.1172849617989145e-07} +{"train_loss": 0.0002520903944969177, "global_step": 69891, "epoch": 587, "lr": 1.1158051749873833e-07} +{"train_loss": 0.0002833929902408272, "global_step": 69892, "epoch": 587, "lr": 1.1143263676816618e-07} +{"train_loss": 0.00019683911523316056, "global_step": 69893, "epoch": 587, "lr": 1.1128485398846367e-07} +{"train_loss": 0.0002166165941162035, "global_step": 69894, "epoch": 587, "lr": 1.11137169159925e-07} +{"train_loss": 0.00044553252519108355, "global_step": 69895, "epoch": 587, "lr": 1.1098958228283884e-07} +{"train_loss": 0.0002229235105914995, "global_step": 69896, "epoch": 587, "lr": 1.1084209335749384e-07} +{"train_loss": 0.00014067078882362694, "global_step": 69897, "epoch": 587, "lr": 1.1069470238418422e-07} +{"train_loss": 0.00016564916586503386, "global_step": 69898, "epoch": 587, "lr": 1.1054740936319308e-07} +{"train_loss": 0.00024852558271959424, "global_step": 69899, "epoch": 587, "lr": 1.1040021429480907e-07} +{"train_loss": 0.0001581874385010451, "global_step": 69900, "epoch": 587, "lr": 1.102531171793264e-07} +{"train_loss": 0.00022212910698726773, "global_step": 69901, "epoch": 587, "lr": 1.1010611801703374e-07} +{"train_loss": 0.0002432923938613385, "global_step": 69902, "epoch": 587, "lr": 1.0995921680821974e-07} +{"train_loss": 0.00021712204033974558, "global_step": 69903, "epoch": 587, "lr": 1.0981241355316751e-07} +{"train_loss": 0.00014739713515155017, "global_step": 69904, "epoch": 587, "lr": 1.0966570825216572e-07} +{"train_loss": 0.00025172432651743293, "global_step": 69905, "epoch": 587, "lr": 1.0951910090550854e-07} +{"train_loss": 0.0002681358892004937, "global_step": 69906, "epoch": 587, "lr": 1.0937259151347912e-07} +{"train_loss": 0.00019210924801882356, "global_step": 69907, "epoch": 587, "lr": 1.0922618007637165e-07} +{"train_loss": 0.0001808846864150837, "global_step": 69908, "epoch": 587, "lr": 1.0907986659446368e-07} +{"train_loss": 0.0001645999145694077, "global_step": 69909, "epoch": 587, "lr": 1.0893365106804943e-07} +{"train_loss": 0.0003760622930712998, "global_step": 69910, "epoch": 587, "lr": 1.0878753349741199e-07} +{"train_loss": 0.00035219016717746854, "global_step": 69911, "epoch": 587, "lr": 1.0864151388284006e-07} +{"train_loss": 0.00030377134680747986, "global_step": 69912, "epoch": 587, "lr": 1.0849559222462224e-07} +{"train_loss": 0.00039991040830500424, "global_step": 69913, "epoch": 587, "lr": 1.0834976852304169e-07} +{"train_loss": 0.0002881895925384015, "global_step": 69914, "epoch": 587, "lr": 1.0820404277838703e-07} +{"train_loss": 0.0002345887041883543, "global_step": 69915, "epoch": 587, "lr": 1.0805841499094694e-07} +{"train_loss": 0.00023758811585139483, "global_step": 69916, "epoch": 587, "lr": 1.0791288516099895e-07} +{"train_loss": 0.00044946500565856695, "global_step": 69917, "epoch": 587, "lr": 1.0776745328883731e-07} +{"train_loss": 0.0004798217269126326, "global_step": 69918, "epoch": 587, "lr": 1.0762211937473954e-07} +{"train_loss": 0.00032220929278992116, "global_step": 69919, "epoch": 587, "lr": 1.0747688341899986e-07} +{"train_loss": 0.00034490268444642425, "global_step": 69920, "epoch": 587, "lr": 1.0733174542189583e-07} +{"train_loss": 0.00024841289268806577, "global_step": 69921, "epoch": 587, "lr": 1.0718670538371611e-07} +{"train_loss": 0.00018167585949413478, "global_step": 69922, "epoch": 587, "lr": 1.0704176330474935e-07} +{"train_loss": 0.00029348317184485495, "global_step": 69923, "epoch": 587, "lr": 1.0689691918527311e-07} +{"train_loss": 0.00012743192201014608, "global_step": 69924, "epoch": 587, "lr": 1.0675217302557605e-07} +{"train_loss": 0.00019729977066162974, "global_step": 69925, "epoch": 587, "lr": 1.0660752482593572e-07} +{"train_loss": 0.00016149562725331634, "global_step": 69926, "epoch": 587, "lr": 1.0646297458664634e-07} +{"train_loss": 0.00025555139291100204, "global_step": 69927, "epoch": 587, "lr": 1.063185223079799e-07} +{"train_loss": 0.0003356053784955293, "global_step": 69928, "epoch": 587, "lr": 1.0617416799023617e-07} +{"train_loss": 0.00022522755898535252, "global_step": 69929, "epoch": 587, "lr": 1.0602991163368159e-07} +{"train_loss": 0.0001939907087944448, "global_step": 69930, "epoch": 587, "lr": 1.0588575323861039e-07} +{"train_loss": 0.00015300522500183433, "global_step": 69931, "epoch": 587, "lr": 1.0574169280530011e-07} +{"train_loss": 0.0003410150238778442, "global_step": 69932, "epoch": 587, "lr": 1.0559773033403941e-07} +{"train_loss": 0.0003445793699938804, "global_step": 69933, "epoch": 587, "lr": 1.0545386582510031e-07} +{"train_loss": 0.0001907705736812204, "global_step": 69934, "epoch": 587, "lr": 1.05310099278777e-07} +{"train_loss": 0.00016898420290090144, "global_step": 69935, "epoch": 587, "lr": 1.0516643069534704e-07} +{"train_loss": 0.0002281167107867077, "global_step": 69936, "epoch": 587, "lr": 1.0502286007509354e-07} +{"train_loss": 0.0005043827113695443, "global_step": 69937, "epoch": 587, "lr": 1.0487938741829406e-07} +{"train_loss": 0.00011736351007129997, "global_step": 69938, "epoch": 587, "lr": 1.047360127252317e-07} +{"train_loss": 0.00016326601325999945, "global_step": 69939, "epoch": 587, "lr": 1.0459273599619513e-07} +{"train_loss": 0.00013965937250759453, "global_step": 69940, "epoch": 587, "lr": 1.0444955723145633e-07} +{"train_loss": 0.0002144108002539724, "global_step": 69941, "epoch": 587, "lr": 1.0430647643130398e-07} +{"train_loss": 0.00018029251077678055, "global_step": 69942, "epoch": 587, "lr": 1.0416349359601008e-07} +{"train_loss": 0.00032092619221657515, "global_step": 69943, "epoch": 587, "lr": 1.0402060872586328e-07} +{"train_loss": 0.00030498692649416625, "global_step": 69944, "epoch": 587, "lr": 1.0387782182114115e-07} +{"train_loss": 0.0003509608213789761, "global_step": 69945, "epoch": 587, "lr": 1.0373513288212122e-07} +{"train_loss": 0.0004891409771516919, "global_step": 69946, "epoch": 587, "lr": 1.0359254190909218e-07} +{"train_loss": 0.000263852154603228, "global_step": 69947, "epoch": 587, "lr": 1.0345004890232602e-07} +{"train_loss": 0.0001814843126339838, "global_step": 69948, "epoch": 587, "lr": 1.0330765386210583e-07} +{"train_loss": 0.000262915127677843, "global_step": 69949, "epoch": 587, "lr": 1.031653567887092e-07} +{"train_loss": 0.00027079685241915286, "global_step": 69950, "epoch": 587, "lr": 1.0302315768241921e-07} +{"train_loss": 0.00021330993331503123, "global_step": 69951, "epoch": 587, "lr": 1.0288105654350789e-07} +{"train_loss": 0.0002063424908556044, "global_step": 69952, "epoch": 587, "lr": 1.0273905337226386e-07} +{"train_loss": 0.00017441353702452034, "global_step": 69953, "epoch": 587, "lr": 1.0259714816895915e-07} +{"train_loss": 0.00032177503453567624, "global_step": 69954, "epoch": 587, "lr": 1.0245534093387132e-07} +{"train_loss": 0.0002564415626693517, "global_step": 69955, "epoch": 587, "lr": 1.0231363166728347e-07} +{"train_loss": 0.0001777224097168073, "global_step": 69956, "epoch": 587, "lr": 1.0217202036947315e-07} +{"train_loss": 0.0005508766043931246, "global_step": 69957, "epoch": 587, "lr": 1.0203050704071793e-07} +{"train_loss": 0.00022862506739329547, "global_step": 69958, "epoch": 587, "lr": 1.0188909168129534e-07} +{"train_loss": 0.00015354070637840778, "global_step": 69959, "epoch": 587, "lr": 1.0174777429148297e-07} +{"train_loss": 0.0002113834925694391, "global_step": 69960, "epoch": 587, "lr": 1.0160655487155279e-07} +{"train_loss": 0.00027526463964022696, "global_step": 69961, "epoch": 587, "lr": 1.0146543342179349e-07} +{"train_loss": 0.0005754901212640107, "global_step": 69962, "epoch": 587, "lr": 1.013244099424715e-07} +{"train_loss": 0.0004352008400019258, "global_step": 69963, "epoch": 587, "lr": 1.0118348443386994e-07} +{"train_loss": 0.000258691085036844, "global_step": 69964, "epoch": 587, "lr": 1.010426568962608e-07} +{"train_loss": 0.00013166246935725212, "global_step": 69965, "epoch": 587, "lr": 1.0090192732992721e-07} +{"train_loss": 0.0002697525778785348, "global_step": 69966, "epoch": 587, "lr": 1.0076129573514115e-07} +{"train_loss": 0.00028860336169600487, "global_step": 69967, "epoch": 587, "lr": 1.0062076211218019e-07} +{"train_loss": 0.00022808769426774234, "global_step": 69968, "epoch": 587, "lr": 1.0048032646131633e-07} +{"train_loss": 0.00022998747590463609, "global_step": 69969, "epoch": 587, "lr": 1.0033998878283269e-07} +{"train_loss": 0.00028340728022158146, "global_step": 69970, "epoch": 587, "lr": 1.0019974907699569e-07} +{"train_loss": 0.0002578430173320876, "global_step": 69971, "epoch": 587, "lr": 1.0005960734408847e-07, "val_loss": 0.023146122694015503} +{"train_loss": 0.00022438602172769606, "global_step": 69972, "epoch": 588, "lr": 9.991956358438304e-08} +{"train_loss": 0.00016017536108847708, "global_step": 69973, "epoch": 588, "lr": 9.977961779815138e-08} +{"train_loss": 0.00033657619496807456, "global_step": 69974, "epoch": 588, "lr": 9.963976998567659e-08} +{"train_loss": 0.0003196122997906059, "global_step": 69975, "epoch": 588, "lr": 9.950002014722514e-08} +{"train_loss": 0.0002645867061801255, "global_step": 69976, "epoch": 588, "lr": 9.93603682830746e-08} +{"train_loss": 0.00013042075443081558, "global_step": 69977, "epoch": 588, "lr": 9.922081439350251e-08} +{"train_loss": 0.0002352638985030353, "global_step": 69978, "epoch": 588, "lr": 9.908135847877532e-08} +{"train_loss": 0.0002902922569774091, "global_step": 69979, "epoch": 588, "lr": 9.894200053917058e-08} +{"train_loss": 0.00018261205696035177, "global_step": 69980, "epoch": 588, "lr": 9.880274057496031e-08} +{"train_loss": 0.0002203128969995305, "global_step": 69981, "epoch": 588, "lr": 9.866357858642205e-08} +{"train_loss": 0.0001729523646645248, "global_step": 69982, "epoch": 588, "lr": 9.852451457382783e-08} +{"train_loss": 0.0001545078121125698, "global_step": 69983, "epoch": 588, "lr": 9.838554853744964e-08} +{"train_loss": 0.00021772914624307305, "global_step": 69984, "epoch": 588, "lr": 9.824668047755948e-08} +{"train_loss": 0.0003045009507331997, "global_step": 69985, "epoch": 588, "lr": 9.810791039442935e-08} +{"train_loss": 0.00016308805788867176, "global_step": 69986, "epoch": 588, "lr": 9.796923828833127e-08} +{"train_loss": 0.00016151173622347414, "global_step": 69987, "epoch": 588, "lr": 9.783066415954278e-08} +{"train_loss": 0.0006297603249549866, "global_step": 69988, "epoch": 588, "lr": 9.769218800833035e-08} +{"train_loss": 0.00015470180369447917, "global_step": 69989, "epoch": 588, "lr": 9.755380983497154e-08} +{"train_loss": 0.0002680141478776932, "global_step": 69990, "epoch": 588, "lr": 9.741552963973277e-08} +{"train_loss": 0.00030773598700761795, "global_step": 69991, "epoch": 588, "lr": 9.727734742288608e-08} +{"train_loss": 0.00019684714789036661, "global_step": 69992, "epoch": 588, "lr": 9.713926318470346e-08} +{"train_loss": 0.00026674263062886894, "global_step": 69993, "epoch": 588, "lr": 9.700127692546246e-08} +{"train_loss": 0.00017369749548379332, "global_step": 69994, "epoch": 588, "lr": 9.686338864541844e-08} +{"train_loss": 0.0001538581564091146, "global_step": 69995, "epoch": 588, "lr": 9.672559834486005e-08} +{"train_loss": 0.00022934313165023923, "global_step": 69996, "epoch": 588, "lr": 9.658790602404267e-08} +{"train_loss": 0.0003156191378366202, "global_step": 69997, "epoch": 588, "lr": 9.645031168324936e-08} +{"train_loss": 0.0002147204359062016, "global_step": 69998, "epoch": 588, "lr": 9.631281532274106e-08} +{"train_loss": 0.00039144247421063483, "global_step": 69999, "epoch": 588, "lr": 9.61754169427953e-08} +{"train_loss": 0.0001812699920265004, "global_step": 70000, "epoch": 588, "lr": 9.603811654367301e-08} +{"train_loss": 0.00014726430526934564, "global_step": 70001, "epoch": 588, "lr": 9.590091412565172e-08} +{"train_loss": 0.0002044548891717568, "global_step": 70002, "epoch": 588, "lr": 9.57638096889979e-08} +{"train_loss": 0.00022590960725210607, "global_step": 70003, "epoch": 588, "lr": 9.562680323397799e-08} +{"train_loss": 0.00016028317622840405, "global_step": 70004, "epoch": 588, "lr": 9.548989476086401e-08} +{"train_loss": 0.0002348512934986502, "global_step": 70005, "epoch": 588, "lr": 9.53530842699224e-08} +{"train_loss": 0.0002921194536611438, "global_step": 70006, "epoch": 588, "lr": 9.521637176142517e-08} +{"train_loss": 0.00015981419710442424, "global_step": 70007, "epoch": 588, "lr": 9.507975723563878e-08} +{"train_loss": 0.00023999108816497028, "global_step": 70008, "epoch": 588, "lr": 9.494324069282968e-08} +{"train_loss": 0.0002507682656869292, "global_step": 70009, "epoch": 588, "lr": 9.480682213326986e-08} +{"train_loss": 0.0001684764283709228, "global_step": 70010, "epoch": 588, "lr": 9.467050155723134e-08} +{"train_loss": 0.00016742294246796519, "global_step": 70011, "epoch": 588, "lr": 9.453427896496392e-08} +{"train_loss": 0.00013954572204966098, "global_step": 70012, "epoch": 588, "lr": 9.439815435675625e-08} +{"train_loss": 0.00011866776185343042, "global_step": 70013, "epoch": 588, "lr": 9.426212773286369e-08} +{"train_loss": 0.00024476071121171117, "global_step": 70014, "epoch": 588, "lr": 9.41261990935527e-08} +{"train_loss": 0.00016376598796341568, "global_step": 70015, "epoch": 588, "lr": 9.399036843909526e-08} +{"train_loss": 0.00028767550247721374, "global_step": 70016, "epoch": 588, "lr": 9.385463576975784e-08} +{"train_loss": 0.00020927577861584723, "global_step": 70017, "epoch": 588, "lr": 9.371900108580134e-08} +{"train_loss": 0.00024509208742529154, "global_step": 70018, "epoch": 588, "lr": 9.358346438749776e-08} +{"train_loss": 0.00013409694656729698, "global_step": 70019, "epoch": 588, "lr": 9.344802567511357e-08} +{"train_loss": 0.00019724782032426447, "global_step": 70020, "epoch": 588, "lr": 9.331268494890965e-08} +{"train_loss": 0.00011658090079436079, "global_step": 70021, "epoch": 588, "lr": 9.317744220915803e-08} +{"train_loss": 0.0002867161820176989, "global_step": 70022, "epoch": 588, "lr": 9.304229745611959e-08} +{"train_loss": 0.00019258417887613177, "global_step": 70023, "epoch": 588, "lr": 9.290725069005524e-08} +{"train_loss": 0.0002548708289396018, "global_step": 70024, "epoch": 588, "lr": 9.277230191124253e-08} +{"train_loss": 0.00022531254217028618, "global_step": 70025, "epoch": 588, "lr": 9.263745111993683e-08} +{"train_loss": 0.00038904810207895935, "global_step": 70026, "epoch": 588, "lr": 9.250269831640457e-08} +{"train_loss": 0.0002532784710638225, "global_step": 70027, "epoch": 588, "lr": 9.236804350091221e-08} +{"train_loss": 0.0002251158148283139, "global_step": 70028, "epoch": 588, "lr": 9.223348667372623e-08} +{"train_loss": 0.00038512476021423936, "global_step": 70029, "epoch": 588, "lr": 9.209902783510193e-08} +{"train_loss": 0.0001657649117987603, "global_step": 70030, "epoch": 588, "lr": 9.196466698531692e-08} +{"train_loss": 0.00020108917669858783, "global_step": 70031, "epoch": 588, "lr": 9.183040412462096e-08} +{"train_loss": 0.00015829922631382942, "global_step": 70032, "epoch": 588, "lr": 9.169623925328607e-08} +{"train_loss": 0.00017534945800434798, "global_step": 70033, "epoch": 588, "lr": 9.156217237157317e-08} +{"train_loss": 0.00017407204722985625, "global_step": 70034, "epoch": 588, "lr": 9.142820347974867e-08} +{"train_loss": 0.0003183883964084089, "global_step": 70035, "epoch": 588, "lr": 9.129433257807351e-08} +{"train_loss": 0.00039383803959935904, "global_step": 70036, "epoch": 588, "lr": 9.116055966680303e-08} +{"train_loss": 0.00012585415970534086, "global_step": 70037, "epoch": 588, "lr": 9.102688474621479e-08} +{"train_loss": 0.0002642328036017716, "global_step": 70038, "epoch": 588, "lr": 9.089330781655858e-08} +{"train_loss": 0.00019129236170556396, "global_step": 70039, "epoch": 588, "lr": 9.075982887810086e-08} +{"train_loss": 0.00025359619758091867, "global_step": 70040, "epoch": 588, "lr": 9.062644793110809e-08} +{"train_loss": 0.0007540643564425409, "global_step": 70041, "epoch": 588, "lr": 9.04931649758356e-08} +{"train_loss": 0.00014656859275419265, "global_step": 70042, "epoch": 588, "lr": 9.035998001254986e-08} +{"train_loss": 0.00039887113962322474, "global_step": 70043, "epoch": 588, "lr": 9.022689304151177e-08} +{"train_loss": 0.00012858177069574594, "global_step": 70044, "epoch": 588, "lr": 9.009390406297668e-08} +{"train_loss": 0.00015332135080825537, "global_step": 70045, "epoch": 588, "lr": 8.996101307721105e-08} +{"train_loss": 0.00013380257587414235, "global_step": 70046, "epoch": 588, "lr": 8.982822008447578e-08} +{"train_loss": 0.0002011375327128917, "global_step": 70047, "epoch": 588, "lr": 8.969552508503177e-08} +{"train_loss": 0.00031943427165970206, "global_step": 70048, "epoch": 588, "lr": 8.956292807913435e-08} +{"train_loss": 0.00013775535626336932, "global_step": 70049, "epoch": 588, "lr": 8.943042906705001e-08} +{"train_loss": 0.00021186581579968333, "global_step": 70050, "epoch": 588, "lr": 8.929802804903964e-08} +{"train_loss": 0.00016588036669418216, "global_step": 70051, "epoch": 588, "lr": 8.916572502535858e-08} +{"train_loss": 0.00022937814355827868, "global_step": 70052, "epoch": 588, "lr": 8.903351999626774e-08} +{"train_loss": 0.00029516653739847243, "global_step": 70053, "epoch": 588, "lr": 8.890141296202803e-08} +{"train_loss": 0.00018746651767287403, "global_step": 70054, "epoch": 588, "lr": 8.876940392289479e-08} +{"train_loss": 0.0002163830940844491, "global_step": 70055, "epoch": 588, "lr": 8.863749287913448e-08} +{"train_loss": 0.00019243585120420903, "global_step": 70056, "epoch": 588, "lr": 8.850567983100244e-08} +{"train_loss": 0.00020300694450270385, "global_step": 70057, "epoch": 588, "lr": 8.837396477875404e-08} +{"train_loss": 0.00025828875368461013, "global_step": 70058, "epoch": 588, "lr": 8.824234772265572e-08} +{"train_loss": 0.00020101090194657445, "global_step": 70059, "epoch": 588, "lr": 8.811082866295728e-08} +{"train_loss": 0.0002642346662469208, "global_step": 70060, "epoch": 588, "lr": 8.797940759992518e-08} +{"train_loss": 0.00029529730090871453, "global_step": 70061, "epoch": 588, "lr": 8.784808453380921e-08} +{"train_loss": 0.00016846047947183251, "global_step": 70062, "epoch": 588, "lr": 8.77168594648703e-08} +{"train_loss": 0.0002871212491299957, "global_step": 70063, "epoch": 588, "lr": 8.758573239336931e-08} +{"train_loss": 0.000223158102016896, "global_step": 70064, "epoch": 588, "lr": 8.745470331956162e-08} +{"train_loss": 0.00020379737543407828, "global_step": 70065, "epoch": 588, "lr": 8.732377224370259e-08} +{"train_loss": 0.0002246885997010395, "global_step": 70066, "epoch": 588, "lr": 8.719293916605309e-08} +{"train_loss": 0.00031255008070729673, "global_step": 70067, "epoch": 588, "lr": 8.70622040868685e-08} +{"train_loss": 0.00020936505461577326, "global_step": 70068, "epoch": 588, "lr": 8.693156700640414e-08} +{"train_loss": 0.00020945003780070692, "global_step": 70069, "epoch": 588, "lr": 8.68010279249154e-08} +{"train_loss": 0.00023015818442218006, "global_step": 70070, "epoch": 588, "lr": 8.667058684266316e-08} +{"train_loss": 0.00027421105187386274, "global_step": 70071, "epoch": 588, "lr": 8.654024375989723e-08} +{"train_loss": 0.0002814017643686384, "global_step": 70072, "epoch": 588, "lr": 8.640999867687849e-08} +{"train_loss": 0.00017563601431902498, "global_step": 70073, "epoch": 588, "lr": 8.627985159386232e-08} +{"train_loss": 0.00023274897830560803, "global_step": 70074, "epoch": 588, "lr": 8.614980251110404e-08} +{"train_loss": 0.0003141531196888536, "global_step": 70075, "epoch": 588, "lr": 8.60198514288535e-08} +{"train_loss": 0.00025473511777818203, "global_step": 70076, "epoch": 588, "lr": 8.58899983473771e-08} +{"train_loss": 0.00016090035205706954, "global_step": 70077, "epoch": 588, "lr": 8.576024326691912e-08} +{"train_loss": 0.000208866607863456, "global_step": 70078, "epoch": 588, "lr": 8.56305861877349e-08} +{"train_loss": 0.00011982061550952494, "global_step": 70079, "epoch": 588, "lr": 8.55010271100909e-08} +{"train_loss": 0.0002740452764555812, "global_step": 70080, "epoch": 588, "lr": 8.53715660342258e-08} +{"train_loss": 0.00019553604943212122, "global_step": 70081, "epoch": 588, "lr": 8.524220296040608e-08} +{"train_loss": 0.0001573992776684463, "global_step": 70082, "epoch": 588, "lr": 8.511293788887598e-08} +{"train_loss": 0.00016338095883838832, "global_step": 70083, "epoch": 588, "lr": 8.49837708198964e-08} +{"train_loss": 0.00041663096635602415, "global_step": 70084, "epoch": 588, "lr": 8.485470175372267e-08} +{"train_loss": 0.0001977571373572573, "global_step": 70085, "epoch": 588, "lr": 8.472573069059908e-08} +{"train_loss": 0.0002479394606780261, "global_step": 70086, "epoch": 588, "lr": 8.459685763078096e-08} +{"train_loss": 0.0002722283243201673, "global_step": 70087, "epoch": 588, "lr": 8.44680825745292e-08} +{"train_loss": 0.000295934674795717, "global_step": 70088, "epoch": 588, "lr": 8.433940552209362e-08} +{"train_loss": 0.00022296287352219224, "global_step": 70089, "epoch": 588, "lr": 8.421082647371848e-08} +{"train_loss": 0.0002317820893827544, "global_step": 70090, "epoch": 588, "lr": 8.408234542966464e-08, "val_loss": 0.04246608167886734} +{"train_loss": 0.0002496281813364476, "global_step": 70091, "epoch": 589, "lr": 8.39539623901875e-08} +{"train_loss": 0.00014151686627883464, "global_step": 70092, "epoch": 589, "lr": 8.382567735552571e-08} +{"train_loss": 0.00017498947272542864, "global_step": 70093, "epoch": 589, "lr": 8.369749032594576e-08} +{"train_loss": 0.00026874785544350743, "global_step": 70094, "epoch": 589, "lr": 8.356940130169189e-08} +{"train_loss": 0.00019081521895714104, "global_step": 70095, "epoch": 589, "lr": 8.344141028301388e-08} +{"train_loss": 0.0004683140432462096, "global_step": 70096, "epoch": 589, "lr": 8.331351727017267e-08} +{"train_loss": 0.0002418099029455334, "global_step": 70097, "epoch": 589, "lr": 8.318572226340693e-08} +{"train_loss": 0.0001918886264320463, "global_step": 70098, "epoch": 589, "lr": 8.305802526297202e-08} +{"train_loss": 0.00015663474914617836, "global_step": 70099, "epoch": 589, "lr": 8.293042626912329e-08} +{"train_loss": 0.00034679396776482463, "global_step": 70100, "epoch": 589, "lr": 8.280292528210498e-08} +{"train_loss": 0.00017831528384704143, "global_step": 70101, "epoch": 589, "lr": 8.267552230217246e-08} +{"train_loss": 0.00023061939282342792, "global_step": 70102, "epoch": 589, "lr": 8.254821732957552e-08} +{"train_loss": 0.0002449751482345164, "global_step": 70103, "epoch": 589, "lr": 8.24210103645584e-08} +{"train_loss": 0.00010766969353426248, "global_step": 70104, "epoch": 589, "lr": 8.229390140737647e-08} +{"train_loss": 0.00022544075909536332, "global_step": 70105, "epoch": 589, "lr": 8.216689045827398e-08} +{"train_loss": 0.00013539213978219777, "global_step": 70106, "epoch": 589, "lr": 8.203997751750625e-08} +{"train_loss": 0.00018322635150980204, "global_step": 70107, "epoch": 589, "lr": 8.19131625853231e-08} +{"train_loss": 0.00019577117927838117, "global_step": 70108, "epoch": 589, "lr": 8.17864456619688e-08} +{"train_loss": 0.0002354802709305659, "global_step": 70109, "epoch": 589, "lr": 8.165982674769313e-08} +{"train_loss": 0.00013984311954118311, "global_step": 70110, "epoch": 589, "lr": 8.153330584274588e-08} +{"train_loss": 0.0002590455114841461, "global_step": 70111, "epoch": 589, "lr": 8.140688294737131e-08} +{"train_loss": 0.00025483767967671156, "global_step": 70112, "epoch": 589, "lr": 8.128055806183033e-08} +{"train_loss": 0.00019172982138115913, "global_step": 70113, "epoch": 589, "lr": 8.115433118635051e-08} +{"train_loss": 0.0002736710011959076, "global_step": 70114, "epoch": 589, "lr": 8.102820232119834e-08} +{"train_loss": 0.0003927987418137491, "global_step": 70115, "epoch": 589, "lr": 8.09021714666125e-08} +{"train_loss": 0.00020468603179324418, "global_step": 70116, "epoch": 589, "lr": 8.077623862284278e-08} +{"train_loss": 0.0005764613742940128, "global_step": 70117, "epoch": 589, "lr": 8.065040379013899e-08} +{"train_loss": 0.00030355594935826957, "global_step": 70118, "epoch": 589, "lr": 8.052466696873984e-08} +{"train_loss": 0.00012655812315642834, "global_step": 70119, "epoch": 589, "lr": 8.039902815890065e-08} +{"train_loss": 0.00033560648444108665, "global_step": 70120, "epoch": 589, "lr": 8.027348736086015e-08} +{"train_loss": 0.00018439590348862112, "global_step": 70121, "epoch": 589, "lr": 8.014804457487368e-08} +{"train_loss": 0.00017538921383675188, "global_step": 70122, "epoch": 589, "lr": 8.002269980118548e-08} +{"train_loss": 0.0002863563713617623, "global_step": 70123, "epoch": 589, "lr": 7.989745304003426e-08} +{"train_loss": 0.00027669916744343936, "global_step": 70124, "epoch": 589, "lr": 7.977230429167537e-08} +{"train_loss": 0.0001441346830688417, "global_step": 70125, "epoch": 589, "lr": 7.96472535563475e-08} +{"train_loss": 0.0002499698894098401, "global_step": 70126, "epoch": 589, "lr": 7.952230083430046e-08} +{"train_loss": 0.00031866432982496917, "global_step": 70127, "epoch": 589, "lr": 7.939744612577294e-08} +{"train_loss": 0.00035231283982284367, "global_step": 70128, "epoch": 589, "lr": 7.927268943102028e-08} +{"train_loss": 0.00033117819111794233, "global_step": 70129, "epoch": 589, "lr": 7.914803075028677e-08} +{"train_loss": 0.00030839929240755737, "global_step": 70130, "epoch": 589, "lr": 7.902347008380551e-08} +{"train_loss": 0.0003448712232057005, "global_step": 70131, "epoch": 589, "lr": 7.889900743183187e-08} +{"train_loss": 0.00023526119184680283, "global_step": 70132, "epoch": 589, "lr": 7.877464279460456e-08} +{"train_loss": 0.00035765516804531217, "global_step": 70133, "epoch": 589, "lr": 7.865037617237337e-08} +{"train_loss": 0.00020828242122661322, "global_step": 70134, "epoch": 589, "lr": 7.852620756537699e-08} +{"train_loss": 0.00043702361290343106, "global_step": 70135, "epoch": 589, "lr": 7.840213697385967e-08} +{"train_loss": 0.00013066986866761, "global_step": 70136, "epoch": 589, "lr": 7.827816439806568e-08} +{"train_loss": 0.00023480139498133212, "global_step": 70137, "epoch": 589, "lr": 7.81542898382448e-08} +{"train_loss": 0.00016610012971796095, "global_step": 70138, "epoch": 589, "lr": 7.803051329463018e-08} +{"train_loss": 0.00018895800167229027, "global_step": 70139, "epoch": 589, "lr": 7.790683476746608e-08} +{"train_loss": 0.00014631747035309672, "global_step": 70140, "epoch": 589, "lr": 7.778325425700783e-08} +{"train_loss": 0.00021376188669819385, "global_step": 70141, "epoch": 589, "lr": 7.765977176348305e-08} +{"train_loss": 0.00012314345804043114, "global_step": 70142, "epoch": 589, "lr": 7.753638728713596e-08} +{"train_loss": 0.00013215997023507953, "global_step": 70143, "epoch": 589, "lr": 7.741310082822195e-08} +{"train_loss": 0.00012140319449827075, "global_step": 70144, "epoch": 589, "lr": 7.728991238696859e-08} +{"train_loss": 0.00019529931887518615, "global_step": 70145, "epoch": 589, "lr": 7.716682196362013e-08} +{"train_loss": 0.00042159942677244544, "global_step": 70146, "epoch": 589, "lr": 7.704382955842638e-08} +{"train_loss": 0.00018965823983307928, "global_step": 70147, "epoch": 589, "lr": 7.692093517162046e-08} +{"train_loss": 0.0003542049089446664, "global_step": 70148, "epoch": 589, "lr": 7.679813880344666e-08} +{"train_loss": 0.0004003930662292987, "global_step": 70149, "epoch": 589, "lr": 7.66754404541492e-08} +{"train_loss": 0.00014019721129443496, "global_step": 70150, "epoch": 589, "lr": 7.655284012396679e-08} +{"train_loss": 0.00014520998229272664, "global_step": 70151, "epoch": 589, "lr": 7.643033781313258e-08} +{"train_loss": 0.00018767168512567878, "global_step": 70152, "epoch": 589, "lr": 7.630793352190191e-08} +{"train_loss": 0.00024735453189350665, "global_step": 70153, "epoch": 589, "lr": 7.618562725050237e-08} +{"train_loss": 0.00024284808023367077, "global_step": 70154, "epoch": 589, "lr": 7.606341899917824e-08} +{"train_loss": 0.00033514454844407737, "global_step": 70155, "epoch": 589, "lr": 7.594130876817374e-08} +{"train_loss": 0.00017635038238950074, "global_step": 70156, "epoch": 589, "lr": 7.581929655772202e-08} +{"train_loss": 0.0002867476432584226, "global_step": 70157, "epoch": 589, "lr": 7.569738236806734e-08} +{"train_loss": 0.00024753418983891606, "global_step": 70158, "epoch": 589, "lr": 7.557556619944284e-08} +{"train_loss": 0.00015817942039575428, "global_step": 70159, "epoch": 589, "lr": 7.545384805209832e-08} +{"train_loss": 0.0002782691444735974, "global_step": 70160, "epoch": 589, "lr": 7.533222792626138e-08} +{"train_loss": 0.0003594373702071607, "global_step": 70161, "epoch": 589, "lr": 7.521070582217626e-08} +{"train_loss": 0.00017900453531183302, "global_step": 70162, "epoch": 589, "lr": 7.508928174008722e-08} +{"train_loss": 0.00018962631293106824, "global_step": 70163, "epoch": 589, "lr": 7.496795568022186e-08} +{"train_loss": 0.0001631984196137637, "global_step": 70164, "epoch": 589, "lr": 7.484672764281886e-08} +{"train_loss": 0.0005475673242472112, "global_step": 70165, "epoch": 589, "lr": 7.472559762812803e-08} +{"train_loss": 0.0001614698558114469, "global_step": 70166, "epoch": 589, "lr": 7.460456563637696e-08} +{"train_loss": 0.0003161631466355175, "global_step": 70167, "epoch": 589, "lr": 7.448363166780991e-08} +{"train_loss": 0.00017618288984522223, "global_step": 70168, "epoch": 589, "lr": 7.436279572265448e-08} +{"train_loss": 0.0006777331582270563, "global_step": 70169, "epoch": 589, "lr": 7.42420578011549e-08} +{"train_loss": 0.0002199268201366067, "global_step": 70170, "epoch": 589, "lr": 7.412141790354987e-08} +{"train_loss": 0.00036168278893455863, "global_step": 70171, "epoch": 589, "lr": 7.400087603007256e-08} +{"train_loss": 0.00023557280655950308, "global_step": 70172, "epoch": 589, "lr": 7.388043218096163e-08} +{"train_loss": 0.00026495158090256155, "global_step": 70173, "epoch": 589, "lr": 7.376008635645026e-08} +{"train_loss": 0.0002465910220053047, "global_step": 70174, "epoch": 589, "lr": 7.363983855677715e-08} +{"train_loss": 0.00017589480557944626, "global_step": 70175, "epoch": 589, "lr": 7.351968878218096e-08} +{"train_loss": 0.00014849747822154313, "global_step": 70176, "epoch": 589, "lr": 7.339963703289487e-08} +{"train_loss": 0.00035220550489611924, "global_step": 70177, "epoch": 589, "lr": 7.327968330915202e-08} +{"train_loss": 0.00026890524895861745, "global_step": 70178, "epoch": 589, "lr": 7.315982761119111e-08} +{"train_loss": 0.00014517763338517398, "global_step": 70179, "epoch": 589, "lr": 7.304006993925084e-08} +{"train_loss": 0.00036851412733085454, "global_step": 70180, "epoch": 589, "lr": 7.292041029355879e-08} +{"train_loss": 0.00014923835988156497, "global_step": 70181, "epoch": 589, "lr": 7.280084867435366e-08} +{"train_loss": 0.00022404752962756902, "global_step": 70182, "epoch": 589, "lr": 7.268138508187416e-08} +{"train_loss": 0.00036381965037435293, "global_step": 70183, "epoch": 589, "lr": 7.256201951634788e-08} +{"train_loss": 0.0001166922811535187, "global_step": 70184, "epoch": 589, "lr": 7.244275197801354e-08} +{"train_loss": 0.00017161229334305972, "global_step": 70185, "epoch": 589, "lr": 7.23235824670987e-08} +{"train_loss": 0.0001552609755890444, "global_step": 70186, "epoch": 589, "lr": 7.220451098384761e-08} +{"train_loss": 0.0005629121442325413, "global_step": 70187, "epoch": 589, "lr": 7.20855375284879e-08} +{"train_loss": 0.0003247341082897037, "global_step": 70188, "epoch": 589, "lr": 7.19666621012527e-08} +{"train_loss": 0.0004794122069142759, "global_step": 70189, "epoch": 589, "lr": 7.184788470238068e-08} +{"train_loss": 0.00017040382954292, "global_step": 70190, "epoch": 589, "lr": 7.172920533209393e-08} +{"train_loss": 0.00029166435706429183, "global_step": 70191, "epoch": 589, "lr": 7.161062399064222e-08} +{"train_loss": 0.00027371663600206375, "global_step": 70192, "epoch": 589, "lr": 7.149214067824205e-08} +{"train_loss": 0.00014449779700953513, "global_step": 70193, "epoch": 589, "lr": 7.137375539513213e-08} +{"train_loss": 0.00015970294771250337, "global_step": 70194, "epoch": 589, "lr": 7.125546814155115e-08} +{"train_loss": 0.00033668146352283657, "global_step": 70195, "epoch": 589, "lr": 7.11372789177267e-08} +{"train_loss": 0.00022807842469774187, "global_step": 70196, "epoch": 589, "lr": 7.101918772388639e-08} +{"train_loss": 0.0003104539355263114, "global_step": 70197, "epoch": 589, "lr": 7.090119456026334e-08} +{"train_loss": 0.00023395640891976655, "global_step": 70198, "epoch": 589, "lr": 7.078329942709628e-08} +{"train_loss": 0.0002471307525411248, "global_step": 70199, "epoch": 589, "lr": 7.066550232461278e-08} +{"train_loss": 0.00023729268286842853, "global_step": 70200, "epoch": 589, "lr": 7.054780325304044e-08} +{"train_loss": 0.00018089861259795725, "global_step": 70201, "epoch": 589, "lr": 7.043020221261242e-08} +{"train_loss": 0.00019688713655341417, "global_step": 70202, "epoch": 589, "lr": 7.031269920356187e-08} +{"train_loss": 0.0002482132986187935, "global_step": 70203, "epoch": 589, "lr": 7.019529422612193e-08} +{"train_loss": 0.00010606093565002084, "global_step": 70204, "epoch": 589, "lr": 7.007798728051462e-08} +{"train_loss": 0.00023332887212745845, "global_step": 70205, "epoch": 589, "lr": 6.996077836697312e-08} +{"train_loss": 0.00032911417656578124, "global_step": 70206, "epoch": 589, "lr": 6.984366748573612e-08} +{"train_loss": 0.0003347310412209481, "global_step": 70207, "epoch": 589, "lr": 6.97266546370201e-08} +{"train_loss": 0.0001466334651922807, "global_step": 70208, "epoch": 589, "lr": 6.960973982106378e-08} +{"train_loss": 0.0002504657588223144, "global_step": 70209, "epoch": 589, "lr": 6.949292303809474e-08, "val_loss": 0.016754403710365295} +{"train_loss": 0.00037274917121976614, "global_step": 70210, "epoch": 590, "lr": 6.937620428834612e-08} +{"train_loss": 0.00017172266962006688, "global_step": 70211, "epoch": 590, "lr": 6.925958357203999e-08} +{"train_loss": 0.0002539536217227578, "global_step": 70212, "epoch": 590, "lr": 6.914306088940392e-08} +{"train_loss": 0.00028178366483189166, "global_step": 70213, "epoch": 590, "lr": 6.902663624067662e-08} +{"train_loss": 0.00023300481552723795, "global_step": 70214, "epoch": 590, "lr": 6.891030962608014e-08} +{"train_loss": 0.00033037265529856086, "global_step": 70215, "epoch": 590, "lr": 6.879408104584206e-08} +{"train_loss": 0.0002847126452252269, "global_step": 70216, "epoch": 590, "lr": 6.867795050019554e-08} +{"train_loss": 0.00022077215544413775, "global_step": 70217, "epoch": 590, "lr": 6.856191798936263e-08} +{"train_loss": 0.0001392387057421729, "global_step": 70218, "epoch": 590, "lr": 6.844598351357645e-08} +{"train_loss": 0.00026709187659434974, "global_step": 70219, "epoch": 590, "lr": 6.833014707305907e-08} +{"train_loss": 0.0002739233314059675, "global_step": 70220, "epoch": 590, "lr": 6.821440866804362e-08} +{"train_loss": 0.00031370559008792043, "global_step": 70221, "epoch": 590, "lr": 6.809876829875217e-08} +{"train_loss": 0.00018021125288214535, "global_step": 70222, "epoch": 590, "lr": 6.798322596541784e-08} +{"train_loss": 0.0001773352560121566, "global_step": 70223, "epoch": 590, "lr": 6.786778166826268e-08} +{"train_loss": 0.0001823390630306676, "global_step": 70224, "epoch": 590, "lr": 6.77524354075143e-08} +{"train_loss": 0.0002777508634608239, "global_step": 70225, "epoch": 590, "lr": 6.763718718340029e-08} +{"train_loss": 0.00015659209748264402, "global_step": 70226, "epoch": 590, "lr": 6.752203699614268e-08} +{"train_loss": 0.0001347135694231838, "global_step": 70227, "epoch": 590, "lr": 6.740698484597463e-08} +{"train_loss": 0.00013069489796180278, "global_step": 70228, "epoch": 590, "lr": 6.729203073311818e-08} +{"train_loss": 0.0003738072991836816, "global_step": 70229, "epoch": 590, "lr": 6.717717465780093e-08} +{"train_loss": 0.0001895179448183626, "global_step": 70230, "epoch": 590, "lr": 6.706241662023938e-08} +{"train_loss": 0.00025734459632076323, "global_step": 70231, "epoch": 590, "lr": 6.69477566206722e-08} +{"train_loss": 0.00013618414232041687, "global_step": 70232, "epoch": 590, "lr": 6.683319465931592e-08} +{"train_loss": 0.00026948534650728106, "global_step": 70233, "epoch": 590, "lr": 6.671873073640367e-08} +{"train_loss": 0.0002759258495643735, "global_step": 70234, "epoch": 590, "lr": 6.660436485215194e-08} +{"train_loss": 0.00018673327576834708, "global_step": 70235, "epoch": 590, "lr": 6.649009700678276e-08} +{"train_loss": 0.00016833789413794875, "global_step": 70236, "epoch": 590, "lr": 6.637592720053488e-08} +{"train_loss": 0.000351612368831411, "global_step": 70237, "epoch": 590, "lr": 6.626185543361363e-08} +{"train_loss": 0.0002780133509077132, "global_step": 70238, "epoch": 590, "lr": 6.614788170625774e-08} +{"train_loss": 0.0001283807068830356, "global_step": 70239, "epoch": 590, "lr": 6.60340060186837e-08} +{"train_loss": 0.0005138904671184719, "global_step": 70240, "epoch": 590, "lr": 6.592022837111911e-08} +{"train_loss": 0.00016237895761150867, "global_step": 70241, "epoch": 590, "lr": 6.5806548763786e-08} +{"train_loss": 0.0002449903404340148, "global_step": 70242, "epoch": 590, "lr": 6.569296719690643e-08} +{"train_loss": 0.0005846827407367527, "global_step": 70243, "epoch": 590, "lr": 6.557948367070243e-08} +{"train_loss": 0.0001452472060918808, "global_step": 70244, "epoch": 590, "lr": 6.546609818540161e-08} +{"train_loss": 0.0001529020955786109, "global_step": 70245, "epoch": 590, "lr": 6.535281074122046e-08} +{"train_loss": 0.0001664030278334394, "global_step": 70246, "epoch": 590, "lr": 6.523962133838657e-08} +{"train_loss": 0.0002003869303734973, "global_step": 70247, "epoch": 590, "lr": 6.512652997711644e-08} +{"train_loss": 0.00045929133193567395, "global_step": 70248, "epoch": 590, "lr": 6.501353665763765e-08} +{"train_loss": 0.00019530174904502928, "global_step": 70249, "epoch": 590, "lr": 6.490064138017226e-08} +{"train_loss": 0.00027235192828811705, "global_step": 70250, "epoch": 590, "lr": 6.478784414493677e-08} +{"train_loss": 0.00026118961977772415, "global_step": 70251, "epoch": 590, "lr": 6.467514495215876e-08} +{"train_loss": 0.00017607449262868613, "global_step": 70252, "epoch": 590, "lr": 6.456254380205473e-08} +{"train_loss": 0.00014344030932988971, "global_step": 70253, "epoch": 590, "lr": 6.445004069484672e-08} +{"train_loss": 0.0002625039778649807, "global_step": 70254, "epoch": 590, "lr": 6.433763563075124e-08} +{"train_loss": 0.0002077783428831026, "global_step": 70255, "epoch": 590, "lr": 6.422532861000141e-08} +{"train_loss": 0.0002479742979630828, "global_step": 70256, "epoch": 590, "lr": 6.41131196328082e-08} +{"train_loss": 0.0003397747059352696, "global_step": 70257, "epoch": 590, "lr": 6.400100869939363e-08} +{"train_loss": 0.00014199476572684944, "global_step": 70258, "epoch": 590, "lr": 6.388899580997976e-08} +{"train_loss": 0.0001997250219574198, "global_step": 70259, "epoch": 590, "lr": 6.377708096478308e-08} +{"train_loss": 0.00047725281910970807, "global_step": 70260, "epoch": 590, "lr": 6.366526416402563e-08} +{"train_loss": 0.00012262635573279113, "global_step": 70261, "epoch": 590, "lr": 6.355354540792391e-08} +{"train_loss": 0.0003043386386707425, "global_step": 70262, "epoch": 590, "lr": 6.344192469669996e-08} +{"train_loss": 0.000491516082547605, "global_step": 70263, "epoch": 590, "lr": 6.333040203057583e-08} +{"train_loss": 0.00012144355423515663, "global_step": 70264, "epoch": 590, "lr": 6.3218977409768e-08} +{"train_loss": 0.00022446441289503127, "global_step": 70265, "epoch": 590, "lr": 6.3107650834493e-08} +{"train_loss": 0.0001455480232834816, "global_step": 70266, "epoch": 590, "lr": 6.299642230497282e-08} +{"train_loss": 0.00019371490634512156, "global_step": 70267, "epoch": 590, "lr": 6.2885291821424e-08} +{"train_loss": 0.00016216754738707095, "global_step": 70268, "epoch": 590, "lr": 6.2774259384063e-08} +{"train_loss": 0.00017844277317635715, "global_step": 70269, "epoch": 590, "lr": 6.26633249931119e-08} +{"train_loss": 0.00014999444829300046, "global_step": 70270, "epoch": 590, "lr": 6.25524886487816e-08} +{"train_loss": 0.00013265748566482216, "global_step": 70271, "epoch": 590, "lr": 6.244175035129973e-08} +{"train_loss": 0.00013406823563855141, "global_step": 70272, "epoch": 590, "lr": 6.233111010087722e-08} +{"train_loss": 0.00018607043602969497, "global_step": 70273, "epoch": 590, "lr": 6.222056789773056e-08} +{"train_loss": 0.00037018570583313704, "global_step": 70274, "epoch": 590, "lr": 6.211012374208181e-08} +{"train_loss": 0.00016526944818906486, "global_step": 70275, "epoch": 590, "lr": 6.199977763414188e-08} +{"train_loss": 0.0002498353715054691, "global_step": 70276, "epoch": 590, "lr": 6.188952957413286e-08} +{"train_loss": 0.0005355051252990961, "global_step": 70277, "epoch": 590, "lr": 6.177937956226564e-08} +{"train_loss": 0.00018407664902042598, "global_step": 70278, "epoch": 590, "lr": 6.166932759876231e-08} +{"train_loss": 0.00021198336617089808, "global_step": 70279, "epoch": 590, "lr": 6.15593736838338e-08} +{"train_loss": 0.0002630250819493085, "global_step": 70280, "epoch": 590, "lr": 6.144951781770213e-08} +{"train_loss": 0.00019067096582148224, "global_step": 70281, "epoch": 590, "lr": 6.133976000057828e-08} +{"train_loss": 0.00028076383750885725, "global_step": 70282, "epoch": 590, "lr": 6.123010023267317e-08} +{"train_loss": 0.00015217802138067782, "global_step": 70283, "epoch": 590, "lr": 6.112053851421439e-08} +{"train_loss": 0.0003244297986384481, "global_step": 70284, "epoch": 590, "lr": 6.101107484540735e-08} +{"train_loss": 0.00015342954429797828, "global_step": 70285, "epoch": 590, "lr": 6.090170922646854e-08} +{"train_loss": 0.00023500497627537698, "global_step": 70286, "epoch": 590, "lr": 6.079244165761444e-08} +{"train_loss": 0.00020959840912837535, "global_step": 70287, "epoch": 590, "lr": 6.068327213906155e-08} +{"train_loss": 0.0001911224244395271, "global_step": 70288, "epoch": 590, "lr": 6.057420067102082e-08} +{"train_loss": 0.00031980100902728736, "global_step": 70289, "epoch": 590, "lr": 6.046522725370318e-08} +{"train_loss": 0.00037074770079925656, "global_step": 70290, "epoch": 590, "lr": 6.035635188733069e-08} +{"train_loss": 0.0002006759459618479, "global_step": 70291, "epoch": 590, "lr": 6.024757457211427e-08} +{"train_loss": 0.00021299772197380662, "global_step": 70292, "epoch": 590, "lr": 6.013889530826489e-08} +{"train_loss": 0.00042929971823468804, "global_step": 70293, "epoch": 590, "lr": 6.003031409599902e-08} +{"train_loss": 0.0002673231065273285, "global_step": 70294, "epoch": 590, "lr": 5.99218309355276e-08} +{"train_loss": 0.000313078606268391, "global_step": 70295, "epoch": 590, "lr": 5.981344582706161e-08} +{"train_loss": 0.00021535558335017413, "global_step": 70296, "epoch": 590, "lr": 5.970515877082306e-08} +{"train_loss": 0.00013181135000195354, "global_step": 70297, "epoch": 590, "lr": 5.959696976701179e-08} +{"train_loss": 0.0002415003691567108, "global_step": 70298, "epoch": 590, "lr": 5.948887881584986e-08} +{"train_loss": 0.00023500563111156225, "global_step": 70299, "epoch": 590, "lr": 5.938088591754265e-08} +{"train_loss": 0.00019510849961079657, "global_step": 70300, "epoch": 590, "lr": 5.927299107230666e-08} +{"train_loss": 0.0002596956037450582, "global_step": 70301, "epoch": 590, "lr": 5.916519428035838e-08} +{"train_loss": 0.00031208674772642553, "global_step": 70302, "epoch": 590, "lr": 5.905749554189766e-08} +{"train_loss": 0.00018370590987615287, "global_step": 70303, "epoch": 590, "lr": 5.894989485714653e-08} +{"train_loss": 0.0002447242150083184, "global_step": 70304, "epoch": 590, "lr": 5.8842392226304834e-08} +{"train_loss": 0.0001508590648882091, "global_step": 70305, "epoch": 590, "lr": 5.873498764960017e-08} +{"train_loss": 0.00019310392963234335, "global_step": 70306, "epoch": 590, "lr": 5.862768112722683e-08} +{"train_loss": 0.00030886949389241636, "global_step": 70307, "epoch": 590, "lr": 5.852047265940685e-08} +{"train_loss": 0.00016513791342731565, "global_step": 70308, "epoch": 590, "lr": 5.841336224634009e-08} +{"train_loss": 0.00027541571762412786, "global_step": 70309, "epoch": 590, "lr": 5.8306349888248566e-08} +{"train_loss": 0.00035696232225745916, "global_step": 70310, "epoch": 590, "lr": 5.819943558533769e-08} +{"train_loss": 0.00024489028146490455, "global_step": 70311, "epoch": 590, "lr": 5.809261933781285e-08} +{"train_loss": 0.00015904886822681874, "global_step": 70312, "epoch": 590, "lr": 5.798590114589053e-08} +{"train_loss": 0.00039139617001637816, "global_step": 70313, "epoch": 590, "lr": 5.787928100977613e-08} +{"train_loss": 0.00030557799618691206, "global_step": 70314, "epoch": 590, "lr": 5.777275892968059e-08} +{"train_loss": 0.00019326602341607213, "global_step": 70315, "epoch": 590, "lr": 5.766633490581486e-08} +{"train_loss": 0.0001610063191037625, "global_step": 70316, "epoch": 590, "lr": 5.7560008938384316e-08} +{"train_loss": 0.00018805086438078433, "global_step": 70317, "epoch": 590, "lr": 5.7453781027599906e-08} +{"train_loss": 0.0002323779626749456, "global_step": 70318, "epoch": 590, "lr": 5.734765117366703e-08} +{"train_loss": 0.0001647634489927441, "global_step": 70319, "epoch": 590, "lr": 5.7241619376796616e-08} +{"train_loss": 0.00024830258917063475, "global_step": 70320, "epoch": 590, "lr": 5.713568563719962e-08} +{"train_loss": 0.0002419770898995921, "global_step": 70321, "epoch": 590, "lr": 5.7029849955075874e-08} +{"train_loss": 0.0002715816372074187, "global_step": 70322, "epoch": 590, "lr": 5.6924112330641875e-08} +{"train_loss": 0.00019320221326779574, "global_step": 70323, "epoch": 590, "lr": 5.681847276410301e-08} +{"train_loss": 0.00036428376915864646, "global_step": 70324, "epoch": 590, "lr": 5.671293125566468e-08} +{"train_loss": 0.000534854072611779, "global_step": 70325, "epoch": 590, "lr": 5.660748780553227e-08} +{"train_loss": 0.00021846394520252943, "global_step": 70326, "epoch": 590, "lr": 5.6502142413916716e-08} +{"train_loss": 0.00017326678789686412, "global_step": 70327, "epoch": 590, "lr": 5.6396895081023415e-08} +{"train_loss": 0.0002448836607714731, "global_step": 70328, "epoch": 590, "lr": 5.6291745807057764e-08, "val_loss": 0.01698736473917961, "train_action_mse_error": 2.9492605335690314e-06} +{"train_loss": 0.00020949527970515192, "global_step": 70329, "epoch": 591, "lr": 5.6186694592230694e-08} +{"train_loss": 0.00017018573998939246, "global_step": 70330, "epoch": 591, "lr": 5.6081741436747604e-08} +{"train_loss": 0.00018046806508209556, "global_step": 70331, "epoch": 591, "lr": 5.5976886340808334e-08} +{"train_loss": 0.00018365091818850487, "global_step": 70332, "epoch": 591, "lr": 5.587212930462382e-08} +{"train_loss": 0.0002527437172830105, "global_step": 70333, "epoch": 591, "lr": 5.576747032839391e-08} +{"train_loss": 0.0003818149270955473, "global_step": 70334, "epoch": 591, "lr": 5.56629094123351e-08} +{"train_loss": 0.00016788349603302777, "global_step": 70335, "epoch": 591, "lr": 5.555844655664166e-08} +{"train_loss": 0.0002968910848721862, "global_step": 70336, "epoch": 591, "lr": 5.545408176153011e-08} +{"train_loss": 0.0002877175575122237, "global_step": 70337, "epoch": 591, "lr": 5.534981502719472e-08} +{"train_loss": 0.0001810386893339455, "global_step": 70338, "epoch": 591, "lr": 5.5245646353840884e-08} +{"train_loss": 0.00016304018208757043, "global_step": 70339, "epoch": 591, "lr": 5.514157574167955e-08} +{"train_loss": 0.00019635075295809656, "global_step": 70340, "epoch": 591, "lr": 5.503760319091056e-08} +{"train_loss": 0.00014166970504447818, "global_step": 70341, "epoch": 591, "lr": 5.493372870174485e-08} +{"train_loss": 0.0003212670562788844, "global_step": 70342, "epoch": 591, "lr": 5.482995227437671e-08} +{"train_loss": 0.00018344457203056663, "global_step": 70343, "epoch": 591, "lr": 5.472627390901153e-08} +{"train_loss": 0.00027645763475447893, "global_step": 70344, "epoch": 591, "lr": 5.462269360586025e-08} +{"train_loss": 0.00026296405121684074, "global_step": 70345, "epoch": 591, "lr": 5.4519211365117176e-08} +{"train_loss": 0.00034640650846995413, "global_step": 70346, "epoch": 591, "lr": 5.441582718699323e-08} +{"train_loss": 0.0002203564072260633, "global_step": 70347, "epoch": 591, "lr": 5.4312541071688264e-08} +{"train_loss": 0.00022021165932528675, "global_step": 70348, "epoch": 591, "lr": 5.4209353019402106e-08} +{"train_loss": 0.00014252545952331275, "global_step": 70349, "epoch": 591, "lr": 5.410626303034017e-08} +{"train_loss": 0.0001230278139701113, "global_step": 70350, "epoch": 591, "lr": 5.400327110470782e-08} +{"train_loss": 0.00018186129454988986, "global_step": 70351, "epoch": 591, "lr": 5.390037724269936e-08} +{"train_loss": 0.00027586938813328743, "global_step": 70352, "epoch": 591, "lr": 5.3797581444525735e-08} +{"train_loss": 0.00026902230456471443, "global_step": 70353, "epoch": 591, "lr": 5.3694883710381226e-08} +{"train_loss": 0.00029570970218628645, "global_step": 70354, "epoch": 591, "lr": 5.359228404047123e-08} +{"train_loss": 0.00017305012443102896, "global_step": 70355, "epoch": 591, "lr": 5.3489782435001136e-08} +{"train_loss": 0.0002314884914085269, "global_step": 70356, "epoch": 591, "lr": 5.338737889415968e-08} +{"train_loss": 0.0004895724705420434, "global_step": 70357, "epoch": 591, "lr": 5.3285073418163355e-08} +{"train_loss": 0.00019685800361912698, "global_step": 70358, "epoch": 591, "lr": 5.31828660072009e-08} +{"train_loss": 0.00015323722618632019, "global_step": 70359, "epoch": 591, "lr": 5.3080756661483265e-08} +{"train_loss": 0.0001746098860166967, "global_step": 70360, "epoch": 591, "lr": 5.297874538120473e-08} +{"train_loss": 0.00036519704735837877, "global_step": 70361, "epoch": 591, "lr": 5.287683216655959e-08} +{"train_loss": 0.0005151084624230862, "global_step": 70362, "epoch": 591, "lr": 5.277501701775878e-08} +{"train_loss": 0.0003137967432849109, "global_step": 70363, "epoch": 591, "lr": 5.267329993500214e-08} +{"train_loss": 0.0001525640836916864, "global_step": 70364, "epoch": 591, "lr": 5.2571680918478416e-08} +{"train_loss": 0.00022241617261897773, "global_step": 70365, "epoch": 591, "lr": 5.247015996839855e-08} +{"train_loss": 0.00016259070252999663, "global_step": 70366, "epoch": 591, "lr": 5.236873708495682e-08} +{"train_loss": 0.00028720899717882276, "global_step": 70367, "epoch": 591, "lr": 5.226741226835308e-08} +{"train_loss": 0.00036127856583334506, "global_step": 70368, "epoch": 591, "lr": 5.216618551878716e-08} +{"train_loss": 0.00011990464554401115, "global_step": 70369, "epoch": 591, "lr": 5.2065056836453355e-08} +{"train_loss": 0.00012422294821590185, "global_step": 70370, "epoch": 591, "lr": 5.196402622155705e-08} +{"train_loss": 0.00021088733046781272, "global_step": 70371, "epoch": 591, "lr": 5.186309367429254e-08} +{"train_loss": 0.0007578789372928441, "global_step": 70372, "epoch": 591, "lr": 5.176225919485966e-08} +{"train_loss": 0.0001802157494239509, "global_step": 70373, "epoch": 591, "lr": 5.166152278345271e-08} +{"train_loss": 0.000207092787604779, "global_step": 70374, "epoch": 591, "lr": 5.156088444027152e-08} +{"train_loss": 0.00021508806094061583, "global_step": 70375, "epoch": 591, "lr": 5.1460344165515925e-08} +{"train_loss": 0.000214456144021824, "global_step": 70376, "epoch": 591, "lr": 5.135990195938578e-08} +{"train_loss": 0.0002263226779177785, "global_step": 70377, "epoch": 591, "lr": 5.125955782206981e-08} +{"train_loss": 0.0002829443255905062, "global_step": 70378, "epoch": 591, "lr": 5.115931175376787e-08} +{"train_loss": 0.0001606102305231616, "global_step": 70379, "epoch": 591, "lr": 5.1059163754679783e-08} +{"train_loss": 0.00034226806019432843, "global_step": 70380, "epoch": 591, "lr": 5.0959113824999846e-08} +{"train_loss": 0.0001384491624776274, "global_step": 70381, "epoch": 591, "lr": 5.0859161964927904e-08} +{"train_loss": 0.00022593859466724098, "global_step": 70382, "epoch": 591, "lr": 5.075930817465824e-08} +{"train_loss": 0.00015508416981901973, "global_step": 70383, "epoch": 591, "lr": 5.065955245438514e-08} +{"train_loss": 0.0002342803927604109, "global_step": 70384, "epoch": 591, "lr": 5.055989480430845e-08} +{"train_loss": 0.00039448830648325384, "global_step": 70385, "epoch": 591, "lr": 5.0460335224616906e-08} +{"train_loss": 0.0002062183484667912, "global_step": 70386, "epoch": 591, "lr": 5.036087371551035e-08} +{"train_loss": 0.0001665926683926955, "global_step": 70387, "epoch": 591, "lr": 5.026151027718307e-08} +{"train_loss": 0.00031090262928046286, "global_step": 70388, "epoch": 591, "lr": 5.0162244909834896e-08} +{"train_loss": 0.00011180932051502168, "global_step": 70389, "epoch": 591, "lr": 5.006307761365458e-08} +{"train_loss": 0.00022882118355482817, "global_step": 70390, "epoch": 591, "lr": 4.9964008388836416e-08} +{"train_loss": 0.0002468628517817706, "global_step": 70391, "epoch": 591, "lr": 4.986503723558022e-08} +{"train_loss": 0.00037156359758228064, "global_step": 70392, "epoch": 591, "lr": 4.9766164154080306e-08} +{"train_loss": 0.00016955747560132295, "global_step": 70393, "epoch": 591, "lr": 4.96673891445254e-08} +{"train_loss": 0.00031429537921212614, "global_step": 70394, "epoch": 591, "lr": 4.9568712207115344e-08} +{"train_loss": 0.00029497427749447525, "global_step": 70395, "epoch": 591, "lr": 4.947013334203332e-08} +{"train_loss": 0.00033015309600159526, "global_step": 70396, "epoch": 591, "lr": 4.937165254948473e-08} +{"train_loss": 0.00018538153381086886, "global_step": 70397, "epoch": 591, "lr": 4.92732698296583e-08} +{"train_loss": 0.0003497699508443475, "global_step": 70398, "epoch": 591, "lr": 4.9174985182748325e-08} +{"train_loss": 0.00021809224563185126, "global_step": 70399, "epoch": 591, "lr": 4.9076798608943545e-08} +{"train_loss": 0.0002462682023178786, "global_step": 70400, "epoch": 591, "lr": 4.8978710108443793e-08} +{"train_loss": 0.00022408334189094603, "global_step": 70401, "epoch": 591, "lr": 4.8880719681437813e-08} +{"train_loss": 0.00016202093684114516, "global_step": 70402, "epoch": 591, "lr": 4.878282732811989e-08} +{"train_loss": 0.00030625832732766867, "global_step": 70403, "epoch": 591, "lr": 4.868503304867322e-08} +{"train_loss": 0.00041781910113058984, "global_step": 70404, "epoch": 591, "lr": 4.858733684330319e-08} +{"train_loss": 0.0004611290351022035, "global_step": 70405, "epoch": 591, "lr": 4.848973871219298e-08} +{"train_loss": 0.0001783717452781275, "global_step": 70406, "epoch": 591, "lr": 4.839223865553688e-08} +{"train_loss": 0.00013029936235398054, "global_step": 70407, "epoch": 591, "lr": 4.829483667352364e-08} +{"train_loss": 0.000168499507708475, "global_step": 70408, "epoch": 591, "lr": 4.819753276635308e-08} +{"train_loss": 0.0001403590285917744, "global_step": 70409, "epoch": 591, "lr": 4.8100326934202853e-08} +{"train_loss": 0.0002630412927828729, "global_step": 70410, "epoch": 591, "lr": 4.800321917727835e-08} +{"train_loss": 0.0002053705247817561, "global_step": 70411, "epoch": 591, "lr": 4.790620949575719e-08} +{"train_loss": 0.00029136575176380575, "global_step": 70412, "epoch": 591, "lr": 4.780929788983923e-08} +{"train_loss": 0.0002206100762123242, "global_step": 70413, "epoch": 591, "lr": 4.7712484359707655e-08} +{"train_loss": 0.0002726727398112416, "global_step": 70414, "epoch": 591, "lr": 4.761576890555674e-08} +{"train_loss": 0.00031418720027431846, "global_step": 70415, "epoch": 591, "lr": 4.751915152757525e-08} +{"train_loss": 0.00016632553888484836, "global_step": 70416, "epoch": 591, "lr": 4.742263222595744e-08} +{"train_loss": 0.00023154613154474646, "global_step": 70417, "epoch": 591, "lr": 4.732621100088652e-08} +{"train_loss": 0.0001674891827860847, "global_step": 70418, "epoch": 591, "lr": 4.722988785255122e-08} +{"train_loss": 0.0001679589186096564, "global_step": 70419, "epoch": 591, "lr": 4.7133662781145836e-08} +{"train_loss": 0.0001566705759614706, "global_step": 70420, "epoch": 591, "lr": 4.70375357868591e-08} +{"train_loss": 0.00013559628860093653, "global_step": 70421, "epoch": 591, "lr": 4.6941506869874196e-08} +{"train_loss": 0.00014378433115780354, "global_step": 70422, "epoch": 591, "lr": 4.684557603037987e-08} +{"train_loss": 0.00016177943325601518, "global_step": 70423, "epoch": 591, "lr": 4.674974326857595e-08} +{"train_loss": 0.00015093765978235751, "global_step": 70424, "epoch": 591, "lr": 4.665400858463453e-08} +{"train_loss": 0.00035205771564505994, "global_step": 70425, "epoch": 591, "lr": 4.655837197875545e-08} +{"train_loss": 0.00034566421527415514, "global_step": 70426, "epoch": 591, "lr": 4.64628334511219e-08} +{"train_loss": 0.000270928256213665, "global_step": 70427, "epoch": 591, "lr": 4.636739300191706e-08} +{"train_loss": 0.00016347219934687018, "global_step": 70428, "epoch": 591, "lr": 4.627205063134077e-08} +{"train_loss": 0.0003572049317881465, "global_step": 70429, "epoch": 591, "lr": 4.6176806339565114e-08} +{"train_loss": 0.00020351474813651294, "global_step": 70430, "epoch": 591, "lr": 4.608166012678994e-08} +{"train_loss": 0.00018835935043171048, "global_step": 70431, "epoch": 591, "lr": 4.5986611993192875e-08} +{"train_loss": 0.00023678703291807324, "global_step": 70432, "epoch": 591, "lr": 4.589166193896821e-08} +{"train_loss": 0.00046614749589934945, "global_step": 70433, "epoch": 591, "lr": 4.579680996429914e-08} +{"train_loss": 0.00018869857012759894, "global_step": 70434, "epoch": 591, "lr": 4.570205606936329e-08} +{"train_loss": 0.00040370560600422323, "global_step": 70435, "epoch": 591, "lr": 4.56074002543605e-08} +{"train_loss": 0.00024171348195523024, "global_step": 70436, "epoch": 591, "lr": 4.5512842519473965e-08} +{"train_loss": 0.0004194859939161688, "global_step": 70437, "epoch": 591, "lr": 4.5418382864881314e-08} +{"train_loss": 0.00014954843209125102, "global_step": 70438, "epoch": 591, "lr": 4.532402129077129e-08} +{"train_loss": 0.00023301136388909072, "global_step": 70439, "epoch": 591, "lr": 4.522975779733263e-08} +{"train_loss": 0.00015748442092444748, "global_step": 70440, "epoch": 591, "lr": 4.5135592384754066e-08} +{"train_loss": 0.00031993232551030815, "global_step": 70441, "epoch": 591, "lr": 4.504152505320769e-08} +{"train_loss": 0.0006862914888188243, "global_step": 70442, "epoch": 591, "lr": 4.494755580288779e-08} +{"train_loss": 0.00014680848107673228, "global_step": 70443, "epoch": 591, "lr": 4.4853684633977543e-08} +{"train_loss": 0.000257205858360976, "global_step": 70444, "epoch": 591, "lr": 4.4759911546654596e-08} +{"train_loss": 0.00026801542844623327, "global_step": 70445, "epoch": 591, "lr": 4.466623654111324e-08} +{"train_loss": 0.0003292301844339818, "global_step": 70446, "epoch": 591, "lr": 4.457265961753665e-08} +{"train_loss": 0.00024749093096920467, "global_step": 70447, "epoch": 591, "lr": 4.447918077609692e-08, "val_loss": 0.026475289836525917} +{"train_loss": 0.0004023319634143263, "global_step": 70448, "epoch": 592, "lr": 4.438580001698833e-08} +{"train_loss": 0.00019042032363358885, "global_step": 70449, "epoch": 592, "lr": 4.429251734039408e-08} +{"train_loss": 0.0001867890969151631, "global_step": 70450, "epoch": 592, "lr": 4.4199332746491795e-08} +{"train_loss": 0.00022118963534012437, "global_step": 70451, "epoch": 592, "lr": 4.410624623547022e-08} +{"train_loss": 0.00020830909488722682, "global_step": 70452, "epoch": 592, "lr": 4.401325780750143e-08} +{"train_loss": 0.0005377825582399964, "global_step": 70453, "epoch": 592, "lr": 4.392036746278527e-08} +{"train_loss": 0.00018457794794812799, "global_step": 70454, "epoch": 592, "lr": 4.382757520148828e-08} +{"train_loss": 0.00014997397374827415, "global_step": 70455, "epoch": 592, "lr": 4.373488102379919e-08} +{"train_loss": 0.000226896969252266, "global_step": 70456, "epoch": 592, "lr": 4.364228492990119e-08} +{"train_loss": 0.00023582801804877818, "global_step": 70457, "epoch": 592, "lr": 4.3549786919971915e-08} +{"train_loss": 0.000502684386447072, "global_step": 70458, "epoch": 592, "lr": 4.34573869942001e-08} +{"train_loss": 0.00015106512000784278, "global_step": 70459, "epoch": 592, "lr": 4.3365085152757835e-08} +{"train_loss": 0.0002827980788424611, "global_step": 70460, "epoch": 592, "lr": 4.3272881395833854e-08} +{"train_loss": 0.0001190916373161599, "global_step": 70461, "epoch": 592, "lr": 4.3180775723605793e-08} +{"train_loss": 0.00029094808269292116, "global_step": 70462, "epoch": 592, "lr": 4.308876813625684e-08} +{"train_loss": 0.0001761882595019415, "global_step": 70463, "epoch": 592, "lr": 4.2996858633964634e-08} +{"train_loss": 0.00012686464469879866, "global_step": 70464, "epoch": 592, "lr": 4.290504721691235e-08} +{"train_loss": 0.0003607010585255921, "global_step": 70465, "epoch": 592, "lr": 4.281333388527764e-08} +{"train_loss": 0.0001494119642302394, "global_step": 70466, "epoch": 592, "lr": 4.272171863923813e-08} +{"train_loss": 0.00024330349697265774, "global_step": 70467, "epoch": 592, "lr": 4.263020147898256e-08} +{"train_loss": 0.0001717877748887986, "global_step": 70468, "epoch": 592, "lr": 4.253878240468301e-08} +{"train_loss": 0.00016113018500618637, "global_step": 70469, "epoch": 592, "lr": 4.244746141652267e-08} +{"train_loss": 0.0003435540711507201, "global_step": 70470, "epoch": 592, "lr": 4.235623851467918e-08} +{"train_loss": 0.0002856228966265917, "global_step": 70471, "epoch": 592, "lr": 4.2265113699330175e-08} +{"train_loss": 0.00013097678311169147, "global_step": 70472, "epoch": 592, "lr": 4.2174086970658834e-08} +{"train_loss": 0.00017848504649009556, "global_step": 70473, "epoch": 592, "lr": 4.20831583288428e-08} +{"train_loss": 0.00015937401622068137, "global_step": 70474, "epoch": 592, "lr": 4.19923277740597e-08} +{"train_loss": 0.00032654646201990545, "global_step": 70475, "epoch": 592, "lr": 4.1901595306481634e-08} +{"train_loss": 0.0005733184516429901, "global_step": 70476, "epoch": 592, "lr": 4.181096092629733e-08} +{"train_loss": 0.00022824159532319754, "global_step": 70477, "epoch": 592, "lr": 4.172042463367887e-08} +{"train_loss": 0.00016016996232792735, "global_step": 70478, "epoch": 592, "lr": 4.162998642880389e-08} +{"train_loss": 0.00017047191795427352, "global_step": 70479, "epoch": 592, "lr": 4.1539646311850035e-08} +{"train_loss": 0.00040227652061730623, "global_step": 70480, "epoch": 592, "lr": 4.144940428300048e-08} +{"train_loss": 0.00024156656581908464, "global_step": 70481, "epoch": 592, "lr": 4.135926034242177e-08} +{"train_loss": 0.00023300069733522832, "global_step": 70482, "epoch": 592, "lr": 4.126921449030263e-08} +{"train_loss": 0.00022450217511504889, "global_step": 70483, "epoch": 592, "lr": 4.1179266726809604e-08} +{"train_loss": 0.00026029764558188617, "global_step": 70484, "epoch": 592, "lr": 4.108941705212588e-08} +{"train_loss": 0.00020467971626203507, "global_step": 70485, "epoch": 592, "lr": 4.099966546642908e-08} +{"train_loss": 0.00016909405530896038, "global_step": 70486, "epoch": 592, "lr": 4.091001196988575e-08} +{"train_loss": 0.00017202265735249966, "global_step": 70487, "epoch": 592, "lr": 4.0820456562684626e-08} +{"train_loss": 0.0003172479337081313, "global_step": 70488, "epoch": 592, "lr": 4.073099924499224e-08} +{"train_loss": 0.0007585413986817002, "global_step": 70489, "epoch": 592, "lr": 4.0641640016986225e-08} +{"train_loss": 0.0001583318953635171, "global_step": 70490, "epoch": 592, "lr": 4.055237887884422e-08} +{"train_loss": 0.00017942911654245108, "global_step": 70491, "epoch": 592, "lr": 4.046321583073831e-08} +{"train_loss": 0.0002744791563600302, "global_step": 70492, "epoch": 592, "lr": 4.037415087284613e-08} +{"train_loss": 0.00027880026027560234, "global_step": 70493, "epoch": 592, "lr": 4.028518400533976e-08} +{"train_loss": 0.00020317886082921177, "global_step": 70494, "epoch": 592, "lr": 4.019631522839684e-08} +{"train_loss": 0.00031787046464160085, "global_step": 70495, "epoch": 592, "lr": 4.0107544542195005e-08} +{"train_loss": 0.0002487830352038145, "global_step": 70496, "epoch": 592, "lr": 4.0018871946900796e-08} +{"train_loss": 0.00027475575916469097, "global_step": 70497, "epoch": 592, "lr": 3.993029744269738e-08} +{"train_loss": 0.00026746216462925076, "global_step": 70498, "epoch": 592, "lr": 3.984182102975132e-08} +{"train_loss": 0.0007384492782875896, "global_step": 70499, "epoch": 592, "lr": 3.975344270823467e-08} +{"train_loss": 0.00016247315215878189, "global_step": 70500, "epoch": 592, "lr": 3.966516247832508e-08} +{"train_loss": 0.00015938944125082344, "global_step": 70501, "epoch": 592, "lr": 3.9576980340200187e-08} +{"train_loss": 0.00025867504882626235, "global_step": 70502, "epoch": 592, "lr": 3.948889629402097e-08} +{"train_loss": 0.0002198580768890679, "global_step": 70503, "epoch": 592, "lr": 3.940091033997617e-08} +{"train_loss": 0.00018023345910478383, "global_step": 70504, "epoch": 592, "lr": 3.931302247822677e-08} +{"train_loss": 0.00019041211635340005, "global_step": 70505, "epoch": 592, "lr": 3.922523270894485e-08} +{"train_loss": 0.0002114870585501194, "global_step": 70506, "epoch": 592, "lr": 3.91375410323136e-08} +{"train_loss": 0.0003487720969133079, "global_step": 70507, "epoch": 592, "lr": 3.9049947448493995e-08} +{"train_loss": 0.00014915550127625465, "global_step": 70508, "epoch": 592, "lr": 3.896245195766368e-08} +{"train_loss": 0.00021382459090091288, "global_step": 70509, "epoch": 592, "lr": 3.887505455998919e-08} +{"train_loss": 0.00046394666424021125, "global_step": 70510, "epoch": 592, "lr": 3.87877552556537e-08} +{"train_loss": 0.000408283609431237, "global_step": 70511, "epoch": 592, "lr": 3.8700554044812656e-08} +{"train_loss": 0.00016862594929989427, "global_step": 70512, "epoch": 592, "lr": 3.861345092764923e-08} +{"train_loss": 0.00018368143355473876, "global_step": 70513, "epoch": 592, "lr": 3.8526445904329965e-08} +{"train_loss": 0.00022428999363910407, "global_step": 70514, "epoch": 592, "lr": 3.843953897502695e-08} +{"train_loss": 0.00047561866813339293, "global_step": 70515, "epoch": 592, "lr": 3.835273013991225e-08} +{"train_loss": 0.00015288259601220489, "global_step": 70516, "epoch": 592, "lr": 3.826601939915242e-08} +{"train_loss": 0.00016602185496594757, "global_step": 70517, "epoch": 592, "lr": 3.817940675291953e-08} +{"train_loss": 0.00018313714826945215, "global_step": 70518, "epoch": 592, "lr": 3.809289220138568e-08} +{"train_loss": 0.0002185544144595042, "global_step": 70519, "epoch": 592, "lr": 3.800647574471739e-08} +{"train_loss": 0.0003825818421319127, "global_step": 70520, "epoch": 592, "lr": 3.792015738308119e-08} +{"train_loss": 0.00031587094417773187, "global_step": 70521, "epoch": 592, "lr": 3.7833937116660276e-08} +{"train_loss": 0.0002730021660681814, "global_step": 70522, "epoch": 592, "lr": 3.774781494560453e-08} +{"train_loss": 0.0006053525721654296, "global_step": 70523, "epoch": 592, "lr": 3.7661790870102686e-08} +{"train_loss": 0.00017049387679435313, "global_step": 70524, "epoch": 592, "lr": 3.757586489031018e-08} +{"train_loss": 0.00021463833400048316, "global_step": 70525, "epoch": 592, "lr": 3.7490037006399085e-08} +{"train_loss": 0.00022855482529848814, "global_step": 70526, "epoch": 592, "lr": 3.740430721853594e-08} +{"train_loss": 0.00017619290156289935, "global_step": 70527, "epoch": 592, "lr": 3.7318675526898384e-08} +{"train_loss": 0.00027029518969357014, "global_step": 70528, "epoch": 592, "lr": 3.7233141931641846e-08} +{"train_loss": 0.0001796125143300742, "global_step": 70529, "epoch": 592, "lr": 3.7147706432943965e-08} +{"train_loss": 0.00031021327595226467, "global_step": 70530, "epoch": 592, "lr": 3.706236903096572e-08} +{"train_loss": 0.0002490542537998408, "global_step": 70531, "epoch": 592, "lr": 3.697712972588474e-08} +{"train_loss": 0.00025960299535654485, "global_step": 70532, "epoch": 592, "lr": 3.6891988517850917e-08} +{"train_loss": 0.00028077579918317497, "global_step": 70533, "epoch": 592, "lr": 3.6806945407052984e-08} +{"train_loss": 0.00020702247275039554, "global_step": 70534, "epoch": 592, "lr": 3.6722000393640824e-08} +{"train_loss": 0.00014315970474854112, "global_step": 70535, "epoch": 592, "lr": 3.6637153477786515e-08} +{"train_loss": 0.00021570175886154175, "global_step": 70536, "epoch": 592, "lr": 3.655240465965659e-08} +{"train_loss": 0.0005773731973022223, "global_step": 70537, "epoch": 592, "lr": 3.646775393942314e-08} +{"train_loss": 0.0005903256242163479, "global_step": 70538, "epoch": 592, "lr": 3.63832013172416e-08} +{"train_loss": 0.00023679361038375646, "global_step": 70539, "epoch": 592, "lr": 3.62987467932896e-08} +{"train_loss": 0.0006439037970267236, "global_step": 70540, "epoch": 592, "lr": 3.621439036772256e-08} +{"train_loss": 0.0003463217581156641, "global_step": 70541, "epoch": 592, "lr": 3.613013204071258e-08} +{"train_loss": 0.00026526296278461814, "global_step": 70542, "epoch": 592, "lr": 3.6045971812420645e-08} +{"train_loss": 0.00019534050079528242, "global_step": 70543, "epoch": 592, "lr": 3.596190968301882e-08} +{"train_loss": 0.0001993798796320334, "global_step": 70544, "epoch": 592, "lr": 3.587794565266811e-08} +{"train_loss": 0.00014496155199594796, "global_step": 70545, "epoch": 592, "lr": 3.579407972152948e-08} +{"train_loss": 0.0002462460834067315, "global_step": 70546, "epoch": 592, "lr": 3.571031188977503e-08} +{"train_loss": 0.00025982476654462516, "global_step": 70547, "epoch": 592, "lr": 3.5626642157560176e-08} +{"train_loss": 0.0002289453404955566, "global_step": 70548, "epoch": 592, "lr": 3.554307052505701e-08} +{"train_loss": 0.0001840681943576783, "global_step": 70549, "epoch": 592, "lr": 3.545959699243207e-08} +{"train_loss": 0.00011405973782530054, "global_step": 70550, "epoch": 592, "lr": 3.5376221559840775e-08} +{"train_loss": 0.00024503940949216485, "global_step": 70551, "epoch": 592, "lr": 3.5292944227444115e-08} +{"train_loss": 0.0001252470538020134, "global_step": 70552, "epoch": 592, "lr": 3.5209764995419726e-08} +{"train_loss": 0.0003069350204896182, "global_step": 70553, "epoch": 592, "lr": 3.512668386392304e-08} +{"train_loss": 0.00035113704507239163, "global_step": 70554, "epoch": 592, "lr": 3.5043700833115034e-08} +{"train_loss": 0.0002905826549977064, "global_step": 70555, "epoch": 592, "lr": 3.49608159031567e-08} +{"train_loss": 0.00017759570619091392, "global_step": 70556, "epoch": 592, "lr": 3.4878029074220106e-08} +{"train_loss": 0.0002909350150730461, "global_step": 70557, "epoch": 592, "lr": 3.4795340346460706e-08} +{"train_loss": 0.0003753096971195191, "global_step": 70558, "epoch": 592, "lr": 3.471274972004501e-08} +{"train_loss": 0.0004168597224634141, "global_step": 70559, "epoch": 592, "lr": 3.463025719512847e-08} +{"train_loss": 0.00016693949874024838, "global_step": 70560, "epoch": 592, "lr": 3.45478627718776e-08} +{"train_loss": 0.00033993992838077247, "global_step": 70561, "epoch": 592, "lr": 3.446556645045895e-08} +{"train_loss": 0.0008062417036853731, "global_step": 70562, "epoch": 592, "lr": 3.438336823102795e-08} +{"train_loss": 0.00017796644533518702, "global_step": 70563, "epoch": 592, "lr": 3.430126811374002e-08} +{"train_loss": 0.00032844682573340833, "global_step": 70564, "epoch": 592, "lr": 3.421926609877279e-08} +{"train_loss": 0.00023785268422216177, "global_step": 70565, "epoch": 592, "lr": 3.413736218627062e-08} +{"train_loss": 0.00027252399985543493, "global_step": 70566, "epoch": 592, "lr": 3.405555637640556e-08, "val_loss": 0.052641358226537704} +{"train_loss": 0.0001235866657225415, "global_step": 70567, "epoch": 593, "lr": 3.397384866933861e-08} +{"train_loss": 0.00035757405566982925, "global_step": 70568, "epoch": 593, "lr": 3.3892239065219654e-08} +{"train_loss": 0.00015534833073616028, "global_step": 70569, "epoch": 593, "lr": 3.381072756421522e-08} +{"train_loss": 0.0002663856721483171, "global_step": 70570, "epoch": 593, "lr": 3.372931416648628e-08} +{"train_loss": 0.0001803821069188416, "global_step": 70571, "epoch": 593, "lr": 3.364799887219383e-08} +{"train_loss": 0.0002299744519405067, "global_step": 70572, "epoch": 593, "lr": 3.35667816814933e-08} +{"train_loss": 0.0003648522251751274, "global_step": 70573, "epoch": 593, "lr": 3.3485662594545665e-08} +{"train_loss": 0.00019315215467941016, "global_step": 70574, "epoch": 593, "lr": 3.340464161151191e-08} +{"train_loss": 0.0001945450931088999, "global_step": 70575, "epoch": 593, "lr": 3.332371873255302e-08} +{"train_loss": 0.00022454843565355986, "global_step": 70576, "epoch": 593, "lr": 3.324289395781888e-08} +{"train_loss": 0.00016189877351280302, "global_step": 70577, "epoch": 593, "lr": 3.316216728748156e-08} +{"train_loss": 0.00035878579365089536, "global_step": 70578, "epoch": 593, "lr": 3.30815387216854e-08} +{"train_loss": 0.0003315051435492933, "global_step": 70579, "epoch": 593, "lr": 3.3001008260596934e-08} +{"train_loss": 0.00020379347552079707, "global_step": 70580, "epoch": 593, "lr": 3.292057590437714e-08} +{"train_loss": 0.0003123038331978023, "global_step": 70581, "epoch": 593, "lr": 3.2840241653175894e-08} +{"train_loss": 0.00023530835460405797, "global_step": 70582, "epoch": 593, "lr": 3.276000550715419e-08} +{"train_loss": 0.00015467792400158942, "global_step": 70583, "epoch": 593, "lr": 3.2679867466473e-08} +{"train_loss": 0.0002574605750851333, "global_step": 70584, "epoch": 593, "lr": 3.2599827531282214e-08} +{"train_loss": 0.00010986416600644588, "global_step": 70585, "epoch": 593, "lr": 3.2519885701742804e-08} +{"train_loss": 0.0002178541908506304, "global_step": 70586, "epoch": 593, "lr": 3.2440041978015754e-08} +{"train_loss": 0.00018018695118371397, "global_step": 70587, "epoch": 593, "lr": 3.23602963602565e-08} +{"train_loss": 0.0002856039209291339, "global_step": 70588, "epoch": 593, "lr": 3.2280648848614924e-08} +{"train_loss": 0.0004132393514737487, "global_step": 70589, "epoch": 593, "lr": 3.2201099443257556e-08} +{"train_loss": 0.00028962810756638646, "global_step": 70590, "epoch": 593, "lr": 3.212164814432872e-08} +{"train_loss": 0.00024551470414735377, "global_step": 70591, "epoch": 593, "lr": 3.204229495199496e-08} +{"train_loss": 0.00021267241390887648, "global_step": 70592, "epoch": 593, "lr": 3.196303986640614e-08} +{"train_loss": 0.00012671115109696984, "global_step": 70593, "epoch": 593, "lr": 3.188388288771771e-08} +{"train_loss": 0.0005595579859800637, "global_step": 70594, "epoch": 593, "lr": 3.180482401609064e-08} +{"train_loss": 0.00019318402337376028, "global_step": 70595, "epoch": 593, "lr": 3.172586325167481e-08} +{"train_loss": 0.000232522317674011, "global_step": 70596, "epoch": 593, "lr": 3.1647000594625664e-08} +{"train_loss": 0.0003293032350484282, "global_step": 70597, "epoch": 593, "lr": 3.156823604510417e-08} +{"train_loss": 0.0002571856020949781, "global_step": 70598, "epoch": 593, "lr": 3.1489569603254666e-08} +{"train_loss": 0.00016713558579795063, "global_step": 70599, "epoch": 593, "lr": 3.141100126923813e-08} +{"train_loss": 0.0002707421954255551, "global_step": 70600, "epoch": 593, "lr": 3.133253104320999e-08} +{"train_loss": 0.00015622707724105567, "global_step": 70601, "epoch": 593, "lr": 3.1254158925320133e-08} +{"train_loss": 0.00012598741159308702, "global_step": 70602, "epoch": 593, "lr": 3.117588491572399e-08} +{"train_loss": 0.00013215484796091914, "global_step": 70603, "epoch": 593, "lr": 3.109770901457698e-08} +{"train_loss": 0.00037114217411726713, "global_step": 70604, "epoch": 593, "lr": 3.1019631222034554e-08} +{"train_loss": 0.000199324989807792, "global_step": 70605, "epoch": 593, "lr": 3.094165153824102e-08} +{"train_loss": 0.00022001522302161902, "global_step": 70606, "epoch": 593, "lr": 3.086376996335738e-08} +{"train_loss": 0.00021306351118255407, "global_step": 70607, "epoch": 593, "lr": 3.0785986497533505e-08} +{"train_loss": 0.0001668160839471966, "global_step": 70608, "epoch": 593, "lr": 3.070830114092482e-08} +{"train_loss": 0.00043595838360488415, "global_step": 70609, "epoch": 593, "lr": 3.063071389368122e-08} +{"train_loss": 0.0002628345391713083, "global_step": 70610, "epoch": 593, "lr": 3.055322475595257e-08} +{"train_loss": 0.00013112995657138526, "global_step": 70611, "epoch": 593, "lr": 3.047583372789986e-08} +{"train_loss": 0.0002812978927977383, "global_step": 70612, "epoch": 593, "lr": 3.0398540809661866e-08} +{"train_loss": 0.00014326079690363258, "global_step": 70613, "epoch": 593, "lr": 3.0321346001405124e-08} +{"train_loss": 0.00021736827329732478, "global_step": 70614, "epoch": 593, "lr": 3.0244249303268413e-08} +{"train_loss": 0.0001659830886637792, "global_step": 70615, "epoch": 593, "lr": 3.016725071541271e-08} +{"train_loss": 0.0002521066926419735, "global_step": 70616, "epoch": 593, "lr": 3.009035023798234e-08} +{"train_loss": 0.00013396854046732187, "global_step": 70617, "epoch": 593, "lr": 3.001354787113275e-08} +{"train_loss": 0.00022078985057305545, "global_step": 70618, "epoch": 593, "lr": 2.993684361501381e-08} +{"train_loss": 0.00043701849062927067, "global_step": 70619, "epoch": 593, "lr": 2.98602374697754e-08} +{"train_loss": 0.00022582767996937037, "global_step": 70620, "epoch": 593, "lr": 2.9783729435567397e-08} +{"train_loss": 0.00021932614617981017, "global_step": 70621, "epoch": 593, "lr": 2.9707319512539688e-08} +{"train_loss": 0.0003837818221654743, "global_step": 70622, "epoch": 593, "lr": 2.963100770084215e-08} +{"train_loss": 0.00025716106756590307, "global_step": 70623, "epoch": 593, "lr": 2.9554794000630215e-08} +{"train_loss": 0.0002979868440888822, "global_step": 70624, "epoch": 593, "lr": 2.947867841204266e-08} +{"train_loss": 0.0001847317034844309, "global_step": 70625, "epoch": 593, "lr": 2.9402660935240466e-08} +{"train_loss": 0.0003441220324020833, "global_step": 70626, "epoch": 593, "lr": 2.9326741570362415e-08} +{"train_loss": 0.00014989185729064047, "global_step": 70627, "epoch": 593, "lr": 2.9250920317563934e-08} +{"train_loss": 0.00020963454153388739, "global_step": 70628, "epoch": 593, "lr": 2.9175197176994908e-08} +{"train_loss": 0.00019627904111985117, "global_step": 70629, "epoch": 593, "lr": 2.909957214880521e-08} +{"train_loss": 0.0003027397324331105, "global_step": 70630, "epoch": 593, "lr": 2.9024045233133623e-08} +{"train_loss": 0.0002158939023502171, "global_step": 70631, "epoch": 593, "lr": 2.8948616430135576e-08} +{"train_loss": 0.00027052330551669, "global_step": 70632, "epoch": 593, "lr": 2.8873285739960953e-08} +{"train_loss": 0.00043446573545224965, "global_step": 70633, "epoch": 593, "lr": 2.879805316275408e-08} +{"train_loss": 0.00020613058586604893, "global_step": 70634, "epoch": 593, "lr": 2.8722918698659283e-08} +{"train_loss": 0.00029351524426601827, "global_step": 70635, "epoch": 593, "lr": 2.8647882347837552e-08} +{"train_loss": 0.00016944107483141124, "global_step": 70636, "epoch": 593, "lr": 2.8572944110422106e-08} +{"train_loss": 0.00037379731656983495, "global_step": 70637, "epoch": 593, "lr": 2.849810398656283e-08} +{"train_loss": 0.00010785051563289016, "global_step": 70638, "epoch": 593, "lr": 2.8423361976409602e-08} +{"train_loss": 0.00020924820273648947, "global_step": 70639, "epoch": 593, "lr": 2.83487180801123e-08} +{"train_loss": 0.00027182704070582986, "global_step": 70640, "epoch": 593, "lr": 2.8274172297809708e-08} +{"train_loss": 0.0005875748465768993, "global_step": 70641, "epoch": 593, "lr": 2.81997246296517e-08} +{"train_loss": 0.0002071406488539651, "global_step": 70642, "epoch": 593, "lr": 2.8125375075788163e-08} +{"train_loss": 0.00017269552336074412, "global_step": 70643, "epoch": 593, "lr": 2.8051123636357867e-08} +{"train_loss": 0.00019492993305902928, "global_step": 70644, "epoch": 593, "lr": 2.7976970311510696e-08} +{"train_loss": 0.00035561254480853677, "global_step": 70645, "epoch": 593, "lr": 2.7902915101396532e-08} +{"train_loss": 0.00024154616403393447, "global_step": 70646, "epoch": 593, "lr": 2.7828958006154148e-08} +{"train_loss": 0.00014155088865663856, "global_step": 70647, "epoch": 593, "lr": 2.7755099025927878e-08} +{"train_loss": 0.0001750337687553838, "global_step": 70648, "epoch": 593, "lr": 2.7681338160867597e-08} +{"train_loss": 0.00046161943464539945, "global_step": 70649, "epoch": 593, "lr": 2.760767541111764e-08} +{"train_loss": 0.000223130700760521, "global_step": 70650, "epoch": 593, "lr": 2.753411077682233e-08} +{"train_loss": 0.00012470268120523542, "global_step": 70651, "epoch": 593, "lr": 2.746064425812045e-08} +{"train_loss": 0.00023109193716663867, "global_step": 70652, "epoch": 593, "lr": 2.7387275855167425e-08} +{"train_loss": 0.00024435180239379406, "global_step": 70653, "epoch": 593, "lr": 2.731400556809649e-08} +{"train_loss": 0.00027684858650900424, "global_step": 70654, "epoch": 593, "lr": 2.7240833397051967e-08} +{"train_loss": 0.00024497267440892756, "global_step": 70655, "epoch": 593, "lr": 2.716775934218929e-08} +{"train_loss": 0.0005921218544244766, "global_step": 70656, "epoch": 593, "lr": 2.7094783403636136e-08} +{"train_loss": 0.00020560092525556684, "global_step": 70657, "epoch": 593, "lr": 2.7021905581547935e-08} +{"train_loss": 0.00021811462647747248, "global_step": 70658, "epoch": 593, "lr": 2.6949125876063465e-08} +{"train_loss": 0.00014395771722774953, "global_step": 70659, "epoch": 593, "lr": 2.6876444287327053e-08} +{"train_loss": 0.0001441198110114783, "global_step": 70660, "epoch": 593, "lr": 2.6803860815477477e-08} +{"train_loss": 0.00011663023178698495, "global_step": 70661, "epoch": 593, "lr": 2.673137546065907e-08} +{"train_loss": 0.00025150104193016887, "global_step": 70662, "epoch": 593, "lr": 2.665898822301616e-08} +{"train_loss": 0.00016603460244368762, "global_step": 70663, "epoch": 593, "lr": 2.6586699102687517e-08} +{"train_loss": 0.0003195101162418723, "global_step": 70664, "epoch": 593, "lr": 2.651450809981748e-08} +{"train_loss": 0.0002900930121541023, "global_step": 70665, "epoch": 593, "lr": 2.6442415214550374e-08} +{"train_loss": 0.0004154388152528554, "global_step": 70666, "epoch": 593, "lr": 2.637042044701943e-08} +{"train_loss": 0.00026864418759942055, "global_step": 70667, "epoch": 593, "lr": 2.629852379737452e-08} +{"train_loss": 0.0003435949911363423, "global_step": 70668, "epoch": 593, "lr": 2.6226725265754425e-08} +{"train_loss": 0.00028274880605749786, "global_step": 70669, "epoch": 593, "lr": 2.6155024852297928e-08} +{"train_loss": 0.0002949197369161993, "global_step": 70670, "epoch": 593, "lr": 2.608342255714935e-08} +{"train_loss": 0.0003071261162403971, "global_step": 70671, "epoch": 593, "lr": 2.6011918380441925e-08} +{"train_loss": 0.0004293663369026035, "global_step": 70672, "epoch": 593, "lr": 2.5940512322325528e-08} +{"train_loss": 0.0002501929411664605, "global_step": 70673, "epoch": 593, "lr": 2.586920438293339e-08} +{"train_loss": 0.00019601227540988475, "global_step": 70674, "epoch": 593, "lr": 2.579799456240983e-08} +{"train_loss": 0.0001536528579890728, "global_step": 70675, "epoch": 593, "lr": 2.572688286089364e-08} +{"train_loss": 0.00036557772546075284, "global_step": 70676, "epoch": 593, "lr": 2.5655869278523593e-08} +{"train_loss": 0.0004501893126871437, "global_step": 70677, "epoch": 593, "lr": 2.558495381543846e-08} +{"train_loss": 0.00019604222325142473, "global_step": 70678, "epoch": 593, "lr": 2.551413647177703e-08} +{"train_loss": 0.0002677186275832355, "global_step": 70679, "epoch": 593, "lr": 2.544341724768362e-08} +{"train_loss": 0.0003388787736184895, "global_step": 70680, "epoch": 593, "lr": 2.5372796143291465e-08} +{"train_loss": 0.00027049449272453785, "global_step": 70681, "epoch": 593, "lr": 2.5302273158739343e-08} +{"train_loss": 0.00026552932104095817, "global_step": 70682, "epoch": 593, "lr": 2.5231848294166028e-08} +{"train_loss": 0.0002780173672363162, "global_step": 70683, "epoch": 593, "lr": 2.5161521549710298e-08} +{"train_loss": 0.000229400975513272, "global_step": 70684, "epoch": 593, "lr": 2.5091292925516486e-08} +{"train_loss": 0.0002535709910346156, "global_step": 70685, "epoch": 593, "lr": 2.5021162421712262e-08, "val_loss": 0.038081057369709015} +{"train_loss": 0.000207390941795893, "global_step": 70686, "epoch": 594, "lr": 2.495113003844196e-08} +{"train_loss": 0.00014189498324412853, "global_step": 70687, "epoch": 594, "lr": 2.4881195775838805e-08} +{"train_loss": 0.000271584780421108, "global_step": 70688, "epoch": 594, "lr": 2.4811359634041574e-08} +{"train_loss": 0.000224534553126432, "global_step": 70689, "epoch": 594, "lr": 2.47416216131946e-08} +{"train_loss": 0.0001764375192578882, "global_step": 70690, "epoch": 594, "lr": 2.467198171342e-08} +{"train_loss": 0.00033337032073177397, "global_step": 70691, "epoch": 594, "lr": 2.4602439934867662e-08} +{"train_loss": 0.00020675065752584487, "global_step": 70692, "epoch": 594, "lr": 2.4532996277670805e-08} +{"train_loss": 0.0005509564653038979, "global_step": 70693, "epoch": 594, "lr": 2.4463650741962663e-08} +{"train_loss": 0.000445462588686496, "global_step": 70694, "epoch": 594, "lr": 2.439440332788201e-08} +{"train_loss": 0.0002793603634927422, "global_step": 70695, "epoch": 594, "lr": 2.4325254035562072e-08} +{"train_loss": 0.00016210867033805698, "global_step": 70696, "epoch": 594, "lr": 2.425620286513608e-08} +{"train_loss": 0.00019962925580330193, "global_step": 70697, "epoch": 594, "lr": 2.418724981675391e-08} +{"train_loss": 0.00017837152699939907, "global_step": 70698, "epoch": 594, "lr": 2.4118394890532137e-08} +{"train_loss": 0.00015924072067718953, "global_step": 70699, "epoch": 594, "lr": 2.404963808662064e-08} +{"train_loss": 0.0002627465582918376, "global_step": 70700, "epoch": 594, "lr": 2.3980979405147096e-08} +{"train_loss": 0.0001987818832276389, "global_step": 70701, "epoch": 594, "lr": 2.3912418846244734e-08} +{"train_loss": 0.00020614356617443264, "global_step": 70702, "epoch": 594, "lr": 2.3843956410052327e-08} +{"train_loss": 0.00024073055828921497, "global_step": 70703, "epoch": 594, "lr": 2.3775592096703104e-08} +{"train_loss": 0.00015799864195287228, "global_step": 70704, "epoch": 594, "lr": 2.370732590633584e-08} +{"train_loss": 0.00017371481226291507, "global_step": 70705, "epoch": 594, "lr": 2.3639157839078217e-08} +{"train_loss": 0.00017392389418091625, "global_step": 70706, "epoch": 594, "lr": 2.357108789506346e-08} +{"train_loss": 0.00031294263317249715, "global_step": 70707, "epoch": 594, "lr": 2.350311607442479e-08} +{"train_loss": 0.0001324030599789694, "global_step": 70708, "epoch": 594, "lr": 2.343524237730099e-08} +{"train_loss": 0.00019771576626226306, "global_step": 70709, "epoch": 594, "lr": 2.336746680382529e-08} +{"train_loss": 0.00028236088110134006, "global_step": 70710, "epoch": 594, "lr": 2.329978935413091e-08} +{"train_loss": 0.00022608907602261752, "global_step": 70711, "epoch": 594, "lr": 2.3232210028339972e-08} +{"train_loss": 0.00029468300635926425, "global_step": 70712, "epoch": 594, "lr": 2.3164728826602366e-08} +{"train_loss": 0.00022834882838651538, "global_step": 70713, "epoch": 594, "lr": 2.309734574903466e-08} +{"train_loss": 0.00012044417962897569, "global_step": 70714, "epoch": 594, "lr": 2.303006079578118e-08} +{"train_loss": 0.0003732502809725702, "global_step": 70715, "epoch": 594, "lr": 2.296287396696406e-08} +{"train_loss": 0.00020686135394498706, "global_step": 70716, "epoch": 594, "lr": 2.2895785262722068e-08} +{"train_loss": 0.00020322548516560346, "global_step": 70717, "epoch": 594, "lr": 2.2828794683182887e-08} +{"train_loss": 0.0002597158891148865, "global_step": 70718, "epoch": 594, "lr": 2.276190222848529e-08} +{"train_loss": 0.0003361939743626863, "global_step": 70719, "epoch": 594, "lr": 2.26951078987514e-08} +{"train_loss": 0.0005108186160214245, "global_step": 70720, "epoch": 594, "lr": 2.262841169412e-08} +{"train_loss": 0.0001474193122703582, "global_step": 70721, "epoch": 594, "lr": 2.256181361471321e-08} +{"train_loss": 0.00017875220510177314, "global_step": 70722, "epoch": 594, "lr": 2.2495313660669815e-08} +{"train_loss": 0.00021688851120416075, "global_step": 70723, "epoch": 594, "lr": 2.2428911832117484e-08} +{"train_loss": 0.0003676269843708724, "global_step": 70724, "epoch": 594, "lr": 2.2362608129183894e-08} +{"train_loss": 0.0006842253496870399, "global_step": 70725, "epoch": 594, "lr": 2.2296402552007824e-08} +{"train_loss": 0.00021349903545342386, "global_step": 70726, "epoch": 594, "lr": 2.2230295100711396e-08} +{"train_loss": 0.00028761071735061705, "global_step": 70727, "epoch": 594, "lr": 2.2164285775422288e-08} +{"train_loss": 0.0003748527669813484, "global_step": 70728, "epoch": 594, "lr": 2.209837457627928e-08} +{"train_loss": 0.00026036155759356916, "global_step": 70729, "epoch": 594, "lr": 2.203256150340449e-08} +{"train_loss": 0.0005429012817330658, "global_step": 70730, "epoch": 594, "lr": 2.1966846556931152e-08} +{"train_loss": 0.0001628413301659748, "global_step": 70731, "epoch": 594, "lr": 2.1901229736981386e-08} +{"train_loss": 0.0003478265425655991, "global_step": 70732, "epoch": 594, "lr": 2.1835711043693975e-08} +{"train_loss": 0.00017744253273122013, "global_step": 70733, "epoch": 594, "lr": 2.1770290477191035e-08} +{"train_loss": 0.0001612408086657524, "global_step": 70734, "epoch": 594, "lr": 2.17049680376058e-08} +{"train_loss": 0.0006239679642021656, "global_step": 70735, "epoch": 594, "lr": 2.163974372506039e-08} +{"train_loss": 0.00014177963021211326, "global_step": 70736, "epoch": 594, "lr": 2.1574617539688035e-08} +{"train_loss": 0.0001720478176139295, "global_step": 70737, "epoch": 594, "lr": 2.150958948161086e-08} +{"train_loss": 0.0001227732573170215, "global_step": 70738, "epoch": 594, "lr": 2.1444659550962088e-08} +{"train_loss": 0.00025515450397506356, "global_step": 70739, "epoch": 594, "lr": 2.1379827747869395e-08} +{"train_loss": 0.0002955079253297299, "global_step": 70740, "epoch": 594, "lr": 2.131509407245491e-08} +{"train_loss": 0.0002426451101200655, "global_step": 70741, "epoch": 594, "lr": 2.1250458524851858e-08} +{"train_loss": 0.00018683689995668828, "global_step": 70742, "epoch": 594, "lr": 2.118592110518236e-08} +{"train_loss": 0.0003354460350237787, "global_step": 70743, "epoch": 594, "lr": 2.1121481813574096e-08} +{"train_loss": 0.00023908200091682374, "global_step": 70744, "epoch": 594, "lr": 2.105714065015474e-08} +{"train_loss": 0.0002476623049005866, "global_step": 70745, "epoch": 594, "lr": 2.0992897615051966e-08} +{"train_loss": 0.00022937754692975432, "global_step": 70746, "epoch": 594, "lr": 2.09287527083879e-08} +{"train_loss": 0.00027374213095754385, "global_step": 70747, "epoch": 594, "lr": 2.0864705930290218e-08} +{"train_loss": 0.00025784532772377133, "global_step": 70748, "epoch": 594, "lr": 2.0800757280886595e-08} +{"train_loss": 0.00015724713739473373, "global_step": 70749, "epoch": 594, "lr": 2.0736906760299158e-08} +{"train_loss": 0.00012871423678006977, "global_step": 70750, "epoch": 594, "lr": 2.067315436866113e-08} +{"train_loss": 0.00035375685547478497, "global_step": 70751, "epoch": 594, "lr": 2.0609500106083535e-08} +{"train_loss": 0.00037330706254579127, "global_step": 70752, "epoch": 594, "lr": 2.054594397270515e-08} +{"train_loss": 0.000300795043585822, "global_step": 70753, "epoch": 594, "lr": 2.04824859686481e-08} +{"train_loss": 0.00021003434085287154, "global_step": 70754, "epoch": 594, "lr": 2.041912609402896e-08} +{"train_loss": 0.00024163212219718844, "global_step": 70755, "epoch": 594, "lr": 2.0355864348975407e-08} +{"train_loss": 0.0004814917629119009, "global_step": 70756, "epoch": 594, "lr": 2.029270073362066e-08} +{"train_loss": 0.00016087584663182497, "global_step": 70757, "epoch": 594, "lr": 2.022963524807575e-08} +{"train_loss": 0.00021057380945421755, "global_step": 70758, "epoch": 594, "lr": 2.01666678924739e-08} +{"train_loss": 0.0004708584165200591, "global_step": 70759, "epoch": 594, "lr": 2.0103798666931684e-08} +{"train_loss": 0.000292579090455547, "global_step": 70760, "epoch": 594, "lr": 2.004102757158233e-08} +{"train_loss": 0.00017336975724902004, "global_step": 70761, "epoch": 594, "lr": 1.9978354606536854e-08} +{"train_loss": 0.00013041202328167856, "global_step": 70762, "epoch": 594, "lr": 1.9915779771928488e-08} +{"train_loss": 0.00044044648529961705, "global_step": 70763, "epoch": 594, "lr": 1.9853303067868257e-08} +{"train_loss": 0.0001546336425235495, "global_step": 70764, "epoch": 594, "lr": 1.9790924494494933e-08} +{"train_loss": 0.00023648879141546786, "global_step": 70765, "epoch": 594, "lr": 1.9728644051919543e-08} +{"train_loss": 0.0001838223688537255, "global_step": 70766, "epoch": 594, "lr": 1.966646174026421e-08} +{"train_loss": 0.00025242441915906966, "global_step": 70767, "epoch": 594, "lr": 1.9604377559662156e-08} +{"train_loss": 0.00021554787235800177, "global_step": 70768, "epoch": 594, "lr": 1.954239151021886e-08} +{"train_loss": 0.0002891231270041317, "global_step": 70769, "epoch": 594, "lr": 1.9480503592067545e-08} +{"train_loss": 0.0002928728936240077, "global_step": 70770, "epoch": 594, "lr": 1.9418713805330337e-08} +{"train_loss": 0.00024181317712645978, "global_step": 70771, "epoch": 594, "lr": 1.9357022150118253e-08} +{"train_loss": 0.00021391024347394705, "global_step": 70772, "epoch": 594, "lr": 1.9295428626564528e-08} +{"train_loss": 0.00020917868823744357, "global_step": 70773, "epoch": 594, "lr": 1.9233933234780176e-08} +{"train_loss": 0.0002558463893365115, "global_step": 70774, "epoch": 594, "lr": 1.917253597489288e-08} +{"train_loss": 0.0001682838483247906, "global_step": 70775, "epoch": 594, "lr": 1.911123684702476e-08} +{"train_loss": 0.0001827879750635475, "global_step": 70776, "epoch": 594, "lr": 1.905003585128684e-08} +{"train_loss": 0.0002588359056971967, "global_step": 70777, "epoch": 594, "lr": 1.8988932987801244e-08} +{"train_loss": 0.0003152137796860188, "global_step": 70778, "epoch": 594, "lr": 1.8927928256695647e-08} +{"train_loss": 0.00019382048049010336, "global_step": 70779, "epoch": 594, "lr": 1.8867021658086624e-08} +{"train_loss": 0.00031888551893644035, "global_step": 70780, "epoch": 594, "lr": 1.880621319209075e-08} +{"train_loss": 0.0005589648499153554, "global_step": 70781, "epoch": 594, "lr": 1.8745502858830146e-08} +{"train_loss": 0.0002035098586929962, "global_step": 70782, "epoch": 594, "lr": 1.8684890658421384e-08} +{"train_loss": 0.0003547771193552762, "global_step": 70783, "epoch": 594, "lr": 1.8624376590986593e-08} +{"train_loss": 0.0002952192153315991, "global_step": 70784, "epoch": 594, "lr": 1.8563960656642345e-08} +{"train_loss": 0.00019355086260475218, "global_step": 70785, "epoch": 594, "lr": 1.850364285550521e-08} +{"train_loss": 0.00036960295983590186, "global_step": 70786, "epoch": 594, "lr": 1.844342318770287e-08} +{"train_loss": 0.00021266748080961406, "global_step": 70787, "epoch": 594, "lr": 1.8383301653340788e-08} +{"train_loss": 0.00019689071632456034, "global_step": 70788, "epoch": 594, "lr": 1.832327825254665e-08} +{"train_loss": 0.00044615997467190027, "global_step": 70789, "epoch": 594, "lr": 1.826335298543702e-08} +{"train_loss": 0.0002669718232937157, "global_step": 70790, "epoch": 594, "lr": 1.8203525852122927e-08} +{"train_loss": 0.0002452078624628484, "global_step": 70791, "epoch": 594, "lr": 1.8143796852726492e-08} +{"train_loss": 0.00028428336372599006, "global_step": 70792, "epoch": 594, "lr": 1.808416598736984e-08} +{"train_loss": 0.00026338870520703495, "global_step": 70793, "epoch": 594, "lr": 1.8024633256163992e-08} +{"train_loss": 0.00024044944439083338, "global_step": 70794, "epoch": 594, "lr": 1.7965198659225523e-08} +{"train_loss": 0.0004301051958464086, "global_step": 70795, "epoch": 594, "lr": 1.790586219667101e-08} +{"train_loss": 0.00018104605260305107, "global_step": 70796, "epoch": 594, "lr": 1.7846623868617018e-08} +{"train_loss": 0.00019289154442958534, "global_step": 70797, "epoch": 594, "lr": 1.778748367518568e-08} +{"train_loss": 0.0002532225043978542, "global_step": 70798, "epoch": 594, "lr": 1.7728441616488013e-08} +{"train_loss": 0.00021553556143771857, "global_step": 70799, "epoch": 594, "lr": 1.766949769264059e-08} +{"train_loss": 0.0002704460348468274, "global_step": 70800, "epoch": 594, "lr": 1.761065190375999e-08} +{"train_loss": 0.0002863546251319349, "global_step": 70801, "epoch": 594, "lr": 1.755190424995723e-08} +{"train_loss": 0.00011645837366813794, "global_step": 70802, "epoch": 594, "lr": 1.7493254731354437e-08} +{"train_loss": 0.00024659567861817777, "global_step": 70803, "epoch": 594, "lr": 1.743470334806263e-08} +{"train_loss": 0.0002616479968531801, "global_step": 70804, "epoch": 594, "lr": 1.737625010019839e-08, "val_loss": 0.028964901342988014} +{"train_loss": 0.0002664337807800621, "global_step": 70805, "epoch": 595, "lr": 1.731789498787828e-08} +{"train_loss": 0.00020836609473917633, "global_step": 70806, "epoch": 595, "lr": 1.725963801121333e-08} +{"train_loss": 0.00021592387929558754, "global_step": 70807, "epoch": 595, "lr": 1.720147917032011e-08} +{"train_loss": 0.00022134596656542271, "global_step": 70808, "epoch": 595, "lr": 1.7143418465309646e-08} +{"train_loss": 0.00018022024596575648, "global_step": 70809, "epoch": 595, "lr": 1.7085455896298508e-08} +{"train_loss": 0.0002531750069465488, "global_step": 70810, "epoch": 595, "lr": 1.7027591463397717e-08} +{"train_loss": 0.00033563963370397687, "global_step": 70811, "epoch": 595, "lr": 1.6969825166729402e-08} +{"train_loss": 0.0004457762697711587, "global_step": 70812, "epoch": 595, "lr": 1.691215700639348e-08} +{"train_loss": 0.00012121503823436797, "global_step": 70813, "epoch": 595, "lr": 1.685458698251763e-08} +{"train_loss": 0.00019555093604139984, "global_step": 70814, "epoch": 595, "lr": 1.6797115095207316e-08} +{"train_loss": 0.00020912123727612197, "global_step": 70815, "epoch": 595, "lr": 1.673974134457357e-08} +{"train_loss": 0.0002837768697645515, "global_step": 70816, "epoch": 595, "lr": 1.6682465730727402e-08} +{"train_loss": 0.0001407966046826914, "global_step": 70817, "epoch": 595, "lr": 1.662528825379095e-08} +{"train_loss": 0.00013274833327159286, "global_step": 70818, "epoch": 595, "lr": 1.6568208913869677e-08} +{"train_loss": 0.000334506097715348, "global_step": 70819, "epoch": 595, "lr": 1.6511227711074605e-08} +{"train_loss": 0.00046649493742734194, "global_step": 70820, "epoch": 595, "lr": 1.6454344645522314e-08} +{"train_loss": 0.00019021106709260494, "global_step": 70821, "epoch": 595, "lr": 1.6397559717323818e-08} +{"train_loss": 0.00016538404452148825, "global_step": 70822, "epoch": 595, "lr": 1.6340872926584594e-08} +{"train_loss": 0.0001854083820944652, "global_step": 70823, "epoch": 595, "lr": 1.6284284273421213e-08} +{"train_loss": 0.00030318103381432593, "global_step": 70824, "epoch": 595, "lr": 1.6227793757944697e-08} +{"train_loss": 0.00043026753701269627, "global_step": 70825, "epoch": 595, "lr": 1.617140138026607e-08} +{"train_loss": 0.00031371103250421584, "global_step": 70826, "epoch": 595, "lr": 1.6115107140490804e-08} +{"train_loss": 0.00036268390249460936, "global_step": 70827, "epoch": 595, "lr": 1.6058911038735468e-08} +{"train_loss": 0.00014874628686811775, "global_step": 70828, "epoch": 595, "lr": 1.600281307511109e-08} +{"train_loss": 0.00022713006183039397, "global_step": 70829, "epoch": 595, "lr": 1.5946813249723137e-08} +{"train_loss": 0.00018331505998503417, "global_step": 70830, "epoch": 595, "lr": 1.589091156268263e-08} +{"train_loss": 0.00017679909069556743, "global_step": 70831, "epoch": 595, "lr": 1.5835108014100598e-08} +{"train_loss": 0.00013348912762012333, "global_step": 70832, "epoch": 595, "lr": 1.5779402604088057e-08} +{"train_loss": 0.0006824524607509375, "global_step": 70833, "epoch": 595, "lr": 1.572379533275048e-08} +{"train_loss": 0.0001706880866549909, "global_step": 70834, "epoch": 595, "lr": 1.566828620020444e-08} +{"train_loss": 0.0002627458597999066, "global_step": 70835, "epoch": 595, "lr": 1.561287520654986e-08} +{"train_loss": 0.00017869654402602464, "global_step": 70836, "epoch": 595, "lr": 1.555756235189776e-08} +{"train_loss": 0.00019224129209760576, "global_step": 70837, "epoch": 595, "lr": 1.550234763635916e-08} +{"train_loss": 0.0003172899305354804, "global_step": 70838, "epoch": 595, "lr": 1.5447231060039535e-08} +{"train_loss": 0.00033711930154822767, "global_step": 70839, "epoch": 595, "lr": 1.5392212623055457e-08} +{"train_loss": 0.00017171241051983088, "global_step": 70840, "epoch": 595, "lr": 1.5337292325501296e-08} +{"train_loss": 0.00021624779037665576, "global_step": 70841, "epoch": 595, "lr": 1.5282470167499176e-08} +{"train_loss": 0.00016943724767770618, "global_step": 70842, "epoch": 595, "lr": 1.522774614914346e-08} +{"train_loss": 0.00023850359139032662, "global_step": 70843, "epoch": 595, "lr": 1.5173120270550732e-08} +{"train_loss": 0.00019221568072680384, "global_step": 70844, "epoch": 595, "lr": 1.5118592531826458e-08} +{"train_loss": 0.00011418096983106807, "global_step": 70845, "epoch": 595, "lr": 1.506416293307611e-08} +{"train_loss": 0.0001675598614383489, "global_step": 70846, "epoch": 595, "lr": 1.500983147441071e-08} +{"train_loss": 0.00015702701057307422, "global_step": 70847, "epoch": 595, "lr": 1.4955598155930172e-08} +{"train_loss": 0.0001270921202376485, "global_step": 70848, "epoch": 595, "lr": 1.490146297773998e-08} +{"train_loss": 0.00023607599723618478, "global_step": 70849, "epoch": 595, "lr": 1.4847425939956694e-08} +{"train_loss": 0.00016896630404517055, "global_step": 70850, "epoch": 595, "lr": 1.4793487042680243e-08} +{"train_loss": 0.0001718887797323987, "global_step": 70851, "epoch": 595, "lr": 1.4739646286010544e-08} +{"train_loss": 0.00014529464533552527, "global_step": 70852, "epoch": 595, "lr": 1.4685903670064172e-08} +{"train_loss": 0.0003490361268632114, "global_step": 70853, "epoch": 595, "lr": 1.4632259194941044e-08} +{"train_loss": 0.0002968856133520603, "global_step": 70854, "epoch": 595, "lr": 1.4578712860752186e-08} +{"train_loss": 0.00016597261128481477, "global_step": 70855, "epoch": 595, "lr": 1.4525264667591965e-08} +{"train_loss": 0.00029579398687928915, "global_step": 70856, "epoch": 595, "lr": 1.4471914615571402e-08} +{"train_loss": 0.00016685952141415328, "global_step": 70857, "epoch": 595, "lr": 1.4418662704795972e-08} +{"train_loss": 0.0002076844102703035, "global_step": 70858, "epoch": 595, "lr": 1.4365508935371141e-08} +{"train_loss": 0.00031006537028588355, "global_step": 70859, "epoch": 595, "lr": 1.4312453307396834e-08} +{"train_loss": 0.0002845051931217313, "global_step": 70860, "epoch": 595, "lr": 1.425949582097852e-08} +{"train_loss": 0.00020604401652235538, "global_step": 70861, "epoch": 595, "lr": 1.4206636476227219e-08} +{"train_loss": 0.00021461841242853552, "global_step": 70862, "epoch": 595, "lr": 1.4153875273237305e-08} +{"train_loss": 0.0002650628739502281, "global_step": 70863, "epoch": 595, "lr": 1.4101212212114245e-08} +{"train_loss": 0.00019169824372511357, "global_step": 70864, "epoch": 595, "lr": 1.4048647292963513e-08} +{"train_loss": 0.00017744017532095313, "global_step": 70865, "epoch": 595, "lr": 1.3996180515890578e-08} +{"train_loss": 0.000179430513526313, "global_step": 70866, "epoch": 595, "lr": 1.394381188099536e-08} +{"train_loss": 0.00018754925986286253, "global_step": 70867, "epoch": 595, "lr": 1.3891541388383334e-08} +{"train_loss": 0.00023200320720206946, "global_step": 70868, "epoch": 595, "lr": 1.3839369038154415e-08} +{"train_loss": 0.00036535030812956393, "global_step": 70869, "epoch": 595, "lr": 1.3787294830408525e-08} +{"train_loss": 0.0002487432211637497, "global_step": 70870, "epoch": 595, "lr": 1.3735318765251138e-08} +{"train_loss": 0.00015792009071446955, "global_step": 70871, "epoch": 595, "lr": 1.368344084278772e-08} +{"train_loss": 0.00012268322461750358, "global_step": 70872, "epoch": 595, "lr": 1.3631661063112644e-08} +{"train_loss": 0.0001567252038512379, "global_step": 70873, "epoch": 595, "lr": 1.3579979426331379e-08} +{"train_loss": 0.00013352416863199323, "global_step": 70874, "epoch": 595, "lr": 1.3528395932549398e-08} +{"train_loss": 0.00016059998597484082, "global_step": 70875, "epoch": 595, "lr": 1.3476910581861069e-08} +{"train_loss": 0.0002625317429192364, "global_step": 70876, "epoch": 595, "lr": 1.3425523374371863e-08} +{"train_loss": 0.00023393650189973414, "global_step": 70877, "epoch": 595, "lr": 1.33742343101817e-08} +{"train_loss": 0.00020366735407151282, "global_step": 70878, "epoch": 595, "lr": 1.3323043389390499e-08} +{"train_loss": 0.0003768467577174306, "global_step": 70879, "epoch": 595, "lr": 1.3271950612103734e-08} +{"train_loss": 0.0002633322146721184, "global_step": 70880, "epoch": 595, "lr": 1.3220955978410221e-08} +{"train_loss": 0.0002590907970443368, "global_step": 70881, "epoch": 595, "lr": 1.3170059488420982e-08} +{"train_loss": 0.00012251263251528144, "global_step": 70882, "epoch": 595, "lr": 1.3119261142230388e-08} +{"train_loss": 0.0001953213504748419, "global_step": 70883, "epoch": 595, "lr": 1.3068560939938356e-08} +{"train_loss": 0.0002105949679389596, "global_step": 70884, "epoch": 595, "lr": 1.3017958881650361e-08} +{"train_loss": 0.0006603454821743071, "global_step": 70885, "epoch": 595, "lr": 1.2967454967455216e-08} +{"train_loss": 0.0001790059613995254, "global_step": 70886, "epoch": 595, "lr": 1.2917049197463949e-08} +{"train_loss": 0.0001689092896413058, "global_step": 70887, "epoch": 595, "lr": 1.2866741571765373e-08} +{"train_loss": 0.0002746300306171179, "global_step": 70888, "epoch": 595, "lr": 1.2816532090464961e-08} +{"train_loss": 0.00031834380934014916, "global_step": 70889, "epoch": 595, "lr": 1.2766420753657082e-08} +{"train_loss": 0.0003519412421155721, "global_step": 70890, "epoch": 595, "lr": 1.2716407561447208e-08} +{"train_loss": 0.00024863236467354, "global_step": 70891, "epoch": 595, "lr": 1.2666492513924155e-08} +{"train_loss": 0.00010622843547025695, "global_step": 70892, "epoch": 595, "lr": 1.2616675611187845e-08} +{"train_loss": 0.00024785788264125586, "global_step": 70893, "epoch": 595, "lr": 1.2566956853343748e-08} +{"train_loss": 0.00023703830083832145, "global_step": 70894, "epoch": 595, "lr": 1.251733624048068e-08} +{"train_loss": 0.00018780746904667467, "global_step": 70895, "epoch": 595, "lr": 1.2467813772698566e-08} +{"train_loss": 0.00020265394414309412, "global_step": 70896, "epoch": 595, "lr": 1.2418389450097323e-08} +{"train_loss": 0.00024793142802082, "global_step": 70897, "epoch": 595, "lr": 1.236906327277132e-08} +{"train_loss": 0.00016126708942465484, "global_step": 70898, "epoch": 595, "lr": 1.2319835240820476e-08} +{"train_loss": 0.0001798281737137586, "global_step": 70899, "epoch": 595, "lr": 1.2270705354333612e-08} +{"train_loss": 0.00021490063227247447, "global_step": 70900, "epoch": 595, "lr": 1.2221673613416197e-08} +{"train_loss": 0.0003274570917710662, "global_step": 70901, "epoch": 595, "lr": 1.2172740018162599e-08} +{"train_loss": 0.00019349234935361892, "global_step": 70902, "epoch": 595, "lr": 1.2123904568667188e-08} +{"train_loss": 0.0002257407904835418, "global_step": 70903, "epoch": 595, "lr": 1.2075167265024335e-08} +{"train_loss": 0.00028239883249625564, "global_step": 70904, "epoch": 595, "lr": 1.2026528107333956e-08} +{"train_loss": 0.00027177517767995596, "global_step": 70905, "epoch": 595, "lr": 1.1977987095690424e-08} +{"train_loss": 0.00036517338594421744, "global_step": 70906, "epoch": 595, "lr": 1.1929544230182555e-08} +{"train_loss": 0.00020821907673962414, "global_step": 70907, "epoch": 595, "lr": 1.1881199510910269e-08} +{"train_loss": 0.000329650443745777, "global_step": 70908, "epoch": 595, "lr": 1.1832952937973485e-08} +{"train_loss": 0.0001941635418916121, "global_step": 70909, "epoch": 595, "lr": 1.1784804511461022e-08} +{"train_loss": 0.00018364688730798662, "global_step": 70910, "epoch": 595, "lr": 1.1736754231467251e-08} +{"train_loss": 0.00020715106802526861, "global_step": 70911, "epoch": 595, "lr": 1.1688802098086537e-08} +{"train_loss": 0.000152048742165789, "global_step": 70912, "epoch": 595, "lr": 1.1640948111418803e-08} +{"train_loss": 0.00034597545163705945, "global_step": 70913, "epoch": 595, "lr": 1.1593192271552867e-08} +{"train_loss": 0.00028493322315625846, "global_step": 70914, "epoch": 595, "lr": 1.1545534578577544e-08} +{"train_loss": 0.0002798447385430336, "global_step": 70915, "epoch": 595, "lr": 1.1497975032598308e-08} +{"train_loss": 0.00020681406022049487, "global_step": 70916, "epoch": 595, "lr": 1.1450513633698423e-08} +{"train_loss": 0.00014088393072597682, "global_step": 70917, "epoch": 595, "lr": 1.1403150381977812e-08} +{"train_loss": 0.0003615494933910668, "global_step": 70918, "epoch": 595, "lr": 1.1355885277525292e-08} +{"train_loss": 0.0003274009795859456, "global_step": 70919, "epoch": 595, "lr": 1.1308718320435229e-08} +{"train_loss": 0.00021083882893435657, "global_step": 70920, "epoch": 595, "lr": 1.1261649510796447e-08} +{"train_loss": 0.00021567037038039416, "global_step": 70921, "epoch": 595, "lr": 1.121467884870886e-08} +{"train_loss": 0.0002998652053065598, "global_step": 70922, "epoch": 595, "lr": 1.1167806334261289e-08} +{"train_loss": 0.00023746648531880606, "global_step": 70923, "epoch": 595, "lr": 1.112103196754255e-08, "val_loss": 0.01200889516621828, "train_action_mse_error": 3.2588573048997205e-06} +{"train_loss": 0.0001266721956199035, "global_step": 70924, "epoch": 596, "lr": 1.1074355748652565e-08} +{"train_loss": 0.0001229949702974409, "global_step": 70925, "epoch": 596, "lr": 1.1027777677669048e-08} +{"train_loss": 0.00021004007430747151, "global_step": 70926, "epoch": 596, "lr": 1.0981297754697473e-08} +{"train_loss": 0.0001884098892332986, "global_step": 70927, "epoch": 596, "lr": 1.0934915979826654e-08} +{"train_loss": 0.00019357327255420387, "global_step": 70928, "epoch": 596, "lr": 1.088863235313986e-08} +{"train_loss": 0.00024376169312745333, "global_step": 70929, "epoch": 596, "lr": 1.084244687473146e-08} +{"train_loss": 0.0003255071642342955, "global_step": 70930, "epoch": 596, "lr": 1.0796359544695823e-08} +{"train_loss": 0.0002522706054151058, "global_step": 70931, "epoch": 596, "lr": 1.0750370363121765e-08} +{"train_loss": 0.00022630474995821714, "global_step": 70932, "epoch": 596, "lr": 1.0704479330098105e-08} +{"train_loss": 0.0002994140377268195, "global_step": 70933, "epoch": 596, "lr": 1.065868644571366e-08} +{"train_loss": 0.00018715806072577834, "global_step": 70934, "epoch": 596, "lr": 1.0612991710062802e-08} +{"train_loss": 0.00016589944425504655, "global_step": 70935, "epoch": 596, "lr": 1.0567395123228796e-08} +{"train_loss": 0.00028357404517009854, "global_step": 70936, "epoch": 596, "lr": 1.052189668531156e-08} +{"train_loss": 0.00025177994393743575, "global_step": 70937, "epoch": 596, "lr": 1.0476496396388812e-08} +{"train_loss": 0.00015450389764737338, "global_step": 70938, "epoch": 596, "lr": 1.043119425655492e-08} +{"train_loss": 0.00029467433341778815, "global_step": 70939, "epoch": 596, "lr": 1.0385990265898705e-08} +{"train_loss": 0.00014143118460197002, "global_step": 70940, "epoch": 596, "lr": 1.0340884424514529e-08} +{"train_loss": 0.00032049953006207943, "global_step": 70941, "epoch": 596, "lr": 1.0295876732480114e-08} +{"train_loss": 0.00020735643920488656, "global_step": 70942, "epoch": 596, "lr": 1.0250967189889826e-08} +{"train_loss": 0.0003045816847588867, "global_step": 70943, "epoch": 596, "lr": 1.0206155796832484e-08} +{"train_loss": 0.0002221212926087901, "global_step": 70944, "epoch": 596, "lr": 1.0161442553391353e-08} +{"train_loss": 0.00028887955704703927, "global_step": 70945, "epoch": 596, "lr": 1.0116827459660805e-08} +{"train_loss": 0.00025297619868069887, "global_step": 70946, "epoch": 596, "lr": 1.0072310515724103e-08} +{"train_loss": 0.0003004370955750346, "global_step": 70947, "epoch": 596, "lr": 1.002789172167562e-08} +{"train_loss": 0.00025885627837851644, "global_step": 70948, "epoch": 596, "lr": 9.983571077587517e-09} +{"train_loss": 0.0002115388197125867, "global_step": 70949, "epoch": 596, "lr": 9.939348583559715e-09} +{"train_loss": 0.0002816622145473957, "global_step": 70950, "epoch": 596, "lr": 9.895224239675482e-09} +{"train_loss": 0.0002139483403880149, "global_step": 70951, "epoch": 596, "lr": 9.851198046023635e-09} +{"train_loss": 0.0002908699098043144, "global_step": 70952, "epoch": 596, "lr": 9.80727000268744e-09} +{"train_loss": 0.00023926440917421132, "global_step": 70953, "epoch": 596, "lr": 9.763440109750166e-09} +{"train_loss": 0.00020170614880044013, "global_step": 70954, "epoch": 596, "lr": 9.71970836730618e-09} +{"train_loss": 0.0006000557914376259, "global_step": 70955, "epoch": 596, "lr": 9.676074775433196e-09} +{"train_loss": 0.00018762679246719927, "global_step": 70956, "epoch": 596, "lr": 9.632539334225587e-09} +{"train_loss": 0.00014373564044944942, "global_step": 70957, "epoch": 596, "lr": 9.589102043755515e-09} +{"train_loss": 0.00022655443171970546, "global_step": 70958, "epoch": 596, "lr": 9.545762904122902e-09} +{"train_loss": 0.00022413089754991233, "global_step": 70959, "epoch": 596, "lr": 9.50252191540546e-09} +{"train_loss": 0.0003077885485254228, "global_step": 70960, "epoch": 596, "lr": 9.45937907769201e-09} +{"train_loss": 0.0002593327662907541, "global_step": 70961, "epoch": 596, "lr": 9.416334391060266e-09} +{"train_loss": 0.00022353135864250362, "global_step": 70962, "epoch": 596, "lr": 9.373387855599048e-09} +{"train_loss": 0.0001530966255813837, "global_step": 70963, "epoch": 596, "lr": 9.330539471391619e-09} +{"train_loss": 0.0006043772445991635, "global_step": 70964, "epoch": 596, "lr": 9.287789238526801e-09} +{"train_loss": 0.00024979302543215454, "global_step": 70965, "epoch": 596, "lr": 9.245137157082306e-09} +{"train_loss": 0.000184062504558824, "global_step": 70966, "epoch": 596, "lr": 9.202583227141403e-09} +{"train_loss": 0.0003039553703274578, "global_step": 70967, "epoch": 596, "lr": 9.16012744879291e-09} +{"train_loss": 0.00013856087753083557, "global_step": 70968, "epoch": 596, "lr": 9.117769822120092e-09} +{"train_loss": 0.00012939800217282027, "global_step": 70969, "epoch": 596, "lr": 9.075510347200667e-09} +{"train_loss": 0.00029537169029936194, "global_step": 70970, "epoch": 596, "lr": 9.03334902412345e-09} +{"train_loss": 0.00012856983812525868, "global_step": 70971, "epoch": 596, "lr": 8.991285852966157e-09} +{"train_loss": 0.00033465647720731795, "global_step": 70972, "epoch": 596, "lr": 8.94932083381761e-09} +{"train_loss": 0.00031149116693995893, "global_step": 70973, "epoch": 596, "lr": 8.907453966749967e-09} +{"train_loss": 0.00045483894064091146, "global_step": 70974, "epoch": 596, "lr": 8.865685251857602e-09} +{"train_loss": 0.00028692540945485234, "global_step": 70975, "epoch": 596, "lr": 8.824014689212678e-09} +{"train_loss": 0.0005625435151159763, "global_step": 70976, "epoch": 596, "lr": 8.782442278904013e-09} +{"train_loss": 0.0001537227799417451, "global_step": 70977, "epoch": 596, "lr": 8.740968021009322e-09} +{"train_loss": 0.00015732103202026337, "global_step": 70978, "epoch": 596, "lr": 8.699591915611872e-09} +{"train_loss": 0.0002007342700380832, "global_step": 70979, "epoch": 596, "lr": 8.658313962789377e-09} +{"train_loss": 0.00019396902644075453, "global_step": 70980, "epoch": 596, "lr": 8.617134162625106e-09} +{"train_loss": 0.00043777620885521173, "global_step": 70981, "epoch": 596, "lr": 8.576052515202326e-09} +{"train_loss": 0.0002529911871533841, "global_step": 70982, "epoch": 596, "lr": 8.535069020598752e-09} +{"train_loss": 0.0003405522438697517, "global_step": 70983, "epoch": 596, "lr": 8.494183678897649e-09} +{"train_loss": 0.00019055099983233958, "global_step": 70984, "epoch": 596, "lr": 8.453396490176734e-09} +{"train_loss": 0.00027650390984490514, "global_step": 70985, "epoch": 596, "lr": 8.412707454513724e-09} +{"train_loss": 0.0002802979142870754, "global_step": 70986, "epoch": 596, "lr": 8.372116571997434e-09} +{"train_loss": 0.00010839650349225849, "global_step": 70987, "epoch": 596, "lr": 8.33162384269448e-09} +{"train_loss": 0.00016938317276071757, "global_step": 70988, "epoch": 596, "lr": 8.29122926669923e-09} +{"train_loss": 0.0002585817710496485, "global_step": 70989, "epoch": 596, "lr": 8.250932844078297e-09} +{"train_loss": 0.0003134209255222231, "global_step": 70990, "epoch": 596, "lr": 8.210734574914947e-09} +{"train_loss": 0.0003503229236230254, "global_step": 70991, "epoch": 596, "lr": 8.170634459292447e-09} +{"train_loss": 0.0001781356695573777, "global_step": 70992, "epoch": 596, "lr": 8.130632497282964e-09} +{"train_loss": 0.00018996560538653284, "global_step": 70993, "epoch": 596, "lr": 8.090728688969762e-09} +{"train_loss": 0.0004058894992340356, "global_step": 70994, "epoch": 596, "lr": 8.050923034430558e-09} +{"train_loss": 0.00024246957036666572, "global_step": 70995, "epoch": 596, "lr": 8.011215533743067e-09} +{"train_loss": 0.00028642715187743306, "global_step": 70996, "epoch": 596, "lr": 7.971606186979453e-09} +{"train_loss": 0.00019089426496066153, "global_step": 70997, "epoch": 596, "lr": 7.932094994228534e-09} +{"train_loss": 0.00016084393428172916, "global_step": 70998, "epoch": 596, "lr": 7.892681955562476e-09} +{"train_loss": 0.0002598916762508452, "global_step": 70999, "epoch": 596, "lr": 7.853367071053442e-09} +{"train_loss": 0.00030925750616006553, "global_step": 71000, "epoch": 596, "lr": 7.814150340784699e-09} +{"train_loss": 0.0002817180356942117, "global_step": 71001, "epoch": 596, "lr": 7.775031764833962e-09} +{"train_loss": 0.0002037023805314675, "global_step": 71002, "epoch": 596, "lr": 7.736011343273397e-09} +{"train_loss": 0.00029314623679965734, "global_step": 71003, "epoch": 596, "lr": 7.69708907618627e-09} +{"train_loss": 0.0002954629308078438, "global_step": 71004, "epoch": 596, "lr": 7.658264963644745e-09} +{"train_loss": 0.00018516412819735706, "global_step": 71005, "epoch": 596, "lr": 7.619539005720988e-09} +{"train_loss": 0.0003047127975150943, "global_step": 71006, "epoch": 596, "lr": 7.580911202498264e-09} +{"train_loss": 0.00016319594578817487, "global_step": 71007, "epoch": 596, "lr": 7.542381554048739e-09} +{"train_loss": 0.0001942394010256976, "global_step": 71008, "epoch": 596, "lr": 7.503950060450127e-09} +{"train_loss": 0.00026234282995574176, "global_step": 71009, "epoch": 596, "lr": 7.465616721774592e-09} +{"train_loss": 0.0001892372383736074, "global_step": 71010, "epoch": 596, "lr": 7.427381538099853e-09} +{"train_loss": 0.00020305511134210974, "global_step": 71011, "epoch": 596, "lr": 7.389244509503623e-09} +{"train_loss": 0.00014704822388011962, "global_step": 71012, "epoch": 596, "lr": 7.351205636052516e-09} +{"train_loss": 0.00015101286408025771, "global_step": 71013, "epoch": 596, "lr": 7.313264917829799e-09} +{"train_loss": 0.00028024683706462383, "global_step": 71014, "epoch": 596, "lr": 7.275422354907635e-09} +{"train_loss": 0.00023569918994326144, "global_step": 71015, "epoch": 596, "lr": 7.237677947352639e-09} +{"train_loss": 0.00020616812980733812, "global_step": 71016, "epoch": 596, "lr": 7.200031695253629e-09} +{"train_loss": 0.00023189916100818664, "global_step": 71017, "epoch": 596, "lr": 7.1624835986716656e-09} +{"train_loss": 0.0003539584868121892, "global_step": 71018, "epoch": 596, "lr": 7.125033657684466e-09} +{"train_loss": 0.0001241272984771058, "global_step": 71019, "epoch": 596, "lr": 7.0876818723697446e-09} +{"train_loss": 0.0001556043716846034, "global_step": 71020, "epoch": 596, "lr": 7.050428242799667e-09} +{"train_loss": 0.0002406940038781613, "global_step": 71021, "epoch": 596, "lr": 7.013272769040846e-09} +{"train_loss": 0.0005747855757363141, "global_step": 71022, "epoch": 596, "lr": 6.976215451170997e-09} +{"train_loss": 0.00027410019538365304, "global_step": 71023, "epoch": 596, "lr": 6.939256289262286e-09} +{"train_loss": 0.00029375177109614015, "global_step": 71024, "epoch": 596, "lr": 6.9023952833868754e-09} +{"train_loss": 0.0001226390595547855, "global_step": 71025, "epoch": 596, "lr": 6.865632433616931e-09} +{"train_loss": 0.00017097657837439328, "global_step": 71026, "epoch": 596, "lr": 6.828967740030167e-09} +{"train_loss": 0.0004314898105803877, "global_step": 71027, "epoch": 596, "lr": 6.792401202687648e-09} +{"train_loss": 0.00031823426252231, "global_step": 71028, "epoch": 596, "lr": 6.7559328216726394e-09} +{"train_loss": 0.00023550790501758456, "global_step": 71029, "epoch": 596, "lr": 6.719562597046203e-09} +{"train_loss": 0.00016985677939374, "global_step": 71030, "epoch": 596, "lr": 6.6832905288860546e-09} +{"train_loss": 0.00023656236589886248, "global_step": 71031, "epoch": 596, "lr": 6.647116617264359e-09} +{"train_loss": 0.00016380056331399828, "global_step": 71032, "epoch": 596, "lr": 6.61104086224773e-09} +{"train_loss": 0.0001577051152708009, "global_step": 71033, "epoch": 596, "lr": 6.575063263913883e-09} +{"train_loss": 0.00024405395379289985, "global_step": 71034, "epoch": 596, "lr": 6.53918382232388e-09} +{"train_loss": 0.0005545942694880068, "global_step": 71035, "epoch": 596, "lr": 6.503402537555436e-09} +{"train_loss": 0.00021015710080973804, "global_step": 71036, "epoch": 596, "lr": 6.4677194096751655e-09} +{"train_loss": 0.00028966375975869596, "global_step": 71037, "epoch": 596, "lr": 6.432134438760784e-09} +{"train_loss": 0.0001975710765691474, "global_step": 71038, "epoch": 596, "lr": 6.396647624867802e-09} +{"train_loss": 0.0002510876511223614, "global_step": 71039, "epoch": 596, "lr": 6.361258968079486e-09} +{"train_loss": 0.00016014673747122288, "global_step": 71040, "epoch": 596, "lr": 6.3259684684569e-09} +{"train_loss": 0.0001991330791497603, "global_step": 71041, "epoch": 596, "lr": 6.2907761260722065e-09} +{"train_loss": 0.0002496455898293208, "global_step": 71042, "epoch": 596, "lr": 6.25568194099202e-09, "val_loss": 0.010867508128285408} +{"train_loss": 0.0002731771091930568, "global_step": 71043, "epoch": 597, "lr": 6.2206859132940554e-09} +{"train_loss": 0.00016682683781255037, "global_step": 71044, "epoch": 597, "lr": 6.185788043033824e-09} +{"train_loss": 0.00020197949197608978, "global_step": 71045, "epoch": 597, "lr": 6.150988330294594e-09} +{"train_loss": 0.00018914607062470168, "global_step": 71046, "epoch": 597, "lr": 6.116286775131874e-09} +{"train_loss": 0.00013010828115511686, "global_step": 71047, "epoch": 597, "lr": 6.0816833776178305e-09} +{"train_loss": 0.00014416694466490299, "global_step": 71048, "epoch": 597, "lr": 6.047178137824628e-09} +{"train_loss": 0.0001515151234343648, "global_step": 71049, "epoch": 597, "lr": 6.0127710558133265e-09} +{"train_loss": 0.00031242091790772974, "global_step": 71050, "epoch": 597, "lr": 5.978462131656093e-09} +{"train_loss": 0.0001903644879348576, "global_step": 71051, "epoch": 597, "lr": 5.94425136541954e-09} +{"train_loss": 0.0001491428993176669, "global_step": 71052, "epoch": 597, "lr": 5.91013875717028e-09} +{"train_loss": 0.0001151317628682591, "global_step": 71053, "epoch": 597, "lr": 5.876124306974928e-09} +{"train_loss": 0.00016229934408329427, "global_step": 71054, "epoch": 597, "lr": 5.842208014900097e-09} +{"train_loss": 0.00015130436804611236, "global_step": 71055, "epoch": 597, "lr": 5.80838988101795e-09} +{"train_loss": 0.00041363260243088007, "global_step": 71056, "epoch": 597, "lr": 5.7746699053840006e-09} +{"train_loss": 0.00023286619398277253, "global_step": 71057, "epoch": 597, "lr": 5.741048088070411e-09} +{"train_loss": 0.001008149585686624, "global_step": 71058, "epoch": 597, "lr": 5.707524429149347e-09} +{"train_loss": 0.0002609894145280123, "global_step": 71059, "epoch": 597, "lr": 5.674098928676319e-09} +{"train_loss": 0.00011189129145350307, "global_step": 71060, "epoch": 597, "lr": 5.640771586717941e-09} +{"train_loss": 0.00038053508615121245, "global_step": 71061, "epoch": 597, "lr": 5.6075424033463776e-09} +{"train_loss": 0.00023809612321201712, "global_step": 71062, "epoch": 597, "lr": 5.5744113786226904e-09} +{"train_loss": 0.0002930430637206882, "global_step": 71063, "epoch": 597, "lr": 5.541378512613493e-09} +{"train_loss": 0.00024044464225880802, "global_step": 71064, "epoch": 597, "lr": 5.508443805379848e-09} +{"train_loss": 0.00021202213247306645, "global_step": 71065, "epoch": 597, "lr": 5.47560725699392e-09} +{"train_loss": 0.00041383394272997975, "global_step": 71066, "epoch": 597, "lr": 5.442868867511219e-09} +{"train_loss": 0.00014224130427464843, "global_step": 71067, "epoch": 597, "lr": 5.410228637003911e-09} +{"train_loss": 0.00022782653104513884, "global_step": 71068, "epoch": 597, "lr": 5.377686565533058e-09} +{"train_loss": 0.00018038848065771163, "global_step": 71069, "epoch": 597, "lr": 5.345242653159721e-09} +{"train_loss": 0.0002728084218688309, "global_step": 71070, "epoch": 597, "lr": 5.312896899944964e-09} +{"train_loss": 0.00017026682326104492, "global_step": 71071, "epoch": 597, "lr": 5.280649305966501e-09} +{"train_loss": 0.00033770190202631056, "global_step": 71072, "epoch": 597, "lr": 5.2484998712687415e-09} +{"train_loss": 0.00024448439944535494, "global_step": 71073, "epoch": 597, "lr": 5.216448595929402e-09} +{"train_loss": 0.0001436017919331789, "global_step": 71074, "epoch": 597, "lr": 5.184495480009544e-09} +{"train_loss": 0.00048271578270941973, "global_step": 71075, "epoch": 597, "lr": 5.152640523564678e-09} +{"train_loss": 0.00028984417440369725, "global_step": 71076, "epoch": 597, "lr": 5.1208837266614185e-09} +{"train_loss": 0.00037708666059188545, "global_step": 71077, "epoch": 597, "lr": 5.089225089366378e-09} +{"train_loss": 0.0001832302223192528, "global_step": 71078, "epoch": 597, "lr": 5.057664611735069e-09} +{"train_loss": 0.0001720194413792342, "global_step": 71079, "epoch": 597, "lr": 5.0262022938285525e-09} +{"train_loss": 0.0002723662764765322, "global_step": 71080, "epoch": 597, "lr": 4.994838135713442e-09} +{"train_loss": 0.0002770432038232684, "global_step": 71081, "epoch": 597, "lr": 4.963572137450801e-09} +{"train_loss": 0.00013990423758514225, "global_step": 71082, "epoch": 597, "lr": 4.932404299101689e-09} +{"train_loss": 0.0001365296047879383, "global_step": 71083, "epoch": 597, "lr": 4.901334620727171e-09} +{"train_loss": 0.00018510232621338218, "global_step": 71084, "epoch": 597, "lr": 4.870363102382758e-09} +{"train_loss": 0.0002046768640866503, "global_step": 71085, "epoch": 597, "lr": 4.8394897441406125e-09} +{"train_loss": 0.00022919058392290026, "global_step": 71086, "epoch": 597, "lr": 4.808714546050697e-09} +{"train_loss": 0.00017257210856769234, "global_step": 71087, "epoch": 597, "lr": 4.778037508179623e-09} +{"train_loss": 0.00024083792231976986, "global_step": 71088, "epoch": 597, "lr": 4.747458630582901e-09} +{"train_loss": 0.00023169680207502097, "global_step": 71089, "epoch": 597, "lr": 4.7169779133271475e-09} +{"train_loss": 0.0001787188375601545, "global_step": 71090, "epoch": 597, "lr": 4.686595356467871e-09} +{"train_loss": 0.0002902229316532612, "global_step": 71091, "epoch": 597, "lr": 4.656310960066135e-09} +{"train_loss": 0.00032515573548153043, "global_step": 71092, "epoch": 597, "lr": 4.62612472417745e-09} +{"train_loss": 0.00027694323216564953, "global_step": 71093, "epoch": 597, "lr": 4.5960366488628785e-09} +{"train_loss": 0.0001734118995955214, "global_step": 71094, "epoch": 597, "lr": 4.566046734189033e-09} +{"train_loss": 0.00020167598268017173, "global_step": 71095, "epoch": 597, "lr": 4.536154980200324e-09} +{"train_loss": 0.00022828376677352935, "global_step": 71096, "epoch": 597, "lr": 4.506361386968916e-09} +{"train_loss": 0.0001411747361999005, "global_step": 71097, "epoch": 597, "lr": 4.4766659545503184e-09} +{"train_loss": 0.00019684784638229758, "global_step": 71098, "epoch": 597, "lr": 4.447068682994493e-09} +{"train_loss": 0.00012350331235211343, "global_step": 71099, "epoch": 597, "lr": 4.417569572368052e-09} +{"train_loss": 0.00039672182174399495, "global_step": 71100, "epoch": 597, "lr": 4.388168622726507e-09} +{"train_loss": 0.0002433295885566622, "global_step": 71101, "epoch": 597, "lr": 4.358865834130921e-09} +{"train_loss": 0.00015705924306530505, "global_step": 71102, "epoch": 597, "lr": 4.329661206631252e-09} +{"train_loss": 0.00023912647156976163, "global_step": 71103, "epoch": 597, "lr": 4.300554740288565e-09} +{"train_loss": 0.0002676657750271261, "global_step": 71104, "epoch": 597, "lr": 4.2715464351639205e-09} +{"train_loss": 0.00036764625110663474, "global_step": 71105, "epoch": 597, "lr": 4.242636291307278e-09} +{"train_loss": 0.00072333007119596, "global_step": 71106, "epoch": 597, "lr": 4.213824308779702e-09} +{"train_loss": 0.00015927320055197924, "global_step": 71107, "epoch": 597, "lr": 4.185110487642252e-09} +{"train_loss": 0.00018382484267931432, "global_step": 71108, "epoch": 597, "lr": 4.156494827939339e-09} +{"train_loss": 0.0003618778137024492, "global_step": 71109, "epoch": 597, "lr": 4.127977329737576e-09} +{"train_loss": 0.0003076623543165624, "global_step": 71110, "epoch": 597, "lr": 4.0995579930869224e-09} +{"train_loss": 0.0002296766615472734, "global_step": 71111, "epoch": 597, "lr": 4.071236818048441e-09} +{"train_loss": 0.00031842326279729605, "global_step": 71112, "epoch": 597, "lr": 4.043013804672091e-09} +{"train_loss": 0.00018874922534450889, "global_step": 71113, "epoch": 597, "lr": 4.014888953018936e-09} +{"train_loss": 0.0003941225295420736, "global_step": 71114, "epoch": 597, "lr": 3.9868622631389355e-09} +{"train_loss": 0.0001681307767285034, "global_step": 71115, "epoch": 597, "lr": 3.9589337350876e-09} +{"train_loss": 0.00024876627139747143, "global_step": 71116, "epoch": 597, "lr": 3.931103368925992e-09} +{"train_loss": 0.00020183763990644366, "global_step": 71117, "epoch": 597, "lr": 3.903371164704073e-09} +{"train_loss": 0.00015352526679635048, "global_step": 71118, "epoch": 597, "lr": 3.875737122471801e-09} +{"train_loss": 0.00017187795310746878, "global_step": 71119, "epoch": 597, "lr": 3.8482012422902395e-09} +{"train_loss": 0.00019212225743103772, "global_step": 71120, "epoch": 597, "lr": 3.820763524214898e-09} +{"train_loss": 0.00019995291950181127, "global_step": 71121, "epoch": 597, "lr": 3.793423968290188e-09} +{"train_loss": 0.000405575759941712, "global_step": 71122, "epoch": 597, "lr": 3.766182574582722e-09} +{"train_loss": 0.00031809607753530145, "global_step": 71123, "epoch": 597, "lr": 3.739039343131357e-09} +{"train_loss": 0.00028108706464990973, "global_step": 71124, "epoch": 597, "lr": 3.711994274002706e-09} +{"train_loss": 0.00023482485266868025, "global_step": 71125, "epoch": 597, "lr": 3.68504736724673e-09} +{"train_loss": 0.00026274105766788125, "global_step": 71126, "epoch": 597, "lr": 3.658198622907838e-09} +{"train_loss": 0.0007708253688178957, "global_step": 71127, "epoch": 597, "lr": 3.631448041047092e-09} +{"train_loss": 0.0002602812310215086, "global_step": 71128, "epoch": 597, "lr": 3.604795621714452e-09} +{"train_loss": 0.00036341958912089467, "global_step": 71129, "epoch": 597, "lr": 3.5782413649598776e-09} +{"train_loss": 0.0002758334740065038, "global_step": 71130, "epoch": 597, "lr": 3.5517852708444323e-09} +{"train_loss": 0.0002733166911639273, "global_step": 71131, "epoch": 597, "lr": 3.5254273394069727e-09} +{"train_loss": 0.0003832764341495931, "global_step": 71132, "epoch": 597, "lr": 3.4991675707085614e-09} +{"train_loss": 0.0003955074062105268, "global_step": 71133, "epoch": 597, "lr": 3.4730059647991588e-09} +{"train_loss": 0.0005025380523875356, "global_step": 71134, "epoch": 597, "lr": 3.4469425217287245e-09} +{"train_loss": 0.000172810789081268, "global_step": 71135, "epoch": 597, "lr": 3.4209772415472186e-09} +{"train_loss": 0.0003170669951941818, "global_step": 71136, "epoch": 597, "lr": 3.3951101243101524e-09} +{"train_loss": 0.00014567300968337804, "global_step": 71137, "epoch": 597, "lr": 3.369341170067486e-09} +{"train_loss": 0.00025131058646366, "global_step": 71138, "epoch": 597, "lr": 3.3436703788636283e-09} +{"train_loss": 0.00023026615963317454, "global_step": 71139, "epoch": 597, "lr": 3.31809775075409e-09} +{"train_loss": 0.00031040768953971565, "global_step": 71140, "epoch": 597, "lr": 3.292623285788832e-09} +{"train_loss": 0.0001906723773572594, "global_step": 71141, "epoch": 597, "lr": 3.267246984012262e-09} +{"train_loss": 0.00028667799779213965, "global_step": 71142, "epoch": 597, "lr": 3.2419688454854436e-09} +{"train_loss": 0.00020206776389386505, "global_step": 71143, "epoch": 597, "lr": 3.2167888702472337e-09} +{"train_loss": 0.00021904364984948188, "global_step": 71144, "epoch": 597, "lr": 3.191707058353144e-09} +{"train_loss": 0.0002107473264914006, "global_step": 71145, "epoch": 597, "lr": 3.166723409853134e-09} +{"train_loss": 0.00030442970455624163, "global_step": 71146, "epoch": 597, "lr": 3.141837924791613e-09} +{"train_loss": 0.00011210182128706947, "global_step": 71147, "epoch": 597, "lr": 3.117050603218541e-09} +{"train_loss": 0.00021576709696091712, "global_step": 71148, "epoch": 597, "lr": 3.0923614451838777e-09} +{"train_loss": 0.0003448525385465473, "global_step": 71149, "epoch": 597, "lr": 3.067770450737584e-09} +{"train_loss": 0.00031686475267633796, "global_step": 71150, "epoch": 597, "lr": 3.0432776199296185e-09} +{"train_loss": 0.00044077803613618016, "global_step": 71151, "epoch": 597, "lr": 3.0188829527988404e-09} +{"train_loss": 0.00022943098156247288, "global_step": 71152, "epoch": 597, "lr": 2.9945864494007604e-09} +{"train_loss": 0.00014121251297183335, "global_step": 71153, "epoch": 597, "lr": 2.970388109785338e-09} +{"train_loss": 0.00025255384389311075, "global_step": 71154, "epoch": 597, "lr": 2.9462879339914317e-09} +{"train_loss": 0.00014078192180022597, "global_step": 71155, "epoch": 597, "lr": 2.9222859220745523e-09} +{"train_loss": 0.0002923983265645802, "global_step": 71156, "epoch": 597, "lr": 2.898382074073558e-09} +{"train_loss": 0.0003669160360004753, "global_step": 71157, "epoch": 597, "lr": 2.8745763900439593e-09} +{"train_loss": 0.00012931479432154447, "global_step": 71158, "epoch": 597, "lr": 2.8508688700246147e-09} +{"train_loss": 0.00014393158198799938, "global_step": 71159, "epoch": 597, "lr": 2.8272595140710344e-09} +{"train_loss": 0.00011732949496945366, "global_step": 71160, "epoch": 597, "lr": 2.803748322222077e-09} +{"train_loss": 0.0002571774001341869, "global_step": 71161, "epoch": 597, "lr": 2.7803352945277028e-09, "val_loss": 0.01363624818623066} +{"train_loss": 0.0001913376763695851, "global_step": 71162, "epoch": 598, "lr": 2.75702043103232e-09} +{"train_loss": 0.0003746748261619359, "global_step": 71163, "epoch": 598, "lr": 2.733803731785889e-09} +{"train_loss": 0.0005263380007818341, "global_step": 71164, "epoch": 598, "lr": 2.7106851968272673e-09} +{"train_loss": 0.00030620090547017753, "global_step": 71165, "epoch": 598, "lr": 2.687664826200864e-09} +{"train_loss": 0.0003101000329479575, "global_step": 71166, "epoch": 598, "lr": 2.6647426199621905e-09} +{"train_loss": 0.00028406563797034323, "global_step": 71167, "epoch": 598, "lr": 2.6419185781445534e-09} +{"train_loss": 0.00021433166693896055, "global_step": 71168, "epoch": 598, "lr": 2.6191927008034632e-09} +{"train_loss": 0.00021389449830166996, "global_step": 71169, "epoch": 598, "lr": 2.5965649879722276e-09} +{"train_loss": 0.0002614614204503596, "global_step": 71170, "epoch": 598, "lr": 2.574035439706357e-09} +{"train_loss": 0.00020124066213611513, "global_step": 71171, "epoch": 598, "lr": 2.5516040560391586e-09} +{"train_loss": 0.0002032684424193576, "global_step": 71172, "epoch": 598, "lr": 2.529270837026143e-09} +{"train_loss": 9.690170554677024e-05, "global_step": 71173, "epoch": 598, "lr": 2.5070357827006176e-09} +{"train_loss": 0.00038173497887328267, "global_step": 71174, "epoch": 598, "lr": 2.4848988931180927e-09} +{"train_loss": 0.00036116366391070187, "global_step": 71175, "epoch": 598, "lr": 2.4628601683063246e-09} +{"train_loss": 0.00026274911942891777, "global_step": 71176, "epoch": 598, "lr": 2.440919608320824e-09} +{"train_loss": 0.00021072222443763167, "global_step": 71177, "epoch": 598, "lr": 2.4190772132060003e-09} +{"train_loss": 0.00019241774862166494, "global_step": 71178, "epoch": 598, "lr": 2.3973329829951594e-09} +{"train_loss": 0.0001779668527888134, "global_step": 71179, "epoch": 598, "lr": 2.375686917732711e-09} +{"train_loss": 0.00012864974269177765, "global_step": 71180, "epoch": 598, "lr": 2.3541390174686152e-09} +{"train_loss": 0.00016584248805884272, "global_step": 71181, "epoch": 598, "lr": 2.332689282241729e-09} +{"train_loss": 0.00014954716607462615, "global_step": 71182, "epoch": 598, "lr": 2.3113377120909107e-09} +{"train_loss": 0.00014226009079720825, "global_step": 71183, "epoch": 598, "lr": 2.2900843070605694e-09} +{"train_loss": 0.00024617198505438864, "global_step": 71184, "epoch": 598, "lr": 2.2689290671895626e-09} +{"train_loss": 0.0003831001522485167, "global_step": 71185, "epoch": 598, "lr": 2.2478719925278503e-09} +{"train_loss": 0.0008136573596857488, "global_step": 71186, "epoch": 598, "lr": 2.2269130831087393e-09} +{"train_loss": 0.0002249667013529688, "global_step": 71187, "epoch": 598, "lr": 2.2060523389710873e-09} +{"train_loss": 0.00012187480024294928, "global_step": 71188, "epoch": 598, "lr": 2.185289760164855e-09} +{"train_loss": 0.0003119995817542076, "global_step": 71189, "epoch": 598, "lr": 2.164625346723348e-09} +{"train_loss": 0.0002085658343276009, "global_step": 71190, "epoch": 598, "lr": 2.144059098696527e-09} +{"train_loss": 0.0001892836589831859, "global_step": 71191, "epoch": 598, "lr": 2.1235910161121474e-09} +{"train_loss": 0.0001853551366366446, "global_step": 71192, "epoch": 598, "lr": 2.1032210990201695e-09} +{"train_loss": 0.0004463538061827421, "global_step": 71193, "epoch": 598, "lr": 2.0829493474538995e-09} +{"train_loss": 0.0003524193889461458, "global_step": 71194, "epoch": 598, "lr": 2.062775761457747e-09} +{"train_loss": 0.00016786680498626083, "global_step": 71195, "epoch": 598, "lr": 2.0427003410705693e-09} +{"train_loss": 0.00022038754832465202, "global_step": 71196, "epoch": 598, "lr": 2.022723086331224e-09} +{"train_loss": 0.00020725312060676515, "global_step": 71197, "epoch": 598, "lr": 2.0028439972785697e-09} +{"train_loss": 0.0003217953199055046, "global_step": 71198, "epoch": 598, "lr": 1.9830630739459123e-09} +{"train_loss": 0.00021737065981142223, "global_step": 71199, "epoch": 598, "lr": 1.963380316388763e-09} +{"train_loss": 0.00040536595042794943, "global_step": 71200, "epoch": 598, "lr": 1.943795724629327e-09} +{"train_loss": 0.00040161210927180946, "global_step": 71201, "epoch": 598, "lr": 1.9243092987120125e-09} +{"train_loss": 0.0004298692801967263, "global_step": 71202, "epoch": 598, "lr": 1.9049210386701266e-09} +{"train_loss": 0.0002468248421791941, "global_step": 71203, "epoch": 598, "lr": 1.885630944553629e-09} +{"train_loss": 0.00031893010600470006, "global_step": 71204, "epoch": 598, "lr": 1.866439016390276e-09} +{"train_loss": 0.00024336381466127932, "global_step": 71205, "epoch": 598, "lr": 1.847345254218924e-09} +{"train_loss": 0.00021921175357419997, "global_step": 71206, "epoch": 598, "lr": 1.828349658083983e-09} +{"train_loss": 0.00020548242900986224, "global_step": 71207, "epoch": 598, "lr": 1.8094522280132087e-09} +{"train_loss": 0.00025679197278805077, "global_step": 71208, "epoch": 598, "lr": 1.7906529640510095e-09} +{"train_loss": 0.00017853292229119688, "global_step": 71209, "epoch": 598, "lr": 1.7719518662251411e-09} +{"train_loss": 0.0003295890928711742, "global_step": 71210, "epoch": 598, "lr": 1.7533489345855636e-09} +{"train_loss": 0.00033302020165137947, "global_step": 71211, "epoch": 598, "lr": 1.7348441691600326e-09} +{"train_loss": 0.00032467578421346843, "global_step": 71212, "epoch": 598, "lr": 1.7164375699818546e-09} +{"train_loss": 0.00012187625543447211, "global_step": 71213, "epoch": 598, "lr": 1.698129137095439e-09} +{"train_loss": 0.00018939106666948646, "global_step": 71214, "epoch": 598, "lr": 1.6799188705340918e-09} +{"train_loss": 0.00019293520017527044, "global_step": 71215, "epoch": 598, "lr": 1.6618067703311201e-09} +{"train_loss": 0.00012520834570750594, "global_step": 71216, "epoch": 598, "lr": 1.643792836525382e-09} +{"train_loss": 0.0001871255662990734, "global_step": 71217, "epoch": 598, "lr": 1.6258770691501835e-09} +{"train_loss": 0.0007338792784139514, "global_step": 71218, "epoch": 598, "lr": 1.6080594682443828e-09} +{"train_loss": 0.00016188705922104418, "global_step": 71219, "epoch": 598, "lr": 1.5903400338357354e-09} +{"train_loss": 0.0001455749006709084, "global_step": 71220, "epoch": 598, "lr": 1.5727187659630993e-09} +{"train_loss": 0.0002887793234549463, "global_step": 71221, "epoch": 598, "lr": 1.555195664659781e-09} +{"train_loss": 0.0002846165152732283, "global_step": 71222, "epoch": 598, "lr": 1.5377707299590871e-09} +{"train_loss": 0.0004210066399537027, "global_step": 71223, "epoch": 598, "lr": 1.5204439619054267e-09} +{"train_loss": 0.0001707246119622141, "global_step": 71224, "epoch": 598, "lr": 1.5032153605154532e-09} +{"train_loss": 0.00029387092217803, "global_step": 71225, "epoch": 598, "lr": 1.4860849258391264e-09} +{"train_loss": 0.00017531005141790956, "global_step": 71226, "epoch": 598, "lr": 1.4690526578986507e-09} +{"train_loss": 0.00013190195022616535, "global_step": 71227, "epoch": 598, "lr": 1.4521185567384355e-09} +{"train_loss": 0.0001271788205485791, "global_step": 71228, "epoch": 598, "lr": 1.4352826223806849e-09} +{"train_loss": 0.00023609900381416082, "global_step": 71229, "epoch": 598, "lr": 1.4185448548642565e-09} +{"train_loss": 0.000329991162288934, "global_step": 71230, "epoch": 598, "lr": 1.4019052542224575e-09} +{"train_loss": 0.0002215341810369864, "global_step": 71231, "epoch": 598, "lr": 1.3853638204830432e-09} +{"train_loss": 0.00024302664678543806, "global_step": 71232, "epoch": 598, "lr": 1.3689205536848715e-09} +{"train_loss": 0.00033675439772196114, "global_step": 71233, "epoch": 598, "lr": 1.3525754538556978e-09} +{"train_loss": 0.0002160832955269143, "global_step": 71234, "epoch": 598, "lr": 1.336328521028829e-09} +{"train_loss": 0.00020686883362941444, "global_step": 71235, "epoch": 598, "lr": 1.3201797552375716e-09} +{"train_loss": 0.00025784980971366167, "global_step": 71236, "epoch": 598, "lr": 1.3041291565096813e-09} +{"train_loss": 0.00028103397926315665, "global_step": 71237, "epoch": 598, "lr": 1.288176724884016e-09} +{"train_loss": 0.00020787031098734587, "global_step": 71238, "epoch": 598, "lr": 1.2723224603883311e-09} +{"train_loss": 0.00013715257227886468, "global_step": 71239, "epoch": 598, "lr": 1.256566363044831e-09} +{"train_loss": 0.00019221722322981805, "global_step": 71240, "epoch": 598, "lr": 1.2409084328979248e-09} +{"train_loss": 0.00013618321099784225, "global_step": 71241, "epoch": 598, "lr": 1.225348669975368e-09} +{"train_loss": 0.0005082179559394717, "global_step": 71242, "epoch": 598, "lr": 1.2098870743049161e-09} +{"train_loss": 0.0002457366499584168, "global_step": 71243, "epoch": 598, "lr": 1.194523645914325e-09} +{"train_loss": 0.00031621422385796905, "global_step": 71244, "epoch": 598, "lr": 1.179258384836901e-09} +{"train_loss": 0.00022836851712781936, "global_step": 71245, "epoch": 598, "lr": 1.1640912911003998e-09} +{"train_loss": 0.00017823414236772805, "global_step": 71246, "epoch": 598, "lr": 1.1490223647381282e-09} +{"train_loss": 0.00015133483975660056, "global_step": 71247, "epoch": 598, "lr": 1.1340516057833928e-09} +{"train_loss": 0.00029487948631867766, "global_step": 71248, "epoch": 598, "lr": 1.119179014252847e-09} +{"train_loss": 0.00014975847443565726, "global_step": 71249, "epoch": 598, "lr": 1.1044045901853484e-09} +{"train_loss": 0.00019065404194407165, "global_step": 71250, "epoch": 598, "lr": 1.0897283336086527e-09} +{"train_loss": 0.0001594455388840288, "global_step": 71251, "epoch": 598, "lr": 1.0751502445505158e-09} +{"train_loss": 0.0002343365049455315, "global_step": 71252, "epoch": 598, "lr": 1.0606703230442439e-09} +{"train_loss": 0.00034419403527863324, "global_step": 71253, "epoch": 598, "lr": 1.0462885691064906e-09} +{"train_loss": 0.0001423959620296955, "global_step": 71254, "epoch": 598, "lr": 1.0320049827761135e-09} +{"train_loss": 0.0003386385506018996, "global_step": 71255, "epoch": 598, "lr": 1.0178195640808685e-09} +{"train_loss": 0.0003212361189071089, "global_step": 71256, "epoch": 598, "lr": 1.0037323130374088e-09} +{"train_loss": 0.0005273654242046177, "global_step": 71257, "epoch": 598, "lr": 9.897432296901432e-10} +{"train_loss": 0.00018019172421190888, "global_step": 71258, "epoch": 598, "lr": 9.758523140501741e-10} +{"train_loss": 0.00026619707932695746, "global_step": 71259, "epoch": 598, "lr": 9.620595661563591e-10} +{"train_loss": 0.0002522618160583079, "global_step": 71260, "epoch": 598, "lr": 9.48364986036454e-10} +{"train_loss": 0.00022758408158551902, "global_step": 71261, "epoch": 598, "lr": 9.347685737071122e-10} +{"train_loss": 0.0004424616927281022, "global_step": 71262, "epoch": 598, "lr": 9.2127032920164e-10} +{"train_loss": 0.00021744893456343561, "global_step": 71263, "epoch": 598, "lr": 9.078702525477934e-10} +{"train_loss": 0.0002200489107053727, "global_step": 71264, "epoch": 598, "lr": 8.945683437677766e-10} +{"train_loss": 0.0003208680427633226, "global_step": 71265, "epoch": 598, "lr": 8.813646028893451e-10} +{"train_loss": 0.00037775596138089895, "global_step": 71266, "epoch": 598, "lr": 8.682590299347038e-10} +{"train_loss": 0.0003475302073638886, "global_step": 71267, "epoch": 598, "lr": 8.5525162494271e-10} +{"train_loss": 0.00017973249487113208, "global_step": 71268, "epoch": 598, "lr": 8.423423879244663e-10} +{"train_loss": 0.0002239736495539546, "global_step": 71269, "epoch": 598, "lr": 8.295313189077281e-10} +{"train_loss": 0.00016389931261073798, "global_step": 71270, "epoch": 598, "lr": 8.168184179258021e-10} +{"train_loss": 0.00024884831509552896, "global_step": 71271, "epoch": 598, "lr": 8.042036849953416e-10} +{"train_loss": 0.00015943916514515877, "global_step": 71272, "epoch": 598, "lr": 7.916871201496534e-10} +{"train_loss": 0.00037089342367835343, "global_step": 71273, "epoch": 598, "lr": 7.792687233998397e-10} +{"train_loss": 0.00025599380023777485, "global_step": 71274, "epoch": 598, "lr": 7.669484947847582e-10} +{"train_loss": 0.0003296883078292012, "global_step": 71275, "epoch": 598, "lr": 7.547264343210625e-10} +{"train_loss": 0.00017899222439154983, "global_step": 71276, "epoch": 598, "lr": 7.426025420309569e-10} +{"train_loss": 0.00020662180031649768, "global_step": 71277, "epoch": 598, "lr": 7.305768179421968e-10} +{"train_loss": 0.0002562353038229048, "global_step": 71278, "epoch": 598, "lr": 7.186492620769869e-10} +{"train_loss": 0.00027935951948165894, "global_step": 71279, "epoch": 598, "lr": 7.068198744630828e-10} +{"train_loss": 0.0002602506943165419, "global_step": 71280, "epoch": 598, "lr": 6.950886551171376e-10, "val_loss": 0.058123305439949036} +{"train_loss": 0.0009937972063198686, "global_step": 71281, "epoch": 599, "lr": 6.83455604061356e-10} +{"train_loss": 0.00016217476513702422, "global_step": 71282, "epoch": 599, "lr": 6.719207213234935e-10} +{"train_loss": 0.00023974764917511493, "global_step": 71283, "epoch": 599, "lr": 6.604840069257546e-10} +{"train_loss": 0.00029360162443481386, "global_step": 71284, "epoch": 599, "lr": 6.491454608903435e-10} +{"train_loss": 0.0005145047325640917, "global_step": 71285, "epoch": 599, "lr": 6.37905083239465e-10} +{"train_loss": 0.00017882285465020686, "global_step": 71286, "epoch": 599, "lr": 6.267628739953235e-10} +{"train_loss": 0.0002022279950324446, "global_step": 71287, "epoch": 599, "lr": 6.157188331745722e-10} +{"train_loss": 0.0002550205681473017, "global_step": 71288, "epoch": 599, "lr": 6.047729608049668e-10} +{"train_loss": 0.0002123603189829737, "global_step": 71289, "epoch": 599, "lr": 5.939252569031606e-10} +{"train_loss": 0.00022170142619870603, "global_step": 71290, "epoch": 599, "lr": 5.831757214969092e-10} +{"train_loss": 0.00038799041067250073, "global_step": 71291, "epoch": 599, "lr": 5.725243546084169e-10} +{"train_loss": 0.00033206792431883514, "global_step": 71292, "epoch": 599, "lr": 5.619711562487861e-10} +{"train_loss": 0.0003047909995075315, "global_step": 71293, "epoch": 599, "lr": 5.515161264457724e-10} +{"train_loss": 0.0002135888789780438, "global_step": 71294, "epoch": 599, "lr": 5.411592652160291e-10} +{"train_loss": 0.0003246280539315194, "global_step": 71295, "epoch": 599, "lr": 5.309005725817606e-10} +{"train_loss": 0.00033557883580215275, "global_step": 71296, "epoch": 599, "lr": 5.207400485651715e-10} +{"train_loss": 0.00024042726727202535, "global_step": 71297, "epoch": 599, "lr": 5.106776931829149e-10} +{"train_loss": 0.00012988591333851218, "global_step": 71298, "epoch": 599, "lr": 5.007135064571955e-10} +{"train_loss": 0.00019408327352721244, "global_step": 71299, "epoch": 599, "lr": 4.908474884102177e-10} +{"train_loss": 0.00017416029004380107, "global_step": 71300, "epoch": 599, "lr": 4.810796390530837e-10} +{"train_loss": 0.00025307200849056244, "global_step": 71301, "epoch": 599, "lr": 4.714099584135489e-10} +{"train_loss": 0.00017755870067048818, "global_step": 71302, "epoch": 599, "lr": 4.618384465027159e-10} +{"train_loss": 0.00037389862700365484, "global_step": 71303, "epoch": 599, "lr": 4.523651033427889e-10} +{"train_loss": 0.0001667740725679323, "global_step": 71304, "epoch": 599, "lr": 4.429899289559725e-10} +{"train_loss": 0.0002457440714351833, "global_step": 71305, "epoch": 599, "lr": 4.337129233589199e-10} +{"train_loss": 0.0003764907596632838, "global_step": 71306, "epoch": 599, "lr": 4.2453408656828453e-10} +{"train_loss": 0.0004612439079210162, "global_step": 71307, "epoch": 599, "lr": 4.1545341860071975e-10} +{"train_loss": 0.00030706165125593543, "global_step": 71308, "epoch": 599, "lr": 4.0647091947287885e-10} +{"train_loss": 0.0005010120803490281, "global_step": 71309, "epoch": 599, "lr": 3.9758658920696636e-10} +{"train_loss": 0.00022030471882317215, "global_step": 71310, "epoch": 599, "lr": 3.8880042781963555e-10} +{"train_loss": 0.0005209991941228509, "global_step": 71311, "epoch": 599, "lr": 3.8011243533309093e-10} +{"train_loss": 0.0001836490264395252, "global_step": 71312, "epoch": 599, "lr": 3.7152261175288363e-10} +{"train_loss": 0.0005969665362499654, "global_step": 71313, "epoch": 599, "lr": 3.6303095710121805e-10} +{"train_loss": 0.00013564041000790894, "global_step": 71314, "epoch": 599, "lr": 3.5463747139474757e-10} +{"train_loss": 0.00019061121565755457, "global_step": 71315, "epoch": 599, "lr": 3.4634215465012555e-10} +{"train_loss": 0.00023131878697313368, "global_step": 71316, "epoch": 599, "lr": 3.381450068840053e-10} +{"train_loss": 0.00027680658968165517, "global_step": 71317, "epoch": 599, "lr": 3.300460281130402e-10} +{"train_loss": 0.0001868847175501287, "global_step": 71318, "epoch": 599, "lr": 3.220452183538836e-10} +{"train_loss": 0.0002810165169648826, "global_step": 71319, "epoch": 599, "lr": 3.1414257761763766e-10} +{"train_loss": 0.00017387481057085097, "global_step": 71320, "epoch": 599, "lr": 3.063381059265069e-10} +{"train_loss": 0.00026315232389606535, "global_step": 71321, "epoch": 599, "lr": 2.9863180328604244e-10} +{"train_loss": 0.0001660497218836099, "global_step": 71322, "epoch": 599, "lr": 2.9102366972399987e-10} +{"train_loss": 0.0003281756362412125, "global_step": 71323, "epoch": 599, "lr": 2.8351370524593026e-10} +{"train_loss": 0.0002455361536704004, "global_step": 71324, "epoch": 599, "lr": 2.7610190986848695e-10} +{"train_loss": 0.00036295803147368133, "global_step": 71325, "epoch": 599, "lr": 2.687882836083233e-10} +{"train_loss": 0.00030419399263337255, "global_step": 71326, "epoch": 599, "lr": 2.6157282648209267e-10} +{"train_loss": 0.0001223335275426507, "global_step": 71327, "epoch": 599, "lr": 2.544555384953462e-10} +{"train_loss": 0.0003454785037320107, "global_step": 71328, "epoch": 599, "lr": 2.474364196702883e-10} +{"train_loss": 0.0003146170056425035, "global_step": 71329, "epoch": 599, "lr": 2.405154700180212e-10} +{"train_loss": 0.00013913822476752102, "global_step": 71330, "epoch": 599, "lr": 2.336926895496472e-10} +{"train_loss": 0.00034353916998952627, "global_step": 71331, "epoch": 599, "lr": 2.2696807828181954e-10} +{"train_loss": 0.0003952391562052071, "global_step": 71332, "epoch": 599, "lr": 2.2034163622564052e-10} +{"train_loss": 0.0002443384728394449, "global_step": 71333, "epoch": 599, "lr": 2.138133633977635e-10} +{"train_loss": 0.0001887491816887632, "global_step": 71334, "epoch": 599, "lr": 2.0738325980373952e-10} +{"train_loss": 0.00023863359820097685, "global_step": 71335, "epoch": 599, "lr": 2.010513254657731e-10} +{"train_loss": 0.00023733812849968672, "global_step": 71336, "epoch": 599, "lr": 1.9481756038941535e-10} +{"train_loss": 0.00022528068802785128, "global_step": 71337, "epoch": 599, "lr": 1.8868196459131958e-10} +{"train_loss": 0.0002765163953881711, "global_step": 71338, "epoch": 599, "lr": 1.8264453807703696e-10} +{"train_loss": 0.00018092880782205611, "global_step": 71339, "epoch": 599, "lr": 1.767052808632208e-10} +{"train_loss": 0.00033480909769423306, "global_step": 71340, "epoch": 599, "lr": 1.7086419296097334e-10} +{"train_loss": 0.0002001499233301729, "global_step": 71341, "epoch": 599, "lr": 1.651212743813968e-10} +{"train_loss": 0.0001656057866057381, "global_step": 71342, "epoch": 599, "lr": 1.5947652513559342e-10} +{"train_loss": 0.00023626768961548805, "global_step": 71343, "epoch": 599, "lr": 1.5392994524021653e-10} +{"train_loss": 0.0001789149537216872, "global_step": 71344, "epoch": 599, "lr": 1.4848153469526615e-10} +{"train_loss": 0.0002644875203259289, "global_step": 71345, "epoch": 599, "lr": 1.4313129351739562e-10} +{"train_loss": 0.00010333967657061294, "global_step": 71346, "epoch": 599, "lr": 1.3787922171770716e-10} +{"train_loss": 0.00014563504373654723, "global_step": 71347, "epoch": 599, "lr": 1.3272531930730303e-10} +{"train_loss": 0.00025369360810145736, "global_step": 71348, "epoch": 599, "lr": 1.2766958629173431e-10} +{"train_loss": 0.00029635924147441983, "global_step": 71349, "epoch": 599, "lr": 1.2271202268210324e-10} +{"train_loss": 0.0002901105908676982, "global_step": 71350, "epoch": 599, "lr": 1.1785262849506318e-10} +{"train_loss": 0.00021605817892123014, "global_step": 71351, "epoch": 599, "lr": 1.1309140373061411e-10} +{"train_loss": 0.00029268127400428057, "global_step": 71352, "epoch": 599, "lr": 1.0842834840540938e-10} +{"train_loss": 0.000222745758946985, "global_step": 71353, "epoch": 599, "lr": 1.0386346252500012e-10} +{"train_loss": 0.00020104358554817736, "global_step": 71354, "epoch": 599, "lr": 9.939674610048855e-11} +{"train_loss": 0.00016111863078549504, "global_step": 71355, "epoch": 599, "lr": 9.502819913742578e-11} +{"train_loss": 0.00017105002189055085, "global_step": 71356, "epoch": 599, "lr": 9.075782164691404e-11} +{"train_loss": 0.00013921498612035066, "global_step": 71357, "epoch": 599, "lr": 8.658561363450445e-11} +{"train_loss": 0.0002731855202000588, "global_step": 71358, "epoch": 599, "lr": 8.251157511129925e-11} +{"train_loss": 0.0002690783585421741, "global_step": 71359, "epoch": 599, "lr": 7.853570608284954e-11} +{"train_loss": 0.00012765951396431774, "global_step": 71360, "epoch": 599, "lr": 7.465800656025756e-11} +{"train_loss": 0.00034049394889734685, "global_step": 71361, "epoch": 599, "lr": 7.087847654907443e-11} +{"train_loss": 0.0002484374272171408, "global_step": 71362, "epoch": 599, "lr": 6.719711605485124e-11} +{"train_loss": 0.0003589811094570905, "global_step": 71363, "epoch": 599, "lr": 6.361392508869024e-11} +{"train_loss": 0.00019879959290847182, "global_step": 71364, "epoch": 599, "lr": 6.012890366169365e-11} +{"train_loss": 0.0002393443719483912, "global_step": 71365, "epoch": 599, "lr": 5.674205176831038e-11} +{"train_loss": 0.00031850242521613836, "global_step": 71366, "epoch": 599, "lr": 5.345336941964263e-11} +{"train_loss": 0.00015732325846329331, "global_step": 71367, "epoch": 599, "lr": 5.0262856632343755e-11} +{"train_loss": 0.00030596129363402724, "global_step": 71368, "epoch": 599, "lr": 4.717051339531153e-11} +{"train_loss": 0.00015771627658978105, "global_step": 71369, "epoch": 599, "lr": 4.417633973075041e-11} +{"train_loss": 0.0004978129873052239, "global_step": 71370, "epoch": 599, "lr": 4.1280335638660404e-11} +{"train_loss": 0.0004750904918182641, "global_step": 71371, "epoch": 599, "lr": 3.84825011190415e-11} +{"train_loss": 0.0001971042511286214, "global_step": 71372, "epoch": 599, "lr": 3.578283618299594e-11} +{"train_loss": 0.0005088741309009492, "global_step": 71373, "epoch": 599, "lr": 3.318134083607483e-11} +{"train_loss": 0.00021319056395441294, "global_step": 71374, "epoch": 599, "lr": 3.0678015083829284e-11} +{"train_loss": 0.00042126249172724783, "global_step": 71375, "epoch": 599, "lr": 2.8272858926259303e-11} +{"train_loss": 0.00036106634070165455, "global_step": 71376, "epoch": 599, "lr": 2.5965872374467126e-11} +{"train_loss": 0.00019640856771729887, "global_step": 71377, "epoch": 599, "lr": 2.3757055428452745e-11} +{"train_loss": 0.00030216522281989455, "global_step": 71378, "epoch": 599, "lr": 2.164640809376728e-11} +{"train_loss": 0.00019889354007318616, "global_step": 71379, "epoch": 599, "lr": 1.963393037596184e-11} +{"train_loss": 0.0001317172427661717, "global_step": 71380, "epoch": 599, "lr": 1.771962227503643e-11} +{"train_loss": 0.00016853124543558806, "global_step": 71381, "epoch": 599, "lr": 1.5903483802093277e-11} +{"train_loss": 0.00013411548570729792, "global_step": 71382, "epoch": 599, "lr": 1.418551495158127e-11} +{"train_loss": 0.0002211470273323357, "global_step": 71383, "epoch": 599, "lr": 1.2565715734602634e-11} +{"train_loss": 0.00021093386749271303, "global_step": 71384, "epoch": 599, "lr": 1.1044086151157374e-11} +{"train_loss": 0.00011400222138036042, "global_step": 71385, "epoch": 599, "lr": 9.620626206796602e-12} +{"train_loss": 0.00016132977907545865, "global_step": 71386, "epoch": 599, "lr": 8.295335895969203e-12} +{"train_loss": 0.0001764785120030865, "global_step": 71387, "epoch": 599, "lr": 7.068215229777408e-12} +{"train_loss": 0.00016602913092356175, "global_step": 71388, "epoch": 599, "lr": 5.939264208221218e-12} +{"train_loss": 0.00015760882524773479, "global_step": 71389, "epoch": 599, "lr": 4.908482836851747e-12} +{"train_loss": 0.00024458355619572103, "global_step": 71390, "epoch": 599, "lr": 3.975871110117879e-12} +{"train_loss": 0.0003729099698830396, "global_step": 71391, "epoch": 599, "lr": 3.1414290335707307e-12} +{"train_loss": 0.0001915169705171138, "global_step": 71392, "epoch": 599, "lr": 2.4051566072103014e-12} +{"train_loss": 0.0002504266449250281, "global_step": 71393, "epoch": 599, "lr": 1.7670538365877064e-12} +{"train_loss": 0.00023712687834631652, "global_step": 71394, "epoch": 599, "lr": 1.2271207217029457e-12} +{"train_loss": 0.00020562668214552104, "global_step": 71395, "epoch": 599, "lr": 7.85357262556019e-13} +{"train_loss": 0.0003173619043081999, "global_step": 71396, "epoch": 599, "lr": 4.417634591469266e-13} +{"train_loss": 0.0004532580787781626, "global_step": 71397, "epoch": 599, "lr": 1.9633931702678355e-13} +{"train_loss": 0.00023232560488395393, "global_step": 71398, "epoch": 599, "lr": 4.9084830644474664e-14} +{"train_loss": 0.0002642765820604561, "global_step": 71399, "epoch": 599, "lr": 0.0, "val_loss": 0.02468540519475937}