SKNahin commited on
Commit
a1d021e
·
verified ·
1 Parent(s): 5ee12c7

Training in progress, step 2700

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. trainer_log.jsonl +150 -0
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ba0e7cd28ecb9e887c324f2fe798b292cdc969075c9b754de98ec5596a2d3a1
3
  size 1064369000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cab280659cd1c95dbbb70daa538e28b02bcea2b30d31d1e958ed8e1a1acf09d
3
  size 1064369000
trainer_log.jsonl CHANGED
@@ -2550,3 +2550,153 @@
2550
  {"current_steps": 2550, "total_steps": 2973, "loss": 1.5873, "lr": 5e-05, "epoch": 2.5726383708035083, "percentage": 85.77, "elapsed_time": "12:53:38", "remaining_time": "2:08:19"}
2551
  {"current_steps": 2551, "total_steps": 2973, "loss": 1.565, "lr": 5e-05, "epoch": 2.573646536949289, "percentage": 85.81, "elapsed_time": "12:54:08", "remaining_time": "2:08:03"}
2552
  {"current_steps": 2552, "total_steps": 2973, "loss": 1.5659, "lr": 5e-05, "epoch": 2.57465470309507, "percentage": 85.84, "elapsed_time": "12:54:26", "remaining_time": "2:07:45"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2550
  {"current_steps": 2550, "total_steps": 2973, "loss": 1.5873, "lr": 5e-05, "epoch": 2.5726383708035083, "percentage": 85.77, "elapsed_time": "12:53:38", "remaining_time": "2:08:19"}
2551
  {"current_steps": 2551, "total_steps": 2973, "loss": 1.565, "lr": 5e-05, "epoch": 2.573646536949289, "percentage": 85.81, "elapsed_time": "12:54:08", "remaining_time": "2:08:03"}
2552
  {"current_steps": 2552, "total_steps": 2973, "loss": 1.5659, "lr": 5e-05, "epoch": 2.57465470309507, "percentage": 85.84, "elapsed_time": "12:54:26", "remaining_time": "2:07:45"}
2553
+ {"current_steps": 2553, "total_steps": 2973, "loss": 1.5834, "lr": 5e-05, "epoch": 2.5756628692408507, "percentage": 85.87, "elapsed_time": "12:54:45", "remaining_time": "2:07:27"}
2554
+ {"current_steps": 2554, "total_steps": 2973, "loss": 1.5558, "lr": 5e-05, "epoch": 2.5766710353866316, "percentage": 85.91, "elapsed_time": "12:55:03", "remaining_time": "2:07:09"}
2555
+ {"current_steps": 2555, "total_steps": 2973, "loss": 1.5652, "lr": 5e-05, "epoch": 2.577679201532413, "percentage": 85.94, "elapsed_time": "12:55:21", "remaining_time": "2:06:50"}
2556
+ {"current_steps": 2556, "total_steps": 2973, "loss": 1.581, "lr": 5e-05, "epoch": 2.578687367678193, "percentage": 85.97, "elapsed_time": "12:55:39", "remaining_time": "2:06:32"}
2557
+ {"current_steps": 2557, "total_steps": 2973, "loss": 1.5752, "lr": 5e-05, "epoch": 2.5796955338239744, "percentage": 86.01, "elapsed_time": "12:55:57", "remaining_time": "2:06:14"}
2558
+ {"current_steps": 2558, "total_steps": 2973, "loss": 1.5776, "lr": 5e-05, "epoch": 2.580703699969755, "percentage": 86.04, "elapsed_time": "12:56:15", "remaining_time": "2:05:56"}
2559
+ {"current_steps": 2559, "total_steps": 2973, "loss": 1.5606, "lr": 5e-05, "epoch": 2.581711866115536, "percentage": 86.07, "elapsed_time": "12:56:33", "remaining_time": "2:05:38"}
2560
+ {"current_steps": 2560, "total_steps": 2973, "loss": 1.5679, "lr": 5e-05, "epoch": 2.5827200322613164, "percentage": 86.11, "elapsed_time": "12:56:51", "remaining_time": "2:05:19"}
2561
+ {"current_steps": 2561, "total_steps": 2973, "loss": 1.5808, "lr": 5e-05, "epoch": 2.5837281984070977, "percentage": 86.14, "elapsed_time": "12:57:10", "remaining_time": "2:05:01"}
2562
+ {"current_steps": 2562, "total_steps": 2973, "loss": 1.5717, "lr": 5e-05, "epoch": 2.5847363645528785, "percentage": 86.18, "elapsed_time": "12:57:28", "remaining_time": "2:04:43"}
2563
+ {"current_steps": 2563, "total_steps": 2973, "loss": 1.5629, "lr": 5e-05, "epoch": 2.5857445306986593, "percentage": 86.21, "elapsed_time": "12:57:46", "remaining_time": "2:04:25"}
2564
+ {"current_steps": 2564, "total_steps": 2973, "loss": 1.5772, "lr": 5e-05, "epoch": 2.58675269684444, "percentage": 86.24, "elapsed_time": "12:58:04", "remaining_time": "2:04:06"}
2565
+ {"current_steps": 2565, "total_steps": 2973, "loss": 1.5629, "lr": 5e-05, "epoch": 2.587760862990221, "percentage": 86.28, "elapsed_time": "12:58:22", "remaining_time": "2:03:48"}
2566
+ {"current_steps": 2566, "total_steps": 2973, "loss": 1.5636, "lr": 5e-05, "epoch": 2.5887690291360017, "percentage": 86.31, "elapsed_time": "12:58:40", "remaining_time": "2:03:30"}
2567
+ {"current_steps": 2567, "total_steps": 2973, "loss": 1.5714, "lr": 5e-05, "epoch": 2.5897771952817825, "percentage": 86.34, "elapsed_time": "12:58:58", "remaining_time": "2:03:12"}
2568
+ {"current_steps": 2568, "total_steps": 2973, "loss": 1.5801, "lr": 5e-05, "epoch": 2.5907853614275633, "percentage": 86.38, "elapsed_time": "12:59:16", "remaining_time": "2:02:54"}
2569
+ {"current_steps": 2569, "total_steps": 2973, "loss": 1.5846, "lr": 5e-05, "epoch": 2.591793527573344, "percentage": 86.41, "elapsed_time": "12:59:34", "remaining_time": "2:02:35"}
2570
+ {"current_steps": 2570, "total_steps": 2973, "loss": 1.57, "lr": 5e-05, "epoch": 2.592801693719125, "percentage": 86.44, "elapsed_time": "12:59:52", "remaining_time": "2:02:17"}
2571
+ {"current_steps": 2571, "total_steps": 2973, "loss": 1.5553, "lr": 5e-05, "epoch": 2.5938098598649058, "percentage": 86.48, "elapsed_time": "13:00:11", "remaining_time": "2:01:59"}
2572
+ {"current_steps": 2572, "total_steps": 2973, "loss": 1.571, "lr": 5e-05, "epoch": 2.5948180260106866, "percentage": 86.51, "elapsed_time": "13:00:29", "remaining_time": "2:01:41"}
2573
+ {"current_steps": 2573, "total_steps": 2973, "loss": 1.5614, "lr": 5e-05, "epoch": 2.5958261921564674, "percentage": 86.55, "elapsed_time": "13:00:47", "remaining_time": "2:01:22"}
2574
+ {"current_steps": 2574, "total_steps": 2973, "loss": 1.5732, "lr": 5e-05, "epoch": 2.596834358302248, "percentage": 86.58, "elapsed_time": "13:01:05", "remaining_time": "2:01:04"}
2575
+ {"current_steps": 2575, "total_steps": 2973, "loss": 1.5739, "lr": 5e-05, "epoch": 2.597842524448029, "percentage": 86.61, "elapsed_time": "13:01:23", "remaining_time": "2:00:46"}
2576
+ {"current_steps": 2576, "total_steps": 2973, "loss": 1.5746, "lr": 5e-05, "epoch": 2.59885069059381, "percentage": 86.65, "elapsed_time": "13:01:41", "remaining_time": "2:00:28"}
2577
+ {"current_steps": 2577, "total_steps": 2973, "loss": 1.5868, "lr": 5e-05, "epoch": 2.5998588567395906, "percentage": 86.68, "elapsed_time": "13:01:59", "remaining_time": "2:00:10"}
2578
+ {"current_steps": 2578, "total_steps": 2973, "loss": 1.5693, "lr": 5e-05, "epoch": 2.6008670228853714, "percentage": 86.71, "elapsed_time": "13:02:17", "remaining_time": "1:59:51"}
2579
+ {"current_steps": 2579, "total_steps": 2973, "loss": 1.5837, "lr": 5e-05, "epoch": 2.6018751890311522, "percentage": 86.75, "elapsed_time": "13:02:35", "remaining_time": "1:59:33"}
2580
+ {"current_steps": 2580, "total_steps": 2973, "loss": 1.5929, "lr": 5e-05, "epoch": 2.602883355176933, "percentage": 86.78, "elapsed_time": "13:02:53", "remaining_time": "1:59:15"}
2581
+ {"current_steps": 2581, "total_steps": 2973, "loss": 1.5777, "lr": 5e-05, "epoch": 2.603891521322714, "percentage": 86.81, "elapsed_time": "13:03:12", "remaining_time": "1:58:57"}
2582
+ {"current_steps": 2582, "total_steps": 2973, "loss": 1.5815, "lr": 5e-05, "epoch": 2.6048996874684947, "percentage": 86.85, "elapsed_time": "13:03:30", "remaining_time": "1:58:38"}
2583
+ {"current_steps": 2583, "total_steps": 2973, "loss": 1.5623, "lr": 5e-05, "epoch": 2.6059078536142755, "percentage": 86.88, "elapsed_time": "13:03:48", "remaining_time": "1:58:20"}
2584
+ {"current_steps": 2584, "total_steps": 2973, "loss": 1.5641, "lr": 5e-05, "epoch": 2.6069160197600567, "percentage": 86.92, "elapsed_time": "13:04:06", "remaining_time": "1:58:02"}
2585
+ {"current_steps": 2585, "total_steps": 2973, "loss": 1.5638, "lr": 5e-05, "epoch": 2.607924185905837, "percentage": 86.95, "elapsed_time": "13:04:24", "remaining_time": "1:57:44"}
2586
+ {"current_steps": 2586, "total_steps": 2973, "loss": 1.5763, "lr": 5e-05, "epoch": 2.6089323520516183, "percentage": 86.98, "elapsed_time": "13:04:42", "remaining_time": "1:57:26"}
2587
+ {"current_steps": 2587, "total_steps": 2973, "loss": 1.5621, "lr": 5e-05, "epoch": 2.6099405181973987, "percentage": 87.02, "elapsed_time": "13:05:00", "remaining_time": "1:57:07"}
2588
+ {"current_steps": 2588, "total_steps": 2973, "loss": 1.5736, "lr": 5e-05, "epoch": 2.61094868434318, "percentage": 87.05, "elapsed_time": "13:05:18", "remaining_time": "1:56:49"}
2589
+ {"current_steps": 2589, "total_steps": 2973, "loss": 1.5776, "lr": 5e-05, "epoch": 2.6119568504889603, "percentage": 87.08, "elapsed_time": "13:05:37", "remaining_time": "1:56:31"}
2590
+ {"current_steps": 2590, "total_steps": 2973, "loss": 1.561, "lr": 5e-05, "epoch": 2.6129650166347416, "percentage": 87.12, "elapsed_time": "13:05:55", "remaining_time": "1:56:13"}
2591
+ {"current_steps": 2591, "total_steps": 2973, "loss": 1.5809, "lr": 5e-05, "epoch": 2.6139731827805224, "percentage": 87.15, "elapsed_time": "13:06:13", "remaining_time": "1:55:54"}
2592
+ {"current_steps": 2592, "total_steps": 2973, "loss": 1.5649, "lr": 5e-05, "epoch": 2.614981348926303, "percentage": 87.18, "elapsed_time": "13:06:31", "remaining_time": "1:55:36"}
2593
+ {"current_steps": 2593, "total_steps": 2973, "loss": 1.5632, "lr": 5e-05, "epoch": 2.615989515072084, "percentage": 87.22, "elapsed_time": "13:06:49", "remaining_time": "1:55:18"}
2594
+ {"current_steps": 2594, "total_steps": 2973, "loss": 1.5692, "lr": 5e-05, "epoch": 2.616997681217865, "percentage": 87.25, "elapsed_time": "13:07:07", "remaining_time": "1:55:00"}
2595
+ {"current_steps": 2595, "total_steps": 2973, "loss": 1.564, "lr": 5e-05, "epoch": 2.6180058473636456, "percentage": 87.29, "elapsed_time": "13:07:25", "remaining_time": "1:54:42"}
2596
+ {"current_steps": 2596, "total_steps": 2973, "loss": 1.5464, "lr": 5e-05, "epoch": 2.6190140135094264, "percentage": 87.32, "elapsed_time": "13:07:43", "remaining_time": "1:54:23"}
2597
+ {"current_steps": 2597, "total_steps": 2973, "loss": 1.5682, "lr": 5e-05, "epoch": 2.6200221796552072, "percentage": 87.35, "elapsed_time": "13:08:01", "remaining_time": "1:54:05"}
2598
+ {"current_steps": 2598, "total_steps": 2973, "loss": 1.5601, "lr": 5e-05, "epoch": 2.621030345800988, "percentage": 87.39, "elapsed_time": "13:08:20", "remaining_time": "1:53:47"}
2599
+ {"current_steps": 2599, "total_steps": 2973, "loss": 1.5762, "lr": 5e-05, "epoch": 2.622038511946769, "percentage": 87.42, "elapsed_time": "13:08:38", "remaining_time": "1:53:29"}
2600
+ {"current_steps": 2600, "total_steps": 2973, "loss": 1.5861, "lr": 5e-05, "epoch": 2.6230466780925497, "percentage": 87.45, "elapsed_time": "13:08:56", "remaining_time": "1:53:10"}
2601
+ {"current_steps": 2601, "total_steps": 2973, "loss": 1.576, "lr": 5e-05, "epoch": 2.6240548442383305, "percentage": 87.49, "elapsed_time": "13:09:14", "remaining_time": "1:52:52"}
2602
+ {"current_steps": 2602, "total_steps": 2973, "loss": 1.5764, "lr": 5e-05, "epoch": 2.6250630103841113, "percentage": 87.52, "elapsed_time": "13:09:32", "remaining_time": "1:52:34"}
2603
+ {"current_steps": 2603, "total_steps": 2973, "loss": 1.5547, "lr": 5e-05, "epoch": 2.626071176529892, "percentage": 87.55, "elapsed_time": "13:09:50", "remaining_time": "1:52:16"}
2604
+ {"current_steps": 2604, "total_steps": 2973, "loss": 1.5685, "lr": 5e-05, "epoch": 2.627079342675673, "percentage": 87.59, "elapsed_time": "13:10:08", "remaining_time": "1:51:58"}
2605
+ {"current_steps": 2605, "total_steps": 2973, "loss": 1.5758, "lr": 5e-05, "epoch": 2.6280875088214537, "percentage": 87.62, "elapsed_time": "13:10:26", "remaining_time": "1:51:39"}
2606
+ {"current_steps": 2606, "total_steps": 2973, "loss": 1.5736, "lr": 5e-05, "epoch": 2.6290956749672345, "percentage": 87.66, "elapsed_time": "13:10:44", "remaining_time": "1:51:21"}
2607
+ {"current_steps": 2607, "total_steps": 2973, "loss": 1.5663, "lr": 5e-05, "epoch": 2.6301038411130153, "percentage": 87.69, "elapsed_time": "13:11:03", "remaining_time": "1:51:03"}
2608
+ {"current_steps": 2608, "total_steps": 2973, "loss": 1.5559, "lr": 5e-05, "epoch": 2.631112007258796, "percentage": 87.72, "elapsed_time": "13:11:21", "remaining_time": "1:50:45"}
2609
+ {"current_steps": 2609, "total_steps": 2973, "loss": 1.5378, "lr": 5e-05, "epoch": 2.632120173404577, "percentage": 87.76, "elapsed_time": "13:11:39", "remaining_time": "1:50:26"}
2610
+ {"current_steps": 2610, "total_steps": 2973, "loss": 1.5657, "lr": 5e-05, "epoch": 2.6331283395503577, "percentage": 87.79, "elapsed_time": "13:11:57", "remaining_time": "1:50:08"}
2611
+ {"current_steps": 2611, "total_steps": 2973, "loss": 1.5607, "lr": 5e-05, "epoch": 2.634136505696139, "percentage": 87.82, "elapsed_time": "13:12:15", "remaining_time": "1:49:50"}
2612
+ {"current_steps": 2612, "total_steps": 2973, "loss": 1.5773, "lr": 5e-05, "epoch": 2.6351446718419194, "percentage": 87.86, "elapsed_time": "13:12:33", "remaining_time": "1:49:32"}
2613
+ {"current_steps": 2613, "total_steps": 2973, "loss": 1.5687, "lr": 5e-05, "epoch": 2.6361528379877006, "percentage": 87.89, "elapsed_time": "13:12:51", "remaining_time": "1:49:14"}
2614
+ {"current_steps": 2614, "total_steps": 2973, "loss": 1.5761, "lr": 5e-05, "epoch": 2.637161004133481, "percentage": 87.92, "elapsed_time": "13:13:09", "remaining_time": "1:48:55"}
2615
+ {"current_steps": 2615, "total_steps": 2973, "loss": 1.5715, "lr": 5e-05, "epoch": 2.6381691702792622, "percentage": 87.96, "elapsed_time": "13:13:27", "remaining_time": "1:48:37"}
2616
+ {"current_steps": 2616, "total_steps": 2973, "loss": 1.5764, "lr": 5e-05, "epoch": 2.6391773364250426, "percentage": 87.99, "elapsed_time": "13:13:46", "remaining_time": "1:48:19"}
2617
+ {"current_steps": 2617, "total_steps": 2973, "loss": 1.5734, "lr": 5e-05, "epoch": 2.640185502570824, "percentage": 88.03, "elapsed_time": "13:14:04", "remaining_time": "1:48:01"}
2618
+ {"current_steps": 2618, "total_steps": 2973, "loss": 1.5752, "lr": 5e-05, "epoch": 2.6411936687166047, "percentage": 88.06, "elapsed_time": "13:14:22", "remaining_time": "1:47:42"}
2619
+ {"current_steps": 2619, "total_steps": 2973, "loss": 1.5752, "lr": 5e-05, "epoch": 2.6422018348623855, "percentage": 88.09, "elapsed_time": "13:14:40", "remaining_time": "1:47:24"}
2620
+ {"current_steps": 2620, "total_steps": 2973, "loss": 1.5548, "lr": 5e-05, "epoch": 2.6432100010081663, "percentage": 88.13, "elapsed_time": "13:14:58", "remaining_time": "1:47:06"}
2621
+ {"current_steps": 2621, "total_steps": 2973, "loss": 1.5782, "lr": 5e-05, "epoch": 2.644218167153947, "percentage": 88.16, "elapsed_time": "13:15:16", "remaining_time": "1:46:48"}
2622
+ {"current_steps": 2622, "total_steps": 2973, "loss": 1.5309, "lr": 5e-05, "epoch": 2.645226333299728, "percentage": 88.19, "elapsed_time": "13:15:34", "remaining_time": "1:46:30"}
2623
+ {"current_steps": 2623, "total_steps": 2973, "loss": 1.5609, "lr": 5e-05, "epoch": 2.6462344994455087, "percentage": 88.23, "elapsed_time": "13:15:52", "remaining_time": "1:46:11"}
2624
+ {"current_steps": 2624, "total_steps": 2973, "loss": 1.5662, "lr": 5e-05, "epoch": 2.6472426655912895, "percentage": 88.26, "elapsed_time": "13:16:11", "remaining_time": "1:45:53"}
2625
+ {"current_steps": 2625, "total_steps": 2973, "loss": 1.5715, "lr": 5e-05, "epoch": 2.6482508317370703, "percentage": 88.29, "elapsed_time": "13:16:29", "remaining_time": "1:45:35"}
2626
+ {"current_steps": 2626, "total_steps": 2973, "loss": 1.5576, "lr": 5e-05, "epoch": 2.649258997882851, "percentage": 88.33, "elapsed_time": "13:16:47", "remaining_time": "1:45:17"}
2627
+ {"current_steps": 2627, "total_steps": 2973, "loss": 1.5654, "lr": 5e-05, "epoch": 2.650267164028632, "percentage": 88.36, "elapsed_time": "13:17:05", "remaining_time": "1:44:59"}
2628
+ {"current_steps": 2628, "total_steps": 2973, "loss": 1.5482, "lr": 5e-05, "epoch": 2.6512753301744127, "percentage": 88.4, "elapsed_time": "13:17:23", "remaining_time": "1:44:40"}
2629
+ {"current_steps": 2629, "total_steps": 2973, "loss": 1.5737, "lr": 5e-05, "epoch": 2.6522834963201936, "percentage": 88.43, "elapsed_time": "13:17:41", "remaining_time": "1:44:22"}
2630
+ {"current_steps": 2630, "total_steps": 2973, "loss": 1.5883, "lr": 5e-05, "epoch": 2.6532916624659744, "percentage": 88.46, "elapsed_time": "13:17:59", "remaining_time": "1:44:04"}
2631
+ {"current_steps": 2631, "total_steps": 2973, "loss": 1.5725, "lr": 5e-05, "epoch": 2.654299828611755, "percentage": 88.5, "elapsed_time": "13:18:17", "remaining_time": "1:43:46"}
2632
+ {"current_steps": 2632, "total_steps": 2973, "loss": 1.5558, "lr": 5e-05, "epoch": 2.655307994757536, "percentage": 88.53, "elapsed_time": "13:18:35", "remaining_time": "1:43:27"}
2633
+ {"current_steps": 2633, "total_steps": 2973, "loss": 1.5665, "lr": 5e-05, "epoch": 2.656316160903317, "percentage": 88.56, "elapsed_time": "13:18:54", "remaining_time": "1:43:09"}
2634
+ {"current_steps": 2634, "total_steps": 2973, "loss": 1.5636, "lr": 5e-05, "epoch": 2.6573243270490976, "percentage": 88.6, "elapsed_time": "13:19:12", "remaining_time": "1:42:51"}
2635
+ {"current_steps": 2635, "total_steps": 2973, "loss": 1.5716, "lr": 5e-05, "epoch": 2.6583324931948784, "percentage": 88.63, "elapsed_time": "13:19:30", "remaining_time": "1:42:33"}
2636
+ {"current_steps": 2636, "total_steps": 2973, "loss": 1.5658, "lr": 5e-05, "epoch": 2.659340659340659, "percentage": 88.66, "elapsed_time": "13:19:48", "remaining_time": "1:42:15"}
2637
+ {"current_steps": 2637, "total_steps": 2973, "loss": 1.5583, "lr": 5e-05, "epoch": 2.66034882548644, "percentage": 88.7, "elapsed_time": "13:20:06", "remaining_time": "1:41:56"}
2638
+ {"current_steps": 2638, "total_steps": 2973, "loss": 1.5822, "lr": 5e-05, "epoch": 2.661356991632221, "percentage": 88.73, "elapsed_time": "13:20:24", "remaining_time": "1:41:38"}
2639
+ {"current_steps": 2639, "total_steps": 2973, "loss": 1.5895, "lr": 5e-05, "epoch": 2.6623651577780016, "percentage": 88.77, "elapsed_time": "13:20:42", "remaining_time": "1:41:20"}
2640
+ {"current_steps": 2640, "total_steps": 2973, "loss": 1.5786, "lr": 5e-05, "epoch": 2.663373323923783, "percentage": 88.8, "elapsed_time": "13:21:00", "remaining_time": "1:41:02"}
2641
+ {"current_steps": 2641, "total_steps": 2973, "loss": 1.5556, "lr": 5e-05, "epoch": 2.6643814900695633, "percentage": 88.83, "elapsed_time": "13:21:18", "remaining_time": "1:40:43"}
2642
+ {"current_steps": 2642, "total_steps": 2973, "loss": 1.5697, "lr": 5e-05, "epoch": 2.6653896562153445, "percentage": 88.87, "elapsed_time": "13:21:36", "remaining_time": "1:40:25"}
2643
+ {"current_steps": 2643, "total_steps": 2973, "loss": 1.5632, "lr": 5e-05, "epoch": 2.666397822361125, "percentage": 88.9, "elapsed_time": "13:21:55", "remaining_time": "1:40:07"}
2644
+ {"current_steps": 2644, "total_steps": 2973, "loss": 1.5613, "lr": 5e-05, "epoch": 2.667405988506906, "percentage": 88.93, "elapsed_time": "13:22:13", "remaining_time": "1:39:49"}
2645
+ {"current_steps": 2645, "total_steps": 2973, "loss": 1.5725, "lr": 5e-05, "epoch": 2.6684141546526865, "percentage": 88.97, "elapsed_time": "13:22:31", "remaining_time": "1:39:31"}
2646
+ {"current_steps": 2646, "total_steps": 2973, "loss": 1.5797, "lr": 5e-05, "epoch": 2.6694223207984678, "percentage": 89.0, "elapsed_time": "13:22:49", "remaining_time": "1:39:12"}
2647
+ {"current_steps": 2647, "total_steps": 2973, "loss": 1.5517, "lr": 5e-05, "epoch": 2.6704304869442486, "percentage": 89.03, "elapsed_time": "13:23:07", "remaining_time": "1:38:54"}
2648
+ {"current_steps": 2648, "total_steps": 2973, "loss": 1.5689, "lr": 5e-05, "epoch": 2.6714386530900294, "percentage": 89.07, "elapsed_time": "13:23:25", "remaining_time": "1:38:36"}
2649
+ {"current_steps": 2649, "total_steps": 2973, "loss": 1.5439, "lr": 5e-05, "epoch": 2.67244681923581, "percentage": 89.1, "elapsed_time": "13:23:43", "remaining_time": "1:38:18"}
2650
+ {"current_steps": 2650, "total_steps": 2973, "loss": 1.5605, "lr": 5e-05, "epoch": 2.673454985381591, "percentage": 89.14, "elapsed_time": "13:24:01", "remaining_time": "1:38:00"}
2651
+ {"current_steps": 2651, "total_steps": 2973, "loss": 1.5474, "lr": 5e-05, "epoch": 2.674463151527372, "percentage": 89.17, "elapsed_time": "13:24:19", "remaining_time": "1:37:41"}
2652
+ {"current_steps": 2652, "total_steps": 2973, "loss": 1.562, "lr": 5e-05, "epoch": 2.6754713176731526, "percentage": 89.2, "elapsed_time": "13:24:38", "remaining_time": "1:37:23"}
2653
+ {"current_steps": 2653, "total_steps": 2973, "loss": 1.5788, "lr": 5e-05, "epoch": 2.6764794838189334, "percentage": 89.24, "elapsed_time": "13:24:56", "remaining_time": "1:37:05"}
2654
+ {"current_steps": 2654, "total_steps": 2973, "loss": 1.5809, "lr": 5e-05, "epoch": 2.6774876499647142, "percentage": 89.27, "elapsed_time": "13:25:14", "remaining_time": "1:36:47"}
2655
+ {"current_steps": 2655, "total_steps": 2973, "loss": 1.568, "lr": 5e-05, "epoch": 2.678495816110495, "percentage": 89.3, "elapsed_time": "13:25:32", "remaining_time": "1:36:28"}
2656
+ {"current_steps": 2656, "total_steps": 2973, "loss": 1.5826, "lr": 5e-05, "epoch": 2.679503982256276, "percentage": 89.34, "elapsed_time": "13:25:50", "remaining_time": "1:36:10"}
2657
+ {"current_steps": 2657, "total_steps": 2973, "loss": 1.5479, "lr": 5e-05, "epoch": 2.6805121484020566, "percentage": 89.37, "elapsed_time": "13:26:08", "remaining_time": "1:35:52"}
2658
+ {"current_steps": 2658, "total_steps": 2973, "loss": 1.5753, "lr": 5e-05, "epoch": 2.6815203145478375, "percentage": 89.4, "elapsed_time": "13:26:26", "remaining_time": "1:35:34"}
2659
+ {"current_steps": 2659, "total_steps": 2973, "loss": 1.5556, "lr": 5e-05, "epoch": 2.6825284806936183, "percentage": 89.44, "elapsed_time": "13:26:44", "remaining_time": "1:35:16"}
2660
+ {"current_steps": 2660, "total_steps": 2973, "loss": 1.5747, "lr": 5e-05, "epoch": 2.683536646839399, "percentage": 89.47, "elapsed_time": "13:27:02", "remaining_time": "1:34:57"}
2661
+ {"current_steps": 2661, "total_steps": 2973, "loss": 1.5687, "lr": 5e-05, "epoch": 2.68454481298518, "percentage": 89.51, "elapsed_time": "13:27:21", "remaining_time": "1:34:39"}
2662
+ {"current_steps": 2662, "total_steps": 2973, "loss": 1.5771, "lr": 5e-05, "epoch": 2.6855529791309607, "percentage": 89.54, "elapsed_time": "13:27:39", "remaining_time": "1:34:21"}
2663
+ {"current_steps": 2663, "total_steps": 2973, "loss": 1.5646, "lr": 5e-05, "epoch": 2.6865611452767415, "percentage": 89.57, "elapsed_time": "13:27:57", "remaining_time": "1:34:03"}
2664
+ {"current_steps": 2664, "total_steps": 2973, "loss": 1.5576, "lr": 5e-05, "epoch": 2.6875693114225223, "percentage": 89.61, "elapsed_time": "13:28:15", "remaining_time": "1:33:45"}
2665
+ {"current_steps": 2665, "total_steps": 2973, "loss": 1.5728, "lr": 5e-05, "epoch": 2.688577477568303, "percentage": 89.64, "elapsed_time": "13:28:33", "remaining_time": "1:33:26"}
2666
+ {"current_steps": 2666, "total_steps": 2973, "loss": 1.566, "lr": 5e-05, "epoch": 2.689585643714084, "percentage": 89.67, "elapsed_time": "13:28:51", "remaining_time": "1:33:08"}
2667
+ {"current_steps": 2667, "total_steps": 2973, "loss": 1.569, "lr": 5e-05, "epoch": 2.690593809859865, "percentage": 89.71, "elapsed_time": "13:29:09", "remaining_time": "1:32:50"}
2668
+ {"current_steps": 2668, "total_steps": 2973, "loss": 1.5996, "lr": 5e-05, "epoch": 2.6916019760056455, "percentage": 89.74, "elapsed_time": "13:29:27", "remaining_time": "1:32:32"}
2669
+ {"current_steps": 2669, "total_steps": 2973, "loss": 1.5783, "lr": 5e-05, "epoch": 2.692610142151427, "percentage": 89.77, "elapsed_time": "13:29:45", "remaining_time": "1:32:13"}
2670
+ {"current_steps": 2670, "total_steps": 2973, "loss": 1.5763, "lr": 5e-05, "epoch": 2.693618308297207, "percentage": 89.81, "elapsed_time": "13:30:04", "remaining_time": "1:31:55"}
2671
+ {"current_steps": 2671, "total_steps": 2973, "loss": 1.5723, "lr": 5e-05, "epoch": 2.6946264744429884, "percentage": 89.84, "elapsed_time": "13:30:22", "remaining_time": "1:31:37"}
2672
+ {"current_steps": 2672, "total_steps": 2973, "loss": 1.5641, "lr": 5e-05, "epoch": 2.695634640588769, "percentage": 89.88, "elapsed_time": "13:30:40", "remaining_time": "1:31:19"}
2673
+ {"current_steps": 2673, "total_steps": 2973, "loss": 1.5447, "lr": 5e-05, "epoch": 2.69664280673455, "percentage": 89.91, "elapsed_time": "13:30:58", "remaining_time": "1:31:01"}
2674
+ {"current_steps": 2674, "total_steps": 2973, "loss": 1.5708, "lr": 5e-05, "epoch": 2.697650972880331, "percentage": 89.94, "elapsed_time": "13:31:16", "remaining_time": "1:30:42"}
2675
+ {"current_steps": 2675, "total_steps": 2973, "loss": 1.5494, "lr": 5e-05, "epoch": 2.6986591390261117, "percentage": 89.98, "elapsed_time": "13:31:34", "remaining_time": "1:30:24"}
2676
+ {"current_steps": 2676, "total_steps": 2973, "loss": 1.5595, "lr": 5e-05, "epoch": 2.6996673051718925, "percentage": 90.01, "elapsed_time": "13:31:52", "remaining_time": "1:30:06"}
2677
+ {"current_steps": 2677, "total_steps": 2973, "loss": 1.5817, "lr": 5e-05, "epoch": 2.7006754713176733, "percentage": 90.04, "elapsed_time": "13:32:10", "remaining_time": "1:29:48"}
2678
+ {"current_steps": 2678, "total_steps": 2973, "loss": 1.5635, "lr": 5e-05, "epoch": 2.701683637463454, "percentage": 90.08, "elapsed_time": "13:32:28", "remaining_time": "1:29:30"}
2679
+ {"current_steps": 2679, "total_steps": 2973, "loss": 1.5825, "lr": 5e-05, "epoch": 2.702691803609235, "percentage": 90.11, "elapsed_time": "13:32:47", "remaining_time": "1:29:11"}
2680
+ {"current_steps": 2680, "total_steps": 2973, "loss": 1.5512, "lr": 5e-05, "epoch": 2.7036999697550157, "percentage": 90.14, "elapsed_time": "13:33:05", "remaining_time": "1:28:53"}
2681
+ {"current_steps": 2681, "total_steps": 2973, "loss": 1.5653, "lr": 5e-05, "epoch": 2.7047081359007965, "percentage": 90.18, "elapsed_time": "13:33:23", "remaining_time": "1:28:35"}
2682
+ {"current_steps": 2682, "total_steps": 2973, "loss": 1.5673, "lr": 5e-05, "epoch": 2.7057163020465773, "percentage": 90.21, "elapsed_time": "13:33:41", "remaining_time": "1:28:17"}
2683
+ {"current_steps": 2683, "total_steps": 2973, "loss": 1.5799, "lr": 5e-05, "epoch": 2.706724468192358, "percentage": 90.25, "elapsed_time": "13:33:59", "remaining_time": "1:27:58"}
2684
+ {"current_steps": 2684, "total_steps": 2973, "loss": 1.5618, "lr": 5e-05, "epoch": 2.707732634338139, "percentage": 90.28, "elapsed_time": "13:34:17", "remaining_time": "1:27:40"}
2685
+ {"current_steps": 2685, "total_steps": 2973, "loss": 1.5648, "lr": 5e-05, "epoch": 2.7087408004839197, "percentage": 90.31, "elapsed_time": "13:34:35", "remaining_time": "1:27:22"}
2686
+ {"current_steps": 2686, "total_steps": 2973, "loss": 1.5626, "lr": 5e-05, "epoch": 2.7097489666297006, "percentage": 90.35, "elapsed_time": "13:34:53", "remaining_time": "1:27:04"}
2687
+ {"current_steps": 2687, "total_steps": 2973, "loss": 1.5609, "lr": 5e-05, "epoch": 2.7107571327754814, "percentage": 90.38, "elapsed_time": "13:35:12", "remaining_time": "1:26:46"}
2688
+ {"current_steps": 2688, "total_steps": 2973, "loss": 1.5655, "lr": 5e-05, "epoch": 2.711765298921262, "percentage": 90.41, "elapsed_time": "13:35:30", "remaining_time": "1:26:27"}
2689
+ {"current_steps": 2689, "total_steps": 2973, "loss": 1.5831, "lr": 5e-05, "epoch": 2.712773465067043, "percentage": 90.45, "elapsed_time": "13:35:48", "remaining_time": "1:26:09"}
2690
+ {"current_steps": 2690, "total_steps": 2973, "loss": 1.5663, "lr": 5e-05, "epoch": 2.713781631212824, "percentage": 90.48, "elapsed_time": "13:36:06", "remaining_time": "1:25:51"}
2691
+ {"current_steps": 2691, "total_steps": 2973, "loss": 1.5647, "lr": 5e-05, "epoch": 2.7147897973586046, "percentage": 90.51, "elapsed_time": "13:36:24", "remaining_time": "1:25:33"}
2692
+ {"current_steps": 2692, "total_steps": 2973, "loss": 1.5717, "lr": 5e-05, "epoch": 2.7157979635043854, "percentage": 90.55, "elapsed_time": "13:36:42", "remaining_time": "1:25:15"}
2693
+ {"current_steps": 2693, "total_steps": 2973, "loss": 1.5749, "lr": 5e-05, "epoch": 2.716806129650166, "percentage": 90.58, "elapsed_time": "13:37:00", "remaining_time": "1:24:56"}
2694
+ {"current_steps": 2694, "total_steps": 2973, "loss": 1.5693, "lr": 5e-05, "epoch": 2.717814295795947, "percentage": 90.62, "elapsed_time": "13:37:18", "remaining_time": "1:24:38"}
2695
+ {"current_steps": 2695, "total_steps": 2973, "loss": 1.5709, "lr": 5e-05, "epoch": 2.718822461941728, "percentage": 90.65, "elapsed_time": "13:37:37", "remaining_time": "1:24:20"}
2696
+ {"current_steps": 2696, "total_steps": 2973, "loss": 1.5669, "lr": 5e-05, "epoch": 2.719830628087509, "percentage": 90.68, "elapsed_time": "13:37:55", "remaining_time": "1:24:02"}
2697
+ {"current_steps": 2697, "total_steps": 2973, "loss": 1.5893, "lr": 5e-05, "epoch": 2.7208387942332894, "percentage": 90.72, "elapsed_time": "13:38:13", "remaining_time": "1:23:43"}
2698
+ {"current_steps": 2698, "total_steps": 2973, "loss": 1.5695, "lr": 5e-05, "epoch": 2.7218469603790707, "percentage": 90.75, "elapsed_time": "13:38:31", "remaining_time": "1:23:25"}
2699
+ {"current_steps": 2699, "total_steps": 2973, "loss": 1.5581, "lr": 5e-05, "epoch": 2.722855126524851, "percentage": 90.78, "elapsed_time": "13:38:49", "remaining_time": "1:23:07"}
2700
+ {"current_steps": 2700, "total_steps": 2973, "loss": 1.5528, "lr": 5e-05, "epoch": 2.7238632926706323, "percentage": 90.82, "elapsed_time": "13:39:07", "remaining_time": "1:22:49"}
2701
+ {"current_steps": 2701, "total_steps": 2973, "loss": 1.5704, "lr": 5e-05, "epoch": 2.7248714588164127, "percentage": 90.85, "elapsed_time": "13:39:35", "remaining_time": "1:22:32"}
2702
+ {"current_steps": 2702, "total_steps": 2973, "loss": 1.593, "lr": 5e-05, "epoch": 2.725879624962194, "percentage": 90.88, "elapsed_time": "13:39:53", "remaining_time": "1:22:13"}