chancharikm commited on
Commit
848eea8
·
verified ·
1 Parent(s): 1c14a2c

Training in progress, step 600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eeffacdc935efb322f1c9780ab304b2632dec0ff6538a73ca8eaea9b017aabeb
3
  size 4998056552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c7328d9e1f45351312f0574ab9b50cc0739c85c9a860a7ef8ec98e51a13393
3
  size 4998056552
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d950f49cb1d1231086ec05e5758fae16a233257120f5fc67af9bf590bdc768f
3
  size 4915962464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bfb52488190ea3cf4ded5e45301f704ebd5bf10eb7b5b465f8d553e5090d505
3
  size 4915962464
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b16f671b09b713bd2bce1808ec381833c0574ba6161b3e138386c2fd590ee36f
3
  size 4915962496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca3d879bfaf76c6064fd3dabe79ff3a9f374c38f77f4a00d18e34cedfbabfd55
3
  size 4915962496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e87f1b1b8452e84386b7bf7b159bc2dbb1e6436187751d6cf74c9dce93938556
3
  size 2704357976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76fed592470092909399a550e3bf05f250cb2e02fe17c96e925b503becd41b31
3
  size 2704357976
trainer_log.jsonl CHANGED
@@ -548,3 +548,53 @@
548
  {"current_steps": 548, "total_steps": 741, "loss": 0.0099, "lr": 5.292729615185637e-06, "epoch": 2.2190669371196754, "percentage": 73.95, "elapsed_time": "2 days, 0:16:20", "remaining_time": "17:00:03"}
549
  {"current_steps": 549, "total_steps": 741, "loss": 0.0129, "lr": 5.241723668827937e-06, "epoch": 2.2231237322515214, "percentage": 74.09, "elapsed_time": "2 days, 0:21:33", "remaining_time": "16:54:45"}
550
  {"current_steps": 550, "total_steps": 741, "loss": 0.0126, "lr": 5.190912599873818e-06, "epoch": 2.227180527383367, "percentage": 74.22, "elapsed_time": "2 days, 0:26:41", "remaining_time": "16:49:24"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
548
  {"current_steps": 548, "total_steps": 741, "loss": 0.0099, "lr": 5.292729615185637e-06, "epoch": 2.2190669371196754, "percentage": 73.95, "elapsed_time": "2 days, 0:16:20", "remaining_time": "17:00:03"}
549
  {"current_steps": 549, "total_steps": 741, "loss": 0.0129, "lr": 5.241723668827937e-06, "epoch": 2.2231237322515214, "percentage": 74.09, "elapsed_time": "2 days, 0:21:33", "remaining_time": "16:54:45"}
550
  {"current_steps": 550, "total_steps": 741, "loss": 0.0126, "lr": 5.190912599873818e-06, "epoch": 2.227180527383367, "percentage": 74.22, "elapsed_time": "2 days, 0:26:41", "remaining_time": "16:49:24"}
551
+ {"current_steps": 551, "total_steps": 741, "loss": 0.0108, "lr": 5.14029742304441e-06, "epoch": 2.231237322515213, "percentage": 74.36, "elapsed_time": "2 days, 0:32:31", "remaining_time": "16:44:19"}
552
+ {"current_steps": 552, "total_steps": 741, "loss": 0.0117, "lr": 5.089879149148781e-06, "epoch": 2.235294117647059, "percentage": 74.49, "elapsed_time": "2 days, 0:37:22", "remaining_time": "16:38:52"}
553
+ {"current_steps": 553, "total_steps": 741, "loss": 0.0091, "lr": 5.0396587850637554e-06, "epoch": 2.239350912778905, "percentage": 74.63, "elapsed_time": "2 days, 0:42:35", "remaining_time": "16:33:34"}
554
+ {"current_steps": 554, "total_steps": 741, "loss": 0.01, "lr": 4.989637333713814e-06, "epoch": 2.2434077079107504, "percentage": 74.76, "elapsed_time": "2 days, 0:47:35", "remaining_time": "16:28:11"}
555
+ {"current_steps": 555, "total_steps": 741, "loss": 0.0111, "lr": 4.93981579405105e-06, "epoch": 2.2474645030425964, "percentage": 74.9, "elapsed_time": "2 days, 0:53:06", "remaining_time": "16:22:59"}
556
+ {"current_steps": 556, "total_steps": 741, "loss": 0.0093, "lr": 4.89019516103522e-06, "epoch": 2.2515212981744424, "percentage": 75.03, "elapsed_time": "2 days, 0:58:35", "remaining_time": "16:17:46"}
557
+ {"current_steps": 557, "total_steps": 741, "loss": 0.014, "lr": 4.840776425613887e-06, "epoch": 2.255578093306288, "percentage": 75.17, "elapsed_time": "2 days, 1:03:43", "remaining_time": "16:12:25"}
558
+ {"current_steps": 558, "total_steps": 741, "loss": 0.0082, "lr": 4.791560574702614e-06, "epoch": 2.259634888438134, "percentage": 75.3, "elapsed_time": "2 days, 1:08:35", "remaining_time": "16:07:00"}
559
+ {"current_steps": 559, "total_steps": 741, "loss": 0.0145, "lr": 4.742548591165289e-06, "epoch": 2.26369168356998, "percentage": 75.44, "elapsed_time": "2 days, 1:14:27", "remaining_time": "16:01:54"}
560
+ {"current_steps": 560, "total_steps": 741, "loss": 0.0133, "lr": 4.693741453794433e-06, "epoch": 2.2677484787018254, "percentage": 75.57, "elapsed_time": "2 days, 1:19:49", "remaining_time": "15:56:39"}
561
+ {"current_steps": 561, "total_steps": 741, "loss": 0.0099, "lr": 4.6451401372917275e-06, "epoch": 2.2718052738336714, "percentage": 75.71, "elapsed_time": "2 days, 1:25:20", "remaining_time": "15:51:26"}
562
+ {"current_steps": 562, "total_steps": 741, "loss": 0.01, "lr": 4.596745612248488e-06, "epoch": 2.2758620689655173, "percentage": 75.84, "elapsed_time": "2 days, 1:30:54", "remaining_time": "15:46:15"}
563
+ {"current_steps": 563, "total_steps": 741, "loss": 0.0133, "lr": 4.548558845126334e-06, "epoch": 2.279918864097363, "percentage": 75.98, "elapsed_time": "2 days, 1:36:05", "remaining_time": "15:40:55"}
564
+ {"current_steps": 564, "total_steps": 741, "loss": 0.0112, "lr": 4.500580798237831e-06, "epoch": 2.283975659229209, "percentage": 76.11, "elapsed_time": "2 days, 1:41:32", "remaining_time": "15:35:41"}
565
+ {"current_steps": 565, "total_steps": 741, "loss": 0.0102, "lr": 4.452812429727313e-06, "epoch": 2.288032454361055, "percentage": 76.25, "elapsed_time": "2 days, 1:46:41", "remaining_time": "15:30:21"}
566
+ {"current_steps": 566, "total_steps": 741, "loss": 0.0129, "lr": 4.405254693551754e-06, "epoch": 2.292089249492901, "percentage": 76.38, "elapsed_time": "2 days, 1:51:21", "remaining_time": "15:24:53"}
567
+ {"current_steps": 567, "total_steps": 741, "loss": 0.008, "lr": 4.357908539461679e-06, "epoch": 2.2961460446247464, "percentage": 76.52, "elapsed_time": "2 days, 1:56:43", "remaining_time": "15:19:37"}
568
+ {"current_steps": 568, "total_steps": 741, "loss": 0.0144, "lr": 4.310774912982227e-06, "epoch": 2.3002028397565923, "percentage": 76.65, "elapsed_time": "2 days, 2:01:55", "remaining_time": "15:14:19"}
569
+ {"current_steps": 569, "total_steps": 741, "loss": 0.0089, "lr": 4.263854755394256e-06, "epoch": 2.3042596348884383, "percentage": 76.79, "elapsed_time": "2 days, 2:06:55", "remaining_time": "15:08:56"}
570
+ {"current_steps": 570, "total_steps": 741, "loss": 0.012, "lr": 4.21714900371556e-06, "epoch": 2.308316430020284, "percentage": 76.92, "elapsed_time": "2 days, 2:12:11", "remaining_time": "15:03:39"}
571
+ {"current_steps": 571, "total_steps": 741, "loss": 0.0082, "lr": 4.170658590682134e-06, "epoch": 2.31237322515213, "percentage": 77.06, "elapsed_time": "2 days, 2:17:29", "remaining_time": "14:58:22"}
572
+ {"current_steps": 572, "total_steps": 741, "loss": 0.0089, "lr": 4.124384444729561e-06, "epoch": 2.316430020283976, "percentage": 77.19, "elapsed_time": "2 days, 2:22:31", "remaining_time": "14:53:01"}
573
+ {"current_steps": 573, "total_steps": 741, "loss": 0.0113, "lr": 4.078327489974466e-06, "epoch": 2.3204868154158214, "percentage": 77.33, "elapsed_time": "2 days, 2:28:22", "remaining_time": "14:47:53"}
574
+ {"current_steps": 574, "total_steps": 741, "loss": 0.0101, "lr": 4.032488646196077e-06, "epoch": 2.3245436105476673, "percentage": 77.46, "elapsed_time": "2 days, 2:33:29", "remaining_time": "14:42:34"}
575
+ {"current_steps": 575, "total_steps": 741, "loss": 0.0082, "lr": 3.986868828817818e-06, "epoch": 2.3286004056795133, "percentage": 77.6, "elapsed_time": "2 days, 2:38:56", "remaining_time": "14:37:19"}
576
+ {"current_steps": 576, "total_steps": 741, "loss": 0.0068, "lr": 3.941468948889067e-06, "epoch": 2.332657200811359, "percentage": 77.73, "elapsed_time": "2 days, 2:44:25", "remaining_time": "14:32:06"}
577
+ {"current_steps": 577, "total_steps": 741, "loss": 0.0108, "lr": 3.8962899130669525e-06, "epoch": 2.336713995943205, "percentage": 77.87, "elapsed_time": "2 days, 2:49:46", "remaining_time": "14:26:50"}
578
+ {"current_steps": 578, "total_steps": 741, "loss": 0.0123, "lr": 3.851332623598227e-06, "epoch": 2.340770791075051, "percentage": 78.0, "elapsed_time": "2 days, 2:55:35", "remaining_time": "14:21:41"}
579
+ {"current_steps": 579, "total_steps": 741, "loss": 0.0112, "lr": 3.8065979783012746e-06, "epoch": 2.344827586206897, "percentage": 78.14, "elapsed_time": "2 days, 3:01:17", "remaining_time": "14:16:31"}
580
+ {"current_steps": 580, "total_steps": 741, "loss": 0.0079, "lr": 3.7620868705481586e-06, "epoch": 2.3488843813387423, "percentage": 78.27, "elapsed_time": "2 days, 3:06:27", "remaining_time": "14:11:12"}
581
+ {"current_steps": 581, "total_steps": 741, "loss": 0.0079, "lr": 3.717800189246807e-06, "epoch": 2.3529411764705883, "percentage": 78.41, "elapsed_time": "2 days, 3:11:24", "remaining_time": "14:05:49"}
582
+ {"current_steps": 582, "total_steps": 741, "loss": 0.0083, "lr": 3.6737388188232305e-06, "epoch": 2.356997971602434, "percentage": 78.54, "elapsed_time": "2 days, 3:16:51", "remaining_time": "14:00:34"}
583
+ {"current_steps": 583, "total_steps": 741, "loss": 0.0083, "lr": 3.629903639203884e-06, "epoch": 2.36105476673428, "percentage": 78.68, "elapsed_time": "2 days, 3:21:45", "remaining_time": "13:55:11"}
584
+ {"current_steps": 584, "total_steps": 741, "loss": 0.0117, "lr": 3.5862955257980813e-06, "epoch": 2.365111561866126, "percentage": 78.81, "elapsed_time": "2 days, 3:26:53", "remaining_time": "13:49:52"}
585
+ {"current_steps": 585, "total_steps": 741, "loss": 0.0123, "lr": 3.5429153494805087e-06, "epoch": 2.369168356997972, "percentage": 78.95, "elapsed_time": "2 days, 3:32:41", "remaining_time": "13:44:42"}
586
+ {"current_steps": 586, "total_steps": 741, "loss": 0.0108, "lr": 3.499763976573866e-06, "epoch": 2.3732251521298173, "percentage": 79.08, "elapsed_time": "2 days, 3:37:38", "remaining_time": "13:39:20"}
587
+ {"current_steps": 587, "total_steps": 741, "loss": 0.0142, "lr": 3.4568422688315027e-06, "epoch": 2.3772819472616633, "percentage": 79.22, "elapsed_time": "2 days, 3:42:41", "remaining_time": "13:33:59"}
588
+ {"current_steps": 588, "total_steps": 741, "loss": 0.0091, "lr": 3.41415108342028e-06, "epoch": 2.3813387423935093, "percentage": 79.35, "elapsed_time": "2 days, 3:47:35", "remaining_time": "13:28:36"}
589
+ {"current_steps": 589, "total_steps": 741, "loss": 0.0072, "lr": 3.371691272903398e-06, "epoch": 2.385395537525355, "percentage": 79.49, "elapsed_time": "2 days, 3:53:01", "remaining_time": "13:23:21"}
590
+ {"current_steps": 590, "total_steps": 741, "loss": 0.01, "lr": 3.329463685223411e-06, "epoch": 2.389452332657201, "percentage": 79.62, "elapsed_time": "2 days, 3:58:16", "remaining_time": "13:18:04"}
591
+ {"current_steps": 591, "total_steps": 741, "loss": 0.0078, "lr": 3.287469163685241e-06, "epoch": 2.393509127789047, "percentage": 79.76, "elapsed_time": "2 days, 4:03:58", "remaining_time": "13:12:53"}
592
+ {"current_steps": 592, "total_steps": 741, "loss": 0.0098, "lr": 3.2457085469394015e-06, "epoch": 2.3975659229208923, "percentage": 79.89, "elapsed_time": "2 days, 4:09:33", "remaining_time": "13:07:40"}
593
+ {"current_steps": 593, "total_steps": 741, "loss": 0.0093, "lr": 3.204182668965198e-06, "epoch": 2.4016227180527383, "percentage": 80.03, "elapsed_time": "2 days, 4:15:20", "remaining_time": "13:02:30"}
594
+ {"current_steps": 594, "total_steps": 741, "loss": 0.0102, "lr": 3.162892359054098e-06, "epoch": 2.4056795131845843, "percentage": 80.16, "elapsed_time": "2 days, 4:20:58", "remaining_time": "12:57:18"}
595
+ {"current_steps": 595, "total_steps": 741, "loss": 0.0072, "lr": 3.12183844179316e-06, "epoch": 2.40973630831643, "percentage": 80.3, "elapsed_time": "2 days, 4:26:34", "remaining_time": "12:52:06"}
596
+ {"current_steps": 596, "total_steps": 741, "loss": 0.0079, "lr": 3.081021737048565e-06, "epoch": 2.413793103448276, "percentage": 80.43, "elapsed_time": "2 days, 4:31:42", "remaining_time": "12:46:46"}
597
+ {"current_steps": 597, "total_steps": 741, "loss": 0.0124, "lr": 3.040443059949264e-06, "epoch": 2.417849898580122, "percentage": 80.57, "elapsed_time": "2 days, 4:37:00", "remaining_time": "12:41:29"}
598
+ {"current_steps": 598, "total_steps": 741, "loss": 0.0108, "lr": 3.0001032208706653e-06, "epoch": 2.4219066937119678, "percentage": 80.7, "elapsed_time": "2 days, 4:42:18", "remaining_time": "12:36:12"}
599
+ {"current_steps": 599, "total_steps": 741, "loss": 0.0082, "lr": 2.960003025418478e-06, "epoch": 2.4259634888438133, "percentage": 80.84, "elapsed_time": "2 days, 4:47:36", "remaining_time": "12:30:55"}
600
+ {"current_steps": 600, "total_steps": 741, "loss": 0.0114, "lr": 2.9201432744126074e-06, "epoch": 2.4300202839756593, "percentage": 80.97, "elapsed_time": "2 days, 4:53:01", "remaining_time": "12:25:39"}