penfever commited on
Commit
e12489e
·
verified ·
1 Parent(s): 9e8cb4f

Training in progress, step 2800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a375fe86d663ca4e5e17fcfc38cae241b677039228f4d00a63b2a53800fb68ad
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbec013b144dcf4537dcc0cb49b39b50ea1642f7d7e17db9124392672d364b6a
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa6ab39e372275385dcff9f8a0f79be2922242203fe5bf9a444dcbcbf564863d
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9929d2a29fdac49e28fdf3f7b05e88804a195d1d0adb4ff97582dbee5fabf467
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d64dc3d8afa7e6b0a9ee99b5a6d0248ec3d5a10a8f9dd7bdc20a3ddec0990939
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80debb644701d5b4f166abc6bb3c6fa38a4d217499061ed0338ba12cb77b4395
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9453cf53d89d8caaefabc9cafbee19e9d8b9420c3675b179fd429a000882092
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7638848eec93fa2e29b648acf6c430284cd6014231333f3e99e2bbb183dc5a61
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -518,3 +518,44 @@
518
  {"current_steps": 2590, "total_steps": 4340, "loss": 0.4384, "lr": 1.6764907452104352e-05, "epoch": 4.17741935483871, "percentage": 59.68, "elapsed_time": "12:46:52", "remaining_time": "8:38:09"}
519
  {"current_steps": 2595, "total_steps": 4340, "loss": 0.4482, "lr": 1.6685563087089597e-05, "epoch": 4.185483870967742, "percentage": 59.79, "elapsed_time": "12:48:13", "remaining_time": "8:36:35"}
520
  {"current_steps": 2600, "total_steps": 4340, "loss": 0.4447, "lr": 1.6606272324501087e-05, "epoch": 4.193548387096774, "percentage": 59.91, "elapsed_time": "12:49:51", "remaining_time": "8:35:12"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
518
  {"current_steps": 2590, "total_steps": 4340, "loss": 0.4384, "lr": 1.6764907452104352e-05, "epoch": 4.17741935483871, "percentage": 59.68, "elapsed_time": "12:46:52", "remaining_time": "8:38:09"}
519
  {"current_steps": 2595, "total_steps": 4340, "loss": 0.4482, "lr": 1.6685563087089597e-05, "epoch": 4.185483870967742, "percentage": 59.79, "elapsed_time": "12:48:13", "remaining_time": "8:36:35"}
520
  {"current_steps": 2600, "total_steps": 4340, "loss": 0.4447, "lr": 1.6606272324501087e-05, "epoch": 4.193548387096774, "percentage": 59.91, "elapsed_time": "12:49:51", "remaining_time": "8:35:12"}
521
+ {"current_steps": 2605, "total_steps": 4340, "loss": 0.4452, "lr": 1.6527036446661396e-05, "epoch": 4.201612903225806, "percentage": 60.02, "elapsed_time": "12:52:51", "remaining_time": "8:34:44"}
522
+ {"current_steps": 2610, "total_steps": 4340, "loss": 0.4642, "lr": 1.644785673500546e-05, "epoch": 4.209677419354839, "percentage": 60.14, "elapsed_time": "12:54:14", "remaining_time": "8:33:11"}
523
+ {"current_steps": 2615, "total_steps": 4340, "loss": 0.4363, "lr": 1.6368734470059902e-05, "epoch": 4.217741935483871, "percentage": 60.25, "elapsed_time": "12:55:44", "remaining_time": "8:31:43"}
524
+ {"current_steps": 2620, "total_steps": 4340, "loss": 0.4471, "lr": 1.628967093142226e-05, "epoch": 4.225806451612903, "percentage": 60.37, "elapsed_time": "12:57:00", "remaining_time": "8:30:05"}
525
+ {"current_steps": 2625, "total_steps": 4340, "loss": 0.4662, "lr": 1.6210667397740357e-05, "epoch": 4.233870967741935, "percentage": 60.48, "elapsed_time": "12:58:47", "remaining_time": "8:28:48"}
526
+ {"current_steps": 2630, "total_steps": 4340, "loss": 0.4491, "lr": 1.613172514669157e-05, "epoch": 4.241935483870968, "percentage": 60.6, "elapsed_time": "13:00:15", "remaining_time": "8:27:19"}
527
+ {"current_steps": 2635, "total_steps": 4340, "loss": 0.4597, "lr": 1.6052845454962195e-05, "epoch": 4.25, "percentage": 60.71, "elapsed_time": "13:01:52", "remaining_time": "8:25:55"}
528
+ {"current_steps": 2640, "total_steps": 4340, "loss": 0.4292, "lr": 1.5974029598226796e-05, "epoch": 4.258064516129032, "percentage": 60.83, "elapsed_time": "13:03:15", "remaining_time": "8:24:22"}
529
+ {"current_steps": 2645, "total_steps": 4340, "loss": 0.4437, "lr": 1.589527885112758e-05, "epoch": 4.266129032258064, "percentage": 60.94, "elapsed_time": "13:04:38", "remaining_time": "8:22:49"}
530
+ {"current_steps": 2650, "total_steps": 4340, "loss": 0.4569, "lr": 1.5816594487253752e-05, "epoch": 4.274193548387097, "percentage": 61.06, "elapsed_time": "13:06:00", "remaining_time": "8:21:15"}
531
+ {"current_steps": 2655, "total_steps": 4340, "loss": 0.458, "lr": 1.5737977779120957e-05, "epoch": 4.282258064516129, "percentage": 61.18, "elapsed_time": "13:07:22", "remaining_time": "8:19:42"}
532
+ {"current_steps": 2660, "total_steps": 4340, "loss": 0.4447, "lr": 1.5659429998150676e-05, "epoch": 4.290322580645161, "percentage": 61.29, "elapsed_time": "13:09:05", "remaining_time": "8:18:22"}
533
+ {"current_steps": 2665, "total_steps": 4340, "loss": 0.4656, "lr": 1.5580952414649683e-05, "epoch": 4.298387096774194, "percentage": 61.41, "elapsed_time": "13:10:26", "remaining_time": "8:16:48"}
534
+ {"current_steps": 2670, "total_steps": 4340, "loss": 0.469, "lr": 1.550254629778947e-05, "epoch": 4.306451612903226, "percentage": 61.52, "elapsed_time": "13:11:49", "remaining_time": "8:15:15"}
535
+ {"current_steps": 2675, "total_steps": 4340, "loss": 0.462, "lr": 1.5424212915585766e-05, "epoch": 4.314516129032258, "percentage": 61.64, "elapsed_time": "13:13:16", "remaining_time": "8:13:45"}
536
+ {"current_steps": 2680, "total_steps": 4340, "loss": 0.4372, "lr": 1.5345953534877986e-05, "epoch": 4.32258064516129, "percentage": 61.75, "elapsed_time": "13:14:33", "remaining_time": "8:12:09"}
537
+ {"current_steps": 2685, "total_steps": 4340, "loss": 0.4667, "lr": 1.5267769421308765e-05, "epoch": 4.330645161290323, "percentage": 61.87, "elapsed_time": "13:15:54", "remaining_time": "8:10:35"}
538
+ {"current_steps": 2690, "total_steps": 4340, "loss": 0.4482, "lr": 1.5189661839303493e-05, "epoch": 4.338709677419355, "percentage": 61.98, "elapsed_time": "13:17:18", "remaining_time": "8:09:03"}
539
+ {"current_steps": 2695, "total_steps": 4340, "loss": 0.444, "lr": 1.5111632052049872e-05, "epoch": 4.346774193548387, "percentage": 62.1, "elapsed_time": "13:18:36", "remaining_time": "8:07:27"}
540
+ {"current_steps": 2700, "total_steps": 4340, "loss": 0.4623, "lr": 1.5033681321477445e-05, "epoch": 4.354838709677419, "percentage": 62.21, "elapsed_time": "13:20:10", "remaining_time": "8:06:02"}
541
+ {"current_steps": 2705, "total_steps": 4340, "loss": 0.4743, "lr": 1.4955810908237247e-05, "epoch": 4.362903225806452, "percentage": 62.33, "elapsed_time": "13:21:32", "remaining_time": "8:04:28"}
542
+ {"current_steps": 2710, "total_steps": 4340, "loss": 0.4461, "lr": 1.4878022071681368e-05, "epoch": 4.370967741935484, "percentage": 62.44, "elapsed_time": "13:23:00", "remaining_time": "8:02:59"}
543
+ {"current_steps": 2715, "total_steps": 4340, "loss": 0.4631, "lr": 1.4800316069842623e-05, "epoch": 4.379032258064516, "percentage": 62.56, "elapsed_time": "13:24:21", "remaining_time": "8:01:25"}
544
+ {"current_steps": 2720, "total_steps": 4340, "loss": 0.4421, "lr": 1.4722694159414176e-05, "epoch": 4.387096774193548, "percentage": 62.67, "elapsed_time": "13:25:42", "remaining_time": "7:59:52"}
545
+ {"current_steps": 2725, "total_steps": 4340, "loss": 0.4618, "lr": 1.4645157595729247e-05, "epoch": 4.395161290322581, "percentage": 62.79, "elapsed_time": "13:27:05", "remaining_time": "7:58:19"}
546
+ {"current_steps": 2730, "total_steps": 4340, "loss": 0.4671, "lr": 1.4567707632740773e-05, "epoch": 4.403225806451613, "percentage": 62.9, "elapsed_time": "13:28:31", "remaining_time": "7:56:49"}
547
+ {"current_steps": 2735, "total_steps": 4340, "loss": 0.4462, "lr": 1.4490345523001155e-05, "epoch": 4.411290322580645, "percentage": 63.02, "elapsed_time": "13:29:50", "remaining_time": "7:55:14"}
548
+ {"current_steps": 2740, "total_steps": 4340, "loss": 0.4456, "lr": 1.4413072517642013e-05, "epoch": 4.419354838709677, "percentage": 63.13, "elapsed_time": "13:31:12", "remaining_time": "7:53:41"}
549
+ {"current_steps": 2745, "total_steps": 4340, "loss": 0.4404, "lr": 1.433588986635392e-05, "epoch": 4.42741935483871, "percentage": 63.25, "elapsed_time": "13:32:42", "remaining_time": "7:52:13"}
550
+ {"current_steps": 2750, "total_steps": 4340, "loss": 0.4585, "lr": 1.4258798817366202e-05, "epoch": 4.435483870967742, "percentage": 63.36, "elapsed_time": "13:34:06", "remaining_time": "7:50:42"}
551
+ {"current_steps": 2755, "total_steps": 4340, "loss": 0.4478, "lr": 1.418180061742677e-05, "epoch": 4.443548387096774, "percentage": 63.48, "elapsed_time": "13:35:24", "remaining_time": "7:49:07"}
552
+ {"current_steps": 2760, "total_steps": 4340, "loss": 0.467, "lr": 1.4104896511781916e-05, "epoch": 4.451612903225806, "percentage": 63.59, "elapsed_time": "13:36:43", "remaining_time": "7:47:32"}
553
+ {"current_steps": 2765, "total_steps": 4340, "loss": 0.4693, "lr": 1.4028087744156239e-05, "epoch": 4.459677419354839, "percentage": 63.71, "elapsed_time": "13:38:24", "remaining_time": "7:46:10"}
554
+ {"current_steps": 2770, "total_steps": 4340, "loss": 0.4364, "lr": 1.3951375556732459e-05, "epoch": 4.467741935483871, "percentage": 63.82, "elapsed_time": "13:40:04", "remaining_time": "7:44:48"}
555
+ {"current_steps": 2775, "total_steps": 4340, "loss": 0.451, "lr": 1.3874761190131371e-05, "epoch": 4.475806451612903, "percentage": 63.94, "elapsed_time": "13:41:29", "remaining_time": "7:43:17"}
556
+ {"current_steps": 2780, "total_steps": 4340, "loss": 0.4559, "lr": 1.3798245883391788e-05, "epoch": 4.483870967741936, "percentage": 64.06, "elapsed_time": "13:42:55", "remaining_time": "7:41:47"}
557
+ {"current_steps": 2785, "total_steps": 4340, "loss": 0.4385, "lr": 1.3721830873950457e-05, "epoch": 4.491935483870968, "percentage": 64.17, "elapsed_time": "13:44:18", "remaining_time": "7:40:15"}
558
+ {"current_steps": 2790, "total_steps": 4340, "loss": 0.4466, "lr": 1.3645517397622104e-05, "epoch": 4.5, "percentage": 64.29, "elapsed_time": "13:45:46", "remaining_time": "7:38:46"}
559
+ {"current_steps": 2795, "total_steps": 4340, "loss": 0.4714, "lr": 1.356930668857941e-05, "epoch": 4.508064516129032, "percentage": 64.4, "elapsed_time": "13:47:05", "remaining_time": "7:37:11"}
560
+ {"current_steps": 2800, "total_steps": 4340, "loss": 0.4697, "lr": 1.3493199979333053e-05, "epoch": 4.516129032258064, "percentage": 64.52, "elapsed_time": "13:48:28", "remaining_time": "7:35:39"}
561
+ {"current_steps": 2805, "total_steps": 4340, "loss": 0.4619, "lr": 1.3417198500711801e-05, "epoch": 4.524193548387097, "percentage": 64.63, "elapsed_time": "13:51:13", "remaining_time": "7:34:52"}