penfever commited on
Commit
0593b08
·
verified ·
1 Parent(s): e12489e

Training in progress, step 3000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbec013b144dcf4537dcc0cb49b39b50ea1642f7d7e17db9124392672d364b6a
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80ccf97e5064519a87c1be6f61380ab25bf51a1918a27412f634f4136a5f347
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9929d2a29fdac49e28fdf3f7b05e88804a195d1d0adb4ff97582dbee5fabf467
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d554f8af0e9ea83d896d2854baa30a8c1b13fce6b98da5dfb7713aa9bce54ee0
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80debb644701d5b4f166abc6bb3c6fa38a4d217499061ed0338ba12cb77b4395
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4289653c6d7d364c217765272a3ede2f06596a2e83aa283a97dea89187fcb114
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7638848eec93fa2e29b648acf6c430284cd6014231333f3e99e2bbb183dc5a61
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad098f743ecaaaa06191fec83efafe4d9dc3734e491e97d1ae75ea0c1afc0553
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -559,3 +559,42 @@
559
  {"current_steps": 2795, "total_steps": 4340, "loss": 0.4714, "lr": 1.356930668857941e-05, "epoch": 4.508064516129032, "percentage": 64.4, "elapsed_time": "13:47:05", "remaining_time": "7:37:11"}
560
  {"current_steps": 2800, "total_steps": 4340, "loss": 0.4697, "lr": 1.3493199979333053e-05, "epoch": 4.516129032258064, "percentage": 64.52, "elapsed_time": "13:48:28", "remaining_time": "7:35:39"}
561
  {"current_steps": 2805, "total_steps": 4340, "loss": 0.4619, "lr": 1.3417198500711801e-05, "epoch": 4.524193548387097, "percentage": 64.63, "elapsed_time": "13:51:13", "remaining_time": "7:34:52"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
559
  {"current_steps": 2795, "total_steps": 4340, "loss": 0.4714, "lr": 1.356930668857941e-05, "epoch": 4.508064516129032, "percentage": 64.4, "elapsed_time": "13:47:05", "remaining_time": "7:37:11"}
560
  {"current_steps": 2800, "total_steps": 4340, "loss": 0.4697, "lr": 1.3493199979333053e-05, "epoch": 4.516129032258064, "percentage": 64.52, "elapsed_time": "13:48:28", "remaining_time": "7:35:39"}
561
  {"current_steps": 2805, "total_steps": 4340, "loss": 0.4619, "lr": 1.3417198500711801e-05, "epoch": 4.524193548387097, "percentage": 64.63, "elapsed_time": "13:51:13", "remaining_time": "7:34:52"}
562
+ {"current_steps": 2810, "total_steps": 4340, "loss": 0.4494, "lr": 1.3341303481842566e-05, "epoch": 4.532258064516129, "percentage": 64.75, "elapsed_time": "13:52:42", "remaining_time": "7:33:23"}
563
+ {"current_steps": 2815, "total_steps": 4340, "loss": 0.449, "lr": 1.3265516150130577e-05, "epoch": 4.540322580645161, "percentage": 64.86, "elapsed_time": "13:54:04", "remaining_time": "7:31:51"}
564
+ {"current_steps": 2820, "total_steps": 4340, "loss": 0.4514, "lr": 1.318983773123948e-05, "epoch": 4.548387096774194, "percentage": 64.98, "elapsed_time": "13:55:55", "remaining_time": "7:30:34"}
565
+ {"current_steps": 2825, "total_steps": 4340, "loss": 0.4697, "lr": 1.311426944907154e-05, "epoch": 4.556451612903226, "percentage": 65.09, "elapsed_time": "13:57:15", "remaining_time": "7:29:00"}
566
+ {"current_steps": 2830, "total_steps": 4340, "loss": 0.449, "lr": 1.3038812525747859e-05, "epoch": 4.564516129032258, "percentage": 65.21, "elapsed_time": "13:58:35", "remaining_time": "7:27:26"}
567
+ {"current_steps": 2835, "total_steps": 4340, "loss": 0.4498, "lr": 1.2963468181588602e-05, "epoch": 4.57258064516129, "percentage": 65.32, "elapsed_time": "13:59:59", "remaining_time": "7:25:55"}
568
+ {"current_steps": 2840, "total_steps": 4340, "loss": 0.4554, "lr": 1.2888237635093233e-05, "epoch": 4.580645161290323, "percentage": 65.44, "elapsed_time": "14:01:29", "remaining_time": "7:24:26"}
569
+ {"current_steps": 2845, "total_steps": 4340, "loss": 0.4621, "lr": 1.2813122102920859e-05, "epoch": 4.588709677419355, "percentage": 65.55, "elapsed_time": "14:02:52", "remaining_time": "7:22:55"}
570
+ {"current_steps": 2850, "total_steps": 4340, "loss": 0.4697, "lr": 1.273812279987051e-05, "epoch": 4.596774193548387, "percentage": 65.67, "elapsed_time": "14:04:11", "remaining_time": "7:21:21"}
571
+ {"current_steps": 2855, "total_steps": 4340, "loss": 0.4634, "lr": 1.2663240938861526e-05, "epoch": 4.604838709677419, "percentage": 65.78, "elapsed_time": "14:05:30", "remaining_time": "7:19:47"}
572
+ {"current_steps": 2860, "total_steps": 4340, "loss": 0.4378, "lr": 1.2588477730913912e-05, "epoch": 4.612903225806452, "percentage": 65.9, "elapsed_time": "14:07:02", "remaining_time": "7:18:19"}
573
+ {"current_steps": 2865, "total_steps": 4340, "loss": 0.4721, "lr": 1.2513834385128783e-05, "epoch": 4.620967741935484, "percentage": 66.01, "elapsed_time": "14:08:18", "remaining_time": "7:16:44"}
574
+ {"current_steps": 2870, "total_steps": 4340, "loss": 0.4504, "lr": 1.2439312108668782e-05, "epoch": 4.629032258064516, "percentage": 66.13, "elapsed_time": "14:09:46", "remaining_time": "7:15:15"}
575
+ {"current_steps": 2875, "total_steps": 4340, "loss": 0.4633, "lr": 1.2364912106738567e-05, "epoch": 4.637096774193548, "percentage": 66.24, "elapsed_time": "14:11:17", "remaining_time": "7:13:47"}
576
+ {"current_steps": 2880, "total_steps": 4340, "loss": 0.4244, "lr": 1.2290635582565334e-05, "epoch": 4.645161290322581, "percentage": 66.36, "elapsed_time": "14:12:39", "remaining_time": "7:12:15"}
577
+ {"current_steps": 2885, "total_steps": 4340, "loss": 0.4361, "lr": 1.221648373737935e-05, "epoch": 4.653225806451613, "percentage": 66.47, "elapsed_time": "14:14:09", "remaining_time": "7:10:47"}
578
+ {"current_steps": 2890, "total_steps": 4340, "loss": 0.4351, "lr": 1.21424577703945e-05, "epoch": 4.661290322580645, "percentage": 66.59, "elapsed_time": "14:15:38", "remaining_time": "7:09:18"}
579
+ {"current_steps": 2895, "total_steps": 4340, "loss": 0.439, "lr": 1.2068558878788941e-05, "epoch": 4.669354838709677, "percentage": 66.71, "elapsed_time": "14:16:54", "remaining_time": "7:07:42"}
580
+ {"current_steps": 2900, "total_steps": 4340, "loss": 0.4435, "lr": 1.1994788257685693e-05, "epoch": 4.67741935483871, "percentage": 66.82, "elapsed_time": "14:18:25", "remaining_time": "7:06:15"}
581
+ {"current_steps": 2905, "total_steps": 4340, "loss": 0.4494, "lr": 1.192114710013335e-05, "epoch": 4.685483870967742, "percentage": 66.94, "elapsed_time": "14:19:37", "remaining_time": "7:04:38"}
582
+ {"current_steps": 2910, "total_steps": 4340, "loss": 0.4443, "lr": 1.1847636597086759e-05, "epoch": 4.693548387096774, "percentage": 67.05, "elapsed_time": "14:20:53", "remaining_time": "7:03:02"}
583
+ {"current_steps": 2915, "total_steps": 4340, "loss": 0.46, "lr": 1.1774257937387774e-05, "epoch": 4.701612903225806, "percentage": 67.17, "elapsed_time": "14:22:22", "remaining_time": "7:01:34"}
584
+ {"current_steps": 2920, "total_steps": 4340, "loss": 0.4584, "lr": 1.1701012307746021e-05, "epoch": 4.709677419354839, "percentage": 67.28, "elapsed_time": "14:23:44", "remaining_time": "7:00:02"}
585
+ {"current_steps": 2925, "total_steps": 4340, "loss": 0.4615, "lr": 1.1627900892719706e-05, "epoch": 4.717741935483871, "percentage": 67.4, "elapsed_time": "14:24:58", "remaining_time": "6:58:26"}
586
+ {"current_steps": 2930, "total_steps": 4340, "loss": 0.4449, "lr": 1.1554924874696471e-05, "epoch": 4.725806451612903, "percentage": 67.51, "elapsed_time": "14:26:36", "remaining_time": "6:57:02"}
587
+ {"current_steps": 2935, "total_steps": 4340, "loss": 0.4291, "lr": 1.1482085433874264e-05, "epoch": 4.733870967741936, "percentage": 67.63, "elapsed_time": "14:28:20", "remaining_time": "6:55:40"}
588
+ {"current_steps": 2940, "total_steps": 4340, "loss": 0.4556, "lr": 1.1409383748242246e-05, "epoch": 4.741935483870968, "percentage": 67.74, "elapsed_time": "14:29:45", "remaining_time": "6:54:10"}
589
+ {"current_steps": 2945, "total_steps": 4340, "loss": 0.4541, "lr": 1.133682099356173e-05, "epoch": 4.75, "percentage": 67.86, "elapsed_time": "14:31:03", "remaining_time": "6:52:36"}
590
+ {"current_steps": 2950, "total_steps": 4340, "loss": 0.4534, "lr": 1.12643983433472e-05, "epoch": 4.758064516129032, "percentage": 67.97, "elapsed_time": "14:32:27", "remaining_time": "6:51:05"}
591
+ {"current_steps": 2955, "total_steps": 4340, "loss": 0.4607, "lr": 1.1192116968847313e-05, "epoch": 4.766129032258064, "percentage": 68.09, "elapsed_time": "14:33:44", "remaining_time": "6:49:31"}
592
+ {"current_steps": 2960, "total_steps": 4340, "loss": 0.4464, "lr": 1.1119978039025959e-05, "epoch": 4.774193548387097, "percentage": 68.2, "elapsed_time": "14:35:11", "remaining_time": "6:48:01"}
593
+ {"current_steps": 2965, "total_steps": 4340, "loss": 0.4614, "lr": 1.1047982720543326e-05, "epoch": 4.782258064516129, "percentage": 68.32, "elapsed_time": "14:36:36", "remaining_time": "6:46:31"}
594
+ {"current_steps": 2970, "total_steps": 4340, "loss": 0.4585, "lr": 1.0976132177737098e-05, "epoch": 4.790322580645161, "percentage": 68.43, "elapsed_time": "14:38:04", "remaining_time": "6:45:02"}
595
+ {"current_steps": 2975, "total_steps": 4340, "loss": 0.4626, "lr": 1.090442757260357e-05, "epoch": 4.798387096774194, "percentage": 68.55, "elapsed_time": "14:39:38", "remaining_time": "6:43:36"}
596
+ {"current_steps": 2980, "total_steps": 4340, "loss": 0.4376, "lr": 1.083287006477888e-05, "epoch": 4.806451612903226, "percentage": 68.66, "elapsed_time": "14:41:24", "remaining_time": "6:42:14"}
597
+ {"current_steps": 2985, "total_steps": 4340, "loss": 0.4755, "lr": 1.0761460811520236e-05, "epoch": 4.814516129032258, "percentage": 68.78, "elapsed_time": "14:43:02", "remaining_time": "6:40:50"}
598
+ {"current_steps": 2990, "total_steps": 4340, "loss": 0.4748, "lr": 1.0690200967687234e-05, "epoch": 4.82258064516129, "percentage": 68.89, "elapsed_time": "14:44:30", "remaining_time": "6:39:21"}
599
+ {"current_steps": 2995, "total_steps": 4340, "loss": 0.4422, "lr": 1.0619091685723132e-05, "epoch": 4.830645161290323, "percentage": 69.01, "elapsed_time": "14:45:57", "remaining_time": "6:37:51"}
600
+ {"current_steps": 3000, "total_steps": 4340, "loss": 0.4447, "lr": 1.0548134115636262e-05, "epoch": 4.838709677419355, "percentage": 69.12, "elapsed_time": "14:47:14", "remaining_time": "6:36:18"}