penfever commited on
Commit
59388d6
·
verified ·
1 Parent(s): 08525da

Training in progress, step 4800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd35ed7a08c4ac5684fe35fa888fef480ed5a304be0aa449ff5243d7cf1e552a
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb7f623166ead846e0aae0c5e7d83408e076584b0ff987a124987f773daa30ae
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff26eb49980efe71ba0fa836bbf7d65212f5da40760c07ebcd44efe30b4290d2
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:756278cacc3e9d6758d821f6722ce104f12debe3b65a7cdc71977341b86abb8b
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab3518a489ed1c8c9a661fa548187c488724dd12c8026040f41f8f3e0a2e6021
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60aaba5e2c9bfdfb9a308cd14bef1289f822349e769312997d43f4d5983208bd
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:162a307cb2095e3e71fc8e111036033fefcaa8b78104c311412d5a37f81317f2
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8277d0aaf833745caa86ba464e1c1ce96b0746b25e187961918c81f0b8e3c3af
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -923,3 +923,43 @@
923
  {"current_steps": 4590, "total_steps": 6188, "loss": 0.076, "lr": 7.599633761856542e-06, "epoch": 5.193548387096774, "percentage": 74.18, "elapsed_time": "11:10:03", "remaining_time": "3:53:16"}
924
  {"current_steps": 4595, "total_steps": 6188, "loss": 0.0763, "lr": 7.555422889141997e-06, "epoch": 5.1992076966610075, "percentage": 74.26, "elapsed_time": "11:11:49", "remaining_time": "3:52:54"}
925
  {"current_steps": 4600, "total_steps": 6188, "loss": 0.0702, "lr": 7.51131102326154e-06, "epoch": 5.204867006225241, "percentage": 74.34, "elapsed_time": "11:13:21", "remaining_time": "3:52:27"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
923
  {"current_steps": 4590, "total_steps": 6188, "loss": 0.076, "lr": 7.599633761856542e-06, "epoch": 5.193548387096774, "percentage": 74.18, "elapsed_time": "11:10:03", "remaining_time": "3:53:16"}
924
  {"current_steps": 4595, "total_steps": 6188, "loss": 0.0763, "lr": 7.555422889141997e-06, "epoch": 5.1992076966610075, "percentage": 74.26, "elapsed_time": "11:11:49", "remaining_time": "3:52:54"}
925
  {"current_steps": 4600, "total_steps": 6188, "loss": 0.0702, "lr": 7.51131102326154e-06, "epoch": 5.204867006225241, "percentage": 74.34, "elapsed_time": "11:13:21", "remaining_time": "3:52:27"}
926
+ {"current_steps": 4605, "total_steps": 6188, "loss": 0.0782, "lr": 7.467298515161305e-06, "epoch": 5.2105263157894735, "percentage": 74.42, "elapsed_time": "11:16:11", "remaining_time": "3:52:26"}
927
+ {"current_steps": 4610, "total_steps": 6188, "loss": 0.0688, "lr": 7.423385714996942e-06, "epoch": 5.216185625353707, "percentage": 74.5, "elapsed_time": "11:17:47", "remaining_time": "3:52:00"}
928
+ {"current_steps": 4615, "total_steps": 6188, "loss": 0.1083, "lr": 7.379572972130864e-06, "epoch": 5.22184493491794, "percentage": 74.58, "elapsed_time": "11:19:45", "remaining_time": "3:51:41"}
929
+ {"current_steps": 4620, "total_steps": 6188, "loss": 0.0639, "lr": 7.335860635129426e-06, "epoch": 5.227504244482173, "percentage": 74.66, "elapsed_time": "11:21:19", "remaining_time": "3:51:14"}
930
+ {"current_steps": 4625, "total_steps": 6188, "loss": 0.0681, "lr": 7.292249051760169e-06, "epoch": 5.233163554046406, "percentage": 74.74, "elapsed_time": "11:22:54", "remaining_time": "3:50:47"}
931
+ {"current_steps": 4630, "total_steps": 6188, "loss": 0.0672, "lr": 7.2487385689890845e-06, "epoch": 5.23882286361064, "percentage": 74.82, "elapsed_time": "11:24:30", "remaining_time": "3:50:20"}
932
+ {"current_steps": 4635, "total_steps": 6188, "loss": 0.1126, "lr": 7.205329532977794e-06, "epoch": 5.244482173174872, "percentage": 74.9, "elapsed_time": "11:26:53", "remaining_time": "3:50:08"}
933
+ {"current_steps": 4640, "total_steps": 6188, "loss": 0.0758, "lr": 7.162022289080837e-06, "epoch": 5.250141482739106, "percentage": 74.98, "elapsed_time": "11:28:31", "remaining_time": "3:49:42"}
934
+ {"current_steps": 4645, "total_steps": 6188, "loss": 0.1059, "lr": 7.1188171818429256e-06, "epoch": 5.255800792303339, "percentage": 75.06, "elapsed_time": "11:30:18", "remaining_time": "3:49:18"}
935
+ {"current_steps": 4650, "total_steps": 6188, "loss": 0.0756, "lr": 7.075714554996176e-06, "epoch": 5.261460101867572, "percentage": 75.15, "elapsed_time": "11:31:53", "remaining_time": "3:48:50"}
936
+ {"current_steps": 4655, "total_steps": 6188, "loss": 0.0997, "lr": 7.032714751457395e-06, "epoch": 5.267119411431805, "percentage": 75.23, "elapsed_time": "11:33:48", "remaining_time": "3:48:29"}
937
+ {"current_steps": 4660, "total_steps": 6188, "loss": 0.1043, "lr": 6.989818113325333e-06, "epoch": 5.272778720996039, "percentage": 75.31, "elapsed_time": "11:35:30", "remaining_time": "3:48:03"}
938
+ {"current_steps": 4665, "total_steps": 6188, "loss": 0.1036, "lr": 6.947024981878001e-06, "epoch": 5.278438030560272, "percentage": 75.39, "elapsed_time": "11:37:09", "remaining_time": "3:47:36"}
939
+ {"current_steps": 4670, "total_steps": 6188, "loss": 0.0755, "lr": 6.904335697569909e-06, "epoch": 5.284097340124505, "percentage": 75.47, "elapsed_time": "11:38:41", "remaining_time": "3:47:06"}
940
+ {"current_steps": 4675, "total_steps": 6188, "loss": 0.0835, "lr": 6.861750600029373e-06, "epoch": 5.289756649688738, "percentage": 75.55, "elapsed_time": "11:40:27", "remaining_time": "3:46:41"}
941
+ {"current_steps": 4680, "total_steps": 6188, "loss": 0.0804, "lr": 6.819270028055844e-06, "epoch": 5.2954159592529715, "percentage": 75.63, "elapsed_time": "11:42:35", "remaining_time": "3:46:23"}
942
+ {"current_steps": 4685, "total_steps": 6188, "loss": 0.0685, "lr": 6.776894319617162e-06, "epoch": 5.301075268817204, "percentage": 75.71, "elapsed_time": "11:44:22", "remaining_time": "3:45:58"}
943
+ {"current_steps": 4690, "total_steps": 6188, "loss": 0.0649, "lr": 6.73462381184689e-06, "epoch": 5.3067345783814375, "percentage": 75.79, "elapsed_time": "11:46:17", "remaining_time": "3:45:35"}
944
+ {"current_steps": 4695, "total_steps": 6188, "loss": 0.0772, "lr": 6.6924588410416604e-06, "epoch": 5.312393887945671, "percentage": 75.87, "elapsed_time": "11:47:58", "remaining_time": "3:45:08"}
945
+ {"current_steps": 4700, "total_steps": 6188, "loss": 0.0897, "lr": 6.650399742658442e-06, "epoch": 5.3180531975099035, "percentage": 75.95, "elapsed_time": "11:50:22", "remaining_time": "3:44:53"}
946
+ {"current_steps": 4705, "total_steps": 6188, "loss": 0.0864, "lr": 6.608446851311918e-06, "epoch": 5.323712507074137, "percentage": 76.03, "elapsed_time": "11:51:56", "remaining_time": "3:44:24"}
947
+ {"current_steps": 4710, "total_steps": 6188, "loss": 0.08, "lr": 6.566600500771796e-06, "epoch": 5.32937181663837, "percentage": 76.12, "elapsed_time": "11:53:31", "remaining_time": "3:43:54"}
948
+ {"current_steps": 4715, "total_steps": 6188, "loss": 0.0701, "lr": 6.524861023960185e-06, "epoch": 5.335031126202603, "percentage": 76.2, "elapsed_time": "11:55:11", "remaining_time": "3:43:25"}
949
+ {"current_steps": 4720, "total_steps": 6188, "loss": 0.0816, "lr": 6.483228752948902e-06, "epoch": 5.340690435766836, "percentage": 76.28, "elapsed_time": "11:56:58", "remaining_time": "3:42:59"}
950
+ {"current_steps": 4725, "total_steps": 6188, "loss": 0.0676, "lr": 6.441704018956858e-06, "epoch": 5.34634974533107, "percentage": 76.36, "elapsed_time": "11:58:31", "remaining_time": "3:42:28"}
951
+ {"current_steps": 4730, "total_steps": 6188, "loss": 0.0773, "lr": 6.400287152347442e-06, "epoch": 5.352009054895303, "percentage": 76.44, "elapsed_time": "12:00:10", "remaining_time": "3:41:59"}
952
+ {"current_steps": 4735, "total_steps": 6188, "loss": 0.0745, "lr": 6.35897848262584e-06, "epoch": 5.357668364459536, "percentage": 76.52, "elapsed_time": "12:01:47", "remaining_time": "3:41:29"}
953
+ {"current_steps": 4740, "total_steps": 6188, "loss": 0.0754, "lr": 6.317778338436449e-06, "epoch": 5.363327674023769, "percentage": 76.6, "elapsed_time": "12:03:24", "remaining_time": "3:40:59"}
954
+ {"current_steps": 4745, "total_steps": 6188, "loss": 0.0923, "lr": 6.276687047560275e-06, "epoch": 5.368986983588003, "percentage": 76.68, "elapsed_time": "12:05:16", "remaining_time": "3:40:33"}
955
+ {"current_steps": 4750, "total_steps": 6188, "loss": 0.0736, "lr": 6.235704936912288e-06, "epoch": 5.374646293152235, "percentage": 76.76, "elapsed_time": "12:06:46", "remaining_time": "3:40:01"}
956
+ {"current_steps": 4755, "total_steps": 6188, "loss": 0.084, "lr": 6.194832332538838e-06, "epoch": 5.380305602716469, "percentage": 76.84, "elapsed_time": "12:08:17", "remaining_time": "3:39:28"}
957
+ {"current_steps": 4760, "total_steps": 6188, "loss": 0.0999, "lr": 6.154069559615081e-06, "epoch": 5.385964912280702, "percentage": 76.92, "elapsed_time": "12:10:16", "remaining_time": "3:39:05"}
958
+ {"current_steps": 4765, "total_steps": 6188, "loss": 0.0752, "lr": 6.113416942442358e-06, "epoch": 5.391624221844935, "percentage": 77.0, "elapsed_time": "12:11:53", "remaining_time": "3:38:34"}
959
+ {"current_steps": 4770, "total_steps": 6188, "loss": 0.067, "lr": 6.072874804445632e-06, "epoch": 5.397283531409168, "percentage": 77.08, "elapsed_time": "12:13:27", "remaining_time": "3:38:02"}
960
+ {"current_steps": 4775, "total_steps": 6188, "loss": 0.0818, "lr": 6.032443468170912e-06, "epoch": 5.4029428409734015, "percentage": 77.17, "elapsed_time": "12:15:10", "remaining_time": "3:37:32"}
961
+ {"current_steps": 4780, "total_steps": 6188, "loss": 0.0905, "lr": 5.992123255282702e-06, "epoch": 5.408602150537634, "percentage": 77.25, "elapsed_time": "12:17:04", "remaining_time": "3:37:06"}
962
+ {"current_steps": 4785, "total_steps": 6188, "loss": 0.0593, "lr": 5.951914486561417e-06, "epoch": 5.4142614601018675, "percentage": 77.33, "elapsed_time": "12:18:35", "remaining_time": "3:36:33"}
963
+ {"current_steps": 4790, "total_steps": 6188, "loss": 0.0799, "lr": 5.911817481900832e-06, "epoch": 5.419920769666101, "percentage": 77.41, "elapsed_time": "12:20:40", "remaining_time": "3:36:10"}
964
+ {"current_steps": 4795, "total_steps": 6188, "loss": 0.0697, "lr": 5.871832560305573e-06, "epoch": 5.425580079230334, "percentage": 77.49, "elapsed_time": "12:22:24", "remaining_time": "3:35:40"}
965
+ {"current_steps": 4800, "total_steps": 6188, "loss": 0.0614, "lr": 5.831960039888533e-06, "epoch": 5.431239388794567, "percentage": 77.57, "elapsed_time": "12:24:03", "remaining_time": "3:35:09"}