penfever commited on
Commit
d72fdb4
·
verified ·
1 Parent(s): 268d806

Training in progress, step 4800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d87a7a4cee62628d96e1920a34e3347c96ec250da2fe8b723901339950401199
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7f3d2f8d384c0d660fbb543a28b9c91984de1ef75d94e8eff5c58d5ef9a06f
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4e5b62841210439d615f38d96fc5bdaa5318a67fe6f5a93c3fb0d81c017fb91
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ba6c4b46758365285f10242153d40e33cecff6b9084525fcd20d7b516774c0a
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6e4efe7126d7c45a26b1a2faae6a692d9840c9cb7b78c63668c3ee3d83298af
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c6cccc1551ef32e2defb82b76cab7216fa2b319151b61ce14a90679ef16e52
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87e158475ac233b3ee6b74734fbc77f3306fd93d226b59d3ea31e47c8b55630b
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75b6dd8211aec9d23f26329a57bb11423ad8559f5f1ed07201c5c1cea20944f3
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -920,3 +920,44 @@
920
  {"current_steps": 4590, "total_steps": 6188, "loss": 0.1399, "lr": 7.599633761856542e-06, "epoch": 5.193548387096774, "percentage": 74.18, "elapsed_time": "11:39:25", "remaining_time": "4:03:30"}
921
  {"current_steps": 4595, "total_steps": 6188, "loss": 0.134, "lr": 7.555422889141997e-06, "epoch": 5.1992076966610075, "percentage": 74.26, "elapsed_time": "11:42:32", "remaining_time": "4:03:33"}
922
  {"current_steps": 4600, "total_steps": 6188, "loss": 0.1596, "lr": 7.51131102326154e-06, "epoch": 5.204867006225241, "percentage": 74.34, "elapsed_time": "11:45:34", "remaining_time": "4:03:34"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
920
  {"current_steps": 4590, "total_steps": 6188, "loss": 0.1399, "lr": 7.599633761856542e-06, "epoch": 5.193548387096774, "percentage": 74.18, "elapsed_time": "11:39:25", "remaining_time": "4:03:30"}
921
  {"current_steps": 4595, "total_steps": 6188, "loss": 0.134, "lr": 7.555422889141997e-06, "epoch": 5.1992076966610075, "percentage": 74.26, "elapsed_time": "11:42:32", "remaining_time": "4:03:33"}
922
  {"current_steps": 4600, "total_steps": 6188, "loss": 0.1596, "lr": 7.51131102326154e-06, "epoch": 5.204867006225241, "percentage": 74.34, "elapsed_time": "11:45:34", "remaining_time": "4:03:34"}
923
+ {"current_steps": 4605, "total_steps": 6188, "loss": 0.1571, "lr": 7.467298515161305e-06, "epoch": 5.2105263157894735, "percentage": 74.42, "elapsed_time": "11:49:37", "remaining_time": "4:03:56"}
924
+ {"current_steps": 4610, "total_steps": 6188, "loss": 0.1484, "lr": 7.423385714996942e-06, "epoch": 5.216185625353707, "percentage": 74.5, "elapsed_time": "11:52:36", "remaining_time": "4:03:55"}
925
+ {"current_steps": 4615, "total_steps": 6188, "loss": 0.1486, "lr": 7.379572972130864e-06, "epoch": 5.22184493491794, "percentage": 74.58, "elapsed_time": "11:55:21", "remaining_time": "4:03:49"}
926
+ {"current_steps": 4620, "total_steps": 6188, "loss": 0.139, "lr": 7.335860635129426e-06, "epoch": 5.227504244482173, "percentage": 74.66, "elapsed_time": "11:58:20", "remaining_time": "4:03:47"}
927
+ {"current_steps": 4625, "total_steps": 6188, "loss": 0.1521, "lr": 7.292249051760169e-06, "epoch": 5.233163554046406, "percentage": 74.74, "elapsed_time": "12:01:14", "remaining_time": "4:03:44"}
928
+ {"current_steps": 4630, "total_steps": 6188, "loss": 0.1565, "lr": 7.2487385689890845e-06, "epoch": 5.23882286361064, "percentage": 74.82, "elapsed_time": "12:04:02", "remaining_time": "4:03:38"}
929
+ {"current_steps": 4635, "total_steps": 6188, "loss": 0.1433, "lr": 7.205329532977794e-06, "epoch": 5.244482173174872, "percentage": 74.9, "elapsed_time": "12:06:53", "remaining_time": "4:03:33"}
930
+ {"current_steps": 4640, "total_steps": 6188, "loss": 0.1583, "lr": 7.162022289080837e-06, "epoch": 5.250141482739106, "percentage": 74.98, "elapsed_time": "12:09:41", "remaining_time": "4:03:26"}
931
+ {"current_steps": 4645, "total_steps": 6188, "loss": 0.1401, "lr": 7.1188171818429256e-06, "epoch": 5.255800792303339, "percentage": 75.06, "elapsed_time": "12:12:32", "remaining_time": "4:03:20"}
932
+ {"current_steps": 4650, "total_steps": 6188, "loss": 0.129, "lr": 7.075714554996176e-06, "epoch": 5.261460101867572, "percentage": 75.15, "elapsed_time": "12:15:30", "remaining_time": "4:03:16"}
933
+ {"current_steps": 4655, "total_steps": 6188, "loss": 0.1314, "lr": 7.032714751457395e-06, "epoch": 5.267119411431805, "percentage": 75.23, "elapsed_time": "12:18:35", "remaining_time": "4:03:14"}
934
+ {"current_steps": 4660, "total_steps": 6188, "loss": 0.136, "lr": 6.989818113325333e-06, "epoch": 5.272778720996039, "percentage": 75.31, "elapsed_time": "12:21:39", "remaining_time": "4:03:11"}
935
+ {"current_steps": 4665, "total_steps": 6188, "loss": 0.1506, "lr": 6.947024981878001e-06, "epoch": 5.278438030560272, "percentage": 75.39, "elapsed_time": "12:24:32", "remaining_time": "4:03:04"}
936
+ {"current_steps": 4670, "total_steps": 6188, "loss": 0.1758, "lr": 6.904335697569909e-06, "epoch": 5.284097340124505, "percentage": 75.47, "elapsed_time": "12:27:09", "remaining_time": "4:02:52"}
937
+ {"current_steps": 4675, "total_steps": 6188, "loss": 0.1618, "lr": 6.861750600029373e-06, "epoch": 5.289756649688738, "percentage": 75.55, "elapsed_time": "12:30:09", "remaining_time": "4:02:46"}
938
+ {"current_steps": 4680, "total_steps": 6188, "loss": 0.1416, "lr": 6.819270028055844e-06, "epoch": 5.2954159592529715, "percentage": 75.63, "elapsed_time": "12:33:06", "remaining_time": "4:02:40"}
939
+ {"current_steps": 4685, "total_steps": 6188, "loss": 0.1499, "lr": 6.776894319617162e-06, "epoch": 5.301075268817204, "percentage": 75.71, "elapsed_time": "12:36:08", "remaining_time": "4:02:34"}
940
+ {"current_steps": 4690, "total_steps": 6188, "loss": 0.1537, "lr": 6.73462381184689e-06, "epoch": 5.3067345783814375, "percentage": 75.79, "elapsed_time": "12:39:11", "remaining_time": "4:02:29"}
941
+ {"current_steps": 4695, "total_steps": 6188, "loss": 0.164, "lr": 6.6924588410416604e-06, "epoch": 5.312393887945671, "percentage": 75.87, "elapsed_time": "12:42:18", "remaining_time": "4:02:24"}
942
+ {"current_steps": 4700, "total_steps": 6188, "loss": 0.1495, "lr": 6.650399742658442e-06, "epoch": 5.3180531975099035, "percentage": 75.95, "elapsed_time": "12:45:23", "remaining_time": "4:02:19"}
943
+ {"current_steps": 4705, "total_steps": 6188, "loss": 0.1542, "lr": 6.608446851311918e-06, "epoch": 5.323712507074137, "percentage": 76.03, "elapsed_time": "12:48:23", "remaining_time": "4:02:11"}
944
+ {"current_steps": 4710, "total_steps": 6188, "loss": 0.1459, "lr": 6.566600500771796e-06, "epoch": 5.32937181663837, "percentage": 76.12, "elapsed_time": "12:51:26", "remaining_time": "4:02:04"}
945
+ {"current_steps": 4715, "total_steps": 6188, "loss": 0.1386, "lr": 6.524861023960185e-06, "epoch": 5.335031126202603, "percentage": 76.2, "elapsed_time": "12:54:28", "remaining_time": "4:01:57"}
946
+ {"current_steps": 4720, "total_steps": 6188, "loss": 0.1724, "lr": 6.483228752948902e-06, "epoch": 5.340690435766836, "percentage": 76.28, "elapsed_time": "12:57:31", "remaining_time": "4:01:49"}
947
+ {"current_steps": 4725, "total_steps": 6188, "loss": 0.1696, "lr": 6.441704018956858e-06, "epoch": 5.34634974533107, "percentage": 76.36, "elapsed_time": "13:00:36", "remaining_time": "4:01:41"}
948
+ {"current_steps": 4730, "total_steps": 6188, "loss": 0.1401, "lr": 6.400287152347442e-06, "epoch": 5.352009054895303, "percentage": 76.44, "elapsed_time": "13:03:41", "remaining_time": "4:01:34"}
949
+ {"current_steps": 4735, "total_steps": 6188, "loss": 0.1504, "lr": 6.35897848262584e-06, "epoch": 5.357668364459536, "percentage": 76.52, "elapsed_time": "13:06:34", "remaining_time": "4:01:22"}
950
+ {"current_steps": 4740, "total_steps": 6188, "loss": 0.152, "lr": 6.317778338436449e-06, "epoch": 5.363327674023769, "percentage": 76.6, "elapsed_time": "13:09:37", "remaining_time": "4:01:13"}
951
+ {"current_steps": 4745, "total_steps": 6188, "loss": 0.1324, "lr": 6.276687047560275e-06, "epoch": 5.368986983588003, "percentage": 76.68, "elapsed_time": "13:12:40", "remaining_time": "4:01:03"}
952
+ {"current_steps": 4750, "total_steps": 6188, "loss": 0.1436, "lr": 6.235704936912288e-06, "epoch": 5.374646293152235, "percentage": 76.76, "elapsed_time": "13:15:43", "remaining_time": "4:00:53"}
953
+ {"current_steps": 4755, "total_steps": 6188, "loss": 0.1362, "lr": 6.194832332538838e-06, "epoch": 5.380305602716469, "percentage": 76.84, "elapsed_time": "13:18:49", "remaining_time": "4:00:44"}
954
+ {"current_steps": 4760, "total_steps": 6188, "loss": 0.1408, "lr": 6.154069559615081e-06, "epoch": 5.385964912280702, "percentage": 76.92, "elapsed_time": "13:21:48", "remaining_time": "4:00:32"}
955
+ {"current_steps": 4765, "total_steps": 6188, "loss": 0.1393, "lr": 6.113416942442358e-06, "epoch": 5.391624221844935, "percentage": 77.0, "elapsed_time": "13:24:46", "remaining_time": "4:00:20"}
956
+ {"current_steps": 4770, "total_steps": 6188, "loss": 0.1474, "lr": 6.072874804445632e-06, "epoch": 5.397283531409168, "percentage": 77.08, "elapsed_time": "13:27:46", "remaining_time": "4:00:07"}
957
+ {"current_steps": 4775, "total_steps": 6188, "loss": 0.1386, "lr": 6.032443468170912e-06, "epoch": 5.4029428409734015, "percentage": 77.17, "elapsed_time": "13:30:51", "remaining_time": "3:59:56"}
958
+ {"current_steps": 4780, "total_steps": 6188, "loss": 0.1414, "lr": 5.992123255282702e-06, "epoch": 5.408602150537634, "percentage": 77.25, "elapsed_time": "13:33:55", "remaining_time": "3:59:45"}
959
+ {"current_steps": 4785, "total_steps": 6188, "loss": 0.1563, "lr": 5.951914486561417e-06, "epoch": 5.4142614601018675, "percentage": 77.33, "elapsed_time": "13:36:59", "remaining_time": "3:59:33"}
960
+ {"current_steps": 4790, "total_steps": 6188, "loss": 0.1556, "lr": 5.911817481900832e-06, "epoch": 5.419920769666101, "percentage": 77.41, "elapsed_time": "13:40:02", "remaining_time": "3:59:20"}
961
+ {"current_steps": 4795, "total_steps": 6188, "loss": 0.127, "lr": 5.871832560305573e-06, "epoch": 5.425580079230334, "percentage": 77.49, "elapsed_time": "13:42:20", "remaining_time": "3:58:53"}
962
+ {"current_steps": 4800, "total_steps": 6188, "loss": 0.0822, "lr": 5.831960039888533e-06, "epoch": 5.431239388794567, "percentage": 77.57, "elapsed_time": "13:43:57", "remaining_time": "3:58:15"}
963
+ {"current_steps": 4805, "total_steps": 6188, "loss": 0.0748, "lr": 5.792200237868361e-06, "epoch": 5.4368986983588, "percentage": 77.65, "elapsed_time": "13:46:48", "remaining_time": "3:57:58"}