penfever commited on
Commit
b9e799b
·
verified ·
1 Parent(s): cfb4977

Training in progress, step 1200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcfe4181fc7b759deeb934fd1ce7f0d05ed49aa95f26ddf5775be6cb73c50ecb
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e453f82279978e9d5e185e0d64cd77ed6a068f0133bd76ca39b4e77fb9240718
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12e7a8575d2a9e7bba697a929be56f4e3991c354c8d7a7dc9a10bcc014333eea
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:520d2a652ebbc6567d8b8af12a7e96bcfb7fd54e5aef4a7e1bc6072324ec6e80
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a6f68b339bf46be541e76ca3377d68ac5e841a508c9d87f5dcb51b114364676
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dba2387adc142dfcfc06e6b1a45aef0e9c5232e4c030800bc2193ab47603ccbd
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8e011e55455016c29dfa81be7772163b8ba53206178c3d01184d4bad298c8a3
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa0ceb73a64d57b374b39186ec1fd0cf785a153dc3ba7fdf209ceecde529a40
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -199,3 +199,43 @@
199
  {"current_steps": 995, "total_steps": 9128, "loss": 0.3149, "lr": 3.9990405553597644e-05, "epoch": 0.7633294975067128, "percentage": 10.9, "elapsed_time": "6:14:29", "remaining_time": "2 days, 3:01:06"}
200
  {"current_steps": 1000, "total_steps": 9128, "loss": 0.3559, "lr": 3.998918460547664e-05, "epoch": 0.7671653241273494, "percentage": 10.96, "elapsed_time": "6:16:10", "remaining_time": "2 days, 2:57:31"}
201
  {"current_steps": 1005, "total_steps": 9128, "loss": 0.3294, "lr": 3.998789057381739e-05, "epoch": 0.7710011507479861, "percentage": 11.01, "elapsed_time": "6:19:16", "remaining_time": "2 days, 3:05:32"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
199
  {"current_steps": 995, "total_steps": 9128, "loss": 0.3149, "lr": 3.9990405553597644e-05, "epoch": 0.7633294975067128, "percentage": 10.9, "elapsed_time": "6:14:29", "remaining_time": "2 days, 3:01:06"}
200
  {"current_steps": 1000, "total_steps": 9128, "loss": 0.3559, "lr": 3.998918460547664e-05, "epoch": 0.7671653241273494, "percentage": 10.96, "elapsed_time": "6:16:10", "remaining_time": "2 days, 2:57:31"}
201
  {"current_steps": 1005, "total_steps": 9128, "loss": 0.3294, "lr": 3.998789057381739e-05, "epoch": 0.7710011507479861, "percentage": 11.01, "elapsed_time": "6:19:16", "remaining_time": "2 days, 3:05:32"}
202
+ {"current_steps": 1010, "total_steps": 9128, "loss": 0.3392, "lr": 3.9986523463351075e-05, "epoch": 0.7748369773686229, "percentage": 11.06, "elapsed_time": "6:21:02", "remaining_time": "2 days, 3:02:38"}
203
+ {"current_steps": 1015, "total_steps": 9128, "loss": 0.3424, "lr": 3.998508327907605e-05, "epoch": 0.7786728039892596, "percentage": 11.12, "elapsed_time": "6:22:44", "remaining_time": "2 days, 2:59:20"}
204
+ {"current_steps": 1020, "total_steps": 9128, "loss": 0.3455, "lr": 3.9983570026257844e-05, "epoch": 0.7825086306098964, "percentage": 11.17, "elapsed_time": "6:24:27", "remaining_time": "2 days, 2:56:06"}
205
+ {"current_steps": 1025, "total_steps": 9128, "loss": 0.3372, "lr": 3.998198371042917e-05, "epoch": 0.7863444572305331, "percentage": 11.23, "elapsed_time": "6:26:08", "remaining_time": "2 days, 2:52:39"}
206
+ {"current_steps": 1030, "total_steps": 9128, "loss": 0.3219, "lr": 3.9980324337389824e-05, "epoch": 0.7901802838511699, "percentage": 11.28, "elapsed_time": "6:27:50", "remaining_time": "2 days, 2:49:15"}
207
+ {"current_steps": 1035, "total_steps": 9128, "loss": 0.3269, "lr": 3.9978591913206724e-05, "epoch": 0.7940161104718066, "percentage": 11.34, "elapsed_time": "6:29:25", "remaining_time": "2 days, 2:45:06"}
208
+ {"current_steps": 1040, "total_steps": 9128, "loss": 0.3324, "lr": 3.9976786444213895e-05, "epoch": 0.7978519370924434, "percentage": 11.39, "elapsed_time": "6:31:04", "remaining_time": "2 days, 2:41:19"}
209
+ {"current_steps": 1045, "total_steps": 9128, "loss": 0.325, "lr": 3.99749079370124e-05, "epoch": 0.8016877637130801, "percentage": 11.45, "elapsed_time": "6:32:46", "remaining_time": "2 days, 2:38:01"}
210
+ {"current_steps": 1050, "total_steps": 9128, "loss": 0.3119, "lr": 3.997295639847036e-05, "epoch": 0.8055235903337169, "percentage": 11.5, "elapsed_time": "6:34:25", "remaining_time": "2 days, 2:34:29"}
211
+ {"current_steps": 1055, "total_steps": 9128, "loss": 0.3201, "lr": 3.997093183572288e-05, "epoch": 0.8093594169543536, "percentage": 11.56, "elapsed_time": "6:36:03", "remaining_time": "2 days, 2:30:38"}
212
+ {"current_steps": 1060, "total_steps": 9128, "loss": 0.3328, "lr": 3.99688342561721e-05, "epoch": 0.8131952435749904, "percentage": 11.61, "elapsed_time": "6:37:41", "remaining_time": "2 days, 2:26:55"}
213
+ {"current_steps": 1065, "total_steps": 9128, "loss": 0.3542, "lr": 3.996666366748708e-05, "epoch": 0.8170310701956272, "percentage": 11.67, "elapsed_time": "6:39:20", "remaining_time": "2 days, 2:23:23"}
214
+ {"current_steps": 1070, "total_steps": 9128, "loss": 0.3265, "lr": 3.996442007760382e-05, "epoch": 0.8208668968162639, "percentage": 11.72, "elapsed_time": "6:40:58", "remaining_time": "2 days, 2:19:40"}
215
+ {"current_steps": 1075, "total_steps": 9128, "loss": 0.3408, "lr": 3.996210349472524e-05, "epoch": 0.8247027234369007, "percentage": 11.78, "elapsed_time": "6:42:37", "remaining_time": "2 days, 2:16:06"}
216
+ {"current_steps": 1080, "total_steps": 9128, "loss": 0.3203, "lr": 3.9959713927321125e-05, "epoch": 0.8285385500575374, "percentage": 11.83, "elapsed_time": "6:44:19", "remaining_time": "2 days, 2:12:54"}
217
+ {"current_steps": 1085, "total_steps": 9128, "loss": 0.332, "lr": 3.99572513841281e-05, "epoch": 0.8323743766781742, "percentage": 11.89, "elapsed_time": "6:46:02", "remaining_time": "2 days, 2:09:57"}
218
+ {"current_steps": 1090, "total_steps": 9128, "loss": 0.3246, "lr": 3.9954715874149596e-05, "epoch": 0.8362102032988109, "percentage": 11.94, "elapsed_time": "6:47:46", "remaining_time": "2 days, 2:07:02"}
219
+ {"current_steps": 1095, "total_steps": 9128, "loss": 0.3103, "lr": 3.9952107406655835e-05, "epoch": 0.8400460299194477, "percentage": 12.0, "elapsed_time": "6:49:30", "remaining_time": "2 days, 2:04:08"}
220
+ {"current_steps": 1100, "total_steps": 9128, "loss": 0.3397, "lr": 3.9949425991183775e-05, "epoch": 0.8438818565400844, "percentage": 12.05, "elapsed_time": "6:51:06", "remaining_time": "2 days, 2:00:20"}
221
+ {"current_steps": 1105, "total_steps": 9128, "loss": 0.322, "lr": 3.9946671637537084e-05, "epoch": 0.8477176831607212, "percentage": 12.11, "elapsed_time": "6:52:47", "remaining_time": "2 days, 1:57:08"}
222
+ {"current_steps": 1110, "total_steps": 9128, "loss": 0.3381, "lr": 3.99438443557861e-05, "epoch": 0.8515535097813579, "percentage": 12.16, "elapsed_time": "6:54:28", "remaining_time": "2 days, 1:53:56"}
223
+ {"current_steps": 1115, "total_steps": 9128, "loss": 0.3375, "lr": 3.9940944156267803e-05, "epoch": 0.8553893364019947, "percentage": 12.22, "elapsed_time": "6:56:08", "remaining_time": "2 days, 1:50:39"}
224
+ {"current_steps": 1120, "total_steps": 9128, "loss": 0.3316, "lr": 3.9937971049585766e-05, "epoch": 0.8592251630226314, "percentage": 12.27, "elapsed_time": "6:57:50", "remaining_time": "2 days, 1:47:31"}
225
+ {"current_steps": 1125, "total_steps": 9128, "loss": 0.3625, "lr": 3.9934925046610134e-05, "epoch": 0.8630609896432682, "percentage": 12.32, "elapsed_time": "6:59:28", "remaining_time": "2 days, 1:44:00"}
226
+ {"current_steps": 1130, "total_steps": 9128, "loss": 0.3292, "lr": 3.993180615847755e-05, "epoch": 0.8668968162639049, "percentage": 12.38, "elapsed_time": "7:01:03", "remaining_time": "2 days, 1:40:15"}
227
+ {"current_steps": 1135, "total_steps": 9128, "loss": 0.3383, "lr": 3.992861439659116e-05, "epoch": 0.8707326428845417, "percentage": 12.43, "elapsed_time": "7:02:48", "remaining_time": "2 days, 1:37:32"}
228
+ {"current_steps": 1140, "total_steps": 9128, "loss": 0.3422, "lr": 3.9925349772620536e-05, "epoch": 0.8745684695051784, "percentage": 12.49, "elapsed_time": "7:04:30", "remaining_time": "2 days, 1:34:31"}
229
+ {"current_steps": 1145, "total_steps": 9128, "loss": 0.3382, "lr": 3.992201229850164e-05, "epoch": 0.8784042961258152, "percentage": 12.54, "elapsed_time": "7:06:10", "remaining_time": "2 days, 1:31:17"}
230
+ {"current_steps": 1150, "total_steps": 9128, "loss": 0.339, "lr": 3.99186019864368e-05, "epoch": 0.8822401227464519, "percentage": 12.6, "elapsed_time": "7:07:57", "remaining_time": "2 days, 1:28:57"}
231
+ {"current_steps": 1155, "total_steps": 9128, "loss": 0.3371, "lr": 3.9915118848894633e-05, "epoch": 0.8860759493670886, "percentage": 12.65, "elapsed_time": "7:09:37", "remaining_time": "2 days, 1:25:42"}
232
+ {"current_steps": 1160, "total_steps": 9128, "loss": 0.3371, "lr": 3.991156289861004e-05, "epoch": 0.8899117759877253, "percentage": 12.71, "elapsed_time": "7:11:12", "remaining_time": "2 days, 1:21:59"}
233
+ {"current_steps": 1165, "total_steps": 9128, "loss": 0.3342, "lr": 3.9907934148584105e-05, "epoch": 0.8937476026083621, "percentage": 12.76, "elapsed_time": "7:12:52", "remaining_time": "2 days, 1:18:47"}
234
+ {"current_steps": 1170, "total_steps": 9128, "loss": 0.3266, "lr": 3.9904232612084104e-05, "epoch": 0.8975834292289988, "percentage": 12.82, "elapsed_time": "7:14:33", "remaining_time": "2 days, 1:15:43"}
235
+ {"current_steps": 1175, "total_steps": 9128, "loss": 0.3125, "lr": 3.990045830264343e-05, "epoch": 0.9014192558496356, "percentage": 12.87, "elapsed_time": "7:16:19", "remaining_time": "2 days, 1:13:13"}
236
+ {"current_steps": 1180, "total_steps": 9128, "loss": 0.3285, "lr": 3.989661123406154e-05, "epoch": 0.9052550824702723, "percentage": 12.93, "elapsed_time": "7:18:02", "remaining_time": "2 days, 1:10:26"}
237
+ {"current_steps": 1185, "total_steps": 9128, "loss": 0.3212, "lr": 3.9892691420403906e-05, "epoch": 0.9090909090909091, "percentage": 12.98, "elapsed_time": "7:19:45", "remaining_time": "2 days, 1:07:39"}
238
+ {"current_steps": 1190, "total_steps": 9128, "loss": 0.3373, "lr": 3.988869887600197e-05, "epoch": 0.9129267357115458, "percentage": 13.04, "elapsed_time": "7:21:21", "remaining_time": "2 days, 1:04:09"}
239
+ {"current_steps": 1195, "total_steps": 9128, "loss": 0.331, "lr": 3.988463361545309e-05, "epoch": 0.9167625623321826, "percentage": 13.09, "elapsed_time": "7:23:01", "remaining_time": "2 days, 1:01:00"}
240
+ {"current_steps": 1200, "total_steps": 9128, "loss": 0.326, "lr": 3.988049565362048e-05, "epoch": 0.9205983889528193, "percentage": 13.15, "elapsed_time": "7:24:41", "remaining_time": "2 days, 0:57:58"}
241
+ {"current_steps": 1205, "total_steps": 9128, "loss": 0.332, "lr": 3.987628500563318e-05, "epoch": 0.9244342155734561, "percentage": 13.2, "elapsed_time": "7:27:34", "remaining_time": "2 days, 1:02:47"}