adpretko committed on
Commit
b28dbc7
·
verified ·
1 Parent(s): 0feed32

Training in progress, step 500

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. trainer_log.jsonl +10 -0
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c09cdb94a6220a32cbc706fe1a889c090b238965f9c0f66070fa8314ba622398
3
  size 3554214752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:903c5490ebce41703da16f896f150df930552515c55bfaf6c462b5f687fa5beb
3
  size 3554214752
trainer_log.jsonl CHANGED
@@ -38,3 +38,13 @@
38
  {"current_steps": 380, "total_steps": 3886, "loss": 0.0129, "lr": 1.9485861182519282e-05, "epoch": 0.19559902200489, "percentage": 9.78, "elapsed_time": "5:58:28", "remaining_time": "2 days, 7:07:20"}
39
  {"current_steps": 390, "total_steps": 3886, "loss": 0.0131, "lr": 2e-05, "epoch": 0.20074636468922918, "percentage": 10.04, "elapsed_time": "6:07:42", "remaining_time": "2 days, 6:56:11"}
40
  {"current_steps": 400, "total_steps": 3886, "loss": 0.0135, "lr": 1.999959647024453e-05, "epoch": 0.2058937073735684, "percentage": 10.29, "elapsed_time": "6:16:59", "remaining_time": "2 days, 6:45:26"}
 
 
 
 
 
 
 
 
 
 
 
38
  {"current_steps": 380, "total_steps": 3886, "loss": 0.0129, "lr": 1.9485861182519282e-05, "epoch": 0.19559902200489, "percentage": 9.78, "elapsed_time": "5:58:28", "remaining_time": "2 days, 7:07:20"}
39
  {"current_steps": 390, "total_steps": 3886, "loss": 0.0131, "lr": 2e-05, "epoch": 0.20074636468922918, "percentage": 10.04, "elapsed_time": "6:07:42", "remaining_time": "2 days, 6:56:11"}
40
  {"current_steps": 400, "total_steps": 3886, "loss": 0.0135, "lr": 1.999959647024453e-05, "epoch": 0.2058937073735684, "percentage": 10.29, "elapsed_time": "6:16:59", "remaining_time": "2 days, 6:45:26"}
41
+ {"current_steps": 410, "total_steps": 3886, "loss": 0.0125, "lr": 1.999838591354537e-05, "epoch": 0.2110410500579076, "percentage": 10.55, "elapsed_time": "6:28:02", "remaining_time": "2 days, 6:49:48"}
42
+ {"current_steps": 420, "total_steps": 3886, "loss": 0.0129, "lr": 1.9996368427601652e-05, "epoch": 0.21618839274224683, "percentage": 10.81, "elapsed_time": "6:37:08", "remaining_time": "2 days, 6:37:18"}
43
+ {"current_steps": 430, "total_steps": 3886, "loss": 0.0124, "lr": 1.9993544175236498e-05, "epoch": 0.22133573542658602, "percentage": 11.07, "elapsed_time": "6:46:24", "remaining_time": "2 days, 6:26:21"}
44
+ {"current_steps": 440, "total_steps": 3886, "loss": 0.013, "lr": 1.998991338438388e-05, "epoch": 0.22648307811092525, "percentage": 11.32, "elapsed_time": "6:55:43", "remaining_time": "2 days, 6:15:52"}
45
+ {"current_steps": 450, "total_steps": 3886, "loss": 0.0121, "lr": 1.9985476348070224e-05, "epoch": 0.23163042079526444, "percentage": 11.58, "elapsed_time": "7:05:02", "remaining_time": "2 days, 6:05:28"}
46
+ {"current_steps": 460, "total_steps": 3886, "loss": 0.021, "lr": 1.9980233424390773e-05, "epoch": 0.23677776347960366, "percentage": 11.84, "elapsed_time": "7:14:24", "remaining_time": "2 days, 5:55:26"}
47
+ {"current_steps": 470, "total_steps": 3886, "loss": 0.0277, "lr": 1.9974185036480664e-05, "epoch": 0.24192510616394286, "percentage": 12.09, "elapsed_time": "7:23:43", "remaining_time": "2 days, 5:44:58"}
48
+ {"current_steps": 480, "total_steps": 3886, "loss": 0.0164, "lr": 1.9967331672480798e-05, "epoch": 0.24707244884828208, "percentage": 12.35, "elapsed_time": "7:32:55", "remaining_time": "2 days, 5:33:51"}
49
+ {"current_steps": 490, "total_steps": 3886, "loss": 0.0138, "lr": 1.995967388549843e-05, "epoch": 0.2522197915326213, "percentage": 12.61, "elapsed_time": "7:42:11", "remaining_time": "2 days, 5:23:17"}
50
+ {"current_steps": 500, "total_steps": 3886, "loss": 0.0137, "lr": 1.9951212293562547e-05, "epoch": 0.2573671342169605, "percentage": 12.87, "elapsed_time": "7:51:30", "remaining_time": "2 days, 5:13:03"}