ryanmarten commited on
Commit
2a414ca
·
verified ·
1 Parent(s): 346eb6f

Training in progress, epoch 10

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82e56d17aff8465bb512bbe11a1691fdc332aa20d9f48f6eec5b7a1f686cca98
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3465adb69584d26ab42322ced2fc5c76ea6f7c0020bfc982e890b96c1bbbec74
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:133280e60df4f37e3a7305b933836029100ea92d83d7f7a2e3c83ca6e2782525
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:316352338021a0260da83fd06c38271b7cb215edf6a7f8da0695da8b865a2273
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe024dd0eaa0dbf3ebfce863bde30992614aaaeed4a9f6460c8109c2f6f43532
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4197ff16346f282d31e6771a06ff3708b87e11539611e971c4d034e5893d70e
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5aac34827af3f90476d6bf48804714919788d5a14f70655339bb5dc25a6f3169
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ce033e236adb378a76c5eaa3005a4f7001f6be8237105a9c322b2ffd65f442c
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -93,3 +93,22 @@
93
  {"current_steps": 93, "total_steps": 117, "loss": 0.0913, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "0:39:35", "remaining_time": "0:10:12"}
94
  {"current_steps": 94, "total_steps": 117, "loss": 0.0863, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "0:39:51", "remaining_time": "0:09:45"}
95
  {"current_steps": 95, "total_steps": 117, "loss": 0.0587, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "0:40:07", "remaining_time": "0:09:17"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
  {"current_steps": 93, "total_steps": 117, "loss": 0.0913, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "0:39:35", "remaining_time": "0:10:12"}
94
  {"current_steps": 94, "total_steps": 117, "loss": 0.0863, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "0:39:51", "remaining_time": "0:09:45"}
95
  {"current_steps": 95, "total_steps": 117, "loss": 0.0587, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "0:40:07", "remaining_time": "0:09:17"}
96
+ {"current_steps": 96, "total_steps": 117, "loss": 0.0528, "lr": 9.549150281252633e-07, "epoch": 10.10126582278481, "percentage": 82.05, "elapsed_time": "0:41:22", "remaining_time": "0:09:02"}
97
+ {"current_steps": 97, "total_steps": 117, "loss": 0.1201, "lr": 8.688061284200266e-07, "epoch": 10.20253164556962, "percentage": 82.91, "elapsed_time": "0:41:50", "remaining_time": "0:08:37"}
98
+ {"current_steps": 98, "total_steps": 117, "loss": 0.0666, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "0:42:10", "remaining_time": "0:08:10"}
99
+ {"current_steps": 99, "total_steps": 117, "loss": 0.0978, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "0:42:33", "remaining_time": "0:07:44"}
100
+ {"current_steps": 100, "total_steps": 117, "loss": 0.0864, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:42:58", "remaining_time": "0:07:18"}
101
+ {"current_steps": 101, "total_steps": 117, "loss": 0.0594, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:43:12", "remaining_time": "0:06:50"}
102
+ {"current_steps": 102, "total_steps": 117, "loss": 0.0587, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:43:26", "remaining_time": "0:06:23"}
103
+ {"current_steps": 103, "total_steps": 117, "loss": 0.0576, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:43:45", "remaining_time": "0:05:56"}
104
+ {"current_steps": 104, "total_steps": 117, "loss": 0.0953, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:44:10", "remaining_time": "0:05:31"}
105
+ {"current_steps": 105, "total_steps": 117, "loss": 0.057, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "0:45:26", "remaining_time": "0:05:11"}
106
+ {"current_steps": 106, "total_steps": 117, "loss": 0.044, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "0:45:41", "remaining_time": "0:04:44"}
107
+ {"current_steps": 107, "total_steps": 117, "loss": 0.0728, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "0:46:01", "remaining_time": "0:04:18"}
108
+ {"current_steps": 108, "total_steps": 117, "loss": 0.0428, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "0:46:16", "remaining_time": "0:03:51"}
109
+ {"current_steps": 109, "total_steps": 117, "loss": 0.086, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "0:46:40", "remaining_time": "0:03:25"}
110
+ {"current_steps": 110, "total_steps": 117, "loss": 0.0697, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "0:47:05", "remaining_time": "0:02:59"}
111
+ {"current_steps": 111, "total_steps": 117, "loss": 0.0781, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "0:47:28", "remaining_time": "0:02:33"}
112
+ {"current_steps": 112, "total_steps": 117, "loss": 0.0407, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "0:47:45", "remaining_time": "0:02:07"}
113
+ {"current_steps": 113, "total_steps": 117, "loss": 0.09, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "0:48:03", "remaining_time": "0:01:42"}
114
+ {"current_steps": 114, "total_steps": 117, "loss": 0.0965, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "0:48:27", "remaining_time": "0:01:16"}