gsmyrnis commited on
Commit
08a021e
·
verified ·
1 Parent(s): 4053fe4

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fb93b2d60f815ceb62cd5006844138788a0a0e3c074ca8391dd94ddcdaf730c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:706b526132446956b812baadfb971a64b2774ec4f41e7b6a8348d9723785a8a5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61c71d3142b1620c9dcbb8fd84c9768a16cfb760509c8e0a951b662fcd73cf77
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14096fb3eaca7d4811802305de5b406645987abb8bb04d7a4063448109eb1c9
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d78d885f188fcf24c2ac142a7bd264134a1a709bcd12c011bf3ccd69f526f89
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2409d2000becd09909a0865a8e034f31c1fa62a791b9a7ef1cedf501a1327b16
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd3ac08dd319f49242740f96a6b6fa3a478ffb335c72eddd28865ce8861f11b6
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd62595cbee2360bf20a2a8798b939257493de1f088a33967ca2a499fa454ba7
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -186,3 +186,32 @@
186
  {"current_steps": 186, "total_steps": 216, "loss": 0.2161, "lr": 5.785225463498828e-07, "epoch": 2.571428571428571, "percentage": 86.11, "elapsed_time": "0:12:57", "remaining_time": "0:02:05"}
187
  {"current_steps": 187, "total_steps": 216, "loss": 0.249, "lr": 5.412973117089288e-07, "epoch": 2.5852534562211984, "percentage": 86.57, "elapsed_time": "0:13:00", "remaining_time": "0:02:01"}
188
  {"current_steps": 188, "total_steps": 216, "loss": 0.1794, "lr": 5.05241294573024e-07, "epoch": 2.5990783410138247, "percentage": 87.04, "elapsed_time": "0:13:03", "remaining_time": "0:01:56"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
186
  {"current_steps": 186, "total_steps": 216, "loss": 0.2161, "lr": 5.785225463498828e-07, "epoch": 2.571428571428571, "percentage": 86.11, "elapsed_time": "0:12:57", "remaining_time": "0:02:05"}
187
  {"current_steps": 187, "total_steps": 216, "loss": 0.249, "lr": 5.412973117089288e-07, "epoch": 2.5852534562211984, "percentage": 86.57, "elapsed_time": "0:13:00", "remaining_time": "0:02:01"}
188
  {"current_steps": 188, "total_steps": 216, "loss": 0.1794, "lr": 5.05241294573024e-07, "epoch": 2.5990783410138247, "percentage": 87.04, "elapsed_time": "0:13:03", "remaining_time": "0:01:56"}
189
+ {"current_steps": 189, "total_steps": 216, "loss": 0.2483, "lr": 4.7036395000776556e-07, "epoch": 2.6129032258064515, "percentage": 87.5, "elapsed_time": "0:13:07", "remaining_time": "0:01:52"}
190
+ {"current_steps": 190, "total_steps": 216, "loss": 0.1891, "lr": 4.3667442399229985e-07, "epoch": 2.6267281105990783, "percentage": 87.96, "elapsed_time": "0:13:10", "remaining_time": "0:01:48"}
191
+ {"current_steps": 191, "total_steps": 216, "loss": 0.2294, "lr": 4.041815510209396e-07, "epoch": 2.640552995391705, "percentage": 88.43, "elapsed_time": "0:13:14", "remaining_time": "0:01:43"}
192
+ {"current_steps": 192, "total_steps": 216, "loss": 0.2278, "lr": 3.728938517864794e-07, "epoch": 2.654377880184332, "percentage": 88.89, "elapsed_time": "0:13:17", "remaining_time": "0:01:39"}
193
+ {"current_steps": 193, "total_steps": 216, "loss": 0.2144, "lr": 3.4281953094578877e-07, "epoch": 2.6682027649769586, "percentage": 89.35, "elapsed_time": "0:13:20", "remaining_time": "0:01:35"}
194
+ {"current_steps": 194, "total_steps": 216, "loss": 0.2517, "lr": 3.1396647496828245e-07, "epoch": 2.6820276497695854, "percentage": 89.81, "elapsed_time": "0:13:24", "remaining_time": "0:01:31"}
195
+ {"current_steps": 195, "total_steps": 216, "loss": 0.2611, "lr": 2.8634225006782867e-07, "epoch": 2.6958525345622117, "percentage": 90.28, "elapsed_time": "0:13:27", "remaining_time": "0:01:26"}
196
+ {"current_steps": 196, "total_steps": 216, "loss": 0.2059, "lr": 2.599541002186479e-07, "epoch": 2.709677419354839, "percentage": 90.74, "elapsed_time": "0:13:30", "remaining_time": "0:01:22"}
197
+ {"current_steps": 197, "total_steps": 216, "loss": 0.1805, "lr": 2.3480894525569564e-07, "epoch": 2.7235023041474653, "percentage": 91.2, "elapsed_time": "0:13:34", "remaining_time": "0:01:18"}
198
+ {"current_steps": 198, "total_steps": 216, "loss": 0.2479, "lr": 2.109133790600648e-07, "epoch": 2.737327188940092, "percentage": 91.67, "elapsed_time": "0:13:37", "remaining_time": "0:01:14"}
199
+ {"current_steps": 199, "total_steps": 216, "loss": 0.2388, "lr": 1.8827366782984913e-07, "epoch": 2.751152073732719, "percentage": 92.13, "elapsed_time": "0:13:41", "remaining_time": "0:01:10"}
200
+ {"current_steps": 200, "total_steps": 216, "loss": 0.2238, "lr": 1.6689574843694433e-07, "epoch": 2.7649769585253456, "percentage": 92.59, "elapsed_time": "0:13:44", "remaining_time": "0:01:05"}
201
+ {"current_steps": 201, "total_steps": 216, "loss": 0.1927, "lr": 1.4678522687020414e-07, "epoch": 2.7788018433179724, "percentage": 93.06, "elapsed_time": "0:13:47", "remaining_time": "0:01:01"}
202
+ {"current_steps": 202, "total_steps": 216, "loss": 0.219, "lr": 1.2794737676536993e-07, "epoch": 2.792626728110599, "percentage": 93.52, "elapsed_time": "0:13:51", "remaining_time": "0:00:57"}
203
+ {"current_steps": 203, "total_steps": 216, "loss": 0.2258, "lr": 1.1038713802214718e-07, "epoch": 2.806451612903226, "percentage": 93.98, "elapsed_time": "0:13:54", "remaining_time": "0:00:53"}
204
+ {"current_steps": 204, "total_steps": 216, "loss": 0.2272, "lr": 9.410911550880474e-08, "epoch": 2.8202764976958523, "percentage": 94.44, "elapsed_time": "0:13:58", "remaining_time": "0:00:49"}
205
+ {"current_steps": 205, "total_steps": 216, "loss": 0.1845, "lr": 7.911757785462882e-08, "epoch": 2.8341013824884795, "percentage": 94.91, "elapsed_time": "0:14:01", "remaining_time": "0:00:45"}
206
+ {"current_steps": 206, "total_steps": 216, "loss": 0.1772, "lr": 6.54164563305465e-08, "epoch": 2.847926267281106, "percentage": 95.37, "elapsed_time": "0:14:04", "remaining_time": "0:00:41"}
207
+ {"current_steps": 207, "total_steps": 216, "loss": 0.2429, "lr": 5.3009343818219985e-08, "epoch": 2.8617511520737327, "percentage": 95.83, "elapsed_time": "0:14:08", "remaining_time": "0:00:36"}
208
+ {"current_steps": 208, "total_steps": 216, "loss": 0.2, "lr": 4.189949386787462e-08, "epoch": 2.8755760368663594, "percentage": 96.3, "elapsed_time": "0:14:11", "remaining_time": "0:00:32"}
209
+ {"current_steps": 209, "total_steps": 216, "loss": 0.2812, "lr": 3.2089819845111946e-08, "epoch": 2.889400921658986, "percentage": 96.76, "elapsed_time": "0:14:15", "remaining_time": "0:00:28"}
210
+ {"current_steps": 210, "total_steps": 216, "loss": 0.2579, "lr": 2.358289416693027e-08, "epoch": 2.903225806451613, "percentage": 97.22, "elapsed_time": "0:14:18", "remaining_time": "0:00:24"}
211
+ {"current_steps": 211, "total_steps": 216, "loss": 0.2217, "lr": 1.6380947627153143e-08, "epoch": 2.9170506912442398, "percentage": 97.69, "elapsed_time": "0:14:22", "remaining_time": "0:00:20"}
212
+ {"current_steps": 212, "total_steps": 216, "loss": 0.2273, "lr": 1.0485868811441757e-08, "epoch": 2.9308755760368665, "percentage": 98.15, "elapsed_time": "0:14:25", "remaining_time": "0:00:16"}
213
+ {"current_steps": 213, "total_steps": 216, "loss": 0.2158, "lr": 5.899203602046655e-09, "epoch": 2.944700460829493, "percentage": 98.61, "elapsed_time": "0:14:28", "remaining_time": "0:00:12"}
214
+ {"current_steps": 214, "total_steps": 216, "loss": 0.2063, "lr": 2.6221547724253337e-09, "epoch": 2.9585253456221197, "percentage": 99.07, "elapsed_time": "0:14:32", "remaining_time": "0:00:08"}
215
+ {"current_steps": 215, "total_steps": 216, "loss": 0.2588, "lr": 6.555816718389896e-10, "epoch": 2.9723502304147464, "percentage": 99.54, "elapsed_time": "0:14:35", "remaining_time": "0:00:04"}
216
+ {"current_steps": 216, "total_steps": 216, "loss": 0.2179, "lr": 0.0, "epoch": 2.986175115207373, "percentage": 100.0, "elapsed_time": "0:14:38", "remaining_time": "0:00:00"}
217
+ {"current_steps": 216, "total_steps": 216, "epoch": 2.986175115207373, "percentage": 100.0, "elapsed_time": "0:16:46", "remaining_time": "0:00:00"}