rbelanec commited on
Commit
a3abea9
·
verified ·
1 Parent(s): a332218

Training in progress, step 990

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +20 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed967b35896f6d514f9288cb7f87b470f527edbccffbe6d51385cd2a5bea7325
3
  size 58745928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7b61663d5465934c31edf09497284fabb5155a93f16a6ab29c8ead1a4188b2
3
  size 58745928
trainer_log.jsonl CHANGED
@@ -196,3 +196,23 @@
196
  {"current_steps": 930, "total_steps": 1800, "loss": 0.0, "lr": 2.795047091999849e-05, "epoch": 10.333333333333334, "percentage": 51.67, "elapsed_time": "0:03:32", "remaining_time": "0:03:19", "throughput": 1370.78, "total_tokens": 291744}
197
  {"current_steps": 935, "total_steps": 1800, "loss": 0.0, "lr": 2.770962324910027e-05, "epoch": 10.38888888888889, "percentage": 51.94, "elapsed_time": "0:03:33", "remaining_time": "0:03:17", "throughput": 1371.91, "total_tokens": 293344}
198
  {"current_steps": 940, "total_steps": 1800, "loss": 0.0, "lr": 2.7468520827592197e-05, "epoch": 10.444444444444445, "percentage": 52.22, "elapsed_time": "0:03:34", "remaining_time": "0:03:16", "throughput": 1372.92, "total_tokens": 294912}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
196
  {"current_steps": 930, "total_steps": 1800, "loss": 0.0, "lr": 2.795047091999849e-05, "epoch": 10.333333333333334, "percentage": 51.67, "elapsed_time": "0:03:32", "remaining_time": "0:03:19", "throughput": 1370.78, "total_tokens": 291744}
197
  {"current_steps": 935, "total_steps": 1800, "loss": 0.0, "lr": 2.770962324910027e-05, "epoch": 10.38888888888889, "percentage": 51.94, "elapsed_time": "0:03:33", "remaining_time": "0:03:17", "throughput": 1371.91, "total_tokens": 293344}
198
  {"current_steps": 940, "total_steps": 1800, "loss": 0.0, "lr": 2.7468520827592197e-05, "epoch": 10.444444444444445, "percentage": 52.22, "elapsed_time": "0:03:34", "remaining_time": "0:03:16", "throughput": 1372.92, "total_tokens": 294912}
199
+ {"current_steps": 945, "total_steps": 1800, "loss": 0.0, "lr": 2.7227186323197162e-05, "epoch": 10.5, "percentage": 52.5, "elapsed_time": "0:03:35", "remaining_time": "0:03:15", "throughput": 1373.86, "total_tokens": 296480}
200
+ {"current_steps": 950, "total_steps": 1800, "loss": 0.0, "lr": 2.6985642425457757e-05, "epoch": 10.555555555555555, "percentage": 52.78, "elapsed_time": "0:03:36", "remaining_time": "0:03:13", "throughput": 1374.85, "total_tokens": 298048}
201
+ {"current_steps": 955, "total_steps": 1800, "loss": 0.0, "lr": 2.674391184360313e-05, "epoch": 10.61111111111111, "percentage": 53.06, "elapsed_time": "0:03:37", "remaining_time": "0:03:12", "throughput": 1375.97, "total_tokens": 299648}
202
+ {"current_steps": 960, "total_steps": 1800, "loss": 0.0, "lr": 2.650201730441392e-05, "epoch": 10.666666666666666, "percentage": 53.33, "elapsed_time": "0:03:38", "remaining_time": "0:03:11", "throughput": 1376.9, "total_tokens": 301216}
203
+ {"current_steps": 965, "total_steps": 1800, "loss": 0.0, "lr": 2.6259981550085504e-05, "epoch": 10.722222222222221, "percentage": 53.61, "elapsed_time": "0:03:39", "remaining_time": "0:03:10", "throughput": 1377.8, "total_tokens": 302784}
204
+ {"current_steps": 970, "total_steps": 1800, "loss": 0.0, "lr": 2.60178273360899e-05, "epoch": 10.777777777777779, "percentage": 53.89, "elapsed_time": "0:03:40", "remaining_time": "0:03:08", "throughput": 1378.6, "total_tokens": 304320}
205
+ {"current_steps": 975, "total_steps": 1800, "loss": 0.0, "lr": 2.5775577429036345e-05, "epoch": 10.833333333333334, "percentage": 54.17, "elapsed_time": "0:03:41", "remaining_time": "0:03:07", "throughput": 1379.38, "total_tokens": 305856}
206
+ {"current_steps": 980, "total_steps": 1800, "loss": 0.0, "lr": 2.553325460453086e-05, "epoch": 10.88888888888889, "percentage": 54.44, "elapsed_time": "0:03:42", "remaining_time": "0:03:06", "throughput": 1380.32, "total_tokens": 307424}
207
+ {"current_steps": 985, "total_steps": 1800, "loss": 0.0, "lr": 2.5290881645034932e-05, "epoch": 10.944444444444445, "percentage": 54.72, "elapsed_time": "0:03:43", "remaining_time": "0:03:05", "throughput": 1381.27, "total_tokens": 308992}
208
+ {"current_steps": 990, "total_steps": 1800, "loss": 0.0, "lr": 2.504848133772358e-05, "epoch": 11.0, "percentage": 55.0, "elapsed_time": "0:03:44", "remaining_time": "0:03:03", "throughput": 1381.97, "total_tokens": 310560}
209
+ {"current_steps": 990, "total_steps": 1800, "eval_loss": 0.09742120653390884, "epoch": 11.0, "percentage": 55.0, "elapsed_time": "0:03:45", "remaining_time": "0:03:04", "throughput": 1378.22, "total_tokens": 310560}
210
+ {"current_steps": 995, "total_steps": 1800, "loss": 0.0, "lr": 2.4806076472342997e-05, "epoch": 11.055555555555555, "percentage": 55.28, "elapsed_time": "0:03:47", "remaining_time": "0:03:04", "throughput": 1370.77, "total_tokens": 312160}
211
+ {"current_steps": 1000, "total_steps": 1800, "loss": 0.0, "lr": 2.4563689839067913e-05, "epoch": 11.11111111111111, "percentage": 55.56, "elapsed_time": "0:03:48", "remaining_time": "0:03:02", "throughput": 1371.6, "total_tokens": 313728}
212
+ {"current_steps": 1005, "total_steps": 1800, "loss": 0.0, "lr": 2.432134422635893e-05, "epoch": 11.166666666666666, "percentage": 55.83, "elapsed_time": "0:03:49", "remaining_time": "0:03:01", "throughput": 1372.3, "total_tokens": 315264}
213
+ {"current_steps": 1010, "total_steps": 1800, "loss": 0.0, "lr": 2.4079062418820002e-05, "epoch": 11.222222222222221, "percentage": 56.11, "elapsed_time": "0:03:51", "remaining_time": "0:03:00", "throughput": 1371.06, "total_tokens": 316864}
214
+ {"current_steps": 1015, "total_steps": 1800, "loss": 0.0, "lr": 2.3836867195056335e-05, "epoch": 11.277777777777779, "percentage": 56.39, "elapsed_time": "0:03:52", "remaining_time": "0:02:59", "throughput": 1371.97, "total_tokens": 318432}
215
+ {"current_steps": 1020, "total_steps": 1800, "loss": 0.0, "lr": 2.3594781325532784e-05, "epoch": 11.333333333333334, "percentage": 56.67, "elapsed_time": "0:03:53", "remaining_time": "0:02:58", "throughput": 1372.95, "total_tokens": 320032}
216
+ {"current_steps": 1025, "total_steps": 1800, "loss": 0.0, "lr": 2.3352827570433036e-05, "epoch": 11.38888888888889, "percentage": 56.94, "elapsed_time": "0:03:54", "remaining_time": "0:02:57", "throughput": 1373.5, "total_tokens": 321536}
217
+ {"current_steps": 1030, "total_steps": 1800, "loss": 0.0, "lr": 2.3111028677519804e-05, "epoch": 11.444444444444445, "percentage": 57.22, "elapsed_time": "0:03:55", "remaining_time": "0:02:55", "throughput": 1374.07, "total_tokens": 323040}
218
+ {"current_steps": 1035, "total_steps": 1800, "loss": 0.0, "lr": 2.2869407379996088e-05, "epoch": 11.5, "percentage": 57.5, "elapsed_time": "0:03:56", "remaining_time": "0:02:54", "throughput": 1374.94, "total_tokens": 324608}