rbelanec commited on
Commit
3bb6e00
·
verified ·
1 Parent(s): f17773e

Training in progress, step 2260

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +20 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d9961f4e52262a3912c3cc91ac4b86dca136525a75820413733138993e6738c
3
  size 8388736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dc2c296db4924f0e5a9117c49f989da1ec8fb6c88835c6f8087f5753acf289e
3
  size 8388736
trainer_log.jsonl CHANGED
@@ -451,3 +451,23 @@
451
  {"current_steps": 2160, "total_steps": 2260, "loss": 0.0, "lr": 3.03577582601422e-07, "epoch": 19.115044247787612, "percentage": 95.58, "elapsed_time": "0:03:57", "remaining_time": "0:00:11", "throughput": 2547.58, "total_tokens": 605488}
452
  {"current_steps": 2165, "total_steps": 2260, "loss": 0.0, "lr": 2.743181179037047e-07, "epoch": 19.15929203539823, "percentage": 95.8, "elapsed_time": "0:03:58", "remaining_time": "0:00:10", "throughput": 2548.43, "total_tokens": 606800}
453
  {"current_steps": 2170, "total_steps": 2260, "loss": 0.0, "lr": 2.465332862986447e-07, "epoch": 19.20353982300885, "percentage": 96.02, "elapsed_time": "0:03:58", "remaining_time": "0:00:09", "throughput": 2549.6, "total_tokens": 608272}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
451
  {"current_steps": 2160, "total_steps": 2260, "loss": 0.0, "lr": 3.03577582601422e-07, "epoch": 19.115044247787612, "percentage": 95.58, "elapsed_time": "0:03:57", "remaining_time": "0:00:11", "throughput": 2547.58, "total_tokens": 605488}
452
  {"current_steps": 2165, "total_steps": 2260, "loss": 0.0, "lr": 2.743181179037047e-07, "epoch": 19.15929203539823, "percentage": 95.8, "elapsed_time": "0:03:58", "remaining_time": "0:00:10", "throughput": 2548.43, "total_tokens": 606800}
453
  {"current_steps": 2170, "total_steps": 2260, "loss": 0.0, "lr": 2.465332862986447e-07, "epoch": 19.20353982300885, "percentage": 96.02, "elapsed_time": "0:03:58", "remaining_time": "0:00:09", "throughput": 2549.6, "total_tokens": 608272}
454
+ {"current_steps": 2175, "total_steps": 2260, "loss": 0.0, "lr": 2.2022474486620427e-07, "epoch": 19.24778761061947, "percentage": 96.24, "elapsed_time": "0:03:58", "remaining_time": "0:00:09", "throughput": 2549.69, "total_tokens": 609360}
455
+ {"current_steps": 2180, "total_steps": 2260, "loss": 0.0, "lr": 1.953940626408024e-07, "epoch": 19.292035398230087, "percentage": 96.46, "elapsed_time": "0:03:59", "remaining_time": "0:00:08", "throughput": 2550.22, "total_tokens": 610592}
456
+ {"current_steps": 2185, "total_steps": 2260, "loss": 0.0, "lr": 1.720427205177233e-07, "epoch": 19.336283185840706, "percentage": 96.68, "elapsed_time": "0:03:59", "remaining_time": "0:00:08", "throughput": 2550.6, "total_tokens": 611840}
457
+ {"current_steps": 2190, "total_steps": 2260, "loss": 0.0, "lr": 1.5017211116479802e-07, "epoch": 19.38053097345133, "percentage": 96.9, "elapsed_time": "0:04:00", "remaining_time": "0:00:07", "throughput": 2552.28, "total_tokens": 613472}
458
+ {"current_steps": 2195, "total_steps": 2260, "loss": 0.0, "lr": 1.297835389393598e-07, "epoch": 19.424778761061948, "percentage": 97.12, "elapsed_time": "0:04:00", "remaining_time": "0:00:07", "throughput": 2553.28, "total_tokens": 614848}
459
+ {"current_steps": 2200, "total_steps": 2260, "loss": 0.0, "lr": 1.1087821981042856e-07, "epoch": 19.469026548672566, "percentage": 97.35, "elapsed_time": "0:04:01", "remaining_time": "0:00:06", "throughput": 2554.65, "total_tokens": 616320}
460
+ {"current_steps": 2205, "total_steps": 2260, "loss": 0.0, "lr": 9.345728128621611e-08, "epoch": 19.513274336283185, "percentage": 97.57, "elapsed_time": "0:04:01", "remaining_time": "0:00:06", "throughput": 2555.45, "total_tokens": 617664}
461
+ {"current_steps": 2210, "total_steps": 2260, "loss": 0.0, "lr": 7.752176234685771e-08, "epoch": 19.557522123893804, "percentage": 97.79, "elapsed_time": "0:04:02", "remaining_time": "0:00:05", "throughput": 2556.92, "total_tokens": 619200}
462
+ {"current_steps": 2215, "total_steps": 2260, "loss": 0.0001, "lr": 6.307261338246718e-08, "epoch": 19.601769911504427, "percentage": 98.01, "elapsed_time": "0:04:02", "remaining_time": "0:00:04", "throughput": 2558.08, "total_tokens": 620688}
463
+ {"current_steps": 2220, "total_steps": 2260, "loss": 0.0, "lr": 5.011069613644892e-08, "epoch": 19.646017699115045, "percentage": 98.23, "elapsed_time": "0:04:03", "remaining_time": "0:00:04", "throughput": 2558.73, "total_tokens": 622032}
464
+ {"current_steps": 2225, "total_steps": 2260, "loss": 0.0, "lr": 3.8636783654100174e-08, "epoch": 19.690265486725664, "percentage": 98.45, "elapsed_time": "0:04:03", "remaining_time": "0:00:03", "throughput": 2559.24, "total_tokens": 623248}
465
+ {"current_steps": 2230, "total_steps": 2260, "loss": 0.0, "lr": 2.865156023650617e-08, "epoch": 19.734513274336283, "percentage": 98.67, "elapsed_time": "0:04:04", "remaining_time": "0:00:03", "throughput": 2561.16, "total_tokens": 624944}
466
+ {"current_steps": 2235, "total_steps": 2260, "loss": 0.0, "lr": 2.0155621399742254e-08, "epoch": 19.778761061946902, "percentage": 98.89, "elapsed_time": "0:04:04", "remaining_time": "0:00:02", "throughput": 2561.47, "total_tokens": 626176}
467
+ {"current_steps": 2240, "total_steps": 2260, "loss": 0.0, "lr": 1.31494738393384e-08, "epoch": 19.82300884955752, "percentage": 99.12, "elapsed_time": "0:04:04", "remaining_time": "0:00:02", "throughput": 2561.98, "total_tokens": 627408}
468
+ {"current_steps": 2245, "total_steps": 2260, "loss": 0.0, "lr": 7.633535400070057e-09, "epoch": 19.86725663716814, "percentage": 99.34, "elapsed_time": "0:04:05", "remaining_time": "0:00:01", "throughput": 2564.19, "total_tokens": 629216}
469
+ {"current_steps": 2250, "total_steps": 2260, "loss": 0.0, "lr": 3.6081350510447365e-09, "epoch": 19.911504424778762, "percentage": 99.56, "elapsed_time": "0:04:05", "remaining_time": "0:00:01", "throughput": 2565.12, "total_tokens": 630592}
470
+ {"current_steps": 2255, "total_steps": 2260, "loss": 0.0, "lr": 1.0735128660649406e-09, "epoch": 19.95575221238938, "percentage": 99.78, "elapsed_time": "0:04:06", "remaining_time": "0:00:00", "throughput": 2566.75, "total_tokens": 632208}
471
+ {"current_steps": 2260, "total_steps": 2260, "loss": 0.0, "lr": 2.982000932294504e-11, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:06", "remaining_time": "0:00:00", "throughput": 2566.42, "total_tokens": 633448}
472
+ {"current_steps": 2260, "total_steps": 2260, "eval_loss": 0.34241023659706116, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:07", "remaining_time": "0:00:00", "throughput": 2559.28, "total_tokens": 633448}
473
+ {"current_steps": 2260, "total_steps": 2260, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:08", "remaining_time": "0:00:00", "throughput": 2546.85, "total_tokens": 633448}