rbelanec commited on
Commit
bd3236d
·
verified ·
1 Parent(s): acc9389

Training in progress, step 1140

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +12 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01bd422531fe58f51801f54c74c5dbcbb098eac3452b12f2f9036a6daaf3169c
3
  size 1638528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18cb2d65a9e6e486f5368f30ebeb27cd4f8ca10d37cd7e476773b6ffa33758da
3
  size 1638528
trainer_log.jsonl CHANGED
@@ -235,3 +235,15 @@
235
  {"current_steps": 1083, "total_steps": 1140, "eval_loss": 0.1932847797870636, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "0:04:33", "remaining_time": "0:00:14", "throughput": 2507.11, "total_tokens": 685200}
236
  {"current_steps": 1085, "total_steps": 1140, "loss": 0.0003, "lr": 7.332578507216469e-06, "epoch": 19.035087719298247, "percentage": 95.18, "elapsed_time": "0:04:34", "remaining_time": "0:00:13", "throughput": 2500.39, "total_tokens": 686608}
237
  {"current_steps": 1090, "total_steps": 1140, "loss": 0.0002, "lr": 6.084188161890325e-06, "epoch": 19.12280701754386, "percentage": 95.61, "elapsed_time": "0:04:35", "remaining_time": "0:00:12", "throughput": 2501.39, "total_tokens": 689616}
 
 
 
 
 
 
 
 
 
 
 
 
 
235
  {"current_steps": 1083, "total_steps": 1140, "eval_loss": 0.1932847797870636, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "0:04:33", "remaining_time": "0:00:14", "throughput": 2507.11, "total_tokens": 685200}
236
  {"current_steps": 1085, "total_steps": 1140, "loss": 0.0003, "lr": 7.332578507216469e-06, "epoch": 19.035087719298247, "percentage": 95.18, "elapsed_time": "0:04:34", "remaining_time": "0:00:13", "throughput": 2500.39, "total_tokens": 686608}
237
  {"current_steps": 1090, "total_steps": 1140, "loss": 0.0002, "lr": 6.084188161890325e-06, "epoch": 19.12280701754386, "percentage": 95.61, "elapsed_time": "0:04:35", "remaining_time": "0:00:12", "throughput": 2501.39, "total_tokens": 689616}
238
+ {"current_steps": 1095, "total_steps": 1140, "loss": 0.0002, "lr": 4.95156606941688e-06, "epoch": 19.210526315789473, "percentage": 96.05, "elapsed_time": "0:04:36", "remaining_time": "0:00:11", "throughput": 2502.71, "total_tokens": 692784}
239
+ {"current_steps": 1100, "total_steps": 1140, "loss": 0.0002, "lr": 3.9349777035421194e-06, "epoch": 19.29824561403509, "percentage": 96.49, "elapsed_time": "0:04:37", "remaining_time": "0:00:10", "throughput": 2504.58, "total_tokens": 696176}
240
+ {"current_steps": 1105, "total_steps": 1140, "loss": 0.0005, "lr": 3.034661341025258e-06, "epoch": 19.385964912280702, "percentage": 96.93, "elapsed_time": "0:04:39", "remaining_time": "0:00:08", "throughput": 2505.59, "total_tokens": 699184}
241
+ {"current_steps": 1110, "total_steps": 1140, "loss": 0.0004, "lr": 2.250828005789518e-06, "epoch": 19.473684210526315, "percentage": 97.37, "elapsed_time": "0:04:40", "remaining_time": "0:00:07", "throughput": 2507.14, "total_tokens": 702448}
242
+ {"current_steps": 1115, "total_steps": 1140, "loss": 0.0003, "lr": 1.5836614194602028e-06, "epoch": 19.56140350877193, "percentage": 97.81, "elapsed_time": "0:04:41", "remaining_time": "0:00:06", "throughput": 2507.56, "total_tokens": 705232}
243
+ {"current_steps": 1120, "total_steps": 1140, "loss": 0.0002, "lr": 1.033317958302693e-06, "epoch": 19.649122807017545, "percentage": 98.25, "elapsed_time": "0:04:42", "remaining_time": "0:00:05", "throughput": 2509.32, "total_tokens": 708624}
244
+ {"current_steps": 1125, "total_steps": 1140, "loss": 0.0002, "lr": 5.999266165694906e-07, "epoch": 19.736842105263158, "percentage": 98.68, "elapsed_time": "0:04:43", "remaining_time": "0:00:03", "throughput": 2510.12, "total_tokens": 711568}
245
+ {"current_steps": 1130, "total_steps": 1140, "loss": 0.0002, "lr": 2.8358897626556966e-07, "epoch": 19.82456140350877, "percentage": 99.12, "elapsed_time": "0:04:44", "remaining_time": "0:00:02", "throughput": 2512.44, "total_tokens": 715216}
246
+ {"current_steps": 1135, "total_steps": 1140, "loss": 0.0004, "lr": 8.437918333864537e-08, "epoch": 19.912280701754387, "percentage": 99.56, "elapsed_time": "0:04:45", "remaining_time": "0:00:01", "throughput": 2513.41, "total_tokens": 718288}
247
+ {"current_steps": 1140, "total_steps": 1140, "loss": 0.0002, "lr": 2.343930299963937e-09, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:46", "remaining_time": "0:00:00", "throughput": 2515.66, "total_tokens": 721856}
248
+ {"current_steps": 1140, "total_steps": 1140, "eval_loss": 0.1910102218389511, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:47", "remaining_time": "0:00:00", "throughput": 2508.71, "total_tokens": 721856}
249
+ {"current_steps": 1140, "total_steps": 1140, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "0:04:48", "remaining_time": "0:00:00", "throughput": 2502.11, "total_tokens": 721856}