Training in progress, step 40
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be5c9060ea8d088b63ebde30a5af632b6c8b8a3071ef80e9fa9fa219dd73834f
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -2,3 +2,5 @@
|
|
| 2 |
{"loss": 1.0916611, "grad_norm": 0.55941969, "learning_rate": 2.63e-06, "token_acc": 0.74447185, "epoch": 0.00397911, "global_step/max_steps": "1/756", "percentage": "0.13%", "elapsed_time": "1m 50s", "remaining_time": "23h 10m 25s", "memory(GiB)": 28.08, "train_speed(iter/s)": 0.00905}
|
| 3 |
{"loss": 1.10507329, "grad_norm": 0.50046724, "learning_rate": 2.632e-05, "token_acc": 0.74080157, "epoch": 0.0397911, "global_step/max_steps": "10/756", "percentage": "1.32%", "elapsed_time": "5m 16s", "remaining_time": "6h 34m 5s", "memory(GiB)": 31.13, "train_speed(iter/s)": 0.031549}
|
| 4 |
{"loss": 1.00932264, "grad_norm": 0.22522864, "learning_rate": 5.263e-05, "token_acc": 0.74884435, "epoch": 0.07958219, "global_step/max_steps": "20/756", "percentage": "2.65%", "elapsed_time": "9m 6s", "remaining_time": "5h 35m 11s", "memory(GiB)": 31.16, "train_speed(iter/s)": 0.036596}
|
|
|
|
|
|
|
|
|
| 2 |
{"loss": 1.0916611, "grad_norm": 0.55941969, "learning_rate": 2.63e-06, "token_acc": 0.74447185, "epoch": 0.00397911, "global_step/max_steps": "1/756", "percentage": "0.13%", "elapsed_time": "1m 50s", "remaining_time": "23h 10m 25s", "memory(GiB)": 28.08, "train_speed(iter/s)": 0.00905}
|
| 3 |
{"loss": 1.10507329, "grad_norm": 0.50046724, "learning_rate": 2.632e-05, "token_acc": 0.74080157, "epoch": 0.0397911, "global_step/max_steps": "10/756", "percentage": "1.32%", "elapsed_time": "5m 16s", "remaining_time": "6h 34m 5s", "memory(GiB)": 31.13, "train_speed(iter/s)": 0.031549}
|
| 4 |
{"loss": 1.00932264, "grad_norm": 0.22522864, "learning_rate": 5.263e-05, "token_acc": 0.74884435, "epoch": 0.07958219, "global_step/max_steps": "20/756", "percentage": "2.65%", "elapsed_time": "9m 6s", "remaining_time": "5h 35m 11s", "memory(GiB)": 31.16, "train_speed(iter/s)": 0.036596}
|
| 5 |
+
{"loss": 0.93268452, "grad_norm": 0.25404572, "learning_rate": 7.895e-05, "token_acc": 0.75676336, "epoch": 0.11937329, "global_step/max_steps": "30/756", "percentage": "3.97%", "elapsed_time": "13m 12s", "remaining_time": "5h 19m 30s", "memory(GiB)": 31.41, "train_speed(iter/s)": 0.03787}
|
| 6 |
+
{"loss": 0.87882118, "grad_norm": 0.21832059, "learning_rate": 0.0001, "token_acc": 0.76511042, "epoch": 0.15916439, "global_step/max_steps": "40/756", "percentage": "5.29%", "elapsed_time": "17m 8s", "remaining_time": "5h 6m 52s", "memory(GiB)": 31.41, "train_speed(iter/s)": 0.038887}
|
runs/events.out.tfevents.1770820661.h004.gautschi.rcac.purdue.edu.2476766.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e07079c26292d6f9153d42d597d0a7203297f32a0e8a6ff705bddf9065dbdd82
|
| 3 |
+
size 9203
|