Training in progress, step 40
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a20d8c630f5fcd6609579d1a60c4bdb6feb6a6d62d4bf3c90e9819d4240017ec
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -2,3 +2,5 @@
|
|
| 2 |
{"loss": 1.16878664, "grad_norm": 0.5406909, "learning_rate": 2e-06, "token_acc": 0.72249161, "epoch": 0.00306396, "global_step/max_steps": "1/981", "percentage": "0.10%", "elapsed_time": "2m 35s", "remaining_time": "1d 18h 27m 54s", "memory(GiB)": 26.53, "train_speed(iter/s)": 0.00641}
|
| 3 |
{"loss": 1.17375967, "grad_norm": 0.58584249, "learning_rate": 2e-05, "token_acc": 0.72573775, "epoch": 0.0306396, "global_step/max_steps": "10/981", "percentage": "1.02%", "elapsed_time": "6m 13s", "remaining_time": "10h 4m 42s", "memory(GiB)": 30.81, "train_speed(iter/s)": 0.026762}
|
| 4 |
{"loss": 1.10936718, "grad_norm": 0.30921611, "learning_rate": 4e-05, "token_acc": 0.72818226, "epoch": 0.0612792, "global_step/max_steps": "20/981", "percentage": "2.04%", "elapsed_time": "10m 9s", "remaining_time": "8h 7m 44s", "memory(GiB)": 30.83, "train_speed(iter/s)": 0.032838}
|
|
|
|
|
|
|
|
|
| 2 |
{"loss": 1.16878664, "grad_norm": 0.5406909, "learning_rate": 2e-06, "token_acc": 0.72249161, "epoch": 0.00306396, "global_step/max_steps": "1/981", "percentage": "0.10%", "elapsed_time": "2m 35s", "remaining_time": "1d 18h 27m 54s", "memory(GiB)": 26.53, "train_speed(iter/s)": 0.00641}
|
| 3 |
{"loss": 1.17375967, "grad_norm": 0.58584249, "learning_rate": 2e-05, "token_acc": 0.72573775, "epoch": 0.0306396, "global_step/max_steps": "10/981", "percentage": "1.02%", "elapsed_time": "6m 13s", "remaining_time": "10h 4m 42s", "memory(GiB)": 30.81, "train_speed(iter/s)": 0.026762}
|
| 4 |
{"loss": 1.10936718, "grad_norm": 0.30921611, "learning_rate": 4e-05, "token_acc": 0.72818226, "epoch": 0.0612792, "global_step/max_steps": "20/981", "percentage": "2.04%", "elapsed_time": "10m 9s", "remaining_time": "8h 7m 44s", "memory(GiB)": 30.83, "train_speed(iter/s)": 0.032838}
|
| 5 |
+
{"loss": 1.01700897, "grad_norm": 0.32395476, "learning_rate": 6e-05, "token_acc": 0.73665842, "epoch": 0.09191881, "global_step/max_steps": "30/981", "percentage": "3.06%", "elapsed_time": "14m 15s", "remaining_time": "7h 32m 13s", "memory(GiB)": 31.14, "train_speed(iter/s)": 0.035049}
|
| 6 |
+
{"loss": 0.96151037, "grad_norm": 0.21501774, "learning_rate": 8e-05, "token_acc": 0.74531657, "epoch": 0.12255841, "global_step/max_steps": "40/981", "percentage": "4.08%", "elapsed_time": "18m 15s", "remaining_time": "7h 9m 25s", "memory(GiB)": 31.14, "train_speed(iter/s)": 0.036521}
|
runs/events.out.tfevents.1772953118.h012.gautschi.rcac.purdue.edu.2974893.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0669f759af511dda42895a6be88316c2c1550bda8756bf3a9ee36bcb19049e4
|
| 3 |
+
size 9207
|