Training in progress, step 40
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5aab2642ce284bff61cab02e38886a366d996d40a75c95ffbc62eb02e9abbc2b
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -2,3 +2,5 @@
|
|
| 2 |
{"loss": 1.16878664, "grad_norm": 0.54073948, "learning_rate": 2e-06, "token_acc": 0.72249161, "epoch": 0.00306396, "global_step/max_steps": "1/981", "percentage": "0.10%", "elapsed_time": "2m 32s", "remaining_time": "1d 17h 38m 33s", "memory(GiB)": 26.53, "train_speed(iter/s)": 0.006537}
|
| 3 |
{"loss": 1.1736784, "grad_norm": 0.58766067, "learning_rate": 2e-05, "token_acc": 0.72568921, "epoch": 0.0306396, "global_step/max_steps": "10/981", "percentage": "1.02%", "elapsed_time": "6m 7s", "remaining_time": "9h 54m 19s", "memory(GiB)": 30.81, "train_speed(iter/s)": 0.02723}
|
| 4 |
{"loss": 1.10924559, "grad_norm": 0.30837649, "learning_rate": 4e-05, "token_acc": 0.72819331, "epoch": 0.0612792, "global_step/max_steps": "20/981", "percentage": "2.04%", "elapsed_time": "10m 2s", "remaining_time": "8h 2m 50s", "memory(GiB)": 30.83, "train_speed(iter/s)": 0.033171}
|
|
|
|
|
|
|
|
|
| 2 |
{"loss": 1.16878664, "grad_norm": 0.54073948, "learning_rate": 2e-06, "token_acc": 0.72249161, "epoch": 0.00306396, "global_step/max_steps": "1/981", "percentage": "0.10%", "elapsed_time": "2m 32s", "remaining_time": "1d 17h 38m 33s", "memory(GiB)": 26.53, "train_speed(iter/s)": 0.006537}
|
| 3 |
{"loss": 1.1736784, "grad_norm": 0.58766067, "learning_rate": 2e-05, "token_acc": 0.72568921, "epoch": 0.0306396, "global_step/max_steps": "10/981", "percentage": "1.02%", "elapsed_time": "6m 7s", "remaining_time": "9h 54m 19s", "memory(GiB)": 30.81, "train_speed(iter/s)": 0.02723}
|
| 4 |
{"loss": 1.10924559, "grad_norm": 0.30837649, "learning_rate": 4e-05, "token_acc": 0.72819331, "epoch": 0.0612792, "global_step/max_steps": "20/981", "percentage": "2.04%", "elapsed_time": "10m 2s", "remaining_time": "8h 2m 50s", "memory(GiB)": 30.83, "train_speed(iter/s)": 0.033171}
|
| 5 |
+
{"loss": 1.01692772, "grad_norm": 0.32810712, "learning_rate": 6e-05, "token_acc": 0.73688205, "epoch": 0.09191881, "global_step/max_steps": "30/981", "percentage": "3.06%", "elapsed_time": "14m 3s", "remaining_time": "7h 25m 41s", "memory(GiB)": 31.14, "train_speed(iter/s)": 0.035562}
|
| 6 |
+
{"loss": 0.96151266, "grad_norm": 0.22189981, "learning_rate": 8e-05, "token_acc": 0.74540555, "epoch": 0.12255841, "global_step/max_steps": "40/981", "percentage": "4.08%", "elapsed_time": "17m 59s", "remaining_time": "7h 3m 9s", "memory(GiB)": 31.14, "train_speed(iter/s)": 0.037062}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54a2d12769e74e0607401165e3a16ed4997176bffbaacb7119d55979ca0f9d59
|
| 3 |
+
size 9207
|