Training in progress, step 500
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc29bda333b798b8d6882de60cd19e30948012ea10d0aafa84a760eedf8f43f7
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -57,3 +57,6 @@
|
|
| 57 |
{"loss": 0.67901173, "grad_norm": 0.39468125, "learning_rate": 5.931e-05, "token_acc": 0.79664045, "epoch": 1.4075067, "global_step/max_steps": "460/981", "percentage": "46.89%", "elapsed_time": "3h 20m 17s", "remaining_time": "3h 46m 51s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038277}
|
| 58 |
{"loss": 0.69018073, "grad_norm": 0.47022712, "learning_rate": 5.765e-05, "token_acc": 0.79297059, "epoch": 1.4381463, "global_step/max_steps": "470/981", "percentage": "47.91%", "elapsed_time": "3h 24m 14s", "remaining_time": "3h 42m 3s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038355}
|
| 59 |
{"loss": 0.66265864, "grad_norm": 0.43239185, "learning_rate": 5.598e-05, "token_acc": 0.80108355, "epoch": 1.46878591, "global_step/max_steps": "480/981", "percentage": "48.93%", "elapsed_time": "3h 28m 6s", "remaining_time": "3h 37m 12s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038441}
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
{"loss": 0.67901173, "grad_norm": 0.39468125, "learning_rate": 5.931e-05, "token_acc": 0.79664045, "epoch": 1.4075067, "global_step/max_steps": "460/981", "percentage": "46.89%", "elapsed_time": "3h 20m 17s", "remaining_time": "3h 46m 51s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038277}
|
| 58 |
{"loss": 0.69018073, "grad_norm": 0.47022712, "learning_rate": 5.765e-05, "token_acc": 0.79297059, "epoch": 1.4381463, "global_step/max_steps": "470/981", "percentage": "47.91%", "elapsed_time": "3h 24m 14s", "remaining_time": "3h 42m 3s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038355}
|
| 59 |
{"loss": 0.66265864, "grad_norm": 0.43239185, "learning_rate": 5.598e-05, "token_acc": 0.80108355, "epoch": 1.46878591, "global_step/max_steps": "480/981", "percentage": "48.93%", "elapsed_time": "3h 28m 6s", "remaining_time": "3h 37m 12s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038441}
|
| 60 |
+
{"loss": 0.67207289, "grad_norm": 0.39702681, "learning_rate": 5.43e-05, "token_acc": 0.79808606, "epoch": 1.49942551, "global_step/max_steps": "490/981", "percentage": "49.95%", "elapsed_time": "3h 31m 56s", "remaining_time": "3h 32m 22s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038531}
|
| 61 |
+
{"loss": 0.68019748, "grad_norm": 0.55682892, "learning_rate": 5.261e-05, "token_acc": 0.79575072, "epoch": 1.53006511, "global_step/max_steps": "500/981", "percentage": "50.97%", "elapsed_time": "3h 35m 47s", "remaining_time": "3h 27m 35s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038618}
|
| 62 |
+
{"eval_loss": 2.66862845, "eval_runtime": 124.7699, "eval_samples_per_second": 2.172, "eval_steps_per_second": 0.545, "eval_token_acc": 0.79923354, "epoch": 1.53006511, "global_step/max_steps": "500/981", "percentage": "50.97%", "elapsed_time": "3h 37m 51s", "remaining_time": "3h 29m 35s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.03825}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0feffb8cd57efb23a215dd0cf6f38c03829c6488ebb938ef26122a187a1cdf63
|
| 3 |
+
size 24585
|