Training in progress, step 700
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef3d90bc96dd88b189982bb4a42c0592e9fd9b2a07a0109f09b1e13da100337a
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -81,3 +81,6 @@
|
|
| 81 |
{"loss": 0.60613508, "grad_norm": 0.44147998, "learning_rate": 4.35e-06, "token_acc": 0.81491268, "epoch": 2.62074111, "global_step/max_steps": "660/756", "percentage": "87.30%", "elapsed_time": "4h 31m 20s", "remaining_time": "39m 28s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040539}
|
| 82 |
{"loss": 0.6118052, "grad_norm": 0.47108141, "learning_rate": 3.5e-06, "token_acc": 0.81243315, "epoch": 2.66053221, "global_step/max_steps": "670/756", "percentage": "88.62%", "elapsed_time": "4h 35m 11s", "remaining_time": "35m 19s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040577}
|
| 83 |
{"loss": 0.59714527, "grad_norm": 0.43485948, "learning_rate": 2.74e-06, "token_acc": 0.81635524, "epoch": 2.7003233, "global_step/max_steps": "680/756", "percentage": "89.95%", "elapsed_time": "4h 39m 5s", "remaining_time": "31m 11s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040607}
|
|
|
|
|
|
|
|
|
|
|
|
| 81 |
{"loss": 0.60613508, "grad_norm": 0.44147998, "learning_rate": 4.35e-06, "token_acc": 0.81491268, "epoch": 2.62074111, "global_step/max_steps": "660/756", "percentage": "87.30%", "elapsed_time": "4h 31m 20s", "remaining_time": "39m 28s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040539}
|
| 82 |
{"loss": 0.6118052, "grad_norm": 0.47108141, "learning_rate": 3.5e-06, "token_acc": 0.81243315, "epoch": 2.66053221, "global_step/max_steps": "670/756", "percentage": "88.62%", "elapsed_time": "4h 35m 11s", "remaining_time": "35m 19s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040577}
|
| 83 |
{"loss": 0.59714527, "grad_norm": 0.43485948, "learning_rate": 2.74e-06, "token_acc": 0.81635524, "epoch": 2.7003233, "global_step/max_steps": "680/756", "percentage": "89.95%", "elapsed_time": "4h 39m 5s", "remaining_time": "31m 11s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040607}
|
| 84 |
+
{"loss": 0.60821619, "grad_norm": 0.45727718, "learning_rate": 2.07e-06, "token_acc": 0.81383335, "epoch": 2.7401144, "global_step/max_steps": "690/756", "percentage": "91.27%", "elapsed_time": "4h 42m 47s", "remaining_time": "27m 2s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040666}
|
| 85 |
+
{"loss": 0.61759448, "grad_norm": 0.46361193, "learning_rate": 1.49e-06, "token_acc": 0.81136959, "epoch": 2.7799055, "global_step/max_steps": "700/756", "percentage": "92.59%", "elapsed_time": "4h 46m 36s", "remaining_time": "22m 55s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040706}
|
| 86 |
+
{"eval_loss": 2.43304062, "eval_runtime": 81.9424, "eval_samples_per_second": 2.233, "eval_steps_per_second": 0.561, "eval_token_acc": 0.81754306, "epoch": 2.7799055, "global_step/max_steps": "700/756", "percentage": "92.59%", "elapsed_time": "4h 47m 58s", "remaining_time": "23m 2s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040513}
|
runs/events.out.tfevents.1770820661.h004.gautschi.rcac.purdue.edu.2476766.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ed8ab525f7a05993a72f659dde4dca396554365231a2ab669fb042aa02bf221
|
| 3 |
+
size 31177
|