Training in progress, step 200
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ab6a23e4d96afef56614d90fbf1343aa812e32e427a8d8f87d012bd2bfe7d9a
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -21,3 +21,6 @@
|
|
| 21 |
{"loss": 0.74879541, "grad_norm": 0.33142075, "learning_rate": 9.659e-05, "token_acc": 0.78281909, "epoch": 0.49023363, "global_step/max_steps": "160/981", "percentage": "16.31%", "elapsed_time": "1h 11m 7s", "remaining_time": "6h 4m 57s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.037492}
|
| 22 |
{"loss": 0.75294838, "grad_norm": 0.384736, "learning_rate": 9.596e-05, "token_acc": 0.78064094, "epoch": 0.52087323, "global_step/max_steps": "170/981", "percentage": "17.33%", "elapsed_time": "1h 14m 58s", "remaining_time": "5h 57m 40s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.037791}
|
| 23 |
{"loss": 0.73525543, "grad_norm": 0.35296121, "learning_rate": 9.527e-05, "token_acc": 0.7861065, "epoch": 0.55151283, "global_step/max_steps": "180/981", "percentage": "18.35%", "elapsed_time": "1h 18m 49s", "remaining_time": "5h 50m 46s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.038059}
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
{"loss": 0.74879541, "grad_norm": 0.33142075, "learning_rate": 9.659e-05, "token_acc": 0.78281909, "epoch": 0.49023363, "global_step/max_steps": "160/981", "percentage": "16.31%", "elapsed_time": "1h 11m 7s", "remaining_time": "6h 4m 57s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.037492}
|
| 22 |
{"loss": 0.75294838, "grad_norm": 0.384736, "learning_rate": 9.596e-05, "token_acc": 0.78064094, "epoch": 0.52087323, "global_step/max_steps": "170/981", "percentage": "17.33%", "elapsed_time": "1h 14m 58s", "remaining_time": "5h 57m 40s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.037791}
|
| 23 |
{"loss": 0.73525543, "grad_norm": 0.35296121, "learning_rate": 9.527e-05, "token_acc": 0.7861065, "epoch": 0.55151283, "global_step/max_steps": "180/981", "percentage": "18.35%", "elapsed_time": "1h 18m 49s", "remaining_time": "5h 50m 46s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.038059}
|
| 24 |
+
{"loss": 0.71808553, "grad_norm": 0.3456454, "learning_rate": 9.452e-05, "token_acc": 0.79099379, "epoch": 0.58215243, "global_step/max_steps": "190/981", "percentage": "19.37%", "elapsed_time": "1h 22m 40s", "remaining_time": "5h 44m 9s", "memory(GiB)": 31.44, "train_speed(iter/s)": 0.038306}
|
| 25 |
+
{"loss": 0.71191416, "grad_norm": 0.35632467, "learning_rate": 9.373e-05, "token_acc": 0.79211222, "epoch": 0.61279203, "global_step/max_steps": "200/981", "percentage": "20.39%", "elapsed_time": "1h 26m 38s", "remaining_time": "5h 38m 19s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038473}
|
| 26 |
+
{"eval_loss": 2.84208274, "eval_runtime": 124.6876, "eval_samples_per_second": 2.173, "eval_steps_per_second": 0.545, "eval_token_acc": 0.79054723, "epoch": 0.61279203, "global_step/max_steps": "200/981", "percentage": "20.39%", "elapsed_time": "1h 28m 43s", "remaining_time": "5h 46m 26s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.037572}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a347e1a0dcb73df0abc453dbcef675c0bce1b2b236ab3872eb0f0dd340aa45ae
|
| 3 |
+
size 14691
|