Training in progress, step 981
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81fa8147b9499f31e9db5964c9239e747637aaef731857233ecd7bff4ee2014c
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -117,3 +117,5 @@
|
|
| 117 |
{"loss": 0.64517288, "grad_norm": 0.44848776, "learning_rate": 1.3e-07, "token_acc": 0.80361007, "epoch": 2.93757181, "global_step/max_steps": "960/981", "percentage": "97.86%", "elapsed_time": "6h 55m 29s", "remaining_time": "9m 5s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038509}
|
| 118 |
{"loss": 0.64295397, "grad_norm": 0.4717283, "learning_rate": 3e-08, "token_acc": 0.80482168, "epoch": 2.96821141, "global_step/max_steps": "970/981", "percentage": "98.88%", "elapsed_time": "6h 59m 23s", "remaining_time": "4m 45s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038548}
|
| 119 |
{"loss": 0.62486019, "grad_norm": 0.41565621, "learning_rate": 0.0, "token_acc": 0.80835402, "epoch": 2.99885101, "global_step/max_steps": "980/981", "percentage": "99.90%", "elapsed_time": "7h 3m 15s", "remaining_time": "25s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.03859}
|
|
|
|
|
|
|
|
|
| 117 |
{"loss": 0.64517288, "grad_norm": 0.44848776, "learning_rate": 1.3e-07, "token_acc": 0.80361007, "epoch": 2.93757181, "global_step/max_steps": "960/981", "percentage": "97.86%", "elapsed_time": "6h 55m 29s", "remaining_time": "9m 5s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038509}
|
| 118 |
{"loss": 0.64295397, "grad_norm": 0.4717283, "learning_rate": 3e-08, "token_acc": 0.80482168, "epoch": 2.96821141, "global_step/max_steps": "970/981", "percentage": "98.88%", "elapsed_time": "6h 59m 23s", "remaining_time": "4m 45s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038548}
|
| 119 |
{"loss": 0.62486019, "grad_norm": 0.41565621, "learning_rate": 0.0, "token_acc": 0.80835402, "epoch": 2.99885101, "global_step/max_steps": "980/981", "percentage": "99.90%", "elapsed_time": "7h 3m 15s", "remaining_time": "25s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.03859}
|
| 120 |
+
{"eval_loss": 2.61317253, "eval_runtime": 125.0988, "eval_samples_per_second": 2.166, "eval_steps_per_second": 0.544, "eval_token_acc": 0.80227843, "epoch": 3.0, "global_step/max_steps": "981/981", "percentage": "100.00%", "elapsed_time": "7h 5m 29s", "remaining_time": "0s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038426}
|
| 121 |
+
{"train_runtime": 25532.9048, "train_samples_per_second": 0.614, "train_steps_per_second": 0.038, "total_flos": 4.6792415081308094e+19, "train_loss": 0.7036621, "epoch": 3.0, "global_step/max_steps": "981/981", "percentage": "100.00%", "elapsed_time": "7h 5m 30s", "remaining_time": "0s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038424}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:278bee85013f8274d517110bd821067a13f444a2ec814d76cddfdc0075c8d240
|
| 3 |
+
size 40899
|