Training in progress, step 260
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ede92ab05a12937c79292c16d6155163485140110a9b39ffaf0693ae37d0172
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -28,3 +28,6 @@
|
|
| 28 |
{"loss": 0.72338204, "grad_norm": 0.33722463, "learning_rate": 9.2e-05, "token_acc": 0.78718055, "epoch": 0.67407124, "global_step/max_steps": "220/981", "percentage": "22.43%", "elapsed_time": "1h 36m 28s", "remaining_time": "5h 33m 44s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038004}
|
| 29 |
{"loss": 0.72606883, "grad_norm": 0.36189213, "learning_rate": 9.106e-05, "token_acc": 0.78815326, "epoch": 0.70471084, "global_step/max_steps": "230/981", "percentage": "23.45%", "elapsed_time": "1h 40m 18s", "remaining_time": "5h 27m 32s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038215}
|
| 30 |
{"loss": 0.71037607, "grad_norm": 0.36756998, "learning_rate": 9.007e-05, "token_acc": 0.78995104, "epoch": 0.73535044, "global_step/max_steps": "240/981", "percentage": "24.46%", "elapsed_time": "1h 44m 7s", "remaining_time": "5h 21m 27s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038418}
|
|
|
|
|
|
|
|
|
|
|
|
| 28 |
{"loss": 0.72338204, "grad_norm": 0.33722463, "learning_rate": 9.2e-05, "token_acc": 0.78718055, "epoch": 0.67407124, "global_step/max_steps": "220/981", "percentage": "22.43%", "elapsed_time": "1h 36m 28s", "remaining_time": "5h 33m 44s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038004}
|
| 29 |
{"loss": 0.72606883, "grad_norm": 0.36189213, "learning_rate": 9.106e-05, "token_acc": 0.78815326, "epoch": 0.70471084, "global_step/max_steps": "230/981", "percentage": "23.45%", "elapsed_time": "1h 40m 18s", "remaining_time": "5h 27m 32s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038215}
|
| 30 |
{"loss": 0.71037607, "grad_norm": 0.36756998, "learning_rate": 9.007e-05, "token_acc": 0.78995104, "epoch": 0.73535044, "global_step/max_steps": "240/981", "percentage": "24.46%", "elapsed_time": "1h 44m 7s", "remaining_time": "5h 21m 27s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038418}
|
| 31 |
+
{"loss": 0.72603316, "grad_norm": 0.36838499, "learning_rate": 8.904e-05, "token_acc": 0.78761645, "epoch": 0.76599004, "global_step/max_steps": "250/981", "percentage": "25.48%", "elapsed_time": "1h 47m 57s", "remaining_time": "5h 15m 38s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038598}
|
| 32 |
+
{"eval_loss": 2.7868228, "eval_runtime": 124.5897, "eval_samples_per_second": 2.175, "eval_steps_per_second": 0.546, "eval_token_acc": 0.79349843, "epoch": 0.76599004, "global_step/max_steps": "250/981", "percentage": "25.48%", "elapsed_time": "1h 50m 1s", "remaining_time": "5h 21m 43s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.037869}
|
| 33 |
+
{"loss": 0.72512798, "grad_norm": 0.38012171, "learning_rate": 8.796e-05, "token_acc": 0.78677306, "epoch": 0.79662964, "global_step/max_steps": "260/981", "percentage": "26.50%", "elapsed_time": "1h 53m 58s", "remaining_time": "5h 16m 3s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.03802}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:772a7bfb9ba731d52df64ab6c449c824508e669e6e9ae5b1df0d326971ff4185
|
| 3 |
+
size 16605
|