Training in progress, step 860
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:077442555dc983e04fa258132da8a8e7ef1c5182775997779cd41ffddbcfc5ba
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -100,3 +100,6 @@
|
|
| 100 |
{"loss": 0.64257121, "grad_norm": 0.39510468, "learning_rate": 7.2e-06, "token_acc": 0.80444136, "epoch": 2.50861739, "global_step/max_steps": "820/981", "percentage": "83.59%", "elapsed_time": "5h 54m 33s", "remaining_time": "1h 9m 36s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038546}
|
| 101 |
{"loss": 0.65501781, "grad_norm": 0.45020461, "learning_rate": 6.35e-06, "token_acc": 0.80161403, "epoch": 2.53925699, "global_step/max_steps": "830/981", "percentage": "84.61%", "elapsed_time": "5h 58m 25s", "remaining_time": "1h 5m 12s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038594}
|
| 102 |
{"loss": 0.6495801, "grad_norm": 0.49507573, "learning_rate": 5.55e-06, "token_acc": 0.80197075, "epoch": 2.56989659, "global_step/max_steps": "840/981", "percentage": "85.63%", "elapsed_time": "6h 2m 19s", "remaining_time": "1h 0m 49s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038639}
|
|
|
|
|
|
|
|
|
|
|
|
| 100 |
{"loss": 0.64257121, "grad_norm": 0.39510468, "learning_rate": 7.2e-06, "token_acc": 0.80444136, "epoch": 2.50861739, "global_step/max_steps": "820/981", "percentage": "83.59%", "elapsed_time": "5h 54m 33s", "remaining_time": "1h 9m 36s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038546}
|
| 101 |
{"loss": 0.65501781, "grad_norm": 0.45020461, "learning_rate": 6.35e-06, "token_acc": 0.80161403, "epoch": 2.53925699, "global_step/max_steps": "830/981", "percentage": "84.61%", "elapsed_time": "5h 58m 25s", "remaining_time": "1h 5m 12s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038594}
|
| 102 |
{"loss": 0.6495801, "grad_norm": 0.49507573, "learning_rate": 5.55e-06, "token_acc": 0.80197075, "epoch": 2.56989659, "global_step/max_steps": "840/981", "percentage": "85.63%", "elapsed_time": "6h 2m 19s", "remaining_time": "1h 0m 49s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038639}
|
| 103 |
+
{"loss": 0.64738607, "grad_norm": 0.43891406, "learning_rate": 4.81e-06, "token_acc": 0.80427136, "epoch": 2.60053619, "global_step/max_steps": "850/981", "percentage": "86.65%", "elapsed_time": "6h 6m 20s", "remaining_time": "56m 27s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038672}
|
| 104 |
+
{"eval_loss": 2.61586905, "eval_runtime": 124.3264, "eval_samples_per_second": 2.18, "eval_steps_per_second": 0.547, "eval_token_acc": 0.80201967, "epoch": 2.60053619, "global_step/max_steps": "850/981", "percentage": "86.65%", "elapsed_time": "6h 8m 24s", "remaining_time": "56m 46s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038454}
|
| 105 |
+
{"loss": 0.63968625, "grad_norm": 0.43007135, "learning_rate": 4.11e-06, "token_acc": 0.80489425, "epoch": 2.63117579, "global_step/max_steps": "860/981", "percentage": "87.67%", "elapsed_time": "6h 12m 18s", "remaining_time": "52m 23s", "memory(GiB)": 32.39, "train_speed(iter/s)": 0.038498}
|
runs/events.out.tfevents.1772968616.h016.gautschi.rcac.purdue.edu.2790912.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1ab5973304b9675fcd18122f122c10c70167c42589c276774dcd0ce6c168e7a
|
| 3 |
+
size 36393
|