Training in progress, step 640
Browse files
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 87368144
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9afba325f2fdf6cd233b7146fd13e39043353dd55999e427d4a850dd70c92c41
|
| 3 |
size 87368144
|
logging.jsonl
CHANGED
|
@@ -74,3 +74,5 @@
|
|
| 74 |
{"eval_loss": 2.44298482, "eval_runtime": 81.8948, "eval_samples_per_second": 2.235, "eval_steps_per_second": 0.562, "eval_token_acc": 0.81703102, "epoch": 2.38199453, "global_step/max_steps": "600/756", "percentage": "79.37%", "elapsed_time": "4h 7m 30s", "remaining_time": "1h 4m 21s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040402}
|
| 75 |
{"loss": 0.60592523, "grad_norm": 0.46010175, "learning_rate": 9.86e-06, "token_acc": 0.81451129, "epoch": 2.42178563, "global_step/max_steps": "610/756", "percentage": "80.69%", "elapsed_time": "4h 11m 20s", "remaining_time": "1h 0m 9s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.04045}
|
| 76 |
{"loss": 0.60055327, "grad_norm": 0.44221529, "learning_rate": 8.59e-06, "token_acc": 0.81496379, "epoch": 2.46157672, "global_step/max_steps": "620/756", "percentage": "82.01%", "elapsed_time": "4h 15m 3s", "remaining_time": "55m 56s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040513}
|
|
|
|
|
|
|
|
|
| 74 |
{"eval_loss": 2.44298482, "eval_runtime": 81.8948, "eval_samples_per_second": 2.235, "eval_steps_per_second": 0.562, "eval_token_acc": 0.81703102, "epoch": 2.38199453, "global_step/max_steps": "600/756", "percentage": "79.37%", "elapsed_time": "4h 7m 30s", "remaining_time": "1h 4m 21s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040402}
|
| 75 |
{"loss": 0.60592523, "grad_norm": 0.46010175, "learning_rate": 9.86e-06, "token_acc": 0.81451129, "epoch": 2.42178563, "global_step/max_steps": "610/756", "percentage": "80.69%", "elapsed_time": "4h 11m 20s", "remaining_time": "1h 0m 9s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.04045}
|
| 76 |
{"loss": 0.60055327, "grad_norm": 0.44221529, "learning_rate": 8.59e-06, "token_acc": 0.81496379, "epoch": 2.46157672, "global_step/max_steps": "620/756", "percentage": "82.01%", "elapsed_time": "4h 15m 3s", "remaining_time": "55m 56s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040513}
|
| 77 |
+
{"loss": 0.60854549, "grad_norm": 2.7957778, "learning_rate": 7.41e-06, "token_acc": 0.81355507, "epoch": 2.50136782, "global_step/max_steps": "630/756", "percentage": "83.33%", "elapsed_time": "4h 18m 49s", "remaining_time": "51m 45s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040569}
|
| 78 |
+
{"loss": 0.6125968, "grad_norm": 0.5052405, "learning_rate": 6.3e-06, "token_acc": 0.81358937, "epoch": 2.54115892, "global_step/max_steps": "640/756", "percentage": "84.66%", "elapsed_time": "4h 22m 32s", "remaining_time": "47m 35s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040629}
|
runs/events.out.tfevents.1770820661.h004.gautschi.rcac.purdue.edu.2476766.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02678cfcd6db6136246397f99257219991ecf9d1a6f4a5bca59213cd7dc75eae
|
| 3 |
+
size 28939
|