minhnam committed on
Commit
120cdc9
·
verified ·
1 Parent(s): 4af804a

Training in progress, step 660

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9afba325f2fdf6cd233b7146fd13e39043353dd55999e427d4a850dd70c92c41
3
  size 87368144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d1c9ea17e321c879e34bb2d166007c5e8a0cac463e6dbfa1d9d8625e9aaccbd
3
  size 87368144
logging.jsonl CHANGED
@@ -76,3 +76,6 @@
76
  {"loss": 0.60055327, "grad_norm": 0.44221529, "learning_rate": 8.59e-06, "token_acc": 0.81496379, "epoch": 2.46157672, "global_step/max_steps": "620/756", "percentage": "82.01%", "elapsed_time": "4h 15m 3s", "remaining_time": "55m 56s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040513}
77
  {"loss": 0.60854549, "grad_norm": 2.7957778, "learning_rate": 7.41e-06, "token_acc": 0.81355507, "epoch": 2.50136782, "global_step/max_steps": "630/756", "percentage": "83.33%", "elapsed_time": "4h 18m 49s", "remaining_time": "51m 45s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040569}
78
  {"loss": 0.6125968, "grad_norm": 0.5052405, "learning_rate": 6.3e-06, "token_acc": 0.81358937, "epoch": 2.54115892, "global_step/max_steps": "640/756", "percentage": "84.66%", "elapsed_time": "4h 22m 32s", "remaining_time": "47m 35s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040629}
 
 
 
 
76
  {"loss": 0.60055327, "grad_norm": 0.44221529, "learning_rate": 8.59e-06, "token_acc": 0.81496379, "epoch": 2.46157672, "global_step/max_steps": "620/756", "percentage": "82.01%", "elapsed_time": "4h 15m 3s", "remaining_time": "55m 56s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040513}
77
  {"loss": 0.60854549, "grad_norm": 2.7957778, "learning_rate": 7.41e-06, "token_acc": 0.81355507, "epoch": 2.50136782, "global_step/max_steps": "630/756", "percentage": "83.33%", "elapsed_time": "4h 18m 49s", "remaining_time": "51m 45s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040569}
78
  {"loss": 0.6125968, "grad_norm": 0.5052405, "learning_rate": 6.3e-06, "token_acc": 0.81358937, "epoch": 2.54115892, "global_step/max_steps": "640/756", "percentage": "84.66%", "elapsed_time": "4h 22m 32s", "remaining_time": "47m 35s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040629}
79
+ {"loss": 0.61151357, "grad_norm": 0.43676135, "learning_rate": 5.28e-06, "token_acc": 0.81315275, "epoch": 2.58095001, "global_step/max_steps": "650/756", "percentage": "85.98%", "elapsed_time": "4h 26m 12s", "remaining_time": "43m 24s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040695}
80
+ {"eval_loss": 2.43642974, "eval_runtime": 81.9213, "eval_samples_per_second": 2.234, "eval_steps_per_second": 0.562, "eval_token_acc": 0.8173546, "epoch": 2.58095001, "global_step/max_steps": "650/756", "percentage": "85.98%", "elapsed_time": "4h 27m 34s", "remaining_time": "43m 38s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040487}
81
+ {"loss": 0.60613508, "grad_norm": 0.44147998, "learning_rate": 4.35e-06, "token_acc": 0.81491268, "epoch": 2.62074111, "global_step/max_steps": "660/756", "percentage": "87.30%", "elapsed_time": "4h 31m 20s", "remaining_time": "39m 28s", "memory(GiB)": 31.67, "train_speed(iter/s)": 0.040539}
runs/events.out.tfevents.1770820661.h004.gautschi.rcac.purdue.edu.2476766.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02678cfcd6db6136246397f99257219991ecf9d1a6f4a5bca59213cd7dc75eae
3
- size 28939
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ced3946a077e6cb8271670a71c699ae9a4d7a6fd213eeceac3c467dcfcfb57
3
+ size 29793