3N3G commited on
Commit
caef6f0
·
verified ·
1 Parent(s): f61e560

Training in progress, step 288

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee915e1b5fcd3e71f045efcc9cbc0312102624597c3d974e5f1950163bd6338e
3
  size 4969539560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ad5883a3cee7c47736b45f9790afc68bdd5c731da8985e21a6cb6b18802bee1
3
  size 4969539560
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a36fb710f6fea75a37049aac8d9eacc734dda5a62ef70bf161d89f8941be5c2
3
  size 1912795688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:652f38f7fb6d6d424d146395fc676655eef11c276b4cc3a9e7a2d7d530069500
3
  size 1912795688
trainer_log.jsonl CHANGED
@@ -781,3 +781,20 @@
781
  {"current_steps": 287, "total_steps": 400, "loss": 0.6352, "lr": 3.049124342432378e-08, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:34:54", "remaining_time": "0:13:44"}
782
  {"current_steps": 288, "total_steps": 400, "loss": 0.6391, "lr": 3.0162835660957385e-08, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:57", "remaining_time": "0:13:35"}
783
  {"current_steps": 288, "total_steps": 400, "eval_loss": 0.641921877861023, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:58", "remaining_time": "0:13:36"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
781
  {"current_steps": 287, "total_steps": 400, "loss": 0.6352, "lr": 3.049124342432378e-08, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:34:54", "remaining_time": "0:13:44"}
782
  {"current_steps": 288, "total_steps": 400, "loss": 0.6391, "lr": 3.0162835660957385e-08, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:57", "remaining_time": "0:13:35"}
783
  {"current_steps": 288, "total_steps": 400, "eval_loss": 0.641921877861023, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:58", "remaining_time": "0:13:36"}
784
+ {"current_steps": 289, "total_steps": 400, "loss": 0.6219, "lr": 2.983631934381639e-08, "epoch": 72.2909090909091, "percentage": 72.25, "elapsed_time": "0:35:28", "remaining_time": "0:13:37"}
785
+ {"current_steps": 290, "total_steps": 400, "loss": 0.6635, "lr": 2.9511719338382535e-08, "epoch": 72.58181818181818, "percentage": 72.5, "elapsed_time": "0:35:35", "remaining_time": "0:13:30"}
786
+ {"current_steps": 291, "total_steps": 400, "loss": 0.6377, "lr": 2.918906036420294e-08, "epoch": 72.87272727272727, "percentage": 72.75, "elapsed_time": "0:35:42", "remaining_time": "0:13:22"}
787
+ {"current_steps": 292, "total_steps": 400, "loss": 0.7822, "lr": 2.886836699300771e-08, "epoch": 73.0, "percentage": 73.0, "elapsed_time": "0:35:45", "remaining_time": "0:13:13"}
788
+ {"current_steps": 293, "total_steps": 400, "loss": 0.609, "lr": 2.8549663646838718e-08, "epoch": 73.2909090909091, "percentage": 73.25, "elapsed_time": "0:35:52", "remaining_time": "0:13:06"}
789
+ {"current_steps": 294, "total_steps": 400, "loss": 0.6728, "lr": 2.8232974596189653e-08, "epoch": 73.58181818181818, "percentage": 73.5, "elapsed_time": "0:35:59", "remaining_time": "0:12:58"}
790
+ {"current_steps": 295, "total_steps": 400, "loss": 0.7013, "lr": 2.791832395815782e-08, "epoch": 73.87272727272727, "percentage": 73.75, "elapsed_time": "0:36:06", "remaining_time": "0:12:51"}
791
+ {"current_steps": 296, "total_steps": 400, "loss": 0.6343, "lr": 2.760573569460757e-08, "epoch": 74.0, "percentage": 74.0, "elapsed_time": "0:36:09", "remaining_time": "0:12:42"}
792
+ {"current_steps": 297, "total_steps": 400, "loss": 0.6528, "lr": 2.729523361034538e-08, "epoch": 74.2909090909091, "percentage": 74.25, "elapsed_time": "0:36:16", "remaining_time": "0:12:34"}
793
+ {"current_steps": 298, "total_steps": 400, "loss": 0.6243, "lr": 2.6986841351307128e-08, "epoch": 74.58181818181818, "percentage": 74.5, "elapsed_time": "0:36:23", "remaining_time": "0:12:27"}
794
+ {"current_steps": 299, "total_steps": 400, "loss": 0.6658, "lr": 2.6680582402757322e-08, "epoch": 74.87272727272727, "percentage": 74.75, "elapsed_time": "0:36:30", "remaining_time": "0:12:20"}
795
+ {"current_steps": 300, "total_steps": 400, "loss": 0.7016, "lr": 2.637648008750062e-08, "epoch": 75.0, "percentage": 75.0, "elapsed_time": "0:36:33", "remaining_time": "0:12:11"}
796
+ {"current_steps": 301, "total_steps": 400, "loss": 0.6661, "lr": 2.6074557564105726e-08, "epoch": 75.2909090909091, "percentage": 75.25, "elapsed_time": "0:36:40", "remaining_time": "0:12:03"}
797
+ {"current_steps": 302, "total_steps": 400, "loss": 0.6277, "lr": 2.5774837825141737e-08, "epoch": 75.58181818181818, "percentage": 75.5, "elapsed_time": "0:36:48", "remaining_time": "0:11:56"}
798
+ {"current_steps": 303, "total_steps": 400, "loss": 0.6863, "lr": 2.547734369542718e-08, "epoch": 75.87272727272727, "percentage": 75.75, "elapsed_time": "0:36:54", "remaining_time": "0:11:49"}
799
+ {"current_steps": 304, "total_steps": 400, "loss": 0.648, "lr": 2.5182097830291825e-08, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"}
800
+ {"current_steps": 304, "total_steps": 400, "eval_loss": 0.6407743096351624, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"}