andrew-healey commited on
Commit
81b103e
·
verified ·
1 Parent(s): 8fcc258

Upload folder using huggingface_hub

Browse files
attention_kindselective_n_heads4_seed1341/log2.txt CHANGED
@@ -520,3 +520,11 @@ max_steps: 8750
520
  8500 train 5.526323 (lr=5.1019e-06) (hash(x)=150696521)
521
  8749 val loss 5.6907
522
  8749 val perplexity 296.0869
 
 
 
 
 
 
 
 
 
520
  8500 train 5.526323 (lr=5.1019e-06) (hash(x)=150696521)
521
  8749 val loss 5.6907
522
  8749 val perplexity 296.0869
523
+ 8600 val loss 5.5609
524
+ 8600 val perplexity 260.0624
525
+ 8600 train 5.497671 (lr=5.0367e-06) (hash(x)=162288191)
526
+ 8700 val loss 5.5574
527
+ 8700 val perplexity 259.1537
528
+ 8700 train 5.420652 (lr=5.0041e-06) (hash(x)=152860941)
529
+ 8749 val loss 5.5552
530
+ 8749 val perplexity 258.5751
attention_kindselective_n_heads4_seed1341/model_08749.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60f9795517c86381d63141ace51ce5da55dbc8de0aa3e2ee26b0ffd6d3c88332
3
  size 92843394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed5116034684e6d34af195f28f93503512a3e0e90722614c503ae4a0ca29f948
3
  size 92843394
attention_kindselective_n_heads4_seed1341/optimizer_08749.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43538ac4619bfa4754892879de2c96b45a186312926324b7e0fa80cc11d61f8b
3
  size 179406214
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fdebfb5ed81da0c541b370e2f0bb47a27698b1c422cf7e238ab56a1bbea0dc7
3
  size 179406214