Upload folder using huggingface_hub
Browse files
attention_kindselective_n_heads4_seed1338/log2.txt
CHANGED
|
@@ -581,3 +581,26 @@ max_steps: 10000
|
|
| 581 |
9200 val loss 6.6710
|
| 582 |
9200 val perplexity 789.1569
|
| 583 |
9200 train 6.815366 (lr=1.7208e-05) (hash(x)=50794720)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 581 |
9200 val loss 6.6710
|
| 582 |
9200 val perplexity 789.1569
|
| 583 |
9200 train 6.815366 (lr=1.7208e-05) (hash(x)=50794720)
|
| 584 |
+
9300 val loss 6.6665
|
| 585 |
+
9300 val perplexity 785.6486
|
| 586 |
+
9300 train 6.457387 (lr=1.6692e-05) (hash(x)=46513190)
|
| 587 |
+
9400 val loss 6.6622
|
| 588 |
+
9400 val perplexity 782.2387
|
| 589 |
+
9400 train 6.348344 (lr=1.6245e-05) (hash(x)=43808238)
|
| 590 |
+
9500 val loss 6.6600
|
| 591 |
+
9500 val perplexity 780.5348
|
| 592 |
+
9500 train 6.504676 (lr=1.5865e-05) (hash(x)=45021888)
|
| 593 |
+
9600 val loss 6.6551
|
| 594 |
+
9600 val perplexity 776.7688
|
| 595 |
+
9600 train 6.715017 (lr=1.5554e-05) (hash(x)=56525570)
|
| 596 |
+
9700 val loss 6.6502
|
| 597 |
+
9700 val perplexity 772.9388
|
| 598 |
+
9700 train 6.868919 (lr=1.5312e-05) (hash(x)=52585913)
|
| 599 |
+
9800 val loss 6.6466
|
| 600 |
+
9800 val perplexity 770.1832
|
| 601 |
+
9800 train 6.803319 (lr=1.5139e-05) (hash(x)=52344698)
|
| 602 |
+
9900 val loss 6.6428
|
| 603 |
+
9900 val perplexity 767.2672
|
| 604 |
+
9900 train 6.650891 (lr=1.5035e-05) (hash(x)=51740945)
|
| 605 |
+
9999 val loss 6.6431
|
| 606 |
+
9999 val perplexity 767.4703
|
attention_kindselective_n_heads4_seed1338/model_09999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 92843394
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d143e8e20039c95e60070ef5bd8bf592ad4ef99043c36d92d9aa77182b6bdf1
|
| 3 |
size 92843394
|
attention_kindselective_n_heads4_seed1338/optimizer_09999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 179406214
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5451ba18371638184e54489586e3c35c8f24271a5db40eb7bb20595d0cf98441
|
| 3 |
size 179406214
|