Upload folder using huggingface_hub
Browse files
attention_kindselective_n_heads2_seed1339/log2.txt
CHANGED
|
@@ -4480,3 +4480,29 @@ max_steps: 50000
|
|
| 4480 |
49100 val loss 5.7549
|
| 4481 |
49100 val perplexity 315.7364
|
| 4482 |
49100 train 5.643294 (lr=7.0508e-06) (hash(x)=48329226)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4480 |
49100 val loss 5.7549
|
| 4481 |
49100 val perplexity 315.7364
|
| 4482 |
49100 train 5.643294 (lr=7.0508e-06) (hash(x)=48329226)
|
| 4483 |
+
49200 val loss 5.7553
|
| 4484 |
+
49200 val perplexity 315.8609
|
| 4485 |
+
49200 train 5.780897 (lr=7.0401e-06) (hash(x)=49512472)
|
| 4486 |
+
49300 val loss 5.7553
|
| 4487 |
+
49300 val perplexity 315.8710
|
| 4488 |
+
49300 train 5.606384 (lr=7.0307e-06) (hash(x)=46541146)
|
| 4489 |
+
49400 val loss 5.7563
|
| 4490 |
+
49400 val perplexity 316.1908
|
| 4491 |
+
49400 train 5.687852 (lr=7.0226e-06) (hash(x)=52192792)
|
| 4492 |
+
49500 val loss 5.7586
|
| 4493 |
+
49500 val perplexity 316.9135
|
| 4494 |
+
49500 train 5.561897 (lr=7.0157e-06) (hash(x)=48954331)
|
| 4495 |
+
49600 val loss 5.7536
|
| 4496 |
+
49600 val perplexity 315.3082
|
| 4497 |
+
49600 train 5.866088 (lr=7.0100e-06) (hash(x)=50364098)
|
| 4498 |
+
49700 val loss 5.7539
|
| 4499 |
+
49700 val perplexity 315.4100
|
| 4500 |
+
49700 train 5.713979 (lr=7.0056e-06) (hash(x)=52016774)
|
| 4501 |
+
49800 val loss 5.7559
|
| 4502 |
+
49800 val perplexity 316.0443
|
| 4503 |
+
49800 train 5.978700 (lr=7.0025e-06) (hash(x)=54182957)
|
| 4504 |
+
49900 val loss 5.7501
|
| 4505 |
+
49900 val perplexity 314.2275
|
| 4506 |
+
49900 train 5.508786 (lr=7.0006e-06) (hash(x)=48188126)
|
| 4507 |
+
49999 val loss 5.7783
|
| 4508 |
+
49999 val perplexity 323.2066
|
attention_kindselective_n_heads2_seed1339/model_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28834adaf88405f49f239fe11965b0ab5d4fdaf387f714bc91e626e39643a5ad
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1339/optimizer_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a024c3d983392ca7d36a7fb3e7d7cca1ab81e9a475835f3d548aefcf7182228
|
| 3 |
size 70895430
|