Upload folder using huggingface_hub
Browse files- attention_kindselective_n_heads2_seed1341/args.json +1 -1
- attention_kindselective_n_heads2_seed1341/log2.txt +0 -0
- attention_kindselective_n_heads2_seed1341/model_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_10000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_12500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_15000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_17500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_20000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_22500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_25000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_27500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_30000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_32500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_35000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_37500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_40000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_42500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_45000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_47500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_49999.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_10000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_12500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_15000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_17500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_20000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_22500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_25000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_27500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_30000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_32500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_35000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_37500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_40000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_42500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_45000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_47500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_49999.pt +1 -1
attention_kindselective_n_heads2_seed1341/args.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1341", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1341, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr":
|
|
|
|
| 1 |
+
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1341", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1341, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 2e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "2e-5_10240_2_1341", "n_embd": 128}
|
attention_kindselective_n_heads2_seed1341/log2.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
attention_kindselective_n_heads2_seed1341/model_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:833f0dde8b3370a73fd5b29b35b80002cad90f31fbf97cc1710b0bd0401b6685
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:074762a518e2a1487a766b7fc817a447a9ee81edbe341801d4a6460ce66a7aaa
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59220abe254d065a0d24d47d896e35917add45c8571c0571da01fb66adcabb66
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_10000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c424946a8efdf35d177e4984506885e8ee52e2c7d6c1a37f0df78f1d6a8abf1
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_12500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eff89b76af29c29ab0d995e3bc18627f498ffb01f6c569ff8fd8162fa4ec9cc9
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_15000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80b275e4a7e90dba140e6c4372782a868300c43d4c22d4580e63b69a94ac08e1
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_17500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b8dc39235bf200c5f89c581f25f04e201e7f92a9e76cb97e67eaad49c6ff1af
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_20000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4975746044eab1bd53156fd67913133a5d29bdcc520bedfd43c349dbf2435505
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_22500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7bcac540009d94c331614fba97e6fb2ecb04f4953a1480757f9c0eb4fb91964
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_25000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b43800b9512435dd54d17e42dffc502f81f8b8f138c1de9d527d13c8b8e7c5b
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_27500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca681dee37249e4a7d38b73b93e80aaac52f6ad63771716f1cb20831fb8aecee
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_30000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:053cd2d4760b64a8f094bae8f4dcce33a9a97c4f2ec10accf802216ec00dbeaa
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_32500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:712a4446453b8445f10ad7c95c14573b057908a15eff85c256fe79c2c4ff933f
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_35000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a0c746bee577af3897b04f0e0feae268267422d99322c91940de61a869ac311
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_37500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d5458b461b03a36592bede692ffd1abcadde566658e19a3080b16b8fb10828d
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_40000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14defa3011505c92fee1bfd380b16c11f1caf3ee6a32c8412d9b7e116d43209e
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_42500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29cf7a0d20b3ad23b735d44139ae267e9254f8ecf159fdd7b1a208b10dcd33c6
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_45000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:583bcc602b6afca749224a52ae97c3ef340e66b51cc8b379779c4a41ec88bdde
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_47500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5ca922531ddd1674a5e6903c244af3319ae050d94b5ba54ebfb915f60a3ef02
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6848d3d6078337cd89f5de01539674bf626f3240fa175997824dacaeddb89190
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/optimizer_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64edb05929ade05c9b5fb0a274f460bb2fcc67b40c1ca69bdda333e582a0f802
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e98e11cad9f76f15e60649def7b8d148c3a8481eb366f5154f1fb4d1a679b200
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a3fd8e1a1fbdf70c72d1eefb6aa15c441f7f7be6965d995ca4b2864a8c6fff29
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_10000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75c841b668f528c705a0e8e6fabe116e1d3447b8ff61bcf6bc48feab623106f0
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_12500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca923fd0cffa3202f35f1e574a075e72cdb55e765e60b9dac4c51d262ec669af
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_15000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba7cba919637418779686d6b9c24c92c3500a4fa90ec4a98e9e8f324e62d906b
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_17500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02c1b7ce0947bb76b9643926f4ad56bf796de44f84acee7a7a49ecb1cfd41083
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_20000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e06b22dafb137d6f832f57c6aaaa1949c54245764a75727666d8bdaaeccec05
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_22500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78090e99719df9bedccfee486ce0897aab7fb6ace4230eabfda898f8f9a11739
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_25000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff86d7c4cbba9fd189d9e7c0a12f0fe65e7f2513df246f1726b9a54983bdafde
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_27500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6769c51b3a0edbc7f268e411527539b85e86644f136b246995303496ffda2082
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_30000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2d823fe934478e36ccece7b685c1b79f60b619ff738643e96b8171e389725cc
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_32500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bebac8071e82274a9c48bca167a49f4478a8e9066532c1caf2791763d47564d
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_35000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8203ef7ec1536f7748d73b121f98415b2dd8528a4d1e8016129a3b7810a38f60
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_37500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2905fb2bb385ed1437c42a0cfbe933dedca97e10ed67d4f6d2b31dbfc855f7af
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_40000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea554486de5f354d233e4d176fb83516570378df60f90e4811ced1694c06d2c4
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_42500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1db1727d9b06ac09b929488f2eb6e477d783ae07a708fd2e0453f2696cd23c86
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_45000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6c2288c9836faed1e5b3133d4853b492b9dd99806495480151e843c74c44ceb
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_47500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:221ae25427ec4f4b69620f6a4985892865965cf1cbe20f6144fe1b9e35356a57
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4110d95714f962580d271d820c79438ce0eb0355b964b3a19c51653049d53f18
|
| 3 |
size 70895430
|