Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- attention_kindselective_n_heads2_seed1338/args.json +1 -1
- attention_kindselective_n_heads2_seed1338/dataloader_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_27500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_30000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_32500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_35000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_37500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_40000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_42500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_45000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_47500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/dataloader_49999.pt +3 -0
- attention_kindselective_n_heads2_seed1338/log2.txt +0 -0
- attention_kindselective_n_heads2_seed1338/model_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_27500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_30000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_32500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_35000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_37500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_40000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_42500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_45000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_47500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/model_49999.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1338/optimizer_27500.pt +3 -0
attention_kindselective_n_heads2_seed1338/args.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"hellaswag": true, "attention_kind": "selective", "log_dir": "
|
|
|
|
| 1 |
+
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 7e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "7e-5_10240_2_1338", "n_embd": 128}
|
attention_kindselective_n_heads2_seed1338/dataloader_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3858f6c832feea78a674d8c5c384061cc7d4f22cddbd0a2be6de33bc91e2c72
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3779d33c2e0a7873fcd8c39402e44260740665950323ad1445480ec339965a
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:450020c7c306c73e5c07c463518ab937102d657515ea5a38da6f2e7291f20324
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0696a655d7c8a9d7d275c7489f74a5a948ee029ac3941b045d6abaf12544a5b1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4eb226bdcee777fd1ca493533704dae226c077ef79c842fc9dc59a534d5381c1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88833bfd821adac4edd1dd0772083ae007c7b8d33041f66e53a679e1fa8993e0
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:554555a425bac43d626c36f1c81c2b0aba51eda3281dab27a9cb56b61f413354
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a52940b3b45414e6cdbec0dbaeba848f52d681c2daf78c269027057332d7fbd
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_30000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:775519ea26122cb70d533c496bcdbbc19f759f3d096e83e98cca1dc10275fe8e
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_32500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3422c8205fe45210246fed3dd6c317b75df02228cd8b75fba669574ce3b2d9
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_35000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:199ed3be67b88981f686112c97a2261729a37e0be3d4b0f4a289985a95d3cdf1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_37500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f77178b3be9dd3f8cd03c935236251f73fde6da7948ba9feda0c888fb8912dfe
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_40000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84f58ba3b4a1f9be7da4e697e06782f0e1ce4d3aca49f1997087fc83aa466dd9
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_42500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf6d24c78d89100d146bce9f26be940db3d71092473d9b55db97d6b35531eac2
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_45000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22bb90b43d81f3da5454f91a70e1ed29aeb2f470a727ce38390ff8a5c4924889
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_47500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55507725e6988f190e4963078652fafa6b68e8d4f79221387612612babf3e1c1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/dataloader_49999.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47776cddb8021172f048a950b83f25b692cb340214b800ce3837c15ceb58907c
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1338/log2.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
attention_kindselective_n_heads2_seed1338/model_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a54d1f2b670087ba176c7561a6cf2d8ec26b363bcc6c9707a21c9a5980179b6f
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f928a89bb8241803129e09214de466b0e25be48f89b7e2934f99d6d5749d67c
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:193c8827a7354eef33e70e2ceba9a981bdc28b041466300f379b40cff44dc5f2
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1d94a8368a19c2219bdff3ede1b15f35e4186b2ee041e02eeab9cfcbe2d47bc
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a70054d4344f6fa14b7d23b7d8cd915dbe453e71455454765a255640317d713
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdc755cb32eae94febfe4656f80338626101e8d7cc9946ce8ce2c3bf03de8ea8
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2355f2bfc63b002de74251d03a24a176aa53512f7eaf6c2641e5f33290d8e80f
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10a4d736bf77b416703a4797c1191ca35753f8493f5d4668711b9c95f183b3da
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c839040407e035acdd07369f6a7cacacdf771ee7182ba8d65658ed3500a4ba0
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:199ef7504e1bb9885ff6357018b4e74c7f0825a645526cfcb799d3d826826947
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a019be3e9ddc6d464dd7a14b1e6170af67015c64b2949663d79def4b69860b15
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_30000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:845e4abf4f3ce7be46e04f77330a53b3c4267e819ddbc02dde4963588f5df254
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_32500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:872c0cf97d562fef9c0eecef1ef811dca604f09bf2632f5c08075360f48425b6
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_35000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09f1131731afab9f36100fb3952537712567ab425d20a58900922e1915b4b8ca
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_37500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:83bd1e335e970a4ba1d9774c9192782c48865ff9b195b90ab4a04a8a5836506c
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_40000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31e467aae3098a92e7e473884dce191399b479efca63f963f5687f6a2b8d2fee
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_42500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0583628a4a6e9c9b032c427141c68cb9110d7d9d4011cf30fa9adbe6064f090b
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_45000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ad45144a3fb89602eff01bc07342d70cc8afb3ad6bc2a5e404be5777c109e494
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_47500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b293468bbf9bdf1ff4b1c1d9ccc3eb09e6d7b5bfbac4c2312351919feacb287
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_49999.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce9b65be8797af36d0449099a38afc632e8eea9f71b403705410b30e880b62ea
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1338/optimizer_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7092b3753d70721281439387dd8c0466cf32802e18f2c8e3ebb74e373ad9d54
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:777848a2f295ac1f4321dda85cf830242cd2621f9860c8db9ad5f9f9a02fbb67
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7a13322cf084a9889bde7b67a5341128f1bf6f74c17096982b119e271984a42
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ef371e7f771a14b9fa2724183416ca81d90cde94a9714987887efb51463c96b
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a99f478b8c7d4ba9df1dead510f69ced94b7074669697b8edcbd10632e530b6
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:868dae1e0f3077c15bc16ad0f8c175245e98ab505151c94f20694e0bca006442
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:956ac4f5e89edc78d304613e83ac3273cbb525614c2379275873d34db6c7a3e9
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:519c8914bf3b0de76b351423fa89e323b48bf7518149bbbc9e5d66c998c8ac23
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:803e0bf8dd7fcbaa44b1bd613dad95c2e96ff9712b4d7f9787f4352ab4ce5da3
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20b8749ff3895e79986c24589212dbacb2058a06bfb9596ad5cd21599b9062d6
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afd8a1b22bbba12a3c72efd70214ac15f5d304126134894d797fbed790ef6ef5
|
| 3 |
+
size 70895430
|