Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- attention_kindselective_n_heads2_seed1341/args.json +1 -1
- attention_kindselective_n_heads2_seed1341/dataloader_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_27500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_30000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_32500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_35000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_37500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_40000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_42500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_45000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_47500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/dataloader_49999.pt +3 -0
- attention_kindselective_n_heads2_seed1341/log2.txt +0 -0
- attention_kindselective_n_heads2_seed1341/model_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/model_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_27500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_30000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_32500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_35000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_37500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_40000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_42500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_45000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_47500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/model_49999.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1341/optimizer_10000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_12500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_15000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_17500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_20000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_22500.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_25000.pt +3 -0
- attention_kindselective_n_heads2_seed1341/optimizer_27500.pt +3 -0
attention_kindselective_n_heads2_seed1341/args.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"hellaswag": true, "attention_kind": "selective", "log_dir": "
|
|
|
|
| 1 |
+
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1341", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1341, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 0.0001, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "10e-5_10240_2_1341", "n_embd": 128}
|
attention_kindselective_n_heads2_seed1341/dataloader_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3858f6c832feea78a674d8c5c384061cc7d4f22cddbd0a2be6de33bc91e2c72
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3779d33c2e0a7873fcd8c39402e44260740665950323ad1445480ec339965a
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:450020c7c306c73e5c07c463518ab937102d657515ea5a38da6f2e7291f20324
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0696a655d7c8a9d7d275c7489f74a5a948ee029ac3941b045d6abaf12544a5b1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4eb226bdcee777fd1ca493533704dae226c077ef79c842fc9dc59a534d5381c1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88833bfd821adac4edd1dd0772083ae007c7b8d33041f66e53a679e1fa8993e0
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:554555a425bac43d626c36f1c81c2b0aba51eda3281dab27a9cb56b61f413354
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a52940b3b45414e6cdbec0dbaeba848f52d681c2daf78c269027057332d7fbd
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_30000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:775519ea26122cb70d533c496bcdbbc19f759f3d096e83e98cca1dc10275fe8e
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_32500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3422c8205fe45210246fed3dd6c317b75df02228cd8b75fba669574ce3b2d9
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_35000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:199ed3be67b88981f686112c97a2261729a37e0be3d4b0f4a289985a95d3cdf1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_37500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f77178b3be9dd3f8cd03c935236251f73fde6da7948ba9feda0c888fb8912dfe
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_40000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84f58ba3b4a1f9be7da4e697e06782f0e1ce4d3aca49f1997087fc83aa466dd9
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_42500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf6d24c78d89100d146bce9f26be940db3d71092473d9b55db97d6b35531eac2
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_45000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22bb90b43d81f3da5454f91a70e1ed29aeb2f470a727ce38390ff8a5c4924889
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_47500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55507725e6988f190e4963078652fafa6b68e8d4f79221387612612babf3e1c1
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/dataloader_49999.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47776cddb8021172f048a950b83f25b692cb340214b800ce3837c15ceb58907c
|
| 3 |
+
size 964
|
attention_kindselective_n_heads2_seed1341/log2.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
attention_kindselective_n_heads2_seed1341/model_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df2dbff4078c4b902e52c1b7e5066b645d7034b614be5e59574471f8960ecc8d
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b8b2db67768b1b7c4f36a2f59bdbf2ce5cdb8709c2f1a8aab106c8f26270d14
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:364f24f243b3307cbb71c22973ac7657870fb5d5ab6db86c6b6ce16187242859
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39597fb5f366edff6ba2340cd9532f6013379941b9f4fa74758f88d9c97ae137
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d31a60ee89698642b0ebc621b75f58a692275ef26044e594d7268780509fd84
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1af66647de9c5fc855d02d637ba618c8144799d5efe8ddc623aa3b3de6f726c
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e82ddeade8b883e1bec9ae78a0caacae82fc16e39d9c5e40a814ee4b400df35
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be0d57d46256da655ab0efb88dce7b9010af64ff833c4c08ae94bcb3b7138cc8
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e93ca9b8574d2d714f7cae55c176cb3e64cb31d5ab43da6c34b0b03b0cbead07
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:454c04312ec7cba780576b7269421be5981dbee4e8a4d91baec0e8013e07cc02
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8961199b8c739f6e36b00526c87a6b5246765f4d1c0dbe1093faede9f3344450
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_30000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:197046029793284598988dd04e5df15c623eaef6f155707df97b86154436a148
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_32500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96771b15cd62ac259acfeaa8c3bea3c6a0311b32a69fc5f4cbdf396812aaa6f2
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_35000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64439ba3a2d2759349369c61c46122f5f8d43d494d81def5c4c784414d39443e
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_37500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:974dfee447c5c353591f60ad35df9d68980e9c6f37f94c1beca686db8af86a80
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_40000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92e9a07a5d7a3a5bbe8777892da0e16dbe8d52cfe28c66d9263c00ba04a7a708
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_42500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff5074eedcb82cb39bd1c3cc5b79ff90173c0a1ed1cc59315acda50a131de0f9
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_45000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd0be6b5f6053bea40260d382a66627f2572e0d23f93145bd41b03959b43fffb
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_47500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f10489eeeefc32b2aec0615aaaedae12a844b5c9ea48c80427d8873fd45e4bb
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/model_49999.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa2f3cec42d9036e2f87260a9e0795ade9b256a480f4f1261f7cffdf84d202db
|
| 3 |
+
size 38587970
|
attention_kindselective_n_heads2_seed1341/optimizer_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08f1a057ee80dea9056a043af4613f7d138e6c121717d5b995f40421c2185b5c
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04707c9dc1a915ce8844444f88086b021a84ba76d2a51ff88b231c3a89315907
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8bde31ee1de5e0b28258329d8e1bfc745047816434565ddeb118534f3321b382
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_10000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e5e3a84f6d97d753668237ae05b7fa519625213870b1b982e72889351306dd8
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_12500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7c7772956f413b64e0b2580b4b54fa679916524a74e477187123032eff1ae02
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_15000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17b316437951257f7981be6620775537819e53492b0b26786967acf06aaba24f
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_17500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37b5c575b4a0eceaad61e429a71cacabbb2b7157606d6b02c3a150f792a4a780
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_20000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35fcaaa4f7c9226e4469c3c8c567557d0558d617c0ee65e7084bc28b23fcdb08
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_22500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01a74d2065d62b5f96d30821d64a6cb8d83df3adc4a127d9141f548214c01d10
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_25000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f69c4fa5bd5d85abce331c063b8f8661ea0716d83655b11b5c59e07943ea8a7a
|
| 3 |
+
size 70895430
|
attention_kindselective_n_heads2_seed1341/optimizer_27500.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b93749c7b464e5db7708c3a19920f5e874f533484b74a8caea9b3b2c5f1598b
|
| 3 |
+
size 70895430
|