andrew-healey commited on
Commit
da48975
·
verified ·
1 Parent(s): 5fd7dbe

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. attention_kindselective_n_heads2_seed1338/args.json +1 -1
  2. attention_kindselective_n_heads2_seed1338/dataloader_10000.pt +3 -0
  3. attention_kindselective_n_heads2_seed1338/dataloader_12500.pt +3 -0
  4. attention_kindselective_n_heads2_seed1338/dataloader_15000.pt +3 -0
  5. attention_kindselective_n_heads2_seed1338/dataloader_17500.pt +3 -0
  6. attention_kindselective_n_heads2_seed1338/dataloader_20000.pt +3 -0
  7. attention_kindselective_n_heads2_seed1338/dataloader_22500.pt +3 -0
  8. attention_kindselective_n_heads2_seed1338/dataloader_25000.pt +3 -0
  9. attention_kindselective_n_heads2_seed1338/dataloader_27500.pt +3 -0
  10. attention_kindselective_n_heads2_seed1338/dataloader_30000.pt +3 -0
  11. attention_kindselective_n_heads2_seed1338/dataloader_32500.pt +3 -0
  12. attention_kindselective_n_heads2_seed1338/dataloader_35000.pt +3 -0
  13. attention_kindselective_n_heads2_seed1338/dataloader_37500.pt +3 -0
  14. attention_kindselective_n_heads2_seed1338/dataloader_40000.pt +3 -0
  15. attention_kindselective_n_heads2_seed1338/dataloader_42500.pt +3 -0
  16. attention_kindselective_n_heads2_seed1338/dataloader_45000.pt +3 -0
  17. attention_kindselective_n_heads2_seed1338/dataloader_47500.pt +3 -0
  18. attention_kindselective_n_heads2_seed1338/dataloader_49999.pt +3 -0
  19. attention_kindselective_n_heads2_seed1338/log2.txt +0 -0
  20. attention_kindselective_n_heads2_seed1338/model_02500.pt +1 -1
  21. attention_kindselective_n_heads2_seed1338/model_05000.pt +1 -1
  22. attention_kindselective_n_heads2_seed1338/model_07500.pt +1 -1
  23. attention_kindselective_n_heads2_seed1338/model_10000.pt +3 -0
  24. attention_kindselective_n_heads2_seed1338/model_12500.pt +3 -0
  25. attention_kindselective_n_heads2_seed1338/model_15000.pt +3 -0
  26. attention_kindselective_n_heads2_seed1338/model_17500.pt +3 -0
  27. attention_kindselective_n_heads2_seed1338/model_20000.pt +3 -0
  28. attention_kindselective_n_heads2_seed1338/model_22500.pt +3 -0
  29. attention_kindselective_n_heads2_seed1338/model_25000.pt +3 -0
  30. attention_kindselective_n_heads2_seed1338/model_27500.pt +3 -0
  31. attention_kindselective_n_heads2_seed1338/model_30000.pt +3 -0
  32. attention_kindselective_n_heads2_seed1338/model_32500.pt +3 -0
  33. attention_kindselective_n_heads2_seed1338/model_35000.pt +3 -0
  34. attention_kindselective_n_heads2_seed1338/model_37500.pt +3 -0
  35. attention_kindselective_n_heads2_seed1338/model_40000.pt +3 -0
  36. attention_kindselective_n_heads2_seed1338/model_42500.pt +3 -0
  37. attention_kindselective_n_heads2_seed1338/model_45000.pt +3 -0
  38. attention_kindselective_n_heads2_seed1338/model_47500.pt +3 -0
  39. attention_kindselective_n_heads2_seed1338/model_49999.pt +3 -0
  40. attention_kindselective_n_heads2_seed1338/optimizer_02500.pt +1 -1
  41. attention_kindselective_n_heads2_seed1338/optimizer_05000.pt +1 -1
  42. attention_kindselective_n_heads2_seed1338/optimizer_07500.pt +1 -1
  43. attention_kindselective_n_heads2_seed1338/optimizer_10000.pt +3 -0
  44. attention_kindselective_n_heads2_seed1338/optimizer_12500.pt +3 -0
  45. attention_kindselective_n_heads2_seed1338/optimizer_15000.pt +3 -0
  46. attention_kindselective_n_heads2_seed1338/optimizer_17500.pt +3 -0
  47. attention_kindselective_n_heads2_seed1338/optimizer_20000.pt +3 -0
  48. attention_kindselective_n_heads2_seed1338/optimizer_22500.pt +3 -0
  49. attention_kindselective_n_heads2_seed1338/optimizer_25000.pt +3 -0
  50. attention_kindselective_n_heads2_seed1338/optimizer_27500.pt +3 -0
attention_kindselective_n_heads2_seed1338/args.json CHANGED
@@ -1 +1 @@
1
- {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_6/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 10000, "warmup_steps": 200, "group": "wider_is_better_6", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 0.0001, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "10e-5_10240_2_1338", "n_embd": 128}
 
1
+ {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 7e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "7e-5_10240_2_1338", "n_embd": 128}
attention_kindselective_n_heads2_seed1338/dataloader_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3858f6c832feea78a674d8c5c384061cc7d4f22cddbd0a2be6de33bc91e2c72
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3779d33c2e0a7873fcd8c39402e44260740665950323ad1445480ec339965a
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:450020c7c306c73e5c07c463518ab937102d657515ea5a38da6f2e7291f20324
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0696a655d7c8a9d7d275c7489f74a5a948ee029ac3941b045d6abaf12544a5b1
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eb226bdcee777fd1ca493533704dae226c077ef79c842fc9dc59a534d5381c1
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88833bfd821adac4edd1dd0772083ae007c7b8d33041f66e53a679e1fa8993e0
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:554555a425bac43d626c36f1c81c2b0aba51eda3281dab27a9cb56b61f413354
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a52940b3b45414e6cdbec0dbaeba848f52d681c2daf78c269027057332d7fbd
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_30000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775519ea26122cb70d533c496bcdbbc19f759f3d096e83e98cca1dc10275fe8e
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_32500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3422c8205fe45210246fed3dd6c317b75df02228cd8b75fba669574ce3b2d9
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_35000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199ed3be67b88981f686112c97a2261729a37e0be3d4b0f4a289985a95d3cdf1
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_37500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77178b3be9dd3f8cd03c935236251f73fde6da7948ba9feda0c888fb8912dfe
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_40000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f58ba3b4a1f9be7da4e697e06782f0e1ce4d3aca49f1997087fc83aa466dd9
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_42500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6d24c78d89100d146bce9f26be940db3d71092473d9b55db97d6b35531eac2
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_45000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22bb90b43d81f3da5454f91a70e1ed29aeb2f470a727ce38390ff8a5c4924889
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_47500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55507725e6988f190e4963078652fafa6b68e8d4f79221387612612babf3e1c1
3
+ size 964
attention_kindselective_n_heads2_seed1338/dataloader_49999.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47776cddb8021172f048a950b83f25b692cb340214b800ce3837c15ceb58907c
3
+ size 964
attention_kindselective_n_heads2_seed1338/log2.txt CHANGED
The diff for this file is too large to render. See raw diff
 
attention_kindselective_n_heads2_seed1338/model_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9157bcc1377e68b286966c0a0341a5e69ef9fc2e367bcc48aba49860b5ba4d4
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a54d1f2b670087ba176c7561a6cf2d8ec26b363bcc6c9707a21c9a5980179b6f
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f41aca9adf817c5b42c183649b46a97fcd1baba88fea3644adb57163bd39ec2
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f928a89bb8241803129e09214de466b0e25be48f89b7e2934f99d6d5749d67c
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f15805825428b7a60e7c78f2ff49c625a1b71822b49facc1d5e458f2e62df939
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:193c8827a7354eef33e70e2ceba9a981bdc28b041466300f379b40cff44dc5f2
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1d94a8368a19c2219bdff3ede1b15f35e4186b2ee041e02eeab9cfcbe2d47bc
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a70054d4344f6fa14b7d23b7d8cd915dbe453e71455454765a255640317d713
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc755cb32eae94febfe4656f80338626101e8d7cc9946ce8ce2c3bf03de8ea8
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2355f2bfc63b002de74251d03a24a176aa53512f7eaf6c2641e5f33290d8e80f
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10a4d736bf77b416703a4797c1191ca35753f8493f5d4668711b9c95f183b3da
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c839040407e035acdd07369f6a7cacacdf771ee7182ba8d65658ed3500a4ba0
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199ef7504e1bb9885ff6357018b4e74c7f0825a645526cfcb799d3d826826947
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a019be3e9ddc6d464dd7a14b1e6170af67015c64b2949663d79def4b69860b15
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_30000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:845e4abf4f3ce7be46e04f77330a53b3c4267e819ddbc02dde4963588f5df254
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_32500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:872c0cf97d562fef9c0eecef1ef811dca604f09bf2632f5c08075360f48425b6
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_35000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09f1131731afab9f36100fb3952537712567ab425d20a58900922e1915b4b8ca
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_37500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83bd1e335e970a4ba1d9774c9192782c48865ff9b195b90ab4a04a8a5836506c
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_40000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31e467aae3098a92e7e473884dce191399b479efca63f963f5687f6a2b8d2fee
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_42500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0583628a4a6e9c9b032c427141c68cb9110d7d9d4011cf30fa9adbe6064f090b
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_45000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad45144a3fb89602eff01bc07342d70cc8afb3ad6bc2a5e404be5777c109e494
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_47500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b293468bbf9bdf1ff4b1c1d9ccc3eb09e6d7b5bfbac4c2312351919feacb287
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/model_49999.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce9b65be8797af36d0449099a38afc632e8eea9f71b403705410b30e880b62ea
3
+ size 38587970
attention_kindselective_n_heads2_seed1338/optimizer_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47848b329fdc5de70e6f1d2c743be1b06f2fc0459c1128539106cc34eb7bd6cb
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7092b3753d70721281439387dd8c0466cf32802e18f2c8e3ebb74e373ad9d54
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23d2ca9117d48314c932bb7aa5c430b045f768930d81a6a6a25c137857f81aad
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:777848a2f295ac1f4321dda85cf830242cd2621f9860c8db9ad5f9f9a02fbb67
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8615fd9af3900fecade21ff7a416b6897eb44dab958718ebeb0d5baae84031b
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7a13322cf084a9889bde7b67a5341128f1bf6f74c17096982b119e271984a42
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef371e7f771a14b9fa2724183416ca81d90cde94a9714987887efb51463c96b
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a99f478b8c7d4ba9df1dead510f69ced94b7074669697b8edcbd10632e530b6
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:868dae1e0f3077c15bc16ad0f8c175245e98ab505151c94f20694e0bca006442
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956ac4f5e89edc78d304613e83ac3273cbb525614c2379275873d34db6c7a3e9
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:519c8914bf3b0de76b351423fa89e323b48bf7518149bbbc9e5d66c998c8ac23
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:803e0bf8dd7fcbaa44b1bd613dad95c2e96ff9712b4d7f9787f4352ab4ce5da3
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20b8749ff3895e79986c24589212dbacb2058a06bfb9596ad5cd21599b9062d6
3
+ size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd8a1b22bbba12a3c72efd70214ac15f5d304126134894d797fbed790ef6ef5
3
+ size 70895430