andrew-healey commited on
Commit
9000217
·
verified ·
1 Parent(s): af87c93

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. attention_kindselective_n_heads2_seed1341/args.json +1 -1
  2. attention_kindselective_n_heads2_seed1341/dataloader_10000.pt +3 -0
  3. attention_kindselective_n_heads2_seed1341/dataloader_12500.pt +3 -0
  4. attention_kindselective_n_heads2_seed1341/dataloader_15000.pt +3 -0
  5. attention_kindselective_n_heads2_seed1341/dataloader_17500.pt +3 -0
  6. attention_kindselective_n_heads2_seed1341/dataloader_20000.pt +3 -0
  7. attention_kindselective_n_heads2_seed1341/dataloader_22500.pt +3 -0
  8. attention_kindselective_n_heads2_seed1341/dataloader_25000.pt +3 -0
  9. attention_kindselective_n_heads2_seed1341/dataloader_27500.pt +3 -0
  10. attention_kindselective_n_heads2_seed1341/dataloader_30000.pt +3 -0
  11. attention_kindselective_n_heads2_seed1341/dataloader_32500.pt +3 -0
  12. attention_kindselective_n_heads2_seed1341/dataloader_35000.pt +3 -0
  13. attention_kindselective_n_heads2_seed1341/dataloader_37500.pt +3 -0
  14. attention_kindselective_n_heads2_seed1341/dataloader_40000.pt +3 -0
  15. attention_kindselective_n_heads2_seed1341/dataloader_42500.pt +3 -0
  16. attention_kindselective_n_heads2_seed1341/dataloader_45000.pt +3 -0
  17. attention_kindselective_n_heads2_seed1341/dataloader_47500.pt +3 -0
  18. attention_kindselective_n_heads2_seed1341/dataloader_49999.pt +3 -0
  19. attention_kindselective_n_heads2_seed1341/log2.txt +0 -0
  20. attention_kindselective_n_heads2_seed1341/model_02500.pt +1 -1
  21. attention_kindselective_n_heads2_seed1341/model_05000.pt +1 -1
  22. attention_kindselective_n_heads2_seed1341/model_07500.pt +1 -1
  23. attention_kindselective_n_heads2_seed1341/model_10000.pt +3 -0
  24. attention_kindselective_n_heads2_seed1341/model_12500.pt +3 -0
  25. attention_kindselective_n_heads2_seed1341/model_15000.pt +3 -0
  26. attention_kindselective_n_heads2_seed1341/model_17500.pt +3 -0
  27. attention_kindselective_n_heads2_seed1341/model_20000.pt +3 -0
  28. attention_kindselective_n_heads2_seed1341/model_22500.pt +3 -0
  29. attention_kindselective_n_heads2_seed1341/model_25000.pt +3 -0
  30. attention_kindselective_n_heads2_seed1341/model_27500.pt +3 -0
  31. attention_kindselective_n_heads2_seed1341/model_30000.pt +3 -0
  32. attention_kindselective_n_heads2_seed1341/model_32500.pt +3 -0
  33. attention_kindselective_n_heads2_seed1341/model_35000.pt +3 -0
  34. attention_kindselective_n_heads2_seed1341/model_37500.pt +3 -0
  35. attention_kindselective_n_heads2_seed1341/model_40000.pt +3 -0
  36. attention_kindselective_n_heads2_seed1341/model_42500.pt +3 -0
  37. attention_kindselective_n_heads2_seed1341/model_45000.pt +3 -0
  38. attention_kindselective_n_heads2_seed1341/model_47500.pt +3 -0
  39. attention_kindselective_n_heads2_seed1341/model_49999.pt +3 -0
  40. attention_kindselective_n_heads2_seed1341/optimizer_02500.pt +1 -1
  41. attention_kindselective_n_heads2_seed1341/optimizer_05000.pt +1 -1
  42. attention_kindselective_n_heads2_seed1341/optimizer_07500.pt +1 -1
  43. attention_kindselective_n_heads2_seed1341/optimizer_10000.pt +3 -0
  44. attention_kindselective_n_heads2_seed1341/optimizer_12500.pt +3 -0
  45. attention_kindselective_n_heads2_seed1341/optimizer_15000.pt +3 -0
  46. attention_kindselective_n_heads2_seed1341/optimizer_17500.pt +3 -0
  47. attention_kindselective_n_heads2_seed1341/optimizer_20000.pt +3 -0
  48. attention_kindselective_n_heads2_seed1341/optimizer_22500.pt +3 -0
  49. attention_kindselective_n_heads2_seed1341/optimizer_25000.pt +3 -0
  50. attention_kindselective_n_heads2_seed1341/optimizer_27500.pt +3 -0
attention_kindselective_n_heads2_seed1341/args.json CHANGED
@@ -1 +1 @@
1
- {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_6/attention_kindselective_n_heads2_seed1341", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 10000, "warmup_steps": 200, "group": "wider_is_better_6", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1341, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 0.00015, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "15e-5_10240_2_1341", "n_embd": 128}
 
1
+ {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1341", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1341, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 0.0001, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "10e-5_10240_2_1341", "n_embd": 128}
attention_kindselective_n_heads2_seed1341/dataloader_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3858f6c832feea78a674d8c5c384061cc7d4f22cddbd0a2be6de33bc91e2c72
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3779d33c2e0a7873fcd8c39402e44260740665950323ad1445480ec339965a
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:450020c7c306c73e5c07c463518ab937102d657515ea5a38da6f2e7291f20324
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0696a655d7c8a9d7d275c7489f74a5a948ee029ac3941b045d6abaf12544a5b1
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eb226bdcee777fd1ca493533704dae226c077ef79c842fc9dc59a534d5381c1
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88833bfd821adac4edd1dd0772083ae007c7b8d33041f66e53a679e1fa8993e0
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:554555a425bac43d626c36f1c81c2b0aba51eda3281dab27a9cb56b61f413354
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a52940b3b45414e6cdbec0dbaeba848f52d681c2daf78c269027057332d7fbd
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_30000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775519ea26122cb70d533c496bcdbbc19f759f3d096e83e98cca1dc10275fe8e
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_32500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3422c8205fe45210246fed3dd6c317b75df02228cd8b75fba669574ce3b2d9
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_35000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199ed3be67b88981f686112c97a2261729a37e0be3d4b0f4a289985a95d3cdf1
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_37500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77178b3be9dd3f8cd03c935236251f73fde6da7948ba9feda0c888fb8912dfe
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_40000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f58ba3b4a1f9be7da4e697e06782f0e1ce4d3aca49f1997087fc83aa466dd9
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_42500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6d24c78d89100d146bce9f26be940db3d71092473d9b55db97d6b35531eac2
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_45000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22bb90b43d81f3da5454f91a70e1ed29aeb2f470a727ce38390ff8a5c4924889
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_47500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55507725e6988f190e4963078652fafa6b68e8d4f79221387612612babf3e1c1
3
+ size 964
attention_kindselective_n_heads2_seed1341/dataloader_49999.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47776cddb8021172f048a950b83f25b692cb340214b800ce3837c15ceb58907c
3
+ size 964
attention_kindselective_n_heads2_seed1341/log2.txt CHANGED
The diff for this file is too large to render. See raw diff
 
attention_kindselective_n_heads2_seed1341/model_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f81c5305e28766ffe17b41d892c4195cc93a4d18969824c3a0f91c8db6cf9c61
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df2dbff4078c4b902e52c1b7e5066b645d7034b614be5e59574471f8960ecc8d
3
  size 38587970
attention_kindselective_n_heads2_seed1341/model_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1981d296a42527ba71384319070268006aa51ed1ce3f34d492953367c7d791d
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b8b2db67768b1b7c4f36a2f59bdbf2ce5cdb8709c2f1a8aab106c8f26270d14
3
  size 38587970
attention_kindselective_n_heads2_seed1341/model_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a38e1ba00e798ca0b0a8d8e9524e6b25782fda42839c6c43fc8de932eaaa2f8
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:364f24f243b3307cbb71c22973ac7657870fb5d5ab6db86c6b6ce16187242859
3
  size 38587970
attention_kindselective_n_heads2_seed1341/model_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39597fb5f366edff6ba2340cd9532f6013379941b9f4fa74758f88d9c97ae137
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d31a60ee89698642b0ebc621b75f58a692275ef26044e594d7268780509fd84
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1af66647de9c5fc855d02d637ba618c8144799d5efe8ddc623aa3b3de6f726c
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e82ddeade8b883e1bec9ae78a0caacae82fc16e39d9c5e40a814ee4b400df35
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0d57d46256da655ab0efb88dce7b9010af64ff833c4c08ae94bcb3b7138cc8
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e93ca9b8574d2d714f7cae55c176cb3e64cb31d5ab43da6c34b0b03b0cbead07
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:454c04312ec7cba780576b7269421be5981dbee4e8a4d91baec0e8013e07cc02
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8961199b8c739f6e36b00526c87a6b5246765f4d1c0dbe1093faede9f3344450
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_30000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:197046029793284598988dd04e5df15c623eaef6f155707df97b86154436a148
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_32500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96771b15cd62ac259acfeaa8c3bea3c6a0311b32a69fc5f4cbdf396812aaa6f2
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_35000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64439ba3a2d2759349369c61c46122f5f8d43d494d81def5c4c784414d39443e
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_37500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974dfee447c5c353591f60ad35df9d68980e9c6f37f94c1beca686db8af86a80
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_40000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92e9a07a5d7a3a5bbe8777892da0e16dbe8d52cfe28c66d9263c00ba04a7a708
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_42500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff5074eedcb82cb39bd1c3cc5b79ff90173c0a1ed1cc59315acda50a131de0f9
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_45000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0be6b5f6053bea40260d382a66627f2572e0d23f93145bd41b03959b43fffb
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_47500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f10489eeeefc32b2aec0615aaaedae12a844b5c9ea48c80427d8873fd45e4bb
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/model_49999.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa2f3cec42d9036e2f87260a9e0795ade9b256a480f4f1261f7cffdf84d202db
3
+ size 38587970
attention_kindselective_n_heads2_seed1341/optimizer_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbe352394c98f7aeb470becf95bc3d2fadc1b26eaace9a300ecb094670cdc944
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08f1a057ee80dea9056a043af4613f7d138e6c121717d5b995f40421c2185b5c
3
  size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b8de7fcbdc412e17dba8f4280f46014e7504b0ac36b8318f82ce0046bc68161
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04707c9dc1a915ce8844444f88086b021a84ba76d2a51ff88b231c3a89315907
3
  size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d1fdfd4cbdb5969528ced4c2cc8e4fab4c83f4ad557140cab2cdaecb053a8fc
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bde31ee1de5e0b28258329d8e1bfc745047816434565ddeb118534f3321b382
3
  size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_10000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e5e3a84f6d97d753668237ae05b7fa519625213870b1b982e72889351306dd8
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_12500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7c7772956f413b64e0b2580b4b54fa679916524a74e477187123032eff1ae02
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_15000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b316437951257f7981be6620775537819e53492b0b26786967acf06aaba24f
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_17500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37b5c575b4a0eceaad61e429a71cacabbb2b7157606d6b02c3a150f792a4a780
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_20000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35fcaaa4f7c9226e4469c3c8c567557d0558d617c0ee65e7084bc28b23fcdb08
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_22500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01a74d2065d62b5f96d30821d64a6cb8d83df3adc4a127d9141f548214c01d10
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_25000.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f69c4fa5bd5d85abce331c063b8f8661ea0716d83655b11b5c59e07943ea8a7a
3
+ size 70895430
attention_kindselective_n_heads2_seed1341/optimizer_27500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b93749c7b464e5db7708c3a19920f5e874f533484b74a8caea9b3b2c5f1598b
3
+ size 70895430