andrew-healey commited on
Commit
8b3486e
·
verified ·
1 Parent(s): 822b8d2

Upload folder using huggingface_hub

Browse files
Files changed (42) hide show
  1. attention_kindselective_n_heads2_seed1338/args.json +1 -1
  2. attention_kindselective_n_heads2_seed1338/log2.txt +0 -0
  3. attention_kindselective_n_heads2_seed1338/model_02500.pt +1 -1
  4. attention_kindselective_n_heads2_seed1338/model_05000.pt +1 -1
  5. attention_kindselective_n_heads2_seed1338/model_07500.pt +1 -1
  6. attention_kindselective_n_heads2_seed1338/model_10000.pt +1 -1
  7. attention_kindselective_n_heads2_seed1338/model_12500.pt +1 -1
  8. attention_kindselective_n_heads2_seed1338/model_15000.pt +1 -1
  9. attention_kindselective_n_heads2_seed1338/model_17500.pt +1 -1
  10. attention_kindselective_n_heads2_seed1338/model_20000.pt +1 -1
  11. attention_kindselective_n_heads2_seed1338/model_22500.pt +1 -1
  12. attention_kindselective_n_heads2_seed1338/model_25000.pt +1 -1
  13. attention_kindselective_n_heads2_seed1338/model_27500.pt +1 -1
  14. attention_kindselective_n_heads2_seed1338/model_30000.pt +1 -1
  15. attention_kindselective_n_heads2_seed1338/model_32500.pt +1 -1
  16. attention_kindselective_n_heads2_seed1338/model_35000.pt +1 -1
  17. attention_kindselective_n_heads2_seed1338/model_37500.pt +1 -1
  18. attention_kindselective_n_heads2_seed1338/model_40000.pt +1 -1
  19. attention_kindselective_n_heads2_seed1338/model_42500.pt +1 -1
  20. attention_kindselective_n_heads2_seed1338/model_45000.pt +1 -1
  21. attention_kindselective_n_heads2_seed1338/model_47500.pt +1 -1
  22. attention_kindselective_n_heads2_seed1338/model_49999.pt +1 -1
  23. attention_kindselective_n_heads2_seed1338/optimizer_02500.pt +1 -1
  24. attention_kindselective_n_heads2_seed1338/optimizer_05000.pt +1 -1
  25. attention_kindselective_n_heads2_seed1338/optimizer_07500.pt +1 -1
  26. attention_kindselective_n_heads2_seed1338/optimizer_10000.pt +1 -1
  27. attention_kindselective_n_heads2_seed1338/optimizer_12500.pt +1 -1
  28. attention_kindselective_n_heads2_seed1338/optimizer_15000.pt +1 -1
  29. attention_kindselective_n_heads2_seed1338/optimizer_17500.pt +1 -1
  30. attention_kindselective_n_heads2_seed1338/optimizer_20000.pt +1 -1
  31. attention_kindselective_n_heads2_seed1338/optimizer_22500.pt +1 -1
  32. attention_kindselective_n_heads2_seed1338/optimizer_25000.pt +1 -1
  33. attention_kindselective_n_heads2_seed1338/optimizer_27500.pt +1 -1
  34. attention_kindselective_n_heads2_seed1338/optimizer_30000.pt +1 -1
  35. attention_kindselective_n_heads2_seed1338/optimizer_32500.pt +1 -1
  36. attention_kindselective_n_heads2_seed1338/optimizer_35000.pt +1 -1
  37. attention_kindselective_n_heads2_seed1338/optimizer_37500.pt +1 -1
  38. attention_kindselective_n_heads2_seed1338/optimizer_40000.pt +1 -1
  39. attention_kindselective_n_heads2_seed1338/optimizer_42500.pt +1 -1
  40. attention_kindselective_n_heads2_seed1338/optimizer_45000.pt +1 -1
  41. attention_kindselective_n_heads2_seed1338/optimizer_47500.pt +1 -1
  42. attention_kindselective_n_heads2_seed1338/optimizer_49999.pt +1 -1
attention_kindselective_n_heads2_seed1338/args.json CHANGED
@@ -1 +1 @@
1
- {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 7e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "7e-5_10240_2_1338", "n_embd": 128}
 
1
+ {"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 2e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "2e-5_10240_2_1338", "n_embd": 128}
attention_kindselective_n_heads2_seed1338/log2.txt CHANGED
The diff for this file is too large to render. See raw diff
 
attention_kindselective_n_heads2_seed1338/model_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a54d1f2b670087ba176c7561a6cf2d8ec26b363bcc6c9707a21c9a5980179b6f
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba81592f720c8cdf511f7e95051064777a5d9a2000464b7a3810548f18a8aedf
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f928a89bb8241803129e09214de466b0e25be48f89b7e2934f99d6d5749d67c
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab493c79e6bd9391be19f95dacd36946aa11de520dfcde797fcb4694fa221f30
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:193c8827a7354eef33e70e2ceba9a981bdc28b041466300f379b40cff44dc5f2
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:455339e606ab8a27837f1f6e7b39afe34242ee9e19e5f6d860b750d8a5979bb5
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_10000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1d94a8368a19c2219bdff3ede1b15f35e4186b2ee041e02eeab9cfcbe2d47bc
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:991888317733e88ef96ff979ebedeb1552571da7914a490656ae6dca4b694224
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_12500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a70054d4344f6fa14b7d23b7d8cd915dbe453e71455454765a255640317d713
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87384aa440cd99899973b5fbc998d5d5cd78ca2dcc1f73ec0d60cac3064c03dc
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_15000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cdc755cb32eae94febfe4656f80338626101e8d7cc9946ce8ce2c3bf03de8ea8
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b04c59624f5472ca84bd617eb7789afe372646eae69d3bc731559608963fa345
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_17500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2355f2bfc63b002de74251d03a24a176aa53512f7eaf6c2641e5f33290d8e80f
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eb7b7edfc056043a505b02fab632917af0daee6816eaa45ca49c02f943dfc21
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_20000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10a4d736bf77b416703a4797c1191ca35753f8493f5d4668711b9c95f183b3da
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5eadfe32d369e9c1b4b6190c8b3d4fd7b3924014c1fc5009c40c90ebc06c869
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_22500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c839040407e035acdd07369f6a7cacacdf771ee7182ba8d65658ed3500a4ba0
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd555e174207081f722e3dff17e9abd83871a0364c4007b353da87a399a8a8fc
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_25000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:199ef7504e1bb9885ff6357018b4e74c7f0825a645526cfcb799d3d826826947
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ce591ea0a44a03c80feefa63907ffe295edfe8b048c11085ec6aace735ca76b
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_27500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a019be3e9ddc6d464dd7a14b1e6170af67015c64b2949663d79def4b69860b15
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e025675b25f7b7886c3f513797e02220f1d053083ecb82c612088711621ec77e
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_30000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845e4abf4f3ce7be46e04f77330a53b3c4267e819ddbc02dde4963588f5df254
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:506a9d9cc49a39da3b0f3c599da8a41a3f7336dbea392b0e72b40101793a09f8
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_32500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:872c0cf97d562fef9c0eecef1ef811dca604f09bf2632f5c08075360f48425b6
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b503f92589caf34cf6bf2f3f10818a5af3bf90a271de835d5e0825d2f69de2c0
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_35000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09f1131731afab9f36100fb3952537712567ab425d20a58900922e1915b4b8ca
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1934c8b164344c01783be64fedd7d53c61893de29b75bd4a0a334acf861a8705
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_37500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83bd1e335e970a4ba1d9774c9192782c48865ff9b195b90ab4a04a8a5836506c
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fba5936653ffe416873107a2687b655cd3aa19fbd167ea1bdc4c532782f2ba8
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_40000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31e467aae3098a92e7e473884dce191399b479efca63f963f5687f6a2b8d2fee
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b876f14fe381dfec1a859b3625c7b4921dbeb197ae6b1d460d8eabe8ec633e22
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_42500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0583628a4a6e9c9b032c427141c68cb9110d7d9d4011cf30fa9adbe6064f090b
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b03d58343fdbb4d097a768dfb8b5beebcc2bb6b3bc4610937a499b75dd1a69
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_45000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad45144a3fb89602eff01bc07342d70cc8afb3ad6bc2a5e404be5777c109e494
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:724c37786fa79101ba2b7deb69218ce6dda25cf10469c8e4a73e6434fa028321
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_47500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c61c7e55bc6fdc5a2b29941a2b66a41aec21ae86bcf0b7f65e27fce807d6198d
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d28c09c8caf71660facb1ed648383efdec514772ce8110342d07a0108f9eac79
3
  size 38587970
attention_kindselective_n_heads2_seed1338/model_49999.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33163b2f060c6c5f5a1cd71a9bcd5d1e2acf53e0674e95c52e8495d8ecf19f49
3
  size 38587970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45716e0689f1d330664c58644e5a4ee67606186e77baca68480204e8c3ffee83
3
  size 38587970
attention_kindselective_n_heads2_seed1338/optimizer_02500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7092b3753d70721281439387dd8c0466cf32802e18f2c8e3ebb74e373ad9d54
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06ee8c4316c3affc9ec3852b48d946d4a6413aec0ae74de4bc1c8003ce86fee2
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_05000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:777848a2f295ac1f4321dda85cf830242cd2621f9860c8db9ad5f9f9a02fbb67
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bbb5e2786de47ac2cb908d948a2c72c9b1e74cec6408ad1dbacb2c2f4fbc7f4
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_07500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7a13322cf084a9889bde7b67a5341128f1bf6f74c17096982b119e271984a42
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dd1aeccf6084a2f725ac7e4f95573e953d82c48a967560cdd0485d9dc9754e2
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_10000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ef371e7f771a14b9fa2724183416ca81d90cde94a9714987887efb51463c96b
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab93f477e7482043279b1b317f32d2eceab9cc97ca0ac104439a2a24f09bdef5
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_12500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a99f478b8c7d4ba9df1dead510f69ced94b7074669697b8edcbd10632e530b6
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315c8369f7577cb9629620ff0f4b37b13ba367524ceb2da9e1e055a7e00dd16e
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_15000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:868dae1e0f3077c15bc16ad0f8c175245e98ab505151c94f20694e0bca006442
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0feb69a3f0cf2be11702503658063e43dcd15d9f4a42f09feb49669457aa3db4
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_17500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:956ac4f5e89edc78d304613e83ac3273cbb525614c2379275873d34db6c7a3e9
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afb719d13bcb4274e19bf23ca852357a8883cd993425618cf23b1f8e85fa35bb
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_20000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:519c8914bf3b0de76b351423fa89e323b48bf7518149bbbc9e5d66c998c8ac23
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a2183cc97063a30273e5b4a95476ab256374beb9ff5df6f12f76167a0c9c4c8
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_22500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:803e0bf8dd7fcbaa44b1bd613dad95c2e96ff9712b4d7f9787f4352ab4ce5da3
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7c41bffb6b0a638833e5581d15ecbd2d81fdd43d3c6acfad2be41dd706112d
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_25000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20b8749ff3895e79986c24589212dbacb2058a06bfb9596ad5cd21599b9062d6
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e9b4a0a411cfe91007d8a9f695b7bfde4d4553612acc91ed10d4b0f83e964c2
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_27500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afd8a1b22bbba12a3c72efd70214ac15f5d304126134894d797fbed790ef6ef5
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:901d4bb59b1a3e12e098d6cb9284e9796fd7c77a87e7b2fcb0e8f3acd3003de5
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_30000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16f2dec0aac9f1da12e2f06988a2be697955594ae225250f2a203de88498201a
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5045966e27883b3856358d6fe44d7e4d292db1de7f6fd1d1d85b5980d4e09f71
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_32500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93426294ec5f595bdb39a5517a2d0f740fe8993a4d81b04290c2da208f650b55
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be5164a0ca8e59991b91c97cafd2b5fce3c3e4086a14fa28af3cb7386303e3ac
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_35000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e33c6faf2dcd2e2ec56ca1999a1be79b262979e57419fc53ec3e32916d57678b
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19878151975707f4e5960866e894cdd18cca1f074bdd6a976c886cd08bc5afb3
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_37500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ee5c0c3bdf5d64ebf3f0c7f1614361f69b9acb1a7938d41ed8eb3c0c86618ce
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f443345f55c6f7249fddf5afe8525d75793b95c72d6891e973fc24da2a06c13
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_40000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:038da380a90d0f3a3ff1f8a8cc805cfa0790e4014a458c7138d8dd6a2b50e5fa
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87dc545057f2139ddebead539bbadf3ca7ec33d8e5790dcdd7a1eb320f327e92
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_42500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd996b57c32f76d090a9779436b1904f1829f2772b25933692896324d69cf9bc
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5feb1a5b43c04c6c94fb77e185ef931df90f300374df01f1bed8e30e1f1985f5
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_45000.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4254e56f80cb905e03718cbefc34fe7a5e8094876ee7e8c57d07edc92b5a629
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65a3cb252d7dda8183ec5327ba4e6c6bdbaa5611077eaa504664d42f77f1c479
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_47500.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:336781bbe92c707410ef574515b5a29bed7ef2b59eae47fac04a5d57c5a08b0d
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a2ad3e25c84854f1f6a561978f5a2d263eefa7451fc2969567a96062406cc13
3
  size 70895430
attention_kindselective_n_heads2_seed1338/optimizer_49999.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f919e489d0aee4db2867bde0664bdf90b8304dc8b004630eb73a6f44d69afdf
3
  size 70895430
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f45761dca825b9857fb8377f687290b259ef10f2d077bcbc40fed60077879087
3
  size 70895430