Upload folder using huggingface_hub
Browse files- attention_kindselective_n_heads2_seed1338/args.json +1 -1
- attention_kindselective_n_heads2_seed1338/log2.txt +0 -0
- attention_kindselective_n_heads2_seed1338/model_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_10000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_12500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_15000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_17500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_20000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_22500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_25000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_27500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_30000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_32500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_35000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_37500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_40000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_42500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_45000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_47500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/model_49999.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_02500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_05000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_07500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_10000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_12500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_15000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_17500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_20000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_22500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_25000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_27500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_30000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_32500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_35000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_37500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_40000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_42500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_45000.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_47500.pt +1 -1
- attention_kindselective_n_heads2_seed1338/optimizer_49999.pt +1 -1
attention_kindselective_n_heads2_seed1338/args.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr":
|
|
|
|
| 1 |
+
{"hellaswag": true, "attention_kind": "selective", "log_dir": "wider_is_better_7/attention_kindselective_n_heads2_seed1338", "resume_checkpoint": null, "resume_optimizer": false, "add_a_head": false, "add_head_to_start": true, "new_head_init": "normal", "n_heads": 2, "protect_bos_token": true, "prevent_from_masking_myself": true, "max_steps": 50000, "warmup_steps": 200, "group": "wider_is_better_7", "use_wandb": true, "kill_self_after_run": false, "random_seed": 1338, "memory_penalty_epsilon": 0.1, "selection_head_linear_combo": "none", "selection_head_linear_combo_scale": 1.0, "protection_kind": "none", "leaky_relu_alpha": null, "leaky_relu_bias": null, "use_compile": true, "use_mini_model": false, "upload_to_hf": true, "seq_len": 256, "batch_size": 40, "total_batch_size": 10240, "protection_head_scaling_factor": 1.0, "protection_head_bias": 0.0, "n_sliced_masks": null, "n_latent_masks": null, "mask_layernorm": false, "residual_attention_masks": false, "compute_base_shapes": false, "base_shapes_savefile": null, "mup": true, "disable_selection": false, "mup_enable_coord_check_logging": false, "max_lr": 2e-05, "decay_lr": true, "readout_zero_init": false, "query_zero_init": false, "l1_loss": false, "debugpy": false, "key": "2e-5_10240_2_1338", "n_embd": 128}
|
attention_kindselective_n_heads2_seed1338/log2.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
attention_kindselective_n_heads2_seed1338/model_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba81592f720c8cdf511f7e95051064777a5d9a2000464b7a3810548f18a8aedf
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab493c79e6bd9391be19f95dacd36946aa11de520dfcde797fcb4694fa221f30
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:455339e606ab8a27837f1f6e7b39afe34242ee9e19e5f6d860b750d8a5979bb5
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_10000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:991888317733e88ef96ff979ebedeb1552571da7914a490656ae6dca4b694224
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_12500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87384aa440cd99899973b5fbc998d5d5cd78ca2dcc1f73ec0d60cac3064c03dc
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_15000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b04c59624f5472ca84bd617eb7789afe372646eae69d3bc731559608963fa345
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_17500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2eb7b7edfc056043a505b02fab632917af0daee6816eaa45ca49c02f943dfc21
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_20000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5eadfe32d369e9c1b4b6190c8b3d4fd7b3924014c1fc5009c40c90ebc06c869
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_22500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd555e174207081f722e3dff17e9abd83871a0364c4007b353da87a399a8a8fc
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_25000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ce591ea0a44a03c80feefa63907ffe295edfe8b048c11085ec6aace735ca76b
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_27500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e025675b25f7b7886c3f513797e02220f1d053083ecb82c612088711621ec77e
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_30000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:506a9d9cc49a39da3b0f3c599da8a41a3f7336dbea392b0e72b40101793a09f8
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_32500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b503f92589caf34cf6bf2f3f10818a5af3bf90a271de835d5e0825d2f69de2c0
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_35000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1934c8b164344c01783be64fedd7d53c61893de29b75bd4a0a334acf861a8705
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_37500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fba5936653ffe416873107a2687b655cd3aa19fbd167ea1bdc4c532782f2ba8
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_40000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b876f14fe381dfec1a859b3625c7b4921dbeb197ae6b1d460d8eabe8ec633e22
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_42500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64b03d58343fdbb4d097a768dfb8b5beebcc2bb6b3bc4610937a499b75dd1a69
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_45000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:724c37786fa79101ba2b7deb69218ce6dda25cf10469c8e4a73e6434fa028321
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_47500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d28c09c8caf71660facb1ed648383efdec514772ce8110342d07a0108f9eac79
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/model_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 38587970
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45716e0689f1d330664c58644e5a4ee67606186e77baca68480204e8c3ffee83
|
| 3 |
size 38587970
|
attention_kindselective_n_heads2_seed1338/optimizer_02500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06ee8c4316c3affc9ec3852b48d946d4a6413aec0ae74de4bc1c8003ce86fee2
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_05000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bbb5e2786de47ac2cb908d948a2c72c9b1e74cec6408ad1dbacb2c2f4fbc7f4
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_07500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2dd1aeccf6084a2f725ac7e4f95573e953d82c48a967560cdd0485d9dc9754e2
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_10000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab93f477e7482043279b1b317f32d2eceab9cc97ca0ac104439a2a24f09bdef5
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_12500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:315c8369f7577cb9629620ff0f4b37b13ba367524ceb2da9e1e055a7e00dd16e
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_15000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0feb69a3f0cf2be11702503658063e43dcd15d9f4a42f09feb49669457aa3db4
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_17500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afb719d13bcb4274e19bf23ca852357a8883cd993425618cf23b1f8e85fa35bb
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_20000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a2183cc97063a30273e5b4a95476ab256374beb9ff5df6f12f76167a0c9c4c8
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_22500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f7c41bffb6b0a638833e5581d15ecbd2d81fdd43d3c6acfad2be41dd706112d
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_25000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e9b4a0a411cfe91007d8a9f695b7bfde4d4553612acc91ed10d4b0f83e964c2
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_27500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:901d4bb59b1a3e12e098d6cb9284e9796fd7c77a87e7b2fcb0e8f3acd3003de5
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_30000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5045966e27883b3856358d6fe44d7e4d292db1de7f6fd1d1d85b5980d4e09f71
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_32500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be5164a0ca8e59991b91c97cafd2b5fce3c3e4086a14fa28af3cb7386303e3ac
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_35000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19878151975707f4e5960866e894cdd18cca1f074bdd6a976c886cd08bc5afb3
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_37500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f443345f55c6f7249fddf5afe8525d75793b95c72d6891e973fc24da2a06c13
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_40000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87dc545057f2139ddebead539bbadf3ca7ec33d8e5790dcdd7a1eb320f327e92
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_42500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5feb1a5b43c04c6c94fb77e185ef931df90f300374df01f1bed8e30e1f1985f5
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_45000.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:65a3cb252d7dda8183ec5327ba4e6c6bdbaa5611077eaa504664d42f77f1c479
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_47500.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a2ad3e25c84854f1f6a561978f5a2d263eefa7451fc2969567a96062406cc13
|
| 3 |
size 70895430
|
attention_kindselective_n_heads2_seed1338/optimizer_49999.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 70895430
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f45761dca825b9857fb8377f687290b259ef10f2d077bcbc40fed60077879087
|
| 3 |
size 70895430
|