mohammadmahdinouri committed on
Commit
1f72b7f
·
verified ·
1 Parent(s): 8ec7133

Upload ModernALBERTForMaskedLM

Browse files
Files changed (2) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "ModernALBERTForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "concat_routing_inputs": false,
8
  "embedding_size": 128,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
@@ -20,7 +20,7 @@
20
  "num_static_groups": 2,
21
  "pad_token_id": 0,
22
  "router_aux_loss_coef": 0.01,
23
- "router_warmup_steps": 4000,
24
  "routing_noise_std": 1.0,
25
  "routing_noise_type": "gumbel",
26
  "static_group_depth": 3,
 
4
  "ModernALBERTForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "concat_routing_inputs": true,
8
  "embedding_size": 128,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
 
20
  "num_static_groups": 2,
21
  "pad_token_id": 0,
22
  "router_aux_loss_coef": 0.01,
23
+ "router_warmup_steps": 7000,
24
  "routing_noise_std": 1.0,
25
  "routing_noise_type": "gumbel",
26
  "static_group_depth": 3,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dcf1e1f704e8d754cbd9e9af95ad2b4fdef9e0cdf7ca4b106895ca7f3d14a74
3
- size 285802032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32fd6720cbb77b54aba9f333ed2550e295a9a15a4152f17337f8d0be7bdf5c57
3
+ size 286096944