lhallee committed on
Commit
737f3bf
·
verified ·
1 Parent(s): 2180ff2

Upload FastEsmForMaskedLM

Browse files
Files changed (2) hide show
  1. config.json +37 -39
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,39 +1,37 @@
1
- {
2
- "_name_or_path": "facebook/esm2_t33_650M_UR50D",
3
- "architectures": [
4
- "FastEsmForMaskedLM"
5
- ],
6
- "attention_probs_dropout_prob": 0.0,
7
- "attn_backend": "sdpa",
8
- "auto_map": {
9
- "AutoConfig": "modeling_fastesm.FastEsmConfig",
10
- "AutoModel": "modeling_fastesm.FastEsmModel",
11
- "AutoModelForMaskedLM": "modeling_fastesm.FastEsmForMaskedLM",
12
- "AutoModelForSequenceClassification": "modeling_fastesm.FastEsmForSequenceClassification",
13
- "AutoModelForTokenClassification": "modeling_fastesm.FastEsmForTokenClassification"
14
- },
15
- "classifier_dropout": null,
16
- "emb_layer_norm_before": false,
17
- "esmfold_config": null,
18
- "hidden_act": "gelu",
19
- "hidden_dropout_prob": 0.0,
20
- "hidden_size": 1280,
21
- "initializer_range": 0.02,
22
- "intermediate_size": 5120,
23
- "is_folding_model": false,
24
- "layer_norm_eps": 1e-05,
25
- "mask_token_id": 32,
26
- "max_position_embeddings": 1026,
27
- "model_type": "fast_esm",
28
- "num_attention_heads": 20,
29
- "num_hidden_layers": 33,
30
- "pad_token_id": 1,
31
- "position_embedding_type": "rotary",
32
- "tie_word_embeddings": false,
33
- "token_dropout": true,
34
- "torch_dtype": "float32",
35
- "transformers_version": "4.48.1",
36
- "use_cache": true,
37
- "vocab_list": null,
38
- "vocab_size": 33
39
- }
 
1
+ {
2
+ "architectures": [
3
+ "FastEsmForMaskedLM"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.0,
6
+ "attn_backend": "sdpa",
7
+ "auto_map": {
8
+ "AutoConfig": "modeling_fastesm.FastEsmConfig",
9
+ "AutoModel": "modeling_fastesm.FastEsmModel",
10
+ "AutoModelForMaskedLM": "modeling_fastesm.FastEsmForMaskedLM",
11
+ "AutoModelForSequenceClassification": "modeling_fastesm.FastEsmForSequenceClassification",
12
+ "AutoModelForTokenClassification": "modeling_fastesm.FastEsmForTokenClassification"
13
+ },
14
+ "classifier_dropout": null,
15
+ "dtype": "float32",
16
+ "emb_layer_norm_before": false,
17
+ "esmfold_config": null,
18
+ "hidden_act": "gelu",
19
+ "hidden_dropout_prob": 0.0,
20
+ "hidden_size": 1280,
21
+ "initializer_range": 0.02,
22
+ "intermediate_size": 5120,
23
+ "is_folding_model": false,
24
+ "layer_norm_eps": 1e-05,
25
+ "mask_token_id": 32,
26
+ "max_position_embeddings": 1026,
27
+ "model_type": "fast_esm",
28
+ "num_attention_heads": 20,
29
+ "num_hidden_layers": 33,
30
+ "pad_token_id": 1,
31
+ "position_embedding_type": "rotary",
32
+ "tie_word_embeddings": false,
33
+ "token_dropout": true,
34
+ "transformers_version": "5.1.0",
35
+ "vocab_list": null,
36
+ "vocab_size": 33
37
+ }
 
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a15142e94ecf36f0edde9b37796f591e609ebe1694ca411e93640f0ee384994a
3
- size 2604413888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa66b476930e90de0e30a385f77fbd9e5d1c0d766d33f1a0535b1cdee5badf92
3
+ size 2604413816