krishanmittal018 committed on
Commit
1f37852
·
verified ·
1 Parent(s): 006be3e

Upload DistilBertForMaskedLM

Browse files
Files changed (2) hide show
  1. config.json +24 -16
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,25 +1,33 @@
1
  {
 
2
  "architectures": [
3
- "BertForMaskedLM"
4
  ],
5
- "attention_probs_dropout_prob": 0.1,
6
- "classifier_dropout": null,
7
- "gradient_checkpointing": false,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.1,
10
- "hidden_size": 768,
 
 
 
11
  "initializer_range": 0.02,
12
- "intermediate_size": 3072,
13
- "layer_norm_eps": 1e-12,
 
 
14
  "max_position_embeddings": 512,
15
- "model_type": "bert",
16
- "num_attention_heads": 12,
17
- "num_hidden_layers": 12,
 
18
  "pad_token_id": 0,
19
- "position_embedding_type": "absolute",
 
 
 
20
  "torch_dtype": "float32",
21
  "transformers_version": "4.55.3",
22
- "type_vocab_size": 2,
23
- "use_cache": true,
24
- "vocab_size": 28996
25
  }
 
1
  {
2
+ "activation": "gelu",
3
  "architectures": [
4
+ "DistilBertForMaskedLM"
5
  ],
6
+ "attention_dropout": 0.1,
7
+ "dim": 768,
8
+ "dropout": 0.1,
9
+ "finetuning_task": "sst-2",
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "NEGATIVE",
13
+ "1": "POSITIVE"
14
+ },
15
  "initializer_range": 0.02,
16
+ "label2id": {
17
+ "NEGATIVE": 0,
18
+ "POSITIVE": 1
19
+ },
20
  "max_position_embeddings": 512,
21
+ "model_type": "distilbert",
22
+ "n_heads": 12,
23
+ "n_layers": 6,
24
+ "output_past": true,
25
  "pad_token_id": 0,
26
+ "qa_dropout": 0.1,
27
+ "seq_classif_dropout": 0.2,
28
+ "sinusoidal_pos_embds": false,
29
+ "tie_weights_": true,
30
  "torch_dtype": "float32",
31
  "transformers_version": "4.55.3",
32
+ "vocab_size": 30522
 
 
33
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:283b7b2e8fc1d79cfe3106fc4cdc44633798d4f94204a12ea614ed808269efba
3
- size 433386912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70904d387a795d9ec9d07cc7552e90a2e7e1c9af2ffb0757a93cede65317c6f9
3
+ size 267954768