dbaezaj committed on
Commit
4d12340
·
1 Parent(s): b0a2a75

Upload DistilBertForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +14 -7
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,14 +1,18 @@
1
  {
2
- "_name_or_path": "bert-base-cased",
 
3
  "architectures": [
4
- "BertForSequenceClassification"
5
  ],
 
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
 
 
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
 
10
  "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "id2label": {
13
  "0": "LABEL_0",
14
  "1": "LABEL_1",
@@ -27,15 +31,18 @@
27
  },
28
  "layer_norm_eps": 1e-12,
29
  "max_position_embeddings": 512,
30
- "model_type": "bert",
31
- "num_attention_heads": 12,
32
- "num_hidden_layers": 12,
33
  "pad_token_id": 0,
34
  "position_embedding_type": "absolute",
35
  "problem_type": "single_label_classification",
 
 
 
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.35.0",
38
  "type_vocab_size": 2,
39
  "use_cache": true,
40
- "vocab_size": 28996
41
  }
 
1
  {
2
+ "_name_or_path": "test_trainer",
3
+ "activation": "gelu",
4
  "architectures": [
5
+ "DistilBertForSequenceClassification"
6
  ],
7
+ "attention_dropout": 0.1,
8
  "attention_probs_dropout_prob": 0.1,
9
  "classifier_dropout": null,
10
+ "dim": 768,
11
+ "dropout": 0.1,
12
  "gradient_checkpointing": false,
13
  "hidden_act": "gelu",
14
+ "hidden_dim": 3072,
15
  "hidden_dropout_prob": 0.1,
 
16
  "id2label": {
17
  "0": "LABEL_0",
18
  "1": "LABEL_1",
 
31
  },
32
  "layer_norm_eps": 1e-12,
33
  "max_position_embeddings": 512,
34
+ "model_type": "distilbert",
35
+ "n_heads": 12,
36
+ "n_layers": 12,
37
  "pad_token_id": 0,
38
  "position_embedding_type": "absolute",
39
  "problem_type": "single_label_classification",
40
+ "qa_dropout": 0.1,
41
+ "seq_classif_dropout": 0.2,
42
+ "sinusoidal_pos_embds": false,
43
  "torch_dtype": "float32",
44
  "transformers_version": "4.35.0",
45
  "type_vocab_size": 2,
46
  "use_cache": true,
47
+ "vocab_size": 30522
48
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bff502bb7a26a95a8ac3a116639ade5afe4b80f043416c945b8abf6fbf3ee574
3
- size 433279996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a7a02274b2a61273e9168bd3fca3bd4ca1a6ff84ec780942774bfaf377eb387
3
+ size 437962484