gavincyi committed on
Commit
0dea81a
·
1 Parent(s): 408bab7

Upload TFDistilBertForSequenceClassification

Browse files
Files changed (3) hide show
  1. README.md +47 -0
  2. config.json +14 -7
  3. tf_model.h5 +3 -0
README.md ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - generated_from_keras_callback
4
+ model-index:
5
+ - name: test_model
6
+ results: []
7
+ ---
8
+
9
+ <!-- This model card has been generated automatically according to the information Keras had access to. You should
10
+ probably proofread and complete it, then remove this comment. -->
11
+
12
+ # test_model
13
+
14
+ This model was trained from scratch on an unknown dataset.
15
+ It achieves the following results on the evaluation set:
16
+
17
+
18
+ ## Model description
19
+
20
+ More information needed
21
+
22
+ ## Intended uses & limitations
23
+
24
+ More information needed
25
+
26
+ ## Training and evaluation data
27
+
28
+ More information needed
29
+
30
+ ## Training procedure
31
+
32
+ ### Training hyperparameters
33
+
34
+ The following hyperparameters were used during training:
35
+ - optimizer: None
36
+ - training_precision: float32
37
+
38
+ ### Training results
39
+
40
+
41
+
42
+ ### Framework versions
43
+
44
+ - Transformers 4.28.1
45
+ - TensorFlow 2.12.0
46
+ - Datasets 2.11.0
47
+ - Tokenizers 0.13.3
config.json CHANGED
@@ -1,14 +1,18 @@
1
  {
2
- "_name_or_path": "bert-base-cased",
 
3
  "architectures": [
4
- "BertForSequenceClassification"
5
  ],
 
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
 
 
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
 
10
  "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "id2label": {
13
  "0": "LABEL_0",
14
  "1": "LABEL_1",
@@ -27,14 +31,17 @@
27
  },
28
  "layer_norm_eps": 1e-12,
29
  "max_position_embeddings": 512,
30
- "model_type": "bert",
31
- "num_attention_heads": 12,
32
- "num_hidden_layers": 12,
33
  "pad_token_id": 0,
34
  "position_embedding_type": "absolute",
35
  "problem_type": "single_label_classification",
 
 
 
36
  "torch_dtype": "float32",
37
- "transformers_version": "4.27.4",
38
  "type_vocab_size": 2,
39
  "use_cache": true,
40
  "vocab_size": 28996
 
1
  {
2
+ "_name_or_path": "test_model",
3
+ "activation": "gelu",
4
  "architectures": [
5
+ "DistilBertForSequenceClassification"
6
  ],
7
+ "attention_dropout": 0.1,
8
  "attention_probs_dropout_prob": 0.1,
9
  "classifier_dropout": null,
10
+ "dim": 768,
11
+ "dropout": 0.1,
12
  "gradient_checkpointing": false,
13
  "hidden_act": "gelu",
14
+ "hidden_dim": 3072,
15
  "hidden_dropout_prob": 0.1,
 
16
  "id2label": {
17
  "0": "LABEL_0",
18
  "1": "LABEL_1",
 
31
  },
32
  "layer_norm_eps": 1e-12,
33
  "max_position_embeddings": 512,
34
+ "model_type": "distilbert",
35
+ "n_heads": 12,
36
+ "n_layers": 12,
37
  "pad_token_id": 0,
38
  "position_embedding_type": "absolute",
39
  "problem_type": "single_label_classification",
40
+ "qa_dropout": 0.1,
41
+ "seq_classif_dropout": 0.2,
42
+ "sinusoidal_pos_embds": false,
43
  "torch_dtype": "float32",
44
+ "transformers_version": "4.28.1",
45
  "type_vocab_size": 2,
46
  "use_cache": true,
47
  "vocab_size": 28996
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6463d76553fe8eebc6e3edc8ea3438f63fb117e6e9c14345a2ae21af35fe9abb
3
+ size 433503344