akmmsr committed on
Commit
0917c3b
·
1 Parent(s): 32254e8

Training in progress epoch 0

Browse files
Files changed (3) hide show
  1. README.md +5 -7
  2. config.json +18 -94
  3. tf_model.h5 +2 -2
README.md CHANGED
@@ -14,9 +14,9 @@ probably proofread and complete it, then remove this comment. -->
14
 
15
  This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
- - Train Loss: 0.0306
18
- - Validation Loss: 0.0584
19
- - Epoch: 2
20
 
21
  ## Model description
22
 
@@ -42,14 +42,12 @@ The following hyperparameters were used during training:
42
 
43
  | Train Loss | Validation Loss | Epoch |
44
  |:----------:|:---------------:|:-----:|
45
- | 0.2443 | 0.0889 | 0 |
46
- | 0.0519 | 0.0613 | 1 |
47
- | 0.0306 | 0.0584 | 2 |
48
 
49
 
50
  ### Framework versions
51
 
52
  - Transformers 4.24.0
53
  - TensorFlow 2.9.2
54
- - Datasets 2.7.0
55
  - Tokenizers 0.13.2
 
14
 
15
  This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
+ - Train Loss: 0.1758
18
+ - Validation Loss: 0.0625
19
+ - Epoch: 0
20
 
21
  ## Model description
22
 
 
42
 
43
  | Train Loss | Validation Loss | Epoch |
44
  |:----------:|:---------------:|:-----:|
45
+ | 0.1758 | 0.0625 | 0 |
 
 
46
 
47
 
48
  ### Framework versions
49
 
50
  - Transformers 4.24.0
51
  - TensorFlow 2.9.2
52
+ - Datasets 2.7.1
53
  - Tokenizers 0.13.2
config.json CHANGED
@@ -10,104 +10,28 @@
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
- "0": "\"",
14
- "1": "''",
15
- "10": "CC",
16
- "11": "CD",
17
- "12": "DT",
18
- "13": "EX",
19
- "14": "FW",
20
- "15": "IN",
21
- "16": "JJ",
22
- "17": "JJR",
23
- "18": "JJS",
24
- "19": "LS",
25
- "2": "#",
26
- "20": "MD",
27
- "21": "NN",
28
- "22": "NNP",
29
- "23": "NNPS",
30
- "24": "NNS",
31
- "25": "NN|SYM",
32
- "26": "PDT",
33
- "27": "POS",
34
- "28": "PRP",
35
- "29": "PRP$",
36
- "3": "$",
37
- "30": "RB",
38
- "31": "RBR",
39
- "32": "RBS",
40
- "33": "RP",
41
- "34": "SYM",
42
- "35": "TO",
43
- "36": "UH",
44
- "37": "VB",
45
- "38": "VBD",
46
- "39": "VBG",
47
- "4": "(",
48
- "40": "VBN",
49
- "41": "VBP",
50
- "42": "VBZ",
51
- "43": "WDT",
52
- "44": "WP",
53
- "45": "WP$",
54
- "46": "WRB",
55
- "5": ")",
56
- "6": ",",
57
- "7": ".",
58
- "8": ":",
59
- "9": "``"
60
  },
61
  "initializer_range": 0.02,
62
  "intermediate_size": 3072,
63
  "label2id": {
64
- "\"": "0",
65
- "#": "2",
66
- "$": "3",
67
- "''": "1",
68
- "(": "4",
69
- ")": "5",
70
- ",": "6",
71
- ".": "7",
72
- ":": "8",
73
- "CC": "10",
74
- "CD": "11",
75
- "DT": "12",
76
- "EX": "13",
77
- "FW": "14",
78
- "IN": "15",
79
- "JJ": "16",
80
- "JJR": "17",
81
- "JJS": "18",
82
- "LS": "19",
83
- "MD": "20",
84
- "NN": "21",
85
- "NNP": "22",
86
- "NNPS": "23",
87
- "NNS": "24",
88
- "NN|SYM": "25",
89
- "PDT": "26",
90
- "POS": "27",
91
- "PRP": "28",
92
- "PRP$": "29",
93
- "RB": "30",
94
- "RBR": "31",
95
- "RBS": "32",
96
- "RP": "33",
97
- "SYM": "34",
98
- "TO": "35",
99
- "UH": "36",
100
- "VB": "37",
101
- "VBD": "38",
102
- "VBG": "39",
103
- "VBN": "40",
104
- "VBP": "41",
105
- "VBZ": "42",
106
- "WDT": "43",
107
- "WP": "44",
108
- "WP$": "45",
109
- "WRB": "46",
110
- "``": "9"
111
  },
112
  "layer_norm_eps": 1e-12,
113
  "max_position_embeddings": 512,
 
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
+ "0": "O",
14
+ "1": "B-PER",
15
+ "2": "I-PER",
16
+ "3": "B-ORG",
17
+ "4": "I-ORG",
18
+ "5": "B-LOC",
19
+ "6": "I-LOC",
20
+ "7": "B-MISC",
21
+ "8": "I-MISC"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  },
23
  "initializer_range": 0.02,
24
  "intermediate_size": 3072,
25
  "label2id": {
26
+ "B-LOC": "5",
27
+ "B-MISC": "7",
28
+ "B-ORG": "3",
29
+ "B-PER": "1",
30
+ "I-LOC": "6",
31
+ "I-MISC": "8",
32
+ "I-ORG": "4",
33
+ "I-PER": "2",
34
+ "O": "0"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  },
36
  "layer_norm_eps": 1e-12,
37
  "max_position_embeddings": 512,
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c27f1b4ae00f785432231a1d2df1c0033c65dfadd96548890a0d9836e2ee917
3
- size 431296708
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eeea1b8e7662865c2984383a54a0ee0dc6f48a639a2f6bac1a0b66d82ea8a46
3
+ size 431179820