prachuryyaIITG committed on
Commit
3dc271b
·
verified ·
1 Parent(s): fa0521b

Upload 5 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,298 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "FacebookAI/xlm-roberta-large",
3
+ "architectures": [
4
+ "XLMRobertaForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "id2label": {
14
+ "0": "B-art-broadcastprogram",
15
+ "1": "B-art-film",
16
+ "2": "B-art-music",
17
+ "3": "B-art-other",
18
+ "4": "B-art-painting",
19
+ "5": "B-art-writtenart",
20
+ "6": "B-building-airport",
21
+ "7": "B-building-hospital",
22
+ "8": "B-building-hotel",
23
+ "9": "B-building-library",
24
+ "10": "B-building-other",
25
+ "11": "B-building-restaurant",
26
+ "12": "B-building-sportsfacility",
27
+ "13": "B-building-theater",
28
+ "14": "B-event-attack/battle/war/militaryconflict",
29
+ "15": "B-event-disaster",
30
+ "16": "B-event-election",
31
+ "17": "B-event-other",
32
+ "18": "B-event-protest",
33
+ "19": "B-event-sportsevent",
34
+ "20": "B-location-GPE",
35
+ "21": "B-location-bodiesofwater",
36
+ "22": "B-location-island",
37
+ "23": "B-location-mountain",
38
+ "24": "B-location-other",
39
+ "25": "B-location-park",
40
+ "26": "B-location-road/railway/highway/transit",
41
+ "27": "B-organization-company",
42
+ "28": "B-organization-education",
43
+ "29": "B-organization-government/governmentagency",
44
+ "30": "B-organization-media/newspaper",
45
+ "31": "B-organization-other",
46
+ "32": "B-organization-politicalparty",
47
+ "33": "B-organization-religion",
48
+ "34": "B-organization-showorganization",
49
+ "35": "B-organization-sportsleague",
50
+ "36": "B-organization-sportsteam",
51
+ "37": "B-other-astronomything",
52
+ "38": "B-other-award",
53
+ "39": "B-other-biologything",
54
+ "40": "B-other-chemicalthing",
55
+ "41": "B-other-currency",
56
+ "42": "B-other-disease",
57
+ "43": "B-other-educationaldegree",
58
+ "44": "B-other-god",
59
+ "45": "B-other-language",
60
+ "46": "B-other-law",
61
+ "47": "B-other-livingthing",
62
+ "48": "B-other-medical",
63
+ "49": "B-person-actor",
64
+ "50": "B-person-artist/author",
65
+ "51": "B-person-athlete",
66
+ "52": "B-person-director",
67
+ "53": "B-person-other",
68
+ "54": "B-person-politician",
69
+ "55": "B-person-scholar",
70
+ "56": "B-person-soldier",
71
+ "57": "B-product-airplane",
72
+ "58": "B-product-car",
73
+ "59": "B-product-food",
74
+ "60": "B-product-game",
75
+ "61": "B-product-other",
76
+ "62": "B-product-ship",
77
+ "63": "B-product-software",
78
+ "64": "B-product-train",
79
+ "65": "B-product-weapon",
80
+ "66": "I-art-broadcastprogram",
81
+ "67": "I-art-film",
82
+ "68": "I-art-music",
83
+ "69": "I-art-other",
84
+ "70": "I-art-painting",
85
+ "71": "I-art-writtenart",
86
+ "72": "I-building-airport",
87
+ "73": "I-building-hospital",
88
+ "74": "I-building-hotel",
89
+ "75": "I-building-library",
90
+ "76": "I-building-other",
91
+ "77": "I-building-restaurant",
92
+ "78": "I-building-sportsfacility",
93
+ "79": "I-building-theater",
94
+ "80": "I-event-attack/battle/war/militaryconflict",
95
+ "81": "I-event-disaster",
96
+ "82": "I-event-election",
97
+ "83": "I-event-other",
98
+ "84": "I-event-protest",
99
+ "85": "I-event-sportsevent",
100
+ "86": "I-location-GPE",
101
+ "87": "I-location-bodiesofwater",
102
+ "88": "I-location-island",
103
+ "89": "I-location-mountain",
104
+ "90": "I-location-other",
105
+ "91": "I-location-park",
106
+ "92": "I-location-road/railway/highway/transit",
107
+ "93": "I-organization-company",
108
+ "94": "I-organization-education",
109
+ "95": "I-organization-government/governmentagency",
110
+ "96": "I-organization-media/newspaper",
111
+ "97": "I-organization-other",
112
+ "98": "I-organization-politicalparty",
113
+ "99": "I-organization-religion",
114
+ "100": "I-organization-showorganization",
115
+ "101": "I-organization-sportsleague",
116
+ "102": "I-organization-sportsteam",
117
+ "103": "I-other-astronomything",
118
+ "104": "I-other-award",
119
+ "105": "I-other-biologything",
120
+ "106": "I-other-chemicalthing",
121
+ "107": "I-other-currency",
122
+ "108": "I-other-disease",
123
+ "109": "I-other-educationaldegree",
124
+ "110": "I-other-god",
125
+ "111": "I-other-language",
126
+ "112": "I-other-law",
127
+ "113": "I-other-livingthing",
128
+ "114": "I-other-medical",
129
+ "115": "I-person-actor",
130
+ "116": "I-person-artist/author",
131
+ "117": "I-person-athlete",
132
+ "118": "I-person-director",
133
+ "119": "I-person-other",
134
+ "120": "I-person-politician",
135
+ "121": "I-person-scholar",
136
+ "122": "I-person-soldier",
137
+ "123": "I-product-airplane",
138
+ "124": "I-product-car",
139
+ "125": "I-product-food",
140
+ "126": "I-product-game",
141
+ "127": "I-product-other",
142
+ "128": "I-product-ship",
143
+ "129": "I-product-software",
144
+ "130": "I-product-train",
145
+ "131": "I-product-weapon",
146
+ "132": "O"
147
+ },
148
+ "initializer_range": 0.02,
149
+ "intermediate_size": 4096,
150
+ "label2id": {
151
+ "B-art-broadcastprogram": 0,
152
+ "B-art-film": 1,
153
+ "B-art-music": 2,
154
+ "B-art-other": 3,
155
+ "B-art-painting": 4,
156
+ "B-art-writtenart": 5,
157
+ "B-building-airport": 6,
158
+ "B-building-hospital": 7,
159
+ "B-building-hotel": 8,
160
+ "B-building-library": 9,
161
+ "B-building-other": 10,
162
+ "B-building-restaurant": 11,
163
+ "B-building-sportsfacility": 12,
164
+ "B-building-theater": 13,
165
+ "B-event-attack/battle/war/militaryconflict": 14,
166
+ "B-event-disaster": 15,
167
+ "B-event-election": 16,
168
+ "B-event-other": 17,
169
+ "B-event-protest": 18,
170
+ "B-event-sportsevent": 19,
171
+ "B-location-GPE": 20,
172
+ "B-location-bodiesofwater": 21,
173
+ "B-location-island": 22,
174
+ "B-location-mountain": 23,
175
+ "B-location-other": 24,
176
+ "B-location-park": 25,
177
+ "B-location-road/railway/highway/transit": 26,
178
+ "B-organization-company": 27,
179
+ "B-organization-education": 28,
180
+ "B-organization-government/governmentagency": 29,
181
+ "B-organization-media/newspaper": 30,
182
+ "B-organization-other": 31,
183
+ "B-organization-politicalparty": 32,
184
+ "B-organization-religion": 33,
185
+ "B-organization-showorganization": 34,
186
+ "B-organization-sportsleague": 35,
187
+ "B-organization-sportsteam": 36,
188
+ "B-other-astronomything": 37,
189
+ "B-other-award": 38,
190
+ "B-other-biologything": 39,
191
+ "B-other-chemicalthing": 40,
192
+ "B-other-currency": 41,
193
+ "B-other-disease": 42,
194
+ "B-other-educationaldegree": 43,
195
+ "B-other-god": 44,
196
+ "B-other-language": 45,
197
+ "B-other-law": 46,
198
+ "B-other-livingthing": 47,
199
+ "B-other-medical": 48,
200
+ "B-person-actor": 49,
201
+ "B-person-artist/author": 50,
202
+ "B-person-athlete": 51,
203
+ "B-person-director": 52,
204
+ "B-person-other": 53,
205
+ "B-person-politician": 54,
206
+ "B-person-scholar": 55,
207
+ "B-person-soldier": 56,
208
+ "B-product-airplane": 57,
209
+ "B-product-car": 58,
210
+ "B-product-food": 59,
211
+ "B-product-game": 60,
212
+ "B-product-other": 61,
213
+ "B-product-ship": 62,
214
+ "B-product-software": 63,
215
+ "B-product-train": 64,
216
+ "B-product-weapon": 65,
217
+ "I-art-broadcastprogram": 66,
218
+ "I-art-film": 67,
219
+ "I-art-music": 68,
220
+ "I-art-other": 69,
221
+ "I-art-painting": 70,
222
+ "I-art-writtenart": 71,
223
+ "I-building-airport": 72,
224
+ "I-building-hospital": 73,
225
+ "I-building-hotel": 74,
226
+ "I-building-library": 75,
227
+ "I-building-other": 76,
228
+ "I-building-restaurant": 77,
229
+ "I-building-sportsfacility": 78,
230
+ "I-building-theater": 79,
231
+ "I-event-attack/battle/war/militaryconflict": 80,
232
+ "I-event-disaster": 81,
233
+ "I-event-election": 82,
234
+ "I-event-other": 83,
235
+ "I-event-protest": 84,
236
+ "I-event-sportsevent": 85,
237
+ "I-location-GPE": 86,
238
+ "I-location-bodiesofwater": 87,
239
+ "I-location-island": 88,
240
+ "I-location-mountain": 89,
241
+ "I-location-other": 90,
242
+ "I-location-park": 91,
243
+ "I-location-road/railway/highway/transit": 92,
244
+ "I-organization-company": 93,
245
+ "I-organization-education": 94,
246
+ "I-organization-government/governmentagency": 95,
247
+ "I-organization-media/newspaper": 96,
248
+ "I-organization-other": 97,
249
+ "I-organization-politicalparty": 98,
250
+ "I-organization-religion": 99,
251
+ "I-organization-showorganization": 100,
252
+ "I-organization-sportsleague": 101,
253
+ "I-organization-sportsteam": 102,
254
+ "I-other-astronomything": 103,
255
+ "I-other-award": 104,
256
+ "I-other-biologything": 105,
257
+ "I-other-chemicalthing": 106,
258
+ "I-other-currency": 107,
259
+ "I-other-disease": 108,
260
+ "I-other-educationaldegree": 109,
261
+ "I-other-god": 110,
262
+ "I-other-language": 111,
263
+ "I-other-law": 112,
264
+ "I-other-livingthing": 113,
265
+ "I-other-medical": 114,
266
+ "I-person-actor": 115,
267
+ "I-person-artist/author": 116,
268
+ "I-person-athlete": 117,
269
+ "I-person-director": 118,
270
+ "I-person-other": 119,
271
+ "I-person-politician": 120,
272
+ "I-person-scholar": 121,
273
+ "I-person-soldier": 122,
274
+ "I-product-airplane": 123,
275
+ "I-product-car": 124,
276
+ "I-product-food": 125,
277
+ "I-product-game": 126,
278
+ "I-product-other": 127,
279
+ "I-product-ship": 128,
280
+ "I-product-software": 129,
281
+ "I-product-train": 130,
282
+ "I-product-weapon": 131,
283
+ "O": 132
284
+ },
285
+ "layer_norm_eps": 1e-05,
286
+ "max_position_embeddings": 514,
287
+ "model_type": "xlm-roberta",
288
+ "num_attention_heads": 16,
289
+ "num_hidden_layers": 24,
290
+ "output_past": true,
291
+ "pad_token_id": 1,
292
+ "position_embedding_type": "absolute",
293
+ "torch_dtype": "float32",
294
+ "transformers_version": "4.47.0",
295
+ "type_vocab_size": 1,
296
+ "use_cache": true,
297
+ "vocab_size": 250002
298
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab8bbf9bf16848810af5aadc53ab20ae8b93c1c8c519b4c10b12c38f28e0ffa7
3
+ size 2235957164
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8373f9cd3d27591e1924426bcc1c8799bc5a9affc4fc857982c5d66668dd1f41
3
+ size 17082832
tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "250001": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "<s>",
48
+ "eos_token": "</s>",
49
+ "extra_special_tokens": {},
50
+ "mask_token": "<mask>",
51
+ "model_max_length": 512,
52
+ "pad_token": "<pad>",
53
+ "sep_token": "</s>",
54
+ "tokenizer_class": "XLMRobertaTokenizer",
55
+ "unk_token": "<unk>"
56
+ }