techsword committed on
Commit
605fc43
·
verified ·
1 Parent(s): 5aa269f

Upload Wav2Vec2ForSequenceClassification

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. config.json +624 -0
  3. model.safetensors +3 -0
README.md CHANGED
@@ -6,4 +6,4 @@ language:
6
  base_model:
7
  - facebook/wav2vec2-base
8
  pipeline_tag: audio-classification
9
- ---
 
6
  base_model:
7
  - facebook/wav2vec2-base
8
  pipeline_tag: audio-classification
9
+ ---
config.json ADDED
@@ -0,0 +1,624 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/home/gshen/work_dir/unprobe/finetuned_models/wav2vec2-sid-finetuned/checkpoint-1300",
3
+ "activation_dropout": 0.0,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
+ "architectures": [
10
+ "Wav2Vec2ForSequenceClassification"
11
+ ],
12
+ "attention_dropout": 0.1,
13
+ "bos_token_id": 1,
14
+ "classifier_proj_size": 256,
15
+ "codevector_dim": 256,
16
+ "contrastive_logits_temperature": 0.1,
17
+ "conv_bias": false,
18
+ "conv_dim": [
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512,
25
+ 512
26
+ ],
27
+ "conv_kernel": [
28
+ 10,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 3,
33
+ 2,
34
+ 2
35
+ ],
36
+ "conv_stride": [
37
+ 5,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2,
43
+ 2
44
+ ],
45
+ "ctc_loss_reduction": "sum",
46
+ "ctc_zero_infinity": false,
47
+ "diversity_loss_weight": 0.1,
48
+ "do_stable_layer_norm": false,
49
+ "eos_token_id": 2,
50
+ "feat_extract_activation": "gelu",
51
+ "feat_extract_norm": "group",
52
+ "feat_proj_dropout": 0.1,
53
+ "feat_quantizer_dropout": 0.0,
54
+ "final_dropout": 0.0,
55
+ "freeze_feat_extract_train": true,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.1,
58
+ "hidden_size": 768,
59
+ "id2label": {
60
+ "0": "103",
61
+ "1": "1034",
62
+ "2": "1040",
63
+ "3": "1069",
64
+ "4": "1081",
65
+ "5": "1088",
66
+ "6": "1098",
67
+ "7": "1116",
68
+ "8": "118",
69
+ "9": "1183",
70
+ "10": "1235",
71
+ "11": "1246",
72
+ "12": "125",
73
+ "13": "1263",
74
+ "14": "1334",
75
+ "15": "1355",
76
+ "16": "1363",
77
+ "17": "1447",
78
+ "18": "1455",
79
+ "19": "150",
80
+ "20": "1502",
81
+ "21": "1553",
82
+ "22": "1578",
83
+ "23": "1594",
84
+ "24": "1624",
85
+ "25": "163",
86
+ "26": "1723",
87
+ "27": "1737",
88
+ "28": "1743",
89
+ "29": "1841",
90
+ "30": "1867",
91
+ "31": "1898",
92
+ "32": "19",
93
+ "33": "1926",
94
+ "34": "196",
95
+ "35": "1963",
96
+ "36": "1970",
97
+ "37": "198",
98
+ "38": "1992",
99
+ "39": "200",
100
+ "40": "2002",
101
+ "41": "2007",
102
+ "42": "201",
103
+ "43": "2092",
104
+ "44": "211",
105
+ "45": "2136",
106
+ "46": "2159",
107
+ "47": "2182",
108
+ "48": "2196",
109
+ "49": "226",
110
+ "50": "2289",
111
+ "51": "229",
112
+ "52": "233",
113
+ "53": "2384",
114
+ "54": "2391",
115
+ "55": "2416",
116
+ "56": "2436",
117
+ "57": "248",
118
+ "58": "250",
119
+ "59": "2514",
120
+ "60": "2518",
121
+ "61": "254",
122
+ "62": "26",
123
+ "63": "2691",
124
+ "64": "27",
125
+ "65": "2764",
126
+ "66": "2817",
127
+ "67": "2836",
128
+ "68": "2843",
129
+ "69": "289",
130
+ "70": "2893",
131
+ "71": "2910",
132
+ "72": "2911",
133
+ "73": "2952",
134
+ "74": "298",
135
+ "75": "2989",
136
+ "76": "302",
137
+ "77": "307",
138
+ "78": "311",
139
+ "79": "3112",
140
+ "80": "3168",
141
+ "81": "32",
142
+ "82": "3214",
143
+ "83": "322",
144
+ "84": "3235",
145
+ "85": "3240",
146
+ "86": "3242",
147
+ "87": "3259",
148
+ "88": "328",
149
+ "89": "332",
150
+ "90": "3374",
151
+ "91": "3436",
152
+ "92": "3440",
153
+ "93": "3486",
154
+ "94": "3526",
155
+ "95": "3607",
156
+ "96": "3664",
157
+ "97": "3699",
158
+ "98": "3723",
159
+ "99": "374",
160
+ "100": "3807",
161
+ "101": "3830",
162
+ "102": "3857",
163
+ "103": "3879",
164
+ "104": "39",
165
+ "105": "3947",
166
+ "106": "3982",
167
+ "107": "3983",
168
+ "108": "40",
169
+ "109": "4014",
170
+ "110": "4018",
171
+ "111": "403",
172
+ "112": "405",
173
+ "113": "4051",
174
+ "114": "4088",
175
+ "115": "412",
176
+ "116": "4137",
177
+ "117": "4160",
178
+ "118": "4195",
179
+ "119": "4214",
180
+ "120": "426",
181
+ "121": "4267",
182
+ "122": "4297",
183
+ "123": "4340",
184
+ "124": "4362",
185
+ "125": "4397",
186
+ "126": "4406",
187
+ "127": "441",
188
+ "128": "4441",
189
+ "129": "445",
190
+ "130": "446",
191
+ "131": "4481",
192
+ "132": "458",
193
+ "133": "460",
194
+ "134": "4640",
195
+ "135": "4680",
196
+ "136": "4788",
197
+ "137": "481",
198
+ "138": "4813",
199
+ "139": "4830",
200
+ "140": "4853",
201
+ "141": "4859",
202
+ "142": "4898",
203
+ "143": "5022",
204
+ "144": "5049",
205
+ "145": "5104",
206
+ "146": "5163",
207
+ "147": "5192",
208
+ "148": "5322",
209
+ "149": "5339",
210
+ "150": "5390",
211
+ "151": "5393",
212
+ "152": "5456",
213
+ "153": "5463",
214
+ "154": "5514",
215
+ "155": "5561",
216
+ "156": "5652",
217
+ "157": "5678",
218
+ "158": "5688",
219
+ "159": "5703",
220
+ "160": "5750",
221
+ "161": "5778",
222
+ "162": "5789",
223
+ "163": "5808",
224
+ "164": "5867",
225
+ "165": "587",
226
+ "166": "60",
227
+ "167": "6000",
228
+ "168": "6019",
229
+ "169": "6064",
230
+ "170": "6078",
231
+ "171": "6081",
232
+ "172": "6147",
233
+ "173": "6181",
234
+ "174": "6209",
235
+ "175": "625",
236
+ "176": "6272",
237
+ "177": "6367",
238
+ "178": "6385",
239
+ "179": "6415",
240
+ "180": "6437",
241
+ "181": "6454",
242
+ "182": "6476",
243
+ "183": "6529",
244
+ "184": "6531",
245
+ "185": "6563",
246
+ "186": "669",
247
+ "187": "6818",
248
+ "188": "6836",
249
+ "189": "6848",
250
+ "190": "6880",
251
+ "191": "6925",
252
+ "192": "696",
253
+ "193": "7059",
254
+ "194": "7067",
255
+ "195": "7078",
256
+ "196": "7113",
257
+ "197": "7148",
258
+ "198": "7178",
259
+ "199": "7190",
260
+ "200": "7226",
261
+ "201": "7264",
262
+ "202": "7278",
263
+ "203": "730",
264
+ "204": "7302",
265
+ "205": "7312",
266
+ "206": "7367",
267
+ "207": "7402",
268
+ "208": "7447",
269
+ "209": "7505",
270
+ "210": "7511",
271
+ "211": "7517",
272
+ "212": "7635",
273
+ "213": "7780",
274
+ "214": "7794",
275
+ "215": "78",
276
+ "216": "7800",
277
+ "217": "7859",
278
+ "218": "8014",
279
+ "219": "8051",
280
+ "220": "8063",
281
+ "221": "8088",
282
+ "222": "8095",
283
+ "223": "8098",
284
+ "224": "8108",
285
+ "225": "8123",
286
+ "226": "8226",
287
+ "227": "8238",
288
+ "228": "83",
289
+ "229": "831",
290
+ "230": "8312",
291
+ "231": "8324",
292
+ "232": "839",
293
+ "233": "8419",
294
+ "234": "8425",
295
+ "235": "8465",
296
+ "236": "8468",
297
+ "237": "8580",
298
+ "238": "8609",
299
+ "239": "8629",
300
+ "240": "8630",
301
+ "241": "87",
302
+ "242": "8747",
303
+ "243": "8770",
304
+ "244": "8797",
305
+ "245": "8838",
306
+ "246": "887",
307
+ "247": "89",
308
+ "248": "8975",
309
+ "249": "909",
310
+ "250": "911"
311
+ },
312
+ "initializer_range": 0.02,
313
+ "intermediate_size": 3072,
314
+ "label2id": {
315
+ "103": 0,
316
+ "1034": 1,
317
+ "1040": 2,
318
+ "1069": 3,
319
+ "1081": 4,
320
+ "1088": 5,
321
+ "1098": 6,
322
+ "1116": 7,
323
+ "118": 8,
324
+ "1183": 9,
325
+ "1235": 10,
326
+ "1246": 11,
327
+ "125": 12,
328
+ "1263": 13,
329
+ "1334": 14,
330
+ "1355": 15,
331
+ "1363": 16,
332
+ "1447": 17,
333
+ "1455": 18,
334
+ "150": 19,
335
+ "1502": 20,
336
+ "1553": 21,
337
+ "1578": 22,
338
+ "1594": 23,
339
+ "1624": 24,
340
+ "163": 25,
341
+ "1723": 26,
342
+ "1737": 27,
343
+ "1743": 28,
344
+ "1841": 29,
345
+ "1867": 30,
346
+ "1898": 31,
347
+ "19": 32,
348
+ "1926": 33,
349
+ "196": 34,
350
+ "1963": 35,
351
+ "1970": 36,
352
+ "198": 37,
353
+ "1992": 38,
354
+ "200": 39,
355
+ "2002": 40,
356
+ "2007": 41,
357
+ "201": 42,
358
+ "2092": 43,
359
+ "211": 44,
360
+ "2136": 45,
361
+ "2159": 46,
362
+ "2182": 47,
363
+ "2196": 48,
364
+ "226": 49,
365
+ "2289": 50,
366
+ "229": 51,
367
+ "233": 52,
368
+ "2384": 53,
369
+ "2391": 54,
370
+ "2416": 55,
371
+ "2436": 56,
372
+ "248": 57,
373
+ "250": 58,
374
+ "2514": 59,
375
+ "2518": 60,
376
+ "254": 61,
377
+ "26": 62,
378
+ "2691": 63,
379
+ "27": 64,
380
+ "2764": 65,
381
+ "2817": 66,
382
+ "2836": 67,
383
+ "2843": 68,
384
+ "289": 69,
385
+ "2893": 70,
386
+ "2910": 71,
387
+ "2911": 72,
388
+ "2952": 73,
389
+ "298": 74,
390
+ "2989": 75,
391
+ "302": 76,
392
+ "307": 77,
393
+ "311": 78,
394
+ "3112": 79,
395
+ "3168": 80,
396
+ "32": 81,
397
+ "3214": 82,
398
+ "322": 83,
399
+ "3235": 84,
400
+ "3240": 85,
401
+ "3242": 86,
402
+ "3259": 87,
403
+ "328": 88,
404
+ "332": 89,
405
+ "3374": 90,
406
+ "3436": 91,
407
+ "3440": 92,
408
+ "3486": 93,
409
+ "3526": 94,
410
+ "3607": 95,
411
+ "3664": 96,
412
+ "3699": 97,
413
+ "3723": 98,
414
+ "374": 99,
415
+ "3807": 100,
416
+ "3830": 101,
417
+ "3857": 102,
418
+ "3879": 103,
419
+ "39": 104,
420
+ "3947": 105,
421
+ "3982": 106,
422
+ "3983": 107,
423
+ "40": 108,
424
+ "4014": 109,
425
+ "4018": 110,
426
+ "403": 111,
427
+ "405": 112,
428
+ "4051": 113,
429
+ "4088": 114,
430
+ "412": 115,
431
+ "4137": 116,
432
+ "4160": 117,
433
+ "4195": 118,
434
+ "4214": 119,
435
+ "426": 120,
436
+ "4267": 121,
437
+ "4297": 122,
438
+ "4340": 123,
439
+ "4362": 124,
440
+ "4397": 125,
441
+ "4406": 126,
442
+ "441": 127,
443
+ "4441": 128,
444
+ "445": 129,
445
+ "446": 130,
446
+ "4481": 131,
447
+ "458": 132,
448
+ "460": 133,
449
+ "4640": 134,
450
+ "4680": 135,
451
+ "4788": 136,
452
+ "481": 137,
453
+ "4813": 138,
454
+ "4830": 139,
455
+ "4853": 140,
456
+ "4859": 141,
457
+ "4898": 142,
458
+ "5022": 143,
459
+ "5049": 144,
460
+ "5104": 145,
461
+ "5163": 146,
462
+ "5192": 147,
463
+ "5322": 148,
464
+ "5339": 149,
465
+ "5390": 150,
466
+ "5393": 151,
467
+ "5456": 152,
468
+ "5463": 153,
469
+ "5514": 154,
470
+ "5561": 155,
471
+ "5652": 156,
472
+ "5678": 157,
473
+ "5688": 158,
474
+ "5703": 159,
475
+ "5750": 160,
476
+ "5778": 161,
477
+ "5789": 162,
478
+ "5808": 163,
479
+ "5867": 164,
480
+ "587": 165,
481
+ "60": 166,
482
+ "6000": 167,
483
+ "6019": 168,
484
+ "6064": 169,
485
+ "6078": 170,
486
+ "6081": 171,
487
+ "6147": 172,
488
+ "6181": 173,
489
+ "6209": 174,
490
+ "625": 175,
491
+ "6272": 176,
492
+ "6367": 177,
493
+ "6385": 178,
494
+ "6415": 179,
495
+ "6437": 180,
496
+ "6454": 181,
497
+ "6476": 182,
498
+ "6529": 183,
499
+ "6531": 184,
500
+ "6563": 185,
501
+ "669": 186,
502
+ "6818": 187,
503
+ "6836": 188,
504
+ "6848": 189,
505
+ "6880": 190,
506
+ "6925": 191,
507
+ "696": 192,
508
+ "7059": 193,
509
+ "7067": 194,
510
+ "7078": 195,
511
+ "7113": 196,
512
+ "7148": 197,
513
+ "7178": 198,
514
+ "7190": 199,
515
+ "7226": 200,
516
+ "7264": 201,
517
+ "7278": 202,
518
+ "730": 203,
519
+ "7302": 204,
520
+ "7312": 205,
521
+ "7367": 206,
522
+ "7402": 207,
523
+ "7447": 208,
524
+ "7505": 209,
525
+ "7511": 210,
526
+ "7517": 211,
527
+ "7635": 212,
528
+ "7780": 213,
529
+ "7794": 214,
530
+ "78": 215,
531
+ "7800": 216,
532
+ "7859": 217,
533
+ "8014": 218,
534
+ "8051": 219,
535
+ "8063": 220,
536
+ "8088": 221,
537
+ "8095": 222,
538
+ "8098": 223,
539
+ "8108": 224,
540
+ "8123": 225,
541
+ "8226": 226,
542
+ "8238": 227,
543
+ "83": 228,
544
+ "831": 229,
545
+ "8312": 230,
546
+ "8324": 231,
547
+ "839": 232,
548
+ "8419": 233,
549
+ "8425": 234,
550
+ "8465": 235,
551
+ "8468": 236,
552
+ "8580": 237,
553
+ "8609": 238,
554
+ "8629": 239,
555
+ "8630": 240,
556
+ "87": 241,
557
+ "8747": 242,
558
+ "8770": 243,
559
+ "8797": 244,
560
+ "8838": 245,
561
+ "887": 246,
562
+ "89": 247,
563
+ "8975": 248,
564
+ "909": 249,
565
+ "911": 250
566
+ },
567
+ "layer_norm_eps": 1e-05,
568
+ "layerdrop": 0.0,
569
+ "mask_channel_length": 10,
570
+ "mask_channel_min_space": 1,
571
+ "mask_channel_other": 0.0,
572
+ "mask_channel_prob": 0.0,
573
+ "mask_channel_selection": "static",
574
+ "mask_feature_length": 10,
575
+ "mask_feature_min_masks": 0,
576
+ "mask_feature_prob": 0.0,
577
+ "mask_time_length": 10,
578
+ "mask_time_min_masks": 2,
579
+ "mask_time_min_space": 1,
580
+ "mask_time_other": 0.0,
581
+ "mask_time_prob": 0.05,
582
+ "mask_time_selection": "static",
583
+ "model_type": "wav2vec2",
584
+ "no_mask_channel_overlap": false,
585
+ "no_mask_time_overlap": false,
586
+ "num_adapter_layers": 3,
587
+ "num_attention_heads": 12,
588
+ "num_codevector_groups": 2,
589
+ "num_codevectors_per_group": 320,
590
+ "num_conv_pos_embedding_groups": 16,
591
+ "num_conv_pos_embeddings": 128,
592
+ "num_feat_extract_layers": 7,
593
+ "num_hidden_layers": 12,
594
+ "num_negatives": 100,
595
+ "output_hidden_size": 768,
596
+ "pad_token_id": 0,
597
+ "proj_codevector_dim": 256,
598
+ "tdnn_dilation": [
599
+ 1,
600
+ 2,
601
+ 3,
602
+ 1,
603
+ 1
604
+ ],
605
+ "tdnn_dim": [
606
+ 512,
607
+ 512,
608
+ 512,
609
+ 512,
610
+ 1500
611
+ ],
612
+ "tdnn_kernel": [
613
+ 5,
614
+ 3,
615
+ 3,
616
+ 1,
617
+ 1
618
+ ],
619
+ "torch_dtype": "float32",
620
+ "transformers_version": "4.49.0",
621
+ "use_weighted_layer_sum": false,
622
+ "vocab_size": 32,
623
+ "xvector_output_dim": 512
624
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad53456e0641cf893908e491f4bc7f3f07b5eda246ca533a373830e809d3f70
3
+ size 378558364