ikrysinska committed on
Commit
ffe8144
·
1 Parent(s): 85ec06a

Upload processor

Browse files
Files changed (2) hide show
  1. tokenizer_config.json +11 -11
  2. vocab.json +39 -39
tokenizer_config.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "added_tokens_decoder": {
3
- "0": {
4
- "content": "t͡ʃ",
5
  "lstrip": true,
6
  "normalized": false,
7
  "rstrip": true,
8
  "single_word": false,
9
  "special": false
10
  },
11
- "14": {
12
  "content": "oʊ",
13
  "lstrip": true,
14
  "normalized": false,
@@ -16,8 +16,8 @@
16
  "single_word": false,
17
  "special": false
18
  },
19
- "16": {
20
- "content": "aɪ",
21
  "lstrip": true,
22
  "normalized": false,
23
  "rstrip": true,
@@ -25,30 +25,30 @@
25
  "special": false
26
  },
27
  "17": {
28
- "content": "eɪ",
29
  "lstrip": true,
30
  "normalized": false,
31
  "rstrip": true,
32
  "single_word": false,
33
  "special": false
34
  },
35
- "22": {
36
- "content": "ɔɪ",
37
  "lstrip": true,
38
  "normalized": false,
39
  "rstrip": true,
40
  "single_word": false,
41
  "special": false
42
  },
43
- "38": {
44
- "content": "d͡ʒ",
45
  "lstrip": true,
46
  "normalized": false,
47
  "rstrip": true,
48
  "single_word": false,
49
  "special": false
50
  },
51
- "39": {
52
  "content": "aʊ",
53
  "lstrip": true,
54
  "normalized": false,
 
1
  {
2
  "added_tokens_decoder": {
3
+ "1": {
4
+ "content": "eɪ",
5
  "lstrip": true,
6
  "normalized": false,
7
  "rstrip": true,
8
  "single_word": false,
9
  "special": false
10
  },
11
+ "4": {
12
  "content": "oʊ",
13
  "lstrip": true,
14
  "normalized": false,
 
16
  "single_word": false,
17
  "special": false
18
  },
19
+ "10": {
20
+ "content": "t͡ʃ",
21
  "lstrip": true,
22
  "normalized": false,
23
  "rstrip": true,
 
25
  "special": false
26
  },
27
  "17": {
28
+ "content": "d͡ʒ",
29
  "lstrip": true,
30
  "normalized": false,
31
  "rstrip": true,
32
  "single_word": false,
33
  "special": false
34
  },
35
+ "23": {
36
+ "content": "aɪ",
37
  "lstrip": true,
38
  "normalized": false,
39
  "rstrip": true,
40
  "single_word": false,
41
  "special": false
42
  },
43
+ "25": {
44
+ "content": "ɔɪ",
45
  "lstrip": true,
46
  "normalized": false,
47
  "rstrip": true,
48
  "single_word": false,
49
  "special": false
50
  },
51
+ "28": {
52
  "content": "aʊ",
53
  "lstrip": true,
54
  "normalized": false,
vocab.json CHANGED
@@ -2,44 +2,44 @@
2
  " ": 42,
3
  "[PAD]": 41,
4
  "[UNK]": 40,
5
- "aɪ": 16,
6
- "aʊ": 39,
7
- "b": 21,
8
- "d": 25,
9
- "d͡ʒ": 38,
10
- "eɪ": 17,
11
- "f": 5,
12
- "h": 29,
13
- "i": 13,
14
- "j": 36,
15
- "k": 18,
16
- "l": 4,
17
- "m": 31,
18
- "n": 19,
19
- "oʊ": 14,
20
- "p": 2,
21
  "s": 32,
22
- "t": 35,
23
- "t͡ʃ": 0,
24
- "u": 15,
25
- "v": 6,
26
- "w": 30,
27
- "z": 26,
28
- "æ": 37,
29
- "ð": 11,
30
- "ŋ": 8,
31
- "ɑ": 10,
32
- "ɔ": 1,
33
- "ɔɪ": 22,
34
- "ə": 20,
35
- "ɛ": 3,
36
- "ɝ": 23,
37
- "ɡ": 33,
38
- "ɪ": 34,
39
- "ɹ": 7,
40
- "ʃ": 24,
41
- "ʊ": 27,
42
- "ʌ": 12,
43
- "ʒ": 28,
44
- "θ": 9
45
  }
 
2
  " ": 42,
3
  "[PAD]": 41,
4
  "[UNK]": 40,
5
+ "aɪ": 23,
6
+ "aʊ": 28,
7
+ "b": 12,
8
+ "d": 3,
9
+ "d͡ʒ": 17,
10
+ "eɪ": 1,
11
+ "f": 31,
12
+ "h": 16,
13
+ "i": 35,
14
+ "j": 24,
15
+ "k": 22,
16
+ "l": 5,
17
+ "m": 15,
18
+ "n": 33,
19
+ "oʊ": 4,
20
+ "p": 37,
21
  "s": 32,
22
+ "t": 11,
23
+ "t͡ʃ": 10,
24
+ "u": 39,
25
+ "v": 29,
26
+ "w": 21,
27
+ "z": 19,
28
+ "æ": 30,
29
+ "ð": 2,
30
+ "ŋ": 7,
31
+ "ɑ": 9,
32
+ "ɔ": 14,
33
+ "ɔɪ": 25,
34
+ "ə": 6,
35
+ "ɛ": 34,
36
+ "ɝ": 18,
37
+ "ɡ": 36,
38
+ "ɪ": 8,
39
+ "ɹ": 27,
40
+ "ʃ": 38,
41
+ "ʊ": 13,
42
+ "ʌ": 0,
43
+ "ʒ": 26,
44
+ "θ": 20
45
  }