izzako committed on
Commit
a0dea34
·
verified ·
1 Parent(s): 5c9831b

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +27 -0
  2. tokenizer_config.json +1 -1
tokenizer.json CHANGED
@@ -63,6 +63,12 @@
63
  "id": "A",
64
  "type_id": 0
65
  }
 
 
 
 
 
 
66
  }
67
  ],
68
  "pair": [
@@ -78,6 +84,12 @@
78
  "type_id": 0
79
  }
80
  },
 
 
 
 
 
 
81
  {
82
  "SpecialToken": {
83
  "id": "<s>",
@@ -89,9 +101,24 @@
89
  "id": "B",
90
  "type_id": 1
91
  }
 
 
 
 
 
 
92
  }
93
  ],
94
  "special_tokens": {
 
 
 
 
 
 
 
 
 
95
  "<s>": {
96
  "id": "<s>",
97
  "ids": [
 
63
  "id": "A",
64
  "type_id": 0
65
  }
66
+ },
67
+ {
68
+ "SpecialToken": {
69
+ "id": "</s>",
70
+ "type_id": 0
71
+ }
72
  }
73
  ],
74
  "pair": [
 
84
  "type_id": 0
85
  }
86
  },
87
+ {
88
+ "SpecialToken": {
89
+ "id": "</s>",
90
+ "type_id": 0
91
+ }
92
+ },
93
  {
94
  "SpecialToken": {
95
  "id": "<s>",
 
101
  "id": "B",
102
  "type_id": 1
103
  }
104
+ },
105
+ {
106
+ "SpecialToken": {
107
+ "id": "</s>",
108
+ "type_id": 1
109
+ }
110
  }
111
  ],
112
  "special_tokens": {
113
+ "</s>": {
114
+ "id": "</s>",
115
+ "ids": [
116
+ 2
117
+ ],
118
+ "tokens": [
119
+ "</s>"
120
+ ]
121
+ },
122
  "<s>": {
123
  "id": "<s>",
124
  "ids": [
tokenizer_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "add_bos_token": true,
3
- "add_eos_token": false,
4
  "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
  "0": {
 
1
  {
2
  "add_bos_token": true,
3
+ "add_eos_token": true,
4
  "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
  "0": {