Samuael committed on
Commit
620321d
·
verified ·
1 Parent(s): 6f7611f

Upload tokenizer

Browse files
sentencepiece.bpe.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b2c9b3910462e773a7ace377cb26a40053dcfe4054d8eb8ecc5460495a93d9b
3
- size 253575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4e4c09bd68c20916dfa8472b3c979527234d7b22afa71e1ea0bb36ee79a1bbd
3
+ size 253571
special_tokens_map.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "additional_special_tokens": [
3
- "▁በኋላ",
4
- "ብር"
5
  ],
6
  "bos_token": "<s>",
7
  "cls_token": "<s>",
 
1
  {
2
  "additional_special_tokens": [
3
+ "ar_AR",
4
+ "cs_CZ"
5
  ],
6
  "bos_token": "<s>",
7
  "cls_token": "<s>",
tokenizer_config.json CHANGED
@@ -234,8 +234,8 @@
234
  }
235
  },
236
  "additional_special_tokens": [
237
- "▁በኋላ",
238
- "ብር"
239
  ],
240
  "bos_token": "<s>",
241
  "clean_up_tokenization_spaces": true,
 
234
  }
235
  },
236
  "additional_special_tokens": [
237
+ "ar_AR",
238
+ "cs_CZ"
239
  ],
240
  "bos_token": "<s>",
241
  "clean_up_tokenization_spaces": true,