Upload tokenizer
- tokenizer.json: +1 -0
- tokenizer_config.json: +1 -2
tokenizer.json
CHANGED
@@ -2103,6 +2103,7 @@
     "continuing_subword_prefix": null,
     "end_of_word_suffix": null,
     "fuse_unk": false,
+    "byte_fallback": false,
     "vocab": {
       "<s>": 0,
       "</s>": 1,
tokenizer_config.json
CHANGED
@@ -1,6 +1,5 @@
 {
+  "clean_up_tokenization_spaces": true,
   "model_max_length": 1000000000000000019884624838656,
-  "name_or_path": "gogamza/kobart-base-v2",
-  "special_tokens_map_file": "/root/.cache/huggingface/hub/models--gogamza--kobart-base-v2/snapshots/f9f2ec35d3c32a1ecc7a3281f9626b7ec1913fed/special_tokens_map.json",
 "tokenizer_class": "PreTrainedTokenizerFast"
 }
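Note on the two added fields: "byte_fallback": false in tokenizer.json means the BPE model does not decompose out-of-vocabulary characters into byte tokens, and "clean_up_tokenization_spaces": true in tokenizer_config.json becomes the default for whitespace cleanup when decoding. A minimal usage sketch, assuming the transformers library is installed and using a placeholder repo id (the actual repository for this commit is not named here):

# Minimal sketch. Assumptions: transformers is available and
# "your-namespace/your-model" is a placeholder for the repo this commit updates.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("your-namespace/your-model")

# The new tokenizer_config.json value is picked up as the decode-time default.
print(tok.clean_up_tokenization_spaces)  # True per the updated config
ids = tok.encode("안녕하세요 , 세계 !")
print(tok.decode(ids, clean_up_tokenization_spaces=True))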