rebase
- added_tokens.json +0 -40
- merges.txt +0 -0
- special_tokens_map.json +0 -6
- tokenizer.json +0 -0
- tokenizer_config.json +0 -10
- vocab.json +0 -0
added_tokens.json
DELETED
@@ -1,40 +0,0 @@
-{
-  "\t\t": 50294,
-  "\t\t\t": 50293,
-  "\t\t\t\t": 50292,
-  "\t\t\t\t\t": 50291,
-  "\t\t\t\t\t\t": 50290,
-  "\t\t\t\t\t\t\t": 50289,
-  "\t\t\t\t\t\t\t\t": 50288,
-  "\t\t\t\t\t\t\t\t\t": 50287,
-  "                               ": 50286,
-  "                              ": 50285,
-  "                             ": 50284,
-  "                            ": 50283,
-  "                           ": 50282,
-  "                          ": 50281,
-  "                         ": 50280,
-  "                        ": 50279,
-  "                       ": 50278,
-  "                      ": 50277,
-  "                     ": 50276,
-  "                    ": 50275,
-  "                   ": 50274,
-  "                  ": 50273,
-  "                 ": 50272,
-  "                ": 50271,
-  "               ": 50270,
-  "              ": 50269,
-  "             ": 50268,
-  "            ": 50267,
-  "           ": 50266,
-  "          ": 50265,
-  "         ": 50264,
-  "        ": 50263,
-  "       ": 50262,
-  "      ": 50261,
-  "     ": 50260,
-  "    ": 50259,
-  "   ": 50258,
-  "  ": 50257
-}
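The 38 entries deleted above are whitespace-run tokens: two through nine tabs (ids 50294 down to 50287) and two through thirty-one spaces (ids 50286 down to 50257), appended directly after the GPT-2 base vocabulary, whose last id is 50256 ("<|endoftext|>"). Code models (CodeGen, for example) add tokens like these so a full level of indentation compresses to a single token. The following is a minimal sketch of how the same id assignment could be reproduced, assuming the stock "gpt2" tokenizer as the base; it is an illustration, not this repo's actual build script:

from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("gpt2")  # base vocab ends at id 50256

# Runs of 2-31 spaces, then runs of 9 down to 2 tabs. Adding them in this
# order yields the same ids the deleted added_tokens.json recorded
# (2 spaces -> 50257, ..., 31 spaces -> 50286, 9 tabs -> 50287, ..., 2 tabs -> 50294).
whitespace_runs = [" " * n for n in range(2, 32)] + ["\t" * n for n in range(9, 1, -1)]

# add_tokens() appends any token not already in the vocab and returns the
# count actually added; new ids continue right after the base vocabulary.
num_added = tokenizer.add_tokens(whitespace_runs)
print(num_added, len(tokenizer))  # 38, 50295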
merges.txt
DELETED
The diff for this file is too large to render.
special_tokens_map.json
DELETED
@@ -1,6 +0,0 @@
-{
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|endoftext|>",
-  "pad_token": 50256,
-  "unk_token": "<|endoftext|>"
-}
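For reference, the deleted map pins bos, eos, and unk to GPT-2's single special token "<|endoftext|>", and records the pad token as the bare id 50256, which is the id of "<|endoftext|>" itself (transformers usually serializes special tokens as strings, so the integer form here is unusual). A short sketch of the equivalent runtime setup, with "gpt2" standing in for this repo's pre-rebase files:

from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("gpt2")
tok.pad_token = tok.eos_token  # GPT-2 ships no pad token; aliasing eos is the usual workaround

print(tok.bos_token, tok.eos_token, tok.unk_token)  # all "<|endoftext|>"
print(tok.pad_token_id)                             # 50256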
tokenizer.json
DELETED
The diff for this file is too large to render.
tokenizer_config.json
DELETED
@@ -1,10 +0,0 @@
-{
-  "add_prefix_space": false,
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|endoftext|>",
-  "model_max_length": 1024,
-  "name_or_path": "gpt2",
-  "special_tokens_map_file": null,
-  "tokenizer_class": "GPT2Tokenizer",
-  "unk_token": "<|endoftext|>"
-}
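The deleted config pinned the tokenizer class to GPT2Tokenizer, capped inputs at 1024 tokens via model_max_length, and disabled add_prefix_space. A minimal loading sketch under those settings ("gpt2" again stands in for the pre-rebase files):

from transformers import GPT2Tokenizer

tok = GPT2Tokenizer.from_pretrained("gpt2", add_prefix_space=False)

print(tok.model_max_length)   # 1024, from model_max_length
print(tok.tokenize("hello"))  # no leading space is prepended, per add_prefix_space=False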
vocab.json
DELETED
The diff for this file is too large to render.