{
  "tokenizer_type": "BPE",
  "vocab_size": 388,
  "pattern": "'(?i:[sdmt]|ll|ve|re)|[^\\r\\n\\p{L}\\p{N}]?+\\p{L}+|\\p{N}{1,3}| ?[^\\s\\p{L}\\p{N}]++[\\r\\n]*|\\s*[\\r\\n]|\\s+(?!\\S)|\\s+",
  "special_tokens": {},
  "training_config": {
    "vocab_size": 256,
    "dataset_fraction": "train[0:1000]",
    "moves_key": "moves_custom",
    "separator": " "
  }
}