turing552 committed on
Commit
d8657c1
·
verified ·
1 Parent(s): 66c3b44

End of training

Browse files
Files changed (1) hide show
  1. tokenizer.json +1 -1
tokenizer.json CHANGED
@@ -46,7 +46,7 @@
46
  {
47
  "type": "Split",
48
  "pattern": {
49
- "Regex": "<\\|startoftext\\|>|<\\|endoftext\\|>|'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+"
50
  },
51
  "behavior": "Removed",
52
  "invert": true
 
46
  {
47
  "type": "Split",
48
  "pattern": {
49
+ "Regex": "'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+"
50
  },
51
  "behavior": "Removed",
52
  "invert": true