arxyzan committed on
Commit
77d17ca
·
1 Parent(s): c2c95ad

Hezar: Upload tokenizer_config.yaml

Browse files
Files changed (1) hide show
  1. preprocessor//tokenizer_config.yaml +10 -0
preprocessor//tokenizer_config.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ config_type: preprocessor
2
+ max_length: 512
3
+ truncation_strategy: longest_first
4
+ truncation_direction: right
5
+ stride: 0
6
+ padding_strategy: longest
7
+ padding_direction: right
8
+ pad_token_id: 0
9
+ pad_token: '[PAD]'
10
+ pad_token_type_id: 0