waceke committed on
Commit
843a935
·
verified ·
1 Parent(s): 579a72e

Training done

Browse files
preprocessor_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
- 1280,
24
- 960
25
  ]
26
  }
 
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
  "size": [
23
+ 2560,
24
+ 1920
25
  ]
26
  }
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 768,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 768
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 1536,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 1536
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
tokenizer_config.json CHANGED
@@ -1530,11 +1530,18 @@
1530
  "cls_token": "<s>",
1531
  "eos_token": "</s>",
1532
  "mask_token": "<mask>",
 
1533
  "model_max_length": 1000000000000000019884624838656,
 
1534
  "pad_token": "<pad>",
 
 
1535
  "processor_class": "DonutProcessor",
1536
  "sep_token": "</s>",
1537
  "sp_model_kwargs": {},
 
1538
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
1539
  "unk_token": "<unk>"
1540
  }
 
1530
  "cls_token": "<s>",
1531
  "eos_token": "</s>",
1532
  "mask_token": "<mask>",
1533
+ "max_length": 768,
1534
  "model_max_length": 1000000000000000019884624838656,
1535
+ "pad_to_multiple_of": null,
1536
  "pad_token": "<pad>",
1537
+ "pad_token_type_id": 0,
1538
+ "padding_side": "right",
1539
  "processor_class": "DonutProcessor",
1540
  "sep_token": "</s>",
1541
  "sp_model_kwargs": {},
1542
+ "stride": 0,
1543
  "tokenizer_class": "XLMRobertaTokenizer",
1544
+ "truncation_side": "right",
1545
+ "truncation_strategy": "longest_first",
1546
  "unk_token": "<unk>"
1547
  }