{
  "model_type": "kiri-ocr",
  "architectures": ["KiriOCR"],
  "library_name": "pytorch",
  "torch_dtype": "float32",

  "hidden_size": 256,
  "num_hidden_layers": 7,
  "num_attention_heads": 8,

  "image_height": 48,
  "image_width": 640,
  "max_decoder_length": 260,

  "vocab_size": 966,
  "unk_token": "<unk>",

  "collapse_whitespace": true,
  "unicode_nfc": true,

  "encoder": {
    "dim": 256,
    "num_layers": 4,
    "num_heads": 8,
    "feedforward_dim": 1024,
    "dropout": 0.15
  },

  "decoder": {
    "enabled": true,
    "dim": 256,
    "num_layers": 3,
    "num_heads": 8,
    "feedforward_dim": 1024
  },

  "ctc": {
    "enabled": true,
    "fusion_alpha": 0.5
  },

  "language_model": {
    "enabled": true,
    "fusion_enabled_eval": true,
    "fusion_alpha": 0.35
  },

  "inference": {
    "use_fp16": false,
    "use_autocast": false,
    "beam_width": 4,
    "beam_length_penalty": 0.6,
    "eos_logp_bias": 5.0,
    "eos_logp_boost": 5.0,
    "eos_bias_until_length": 3,
    "repeat_last_penalty": 3.0,
    "unk_logp_penalty": 2.0,
    "max_length_ratio": 1.5,
    "max_length_pad": 10,
    "memory_max_length_ratio": 0.75
  },

  "preprocessing": {
    "mean": 0.5,
    "std": 0.5,
    "pad_value": 128
  },

  "transformers_version": "4.40.0"
}