{
"model_type": "kiri-ocr",
"architectures": ["KiriOCR"],
"library_name": "pytorch",
"torch_dtype": "float32",
"hidden_size": 256,
"num_hidden_layers": 7,
"num_attention_heads": 8,
"image_height": 48,
"image_width": 640,
"max_decoder_length": 260,
"vocab_size": 966,
"unk_token": "<unk>",
"collapse_whitespace": true,
"unicode_nfc": true,
"encoder": {
"dim": 256,
"num_layers": 4,
"num_heads": 8,
"feedforward_dim": 1024,
"dropout": 0.15
},
"decoder": {
"enabled": true,
"dim": 256,
"num_layers": 3,
"num_heads": 8,
"feedforward_dim": 1024
},
"ctc": {
"enabled": true,
"fusion_alpha": 0.5
},
"language_model": {
"enabled": true,
"fusion_enabled_eval": true,
"fusion_alpha": 0.35
},
"inference": {
"use_fp16": false,
"use_autocast": false,
"beam_width": 4,
"beam_length_penalty": 0.6,
"eos_logp_bias": 5.0,
"eos_logp_boost": 5.0,
"eos_bias_until_length": 3,
"repeat_last_penalty": 3.0,
"unk_logp_penalty": 2.0,
"max_length_ratio": 1.5,
"max_length_pad": 10,
"memory_max_length_ratio": 0.75
},
"preprocessing": {
"mean": 0.5,
"std": 0.5,
"pad_value": 128
},
"transformers_version": "4.40.0"
}