{
  "model_type": "kiri-ocr",
  "architectures": ["KiriOCR"],
  "library_name": "pytorch",
  "torch_dtype": "float32",
  "hidden_size": 256,
  "num_hidden_layers": 7,
  "num_attention_heads": 8,
  "image_height": 48,
  "image_width": 640,
  "max_decoder_length": 260,
  "vocab_size": 966,
  "unk_token": "<unk>",
  "collapse_whitespace": true,
  "unicode_nfc": true,
  "encoder": {
    "dim": 256,
    "num_layers": 4,
    "num_heads": 8,
    "feedforward_dim": 1024,
    "dropout": 0.15
  },
  "decoder": {
    "enabled": true,
    "dim": 256,
    "num_layers": 3,
    "num_heads": 8,
    "feedforward_dim": 1024
  },
  "ctc": {
    "enabled": true,
    "fusion_alpha": 0.5
  },
  "language_model": {
    "enabled": true,
    "fusion_enabled_eval": true,
    "fusion_alpha": 0.35
  },
  "inference": {
    "use_fp16": false,
    "use_autocast": false,
    "beam_width": 4,
    "beam_length_penalty": 0.6,
    "eos_logp_bias": 5.0,
    "eos_logp_boost": 5.0,
    "eos_bias_until_length": 3,
    "repeat_last_penalty": 3.0,
    "unk_logp_penalty": 2.0,
    "max_length_ratio": 1.5,
    "max_length_pad": 10,
    "memory_max_length_ratio": 0.75
  },
  "preprocessing": {
    "mean": 0.5,
    "std": 0.5,
    "pad_value": 128
  },
  "transformers_version": "4.40.0"
}