{ "model_type": "kiri-ocr", "architectures": ["KiriOCR"], "library_name": "pytorch", "torch_dtype": "float32", "hidden_size": 256, "num_hidden_layers": 7, "num_attention_heads": 8, "image_height": 48, "image_width": 640, "max_decoder_length": 260, "vocab_size": 966, "unk_token": "", "collapse_whitespace": true, "unicode_nfc": true, "encoder": { "dim": 256, "num_layers": 4, "num_heads": 8, "feedforward_dim": 1024, "dropout": 0.15 }, "decoder": { "enabled": true, "dim": 256, "num_layers": 3, "num_heads": 8, "feedforward_dim": 1024 }, "ctc": { "enabled": true, "fusion_alpha": 0.5 }, "language_model": { "enabled": true, "fusion_enabled_eval": true, "fusion_alpha": 0.35 }, "inference": { "use_fp16": false, "use_autocast": false, "beam_width": 4, "beam_length_penalty": 0.6, "eos_logp_bias": 5.0, "eos_logp_boost": 5.0, "eos_bias_until_length": 3, "repeat_last_penalty": 3.0, "unk_logp_penalty": 2.0, "max_length_ratio": 1.5, "max_length_pad": 10, "memory_max_length_ratio": 0.75 }, "preprocessing": { "mean": 0.5, "std": 0.5, "pad_value": 128 }, "transformers_version": "4.40.0" }