{
  "model_name": "eslav_PP-OCRv5_mobile_rec",
  "model_type": "recognition",
  "framework": "PaddleOCR",
  "version": "PP-OCRv5",
  "language_group": "eslav",
  "supported_languages": [
    "Russian",
    "Bulgarian",
    "Ukrainian",
    "Belarusian",
    "English"
  ],
  "description": "PP-OCRv5 East Slavic text recognition model",
  "accuracy": 81.6,
  "dataset": "7,031 East Slavic text images",
  "original_format": "PaddlePaddle",
  "converted_format": "ONNX",
  "opset_version": 11,
  "dictionary_file": "ppocrv5_eslav_dict.txt",
  "input_shape": "dynamic (batch_size, 3, 32, dynamic_width)",
  "output_shape": "dynamic (batch_size, sequence_length, num_classes)",
  "source": "https://github.com/PaddlePaddle/PaddleOCR",
  "documentation": "https://www.paddleocr.ai/main/en/version3.x/algorithm/PP-OCRv5/PP-OCRv5_multi_languages.html",
  "usage": {
    "library": "onnxruntime",
    "preprocessing": "Grayscale or RGB image, resized to height=32, normalized",
    "postprocessing": "CTC decoding with character dictionary",
    "dictionary_format": "One character per line, UTF-8 encoding"
  }
}