{ "model_name": "latin_PP-OCRv5_mobile_rec", "model_type": "recognition", "framework": "PaddleOCR", "version": "PP-OCRv5", "language_group": "latin", "supported_languages": [ "English", "French", "German", "Afrikaans", "Italian", "Spanish", "Bosnian", "Portuguese", "Czech", "Welsh", "Danish", "Estonian", "Irish", "Croatian", "Uzbek", "Hungarian", "Serbian (Latin)", "Indonesian", "Occitan", "Icelandic", "Lithuanian", "Maori", "Malay", "Dutch", "Norwegian", "Polish", "Slovak", "Slovenian", "Albanian", "Swedish", "Swahili", "Tagalog", "Turkish", "Latin" ], "description": "PP-OCRv5 Latin script text recognition model (34 languages)", "accuracy": 84.7, "dataset": "3,111 Latin script images", "original_format": "PaddlePaddle", "converted_format": "ONNX", "opset_version": 11, "dictionary_file": "ppocrv5_latin_dict.txt", "input_shape": "dynamic (batch_size, 3, 32, dynamic_width)", "output_shape": "dynamic (batch_size, sequence_length, num_classes)", "source": "https://github.com/PaddlePaddle/PaddleOCR", "documentation": "https://www.paddleocr.ai/main/en/version3.x/algorithm/PP-OCRv5/PP-OCRv5_multi_languages.html", "usage": { "library": "onnxruntime", "preprocessing": "Grayscale or RGB image, resized to height=32, normalized", "postprocessing": "CTC decoding with character dictionary", "dictionary_format": "One character per line, UTF-8 encoding" } }