Reorg: move v2/v3/v4 pth to legacy/, English README as default (+ README_zh.md), update config.json

- moved 5 legacy pth files (v2/v3/v4) from repo root to legacy/ via in-repo LFS copy
- deleted two obsolete root yml (superseded by configs/rec/PP-OCRv5/*.yml)
- replaced README.md with English primary version (zh copy kept as README_zh.md)
- updated config.json to reflect the full 15-model v5 catalog + legacy map

No PP-OCRv5 safetensors / yml / dict URLs changed.

Files changed (10) hide show

PP-OCRv5_server_det.yml +0 -174
PP-OCRv5_server_rec.yml +0 -136
README.md +130 -98
README_zh.md +287 -0
config.json +113 -18
ch_ptocr_mobile_v2.0_cls_infer.pth → legacy/ch_ptocr_mobile_v2.0_cls_infer.pth +0 -0
ch_ptocr_v4_det_infer.pth → legacy/ch_ptocr_v4_det_infer.pth +0 -0
ch_ptocr_v4_rec_infer.pth → legacy/ch_ptocr_v4_rec_infer.pth +0 -0
en_ptocr_v3_det_infer.pth → legacy/en_ptocr_v3_det_infer.pth +0 -0
en_ptocr_v4_rec_infer.pth → legacy/en_ptocr_v4_rec_infer.pth +0 -0

PP-OCRv5_server_det.yml DELETED Viewed

@@ -1,174 +0,0 @@
-Global:
-  model_name: PP-OCRv5_server_det # To use static model for inference.
-  debug: false
-  use_gpu: true
-  epoch_num: &epoch_num 500
-  log_smooth_window: 20
-  print_batch_step: 10
-  save_model_dir: ./output/PP-OCRv5_server_det
-  save_epoch_step: 10
-  eval_batch_step:
-  - 0
-  - 1500
-  cal_metric_during_train: false
-  checkpoints:
-  pretrained_model: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PPHGNetV2_B4_ocr_det.pdparams
-  save_inference_dir: null
-  use_visualdl: false
-  infer_img: doc/imgs_en/img_10.jpg
-  save_res_path: ./checkpoints/det_db/predicts_db.txt
-  distributed: true
-Architecture:
-  model_type: det
-  algorithm: DB
-  Transform: null
-  Backbone:
-    name: PPHGNetV2_B4
-    det: True
-  Neck:
-    name: LKPAN
-    out_channels: 256
-    intracl: true
-  Head:
-    name: PFHeadLocal
-    k: 50
-    mode: "large"
-Loss:
-  name: DBLoss
-  balance_loss: true
-  main_loss_type: DiceLoss
-  alpha: 5
-  beta: 10
-  ohem_ratio: 3
-Optimizer:
-  name: Adam
-  beta1: 0.9
-  beta2: 0.999
-  lr:
-    name: Cosine
-    learning_rate: 0.001 #(8*8c)
-    warmup_epoch: 2
-  regularizer:
-    name: L2
-    factor: 1e-6
-PostProcess:
-  name: DBPostProcess
-  thresh: 0.3
-  box_thresh: 0.6
-  max_candidates: 1000
-  unclip_ratio: 1.5
-Metric:
-  name: DetMetric
-  main_indicator: hmean
-Train:
-  dataset:
-    name: SimpleDataSet
-    data_dir: ./train_data/icdar2015/text_localization/
-    label_file_list:
-      - ./train_data/icdar2015/text_localization/train_icdar2015_label.txt
-    ratio_list: [1.0]
-    transforms:
-    - DecodeImage:
-        img_mode: BGR
-        channel_first: false
-    - DetLabelEncode: null
-    - CopyPaste: null
-    - IaaAugment:
-        augmenter_args:
-        - type: Fliplr
-          args:
-            p: 0.5
-        - type: Affine
-          args:
-            rotate:
-            - -10
-            - 10
-        - type: Resize
-          args:
-            size:
-            - 0.5
-            - 3
-    - EastRandomCropData:
-        size:
-        - 640
-        - 640
-        max_tries: 50
-        keep_ratio: true
-    - MakeBorderMap:
-        shrink_ratio: 0.4
-        thresh_min: 0.3
-        thresh_max: 0.7
-        total_epoch: *epoch_num
-    - MakeShrinkMap:
-        shrink_ratio: 0.4
-        min_text_size: 8
-        total_epoch: *epoch_num
-    - NormalizeImage:
-        scale: 1./255.
-        mean:
-        - 0.485
-        - 0.456
-        - 0.406
-        std:
-        - 0.229
-        - 0.224
-        - 0.225
-        order: hwc
-    - ToCHWImage: null
-    - KeepKeys:
-        keep_keys:
-        - image
-        - threshold_map
-        - threshold_mask
-        - shrink_map
-        - shrink_mask
-  loader:
-    shuffle: true
-    drop_last: false
-    batch_size_per_card: 8
-    num_workers: 8
-Eval:
-  dataset:
-    name: SimpleDataSet
-    data_dir: ./train_data/icdar2015/text_localization/
-    label_file_list:
-      - ./train_data/icdar2015/text_localization/test_icdar2015_label.txt
-    transforms:
-    transforms:
-    - DecodeImage:
-        img_mode: BGR
-        channel_first: false
-    - DetLabelEncode: null
-    - DetResizeForTest:
-    - NormalizeImage:
-        scale: 1./255.
-        mean:
-        - 0.485
-        - 0.456
-        - 0.406
-        std:
-        - 0.229
-        - 0.224
-        - 0.225
-        order: hwc
-    - ToCHWImage: null
-    - KeepKeys:
-        keep_keys:
-        - image
-        - shape
-        - polys
-        - ignore_tags
-  loader:
-    shuffle: false
-    drop_last: false
-    batch_size_per_card: 1
-    num_workers: 2
-profiler_options: null

PP-OCRv5_server_rec.yml DELETED Viewed

@@ -1,136 +0,0 @@
-Global:
-  model_name: PP-OCRv5_server_rec # To use static model for inference.
-  debug: false
-  use_gpu: true
-  epoch_num: 75
-  log_smooth_window: 20
-  print_batch_step: 10
-  save_model_dir: ./output/PP-OCRv5_server_rec
-  save_epoch_step: 1
-  eval_batch_step: [0, 2000]
-  cal_metric_during_train: true
-  calc_epoch_interval: 1
-  pretrained_model:
-  checkpoints:
-  save_inference_dir:
-  use_visualdl: false
-  infer_img: doc/imgs_words/ch/word_1.jpg
-  character_dict_path: ./pytorchocr/utils/dict/ppocrv5_dict.txt
-  max_text_length: &max_text_length 25
-  infer_mode: false
-  use_space_char: true
-  distributed: true
-  save_res_path: ./output/rec/predicts_ppocrv5.txt
-  d2s_train_image_shape: [3, 48, 320]
-Optimizer:
-  name: Adam
-  beta1: 0.9
-  beta2: 0.999
-  lr:
-    name: Cosine
-    learning_rate: 0.0005
-    warmup_epoch: 1
-  regularizer:
-    name: L2
-    factor: 3.0e-05
-Architecture:
-  model_type: rec
-  algorithm: SVTR_HGNet
-  Transform:
-  Backbone:
-    name: PPHGNetV2_B4
-    text_rec: True
-  Head:
-    name: MultiHead
-    head_list:
-      - CTCHead:
-          Neck:
-            name: svtr
-            dims: 120
-            depth: 2
-            hidden_dims: 120
-            kernel_size: [1, 3]
-            use_guide: True
-          Head:
-            fc_decay: 0.00001
-      - NRTRHead:
-          nrtr_dim: 384
-          max_text_length: *max_text_length
-Loss:
-  name: MultiLoss
-  loss_config_list:
-    - CTCLoss:
-    - NRTRLoss:
-PostProcess:
-  name: CTCLabelDecode
-Metric:
-  name: RecMetric
-  main_indicator: acc
-Train:
-  dataset:
-    name: MultiScaleDataSet
-    ds_width: false
-    data_dir: ./train_data/
-    ext_op_transform_idx: 1
-    label_file_list:
-    - ./train_data/train_list.txt
-    transforms:
-    - DecodeImage:
-        img_mode: BGR
-        channel_first: false
-    - RecAug:
-    - MultiLabelEncode:
-        gtc_encode: NRTRLabelEncode
-    - KeepKeys:
-        keep_keys:
-        - image
-        - label_ctc
-        - label_gtc
-        - length
-        - valid_ratio
-  sampler:
-    name: MultiScaleSampler
-    scales: [[320, 32], [320, 48], [320, 64]]
-    first_bs: &bs 128
-    fix_bs: false
-    divided_factor: [8, 16] # w, h
-    is_training: True
-  loader:
-    shuffle: true
-    batch_size_per_card: *bs
-    drop_last: true
-    num_workers: 16
-Eval:
-  dataset:
-    name: SimpleDataSet
-    data_dir: ./train_data
-    label_file_list:
-    - ./train_data/val_list.txt
-    transforms:
-    - DecodeImage:
-        img_mode: BGR
-        channel_first: false
-    - MultiLabelEncode:
-        gtc_encode: NRTRLabelEncode
-    - RecResizeImg:
-        image_shape: [3, 48, 320]
-    - KeepKeys:
-        keep_keys:
-        - image
-        - label_ctc
-        - label_gtc
-        - length
-        - valid_ratio
-  loader:
-    shuffle: false
-    drop_last: false
-    batch_size_per_card: 128
-    num_workers: 4

README.md CHANGED Viewed

@@ -28,116 +28,128 @@ pipeline_tag: image-to-text
 # PP-OCRv5 PyTorch Model Zoo
-PP-OCRv5 全系列模型的 **PyTorch** 版本（safetensors 格式），从百度 PaddlePaddle 官方 `.pdparams` 动态图权重精确转换而来，**推理结果与 PaddleOCR 原版位精确一致**。
-- **文本检测**：2 个（mobile / server）
-- **文本识别（基础）**：2 个，覆盖 简中 / 繁中 / 英文 / 日文
-- **文本识别（多语言）**：11 个，覆盖 100+ 语种（韩 / 法 / 德 / 俄 / 阿拉伯 / 天城文 / 泰 / 希腊 / 泰米尔 / 泰卢固 / 纯英文等）
-> 本仓库**仅包含权重、配置和字典**，不包含推理代码。推理请配合 [PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) 使用，或参考下文"自定义 Python 推理"章节自行集成。
 ---
-## 仓库结构
 ```
 .
-├── README.md
-├── LICENSE                                                     # Apache 2.0
-├── *.safetensors                                               # 15 个 PP-OCRv5 权重（位于根目录）
 ├── configs/
 │   ├── det/PP-OCRv5/
-│   │   ├── PP-OCRv5_mobile_det.yml                             # 移动端检测
-│   │   └── PP-OCRv5_server_det.yml                             # 服务端检测
 │   └── rec/PP-OCRv5/
-│       ├── PP-OCRv5_mobile_rec.yml                             # 基础识别（中繁英日，移动端）
-│       ├── PP-OCRv5_server_rec.yml                             # 基础识别（中繁英日，服务端）
-│       └── multi_language/
-│           ├── en_PP-OCRv5_mobile_rec.yaml                     # 英文专用
-│           ├── korean_PP-OCRv5_mobile_rec.yml                  # 韩文 + 英文
-│           ├── latin_PP-OCRv5_mobile_rec.yml                   # 拉丁字母 40+ 语种（法/德/西/意/葡 等）
-│           ├── eslav_PP-OCRv5_mobile_rec.yml                   # 东斯拉夫（俄/白俄/乌克兰）
-│           ├── cyrillic_PP-OCRv5_mobile_rec.yaml               # 西里尔字母 33 种
-│           ├── arabic_PP-OCRv5_mobile_rec.yaml                 # 阿拉伯 / 波斯 / 维吾尔 / 乌尔都 等
-│           ├── devanagari_PP-OCRv5_mobile_rec.yaml             # 天城文系 14 种（印地/马拉地/尼泊尔/梵文 等）
-│           ├── th_PP-OCRv5_mobile_rec.yaml                     # 泰文
-│           ├── el_PP-OCRv5_mobile_rec.yaml                     # 希腊文
-│           ├── ta_PP-OCRv5_mobile_rec.yaml                     # 泰米尔文
-│           └── te_PP-OCRv5_mobile_rec.yaml                     # 泰卢固文
-└── dicts/                                                      # 字符集字典（rec 推理必需）
-    ├── ppocrv5_dict.txt                                        # 基础（中繁英日）
-    ├── ppocrv5_en_dict.txt
-    ├── ppocrv5_korean_dict.txt
-    └── ...（共 12 个）
 ```
-> 所有 rec yaml 的 `character_dict_path` 已改写为相对路径 `./dicts/...`，`git clone` 或 `snapshot_download` 下载后**无需修改路径**即可使用。
 ---
-## 模型清单
-### 文本检测
-| 权重文件 | 对应 yaml | 场景 | 文件大小 |
 |---|---|---|---|
-| `ptocr_v5_mobile_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_mobile_det.yml` | 移动端 / CPU 推荐 | ~14 MB |
-| `ptocr_v5_server_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_server_det.yml` | 服务端 / 高精度 | ~101 MB |
-### 文本识别（基础）
-| 权重文件 | 对应 yaml | 支持语种 | 文件大小 |
 |---|---|---|---|
-| `ptocr_v5_mobile_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_mobile_rec.yml` | 简中 / 繁中 / 英文 / 日文 | ~31 MB |
-| `ptocr_v5_server_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_server_rec.yml` | 简中 / 繁中 / 英文 / 日文 | ~128 MB |
-### 文本识别（多语言）
-所有多语言识别模型共享相同网络（`SVTR_LCNet` + `PPLCNetV3`），仅字符集不同。文件大小 23–28 MB。
-| 权重文件 | 支持语种 |
 |---|---|
-| `ptocr_v5_en_mobile_rec.safetensors` | 英文专用（针对英文场景定向优化） |
-| `ptocr_v5_korean_mobile_rec.safetensors` | 韩文、英文 |
-| `ptocr_v5_latin_mobile_rec.safetensors` | 法文、德文、南非荷兰文、意大利文、西班牙文、葡萄牙文、捷克文、丹麦文、爱沙尼亚文、克罗地亚文、荷兰文、挪威文、波兰文、瑞典文、芬兰文、土耳其文、越南文 等 40+ 语种 |
-| `ptocr_v5_eslav_mobile_rec.safetensors` | 俄罗斯文、白俄罗斯文、乌克兰文、英文 |
-| `ptocr_v5_cyrillic_mobile_rec.safetensors` | 俄文、白俄文、乌克兰文、塞尔维亚（西里尔）、保加利亚、蒙古 等 33 种西里尔字母语言 |
-| `ptocr_v5_arabic_mobile_rec.safetensors` | 阿拉伯文、波斯文、维吾尔文、乌尔都文、普什图文、信德文 等 |
-| `ptocr_v5_devanagari_mobile_rec.safetensors` | 印地文、马拉地文、尼泊尔文、梵文 等 14 种天城文系语言 |
-| `ptocr_v5_th_mobile_rec.safetensors` | 泰文、英文 |
-| `ptocr_v5_el_mobile_rec.safetensors` | 希腊文、英文 |
-| `ptocr_v5_ta_mobile_rec.safetensors` | 泰米尔文、英文 |
-| `ptocr_v5_te_mobile_rec.safetensors` | 泰卢固文、英文 |
 ---
-## 快速开始
-### 下载权重
 ```python
 from huggingface_hub import snapshot_download, hf_hub_download
-# 方式 1：下载整个仓库（权重 + yml + 字典 + README）
 repo_dir = snapshot_download(repo_id="JoyCN/PaddleOCR-Pytorch")
-print("仓库下载到：", repo_dir)
-# 方式 2：只下载单个权重文件
 weight_path = hf_hub_download(
     repo_id="JoyCN/PaddleOCR-Pytorch",
-    filename="ptocr_v5_korean_mobile_rec.safetensors"
 )
 ```
-### 使用 PaddleOCR2Pytorch 项目做推理（推荐）
 ```bash
-# 1. clone 推理代码仓
 git clone https://github.com/frotms/PaddleOCR2Pytorch
 cd PaddleOCR2Pytorch
 pip install torch safetensors pyyaml shapely pyclipper opencv-python pillow scikit-image
-# 2. 用本仓库下载的权重 + yml（假设下载到 /path/to/hf_repo）
 python tools/infer/predict_rec.py \
   --image_dir doc/imgs_words/korean/1.jpg \
   --rec_algorithm SVTR_LCNet \
@@ -148,36 +160,35 @@ python tools/infer/predict_rec.py \
   --use_gpu False
 ```
-> PaddleOCR2Pytorch 的 `base_ocr_v20.py` 已原生支持 `.safetensors`（按后缀自动识别，向后兼容 `.pth`）。
-### 自定义 Python 推理代码
-如果你不想依赖 PaddleOCR2Pytorch 完整推理栈，下面是**一个最小 rec 推理代码片段**的骨架。它展示了如何加载权重并做前向推理——但你仍然需要 PaddleOCR2Pytorch 项目中的网络定义代码（`pytorchocr/modeling/`）。
 ```python
 import sys, numpy as np, cv2, torch, yaml
 from safetensors.torch import load_file
-# 以下 import 需要你先 clone https://github.com/frotms/PaddleOCR2Pytorch
-# 并把其根目录加入 PYTHONPATH
 sys.path.insert(0, "/path/to/PaddleOCR2Pytorch")
 from pytorchocr.modeling.architectures.base_model import BaseModel
 from pytorchocr.postprocess import build_post_process
-HF_REPO = "/path/to/hf_repo"   # snapshot_download 得到的路径
 yml_path    = f"{HF_REPO}/configs/rec/PP-OCRv5/multi_language/korean_PP-OCRv5_mobile_rec.yml"
 weight_path = f"{HF_REPO}/ptocr_v5_korean_mobile_rec.safetensors"
-# 1. 读配置 + 字符集
 with open(yml_path, encoding="utf-8") as f:
     cfg = yaml.safe_load(f)
-dict_path = cfg["Global"]["character_dict_path"]      # './dicts/ppocrv5_korean_dict.txt'
 dict_abs  = f"{HF_REPO}/{dict_path.lstrip('./')}"
 with open(dict_abs, encoding="utf-8") as f:
     chars = [l.strip("\n\r") for l in f]
-n_char = len(chars) + 2                               # +1 blank, +1 space（依 use_space_char 而定）
-# 2. 构建网络 + 加载权重（safetensors 零代码执行、mmap 快速加载）
 cfg["Architecture"]["Head"]["out_channels_list"] = {
     "CTCLabelDecode": n_char,
     "SARLabelDecode": n_char + 2,
@@ -187,7 +198,7 @@ net = BaseModel(cfg["Architecture"], out_channels=n_char)
 net.load_state_dict(load_file(weight_path, device="cpu"))
 net.eval()
-# 3. 读图 + 预处理（resize 到 [3, 48, 320]，归一化到 [-1, 1]）
 img = cv2.imread("input_word.jpg")
 h, w = img.shape[:2]
 ratio = w / h
@@ -199,56 +210,77 @@ x = canvas.astype(np.float32).transpose(2, 0, 1) / 255.0
 x = (x - 0.5) / 0.5
 x = torch.from_numpy(x).unsqueeze(0)
-# 4. 前向 + CTC 解码
 with torch.no_grad():
     logits = net(x)
-post_op = build_post_process({"name": "CTCLabelDecode",
-                              "character_dict_path": dict_abs,
-                              "use_space_char": True})
 result = post_op(logits)
-print("识别结果:", result)     # e.g. [('바탕으로', 0.9998)]
 ```
-### 推理所需依赖
 ```
-torch >= 1.13
-safetensors >= 0.4
 numpy, pillow, opencv-python
 pyyaml, shapely, pyclipper
-scikit-image      # det 后处理需要
 ```
 ---
-## 转换 & 验证来源
-- 源权重：PaddlePaddle 官方 `.pdparams`，来自 [paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/](https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/)
-- 转换工具：[PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) 中的 `converter/ppocr_v5_det_converter.py` / `ppocr_v5_rec_converter.py`
-- 验证：在 macOS Apple Silicon (M 系列) CPU 环境下做过端到端推理，**多语言识别结果与 PaddleOCR 官方 `.pdparams` 位精确一致**（float32 小数点后 8 位完全相同）
-样例推理输出（CPU，<0.7 s / 张）：
-| 样例 | 识别结果 | 置信度 |
 |---|---|---|
-| 中文 `word_1.jpg` | 韩国小馆 | 0.99797755 |
-| 韩文 `korean/1.jpg` | 바탕으로 | 0.99977183 |
-| 法文 `french/1.jpg` | de l'amendement, | 0.99656343 |
-| 阿拉伯 `arabic/ar_1.jpg` | الكيصياوي | 0.68281130 |
 ---
-## 许可证 & 致谢
 - **License**: Apache License 2.0
-- 权重来源：[PaddleOCR](https://github.com/PaddlePaddle/PaddleOCR) by PaddlePaddle 团队，Apache 2.0
-- 转换工具：[PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch)，Apache 2.0
-如果本仓库对你有帮助，请同时给上述两个原始项目 star 致谢。
 ---
-## 引用
 ```bibtex
 @misc{pp_ocrv5_pytorch_joycn_2025,

 # PP-OCRv5 PyTorch Model Zoo
+PyTorch weights (**safetensors** format) for the full **PP-OCRv5** family, converted bit-exactly from the official PaddlePaddle `.pdparams` dynamic-graph weights — inference outputs are **identical to the original PaddleOCR** down to float32 precision.
+- **Text Detection**: 2 models (mobile / server)
+- **Text Recognition (base)**: 2 models covering Simplified Chinese / Traditional Chinese / English / Japanese
+- **Text Recognition (multilingual)**: 11 models covering **100+ languages** (Korean, French, German, Russian, Arabic, Devanagari, Thai, Greek, Tamil, Telugu, etc.)
+> This repo contains **weights + configs + dictionaries only**, not inference code. For inference, use [PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch), or follow the "Custom Python Inference" section below.
+>
+> Also available: [README_zh.md](./README_zh.md) (中文版).
 ---
+## Repository Layout
 ```
 .
+├── README.md / README_zh.md
+├── LICENSE                                                 # Apache 2.0
+├── config.json                                             # Repo metadata + model index
+│
+├── ptocr_v5_*.safetensors                                  # 15 PP-OCRv5 weights at root (stable URLs)
+├── ptocr_v5_server_{det,rec}.pth                           # Legacy pth copies of V5 server (kept)
+│
 ├── configs/
 │   ├── det/PP-OCRv5/
+│   │   ├── PP-OCRv5_mobile_det.yml
+│   │   └── PP-OCRv5_server_det.yml
 │   └── rec/PP-OCRv5/
+│       ├── PP-OCRv5_mobile_rec.yml                         # zh / zh-Hant / en / ja
+│       ├── PP-OCRv5_server_rec.yml
+│       └── multi_language/                                 # 11 multilingual rec yamls
+│           ├── en_PP-OCRv5_mobile_rec.yaml
+│           ├── korean_PP-OCRv5_mobile_rec.yml
+│           ├── latin_PP-OCRv5_mobile_rec.yml               # French / German / Spanish / ...  (40+ Latin-script)
+│           ├── eslav_PP-OCRv5_mobile_rec.yml               # Russian / Belarusian / Ukrainian
+│           ├── cyrillic_PP-OCRv5_mobile_rec.yaml           # 33 Cyrillic-script languages
+│           ├── arabic_PP-OCRv5_mobile_rec.yaml             # Arabic / Persian / Uyghur / Urdu / ...
+│           ├── devanagari_PP-OCRv5_mobile_rec.yaml         # Hindi / Marathi / Nepali / Sanskrit / ...
+│           ├── th_PP-OCRv5_mobile_rec.yaml                 # Thai
+│           ├── el_PP-OCRv5_mobile_rec.yaml                 # Greek
+│           ├── ta_PP-OCRv5_mobile_rec.yaml                 # Tamil
+│           └── te_PP-OCRv5_mobile_rec.yaml                 # Telugu
+│
+├── dicts/                                                  # Character set dictionaries (required for rec)
+│   ├── ppocrv5_dict.txt                                    # base (zh / zh-Hant / en / ja)
+│   └── ppocrv5_<lang>_dict.txt                             # 11 multilingual dicts
+│
+└── legacy/                                                 # Older PP-OCR v2/v3/v4 weights (kept for back-compat)
+    ├── ch_ptocr_mobile_v2.0_cls_infer.pth
+    ├── ch_ptocr_v4_det_infer.pth
+    ├── ch_ptocr_v4_rec_infer.pth
+    ├── en_ptocr_v3_det_infer.pth
+    └── en_ptocr_v4_rec_infer.pth
 ```
+> All rec yamls use relative `character_dict_path: ./dicts/...`. After `git clone` or `snapshot_download`, paths resolve correctly with **no modification required**.
 ---
+## Model Catalog
+### Text Detection
+| Weight | Config | Use case | Size |
 |---|---|---|---|
+| `ptocr_v5_mobile_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_mobile_det.yml` | Mobile / CPU-friendly | ~14 MB |
+| `ptocr_v5_server_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_server_det.yml` | Server / high-accuracy | ~101 MB |
+### Text Recognition (Base)
+| Weight | Config | Languages | Size |
 |---|---|---|---|
+| `ptocr_v5_mobile_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_mobile_rec.yml` | Simplified / Traditional Chinese, English, Japanese | ~31 MB |
+| `ptocr_v5_server_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_server_rec.yml` | same as above, higher accuracy | ~128 MB |
+### Text Recognition (Multilingual)
+All multilingual rec models share the same architecture (`SVTR_LCNet` + `PPLCNetV3`); they differ only by character dictionary. File size 23–28 MB each.
+| Weight | Supported languages |
 |---|---|
+| `ptocr_v5_en_mobile_rec.safetensors` | English (dedicated model optimized for English-only scenarios) |
+| `ptocr_v5_korean_mobile_rec.safetensors` | Korean, English |
+| `ptocr_v5_latin_mobile_rec.safetensors` | French, German, Spanish, Italian, Portuguese, Dutch, Swedish, Danish, Norwegian, Finnish, Polish, Czech, Turkish, Vietnamese, ... (40+ Latin-script) |
+| `ptocr_v5_eslav_mobile_rec.safetensors` | Russian, Belarusian, Ukrainian, English |
+| `ptocr_v5_cyrillic_mobile_rec.safetensors` | 33 Cyrillic-script languages (Russian, Serbian-Cyrillic, Bulgarian, Mongolian, Kazakh, ...) |
+| `ptocr_v5_arabic_mobile_rec.safetensors` | Arabic, Persian, Uyghur, Urdu, Pashto, Sindhi, ... |
+| `ptocr_v5_devanagari_mobile_rec.safetensors` | 14 Devanagari-script languages (Hindi, Marathi, Nepali, Sanskrit, ...) |
+| `ptocr_v5_th_mobile_rec.safetensors` | Thai, English |
+| `ptocr_v5_el_mobile_rec.safetensors` | Greek, English |
+| `ptocr_v5_ta_mobile_rec.safetensors` | Tamil, English |
+| `ptocr_v5_te_mobile_rec.safetensors` | Telugu, English |
 ---
+## Quick Start
+### Download Weights
 ```python
 from huggingface_hub import snapshot_download, hf_hub_download
+# Option 1: download the whole repo (weights + configs + dicts + README)
 repo_dir = snapshot_download(repo_id="JoyCN/PaddleOCR-Pytorch")
+print("downloaded to:", repo_dir)
+# Option 2: fetch a single weight file
 weight_path = hf_hub_download(
     repo_id="JoyCN/PaddleOCR-Pytorch",
+    filename="ptocr_v5_korean_mobile_rec.safetensors",
 )
 ```
+### Inference via PaddleOCR2Pytorch (Recommended)
 ```bash
+# 1. clone the inference code repo
 git clone https://github.com/frotms/PaddleOCR2Pytorch
 cd PaddleOCR2Pytorch
 pip install torch safetensors pyyaml shapely pyclipper opencv-python pillow scikit-image
+# 2. Assume you ran snapshot_download above into /path/to/hf_repo
 python tools/infer/predict_rec.py \
   --image_dir doc/imgs_words/korean/1.jpg \
   --rec_algorithm SVTR_LCNet \
   --use_gpu False
 ```
+> PaddleOCR2Pytorch `base_ocr_v20.py` auto-detects `.safetensors` vs `.pth` by extension (backward compatible).
+### Custom Python Inference
+A minimal skeleton showing how to load the weights and run a forward pass. You still need the network definitions from the PaddleOCR2Pytorch `pytorchocr/modeling/` package.
 ```python
 import sys, numpy as np, cv2, torch, yaml
 from safetensors.torch import load_file
+# Requires https://github.com/frotms/PaddleOCR2Pytorch on PYTHONPATH
 sys.path.insert(0, "/path/to/PaddleOCR2Pytorch")
 from pytorchocr.modeling.architectures.base_model import BaseModel
 from pytorchocr.postprocess import build_post_process
+HF_REPO = "/path/to/hf_repo"   # the path returned by snapshot_download
 yml_path    = f"{HF_REPO}/configs/rec/PP-OCRv5/multi_language/korean_PP-OCRv5_mobile_rec.yml"
 weight_path = f"{HF_REPO}/ptocr_v5_korean_mobile_rec.safetensors"
+# 1. load config + dictionary
 with open(yml_path, encoding="utf-8") as f:
     cfg = yaml.safe_load(f)
+dict_path = cfg["Global"]["character_dict_path"]          # './dicts/ppocrv5_korean_dict.txt'
 dict_abs  = f"{HF_REPO}/{dict_path.lstrip('./')}"
 with open(dict_abs, encoding="utf-8") as f:
     chars = [l.strip("\n\r") for l in f]
+n_char = len(chars) + 2                                   # +1 blank, +1 space (if use_space_char)
+# 2. build network + load weights (safetensors = zero-code-exec, mmap-fast)
 cfg["Architecture"]["Head"]["out_channels_list"] = {
     "CTCLabelDecode": n_char,
     "SARLabelDecode": n_char + 2,
 net.load_state_dict(load_file(weight_path, device="cpu"))
 net.eval()
+# 3. preprocess (resize to [3, 48, 320], normalize to [-1, 1])
 img = cv2.imread("input_word.jpg")
 h, w = img.shape[:2]
 ratio = w / h
 x = (x - 0.5) / 0.5
 x = torch.from_numpy(x).unsqueeze(0)
+# 4. forward + CTC decode
 with torch.no_grad():
     logits = net(x)
+post_op = build_post_process({
+    "name": "CTCLabelDecode",
+    "character_dict_path": dict_abs,
+    "use_space_char": True,
+})
 result = post_op(logits)
+print("prediction:", result)          # e.g. [('바탕으로', 0.9998)]
 ```
+### Runtime Dependencies
 ```
+torch        >= 1.13
+safetensors  >= 0.4
 numpy, pillow, opencv-python
 pyyaml, shapely, pyclipper
+scikit-image                # required by det post-processing
 ```
 ---
+## Conversion & Verification
+- **Source weights**: official PaddlePaddle `.pdparams` from
+  `https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/`
+- **Converter**: [PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) — scripts `converter/ppocr_v5_det_converter.py` / `converter/ppocr_v5_rec_converter.py`
+- **Verification**: end-to-end inference was run on macOS Apple Silicon (M-series) CPU; multilingual rec outputs are **bit-exact** with the original PaddleOCR `.pdparams` (float32 values match to 8 decimal places).
+Sample inference results (CPU, < 0.7 s / image):
+| Sample | Prediction | Confidence |
 |---|---|---|
+| Chinese `word_1.jpg` | 韩国小馆 | 0.99797755 |
+| Korean `korean/1.jpg` | 바탕으로 | 0.99977183 |
+| French `french/1.jpg` | de l'amendement, | 0.99656343 |
+| Arabic `arabic/ar_1.jpg` | الكيصياوي | 0.68281130 |
 ---
+## Legacy Files (`legacy/`)
+Older PP-OCR (v2 / v3 / v4) checkpoints previously at the repo root have been **moved into `legacy/`** for clarity. They are still present and continue to work — just add the `legacy/` prefix to your path.
+If you were previously loading any of these files from the repo root, use the following paths instead:
+```
+legacy/ch_ptocr_mobile_v2.0_cls_infer.pth
+legacy/ch_ptocr_v4_det_infer.pth
+legacy/ch_ptocr_v4_rec_infer.pth
+legacy/en_ptocr_v3_det_infer.pth
+legacy/en_ptocr_v4_rec_infer.pth
+```
+The 15 PP-OCRv5 safetensors files **remain at the repo root** — their URLs did not change.
+---
+## License & Credits
 - **License**: Apache License 2.0
+- Weights originate from [PaddleOCR](https://github.com/PaddlePaddle/PaddleOCR) by the PaddlePaddle team (Apache 2.0).
+- Converted with [PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) (Apache 2.0).
+If this repo helps you, please also star both of those original projects.
 ---
+## Citation
 ```bibtex
 @misc{pp_ocrv5_pytorch_joycn_2025,

README_zh.md ADDED Viewed

	@@ -0,0 +1,287 @@

+---
+license: apache-2.0
+language:
+- zh
+- en
+- ja
+- ko
+- fr
+- de
+- es
+- ru
+- ar
+- hi
+- th
+- el
+library_name: pytorch
+tags:
+- ocr
+- text-detection
+- text-recognition
+- paddleocr
+- pp-ocrv5
+- multilingual
+- svtr
+- db
+pipeline_tag: image-to-text
+---
+# PP-OCRv5 PyTorch Model Zoo（中文版）
+> 本仓库的主 README 为英文版 [README.md](./README.md)。本文件为中文对照版。
+PP-OCRv5 全系列模型的 **PyTorch** 版本（safetensors 格式），从百度 PaddlePaddle 官方 `.pdparams` 动态图权重精确转换而来，**推理结果与 PaddleOCR 原版位精确一致**。
+- **文本检测**：2 个（mobile / server）
+- **文本识别（基础）**：2 个，覆盖 简中 / 繁中 / 英文 / 日文
+- **文本识别（多语言）**：11 个，覆盖 100+ 语种（韩 / 法 / 德 / 俄 / 阿拉伯 / 天城文 / 泰 / 希腊 / 泰米尔 / 泰卢固 / 纯英文等）
+> 本仓库**仅包含权重、配置和字典**，不包含推理代码。推理请配合 [PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) 使用，或参考下文"自定义 Python 推理"章节自行集成。
+---
+## 仓库结构
+```
+.
+├── README.md / README_zh.md
+├── LICENSE                                                     # Apache 2.0
+├── config.json                                                 # 仓库元数据 + 模型索引
+├── *.safetensors                                               # 15 个 PP-OCRv5 权重（位于根目录，URL 稳定）
+├── ptocr_v5_server_{det,rec}.pth                               # V5 服务端的 pth 副本（向后兼容保留）
+├── configs/
+│   ├── det/PP-OCRv5/
+│   │   ├── PP-OCRv5_mobile_det.yml                             # 移动端检测
+│   │   └── PP-OCRv5_server_det.yml                             # 服务端检测
+│   └── rec/PP-OCRv5/
+│       ├── PP-OCRv5_mobile_rec.yml                             # 基础识别（中繁英日，移动端）
+│       ├── PP-OCRv5_server_rec.yml                             # 基础识别（中繁英日，服务端）
+│       └── multi_language/
+│           ├── en_PP-OCRv5_mobile_rec.yaml                     # 英文专用
+│           ├── korean_PP-OCRv5_mobile_rec.yml                  # 韩文 + 英文
+│           ├── latin_PP-OCRv5_mobile_rec.yml                   # 拉丁字母 40+ 语种（法/德/西/意/葡 等）
+│           ├── eslav_PP-OCRv5_mobile_rec.yml                   # 东斯拉夫（俄/白俄/乌克兰）
+│           ├── cyrillic_PP-OCRv5_mobile_rec.yaml               # 西里尔字母 33 种
+│           ├── arabic_PP-OCRv5_mobile_rec.yaml                 # 阿拉伯 / 波斯 / 维吾尔 / 乌尔都 等
+│           ├── devanagari_PP-OCRv5_mobile_rec.yaml             # 天城文系 14 种（印地/马拉地/尼泊尔/梵文 等）
+│           ├── th_PP-OCRv5_mobile_rec.yaml                     # 泰文
+│           ├── el_PP-OCRv5_mobile_rec.yaml                     # 希腊文
+│           ├── ta_PP-OCRv5_mobile_rec.yaml                     # 泰米尔文
+│           └── te_PP-OCRv5_mobile_rec.yaml                     # 泰卢固文
+├── dicts/                                                      # 字符集字典（rec 推理必需）
+│   ├── ppocrv5_dict.txt                                        # 基础（中繁英日）
+│   ├── ppocrv5_en_dict.txt
+│   ├── ppocrv5_korean_dict.txt
+│   └── ...（共 12 个）
+└── legacy/                                                     # 旧版本（v2/v3/v4）pth 集中目录
+    ├── ch_ptocr_mobile_v2.0_cls_infer.pth
+    ├── ch_ptocr_v4_det_infer.pth
+    ├── ch_ptocr_v4_rec_infer.pth
+    ├── en_ptocr_v3_det_infer.pth
+    └── en_ptocr_v4_rec_infer.pth
+```
+> 所有 rec yaml 的 `character_dict_path` 已改写为相对路径 `./dicts/...`，`git clone` 或 `snapshot_download` 下载后**无需修改路径**即可使用。
+---
+## 模型清单
+### 文本检测
+| 权重文件 | 对应 yaml | 场景 | 文件大小 |
+|---|---|---|---|
+| `ptocr_v5_mobile_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_mobile_det.yml` | 移动端 / CPU 推荐 | ~14 MB |
+| `ptocr_v5_server_det.safetensors` | `configs/det/PP-OCRv5/PP-OCRv5_server_det.yml` | 服务端 / 高精度 | ~101 MB |
+### 文本识别（基础）
+| 权重文件 | 对应 yaml | 支持语种 | 文件大小 |
+|---|---|---|---|
+| `ptocr_v5_mobile_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_mobile_rec.yml` | 简中 / 繁中 / 英文 / 日文 | ~31 MB |
+| `ptocr_v5_server_rec.safetensors` | `configs/rec/PP-OCRv5/PP-OCRv5_server_rec.yml` | 简中 / 繁中 / 英文 / 日文 | ~128 MB |
+### 文本识别（多语言）
+所有多语言识别模型共享相同网络（`SVTR_LCNet` + `PPLCNetV3`），仅字符集不同。文件大小 23–28 MB。
+| 权重文件 | 支持语种 |
+|---|---|
+| `ptocr_v5_en_mobile_rec.safetensors` | 英文专用（针对英文场景定向优化） |
+| `ptocr_v5_korean_mobile_rec.safetensors` | 韩文、英文 |
+| `ptocr_v5_latin_mobile_rec.safetensors` | 法文、德文、南非荷兰文、意大利文、西班牙文、葡萄牙文、捷克文、丹麦文、爱沙尼亚文、克罗地亚文、荷兰文、挪威文、波兰文、瑞典文、芬兰文、土耳其文、越南文 等 40+ 语种 |
+| `ptocr_v5_eslav_mobile_rec.safetensors` | 俄罗斯文、白俄罗斯文、乌克兰文、英文 |
+| `ptocr_v5_cyrillic_mobile_rec.safetensors` | 俄文、白俄文、乌克兰文、塞尔维亚（西里尔）、保加利亚、蒙古 等 33 种西里尔字母语言 |
+| `ptocr_v5_arabic_mobile_rec.safetensors` | 阿拉伯文、波斯文、维吾尔文、乌尔都文、普什图文、信德文 等 |
+| `ptocr_v5_devanagari_mobile_rec.safetensors` | 印地文、马拉地文、尼泊尔文、梵文 等 14 种天城文系语言 |
+| `ptocr_v5_th_mobile_rec.safetensors` | 泰文、英文 |
+| `ptocr_v5_el_mobile_rec.safetensors` | 希腊文、英文 |
+| `ptocr_v5_ta_mobile_rec.safetensors` | 泰米尔文、英文 |
+| `ptocr_v5_te_mobile_rec.safetensors` | 泰卢固文、英文 |
+---
+## 快速开始
+### 下载权重
+```python
+from huggingface_hub import snapshot_download, hf_hub_download
+# 方式 1：下载整个仓库（权重 + yml + 字典 + README）
+repo_dir = snapshot_download(repo_id="JoyCN/PaddleOCR-Pytorch")
+print("仓库下载到：", repo_dir)
+# 方式 2：只下载单个权重文件
+weight_path = hf_hub_download(
+    repo_id="JoyCN/PaddleOCR-Pytorch",
+    filename="ptocr_v5_korean_mobile_rec.safetensors"
+)
+```
+### 使用 PaddleOCR2Pytorch 项目做推理（推荐）
+```bash
+# 1. clone 推理代码仓
+git clone https://github.com/frotms/PaddleOCR2Pytorch
+cd PaddleOCR2Pytorch
+pip install torch safetensors pyyaml shapely pyclipper opencv-python pillow scikit-image
+# 2. 用本仓库下载的权重 + yml（假设下载到 /path/to/hf_repo）
+python tools/infer/predict_rec.py \
+  --image_dir doc/imgs_words/korean/1.jpg \
+  --rec_algorithm SVTR_LCNet \
+  --rec_model_path /path/to/hf_repo/ptocr_v5_korean_mobile_rec.safetensors \
+  --rec_yaml_path  /path/to/hf_repo/configs/rec/PP-OCRv5/multi_language/korean_PP-OCRv5_mobile_rec.yml \
+  --rec_image_shape "3,48,320" \
+  --rec_char_dict_path /path/to/hf_repo/dicts/ppocrv5_korean_dict.txt \
+  --use_gpu False
+```
+> PaddleOCR2Pytorch 的 `base_ocr_v20.py` 已原生支持 `.safetensors`（按后缀自动识别，向后兼容 `.pth`）。
+### 自定义 Python 推理代码
+如果你不想依赖 PaddleOCR2Pytorch 完整推理栈，下面是**一个最小 rec 推理代码片段**的骨架。它展示了如何加载权重并做前向推理——但你仍然需要 PaddleOCR2Pytorch 项目中的网络定义代码（`pytorchocr/modeling/`）。
+```python
+import sys, numpy as np, cv2, torch, yaml
+from safetensors.torch import load_file
+# 以下 import 需要你先 clone https://github.com/frotms/PaddleOCR2Pytorch
+# 并把其根目录加入 PYTHONPATH
+sys.path.insert(0, "/path/to/PaddleOCR2Pytorch")
+from pytorchocr.modeling.architectures.base_model import BaseModel
+from pytorchocr.postprocess import build_post_process
+HF_REPO = "/path/to/hf_repo"   # snapshot_download 得到的路径
+yml_path    = f"{HF_REPO}/configs/rec/PP-OCRv5/multi_language/korean_PP-OCRv5_mobile_rec.yml"
+weight_path = f"{HF_REPO}/ptocr_v5_korean_mobile_rec.safetensors"
+# 1. 读配置 + 字符集
+with open(yml_path, encoding="utf-8") as f:
+    cfg = yaml.safe_load(f)
+dict_path = cfg["Global"]["character_dict_path"]      # './dicts/ppocrv5_korean_dict.txt'
+dict_abs  = f"{HF_REPO}/{dict_path.lstrip('./')}"
+with open(dict_abs, encoding="utf-8") as f:
+    chars = [l.strip("\n\r") for l in f]
+n_char = len(chars) + 2                               # +1 blank, +1 space（依 use_space_char 而定）
+# 2. 构建网络 + 加载权重（safetensors 零代码执行、mmap 快速加载）
+cfg["Architecture"]["Head"]["out_channels_list"] = {
+    "CTCLabelDecode": n_char,
+    "SARLabelDecode": n_char + 2,
+    "NRTRLabelDecode": n_char + 3,
+}
+net = BaseModel(cfg["Architecture"], out_channels=n_char)
+net.load_state_dict(load_file(weight_path, device="cpu"))
+net.eval()
+# 3. 读图 + 预处理（resize 到 [3, 48, 320]，归一化到 [-1, 1]）
+img = cv2.imread("input_word.jpg")
+h, w = img.shape[:2]
+ratio = w / h
+tw = min(int(48 * ratio), 320)
+img = cv2.resize(img, (tw, 48))
+canvas = np.zeros((48, 320, 3), dtype=np.uint8)
+canvas[:, :tw] = img
+x = canvas.astype(np.float32).transpose(2, 0, 1) / 255.0
+x = (x - 0.5) / 0.5
+x = torch.from_numpy(x).unsqueeze(0)
+# 4. 前向 + CTC 解码
+with torch.no_grad():
+    logits = net(x)
+post_op = build_post_process({"name": "CTCLabelDecode",
+                              "character_dict_path": dict_abs,
+                              "use_space_char": True})
+result = post_op(logits)
+print("识别结果:", result)     # e.g. [('바탕으로', 0.9998)]
+```
+### 推理所需依赖
+```
+torch >= 1.13
+safetensors >= 0.4
+numpy, pillow, opencv-python
+pyyaml, shapely, pyclipper
+scikit-image      # det 后处理需要
+```
+---
+## 转换 & 验证来源
+- 源权重：PaddlePaddle 官方 `.pdparams`，来自 [paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/](https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/)
+- 转换工具：[PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch) 中的 `converter/ppocr_v5_det_converter.py` / `ppocr_v5_rec_converter.py`
+- 验证：在 macOS Apple Silicon (M 系列) CPU 环境下做过端到端推理，**多语言识别结果与 PaddleOCR 官方 `.pdparams` 位精确一致**（float32 小数点后 8 位完全相同）
+样例推理输出（CPU，<0.7 s / 张）：
+| 样例 | 识别结果 | 置信度 |
+|---|---|---|
+| 中文 `word_1.jpg` | 韩国小馆 | 0.99797755 |
+| 韩文 `korean/1.jpg` | 바탕으로 | 0.99977183 |
+| 法文 `french/1.jpg` | de l'amendement, | 0.99656343 |
+| 阿拉伯 `arabic/ar_1.jpg` | الكيصياوي | 0.68281130 |
+---
+## Legacy 文件说明（`legacy/`）
+原本放在仓库根目录的 PP-OCR v2 / v3 / v4 老版本权重，现已**统一迁移到 `legacy/` 目录**以便整理。这些文件仍然存在且可正常使用，只需在 URL 路径前面加上 `legacy/` 前缀即可：
+```
+legacy/ch_ptocr_mobile_v2.0_cls_infer.pth
+legacy/ch_ptocr_v4_det_infer.pth
+legacy/ch_ptocr_v4_rec_infer.pth
+legacy/en_ptocr_v3_det_infer.pth
+legacy/en_ptocr_v4_rec_infer.pth
+```
+**15 个 PP-OCRv5 safetensors 权重依然位于仓库根目录，URL 未变**。
+---
+## 许可证 & 致谢
+- **License**: Apache License 2.0
+- 权重来源：[PaddleOCR](https://github.com/PaddlePaddle/PaddleOCR) by PaddlePaddle 团队，Apache 2.0
+- 转换工具：[PaddleOCR2Pytorch](https://github.com/frotms/PaddleOCR2Pytorch)，Apache 2.0
+如果本仓库对你有帮助，请同时给上述两个原始项目 star 致谢。
+---
+## 引用
+```bibtex
+@misc{pp_ocrv5_pytorch_joycn_2025,
+  title        = {PP-OCRv5 PyTorch Model Zoo},
+  author       = {JoyCN},
+  howpublished = {\url{https://huggingface.co/JoyCN/PaddleOCR-Pytorch}},
+  year         = {2025}
+}
+```

config.json CHANGED Viewed

@@ -1,27 +1,122 @@
 {
   "library_name": "pytorch",
-  "format": "pth",
-  "weights": {
-    "det": {
-      "safetensors": "ptocr_v5_server_det.safetensors",
-      "pth": "ptocr_v5_server_det.pth"
-    },
-    "rec": {
-      "safetensors": "ptocr_v5_server_rec.safetensors",
-      "pth": "ptocr_v5_server_rec.pth"
-    }
-  },
-  "homepage": "https://github.com/frotms/PaddleOCR2Pytorch",
   "created": "2025-09-16",
-  "notes": "Presence of this file helps Hub track downloads (query file).",
-  "formats": [
-    "safetensors",
-    "pth"
-  ],
   "compat": {
     "project": "PaddleOCR2Pytorch",
     "repo": "https://github.com/frotms/PaddleOCR2Pytorch",
     "license": "Apache-2.0"
   },
-  "updated": "2025-09-16"
 }

 {
   "library_name": "pytorch",
+  "format": "safetensors",
+  "formats": ["safetensors", "pth"],
+  "homepage": "https://huggingface.co/JoyCN/PaddleOCR-Pytorch",
+  "source_project": "https://github.com/frotms/PaddleOCR2Pytorch",
+  "upstream_project": "https://github.com/PaddlePaddle/PaddleOCR",
+  "license": "Apache-2.0",
   "created": "2025-09-16",
+  "updated": "2026-04-15",
+  "notes": "PP-OCRv5 full model zoo (2 det + 2 base rec + 11 multilingual rec), bit-exact conversion of official PaddlePaddle .pdparams to PyTorch. Older PP-OCR v2/v3/v4 checkpoints kept under legacy/.",
   "compat": {
     "project": "PaddleOCR2Pytorch",
     "repo": "https://github.com/frotms/PaddleOCR2Pytorch",
     "license": "Apache-2.0"
   },
+  "models": {
+    "ppocrv5": {
+      "det": {
+        "mobile": {
+          "safetensors": "ptocr_v5_mobile_det.safetensors",
+          "yaml": "configs/det/PP-OCRv5/PP-OCRv5_mobile_det.yml"
+        },
+        "server": {
+          "safetensors": "ptocr_v5_server_det.safetensors",
+          "pth": "ptocr_v5_server_det.pth",
+          "yaml": "configs/det/PP-OCRv5/PP-OCRv5_server_det.yml"
+        }
+      },
+      "rec_base": {
+        "mobile": {
+          "safetensors": "ptocr_v5_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/PP-OCRv5_mobile_rec.yml",
+          "dict": "dicts/ppocrv5_dict.txt",
+          "languages": ["zh-Hans", "zh-Hant", "en", "ja"]
+        },
+        "server": {
+          "safetensors": "ptocr_v5_server_rec.safetensors",
+          "pth": "ptocr_v5_server_rec.pth",
+          "yaml": "configs/rec/PP-OCRv5/PP-OCRv5_server_rec.yml",
+          "dict": "dicts/ppocrv5_dict.txt",
+          "languages": ["zh-Hans", "zh-Hant", "en", "ja"]
+        }
+      },
+      "rec_multilingual": {
+        "en": {
+          "safetensors": "ptocr_v5_en_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/en_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_en_dict.txt",
+          "languages": ["en"]
+        },
+        "korean": {
+          "safetensors": "ptocr_v5_korean_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/korean_PP-OCRv5_mobile_rec.yml",
+          "dict": "dicts/ppocrv5_korean_dict.txt",
+          "languages": ["ko", "en"]
+        },
+        "latin": {
+          "safetensors": "ptocr_v5_latin_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/latin_PP-OCRv5_mobile_rec.yml",
+          "dict": "dicts/ppocrv5_latin_dict.txt",
+          "languages": ["fr", "de", "es", "it", "pt", "nl", "sv", "da", "no", "fi", "pl", "cs", "tr", "vi", "af", "bs", "cy", "et", "ga", "hr", "uz", "hu", "id", "is", "lt", "mi", "ms", "sk", "sl", "sq", "sw", "tl", "la", "az", "ku", "lv", "mt", "pi", "ro", "eu", "gl", "lb", "rm", "ca", "qu", "rs_latin", "oc"]
+        },
+        "eslav": {
+          "safetensors": "ptocr_v5_eslav_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/eslav_PP-OCRv5_mobile_rec.yml",
+          "dict": "dicts/ppocrv5_eslav_dict.txt",
+          "languages": ["ru", "be", "uk", "en"]
+        },
+        "cyrillic": {
+          "safetensors": "ptocr_v5_cyrillic_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/cyrillic_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_cyrillic_dict.txt",
+          "languages": ["ru", "be", "uk", "rs_cyrillic", "bg", "mn", "kk", "ky", "tg", "mk", "tt", "cv", "ba", "mhr", "mo", "udm", "kv", "os", "bua", "xal", "tyv", "sah", "kaa", "ab", "ady", "kbd", "av", "dar", "inh", "ce", "lki", "lez", "tab", "en"]
+        },
+        "arabic": {
+          "safetensors": "ptocr_v5_arabic_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/arabic_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_arabic_dict.txt",
+          "languages": ["ar", "fa", "ug", "ur", "ps", "ku", "sd", "bal", "en"]
+        },
+        "devanagari": {
+          "safetensors": "ptocr_v5_devanagari_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/devanagari_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_devanagari_dict.txt",
+          "languages": ["hi", "mr", "ne", "bh", "mai", "ang", "bho", "mah", "sck", "new", "gom", "sa", "bgc", "en"]
+        },
+        "th": {
+          "safetensors": "ptocr_v5_th_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/th_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_th_dict.txt",
+          "languages": ["th", "en"]
+        },
+        "el": {
+          "safetensors": "ptocr_v5_el_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/el_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_el_dict.txt",
+          "languages": ["el", "en"]
+        },
+        "ta": {
+          "safetensors": "ptocr_v5_ta_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/ta_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_ta_dict.txt",
+          "languages": ["ta", "en"]
+        },
+        "te": {
+          "safetensors": "ptocr_v5_te_mobile_rec.safetensors",
+          "yaml": "configs/rec/PP-OCRv5/multi_language/te_PP-OCRv5_mobile_rec.yaml",
+          "dict": "dicts/ppocrv5_te_dict.txt",
+          "languages": ["te", "en"]
+        }
+      }
+    }
+  },
+  "legacy": {
+    "ppocrv2_cls_ch": "legacy/ch_ptocr_mobile_v2.0_cls_infer.pth",
+    "ppocrv3_det_en": "legacy/en_ptocr_v3_det_infer.pth",
+    "ppocrv4_det_ch": "legacy/ch_ptocr_v4_det_infer.pth",
+    "ppocrv4_rec_ch": "legacy/ch_ptocr_v4_rec_infer.pth",
+    "ppocrv4_rec_en": "legacy/en_ptocr_v4_rec_infer.pth"
+  }
 }

ch_ptocr_mobile_v2.0_cls_infer.pth → legacy/ch_ptocr_mobile_v2.0_cls_infer.pth RENAMED Viewed

File without changes

ch_ptocr_v4_det_infer.pth → legacy/ch_ptocr_v4_det_infer.pth RENAMED Viewed

File without changes

ch_ptocr_v4_rec_infer.pth → legacy/ch_ptocr_v4_rec_infer.pth RENAMED Viewed

File without changes

en_ptocr_v3_det_infer.pth → legacy/en_ptocr_v3_det_infer.pth RENAMED Viewed

File without changes

en_ptocr_v4_rec_infer.pth → legacy/en_ptocr_v4_rec_infer.pth RENAMED Viewed

File without changes