Spaces:

LinhKL2002
/

App

Build error

App Files Files Community

LinhKL2002 committed on Apr 29, 2025

Commit

4dbe5d1

verified ·

1 Parent(s): 35b4c2a

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.dockerignore +73 -0
.dockerignore.bak +68 -0
.gitattributes +1 -0
.gradio/certificate.pem +31 -0
Dockerfile +27 -0
README.md +3 -9
__init__.py +5 -0
__pycache__/__init__.cpython-310.pyc +0 -0
__pycache__/image_enhancement.cpython-310.pyc +0 -0
__pycache__/image_enhancement.cpython-311.pyc +0 -0
__pycache__/image_enhancement.cpython-313.pyc +0 -0
__pycache__/main.cpython-310.pyc +0 -0
__pycache__/main.cpython-311.pyc +0 -0
__pycache__/main.cpython-313.pyc +0 -0
app.py +29 -0
cal_rec_boxes/__init__.py +4 -0
cal_rec_boxes/__pycache__/__init__.cpython-310.pyc +0 -0
cal_rec_boxes/__pycache__/__init__.cpython-311.pyc +0 -0
cal_rec_boxes/__pycache__/__init__.cpython-312.pyc +0 -0
cal_rec_boxes/__pycache__/__init__.cpython-313.pyc +0 -0
cal_rec_boxes/__pycache__/main.cpython-310.pyc +0 -0
cal_rec_boxes/__pycache__/main.cpython-311.pyc +0 -0
cal_rec_boxes/__pycache__/main.cpython-312.pyc +0 -0
cal_rec_boxes/__pycache__/main.cpython-313.pyc +0 -0
cal_rec_boxes/main.py +281 -0
ch_ppocr_cls/__init__.py +4 -0
ch_ppocr_cls/__pycache__/__init__.cpython-310.pyc +0 -0
ch_ppocr_cls/__pycache__/__init__.cpython-311.pyc +0 -0
ch_ppocr_cls/__pycache__/__init__.cpython-312.pyc +0 -0
ch_ppocr_cls/__pycache__/__init__.cpython-313.pyc +0 -0
ch_ppocr_cls/__pycache__/text_cls.cpython-310.pyc +0 -0
ch_ppocr_cls/__pycache__/text_cls.cpython-311.pyc +0 -0
ch_ppocr_cls/__pycache__/text_cls.cpython-312.pyc +0 -0
ch_ppocr_cls/__pycache__/text_cls.cpython-313.pyc +0 -0
ch_ppocr_cls/__pycache__/utils.cpython-310.pyc +0 -0
ch_ppocr_cls/__pycache__/utils.cpython-311.pyc +0 -0
ch_ppocr_cls/__pycache__/utils.cpython-312.pyc +0 -0
ch_ppocr_cls/__pycache__/utils.cpython-313.pyc +0 -0
ch_ppocr_cls/text_cls.py +114 -0
ch_ppocr_cls/utils.py +28 -0
ch_ppocr_det/__init__.py +4 -0
ch_ppocr_det/__pycache__/__init__.cpython-310.pyc +0 -0
ch_ppocr_det/__pycache__/__init__.cpython-311.pyc +0 -0
ch_ppocr_det/__pycache__/__init__.cpython-312.pyc +0 -0
ch_ppocr_det/__pycache__/__init__.cpython-313.pyc +0 -0
ch_ppocr_det/__pycache__/text_detect.cpython-310.pyc +0 -0
ch_ppocr_det/__pycache__/text_detect.cpython-311.pyc +0 -0
ch_ppocr_det/__pycache__/text_detect.cpython-312.pyc +0 -0
ch_ppocr_det/__pycache__/text_detect.cpython-313.pyc +0 -0
ch_ppocr_det/__pycache__/utils.cpython-310.pyc +0 -0

.dockerignore ADDED Viewed

	@@ -0,0 +1,73 @@

+# Python bytecode and cache
+__pycache__/
+*.pyc
+*.pyo
+*.pyd
+.pytest_cache/
+.coverage
+# IDE/editor files
+.idea/
+.vscode/
+*.swp
+*.swo
+# Build and distribution outputs
+dist/
+build/
+out/
+# Test and debug artifacts
+test/
+tests/
+debug/
+*.log
+# Version control
+.git/
+.gitignore
+.svn/
+.hg/
+# Environment and secrets
+.env*
+*.env
+*.pem
+*.key
+*.crt
+config.local.*
+*.local.yml
+# Documentation and markdown
+README*
+*.md
+docs/
+# Docker and compose files
+Dockerfile*
+docker-compose*
+# Temporary and local files
+tmp/
+temp/
+*.tmp
+.local/
+local/
+# Backup files
+*.bak
+# Project-specific: results and models (if not needed in build)
+results/
+# Exclude empty model placeholder, but keep actual models
+models/.gitkeep
+# Allow ONNX models to be included (remove models/ if you want to exclude all models)
+# models/
+# Miscellaneous
+*.DS_Store
+# Exclude self
+.dockerignore

.dockerignore.bak ADDED Viewed

	@@ -0,0 +1,68 @@

+# Python bytecode and cache
+__pycache__/
+*.pyc
+*.pyo
+*.pyd
+.pytest_cache/
+.coverage
+# Development and IDE artifacts
+.idea/
+.vscode/
+*.swp
+*.swo
+# Build outputs
+build/
+dist/
+out/
+# Test and debug files
+test/
+tests/
+debug/
+*.log
+# Version control
+.git/
+.gitignore
+.svn/
+.hg/
+# Environment and secrets
+.env*
+*.env
+*.pem
+*.key
+*.crt
+config.local.*
+*.local.yml
+# Documentation
+README*
+*.md
+docs/
+# Docker files (do not ignore Dockerfile and docker-compose.yml in root)
+Dockerfile*
+docker-compose*
+!Dockerfile
+!docker-compose.yml
+# Temporary and local files
+tmp/
+temp/
+*.tmp
+.local/
+local/
+# Project-specific: results and model artifacts (keep models/ for .onnx, ignore results/)
+results/
+# Miscellaneous
+*.bak
+*.orig
+*.old
+# Exclude .gitkeep from ignore (if needed for empty dirs)
+!models/.gitkeep

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tmp/uploaded_1745856378.pdf filter=lfs diff=lfs merge=lfs -text

.gradio/certificate.pem ADDED Viewed

	@@ -0,0 +1,31 @@

+-----BEGIN CERTIFICATE-----
+MIIFazCCA1OgAwIBAgIRAIIQz7DSQONZRGPgu2OCiwAwDQYJKoZIhvcNAQELBQAw
+TzELMAkGA1UEBhMCVVMxKTAnBgNVBAoTIEludGVybmV0IFNlY3VyaXR5IFJlc2Vh
+cmNoIEdyb3VwMRUwEwYDVQQDEwxJU1JHIFJvb3QgWDEwHhcNMTUwNjA0MTEwNDM4
+WhcNMzUwNjA0MTEwNDM4WjBPMQswCQYDVQQGEwJVUzEpMCcGA1UEChMgSW50ZXJu
+ZXQgU2VjdXJpdHkgUmVzZWFyY2ggR3JvdXAxFTATBgNVBAMTDElTUkcgUm9vdCBY
+MTCCAiIwDQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAK3oJHP0FDfzm54rVygc
+h77ct984kIxuPOZXoHj3dcKi/vVqbvYATyjb3miGbESTtrFj/RQSa78f0uoxmyF+
+0TM8ukj13Xnfs7j/EvEhmkvBioZxaUpmZmyPfjxwv60pIgbz5MDmgK7iS4+3mX6U
+A5/TR5d8mUgjU+g4rk8Kb4Mu0UlXjIB0ttov0DiNewNwIRt18jA8+o+u3dpjq+sW
+T8KOEUt+zwvo/7V3LvSye0rgTBIlDHCNAymg4VMk7BPZ7hm/ELNKjD+Jo2FR3qyH
+B5T0Y3HsLuJvW5iB4YlcNHlsdu87kGJ55tukmi8mxdAQ4Q7e2RCOFvu396j3x+UC
+B5iPNgiV5+I3lg02dZ77DnKxHZu8A/lJBdiB3QW0KtZB6awBdpUKD9jf1b0SHzUv
+KBds0pjBqAlkd25HN7rOrFleaJ1/ctaJxQZBKT5ZPt0m9STJEadao0xAH0ahmbWn
+OlFuhjuefXKnEgV4We0+UXgVCwOPjdAvBbI+e0ocS3MFEvzG6uBQE3xDk3SzynTn
+jh8BCNAw1FtxNrQHusEwMFxIt4I7mKZ9YIqioymCzLq9gwQbooMDQaHWBfEbwrbw
+qHyGO0aoSCqI3Haadr8faqU9GY/rOPNk3sgrDQoo//fb4hVC1CLQJ13hef4Y53CI
+rU7m2Ys6xt0nUW7/vGT1M0NPAgMBAAGjQjBAMA4GA1UdDwEB/wQEAwIBBjAPBgNV
+HRMBAf8EBTADAQH/MB0GA1UdDgQWBBR5tFnme7bl5AFzgAiIyBpY9umbbjANBgkq
+hkiG9w0BAQsFAAOCAgEAVR9YqbyyqFDQDLHYGmkgJykIrGF1XIpu+ILlaS/V9lZL
+ubhzEFnTIZd+50xx+7LSYK05qAvqFyFWhfFQDlnrzuBZ6brJFe+GnY+EgPbk6ZGQ
+3BebYhtF8GaV0nxvwuo77x/Py9auJ/GpsMiu/X1+mvoiBOv/2X/qkSsisRcOj/KK
+NFtY2PwByVS5uCbMiogziUwthDyC3+6WVwW6LLv3xLfHTjuCvjHIInNzktHCgKQ5
+ORAzI4JMPJ+GslWYHb4phowim57iaztXOoJwTdwJx4nLCgdNbOhdjsnvzqvHu7Ur
+TkXWStAmzOVyyghqpZXjFaH3pO3JLF+l+/+sKAIuvtd7u+Nxe5AW0wdeRlN8NwdC
+jNPElpzVmbUq4JUagEiuTDkHzsxHpFKVK7q4+63SM1N95R1NbdWhscdCb+ZAJzVc
+oyi3B43njTOQ5yOf+1CceWxG1bQVs5ZufpsMljq4Ui0/1lvh+wjChP4kqKOJ2qxq
+4RgqsahDYVvTH9w7jXbyLeiNdd8XM2w9U/t7y0Ff/9yi0GE44Za4rF2LN9d11TPA
+mRGunUHBcnWEvgJBQl9nJEiU0Zsnvgc/ubhPgXRR4Xq37Z0j4r7g1SgEEzwxA57d
+emyPxgcYxn/eR44/KJ4EBs+lVDR3veyJm+kXQ99b21/+jh5Xos1AnX5iItreGCc=
+-----END CERTIFICATE-----

Dockerfile ADDED Viewed

	@@ -0,0 +1,27 @@

+# syntax=docker/dockerfile:1.4
+# Base image (single-stage build)
+FROM python:3.12-slim AS base
+# Install system dependencies for OpenCV and ffmpeg at runtime.
+# libgl1 is used instead of libgl1-mesa-glx: the latter was a transitional
+# package and is not available in the Debian releases that current
+# python:3.12-slim images are based on, which makes apt-get fail.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    libgl1 \
+    libglib2.0-0 \
+    libsm6 \
+    libxext6 \
+    libx11-dev \
+    ffmpeg \
+    && rm -rf /var/lib/apt/lists/*
+# All application files live under /app
+WORKDIR /app
+# Copy requirements first so the dependency layer is cached independently
+# of application source changes
+COPY requirements.txt .
+RUN pip install --no-cache-dir --upgrade pip && \
+    pip install --default-timeout=100 --no-cache-dir -r requirements.txt
+# Copy app source
+COPY . .
+# Port the app is expected to listen on
+EXPOSE 7860
+CMD ["python", "demo_v5.py"]

README.md CHANGED Viewed

@@ -1,12 +1,6 @@
 ---
-title: Rapidocr Ort
-emoji: 🏆
-colorFrom: green
-colorTo: blue
 sdk: gradio
-sdk_version: 5.27.1
-app_file: app.py
-pinned: false
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: rapidocr_ort
+app_file: demo_v5.py
 sdk: gradio
+sdk_version: 5.27.0
 ---

__init__.py ADDED Viewed

	@@ -0,0 +1,5 @@

+# -*- encoding: utf-8 -*-
+# @Author: SWHL
+# @Contact: liekkaskono@163.com
+from .main import RapidOCR
+from .utils import LoadImageError, VisRes

__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (246 Bytes). View file

__pycache__/image_enhancement.cpython-310.pyc ADDED Viewed

Binary file (41.3 kB). View file

__pycache__/image_enhancement.cpython-311.pyc ADDED Viewed

Binary file (68.9 kB). View file

__pycache__/image_enhancement.cpython-313.pyc ADDED Viewed

Binary file (62.3 kB). View file

__pycache__/main.cpython-310.pyc ADDED Viewed

Binary file (9.89 kB). View file

__pycache__/main.cpython-311.pyc ADDED Viewed

Binary file (20 kB). View file

__pycache__/main.cpython-313.pyc ADDED Viewed

Binary file (17.7 kB). View file

app.py ADDED Viewed

	@@ -0,0 +1,29 @@

+import gradio as gr
+import numpy as np
+import cv2
+from pathlib import Path
+from main import RapidOCR
+# Single module-level OCR engine, built once at import time and reused by every request.
+ocr_engine = RapidOCR()
+def extract_text_from_bottom(image: np.ndarray):
+    """Run OCR on the input image and return the recognized text, one entry per line.
+
+    Despite the function name, the whole image is processed; no bottom crop is applied.
+
+    Args:
+        image: Image array supplied by the Gradio ``Image`` input, or ``None``
+            when nothing was provided.
+
+    Returns:
+        The recognized strings joined by newlines, ``"No text found."`` when the
+        engine returns an empty result, or ``"No image provided."`` when
+        ``image`` is ``None``.
+    """
+    # Guard against a submit without an image; the OCR engine needs a real array.
+    if image is None:
+        return "No image provided."
+    result, _ = ocr_engine(image, use_det=True, use_cls=False, use_rec=True)
+    if not result:
+        return "No text found."
+    # Index 1 of each result entry is used as the text
+    # (presumably entries are [box, text, score]; verify against RapidOCR).
+    return "\n".join(r[1] for r in result)
+# Gradio UI: one image input (delivered to the callback as a numpy array)
+# and one plain-text output. Title and description are intentionally left empty.
+demo = gr.Interface(
+    fn=extract_text_from_bottom,
+    inputs=gr.Image(type="numpy"),
+    outputs="text",
+    title="",
+    description="",
+)
+# Starts the web server at import time; this module is meant to be run as a script.
+demo.launch()

cal_rec_boxes/__init__.py ADDED Viewed

	@@ -0,0 +1,4 @@

+# -*- encoding: utf-8 -*-
+# @Author: SWHL
+# @Contact: liekkaskono@163.com
+from .main import CalRecBoxes

cal_rec_boxes/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (174 Bytes). View file

cal_rec_boxes/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (222 Bytes). View file

cal_rec_boxes/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (226 Bytes). View file

cal_rec_boxes/__pycache__/__init__.cpython-313.pyc ADDED Viewed

Binary file (215 Bytes). View file

cal_rec_boxes/__pycache__/main.cpython-310.pyc ADDED Viewed

Binary file (7.78 kB). View file

cal_rec_boxes/__pycache__/main.cpython-311.pyc ADDED Viewed

Binary file (16.8 kB). View file

cal_rec_boxes/__pycache__/main.cpython-312.pyc ADDED Viewed

Binary file (14.8 kB). View file

cal_rec_boxes/__pycache__/main.cpython-313.pyc ADDED Viewed

Binary file (14.8 kB). View file

cal_rec_boxes/main.py ADDED Viewed

	@@ -0,0 +1,281 @@

+# -*- encoding: utf-8 -*-
+# @Author: SWHL / Joker1212
+# @Contact: liekkaskono@163.com
+import copy
+import math
+from typing import Any, List, Optional, Tuple
+import cv2
+import numpy as np
+class CalRecBoxes:
+    """Compute coordinate boxes for single Chinese characters and English words in recognized text.
+
+    Code adapted from PaddlePaddle/PaddleOCR and fanqie03/char-detection.
+    """
+    def __init__(self):
+        pass
+    def __call__(
+        self,
+        imgs: Optional[List[np.ndarray]],
+        dt_boxes: Optional[List[np.ndarray]],
+        rec_res: Optional[List[Any]],
+    ):
+        """Compute per-word boxes for every (crop, detection box, recognition result) triple.
+
+        Returns a list with one entry per input triple:
+        ``[rec_txt, rec_conf, word_box_list, word_box_content_list, conf_list]``.
+        """
+        res = []
+        # NOTE(review): the loop variable rebinds the ``rec_res`` parameter name.
+        # zip() has already captured the original list, so iteration is unaffected,
+        # but the parameter is no longer reachable after the first iteration.
+        # NOTE(review): the arguments are annotated Optional, yet None would fail in zip().
+        for img, box, rec_res in zip(imgs, dt_boxes, rec_res):
+            direction = self.get_box_direction(box)
+            rec_txt, rec_conf, rec_word_info = rec_res[0], rec_res[1], rec_res[2]
+            h, w = img.shape[:2]
+            # Axis-aligned rectangle spanning the whole crop: TL, TR, BR, BL.
+            img_box = np.array([[0, 0], [w, 0], [w, h], [0, h]])
+            word_box_content_list, word_box_list, conf_list = self.cal_ocr_word_box(
+                rec_txt, img_box, rec_word_info
+            )
+            word_box_list = self.adjust_box_overlap(copy.deepcopy(word_box_list))
+            # Map the boxes from crop coordinates back through the detection box.
+            word_box_list = self.reverse_rotate_crop_image(
+                copy.deepcopy(box), word_box_list, direction
+            )
+            res.append(
+                [rec_txt, rec_conf, word_box_list, word_box_content_list, conf_list]
+            )
+        return res
+    @staticmethod
+    def get_box_direction(box: np.ndarray) -> str:
+        """Return ``"h"`` when the box's height/width ratio is at least 1.5, otherwise ``"w"``.
+
+        Width and height are the longer of the two opposite edge lengths, truncated to int.
+        """
+        direction = "w"
+        img_crop_width = int(
+            max(
+                np.linalg.norm(box[0] - box[1]),
+                np.linalg.norm(box[2] - box[3]),
+            )
+        )
+        img_crop_height = int(
+            max(
+                np.linalg.norm(box[0] - box[3]),
+                np.linalg.norm(box[1] - box[2]),
+            )
+        )
+        # NOTE(review): a width that truncates to 0 raises ZeroDivisionError here.
+        if img_crop_height * 1.0 / img_crop_width >= 1.5:
+            direction = "h"
+        return direction
+    @staticmethod
+    def cal_ocr_word_box(
+        rec_txt: str, box: np.ndarray, rec_word_info: List[Tuple[str, List[int]]]
+    ) -> Tuple[List[str], List[List[int]], List[float]]:
+        """Calculate the detection frame for each word based on the results of recognition and detection of ocr
+        Chinese coordinates are per single character.
+        English coordinates are at word level.
+        """
+        # NOTE(review): rec_word_info is unpacked into five fields, which does not
+        # match its type annotation.
+        col_num, word_list, word_col_list, state_list, conf_list = rec_word_info
+        box = box.tolist()
+        bbox_x_start = box[0][0]
+        bbox_x_end = box[1][0]
+        bbox_y_start = box[0][1]
+        bbox_y_end = box[2][1]
+        # Width of one column; raises ZeroDivisionError if col_num is 0.
+        cell_width = (bbox_x_end - bbox_x_start) / col_num
+        word_box_list = []
+        word_box_content_list = []
+        cn_width_list = []
+        en_width_list = []
+        cn_col_list = []
+        en_col_list = []
+        def cal_char_width(width_list, word_col_):
+            # Append the mean column spacing of one word; words with a single
+            # column carry no spacing information and are skipped.
+            if len(word_col_) == 1:
+                return
+            char_total_length = (word_col_[-1] - word_col_[0]) * cell_width
+            char_width = char_total_length / (len(word_col_) - 1)
+            width_list.append(char_width)
+        def cal_box(col_list, width_list, word_box_list_):
+            # Append one full-height box per column index, centred on that column.
+            if len(col_list) == 0:
+                return
+            if len(width_list) != 0:
+                avg_char_width = np.mean(width_list)
+            else:
+                # No spacing samples: fall back to an even split over the text length.
+                avg_char_width = (bbox_x_end - bbox_x_start) / len(rec_txt)
+            for center_idx in col_list:
+                center_x = (center_idx + 0.5) * cell_width
+                # Clamp both edges to the extent of the box.
+                cell_x_start = max(int(center_x - avg_char_width / 2), 0) + bbox_x_start
+                cell_x_end = (
+                    min(int(center_x + avg_char_width / 2), bbox_x_end - bbox_x_start)
+                    + bbox_x_start
+                )
+                cell = [
+                    [cell_x_start, bbox_y_start],
+                    [cell_x_end, bbox_y_start],
+                    [cell_x_end, bbox_y_end],
+                    [cell_x_start, bbox_y_end],
+                ]
+                word_box_list_.append(cell)
+        # Words with state "cn" and all other words are accumulated separately so
+        # each group gets its own average character width.
+        for word, word_col, state in zip(word_list, word_col_list, state_list):
+            if state == "cn":
+                cal_char_width(cn_width_list, word_col)
+                cn_col_list += word_col
+                word_box_content_list += word
+            else:
+                cal_char_width(en_width_list, word_col)
+                en_col_list += word_col
+                word_box_content_list += word
+        cal_box(cn_col_list, cn_width_list, word_box_list)
+        cal_box(en_col_list, en_width_list, word_box_list)
+        # Order the boxes left to right by their top-left x coordinate.
+        sorted_word_box_list = sorted(word_box_list, key=lambda box: box[0][0])
+        return word_box_content_list, sorted_word_box_list, conf_list
+    @staticmethod
+    def adjust_box_overlap(
+        word_box_list: List[List[List[int]]],
+    ) -> List[List[List[int]]]:
+        """Shrink horizontally overlapping neighbours so they meet in the middle of the overlap.
+
+        The input list is modified in place and also returned. Adjusted
+        coordinates become floats because of the true division by 2.
+        """
+        # Adjust the places where bboxes overlap
+        for i in range(len(word_box_list) - 1):
+            cur, nxt = word_box_list[i], word_box_list[i + 1]
+            if cur[1][0] > nxt[0][0]:  # the boxes intersect
+                distance = abs(cur[1][0] - nxt[0][0])
+                cur[1][0] -= distance / 2
+                cur[2][0] -= distance / 2
+                nxt[0][0] += distance - distance / 2
+                nxt[3][0] += distance - distance / 2
+        return word_box_list
+    def reverse_rotate_crop_image(
+        self,
+        bbox_points: np.ndarray,
+        word_points_list: List[List[List[int]]],
+        direction: str = "w",
+    ) -> List[List[List[int]]]:
+        """
+        Inverse operation of get_rotate_crop_image.
+        img is the original image.
+        part_img is the cropped image.
+        bbox_points is the bbox in the original image corresponding to part_img;
+        four points: top-left, top-right, bottom-right, bottom-left.
+        part_points are the points inside part_img, [(x, y), (x, y)].
+        """
+        bbox_points = np.float32(bbox_points)
+        # Shift the box so its bounding rectangle starts at the origin.
+        left = int(np.min(bbox_points[:, 0]))
+        top = int(np.min(bbox_points[:, 1]))
+        bbox_points[:, 0] = bbox_points[:, 0] - left
+        bbox_points[:, 1] = bbox_points[:, 1] - top
+        img_crop_width = int(np.linalg.norm(bbox_points[0] - bbox_points[1]))
+        img_crop_height = int(np.linalg.norm(bbox_points[0] - bbox_points[3]))
+        pts_std = np.array(
+            [
+                [0, 0],
+                [img_crop_width, 0],
+                [img_crop_width, img_crop_height],
+                [0, img_crop_height],
+            ]
+        ).astype(np.float32)
+        # M maps the shifted box onto the upright crop rectangle; IM is its inverse.
+        M = cv2.getPerspectiveTransform(bbox_points, pts_std)
+        _, IM = cv2.invert(M)
+        new_word_points_list = []
+        for word_points in word_points_list:
+            new_word_points = []
+            for point in word_points:
+                new_point = point
+                if direction == "h":
+                    # For "h" boxes, rotate the point by -90 degrees about the
+                    # origin and shift x by the crop width before un-warping.
+                    new_point = self.s_rotate(
+                        math.radians(-90), new_point[0], new_point[1], 0, 0
+                    )
+                    new_point[0] = new_point[0] + img_crop_width
+                # Homogeneous coordinate [x, y, 1] for the inverse transform.
+                p = np.float32(new_point + [1])
+                x, y, z = np.dot(IM, p)
+                new_point = [x / z, y / z]
+                # Undo the earlier shift and truncate to integer pixels.
+                new_point = [int(new_point[0] + left), int(new_point[1] + top)]
+                new_word_points.append(new_point)
+            new_word_points = self.order_points(new_word_points)
+            new_word_points_list.append(new_word_points)
+        return new_word_points_list
+    @staticmethod
+    def s_rotate(angle, valuex, valuey, pointx, pointy):
+        """Rotate clockwise around (pointx, pointy).
+        https://blog.csdn.net/qq_38826019/article/details/84233397
+
+        ``angle`` is in radians (it is passed to math.cos / math.sin).
+        Returns ``[x, y]`` as numpy values.
+        """
+        valuex = np.array(valuex)
+        valuey = np.array(valuey)
+        sRotatex = (
+            (valuex - pointx) * math.cos(angle)
+            + (valuey - pointy) * math.sin(angle)
+            + pointx
+        )
+        sRotatey = (
+            (valuey - pointy) * math.cos(angle)
+            - (valuex - pointx) * math.sin(angle)
+            + pointy
+        )
+        return [sRotatex, sRotatey]
+    @staticmethod
+    def order_points(box: List[List[int]]) -> List[List[int]]:
+        """Arrange the points of a rectangular box in a consistent order."""
+        def convert_to_1x2(p):
+            # Normalise a selection to shape (1, 2); when several rows matched,
+            # keep only the first one.
+            if p.shape == (2,):
+                return p.reshape((1, 2))
+            elif p.shape == (1, 2):
+                return p
+            else:
+                return p[:1, :]
+        box = np.array(box).reshape((-1, 2))
+        center_x, center_y = np.mean(box[:, 0]), np.mean(box[:, 1])
+        if np.any(box[:, 0] == center_x) and np.any(
+            box[:, 1] == center_y
+        ):  # two points share an x coordinate and two share a y coordinate: a diamond
+            p1 = box[np.where(box[:, 0] == np.min(box[:, 0]))]
+            p2 = box[np.where(box[:, 1] == np.min(box[:, 1]))]
+            p3 = box[np.where(box[:, 0] == np.max(box[:, 0]))]
+            p4 = box[np.where(box[:, 1] == np.max(box[:, 1]))]
+        elif np.all(box[:, 0] == center_x):  # all four points have the same x coordinate
+            y_sort = np.argsort(box[:, 1])
+            p1 = box[y_sort[0]]
+            p2 = box[y_sort[1]]
+            p3 = box[y_sort[2]]
+            p4 = box[y_sort[3]]
+        elif np.any(box[:, 0] == center_x) and np.all(
+            box[:, 1] != center_y
+        ):  # only two points share an x coordinate: split top/bottom first, then left/right
+            p12, p34 = (
+                box[np.where(box[:, 1] < center_y)],
+                box[np.where(box[:, 1] > center_y)],
+            )
+            p1, p2 = (
+                p12[np.where(p12[:, 0] == np.min(p12[:, 0]))],
+                p12[np.where(p12[:, 0] == np.max(p12[:, 0]))],
+            )
+            p3, p4 = (
+                p34[np.where(p34[:, 0] == np.max(p34[:, 0]))],
+                p34[np.where(p34[:, 0] == np.min(p34[:, 0]))],
+            )
+        else:  # only two points share a y coordinate, or none are equal: split left/right first, then top/bottom
+            p14, p23 = (
+                box[np.where(box[:, 0] < center_x)],
+                box[np.where(box[:, 0] > center_x)],
+            )
+            p1, p4 = (
+                p14[np.where(p14[:, 1] == np.min(p14[:, 1]))],
+                p14[np.where(p14[:, 1] == np.max(p14[:, 1]))],
+            )
+            p2, p3 = (
+                p23[np.where(p23[:, 1] == np.min(p23[:, 1]))],
+                p23[np.where(p23[:, 1] == np.max(p23[:, 1]))],
+            )
+        # Works around a shape error when, after single-character splitting,
+        # the x coordinates are exactly identical
+        p1 = convert_to_1x2(p1)
+        p2 = convert_to_1x2(p2)
+        p3 = convert_to_1x2(p3)
+        p4 = convert_to_1x2(p4)
+        return np.array([p1, p2, p3, p4]).reshape((-1, 2)).tolist()

ch_ppocr_cls/__init__.py ADDED Viewed

	@@ -0,0 +1,4 @@

+# -*- encoding: utf-8 -*-
+# @Author: SWHL
+# @Contact: liekkaskono@163.com
+from .text_cls import TextClassifier

ch_ppocr_cls/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (180 Bytes). View file

ch_ppocr_cls/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (228 Bytes). View file

ch_ppocr_cls/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (232 Bytes). View file

ch_ppocr_cls/__pycache__/__init__.cpython-313.pyc ADDED Viewed

Binary file (221 Bytes). View file

ch_ppocr_cls/__pycache__/text_cls.cpython-310.pyc ADDED Viewed

Binary file (3.25 kB). View file

ch_ppocr_cls/__pycache__/text_cls.cpython-311.pyc ADDED Viewed

Binary file (6.27 kB). View file

ch_ppocr_cls/__pycache__/text_cls.cpython-312.pyc ADDED Viewed

Binary file (5.62 kB). View file

ch_ppocr_cls/__pycache__/text_cls.cpython-313.pyc ADDED Viewed

Binary file (5.69 kB). View file

ch_ppocr_cls/__pycache__/utils.cpython-310.pyc ADDED Viewed

Binary file (1.03 kB). View file

ch_ppocr_cls/__pycache__/utils.cpython-311.pyc ADDED Viewed

Binary file (1.51 kB). View file

ch_ppocr_cls/__pycache__/utils.cpython-312.pyc ADDED Viewed

Binary file (1.19 kB). View file

ch_ppocr_cls/__pycache__/utils.cpython-313.pyc ADDED Viewed

Binary file (1.23 kB). View file

ch_ppocr_cls/text_cls.py ADDED Viewed

	@@ -0,0 +1,114 @@

+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import argparse
+import copy
+import math
+import time
+from typing import Any, Dict, List, Tuple, Union
+import cv2
+import numpy as np
+from rapidocr_onnxruntime.utils import OrtInferSession, read_yaml
+from .utils import ClsPostProcess
+class TextClassifier:
+    """Classify image crops in batches and rotate those confidently labelled "180"."""
+    def __init__(self, config: Dict[str, Any]):
+        """Read classifier settings from ``config`` and create the inference session.
+
+        Keys read here: ``cls_image_shape``, ``cls_batch_num``, ``cls_thresh``
+        and ``label_list``. The whole ``config`` is also handed to OrtInferSession.
+        """
+        # Unpacked as (channels, height, width) in resize_norm_img.
+        self.cls_image_shape = config["cls_image_shape"]
+        self.cls_batch_num = config["cls_batch_num"]
+        self.cls_thresh = config["cls_thresh"]
+        self.postprocess_op = ClsPostProcess(config["label_list"])
+        self.infer = OrtInferSession(config)
+    def __call__(
+        self, img_list: Union[np.ndarray, List[np.ndarray]]
+    ) -> Tuple[List[np.ndarray], List[List[Union[str, float]]], float]:
+        """Classify every image and rotate the ones labelled "180" above the threshold.
+
+        Returns:
+            A tuple ``(img_list, cls_res, elapse)``: a deep copy of the inputs
+            with the qualifying images rotated, one ``[label, score]`` per image
+            in the original input order, and the accumulated wall-clock time
+            spent in inference plus post-processing.
+        """
+        # A single array is treated as a one-image list.
+        if isinstance(img_list, np.ndarray):
+            img_list = [img_list]
+        # Work on a copy so the caller's images are never modified.
+        img_list = copy.deepcopy(img_list)
+        # Calculate the aspect ratio of all text bars
+        width_list = [img.shape[1] / float(img.shape[0]) for img in img_list]
+        # Sorting can speed up the cls process
+        indices = np.argsort(np.array(width_list))
+        img_num = len(img_list)
+        # Every slot initially aliases the same placeholder list; each slot is
+        # replaced (not mutated) below, so the aliasing is harmless.
+        cls_res = [["", 0.0]] * img_num
+        batch_num = self.cls_batch_num
+        elapse = 0
+        for beg_img_no in range(0, img_num, batch_num):
+            end_img_no = min(img_num, beg_img_no + batch_num)
+            norm_img_batch = []
+            for ino in range(beg_img_no, end_img_no):
+                norm_img = self.resize_norm_img(img_list[indices[ino]])
+                # Add a leading batch axis so the images can be concatenated.
+                norm_img = norm_img[np.newaxis, :]
+                norm_img_batch.append(norm_img)
+            norm_img_batch = np.concatenate(norm_img_batch).astype(np.float32)
+            starttime = time.time()
+            prob_out = self.infer(norm_img_batch)[0]
+            cls_result = self.postprocess_op(prob_out)
+            elapse += time.time() - starttime
+            for rno, (label, score) in enumerate(cls_result):
+                # indices[...] maps the sorted batch position back to the input position.
+                cls_res[indices[beg_img_no + rno]] = [label, score]
+                if "180" in label and score > self.cls_thresh:
+                    # Rotate code 1 is cv2.ROTATE_180 in OpenCV's RotateFlags enum.
+                    img_list[indices[beg_img_no + rno]] = cv2.rotate(
+                        img_list[indices[beg_img_no + rno]], 1
+                    )
+        return img_list, cls_res, elapse
+    def resize_norm_img(self, img: np.ndarray) -> np.ndarray:
+        """Resize ``img`` to the classifier height, normalize it, and pad it to the classifier width.
+
+        The aspect ratio is kept unless the resized width would exceed the
+        target width, in which case the width is capped. Pixel values are
+        mapped with ``(x / 255 - 0.5) / 0.5`` and the result is right-padded
+        with zeros to shape ``(img_c, img_h, img_w)``.
+        """
+        img_c, img_h, img_w = self.cls_image_shape
+        h, w = img.shape[:2]
+        ratio = w / float(h)
+        if math.ceil(img_h * ratio) > img_w:
+            resized_w = img_w
+        else:
+            resized_w = int(math.ceil(img_h * ratio))
+        resized_image = cv2.resize(img, (resized_w, img_h))
+        resized_image = resized_image.astype("float32")
+        if img_c == 1:
+            resized_image = resized_image / 255
+            # Add the missing channel axis in front.
+            resized_image = resized_image[np.newaxis, :]
+        else:
+            # Move the channel axis first: (H, W, C) -> (C, H, W).
+            resized_image = resized_image.transpose((2, 0, 1)) / 255
+        resized_image -= 0.5
+        resized_image /= 0.5
+        padding_im = np.zeros((img_c, img_h, img_w), dtype=np.float32)
+        padding_im[:, :, :resized_w] = resized_image
+        return padding_im
+if __name__ == "__main__":
+    # Command-line smoke test: classify one image and print every result.
+    cli = argparse.ArgumentParser()
+    cli.add_argument("--image_path", type=str, help="image_dir|image_path")
+    cli.add_argument("--config_path", type=str, default="config.yaml")
+    options = cli.parse_args()
+    classifier = TextClassifier(read_yaml(options.config_path))
+    image = cv2.imread(options.image_path)
+    img_list, cls_res, predict_time = classifier(image)
+    # One line of output per classified image, in input order.
+    for ino, _ in enumerate(img_list):
+        print(f"cls result:{cls_res[ino]}")

ch_ppocr_cls/utils.py ADDED Viewed

	@@ -0,0 +1,28 @@

+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import List, Tuple
+import numpy as np
+class ClsPostProcess:
+    """Turn classifier score rows into ``(label, score)`` pairs."""
+    def __init__(self, label_list: List[str]):
+        # Label names, looked up by the column index of the winning score.
+        self.label_list = label_list
+    def __call__(self, preds: np.ndarray) -> List[Tuple[str, float]]:
+        """Return the best label and its score for each row of ``preds``."""
+        best_columns = preds.argmax(axis=1)
+        decoded = []
+        for row, col in enumerate(best_columns):
+            decoded.append((self.label_list[col], preds[row, col]))
+        return decoded

ch_ppocr_det/__init__.py ADDED Viewed

	@@ -0,0 +1,4 @@

+# -*- encoding: utf-8 -*-
+# @Author: SWHL
+# @Contact: liekkaskono@163.com
+from .text_detect import TextDetector

ch_ppocr_det/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (200 Bytes). View file

ch_ppocr_det/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (229 Bytes). View file

ch_ppocr_det/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (233 Bytes). View file

ch_ppocr_det/__pycache__/__init__.cpython-313.pyc ADDED Viewed

Binary file (222 Bytes). View file

ch_ppocr_det/__pycache__/text_detect.cpython-310.pyc ADDED Viewed

Binary file (3.49 kB). View file

ch_ppocr_det/__pycache__/text_detect.cpython-311.pyc ADDED Viewed

Binary file (6.56 kB). View file

ch_ppocr_det/__pycache__/text_detect.cpython-312.pyc ADDED Viewed

Binary file (5.99 kB). View file

ch_ppocr_det/__pycache__/text_detect.cpython-313.pyc ADDED Viewed

Binary file (6.02 kB). View file

ch_ppocr_det/__pycache__/utils.cpython-310.pyc ADDED Viewed

Binary file (7.34 kB). View file