Upload gradio demo

Browse files

Files changed (8) hide show

.gitattributes +1 -0
README.md +32 -21
assert/gradio_demo.jpg +0 -0
experiment/gradio_x2.avi +0 -0
python/__pycache__/common.cpython-313.pyc +0 -0
python/__pycache__/imgproc.cpython-313.pyc +0 -0
python/gradio_demo.py +326 -0
video/gradio.png +3 -0

.gitattributes CHANGED Viewed

@@ -43,3 +43,4 @@ model_convert/axmodel/espcn_x2_T9_2k.axmodel filter=lfs diff=lfs merge=lfs -text
 model_convert/axmodel/620/edsr_x2_small_1.axmodel filter=lfs diff=lfs merge=lfs -text
 model_convert/axmodel/620/edsr_x2_small_2.axmodel filter=lfs diff=lfs merge=lfs -text
 *.axmodel filter=lfs diff=lfs merge=lfs -text

 model_convert/axmodel/620/edsr_x2_small_1.axmodel filter=lfs diff=lfs merge=lfs -text
 model_convert/axmodel/620/edsr_x2_small_2.axmodel filter=lfs diff=lfs merge=lfs -text
 *.axmodel filter=lfs diff=lfs merge=lfs -text
+video/gradio.png filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -38,28 +38,17 @@ Download all files from this repository to the device
 ```
-root@ax650:~/SuperResolution# tree
 .
-|-- model_convert
-|	-- axmodel
-|   	`-- edsr_baseline_x2_1.axmodel
-|   	`-- espcn_x2_T9.axmodel
-|	-- onnx
-|   	`-- edsr_baseline_x2_1.onnx
-|   	`-- espcn_x2_T9.onnx
-|   `-- build_config_edsr.json
-|   `-- build_config_espcn.json
-|-- python
-|   `-- run_onnx.py
-|   `-- run_axmodel.py
-|   `-- common.py
-|   `-- imgproc.py
-|-- video
-|   `-- test_1920x1080.mp4
-|   `-- 1.png
-|   `-- 2.png
 ```
 ### Requirements
@@ -98,6 +87,7 @@ Average time: 0.373 seconds for each frame
 ```
 The output file in `experiment/test_1920x1080_x2.avi`
 Output Data:
@@ -106,4 +96,25 @@ Output Data:
 │   └── test_1920x1080_x2.avi
 ```
-![Example Image](video/2.png)

 ```
+root@ax650:~/SuperResolution# tree -L 1
 .
+├── assert
+├── config.json
+├── experiment
+├── model_convert
+├── python
+├── README.md
+└── video
+6 directories, 2 files
 ```
 ### Requirements
 ```
 The output file in `experiment/test_1920x1080_x2.avi`
+![Example Image](video/2.png)
 Output Data:
 │   └── test_1920x1080_x2.avi
 ```
+#### Inference with M.2 Accelerator card
+```bash
+$ cd python
+$ python gradio_demo.py
+[INFO] Available providers:  ['AXCLRTExecutionProvider']
+[INFO] Using provider: AXCLRTExecutionProvider
+[INFO] SOC Name: AX650N
+[INFO] VNPU type: VNPUType.DISABLED
+[INFO] Compiler version: 4.2 6bff2f67
+[INFO] Using provider: AXCLRTExecutionProvider
+[INFO] SOC Name: AX650N
+[INFO] VNPU type: VNPUType.DISABLED
+[INFO] Compiler version: 4.2 6bff2f67
+* Running on local URL:  http://0.0.0.0:7860
+* To create a public link, set `share=True` in `launch()`.
+```
+Then use the M.2 Accelerator card IP instead of the 0.0.0.0, and use chrome open the URL: http://[your ip]:7860
+![gradio_demo](./assert/gradio_demo.jpg)

assert/gradio_demo.jpg ADDED Viewed

experiment/gradio_x2.avi ADDED Viewed

Binary file (32.2 kB). View file

python/__pycache__/common.cpython-313.pyc ADDED Viewed

Binary file (4.47 kB). View file

python/__pycache__/imgproc.cpython-313.pyc ADDED Viewed

Binary file (32.1 kB). View file

python/gradio_demo.py ADDED Viewed

	@@ -0,0 +1,326 @@

+import gradio as gr
+import cv2
+import numpy as np
+import os
+import tempfile
+import time
+import axengine as axe
+import common
+import imgproc
+rgb_range=255
+scale=2
+def from_numpy(x):
+    return x if isinstance(x, np.ndarray) else np.array(x)
+def quantize(img, rgb_range):
+    pixel_range = 255 / rgb_range
+    return np.round(np.clip(img * pixel_range, 0, 255)) / pixel_range
+# 初始化EDSR和ESPCN模型
+def init_SRmodel(EDSR_path="../model_convert/axmodel/edsr_baseline_x2_1.axmodel",
+                 ESPCN_path="../model_convert/axmodel/espcn_x2_T9.axmodel"):
+    EDSR_session = axe.InferenceSession(EDSR_path)
+    ESPCN_session = axe.InferenceSession(ESPCN_path)
+    return [EDSR_session, ESPCN_session]
+SR_sessions=init_SRmodel()
+def EDSR_infer(frame, EDSR_session=SR_sessions[0]):
+    output_names = [x.name for x in EDSR_session.get_outputs()]
+    input_name = EDSR_session.get_inputs()[0].name
+    lr_y_image, = common.set_channel(frame, n_channels=3)
+    lr_y_image, = common.np_prepare(lr_y_image, rgb_range=rgb_range)
+    sr = EDSR_session.run(output_names, {input_name: lr_y_image})
+    if isinstance(sr, (list, tuple)):
+        sr = from_numpy(sr[0]) if len(sr) == 1 else [from_numpy(x) for x in sr]
+    else:
+        sr = from_numpy(sr)
+    sr = quantize(sr, rgb_range).squeeze(0)
+    normalized = sr * 255 / rgb_range
+    ndarr = normalized.transpose(1, 2, 0).astype(np.uint8)
+    return ndarr
+def ESPCN_infer(frame, ESPCN_session=SR_sessions[1]):
+    output_names = [x.name for x in ESPCN_session.get_outputs()]
+    input_name = ESPCN_session.get_inputs()[0].name
+    lr_y_image, lr_cb_image, lr_cr_image = imgproc.preprocess_one_frame(frame)
+    bic_cb_image = cv2.resize(lr_cb_image,
+                (int(lr_cb_image.shape[1] * scale),
+                int(lr_cb_image.shape[0] * scale)),
+                interpolation=cv2.INTER_CUBIC)
+    bic_cr_image = cv2.resize(lr_cr_image,
+                (int(lr_cr_image.shape[1] * scale),
+                int(lr_cr_image.shape[0] * scale)),
+                interpolation=cv2.INTER_CUBIC)
+    sr = ESPCN_session.run(output_names, {input_name: lr_y_image})
+    if isinstance(sr, (list, tuple)):
+        sr = from_numpy(sr[0]) if len(sr) == 1 else [from_numpy(x) for x in sr]
+    else:
+        sr = from_numpy(sr)
+    ndarr = imgproc.array_to_image(sr)
+    sr_y_image = ndarr.astype(np.float32) / 255.0
+    sr_ycbcr_image = cv2.merge([sr_y_image[:, :, 0], bic_cb_image, bic_cr_image])
+    sr_image = imgproc.ycbcr_to_bgr(sr_ycbcr_image)
+    sr_image = np.clip(sr_image* 255.0, 0 , 255).astype(np.uint8)
+    return sr_image
+# ======================
+# 模拟超分辨率模型
+# ======================
+def EDSR_MODEL(input_data, is_video=False):
+    if is_video:
+        output_frames = []
+        for frame in input_data:
+            out = EDSR_infer(frame=frame)
+            output_frames.append(out)
+        return output_frames
+    else:
+        out = EDSR_infer(frame=input_data)
+        return out
+def ESPCN_MODEL(input_data, is_video=False):
+    if is_video:
+        output_frames = []
+        for frame in input_data:
+            out = ESPCN_infer(frame=frame)
+            output_frames.append(out)
+        return output_frames
+    else:
+        out = ESPCN_infer(frame=input_data)
+        return out
+# ======================
+# 全局状态（单用户）
+# ======================
+class AppState:
+    def __init__(self):
+        self.original_img = None    # 原始图（BGR, 高分辨率）
+        self.sr_img = None          # 超分图（BGR, 高分辨率）
+        self.is_video = False
+app_state = AppState()
+# ======================
+# 核心处理函数
+# ======================
+def process_super_resolution(input_file, model_choice):
+    global app_state
+    if input_file is None:
+        raise gr.Error("请先上传图片或视频！")
+    file_path = input_file
+    app_state = AppState()
+    info_text = ""
+    is_video = any(ext in file_path.lower() for ext in ['.mp4', '.avi', '.mov', '.mkv'])
+    if is_video:
+        # --- 视频处理（直接保存高分辨率）---
+        cap = cv2.VideoCapture(file_path)
+        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+        fps = cap.get(cv2.CAP_PROP_FPS)
+        info_text += f"🎬 视频信息:\n- 总帧数: {total_frames}\n- 帧率: {fps:.2f} FPS\n"
+        frames = []
+        while True:
+            ret, frame = cap.read()
+            if not ret:
+                break
+            frames.append(frame)
+        cap.release()
+        model_func = EDSR_MODEL if model_choice == "EDSR_MODEL" else ESPCN_MODEL
+        start_time = time.time()
+        output_data = model_func(frames, is_video=True)
+        infer_time = time.time() - start_time
+        info_text += f"\n⏱️ 推理时间: {infer_time:.2f} 秒\n"
+        full_video_path = os.path.join(tempfile.gettempdir(), f"sr_video_x2.mp4")
+        h_out, w_out = output_data[0].shape[:2]
+        info_text += f"- 超分后尺寸: {w_out} x {h_out}\n"
+        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+        out_video = cv2.VideoWriter(full_video_path, fourcc, fps, (w_out, h_out))
+        for frame in output_data:
+            out_video.write(frame)
+        out_video.release()
+        app_state.is_video = True
+        return (
+            gr.update(value=None, visible=False),  # image_display
+            gr.update(visible=False),              # btn_original
+            gr.update(visible=False),              # btn_sr
+            gr.update(value="当前: 无", visible=False),
+            gr.update(value=full_video_path, visible=True),
+            gr.update(value=full_video_path, visible=True),
+            gr.update(visible=False),
+            info_text
+        )
+    else:
+        # --- 图片处理（保存原始高分辨率）---
+        img = cv2.imread(file_path)
+        if img is None:
+            raise gr.Error("无法读取图片！")
+        h, w = img.shape[:2]
+        info_text += f"🖼️ 图片信息:\n- 原始尺寸: {w} x {h}\n"
+        app_state.original_img = img.copy()
+        model_func = EDSR_MODEL if model_choice == "EDSR_MODEL" else ESPCN_MODEL
+        start_time = time.time()
+        sr_img = model_func(img, is_video=False)
+        infer_time = time.time() - start_time
+        info_text += f"\n⏱️ 推理时间: {infer_time:.2f} 秒\n"
+        h_out, w_out = sr_img.shape[:2]
+        info_text += f"- 超分后尺寸: {w_out} x {h_out}\n"
+        sr_img_path = os.path.join(tempfile.gettempdir(), f"sr_image_x2.png")
+        cv2.imwrite(sr_img_path, sr_img)
+        app_state.sr_img = sr_img
+        app_state.is_video = False
+        # 默认显示原图（高分辨率，但 UI 会限制尺寸）
+        return (
+            gr.update(value=app_state.original_img[:, :, ::-1], visible=True),  # BGR→RGB
+            gr.update(visible=True),
+            gr.update(visible=True),
+            gr.update(value="当前: 原图", visible=True),
+            gr.update(visible=False),
+            gr.update(visible=False),
+            gr.update(value=sr_img_path, visible=True),
+            info_text
+        )
+# ======================
+# 切换显示函数（直接使用原始高分辨率图）
+# ======================
+def show_original():
+    if app_state.original_img is None:
+        return gr.update(), gr.update()
+    # OpenCV BGR → RGB
+    rgb_img = app_state.original_img[:, :, ::-1]
+    return gr.update(value=rgb_img), gr.update(value="当前: 原图")
+def show_sr():
+    if app_state.sr_img is None:
+        return gr.update(), gr.update()
+    rgb_img = app_state.sr_img[:, :, ::-1]
+    return gr.update(value=rgb_img), gr.update(value="当前: 超分图")
+# ======================
+# Gradio UI
+# ======================
+with gr.Blocks(title="超分辨率可视化工具", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("## 🚀 超分辨率模型效果可视化")
+    gr.Markdown("上传图片或视频，选择模型，点击箭头切换原图/超分图！")
+    input_file = gr.File(
+        label="📂 上传图片或视频",
+        file_types=["image", "video"],
+        file_count="single"
+    )
+    with gr.Row():
+        model_choice = gr.Radio(
+            choices=["EDSR_MODEL", "ESPCN_MODEL"],
+            value="EDSR_MODEL",
+            label="🔍 选择超分辨率模型"
+        )
+        run_btn = gr.Button("🚀 开始超分", variant="primary")
+    # 图片区：硬性限定尺寸，直接显示原始高分辨率图
+    with gr.Column(visible=False) as image_section:
+        image_label = gr.Textbox(value="当前: 原图", interactive=False, lines=1)
+        image_display = gr.Image(
+            label="🖼️ 图像显示",
+            width=800,    # 👈 固定宽度
+            height=600    # 👈 固定高度
+        )
+        with gr.Row():
+            btn_original = gr.Button("◀ 原图")
+            btn_sr = gr.Button("超分图 ▶")
+    # 视频区：硬性限定高度
+    output_video_player = gr.Video(
+        label="▶️ 超分视频（高分辨率）",
+        visible=False,
+        height=450  # 宽度自适应，高度固定
+    )
+    with gr.Row():
+        download_image = gr.File(label="📥 下载超分图片（原图）", visible=False)
+        download_video = gr.File(label="📥 下载超分视频（完整分辨率）", visible=False)
+    info_box = gr.Textbox(label="📊 处理信息", lines=6, interactive=False)
+    run_btn.click(
+        fn=process_super_resolution,
+        inputs=[input_file, model_choice],
+        outputs=[
+            image_display,
+            btn_original,
+            btn_sr,
+            image_label,
+            output_video_player,
+            download_video,
+            download_image,
+            info_box
+        ]
+    )
+    btn_original.click(show_original, outputs=[image_display, image_label])
+    btn_sr.click(show_sr, outputs=[image_display, image_label])
+    def toggle_ui(file):
+        if file is None:
+            return (
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=False)
+            )
+        if any(ext in file.lower() for ext in ['.mp4', '.avi', '.mov', '.mkv']):
+            return (
+                gr.update(visible=False),
+                gr.update(visible=False),
+                gr.update(visible=True),
+                gr.update(visible=True)
+            )
+        else:
+            return (
+                gr.update(visible=True),
+                gr.update(visible=True),
+                gr.update(visible=False),
+                gr.update(visible=False)
+            )
+    input_file.change(
+        fn=toggle_ui,
+        inputs=input_file,
+        outputs=[
+            image_section,
+            download_image,
+            output_video_player,
+            download_video
+        ]
+    )
+if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860)

video/gradio.png ADDED Viewed

Git LFS Details

SHA256: 727a7d51411a1c32525a2c42662758ae952915b62ff06c7fb18488ffbdba3b22
Pointer size: 132 Bytes
Size of remote file: 2.07 MB