Spaces:

djl234
/

GDNet_2025

Sleeping

App Files Files Community

djl234 committed on Mar 17, 2025

Commit

eb9155a

verified ·

1 Parent(s): 2d1e815

Update app.py

Browse files

[feat]box interactive seg

Files changed (1) hide show

app.py +53 -43

app.py CHANGED Viewed

@@ -30,7 +30,6 @@ def show_coord(evt: gr.SelectData):
 def generate_mask(img, coord):
     #x, y = map(int, coord.split(','))
     #
     mask = sepia((img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8), stack_image=False)
     mask = F.interpolate(torch.from_numpy(mask).unsqueeze(0).unsqueeze(0),size=[img.shape[0],img.shape[1]],mode='bilinear').squeeze().numpy()
@@ -45,44 +44,6 @@ def generate_mask(img, coord):
     mix = (1-mask_torch)*img+mask_torch*img*0.5+mask_torch*col*0.5
     return mix.numpy().astype(np.uint8)#overlay_mask(img, mask)
-# Blend a mask over an image: the mask is cast to float32, resized to the
-# image's width/height, expanded to three channels if it is 2-D, and mixed
-# as 0.7 * img + 0.3 * mask; the result is returned as uint8.
-def overlay_mask(img, mask):
-    # Pre-checks (per the data-validation approach in reference page 1)
-    assert mask is not None, "掩码数据为空"
-    assert img.size > 0 and mask.size > 0, "输入图像或掩码尺寸异常"
-    # Force the dtype to float32 (per the floating-point requirement in reference page 2)
-    mask_float = mask.astype(np.float32) if mask.dtype != np.float32 else mask
-    # Collapse dimensions (handles 4-D mask arrays)
-    if mask_float.ndim == 4:
-        mask_float = np.squeeze(mask_float, axis=(0,1))  # drop axes 0 and 1 (batch and channel, per the original note)
-    # Resize to the image size (per the best practice in reference page 3)
-    try:
-        mask_resized = cv2.resize(
-            mask_float,
-            (img.shape[1], img.shape[0]),
-            interpolation=cv2.INTER_CUBIC  # higher-order interpolation to preserve defect edges
-        )
-    except cv2.error as e:
-        print(f"Resize参数异常: 原图尺寸{img.shape} 掩码尺寸{mask.shape}")
-        raise
-    # Unify channels (align the mask to three channels)
-    if len(mask_resized.shape) == 2:
-        mask_rgb = cv2.cvtColor(mask_resized, cv2.COLOR_GRAY2BGR)
-    else:
-        mask_rgb = mask_resized
-    # Normalise both inputs to [0, 1] before blending, then scale back to 0-255
-    # NOTE(review): assumes mask values are on a 0-255 scale — confirm with the caller
-    return (cv2.addWeighted(
-        img.astype(np.float32)/255,
-        0.7,
-        mask_rgb.astype(np.float32)/255,
-        0.3,
-        0
-    )*255).astype(np.uint8)
 def create_mode2_interface():
     with gr.Blocks() as mode2:
         with gr.Column():
@@ -115,6 +76,39 @@ def create_mode2_interface():
             outputs=mask_output
         )
     return mode2
 #import argparse
 device='cpu'
 net = build_model(device).to(device)
@@ -227,7 +221,7 @@ def create_mode1_interface():
 with gr.Blocks(title="交互式图像组分割系统") as demo:
     # 模式选择器
-    mode = gr.Radio(["多图协同分割", "点提示交互分割"],
                    value="多图协同分割",
                    label="运行模式")
@@ -246,13 +240,29 @@ with gr.Blocks(title="交互式图像组分割系统") as demo:
                 outputs=output_img
             )
-        with gr.Tab("点选模式", id=1) as tab2:
             # 模式2界面组件
             img_input = gr.Image(type="numpy", label="点击上传图片并选择点")
             coord_store = gr.Textbox(visible=False)
             mask_btn = gr.Button("生成分割掩码")
             mask_output = gr.Image(label="分割结果")
             @img_input.select(inputs=[], outputs=coord_store)
             def store_coordinate(evt: gr.SelectData):
                 return f"{evt.index[0]},{evt.index[1]}"
@@ -265,9 +275,9 @@ with gr.Blocks(title="交互式图像组分割系统") as demo:
     # 动态显示控制
     mode.change(
-        lambda x: (gr.update(visible=x=="多图协同分割"), gr.update(visible=x=="点提示交互分割")),
         inputs=mode,
-        outputs=[tab1, tab2]
     )
 demo.launch(debug=True)

 def generate_mask(img, coord):
     #x, y = map(int, coord.split(','))
     #
     mask = sepia((img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8),(img*0.999999).astype(np.uint8), stack_image=False)
     mask = F.interpolate(torch.from_numpy(mask).unsqueeze(0).unsqueeze(0),size=[img.shape[0],img.shape[1]],mode='bilinear').squeeze().numpy()
     mix = (1-mask_torch)*img+mask_torch*img*0.5+mask_torch*col*0.5
     return mix.numpy().astype(np.uint8)#overlay_mask(img, mask)
 def create_mode2_interface():
     with gr.Blocks() as mode2:
         with gr.Column():
             outputs=mask_output
         )
     return mode2
+def create_mode3_interface():
+    with gr.Blocks() as mode2:
+        with gr.Column():
+            img_input = gr.Image(
+                type="numpy",
+                sources=["upload"],  # 正确复数形式参数[2](@ref)
+                label="点击上传图片并选择框",
+                interactive=True
+            )
+            # 坐标存储组件
+            coord_store = gr.Textbox(visible=False)
+            # 绑定点击事件
+            @img_input.select(inputs=[], outputs=coord_store)
+            def capture_coordinates(evt: gr.SelectData):
+                return f"{evt.index[0]},{evt.index[1]}"
+            # 修改3：正确绑定点击事件
+            @img_input.select(inputs=img_input, outputs=coord_store)
+            def store_coordinate(evt: gr.SelectData):
+                return f"{evt.index[0]},{evt.index[1]}"
+            btn = gr.Button("生成分割掩码")
+            mask_output = gr.Image(label="分割结果")
+        btn.click(
+            generate_mask,
+            inputs=[img_input, coord_store],
+            outputs=mask_output
+        )
+    return mode2
 #import argparse
 device='cpu'
 net = build_model(device).to(device)
 with gr.Blocks(title="交互式图像组分割系统") as demo:
     # 模式选择器
+    mode = gr.Radio(["多图协同分割", "点提示交互分割","框提示交互分割"],
                    value="多图协同分割",
                    label="运行模式")
                 outputs=output_img
             )
+        with gr.Tab("点选交互模式", id=1) as tab2:
             # 模式2界面组件
             img_input = gr.Image(type="numpy", label="点击上传图片并选择点")
             coord_store = gr.Textbox(visible=False)
             mask_btn = gr.Button("生成分割掩码")
             mask_output = gr.Image(label="分割结果")
+            @img_input.select(inputs=[], outputs=coord_store)
+            def store_coordinate(evt: gr.SelectData):
+                return f"{evt.index[0]},{evt.index[1]}"
+            mask_btn.click(
+                generate_mask,
+                inputs=[img_input, coord_store],
+                outputs=mask_output
+            )
+        with gr.Tab("框选交互模式", id=2) as tab3:
+            # 模式2界面组件
+            img_input = gr.Image(type="numpy", label="点击上传图片并选择框")
+            coord_store = gr.Textbox(visible=False)
+            mask_btn = gr.Button("生成分割掩码")
+            mask_output = gr.Image(label="分割结果")
             @img_input.select(inputs=[], outputs=coord_store)
             def store_coordinate(evt: gr.SelectData):
                 return f"{evt.index[0]},{evt.index[1]}"
     # 动态显示控制
     mode.change(
+        lambda x: (gr.update(visible=x=="多图协同分割"), gr.update(visible=x=="点提示交互分割"), gr.update(visible=x=="框提示交互分割")),
         inputs=mode,
+        outputs=[tab1, tab2, tab3]
     )
 demo.launch(debug=True)