support for multi-iamge
Browse files
app.py
CHANGED
|
@@ -63,31 +63,38 @@ def segment_reference(image, click):
|
|
| 63 |
|
| 64 |
return masks
|
| 65 |
|
| 66 |
-
def segment_target(
|
| 67 |
-
|
| 68 |
ref_image = np.array(ref_image)
|
| 69 |
-
state = sam_utils.load_masks(sam2_vid,
|
| 70 |
-
out = sam_utils.propagate_masks(sam2_vid, state)[
|
| 71 |
-
return
|
| 72 |
|
| 73 |
def on_reference_upload(img):
|
| 74 |
global click_coords
|
| 75 |
click_coords = [] # clear the clicks
|
| 76 |
return "Click Info: Cleared (new image uploaded)"
|
| 77 |
|
| 78 |
-
def visualize_segmentation(image, masks,
|
| 79 |
# Visualize the segmentation result
|
| 80 |
-
|
| 81 |
-
ax
|
|
|
|
|
|
|
|
|
|
| 82 |
for i, mask in enumerate(masks):
|
| 83 |
-
sam_utils.show_mask(mask, ax[0], obj_id=i, alpha=0.75)
|
| 84 |
-
ax[0].axis('off')
|
| 85 |
-
ax[0].set_title("Reference Image with Expert Segmentation")
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 91 |
# save it to buffer
|
| 92 |
plt.tight_layout()
|
| 93 |
buf = BytesIO()
|
|
@@ -106,12 +113,18 @@ def record_click(img, evt: gr.SelectData):
|
|
| 106 |
click_coords.append([evt.index[0], evt.index[1]])
|
| 107 |
return f"Clicked at: {click_coords}"
|
| 108 |
|
| 109 |
-
def generate(reference_image,
|
|
|
|
| 110 |
if not click_coords:
|
| 111 |
return None, "Click on the reference image first!"
|
|
|
|
|
|
|
|
|
|
| 112 |
ref_mask = segment_reference(reference_image, click_coords)
|
| 113 |
-
|
| 114 |
-
vis = visualize_segmentation(reference_image, ref_mask,
|
|
|
|
|
|
|
| 115 |
return vis, "Done!"
|
| 116 |
|
| 117 |
with gr.Blocks() as demo:
|
|
@@ -119,7 +132,7 @@ with gr.Blocks() as demo:
|
|
| 119 |
|
| 120 |
with gr.Row():
|
| 121 |
reference_img = gr.Image(type="pil", label="Reference Image")
|
| 122 |
-
target_img = gr.
|
| 123 |
|
| 124 |
click_info = gr.Textbox(label="Click Info")
|
| 125 |
generate_btn = gr.Button("Generate")
|
|
|
|
| 63 |
|
| 64 |
return masks
|
| 65 |
|
| 66 |
+
def segment_target(target_images, ref_image, ref_mask):
|
| 67 |
+
target_images = [np.array(target_image) for target_image in target_images]
|
| 68 |
ref_image = np.array(ref_image)
|
| 69 |
+
state = sam_utils.load_masks(sam2_vid, target_images, ref_image, ref_mask)
|
| 70 |
+
out = sam_utils.propagate_masks(sam2_vid, state)[1:]
|
| 71 |
+
return [mask['segmentation'] for mask in out]
|
| 72 |
|
| 73 |
def on_reference_upload(img):
|
| 74 |
global click_coords
|
| 75 |
click_coords = [] # clear the clicks
|
| 76 |
return "Click Info: Cleared (new image uploaded)"
|
| 77 |
|
| 78 |
+
def visualize_segmentation(image, masks, target_images, target_masks):
|
| 79 |
# Visualize the segmentation result
|
| 80 |
+
num_tgt = len(target_images)
|
| 81 |
+
fig, ax = plt.subplots(2, num_tgt, figsize=(6*num_tgt, 12))
|
| 82 |
+
if num_tgt == 1:
|
| 83 |
+
ax = np.expand_dims(ax, axis=1)
|
| 84 |
+
ax[0][0].imshow(image.convert("L"), cmap='gray')
|
| 85 |
for i, mask in enumerate(masks):
|
| 86 |
+
sam_utils.show_mask(mask, ax[0][0], obj_id=i, alpha=0.75)
|
| 87 |
+
ax[0][0].axis('off')
|
| 88 |
+
ax[0][0].set_title("Reference Image with Expert Segmentation")
|
| 89 |
+
for i in range(1, num_tgt):
|
| 90 |
+
# set the rest to empty
|
| 91 |
+
ax[0][i].axis('off')
|
| 92 |
+
for i in range(num_tgt):
|
| 93 |
+
ax[1][i].imshow(target_images[i].convert("L"), cmap='gray')
|
| 94 |
+
for j, mask in enumerate(target_masks[i]):
|
| 95 |
+
sam_utils.show_mask(mask, ax[1][i], obj_id=j, alpha=0.75)
|
| 96 |
+
ax[1][i].axis('off')
|
| 97 |
+
ax[1][i].set_title("Target Image with Inferred Segmentation")
|
| 98 |
# save it to buffer
|
| 99 |
plt.tight_layout()
|
| 100 |
buf = BytesIO()
|
|
|
|
| 113 |
click_coords.append([evt.index[0], evt.index[1]])
|
| 114 |
return f"Clicked at: {click_coords}"
|
| 115 |
|
| 116 |
+
def generate(reference_image, target_images):
|
| 117 |
+
global click_coords
|
| 118 |
if not click_coords:
|
| 119 |
return None, "Click on the reference image first!"
|
| 120 |
+
|
| 121 |
+
target_images = [Image.open(f.name).convert("RGB").resize((1024,1024)) for f in target_images]
|
| 122 |
+
|
| 123 |
ref_mask = segment_reference(reference_image, click_coords)
|
| 124 |
+
tgt_masks = segment_target(target_images, reference_image, ref_mask)
|
| 125 |
+
vis = visualize_segmentation(reference_image, ref_mask, target_images, tgt_masks)
|
| 126 |
+
# clear the clicks
|
| 127 |
+
click_coords = []
|
| 128 |
return vis, "Done!"
|
| 129 |
|
| 130 |
with gr.Blocks() as demo:
|
|
|
|
| 132 |
|
| 133 |
with gr.Row():
|
| 134 |
reference_img = gr.Image(type="pil", label="Reference Image")
|
| 135 |
+
target_img = gr.File(file_types=["image"], file_count="multiple", label="Target Images")
|
| 136 |
|
| 137 |
click_info = gr.Textbox(label="Click Info")
|
| 138 |
generate_btn = gr.Button("Generate")
|