Spaces:

openvision
/

YOLO26

Runtime error

App Files Community

openvision committed on Jan 16

Commit

dbd2e13

verified ·

1 Parent(s): 48750e1

Update app.py

Browse files

Files changed (1) hide show

app.py +58 -29

app.py CHANGED Viewed

@@ -20,34 +20,34 @@ TASK_TO_REPO_TEMPLATE = {
 YOLOE_REPO_TEMPLATE = "openvision/yoloe26-{scale}-seg"
 model_cache = {}
 def _scale_from_ui_name(model_name: str) -> str:
-    """
-    Convert dropdown model string to scale token used in repo names.
-    Examples:
-        "YOLO26-N"  -> "n"
-        "YOLOE26-N" -> "n"
-    """
     return model_name.split("-")[-1].strip().lower()
 def _get_model(repo_id: str) -> YOLO:
-    """Download (if needed) and cache YOLO model from a repo that contains 'model.pt'."""
     cache_key = f"{repo_id}::model.pt"
     if cache_key not in model_cache:
-        weights_path = hf_hub_download(repo_id=repo_id, filename="model.pt")
         model_cache[cache_key] = YOLO(weights_path)
     return model_cache[cache_key]
 def predict_yolo26(image, model_name, task, conf, iou, retina):
-    """Run YOLO26 inference for various tasks."""
     scale = _scale_from_ui_name(model_name)
-    repo_tmpl = TASK_TO_REPO_TEMPLATE[task]
-    repo_id = repo_tmpl.format(scale=scale)
     model = _get_model(repo_id)
     use_retina = bool(retina) and task == "Segmentation"
@@ -60,35 +60,50 @@ def predict_yolo26(image, model_name, task, conf, iou, retina):
     return Image.fromarray(results[0].plot()[..., ::-1]), None
 def predict_yoloe26(image, model_name, classes_text, conf, retina):
-    """Run YOLOE26 open-vocabulary inference with text prompts."""
     scale = _scale_from_ui_name(model_name)
     repo_id = YOLOE_REPO_TEMPLATE.format(scale=scale)
-    model = _get_model(repo_id)
-    names = [c.strip() for c in classes_text.split(",") if c.strip()]
     model.set_classes(names, model.get_text_pe(names))
     res = model.predict(source=image, conf=conf, imgsz=640, retina_masks=bool(retina))[0]
     return Image.fromarray(res.plot()[..., ::-1])
 theme = gr.themes.Base().set(
-    button_primary_background_fill="#111F68", button_primary_background_fill_hover="#042AFF"
 )
-# Build interface
-with gr.Blocks(title="Ultralytics YOLO26 & YOLOE26 Demo") as demo:
     gr.Markdown(
         "# 🚀 Ultralytics YOLO26 & YOLOE26 Demo\n"
-        "Showcasing YOLO26 tasks and YOLOE26 open-vocabulary segmentation. "
-        "[GitHub](https://github.com/ultralytics/ultralytics) | [Docs](https://docs.ultralytics.com/models/yolo26/)"
     )
     with gr.Tabs():
         with gr.Tab("YOLO26 Tasks"):
-            gr.Markdown("### Ultralytics YOLO26: Detection, Segmentation, Pose, OBB, Classification")
             with gr.Row():
                 with gr.Column():
                     y26_image = gr.Image(type="pil", label="Upload Image")
@@ -100,6 +115,7 @@ with gr.Blocks(title="Ultralytics YOLO26 & YOLOE26 Demo") as demo:
                         y26_iou = gr.Slider(0, 1, value=0.45, label="IoU Threshold")
                         y26_retina = gr.Checkbox(value=True, label="Retina Masks", info="Higher quality masks, slower inference")
                     y26_btn = gr.Button("Run Inference", variant="primary")
                 with gr.Column():
                     y26_output = gr.Image(type="pil", label="Result")
                     y26_label = gr.Label(label="Classification Results", visible=False)
@@ -131,32 +147,45 @@ with gr.Blocks(title="Ultralytics YOLO26 & YOLOE26 Demo") as demo:
             )
         with gr.Tab("YOLOE26 Open-Vocabulary"):
-            gr.Markdown("### Ultralytics YOLOE26: Open-Vocabulary Segmentation - Detect any object by text description")
             with gr.Row():
                 with gr.Column():
                     ye_image = gr.Image(type="pil", label="Upload Image")
-                    with gr.Row():
-                        ye_model = gr.Dropdown(["YOLOE26-N"], value="YOLOE26-N", label="Model")
-                        ye_classes = gr.Textbox(label="Classes")
                     with gr.Accordion("Advanced Settings", open=False):
                         ye_conf = gr.Slider(0, 1, value=0.2, label="Confidence Threshold")
                         ye_retina = gr.Checkbox(value=True, label="Retina Masks", info="Higher quality masks, slower inference")
                     ye_btn = gr.Button("Run Inference", variant="primary")
                 with gr.Column():
                     ye_output = gr.Image(type="pil", label="Result")
             gr.Examples(
                 examples=[
                     [str(ASSETS / "bus.jpg"), "YOLOE26-N", "person, bus, car", 0.2, True],
                     [str(ASSETS / "zidane.jpg"), "YOLOE26-N", "person, football, grass", 0.2, True],
                 ],
                 inputs=[ye_image, ye_model, ye_classes, ye_conf, ye_retina],
                 outputs=ye_output,
                 fn=predict_yoloe26,
-                #cache_examples=True,
             )
-            ye_btn.click(predict_yoloe26, [ye_image, ye_model, ye_classes, ye_conf, ye_retina], ye_output)
 if __name__ == "__main__":
-    demo.launch(theme=theme, allowed_paths=[str(ASSETS), str(ASSETS.parent)])

 YOLOE_REPO_TEMPLATE = "openvision/yoloe26-{scale}-seg"
+weights_cache = {}
 model_cache = {}
 def _scale_from_ui_name(model_name: str) -> str:
     return model_name.split("-")[-1].strip().lower()
+def _get_weights(repo_id: str) -> str:
+    """Download (if needed) and cache model.pt path."""
+    cache_key = f"{repo_id}::model.pt"
+    if cache_key not in weights_cache:
+        weights_cache[cache_key] = hf_hub_download(repo_id=repo_id, filename="model.pt")
+    return weights_cache[cache_key]
 def _get_model(repo_id: str) -> YOLO:
+    """Download (if needed) and cache YOLO model (safe for YOLO26 tasks)."""
     cache_key = f"{repo_id}::model.pt"
     if cache_key not in model_cache:
+        weights_path = _get_weights(repo_id)
         model_cache[cache_key] = YOLO(weights_path)
     return model_cache[cache_key]
 def predict_yolo26(image, model_name, task, conf, iou, retina):
     scale = _scale_from_ui_name(model_name)
+    repo_id = TASK_TO_REPO_TEMPLATE[task].format(scale=scale)
     model = _get_model(repo_id)
     use_retina = bool(retina) and task == "Segmentation"
     return Image.fromarray(results[0].plot()[..., ::-1]), None
+def _parse_classes(classes_text: str):
+    if classes_text is None:
+        return []
+    names = [c.strip() for c in classes_text.split(",") if c.strip()]
+    # de-dup while preserving order
+    seen = set()
+    out = []
+    for n in names:
+        if n.lower() not in seen:
+            out.append(n)
+            seen.add(n.lower())
+    return out
 def predict_yoloe26(image, model_name, classes_text, conf, retina):
+    names = _parse_classes(classes_text)
+    if not names:
+        raise gr.Error("Enter at least 1 class (comma-separated). Example: 'cat, dog, bicycle'")
     scale = _scale_from_ui_name(model_name)
     repo_id = YOLOE_REPO_TEMPLATE.format(scale=scale)
+    weights_path = _get_weights(repo_id)
+    model = YOLO(weights_path)
     model.set_classes(names, model.get_text_pe(names))
     res = model.predict(source=image, conf=conf, imgsz=640, retina_masks=bool(retina))[0]
     return Image.fromarray(res.plot()[..., ::-1])
 theme = gr.themes.Base().set(
+    button_primary_background_fill="#111F68",
+    button_primary_background_fill_hover="#042AFF",
 )
+with gr.Blocks(title="Ultralytics YOLO26 & YOLOE26 Demo", theme=theme) as demo:
     gr.Markdown(
         "# 🚀 Ultralytics YOLO26 & YOLOE26 Demo\n"
+        "YOLO26 tasks + YOLOE26 open-vocabulary segmentation."
     )
     with gr.Tabs():
         with gr.Tab("YOLO26 Tasks"):
+            gr.Markdown("### Detection, Segmentation, Pose, OBB, Classification")
             with gr.Row():
                 with gr.Column():
                     y26_image = gr.Image(type="pil", label="Upload Image")
                         y26_iou = gr.Slider(0, 1, value=0.45, label="IoU Threshold")
                         y26_retina = gr.Checkbox(value=True, label="Retina Masks", info="Higher quality masks, slower inference")
                     y26_btn = gr.Button("Run Inference", variant="primary")
                 with gr.Column():
                     y26_output = gr.Image(type="pil", label="Result")
                     y26_label = gr.Label(label="Classification Results", visible=False)
             )
         with gr.Tab("YOLOE26 Open-Vocabulary"):
+            gr.Markdown("### Open-Vocabulary Segmentation (text prompts)")
             with gr.Row():
                 with gr.Column():
                     ye_image = gr.Image(type="pil", label="Upload Image")
+                    ye_model = gr.Dropdown(["YOLOE26-N"], value="YOLOE26-N", label="Model")
+                    ye_classes = gr.Textbox(
+                        label="Classes (comma-separated)",
+                        placeholder="e.g. cat, dog, bicycle",
+                        value="person, bus, car",
+                    )
                     with gr.Accordion("Advanced Settings", open=False):
                         ye_conf = gr.Slider(0, 1, value=0.2, label="Confidence Threshold")
                         ye_retina = gr.Checkbox(value=True, label="Retina Masks", info="Higher quality masks, slower inference")
                     ye_btn = gr.Button("Run Inference", variant="primary")
                 with gr.Column():
                     ye_output = gr.Image(type="pil", label="Result")
+            ye_prompt_state = gr.State(ye_classes.value)
+            ye_classes.change(lambda s: s, ye_classes, ye_prompt_state)
             gr.Examples(
                 examples=[
                     [str(ASSETS / "bus.jpg"), "YOLOE26-N", "person, bus, car", 0.2, True],
                     [str(ASSETS / "zidane.jpg"), "YOLOE26-N", "person, football, grass", 0.2, True],
+                    [str(ASSETS / "bus.jpg"), "YOLOE26-N", "bicycle, traffic light, road", 0.2, True],
                 ],
                 inputs=[ye_image, ye_model, ye_classes, ye_conf, ye_retina],
                 outputs=ye_output,
                 fn=predict_yoloe26,
             )
+            ye_btn.click(
+                predict_yoloe26,
+                [ye_image, ye_model, ye_prompt_state, ye_conf, ye_retina],
+                ye_output,
+            )
 if __name__ == "__main__":
+    demo.launch(allowed_paths=[str(ASSETS), str(ASSETS.parent)])