Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -12,106 +12,114 @@ from datetime import datetime
|
|
| 12 |
# ---------------------------------
|
| 13 |
st.set_page_config(page_title="Drone Object Detection", layout="wide")
|
| 14 |
st.title("π Drone Object Detection (Deformable DETR)")
|
| 15 |
-
st.write("π° Detect objects in drone footage using a Transformer-based DETR model.")
|
| 16 |
|
| 17 |
-
|
| 18 |
-
# π Status Display
|
| 19 |
-
# ---------------------------------
|
| 20 |
-
st.info("βοΈ Initializing app... this may take 2β5 minutes the first time.")
|
| 21 |
-
|
| 22 |
-
# ---------------------------------
|
| 23 |
-
# π Load Model with Caching
|
| 24 |
-
# ---------------------------------
|
| 25 |
-
@st.cache_resource(show_spinner="Loading Deformable DETR model (first time may take several minutes)...")
|
| 26 |
-
def load_model():
|
| 27 |
-
processor = AutoImageProcessor.from_pretrained("SenseTime/deformable-detr")
|
| 28 |
-
model = DeformableDetrForObjectDetection.from_pretrained("SenseTime/deformable-detr")
|
| 29 |
-
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 30 |
-
model = model.to(device)
|
| 31 |
-
return processor, model, device
|
| 32 |
-
|
| 33 |
-
processor, model, device = load_model()
|
| 34 |
-
st.success("β
Model loaded successfully!")
|
| 35 |
|
| 36 |
# ---------------------------------
|
| 37 |
-
# ποΈ Sidebar
|
| 38 |
# ---------------------------------
|
| 39 |
st.sidebar.header("βοΈ Options")
|
| 40 |
input_type = st.sidebar.radio("Select Input Type", ["ποΈ Video Upload", "π· Live Camera"])
|
| 41 |
save_output = st.sidebar.radio("πΎ Save detected video?", ["Yes", "No"])
|
| 42 |
-
capture_images = st.sidebar.checkbox("πΈ Capture
|
| 43 |
|
| 44 |
-
# Output dirs
|
| 45 |
output_dir = "drone_outputs"
|
| 46 |
os.makedirs(output_dir, exist_ok=True)
|
| 47 |
|
| 48 |
# ---------------------------------
|
| 49 |
-
#
|
| 50 |
# ---------------------------------
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
|
| 60 |
-
output_video_path = os.path.join(output_dir, f"detected_{timestamp}.avi")
|
| 61 |
-
output_image_dir = os.path.join(output_dir, f"captures_{timestamp}")
|
| 62 |
-
os.makedirs(output_image_dir, exist_ok=True)
|
| 63 |
-
|
| 64 |
-
if save_output == "Yes":
|
| 65 |
-
fourcc = cv2.VideoWriter_fourcc(*'XVID')
|
| 66 |
-
out = cv2.VideoWriter(output_video_path, fourcc, 20.0,
|
| 67 |
-
(int(cap.get(3)), int(cap.get(4))))
|
| 68 |
-
st.info("πΎ Saving detected video...")
|
| 69 |
-
|
| 70 |
-
frame_count = 0
|
| 71 |
-
st.info("π Running object detection... Please wait...")
|
| 72 |
-
|
| 73 |
-
while cap.isOpened():
|
| 74 |
-
ret, frame = cap.read()
|
| 75 |
-
if not ret:
|
| 76 |
-
break
|
| 77 |
-
|
| 78 |
-
frame_count += 1
|
| 79 |
-
image_pil = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
|
| 80 |
-
inputs = processor(images=image_pil, return_tensors="pt").to(device)
|
| 81 |
-
outputs = model(**inputs)
|
| 82 |
-
target_sizes = torch.tensor([image_pil.size[::-1]]).to(device)
|
| 83 |
-
results = processor.post_process_object_detection(outputs, target_sizes=target_sizes, threshold=0.6)[0]
|
| 84 |
-
|
| 85 |
-
draw = ImageDraw.Draw(image_pil)
|
| 86 |
-
for score, label, box in zip(results["scores"], results["labels"], results["boxes"]):
|
| 87 |
-
box = [round(i, 2) for i in box.tolist()]
|
| 88 |
-
draw.rectangle(box, outline="red", width=3)
|
| 89 |
-
draw.text((box[0], box[1]), f"{model.config.id2label[label.item()]} {round(score.item(), 2)}", fill="white")
|
| 90 |
-
|
| 91 |
-
annotated = cv2.cvtColor(np.array(image_pil), cv2.COLOR_RGB2BGR)
|
| 92 |
-
stframe.image(annotated, channels="BGR", use_container_width=True)
|
| 93 |
-
|
| 94 |
-
if save_output == "Yes":
|
| 95 |
-
out.write(annotated)
|
| 96 |
-
|
| 97 |
-
if capture_images and frame_count % 50 == 0:
|
| 98 |
-
capture_path = os.path.join(output_image_dir, f"capture_{frame_count}.jpg")
|
| 99 |
-
cv2.imwrite(capture_path, annotated)
|
| 100 |
-
|
| 101 |
-
cap.release()
|
| 102 |
-
if save_output == "Yes":
|
| 103 |
-
out.release()
|
| 104 |
-
st.success(f"β
Detected video saved at: `{output_video_path}`")
|
| 105 |
-
|
| 106 |
-
if capture_images:
|
| 107 |
-
st.info(f"πΈ Captured frames saved in: `{output_image_dir}`")
|
| 108 |
-
|
| 109 |
-
st.success("π Detection complete!")
|
| 110 |
|
| 111 |
# ---------------------------------
|
| 112 |
-
#
|
| 113 |
# ---------------------------------
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# ---------------------------------
# Page setup
# ---------------------------------
st.set_page_config(page_title="Drone Object Detection", layout="wide")
st.title("Drone Object Detection (Deformable DETR)")
st.write("Detect objects in drone footage using a Transformer-based Deformable DETR model.")

st.info("App ready. Click **Load Model and Start** to begin - the first load may take 2-5 min on Hugging Face.")

# ---------------------------------
# Sidebar
# ---------------------------------
st.sidebar.header("Options")
input_type = st.sidebar.radio("Select Input Type", ["Video Upload", "Live Camera"])
save_output = st.sidebar.radio("Save detected video?", ["Yes", "No"])
capture_images = st.sidebar.checkbox("Capture photos during detection", value=True)

# All artifacts (detected videos, captured frames) are written below this dir.
output_dir = "drone_outputs"
os.makedirs(output_dir, exist_ok=True)

# ---------------------------------
# Model loader (lazy, cached across reruns)
# ---------------------------------
@st.cache_resource(show_spinner=False)
def load_model():
    """Download and cache the Deformable DETR processor and model.

    Returns:
        tuple: ``(processor, model, device)`` where ``device`` is ``"cuda"``
        when available, otherwise ``"cpu"``. Cached by ``st.cache_resource``
        so the download happens at most once per server process.
    """
    with st.spinner("Downloading Deformable DETR model... please wait"):
        processor = AutoImageProcessor.from_pretrained("SenseTime/deformable-detr")
        model = DeformableDetrForObjectDetection.from_pretrained("SenseTime/deformable-detr")
    device = "cuda" if torch.cuda.is_available() else "cpu"
    model = model.to(device)
    return processor, model, device

# ---------------------------------
# Main flow: load model on click, then run detection
# ---------------------------------
# NOTE: a bare `if st.button(...)` is True for a single rerun only. Any widget
# rendered inside that branch (the file uploader below) triggers a new rerun
# on interaction, the button reverts to False, and the branch can never
# complete. Persist the click in session_state so the pipeline survives reruns.
if st.button("Load Model and Start"):
    st.session_state["detection_started"] = True

if st.session_state.get("detection_started"):
    # Keep the try minimal: only model loading is expected to fail here.
    try:
        processor, model, device = load_model()
    except Exception as e:
        st.error(f"Error loading model: {e}")
        st.stop()
    st.success("Model loaded successfully!")

    # ----- VIDEO UPLOAD -----
    if input_type == "Video Upload":
        video_file = st.file_uploader("Upload Drone Video", type=["mp4", "avi", "mov", "mkv"])
        if video_file:
            # Spool the upload to disk so OpenCV can open it by path.
            tfile = tempfile.NamedTemporaryFile(delete=False)
            tfile.write(video_file.read())
            tfile.close()  # flush/close before OpenCV reads it (required on Windows)
            cap = cv2.VideoCapture(tfile.name)
            stframe = st.empty()

            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
            output_video_path = os.path.join(output_dir, f"detected_{timestamp}.avi")
            output_image_dir = os.path.join(output_dir, f"captures_{timestamp}")
            os.makedirs(output_image_dir, exist_ok=True)

            if save_output == "Yes":
                fourcc = cv2.VideoWriter_fourcc(*'XVID')
                # Preserve the source frame rate when known; fall back to 20 fps
                # (cap.get returns 0.0 when the container reports no fps).
                fps = cap.get(cv2.CAP_PROP_FPS) or 20.0
                width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
                height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
                out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
                st.info("Saving detected video...")

            frame_count = 0
            st.info("Running object detection...")

            while cap.isOpened():
                ret, frame = cap.read()
                if not ret:
                    break

                frame_count += 1
                image_pil = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
                inputs = processor(images=image_pil, return_tensors="pt").to(device)
                with torch.no_grad():  # inference only: skip autograd bookkeeping
                    outputs = model(**inputs)
                # PIL's .size is (width, height); post-processing wants (h, w).
                target_sizes = torch.tensor([image_pil.size[::-1]]).to(device)
                results = processor.post_process_object_detection(
                    outputs, target_sizes=target_sizes, threshold=0.6
                )[0]

                # Draw one labelled red box per detection above the threshold.
                draw = ImageDraw.Draw(image_pil)
                for score, label, box in zip(results["scores"], results["labels"], results["boxes"]):
                    box = [round(i, 2) for i in box.tolist()]
                    draw.rectangle(box, outline="red", width=3)
                    draw.text(
                        (box[0], box[1]),
                        f"{model.config.id2label[label.item()]} {round(score.item(), 2)}",
                        fill="white"
                    )

                annotated = cv2.cvtColor(np.array(image_pil), cv2.COLOR_RGB2BGR)
                stframe.image(annotated, channels="BGR", use_container_width=True)

                if save_output == "Yes":
                    out.write(annotated)
                # Periodically snapshot an annotated frame to disk.
                if capture_images and frame_count % 50 == 0:
                    cv2.imwrite(
                        os.path.join(output_image_dir, f"capture_{frame_count}.jpg"),
                        annotated
                    )

            cap.release()
            os.remove(tfile.name)  # spooled upload is no longer needed
            if save_output == "Yes":
                out.release()
                st.success(f"Saved video: `{output_video_path}`")
            if capture_images:
                st.info(f"Captured frames in `{output_image_dir}`")

            st.success("Detection complete!")

    # ----- LIVE CAMERA -----
    elif input_type == "Live Camera":
        st.warning("Live camera is not supported on Hugging Face Spaces.\nRun locally instead:")
        st.code("streamlit run app.py", language="bash")
else:
    st.warning("Click **Load Model and Start** to begin detection.")