SAM3-Demo

Running

App Files Community

Translsis committed on Dec 23, 2025

Commit

e31d0be

verified ·

1 Parent(s): 7cae504

Update app.py

Browse files

Files changed (1) hide show

app.py +93 -48

app.py CHANGED Viewed

@@ -412,7 +412,7 @@ def process_image_job(job):
         'duration': f"{(datetime.now() - start).total_seconds():.2f}s"
     }
-@spaces.GPU
 def process_video_job(job):
     start = datetime.now()
     cap = cv2.VideoCapture(job['video'])
@@ -420,16 +420,21 @@ def process_video_job(job):
     w, h = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)), int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     frames = []
-    limit = job.get('frame_limit', 0)
     count = 0
     while cap.isOpened():
         ret, frame = cap.read()
-        if not ret or (limit > 0 and count >= limit):
             break
         frames.append(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
         count += 1
     cap.release()
     session = VID_PROCESSOR.init_video_session(video=frames, inference_device=device, dtype=torch.bfloat16)
     session = VID_PROCESSOR.add_text_prompt(inference_session=session, text=job['prompt'])
@@ -444,6 +449,8 @@ def process_video_job(job):
     ]
     total = len(frames)
     for idx, out in enumerate(VID_MODEL.propagate_in_video_iterator(inference_session=session, max_frame_num_to_track=total)):
         proc = VID_PROCESSOR.postprocess_outputs(session, out)
         orig = Image.fromarray(frames[out.frame_idx])
@@ -480,11 +487,19 @@ def process_video_job(job):
             writers[1].write(np.zeros((h, w, 3), dtype=np.uint8))
             writers[2].write(orig_bgr)
-        processing_results[job['id']]['progress'] = int((idx + 1) / total * 100)
     for w in writers:
         w.release()
     return {
         'output_path': out_path,
         'mask_video_path': mask_path,
@@ -530,49 +545,65 @@ def process_click_job(job):
 # ============ BACKGROUND WORKER ============
 def background_worker():
     while True:
-        job = processing_queue.get()
-        if job is None:
-            break
-        processing_results[job['id']] = {'status': 'processing', 'progress': 0}
         try:
-            if job['type'] == 'image':
-                result = process_image_job(job)
-            elif job['type'] == 'video':
-                result = process_video_job(job)
-            elif job['type'] == 'click':
-                result = process_click_job(job)
-            processing_results[job['id']] = {
-                'status': 'completed',
-                'result': result,
-                'progress': 100
-            }
-            save_history({
-                'id': job['id'],
-                'type': job['type'],
-                'prompt': job.get('prompt', 'N/A'),
-                'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
-                'status': 'completed',
-                **result
-            })
         except Exception as e:
-            processing_results[job['id']] = {
-                'status': 'error',
-                'error': str(e),
-                'progress': 0
-            }
-            save_history({
-                'id': job['id'],
-                'type': job['type'],
-                'prompt': job.get('prompt', 'N/A'),
-                'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
-                'status': 'error',
-                'error': str(e)
-            })
 threading.Thread(target=background_worker, daemon=True).start()
@@ -676,9 +707,17 @@ with gr.Blocks(css=custom_css, theme=app_theme, title="SAM3 Segmentation") as de
                         with gr.Accordion("⚙️ Settings", open=True):
                             vid_frames = gr.Slider(
                                 10, 500, 60, 10,
-                                label="Max Frames (0 = All frames)",
-                                info="Giới hạn số frame để xử lý nhanh hơn"
                             )
                         vid_submit = gr.Button("🚀 Submit Job (Background)", variant="primary", size="lg")
                         vid_check = gr.Button("🔍 Check Status", variant="secondary")
@@ -1019,9 +1058,15 @@ with gr.Blocks(css=custom_css, theme=app_theme, title="SAM3 Segmentation") as de
         """)
 if __name__ == "__main__":
     demo.launch(
-        css=custom_css,
-        theme=app_theme,
-        ssr_mode=False,
-        show_error=True
     )

         'duration': f"{(datetime.now() - start).total_seconds():.2f}s"
     }
+@spaces.GPU(duration=300)
 def process_video_job(job):
     start = datetime.now()
     cap = cv2.VideoCapture(job['video'])
     w, h = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH)), int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     frames = []
+    limit = job.get('frame_limit', 60)
+    if limit == 0:
+        limit = 999999
     count = 0
     while cap.isOpened():
         ret, frame = cap.read()
+        if not ret or count >= limit:
             break
         frames.append(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
         count += 1
     cap.release()
+    print(f"📹 Processing {len(frames)} frames...")
     session = VID_PROCESSOR.init_video_session(video=frames, inference_device=device, dtype=torch.bfloat16)
     session = VID_PROCESSOR.add_text_prompt(inference_session=session, text=job['prompt'])
     ]
     total = len(frames)
+    processed = 0
     for idx, out in enumerate(VID_MODEL.propagate_in_video_iterator(inference_session=session, max_frame_num_to_track=total)):
         proc = VID_PROCESSOR.postprocess_outputs(session, out)
         orig = Image.fromarray(frames[out.frame_idx])
             writers[1].write(np.zeros((h, w, 3), dtype=np.uint8))
             writers[2].write(orig_bgr)
+        processed += 1
+        progress = int((processed / total) * 100)
+        processing_results[job['id']]['progress'] = progress
+        # Log progress every 10%
+        if progress % 10 == 0:
+            print(f"⏳ Video progress: {progress}% ({processed}/{total} frames)")
     for w in writers:
         w.release()
+    print(f"✅ Video completed: {len(frames)} frames in {(datetime.now() - start).total_seconds():.2f}s")
     return {
         'output_path': out_path,
         'mask_video_path': mask_path,
 # ============ BACKGROUND WORKER ============
 def background_worker():
     while True:
         try:
+            job = processing_queue.get()
+            if job is None:
+                break
+            job_id = job['id']
+            job_type = job['type']
+            print(f"🚀 Starting job {job_id[:8]} - Type: {job_type}")
+            processing_results[job_id] = {'status': 'processing', 'progress': 0}
+            try:
+                if job_type == 'image':
+                    result = process_image_job(job)
+                elif job_type == 'video':
+                    result = process_video_job(job)
+                elif job_type == 'click':
+                    result = process_click_job(job)
+                processing_results[job_id] = {
+                    'status': 'completed',
+                    'result': result,
+                    'progress': 100
+                }
+                print(f"✅ Job {job_id[:8]} completed successfully")
+                save_history({
+                    'id': job_id,
+                    'type': job_type,
+                    'prompt': job.get('prompt', 'N/A'),
+                    'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
+                    'status': 'completed',
+                    **result
+                })
+            except Exception as e:
+                print(f"❌ Job {job_id[:8]} failed: {str(e)}")
+                import traceback
+                traceback.print_exc()
+                processing_results[job_id] = {
+                    'status': 'error',
+                    'error': str(e),
+                    'progress': 0
+                }
+                save_history({
+                    'id': job_id,
+                    'type': job_type,
+                    'prompt': job.get('prompt', 'N/A'),
+                    'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
+                    'status': 'error',
+                    'error': str(e)
+                })
         except Exception as e:
+            print(f"⚠️ Worker error: {e}")
+            import traceback
+            traceback.print_exc()
 threading.Thread(target=background_worker, daemon=True).start()
                         with gr.Accordion("⚙️ Settings", open=True):
                             vid_frames = gr.Slider(
                                 10, 500, 60, 10,
+                                label="Max Frames (Giảm để xử lý nhanh hơn)",
+                                info="Khuyến nghị: 30-60 frames cho video ngắn, 100-200 cho video dài"
                             )
+                            gr.Markdown("""
+                            **💡 Lưu ý xử lý video:**
+                            - Video chạy background, không bị timeout
+                            - Nhấn "Check Status" để xem progress
+                            - Video dài sẽ mất nhiều thời gian hơn
+                            - Giảm số frames nếu muốn xử lý nhanh
+                            """)
                         vid_submit = gr.Button("🚀 Submit Job (Background)", variant="primary", size="lg")
                         vid_check = gr.Button("🔍 Check Status", variant="secondary")
         """)
 if __name__ == "__main__":
+    print("🚀 Starting SAM3 Application...")
+    print(f"📁 Output directory: {OUTPUTS_DIR}")
+    print(f"📥 Downloads directory: {DOWNLOADS_DIR}")
+    print(f"📊 History file: {HISTORY_FILE}")
     demo.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        max_threads=10,
+        show_error=True,
+        share=False
     )