Spaces:

AutoFramingSoftware
/

afs-backend

Sleeping

App Files Files Community

GeraldoRiberia commited on Feb 24

Commit

679b5d0

1 Parent(s): 9f43980

h

Browse files

Files changed (2) hide show

.DS_Store +0 -0
server.py +212 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

server.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from fastapi import FastAPI, WebSocket, WebSocketDisconnect
 from fastapi.middleware.cors import CORSMiddleware
 import uvicorn
 import cv2
 import numpy as np
@@ -8,6 +9,9 @@ import json
 import logging
 import asyncio
 from concurrent.futures import ThreadPoolExecutor
 from services.single_tracker import SingleTracker
 from services.multi_tracker import MultiTracker
@@ -19,6 +23,24 @@ logger = logging.getLogger(__name__)
 # Executor for CPU-bound tasks
 executor = ThreadPoolExecutor(max_workers=1)
 app = FastAPI(title="AFS Tracking Backend")
 app.add_middleware(
@@ -43,8 +65,120 @@ def decode_binary_image(img_data: bytes):
         logger.error(f"Failed to decode image: {e}")
         return None
 @app.websocket("/ws")
 async def websocket_endpoint(websocket: WebSocket):
     await websocket.accept()
     logger.info("New WebSocket connection established.")
@@ -62,6 +196,40 @@ async def websocket_endpoint(websocket: WebSocket):
                         logger.info(f"Switching mode from {current_mode} to {payload['mode']}")
                         current_mode = payload["mode"]
                         await websocket.send_json({"type": "mode_ack", "mode": current_mode})
                 except json.JSONDecodeError:
                     logger.error("Invalid JSON received.")
                 continue
@@ -96,11 +264,55 @@ async def websocket_endpoint(websocket: WebSocket):
                 # Send results back to client
                 response_data["mode"] = current_mode
                 await websocket.send_json(response_data)
     except WebSocketDisconnect:
         logger.info("WebSocket client disconnected.")
     except Exception as e:
         logger.error(f"WebSocket error: {e}")
 if __name__ == "__main__":
     uvicorn.run("server:app", host="0.0.0.0", port=8000, reload=True)

 from fastapi import FastAPI, WebSocket, WebSocketDisconnect
 from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import StreamingResponse
 import uvicorn
 import cv2
 import numpy as np
 import logging
 import asyncio
 from concurrent.futures import ThreadPoolExecutor
+from datetime import datetime
+import threading
+import pyvirtualcam
 from services.single_tracker import SingleTracker
 from services.multi_tracker import MultiTracker
 # Executor for CPU-bound tasks
 executor = ThreadPoolExecutor(max_workers=1)
+# --- OBS and Recording State ---
+latest_obs_frame = None  # Store the latest JPEG encoded cropped frame for the OBS feed (deprecated by vcam)
+obs_frame_lock = threading.Lock()
+is_obs_active = False
+vcam = None # Virtual Camera reference
+is_recording = False
+video_writer = None
+recording_filename = ""
+# --- Center Stage State (EMA Smoothing) ---
+current_cx = 0.5
+current_cy = 0.5
+current_scale = 1.0
+# Configurable parameters for smooth panning
+SMOOTHING_FACTOR = 0.1  # Lower is smoother but slower (similar to Dart's TweenAnimation)
+TARGET_ASPECT_RATIO = 16.0 / 9.0  # Assuming output is meant to be 16:9
 app = FastAPI(title="AFS Tracking Backend")
 app.add_middleware(
         logger.error(f"Failed to decode image: {e}")
         return None
+def apply_center_stage_crop(frame, tracking_data):
+    """
+    Applies an exponential moving average (EMA) to smoothly pan and zoom
+    the frame based on the tracking target bounding box.
+    Returns the cropped frame.
+    """
+    global current_cx, current_cy, current_scale
+    h, w = frame.shape[:2]
+    # Defaults
+    target_cx = 0.5
+    target_cy = 0.5
+    target_scale = 1.0
+    # Calculate target state based on tracking data
+    boxes = tracking_data.get("boxes", [])
+    if tracking_data.get("mode") == "multi":
+        if "aggregate_box" in tracking_data:
+            ab = tracking_data["aggregate_box"]
+            box_cx = (ab["x1"] + ab["x2"]) / 2.0
+            box_cy = (ab["y1"] + ab["y2"]) / 2.0
+            box_w = ab["x2"] - ab["x1"]
+            box_h = ab["y2"] - ab["y1"]
+            target_cx = box_cx / w
+            target_cy = box_cy / h
+            # Target scale logic (from Dart): max dimension proportion * 1.5 margin
+            max_dim = max(box_w / w, box_h / h)
+            target_scale = 1.0 / (max_dim * 1.5)
+            # Clamp scale
+            target_scale = max(1.0, min(target_scale, 3.0))
+    else: # single
+        target_box = None
+        for b in boxes:
+            if b.get("is_target"):
+                target_box = b
+                break
+        if target_box:
+            box_cx = (target_box["x1"] + target_box["x2"]) / 2.0
+            box_cy = (target_box["y1"] + target_box["y2"]) / 2.0
+            box_w = target_box["x2"] - target_box["x1"]
+            box_h = target_box["y2"] - target_box["y1"]
+            target_cx = box_cx / w
+            target_cy = box_cy / h
+            max_dim = max(box_w / w, box_h / h)
+            target_scale = 1.0 / (max_dim * 2.0) # slightly tighter for single person
+            target_scale = max(1.0, min(target_scale, 3.0))
+    # Apply EMA smoothing
+    current_cx += (target_cx - current_cx) * SMOOTHING_FACTOR
+    current_cy += (target_cy - current_cy) * SMOOTHING_FACTOR
+    current_scale += (target_scale - current_scale) * SMOOTHING_FACTOR
+    # Calculate crop dimensions
+    # When scale is S, the crop width is w / S
+    crop_w = int(w / current_scale)
+    crop_h = int(h / current_scale)
+    # Enforce aspect ratio
+    # If crop_w / crop_h is not 16:9, adjust one to match
+    current_ar = crop_w / max(1, crop_h)
+    if current_ar > TARGET_ASPECT_RATIO:
+        # Too wide, shrink width
+        crop_w = int(crop_h * TARGET_ASPECT_RATIO)
+    else:
+        # Too tall, shrink height
+        crop_h = int(crop_w / TARGET_ASPECT_RATIO)
+    # Calculate top-left point of crop, clamping to frame boundaries
+    center_px_x = int(current_cx * w)
+    center_px_y = int(current_cy * h)
+    start_x = max(0, center_px_x - crop_w // 2)
+    start_y = max(0, center_px_y - crop_h // 2)
+    # Adjust if crop box goes out of bounds
+    if start_x + crop_w > w:
+        start_x = w - crop_w
+    if start_y + crop_h > h:
+        start_y = h - crop_h
+    # Crop
+    cropped = frame[start_y:start_y+crop_h, start_x:start_x+crop_w]
+    return cropped
+async def generate_obs_stream():
+    """Generator for the MJPEG stream used by OBS."""
+    global latest_obs_frame
+    while True:
+        with obs_frame_lock:
+            if latest_obs_frame is not None:
+                yield (b'--frame\r\n'
+                       b'Content-Type: image/jpeg\r\n\r\n' + latest_obs_frame + b'\r\n')
+            else:
+                # If no frame yet, yield a blank frame or sleep
+                await asyncio.sleep(0.1)
+                continue
+        # Use asyncio sleep to prevent blocking the event loop
+        await asyncio.sleep(0.033) # roughly 30 fps
+@app.get("/obs_feed")
+async def obs_feed():
+    """Endpoint for OBS Media Source to connect to."""
+    return StreamingResponse(generate_obs_stream(), media_type="multipart/x-mixed-replace; boundary=frame")
 @app.websocket("/ws")
 async def websocket_endpoint(websocket: WebSocket):
+    global is_recording, video_writer, recording_filename, latest_obs_frame, is_obs_active, vcam
     await websocket.accept()
     logger.info("New WebSocket connection established.")
                         logger.info(f"Switching mode from {current_mode} to {payload['mode']}")
                         current_mode = payload["mode"]
                         await websocket.send_json({"type": "mode_ack", "mode": current_mode})
+                    elif "command" in payload:
+                        # Handle recording commands
+                        command = payload["command"]
+                        if command == "start_recording":
+                            if not is_recording:
+                                is_recording = True
+                                recording_filename = f"capture_{datetime.now().strftime('%Y%m%d_%H%M%S')}.mp4"
+                                logger.info(f"Started recording to {recording_filename}")
+                                await websocket.send_json({"type": "recording_ack", "status": "started"})
+                        elif command == "stop_recording":
+                            if is_recording:
+                                is_recording = False
+                                if video_writer is not None:
+                                    video_writer.release()
+                                    video_writer = None
+                                logger.info(f"Stopped recording. File saved as {recording_filename}")
+                        elif command == "start_obs":
+                            if not is_obs_active:
+                                is_obs_active = True
+                                logger.info("Started OBS Virtual Camera stream")
+                                try:
+                                    if vcam is None:
+                                        vcam = pyvirtualcam.Camera(width=1280, height=720, fps=30)
+                                except Exception as e:
+                                    logger.error(f"Failed to start vcam: {e}")
+                                await websocket.send_json({"type": "obs_ack", "status": "started"})
+                        elif command == "stop_obs":
+                            if is_obs_active:
+                                is_obs_active = False
+                                logger.info("Stopped OBS Virtual Camera stream")
+                                if vcam is not None:
+                                    vcam.close()
+                                    vcam = None
+                                await websocket.send_json({"type": "obs_ack", "status": "stopped"})
                 except json.JSONDecodeError:
                     logger.error("Invalid JSON received.")
                 continue
                 # Send results back to client
                 response_data["mode"] = current_mode
                 await websocket.send_json(response_data)
+                # Apply Crop and Handle OBS / Recording
+                try:
+                    cropped_frame = apply_center_stage_crop(frame, response_data)
+                    # 1. Update OBS Virtual Camera
+                    if is_obs_active and vcam is not None:
+                        try:
+                            # Virtual cameras generally strict size requirements
+                            cam_frame = cv2.resize(cropped_frame, (vcam.width, vcam.height))
+                            cam_frame = cv2.cvtColor(cam_frame, cv2.COLOR_BGR2RGB)
+                            vcam.send(cam_frame)
+                        except Exception as e:
+                            logger.error(f"Failed to push vcam frame: {e}")
+                    # 2. Update Recording Output
+                    if is_recording:
+                        h, w = cropped_frame.shape[:2]
+                        if video_writer is None:
+                            # Initialize writer with the exact dimensions of the FIRST cropped frame
+                            fourcc = cv2.VideoWriter_fourcc(*'avc1')
+                            video_writer = cv2.VideoWriter(recording_filename, fourcc, 5.0, (w, h))
+                        # Ensure we try to resize cleanly if aspect ratio forces slight off-by-one errors over time
+                        if video_writer is not None:
+                            target_w = int(video_writer.get(cv2.CAP_PROP_FRAME_WIDTH))
+                            target_h = int(video_writer.get(cv2.CAP_PROP_FRAME_HEIGHT))
+                            if (w, h) != (target_w, target_h):
+                                cropped_frame = cv2.resize(cropped_frame, (target_w, target_h))
+                            video_writer.write(cropped_frame)
+                except Exception as e:
+                    logger.error(f"Error handling post-process crops: {e}")
     except WebSocketDisconnect:
         logger.info("WebSocket client disconnected.")
     except Exception as e:
         logger.error(f"WebSocket error: {e}")
+    finally:
+        # Cleanup Virtual Camera
+        if vcam is not None:
+            vcam.close()
+            vcam = None
+        is_obs_active = False
+        # Cleanup Recording
+        if video_writer is not None:
+            video_writer.release()
+            video_writer = None
+        is_recording = False
 if __name__ == "__main__":
     uvicorn.run("server:app", host="0.0.0.0", port=8000, reload=True)