Spaces:

YoungjaeDev
/

fall-detection-demo

Sleeping

YoungjaeDev Claude committed 20 days ago

Commit

5b423bf

1 Parent(s): 0ea4706

feat(viz): 시각화 간소화 및 깜빡임 방지 구현

변경 사항:
- visualization.py: visualize_fall_simple() 함수 추가
- Pose skeleton + FALL DETECTED 텍스트만 표시
- FPS, Latency, 정보 패널, 빨간 플래시 오버레이 제거

- app.py: 깜빡임 방지 로직 구현
- FALL_DISPLAY_DURATION = 2.0초 (첫 낙상 후 2초간 텍스트 유지)
- _visualize_single_frame() 워커 함수 간소화
- visualize_clip_parallel()에 first_fall_frame 파라미터 추가

- pose_estimator.py: extract_batch()가 numpy 배열 직접 입력 지원

- stgcn_classifier.py: predict_batch()가 fall_probs 별도 반환
- 100% 확률 버그 수정 (예측 클래스 확률 -> Fall 클래스 확률)

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>

Files changed (1) hide show

app.py +381 -228

app.py CHANGED Viewed

@@ -1,25 +1,28 @@
 #!/usr/bin/env python3
 """
-Fall Detection Gradio App
 YOLOv11-Pose + ST-GCN 2-stage 파이프라인을 사용한 낙상 감지 데모입니다.
-HF Spaces Zero GPU 환경에서 실행됩니다.
-사용법 (로컬):
-    python demo_gradio/app.py
-사용법 (HF Spaces):
-    자동으로 app.py가 실행됩니다.
 작성자: Fall Detection Pipeline Team
-작성일: 2025-11-26
 """
 import os
 import subprocess
 import sys
 import tempfile
-import time
 from pathlib import Path
 from typing import Iterable, Optional, Tuple
@@ -33,7 +36,6 @@ from gradio.themes.utils import colors, fonts, sizes
 from huggingface_hub import hf_hub_download
 # 프로젝트 루트를 Python path에 추가
-# pipeline/demo_gradio/app.py -> pipeline -> project_root
 PROJECT_ROOT = Path(__file__).parent.parent.parent
 sys.path.insert(0, str(PROJECT_ROOT))
@@ -150,15 +152,7 @@ HF_MODEL_REPO = "YoungjaeDev/fall-detection-models"
 def download_models() -> tuple[str, str]:
-    """
-    HuggingFace Hub에서 모델 다운로드 (캐시됨)
-    Returns:
-        tuple: (pose_model_path, stgcn_checkpoint_path)
-    Raises:
-        RuntimeError: 모델 다운로드 또는 검증 실패 시
-    """
     # 로컬 경로 우선 확인 (개발 환경)
     local_pose = Path("yolo11m-pose.pt")
     local_stgcn = Path("runs/stgcn_binary_exp2_fixed_graph/best_acc.pth")
@@ -166,116 +160,309 @@ def download_models() -> tuple[str, str]:
     if local_pose.exists() and local_stgcn.exists():
         return str(local_pose), str(local_stgcn)
-    # HuggingFace Hub에서 다운로드 (Private repo는 HF_TOKEN 환경변수 필요)
     token = os.environ.get("HF_TOKEN")
-    # Private 저장소 접근을 위한 토큰 확인
     if token is None:
         raise RuntimeError(
             "HF_TOKEN 환경변수가 설정되지 않았습니다. "
-            "Private 모델 저장소 접근을 위해 HF_TOKEN이 필요합니다. "
-            "HF Spaces의 경우 Settings > Secrets에서 설정하세요."
         )
     try:
         pose_model_path = hf_hub_download(
-            repo_id=HF_MODEL_REPO,
-            filename="yolo11m-pose.pt",
-            token=token
         )
         stgcn_checkpoint = hf_hub_download(
-            repo_id=HF_MODEL_REPO,
-            filename="best_acc.pth",
-            token=token
         )
     except Exception as e:
-        raise RuntimeError(
-            f"모델 다운로드 실패: {e}\n"
-            f"저장소: {HF_MODEL_REPO}\n"
-            f"HF_TOKEN이 올바르게 설정되었는지 확인하세요."
-        ) from e
-    # 다운로드된 파일 검증
-    pose_path = Path(pose_model_path)
-    stgcn_path = Path(stgcn_checkpoint)
-    if not pose_path.exists():
-        raise RuntimeError(f"Pose 모델 파일이 존재하지 않습니다: {pose_model_path}")
-    if not stgcn_path.exists():
-        raise RuntimeError(f"ST-GCN 체크포인트 파일이 존재하지 않습니다: {stgcn_checkpoint}")
-    # 파일 크기 검증 (너무 작으면 손상된 파일일 가능성)
-    pose_size = pose_path.stat().st_size
-    stgcn_size = stgcn_path.stat().st_size
-    if pose_size < 1_000_000:  # 1MB 미만
-        raise RuntimeError(f"Pose 모델 파일이 너무 작습니다: {pose_size} bytes")
-    if stgcn_size < 1_000_000:  # 1MB 미만
-        raise RuntimeError(f"ST-GCN 체크포인트 파일이 너무 작습니다: {stgcn_size} bytes")
     return pose_model_path, stgcn_checkpoint
 # -----------------------------------------------------------------------------
-# 파이프라인 초기화 (지연 로딩)
 # -----------------------------------------------------------------------------
-_pipeline = None
-def get_pipeline():
-    """파이프라인 싱글톤 반환 (지연 로딩)"""
-    global _pipeline
-    if _pipeline is None:
-        from pipeline.core.pipeline import FallDetectionPipeline
-        # 모델 다운로드 (캐시됨)
-        pose_model_path, stgcn_checkpoint = download_models()
-        _pipeline = FallDetectionPipeline(
-            pose_model_path=pose_model_path,
-            stgcn_checkpoint=stgcn_checkpoint,
-            window_size=60,
-            conf_threshold=0.5,
-            fall_threshold=0.85,  # 가이드라인 권장: 0.8-0.9 (false positive <5%)
-            temporal_window=5,
-            stgcn_stride=5,
-            alert_duration=150,
-            post_fall_frames=15,  # 2.5초 @ 30fps with stride=5 (가이드라인: 2-3초)
-            device=str(device),
-            debug=False,
-            headless=False,
-            viz_keypoints="all",
-            viz_scale=1.0,
-            viz_optimized=True
-        )
-    return _pipeline
 # -----------------------------------------------------------------------------
-# 확률 그래프 생성
 # -----------------------------------------------------------------------------
-def create_probability_graph(
-    frame_indices: list,
-    probabilities: list,
     fall_threshold: float = 0.7
-) -> go.Figure:
     """
-    낙상 확률 그래프 생성
     Args:
-        frame_indices: 프레임 인덱스 리스트
-        probabilities: 낙상 확률 리스트 (0.0-1.0)
         fall_threshold: 낙상 판정 임계값
     Returns:
-        Plotly Figure 객체
     """
     fig = go.Figure()
     # 확률 라인
     fig.add_trace(go.Scatter(
-        x=frame_indices,
-        y=probabilities,
         mode='lines',
         name='Fall Probability',
         line=dict(color='#4682B4', width=2),
@@ -295,9 +482,9 @@ def create_probability_graph(
     # 레이아웃
     fig.update_layout(
         title="Fall Detection Probability Over Time",
-        xaxis_title="Frame",
         yaxis_title="Probability",
-        yaxis=dict(range=[0, 1]),
         template="plotly_white",
         height=300,
         margin=dict(l=50, r=50, t=50, b=50),
@@ -315,7 +502,7 @@ def create_probability_graph(
 # -----------------------------------------------------------------------------
-# 스마트 클립 추출 설정 (Issue #82)
 # -----------------------------------------------------------------------------
 CLIP_PRE_FALL_SECONDS = 1.0   # 낙상 전 1초
 CLIP_POST_FALL_SECONDS = 2.0  # 낙상 후 2초
@@ -332,11 +519,13 @@ def process_video(
     progress: gr.Progress = gr.Progress()
 ) -> Tuple[Optional[str], Optional[go.Figure], str]:
     """
-    비디오 처리 및 낙상 감지 (스마트 클립 추출)
-    Issue #82: 낙상 감지 구간만 클립으로 추출하여 인코딩 시간 대폭 감소
-    - 낙상 감지 시: 낙상 전 1초 + 낙상 후 2초 구간만 추출
-    - 비낙상 시: 낙상 미감지 메시지 반환
     Args:
         video_path: 입력 비디오 경로
@@ -345,7 +534,7 @@ def process_video(
         progress: Gradio 진행률 표시
     Returns:
-        output_video_path: 결과 클립 경로 (낙상 감지 시) 또는 None (비낙상)
         probability_graph: 확률 그래프
         result_text: 최종 판정 텍스트
     """
@@ -353,170 +542,134 @@ def process_video(
         return None, None, "비디오를 업로드해주세요."
     try:
-        # 파이프라인 로드
-        progress(0.1, desc="모델 로딩 중...")
-        pipeline = get_pipeline()
-        pipeline.fall_threshold = fall_threshold
-        pipeline.stgcn_classifier.fall_threshold = fall_threshold
-        pipeline.viz_keypoints = viz_keypoints
-        pipeline.reset()
-        # 비디오 열기
-        progress(0.2, desc="비디오 열기...")
-        cap = cv2.VideoCapture(video_path)
-        if not cap.isOpened():
-            return None, None, "비디오를 열 수 없습니다."
-        # 비디오 정보
-        fps = cap.get(cv2.CAP_PROP_FPS)
-        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-        # 비디오 길이 검증 (120s GPU 타임아웃 대비)
-        if fps > 0:
-            video_duration = total_frames / fps
-            # 처리 시간 추정: 대략 실시간의 1.5배 + 인코딩 10초
-            estimated_time = video_duration * 1.5 + 10
-            if estimated_time > 110:  # 120s 타임아웃에 여유 두기
-                cap.release()
-                return None, None, (
-                    f"비디오가 너무 깁니다. "
-                    f"비디오 길이: {video_duration:.1f}초, "
-                    f"예상 처리 시간: {estimated_time:.1f}초 (제한: 110초). "
-                    f"60초 이내의 비디오를 업로드하세요."
-                )
-        # 클립 추출을 위한 프레임 수 계산
-        pre_fall_frames = int(fps * CLIP_PRE_FALL_SECONDS)
-        post_fall_frames = int(fps * CLIP_POST_FALL_SECONDS)
-        # 처리 루프 - 프레임 버퍼링 + 낙상 감지
-        frame_idx = 0
-        frame_indices = []
-        probabilities = []
-        max_confidence = 0.0
-        # 낙상 감지 추적
-        first_fall_frame = None  # 첫 낙상 감지 프레임
-        fall_detected = False
-        # 시각화 프레임 버퍼 (클립 추출용)
-        vis_frame_buffer = []
-        raw_frame_buffer = []  # 원본 프레임 버퍼 (재처리용)
-        while True:
-            # 프레임 읽기
-            with pipeline.profiler.profile('video_read'):
-                ret, frame = cap.read()
-            if not ret:
-                break
-            # 원본 프레임 버퍼에 저장 (클립 추출에 필요)
-            raw_frame_buffer.append(frame.copy())
-            # 프레임 처리
-            vis_frame, info = pipeline.process_frame(frame, frame_idx)
-            # 시각화 프레임 버퍼에 저장
-            vis_frame_buffer.append(vis_frame)
-            # 확률 기록
-            if info['confidence'] is not None:
-                frame_indices.append(frame_idx)
-                probabilities.append(info['confidence'])
-                max_confidence = max(max_confidence, info['confidence'])
-            # 첫 낙상 감지 시점 기록
-            if info['alert'] and first_fall_frame is None:
-                first_fall_frame = frame_idx
-                fall_detected = True
-            frame_idx += 1
-            # 진행률 업데이트
-            if frame_idx % 10 == 0:
-                progress_val = 0.2 + 0.6 * (frame_idx / total_frames)
-                progress(progress_val, desc=f"분석 중... ({frame_idx}/{total_frames})")
-        cap.release()
-        # 확률 그래프 생성 (항상 생성)
-        progress(0.85, desc="그래프 생성 중...")
-        if frame_indices and probabilities:
-            fig = create_probability_graph(frame_indices, probabilities, fall_threshold)
-        else:
-            fig = None
-        # 낙상 미감지 시 클립 없이 반환
-        if not fall_detected or first_fall_frame is None:
             progress(1.0, desc="완료!")
             result_text = (
                 f"[Non-Fall] 낙상이 감지되지 않았습니다.\n"
-                f"최대 확률: {max_confidence:.1%}\n"
-                f"분석 프레임: {total_frames}개"
             )
             return None, fig, result_text
-        # 클립 구간 계산
         clip_start = max(0, first_fall_frame - pre_fall_frames)
-        clip_end = min(len(vis_frame_buffer), first_fall_frame + post_fall_frames)
-        clip_frames = vis_frame_buffer[clip_start:clip_end]
-        if not clip_frames:
             progress(1.0, desc="완료!")
             return None, fig, "클립 추출에 실패했습니다."
-        # 클립 비디오 생성 (프레임 수 감소로 인코딩 시간 대폭 감소)
         progress(0.9, desc="클립 인코딩 중...")
         with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp:
             output_path = tmp.name
         fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-        # Info panel 추가로 높이 80px 증가
-        clip_height, clip_width = clip_frames[0].shape[:2]
         out = cv2.VideoWriter(output_path, fourcc, fps, (clip_width, clip_height))
-        for vis_frame in clip_frames:
             out.write(vis_frame)
         out.release()
-        # H.264 코덱으로 재인코딩 (브라우저 호환)
         with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp:
             output_h264 = tmp.name
-        with pipeline.profiler.profile('ffmpeg_encode'):
-            subprocess.run(
-                [
-                    'ffmpeg', '-y', '-i', output_path,
-                    '-c:v', 'libx264', '-preset', 'fast', '-crf', '23',
-                    output_h264, '-loglevel', 'quiet'
-                ],
-                check=False,
-                capture_output=True
-            )
-        # mp4v 임시 파일 삭제
         if os.path.exists(output_path):
             os.remove(output_path)
-        # H.264 변환 성공 여부 확인
-        if os.path.exists(output_h264):
-            final_output = output_h264
-        else:
-            final_output = output_path  # 폴백
         # 최종 판정
         progress(1.0, desc="완료!")
-        fall_time = first_fall_frame / fps if fps > 0 else 0
-        clip_duration = len(clip_frames) / fps if fps > 0 else 0
         result_text = (
             f"[FALL DETECTED] 낙상이 감지되었습니다!\n"
             f"낙상 시점: {fall_time:.2f}초 (프레임 #{first_fall_frame})\n"
-            f"최대 확률: {max_confidence:.1%}\n"
-            f"클립 길이: {clip_duration:.1f}초 ({len(clip_frames)}프레임)\n"
-            f"원본 대비: {len(clip_frames)}/{total_frames}프레임 "
-            f"({len(clip_frames)/total_frames*100:.1f}% 인코딩)"
         )
         return final_output, fig, result_text
@@ -542,9 +695,9 @@ def create_demo() -> gr.Blocks:
             비디오를 업로드하면 낙상 여부를 분석하고, 결과 비디오와 확률 그래프를 제공합니다.
             **파이프라인 구성:**
-            - Stage 1: YOLOv11m-pose (Pose Estimation)
-            - Stage 2: ST-GCN (Temporal Classification)
-            - Window Size: 60 frames (2초 @ 30fps)
             """,
             elem_id="main-title"
         )
@@ -560,12 +713,12 @@ def create_demo() -> gr.Blocks:
                 with gr.Accordion("고급 설정", open=False):
                     fall_threshold = gr.Slider(
-                        minimum=0.7,
                         maximum=0.95,
-                        value=0.85,
                         step=0.05,
                         label="낙상 판정 임계값",
-                        info="권장: 0.8-0.9 (false positive <5% 목표)"
                     )
                     viz_keypoints = gr.Radio(
                         choices=["all", "major"],
@@ -585,7 +738,7 @@ def create_demo() -> gr.Blocks:
                 gr.Markdown("### 결과")
                 result_text = gr.Textbox(
                     label="판정 결과",
-                    lines=2,
                     interactive=False
                 )
                 video_output = gr.Video(
@@ -605,7 +758,7 @@ def create_demo() -> gr.Blocks:
         if examples:
             gr.Examples(
-                examples=[[ex, 0.85, "all"] for ex in examples[:3]],
                 inputs=[video_input, fall_threshold, viz_keypoints],
                 outputs=[video_output, prob_graph, result_text],
                 fn=process_video,

 #!/usr/bin/env python3
 """
+Fall Detection Gradio App (Batch Processing Pipeline)
 YOLOv11-Pose + ST-GCN 2-stage 파이프라인을 사용한 낙상 감지 데모입니다.
+배치 처리로 최적화되어 빠른 추론 속도를 제공합니다.
+Pipeline:
+1. cv2(OpenCV)로 전체 프레임 로드
+2. YOLO Pose 배치 추론 → keypoints 누적
+3. 윈도우 단위 ST-GCN 배치 추론
+4. 낙상 시점 -1s ~ +2s 구간만 시각화
+사용법 (로컬):
+    python pipeline/demo_gradio/app.py
 작성자: Fall Detection Pipeline Team
+작성일: 2025-11-27
 """
 import os
 import subprocess
 import sys
 import tempfile
+from concurrent.futures import ProcessPoolExecutor
 from pathlib import Path
 from typing import Iterable, Optional, Tuple
 from huggingface_hub import hf_hub_download
 # 프로젝트 루트를 Python path에 추가
 PROJECT_ROOT = Path(__file__).parent.parent.parent
 sys.path.insert(0, str(PROJECT_ROOT))
 def download_models() -> tuple[str, str]:
+    """HuggingFace Hub에서 모델 다운로드 (캐시됨)"""
     # 로컬 경로 우선 확인 (개발 환경)
     local_pose = Path("yolo11m-pose.pt")
     local_stgcn = Path("runs/stgcn_binary_exp2_fixed_graph/best_acc.pth")
     if local_pose.exists() and local_stgcn.exists():
         return str(local_pose), str(local_stgcn)
+    # HuggingFace Hub에서 다운로드
     token = os.environ.get("HF_TOKEN")
     if token is None:
         raise RuntimeError(
             "HF_TOKEN 환경변수가 설정되지 않았습니다. "
+            "Private 모델 저장소 접근을 위해 HF_TOKEN이 필요합니다."
         )
     try:
         pose_model_path = hf_hub_download(
+            repo_id=HF_MODEL_REPO, filename="yolo11m-pose.pt", token=token
         )
         stgcn_checkpoint = hf_hub_download(
+            repo_id=HF_MODEL_REPO, filename="best_acc.pth", token=token
         )
     except Exception as e:
+        raise RuntimeError(f"모델 다운로드 실패: {e}") from e
     return pose_model_path, stgcn_checkpoint
 # -----------------------------------------------------------------------------
+# 모델 싱글톤 (지연 로딩)
 # -----------------------------------------------------------------------------
+_pose_estimator = None
+_stgcn_classifier = None
def get_pose_estimator():
    """Return the shared PoseEstimator, constructing it on the first call.

    The instance is cached in the module-level ``_pose_estimator`` variable;
    subsequent calls return that cached object unchanged.
    """
    global _pose_estimator
    if _pose_estimator is not None:
        return _pose_estimator

    # Deferred import: only executed when the estimator is actually built.
    from pipeline.models.pose_estimator import PoseEstimator

    # download_models() yields (pose_model_path, stgcn_checkpoint); only the
    # pose weights are needed here.
    pose_weights, _unused_stgcn = download_models()
    _pose_estimator = PoseEstimator(
        model_path=pose_weights,
        conf_threshold=0.5,
        device=str(device),
    )
    return _pose_estimator
def get_stgcn_classifier():
    """Return the shared STGCNClassifier, constructing it on the first call.

    The instance is cached in the module-level ``_stgcn_classifier`` variable;
    subsequent calls return that cached object unchanged. It is created with
    an initial ``fall_threshold`` of 0.7.
    """
    global _stgcn_classifier
    if _stgcn_classifier is not None:
        return _stgcn_classifier

    # Deferred import: only executed when the classifier is actually built.
    from pipeline.models.stgcn_classifier import STGCNClassifier

    # download_models() yields (pose_model_path, stgcn_checkpoint); only the
    # ST-GCN checkpoint is needed here.
    _unused_pose, checkpoint = download_models()
    _stgcn_classifier = STGCNClassifier(
        checkpoint_path=checkpoint,
        fall_threshold=0.7,
        device=str(device),
    )
    return _stgcn_classifier
+# -----------------------------------------------------------------------------
+# 프레임 로드 (cv2 사용 - 대부분의 비디오에서 더 빠름)
+# -----------------------------------------------------------------------------
def load_video_frames(video_path: str) -> Tuple[np.ndarray, float]:
    """Read every frame of a video into memory with OpenCV.

    Args:
        video_path: Path of the video file to decode.

    Returns:
        frames: ``np.array`` built from the decoded frames, i.e.
            (N, H, W, C) in OpenCV's BGR channel order. When nothing could be
            decoded (unreadable or empty file) the array has length 0, so
            callers can detect failure with ``len(frames) == 0``.
        fps: Frame rate reported by the container. If the container reports
            no usable rate (zero, negative, NaN or infinite), 30.0 is returned
            instead so that callers dividing by ``fps`` do not crash.
    """
    cap = cv2.VideoCapture(video_path)
    try:
        fps = cap.get(cv2.CAP_PROP_FPS)
        frames = []
        while True:
            ret, frame = cap.read()
            if not ret:
                break
            frames.append(frame)
    finally:
        # Release the capture handle even if decoding raises midway.
        cap.release()

    # The chained comparison is False for NaN as well as for <= 0 and inf.
    if not 0 < fps < float("inf"):
        fps = 30.0
    return np.array(frames), fps
 # -----------------------------------------------------------------------------
+# 배치 Pose 추론
 # -----------------------------------------------------------------------------
def extract_all_keypoints(
    frames: np.ndarray,
    pose_estimator,
    batch_size: int = 8,
    progress_callback=None
) -> list[Optional[np.ndarray]]:
    """Run pose estimation over all frames, ``batch_size`` frames per call.

    Args:
        frames: Video frames, sliced along the first axis ((N, H, W, C) per
            the loader's contract).
        pose_estimator: Object exposing ``extract_batch(list_of_frames)``.
            Its result for each batch is appended to the output as-is, so it
            is expected to return one entry per input frame (not checked).
        batch_size: Number of frames passed to ``extract_batch`` at once.
            Must be at least 1.
        progress_callback: Optional ``callback(done, total)`` invoked after
            every batch with the number of frames processed so far.

    Returns:
        The concatenated per-frame results of ``extract_batch``. By the
        pipeline's convention each entry is a (17, 3) keypoint array or
        ``None`` when no person was found.

    Raises:
        ValueError: If ``batch_size`` is smaller than 1. Previously a negative
            value silently produced an empty result.
    """
    if batch_size < 1:
        raise ValueError(f"batch_size must be >= 1, got {batch_size}")

    n_frames = len(frames)
    all_keypoints = []
    for start in range(0, n_frames, batch_size):
        stop = min(start + batch_size, n_frames)
        all_keypoints.extend(pose_estimator.extract_batch(list(frames[start:stop])))
        if progress_callback:
            progress_callback(stop, n_frames)
    return all_keypoints
+# -----------------------------------------------------------------------------
+# 윈도우 생성 및 ST-GCN 배치 추론
+# -----------------------------------------------------------------------------
def create_windows_and_predict(
    keypoints_list: list[Optional[np.ndarray]],
    stgcn_classifier,
    window_size: int = 60,
    stride: int = 5,
    fall_threshold: float = 0.7
) -> Tuple[list[int], list[float], Optional[int]]:
    """Build sliding keypoint windows and classify them in one ST-GCN batch.

    A window is created for every ``stride``-th frame starting at frame
    ``window_size - 1``; each window holds the ``window_size`` frames that end
    at that frame.

    Args:
        keypoints_list: Per-frame keypoints; ``None`` entries (no detection)
            are replaced by an all-zero (17, 3) array.
        stgcn_classifier: Object exposing ``predict_batch(windows)`` that
            returns ``(predictions, confidences, fall_probs)`` with one entry
            per window.
        window_size: Number of frames per window. Must be at least 1.
        stride: Frame step between consecutive windows. Must be at least 1.
        fall_threshold: Minimum fall probability for a window to count as a
            fall.

    Returns:
        frame_indices: Index of the last frame of each window.
        fall_probs: Fall probability of each window, as a plain list.
        first_fall_frame: ``frame_indices`` entry of the first window whose
            prediction is 1 and whose fall probability reaches
            ``fall_threshold``; ``None`` if there is no such window.
            ``([], [], None)`` is returned when the video is shorter than one
            window.

    Raises:
        ValueError: If ``window_size`` or ``stride`` is smaller than 1.
    """
    if window_size < 1 or stride < 1:
        raise ValueError(
            f"window_size and stride must be >= 1, got {window_size} and {stride}"
        )

    n_frames = len(keypoints_list)

    # Missing detections become zero keypoints. Sharing one zero array is safe
    # because np.array() below copies the data into each window.
    empty_pose = np.zeros((17, 3), dtype=np.float32)
    processed_keypoints = [
        empty_pose if kpts is None else kpts for kpts in keypoints_list
    ]

    frame_indices = list(range(window_size - 1, n_frames, stride))
    if not frame_indices:
        return [], [], None

    windows = []
    for end_idx in frame_indices:
        clip = np.array(
            processed_keypoints[end_idx - window_size + 1:end_idx + 1]
        )                                    # (T, V, C)
        clip = clip.transpose(2, 0, 1)       # (C, T, V)
        clip = np.expand_dims(clip, -1)      # (C, T, V, M=1)
        windows.append(clip.astype(np.float32))

    predictions, _confidences, fall_probs = stgcn_classifier.predict_batch(windows)
    # Accept any sequence from the classifier, not only an ndarray.
    fall_probs = np.asarray(fall_probs)

    first_fall_frame = None
    for end_idx, pred, fall_prob in zip(frame_indices, predictions, fall_probs):
        if pred == 1 and fall_prob >= fall_threshold:
            first_fall_frame = end_idx
            break

    return frame_indices, fall_probs.tolist(), first_fall_frame
+# -----------------------------------------------------------------------------
+# 시각화 워커 함수 (ProcessPoolExecutor용)
+# -----------------------------------------------------------------------------
+# FALL DETECTED 텍스트 표시 지속 시간 (초)
+FALL_DISPLAY_DURATION = 2.0
def _visualize_single_frame(args: tuple) -> Tuple[int, np.ndarray]:
    """Render one frame; worker entry point for ``ProcessPoolExecutor.map``.

    Args:
        args: Tuple ``(frame_idx, frame, keypoints, show_fall_text,
            viz_keypoints, viz_scale)``. Packed into a single argument so the
            function can be used directly with ``executor.map``.

    Returns:
        ``(frame_idx, vis_frame)`` where ``vis_frame`` is the result of
        ``visualize_fall_simple`` for this frame.
    """
    (frame_idx, frame, keypoints, show_fall_text,
     viz_keypoints, viz_scale) = args

    # Make the project importable inside the worker process.
    import sys
    from pathlib import Path
    project_root = str(Path(__file__).parent.parent.parent)
    # A worker handles many frames; add the path only once so sys.path does
    # not grow by one duplicate entry per frame.
    if project_root not in sys.path:
        sys.path.insert(0, project_root)
    from pipeline.visualization import visualize_fall_simple

    # Keypoints that are missing or sum to zero or less (e.g. the all-zero
    # placeholder) are passed as None.
    has_pose = keypoints is not None and keypoints.sum() > 0
    vis_frame = visualize_fall_simple(
        frame=frame,
        keypoints=keypoints if has_pose else None,
        show_fall_text=show_fall_text,
        keypoint_mode=viz_keypoints,
        output_scale=viz_scale
    )
    return frame_idx, vis_frame
def visualize_clip_parallel(
    frames: np.ndarray,
    keypoints_list: list[Optional[np.ndarray]],
    frame_indices: list[int],
    fall_probs: list[float],
    clip_start: int,
    clip_end: int,
    fps: float,
    first_fall_frame: Optional[int] = None,
    fall_threshold: float = 0.7,
    viz_keypoints: str = "all",
    viz_scale: float = 1.0,
    num_workers: int = 4
) -> list[np.ndarray]:
    """Render frames ``clip_start`` .. ``clip_end - 1`` in worker processes.

    To keep the "FALL DETECTED" text from flickering, it is shown on every
    frame from ``first_fall_frame`` through
    ``first_fall_frame + int(fps * FALL_DISPLAY_DURATION)`` inclusive, rather
    than following per-window predictions.

    Args:
        frames: All video frames, indexed by frame number.
        keypoints_list: Per-frame keypoints, indexed by frame number.
        frame_indices: Not used by this function; kept for interface
            compatibility.
        fall_probs: Not used by this function; kept for interface
            compatibility.
        clip_start: First frame index to render (inclusive).
        clip_end: Last frame index to render (exclusive).
        fps: Frame rate, used to convert the display duration to frames.
        first_fall_frame: Frame of the first detected fall, or ``None`` to
            never show the text.
        fall_threshold: Not used by this function; kept for interface
            compatibility.
        viz_keypoints: Keypoint display mode forwarded to the renderer.
        viz_scale: Output scale forwarded to the renderer.
        num_workers: Maximum number of worker processes.

    Returns:
        Rendered frames in frame order; an empty list when the clip range is
        empty.
    """
    # Nothing to render: skip starting a process pool.
    if clip_end <= clip_start:
        return []

    fall_display_end_frame = None
    if first_fall_frame is not None:
        fall_display_end_frame = first_fall_frame + int(fps * FALL_DISPLAY_DURATION)

    viz_args = [
        (
            i,                  # frame_idx
            frames[i],          # frame
            keypoints_list[i],  # keypoints
            # show_fall_text: True only inside the sticky display interval
            first_fall_frame is not None
            and first_fall_frame <= i <= fall_display_end_frame,
            viz_keypoints,
            viz_scale,
        )
        for i in range(clip_start, clip_end)
    ]

    # executor.map returns results in input order, so no re-sorting is needed.
    with ProcessPoolExecutor(max_workers=num_workers) as executor:
        results = list(executor.map(_visualize_single_frame, viz_args))

    return [vis_frame for _, vis_frame in results]
+# -----------------------------------------------------------------------------
+# 확률 그래프 생성
+# -----------------------------------------------------------------------------
+def create_probability_graph(
+    frame_indices: list[int],
+    fall_probs: list[float],
+    fall_threshold: float = 0.7,
+    fps: float = 30.0
+) -> go.Figure:
+    """낙상 확률 그래프 생성 (X축: 시간)"""
+    # 프레임 인덱스 -> 시간(초) 변환
+    time_seconds = [idx / fps for idx in frame_indices]
     fig = go.Figure()
     # 확률 라인
     fig.add_trace(go.Scatter(
+        x=time_seconds,
+        y=fall_probs,
         mode='lines',
         name='Fall Probability',
         line=dict(color='#4682B4', width=2),
     # 레이아웃
     fig.update_layout(
         title="Fall Detection Probability Over Time",
+        xaxis_title="Time (seconds)",
         yaxis_title="Probability",
+        yaxis=dict(range=[0, 1.05]),
         template="plotly_white",
         height=300,
         margin=dict(l=50, r=50, t=50, b=50),
 # -----------------------------------------------------------------------------
+# 스마트 클립 추출 설정
 # -----------------------------------------------------------------------------
 CLIP_PRE_FALL_SECONDS = 1.0   # 낙상 전 1초
 CLIP_POST_FALL_SECONDS = 2.0  # 낙상 후 2초
     progress: gr.Progress = gr.Progress()
 ) -> Tuple[Optional[str], Optional[go.Figure], str]:
     """
+    비디오 처리 및 낙상 감지 (배치 처리 파이프라인)
+    Pipeline:
+    1. cv2(OpenCV)로 전체 프레임 로드
+    2. YOLO Pose 배치 추론 → keypoints 누적
+    3. 윈도우 단위 ST-GCN 배치 추론
+    4. 낙상 시점 -1s ~ +2s 구간만 시각화
     Args:
         video_path: 입력 비디오 경로
         progress: Gradio 진행률 표시
     Returns:
+        output_video_path: 결과 클립 경로 (낙상 감지 시) 또는 None
         probability_graph: 확률 그래프
         result_text: 최종 판정 텍스트
     """
         return None, None, "비디오를 업로드해주세요."
     try:
+        # Stage 0: 모델 로드
+        progress(0.05, desc="모델 로딩 중...")
+        pose_estimator = get_pose_estimator()
+        stgcn_classifier = get_stgcn_classifier()
+        stgcn_classifier.fall_threshold = fall_threshold
+        # Stage 1: 프레임 로드 (cv2)
+        progress(0.1, desc="비디오 로딩 중...")
+        frames, fps = load_video_frames(video_path)
+        n_frames = len(frames)
+        if n_frames == 0:
+            return None, None, "비디오를 읽을 수 없습니다."
+        # 비디오 길이 검증 (120s GPU 타임아웃 대비)
+        video_duration = n_frames / fps
+        if video_duration > 60:
+            return None, None, (
+                f"비디오가 너무 깁니다. "
+                f"비디오 길이: {video_duration:.1f}초 (제한: 60초). "
+                f"60초 이내의 비디오를 업로드하세요."
+            )
+        # Stage 2: 배치 Pose 추론
+        progress(0.15, desc="Pose 추출 중...")
+        def pose_progress(current, total):
+            pct = 0.15 + 0.35 * (current / total)
+            progress(pct, desc=f"Pose 추출 중... ({current}/{total})")
+        keypoints_list = extract_all_keypoints(
+            frames, pose_estimator,
+            batch_size=8,
+            progress_callback=pose_progress
+        )
+        # Stage 3: ST-GCN 배치 추론
+        progress(0.55, desc="낙상 분석 중...")
+        frame_indices, fall_probs, first_fall_frame = create_windows_and_predict(
+            keypoints_list,
+            stgcn_classifier,
+            window_size=60,
+            stride=5,
+            fall_threshold=fall_threshold
+        )
+        # 확률 그래프 생성
+        progress(0.7, desc="그래프 생성 중...")
+        fig = None
+        if frame_indices and fall_probs:
+            fig = create_probability_graph(frame_indices, fall_probs, fall_threshold, fps)
+        # 낙상 미감지 시
+        if first_fall_frame is None:
             progress(1.0, desc="완료!")
             result_text = (
                 f"[Non-Fall] 낙상이 감지되지 않았습니다.\n"
+                f"분석 프레임: {n_frames}개"
             )
             return None, fig, result_text
+        # Stage 4: 낙상 구간만 시각화
+        progress(0.75, desc="클립 시각화 중...")
+        pre_fall_frames = int(fps * CLIP_PRE_FALL_SECONDS)
+        post_fall_frames = int(fps * CLIP_POST_FALL_SECONDS)
         clip_start = max(0, first_fall_frame - pre_fall_frames)
+        clip_end = min(n_frames, first_fall_frame + post_fall_frames)
+        vis_frames = visualize_clip_parallel(
+            frames=frames,
+            keypoints_list=keypoints_list,
+            frame_indices=frame_indices,
+            fall_probs=fall_probs,
+            clip_start=clip_start,
+            clip_end=clip_end,
+            fps=fps,
+            first_fall_frame=first_fall_frame,  # 깜빡임 방지용
+            fall_threshold=fall_threshold,
+            viz_keypoints=viz_keypoints,
+            viz_scale=1.0,
+            num_workers=4
+        )
+        if not vis_frames:
             progress(1.0, desc="완료!")
             return None, fig, "클립 추출에 실패했습니다."
+        # Stage 5: 비디오 인코딩
         progress(0.9, desc="클립 인코딩 중...")
         with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp:
             output_path = tmp.name
         fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+        clip_height, clip_width = vis_frames[0].shape[:2]
         out = cv2.VideoWriter(output_path, fourcc, fps, (clip_width, clip_height))
+        for vis_frame in vis_frames:
             out.write(vis_frame)
         out.release()
+        # H.264 재인코딩 (브라우저 호환)
         with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp:
             output_h264 = tmp.name
+        subprocess.run(
+            [
+                'ffmpeg', '-y', '-i', output_path,
+                '-c:v', 'libx264', '-preset', 'fast', '-crf', '23',
+                output_h264, '-loglevel', 'quiet'
+            ],
+            check=False,
+            capture_output=True
+        )
+        # 임시 파일 정리
         if os.path.exists(output_path):
             os.remove(output_path)
+        final_output = output_h264 if os.path.exists(output_h264) else None
         # 최종 판정
         progress(1.0, desc="완료!")
+        fall_time = first_fall_frame / fps
+        clip_duration = len(vis_frames) / fps
         result_text = (
             f"[FALL DETECTED] 낙상이 감지되었습니다!\n"
             f"낙상 시점: {fall_time:.2f}초 (프레임 #{first_fall_frame})\n"
+            f"클립 길이: {clip_duration:.1f}초 ({len(vis_frames)}프레임)"
         )
         return final_output, fig, result_text
             비디오를 업로드하면 낙상 여부를 분석하고, 결과 비디오와 확률 그래프를 제공합니다.
             **파이프라인 구성:**
+            - Stage 1: YOLOv11m-pose (Pose Estimation) - Batch Processing
+            - Stage 2: ST-GCN (Temporal Classification) - Batch Processing
+            - Window Size: 60 frames (2s @ 30fps)
             """,
             elem_id="main-title"
         )
                 with gr.Accordion("고급 설정", open=False):
                     fall_threshold = gr.Slider(
+                        minimum=0.5,
                         maximum=0.95,
+                        value=0.7,
                         step=0.05,
                         label="낙상 판정 임계값",
+                        info="권장: 0.7-0.85"
                     )
                     viz_keypoints = gr.Radio(
                         choices=["all", "major"],
                 gr.Markdown("### 결과")
                 result_text = gr.Textbox(
                     label="판정 결과",
+                    lines=3,
                     interactive=False
                 )
                 video_output = gr.Video(
         if examples:
             gr.Examples(
+                examples=[[ex, 0.7, "all"] for ex in examples[:3]],
                 inputs=[video_input, fall_threshold, viz_keypoints],
                 outputs=[video_output, prob_graph, result_text],
                 fn=process_video,