Spaces:

1mpreccable
/

YOGAI

Sleeping

File size: 8,565 Bytes

import gradio as gr
import cv2
import numpy as np
import mediapipe as mp
from mediapipe.python.solutions import drawing_utils as mp_drawing
from PoseClassification.pose_embedding import FullBodyPoseEmbedding
from PoseClassification.pose_classifier import PoseClassifier
from PoseClassification.utils import EMADictSmoothing
import time

# Initialize components
mp_pose = mp.solutions.pose
pose_tracker = mp_pose.Pose()
pose_embedder = FullBodyPoseEmbedding()
pose_classifier = PoseClassifier(
    pose_samples_folder="data/yoga_poses_csvs_out",
    pose_embedder=pose_embedder,
    top_n_by_max_distance=30,
    top_n_by_mean_distance=10,
)
pose_classification_filter = EMADictSmoothing(window_size=10, alpha=0.2)

class_names = ["chair", "cobra", "dog", "goddess", "plank", "tree", "warrior", "none"]
position_threshold = 8.0


def check_major_current_position(positions_detected: dict, threshold_position) -> str:
    if max(positions_detected.values()) < float(threshold_position):
        return "none"
    return max(positions_detected, key=positions_detected.get)


def process_frame(frame):
    frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    result = pose_tracker.process(image=frame_rgb)
    pose_landmarks = result.pose_landmarks

    if pose_landmarks is not None:
        frame_height, frame_width = frame.shape[0], frame.shape[1]
        pose_landmarks = np.array(
            [
                [lmk.x * frame_width, lmk.y * frame_height, lmk.z * frame_width]
                for lmk in pose_landmarks.landmark
            ],
            dtype=np.float32,
        )
        pose_classification = pose_classifier(pose_landmarks)
        pose_classification_filtered = pose_classification_filter(pose_classification)
        current_position = pose_classification_filtered
    else:
        current_position = {"none": 10.0}

    current_position_major = check_major_current_position(
        current_position, position_threshold
    )
    return current_position_major, frame


def yoga_position_from_stream():
    current_position = "none"
    position_timer = 0
    last_update_time = 0
    recording = False
    recorded_frames = []
    start_time = 0
    frame_count = 0

    def classify_pose(frame):
        nonlocal current_position, position_timer, last_update_time, recording, recorded_frames, start_time, frame_count
        if frame is None:
            return (
                None,
                None,
                current_position,
                f"Duration: {int(position_timer)} seconds",
            )

        new_position, processed_frame = process_frame(frame)

        if new_position != current_position:
            current_position = new_position
            position_timer = 0
            last_update_time = cv2.getTickCount() / cv2.getTickFrequency()
        else:
            current_time = cv2.getTickCount() / cv2.getTickFrequency()
            position_timer += current_time - last_update_time
            last_update_time = current_time

        mp_drawing.draw_landmarks(
            image=processed_frame,
            landmark_list=pose_tracker.process(
                cv2.cvtColor(processed_frame, cv2.COLOR_BGR2RGB)
            ).pose_landmarks,
            connections=mp_pose.POSE_CONNECTIONS,
        )

        cv2.putText(
            processed_frame,
            f"Pose: {current_position}",
            (10, 30),
            cv2.FONT_HERSHEY_SIMPLEX,
            1,
            (0, 255, 0),
            2,
        )
        cv2.putText(
            processed_frame,
            f"Duration: {int(position_timer)} seconds",
            (10, 70),
            cv2.FONT_HERSHEY_SIMPLEX,
            1,
            (0, 255, 0),
            2,
        )

        if recording:
            recorded_frames.append(processed_frame)
            frame_count += 1
            if frame_count == 1:
                start_time = time.time()

        return (
            frame,
            processed_frame,
            current_position,
            f"Duration: {int(position_timer)} seconds",
        )

    def toggle_debug(debug_mode):
        return [
            gr.update(visible=debug_mode),
            gr.update(visible=not debug_mode),
            gr.update(visible=debug_mode),
        ]

    def start_recording():
        nonlocal recording, recorded_frames, start_time, frame_count
        recording = True
        recorded_frames = []
        start_time = 0
        frame_count = 0
        return "Recording started"

    def stop_recording():
        nonlocal recording
        recording = False
        return "Recording stopped"

    def save_video():
        nonlocal recorded_frames, start_time, frame_count
        if not recorded_frames:
            return None, "No recorded frames available"

        output_path = "recorded_yoga_session.mp4"
        height, width, _ = recorded_frames[0].shape

        # Calculate the actual frame rate
        elapsed_time = time.time() - start_time
        fps = frame_count / elapsed_time if elapsed_time > 0 else 30.0

        fourcc = cv2.VideoWriter_fourcc(*"mp4v")
        out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))

        for frame in recorded_frames:
            # Convert frame to BGR color space before writing
            frame_bgr = cv2.cvtColor(frame, cv2.COLOR_RGB2BGR)
            out.write(frame_bgr)
        out.release()

        return output_path, f"Video saved successfully at {fps:.2f} FPS"

    with gr.Column() as yoga_stream:
        gr.Markdown("# Yoga Position Classifier", elem_classes=["custom-title"])
        gr.Markdown(
            "Stream live yoga sessions and get real-time pose classification.",
            elem_classes=["custom-subtitle"],
        )

        with gr.Row():
            with gr.Column(scale=3):
                video_feed = gr.Webcam(streaming=True, elem_classes=["custom-webcam"])

            with gr.Column(scale=2):
                pose_output = gr.Textbox(
                    label="Current Pose", elem_classes=["custom-textbox"]
                )
                timer_output = gr.Textbox(
                    label="Pose Duration", elem_classes=["custom-textbox"]
                )
                debug_toggle = gr.Checkbox(
                    label="Debug Mode", value=False, elem_classes=["custom-checkbox"]
                )

        with gr.Column(visible=False) as debug_view:
            classified_video = gr.Image(
                label="Classified Video Feed", elem_classes=["custom-image"]
            )
            with gr.Row():
                start_button = gr.Button(
                    "Start Recording", elem_classes=["custom-button"]
                )
                stop_button = gr.Button(
                    "Stop Recording", elem_classes=["custom-button"]
                )
            save_button = gr.Button("Save Recording", elem_classes=["custom-button"])
            recording_status = gr.Textbox(
                label="Recording Status", elem_classes=["custom-textbox"]
            )
            recorded_video = gr.Video(
                label="Recorded Video", elem_classes=["custom-video"]
            )
            download_button = gr.Button(
                "Download Recorded Video", elem_classes=["custom-button"]
            )

        debug_toggle.change(
            toggle_debug,
            inputs=[debug_toggle],
            outputs=[debug_view, video_feed, classified_video],
        )

        video_feed.stream(
            classify_pose,
            inputs=[video_feed],
            outputs=[video_feed, classified_video, pose_output, timer_output],
            show_progress=False,
        )

        start_button.click(start_recording, outputs=[recording_status])
        stop_button.click(stop_recording, outputs=[recording_status])
        save_button.click(save_video, outputs=[recorded_video, recording_status])
        download_button.click(lambda: "recorded_yoga_session.mp4", outputs=[gr.File()])

    return yoga_stream


if __name__ == "__main__":
    with gr.Blocks(
        css="""
        .custom-title { font-size: 36px; font-weight: bold; margin-bottom: 10px; }
        .custom-subtitle { font-size: 18px; margin-bottom: 20px; }
        .custom-webcam { height: 480px; }
        .custom-textbox input { font-size: 24px; }
        .custom-checkbox label { font-size: 18px; }
        .custom-button { font-size: 18px; }
        .custom-image img { max-height: 400px; }
        .custom-video video { max-height: 400px; }
        """
    ) as demo:
        yoga_position_from_stream()
    demo.launch()