Phani-1 committed
Commit d9b157e · verified · 1 parent: 6b5ca8e

Update app.py

Files changed (1)
  1. app.py +195 -209
app.py CHANGED
@@ -1,209 +1,195 @@
- import cv2
- import tempfile
- import numpy as np
- import mediapipe as mp
- import streamlit as st
- import tensorflow as tf
-
- POSE_CONNECTIONS = [
-     (0, 1), (1, 2), (2, 3), (3, 7),
-     (0, 4), (4, 5), (5, 6), (6, 8),
-     (9, 10), (11, 12), (11, 13), (13, 15),
-     (15, 17), (15, 19), (15, 21), (17, 19),
-     (12, 14), (14, 16), (16, 18), (16, 20),
-     (16, 22), (18, 20), (11, 23), (12, 24),
-     (23, 24), (23, 25), (24, 26), (25, 27),
-     (26, 28), (27, 29), (28, 30), (29, 31),
-     (30, 32)
- ]
-
-
- @st.cache_resource
- def load_model():
-     return tf.saved_model.load("Models/ssd_mobilenet/saved_model")
-
-
- model = load_model()
- mp_pose = mp.solutions.pose
-
- labels = {1: 'person'}
-
-
- def detect_persons(image):
-     tensor_img = tf.convert_to_tensor(image)
-     tensor_img = tensor_img[tf.newaxis, ...]
-
-     detections = model(tensor_img)
-
-     boxes = detections['detection_boxes'][0].numpy()
-     scores = detections['detection_scores'][0].numpy()
-     classes = detections['detection_classes'][0].numpy().astype(np.int32)
-
-     return boxes, scores, classes
-
-
- def draw_landmarks(img, landmarks):
-     height, width, _ = img.shape
-     for lm in landmarks.landmark:
-         cx, cy = int(lm.x * width), int(lm.y * height)
-         cv2.circle(img, (cx, cy), 8, (0, 0, 255), -1)
-
-     for connection in POSE_CONNECTIONS:
-         start_idx, end_idx = connection
-         if landmarks.landmark[start_idx] and landmarks.landmark[end_idx]:
-             start_point = landmarks.landmark[start_idx]
-             end_point = landmarks.landmark[end_idx]
-
-             start_coordinates = (int(start_point.x * width), int(start_point.y * height))
-             end_coordinates = (int(end_point.x * width), int(end_point.y * height))
-
-             cv2.line(img, start_coordinates, end_coordinates, (0, 255, 0), 3)
-
-     return img
-
-
- def draw_bounding_box(img, box, width, height):
-     y_min, x_min, y_max, x_max = box
-     left, right, top, bottom = x_min * width, x_max * width, y_min * height, y_max * height
-     cv2.rectangle(img, (int(left), int(top)), (int(right), int(bottom)), (255, 0, 0), 2)
-
-
- def process_frame(frame, pose, draw_box):
-     image_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-     boxes, scores, classes = detect_persons(image_rgb)
-
-     height, width, _ = frame.shape
-     for i in range(len(scores)):
-         if scores[i] > 0.5 and classes[i] == 1:
-             y_min, x_min, y_max, x_max = boxes[i]
-             left, right, top, bottom = x_min * width, x_max * width, y_min * height, y_max * height
-             person_roi = frame[int(top):int(bottom), int(left):int(right)]
-
-             results = pose.process(cv2.cvtColor(person_roi, cv2.COLOR_BGR2RGB))
-
-             if results.pose_landmarks:
-                 person_roi = draw_landmarks(person_roi, results.pose_landmarks)
-
-             frame[int(top):int(bottom), int(left):int(right)] = person_roi
-             if draw_box:
-                 draw_bounding_box(frame, boxes[i], width, height)
-
-     return frame
-
-
- def main():
-     st.markdown(
-         """
-         <style>
-         .title {
-             font-size: 36px;
-             color: #000000;
-             padding-bottom: 40px;
-             border-bottom: 4px solid #000000;
-         }
-         .intro {
-             font-size: 18px;
-             margin-top: 20px;
-             margin-bottom: 20px;
-         }
-         .upload-section {
-             background-color: #f0f0f0;
-             padding: 20px;
-             border-radius: 10px;
-             margin-bottom: 20px;
-         }
-         .button-primary {
-             background-color: #008CBA;
-             color: white;
-             font-weight: bold;
-             padding: 10px 20px;
-             border-radius: 5px;
-             transition: background-color 0.3s ease;
-             text-align: center;
-             display: inline-block;
-             cursor: pointer;
-         }
-         .button-primary:hover {
-             background-color: #005f7f;
-         }
-         </style>
-         """,
-         unsafe_allow_html=True
-     )
-
-     st.markdown("<p class='title'>Multi-Person Pose Estimation</p>", unsafe_allow_html=True)
-     st.markdown("<p class='intro'>Choose an operation type:</p>", unsafe_allow_html=True)
-
-     operation_type = st.radio("Choose operation type", ("Input", "Demo"))
-
-     if operation_type == "Input":
-         input_type = st.radio("Choose input type", ("Image", "Video"))
-
-         if input_type == "Image":
-             uploaded_file = st.file_uploader(
-                 "Upload an image file (.jpg, .jpeg, .png)",
-                 type=["jpg", "jpeg", "png"]
-             )
-         else:
-             uploaded_file = st.file_uploader(
-                 "Upload a video file (.mp4, .mov, .avi, .mkv)",
-                 type=["mp4", "mov", "avi", "mkv"]
-             )
-
-         draw_box = st.checkbox("Draw bounding box", value=False)
-
-         pose = mp_pose.Pose()
-
-         if uploaded_file is not None:
-             with tempfile.NamedTemporaryFile(delete=False) as temp_file:
-                 temp_file.write(uploaded_file.read())
-                 file_path = temp_file.name
-
-             if input_type == "Video":
-                 cam = cv2.VideoCapture(file_path)
-                 st_frame = st.empty()
-
-                 while cam.isOpened():
-                     success, frame = cam.read()
-                     if not success:
-                         break
-
-                     frame = process_frame(frame, pose, draw_box)
-
-                     st_frame.image(frame, channels='BGR', use_column_width=True)
-                     st.empty()
-
-                 st.text("Completed")
-                 cam.release()
-
-             elif input_type == "Image":
-                 image = cv2.imread(file_path)
-                 processed_image = process_frame(image, pose, draw_box)
-
-                 st.image(processed_image, channels='BGR', use_column_width=True)
-
-     elif operation_type == "Demo":
-         st.empty()
-         st.markdown("<p class='intro'>Demo video will be shown below:</p>", unsafe_allow_html=True)
-
-         demo_video_path = "Videos/video.mp4"
-         cam = cv2.VideoCapture(demo_video_path)
-         st_frame = st.empty()
-         pose = mp_pose.Pose()
-
-         while cam.isOpened():
-             success, frame = cam.read()
-             if not success:
-                 break
-
-             frame = process_frame(frame, pose, draw_box=False)
-
-             st_frame.image(frame, channels='BGR', use_column_width=True)
-             st.empty()
-
-         st.text("Completed")
-         cam.release()
-
-
- if __name__ == "__main__":
-     main()
 
+ import gc
+ import cv2
+ import tempfile
+ import numpy as np
+ import mediapipe as mp
+ import streamlit as st
+ import tensorflow as tf
+
+ POSE_CONNECTIONS = [
+     (0, 1), (1, 2), (2, 3), (3, 7),
+     (0, 4), (4, 5), (5, 6), (6, 8),
+     (9, 10), (11, 12), (11, 13), (13, 15),
+     (15, 17), (15, 19), (15, 21), (17, 19),
+     (12, 14), (14, 16), (16, 18), (16, 20),
+     (16, 22), (18, 20), (11, 23), (12, 24),
+     (23, 24), (23, 25), (24, 26), (25, 27),
+     (26, 28), (27, 29), (28, 30), (29, 31),
+     (30, 32)
+ ]
+
+ @st.cache_resource
+ def load_model():
+     return tf.saved_model.load("Models/ssd_mobilenet/saved_model")
+
+ model = load_model()
+ mp_pose = mp.solutions.pose
+
+ labels = {1: 'person'}
+
+ def detect_persons(image):
+     tensor_img = tf.convert_to_tensor(image)
+     tensor_img = tensor_img[tf.newaxis, ...]
+     detections = model(tensor_img)
+     boxes = detections['detection_boxes'][0].numpy()
+     scores = detections['detection_scores'][0].numpy()
+     classes = detections['detection_classes'][0].numpy().astype(np.int32)
+     return boxes, scores, classes
+
+ def draw_landmarks(img, landmarks):
+     height, width, _ = img.shape
+     for lm in landmarks.landmark:
+         cx, cy = int(lm.x * width), int(lm.y * height)
+         cv2.circle(img, (cx, cy), 8, (0, 0, 255), -1)
+     for connection in POSE_CONNECTIONS:
+         start_idx, end_idx = connection
+         if landmarks.landmark[start_idx] and landmarks.landmark[end_idx]:
+             start_point = landmarks.landmark[start_idx]
+             end_point = landmarks.landmark[end_idx]
+             start_coordinates = (int(start_point.x * width), int(start_point.y * height))
+             end_coordinates = (int(end_point.x * width), int(end_point.y * height))
+             cv2.line(img, start_coordinates, end_coordinates, (0, 255, 0), 3)
+     return img
+
+ def draw_bounding_box(img, box, width, height):
+     y_min, x_min, y_max, x_max = box
+     left, right, top, bottom = x_min * width, x_max * width, y_min * height, y_max * height
+     cv2.rectangle(img, (int(left), int(top)), (int(right), int(bottom)), (255, 0, 0), 2)
+
+ def process_frame(frame, pose, draw_box):
+     image_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+     boxes, scores, classes = detect_persons(image_rgb)
+     height, width, _ = frame.shape
+     for i in range(len(scores)):
+         if scores[i] > 0.5 and classes[i] == 1:
+             y_min, x_min, y_max, x_max = boxes[i]
+             left, right, top, bottom = x_min * width, x_max * width, y_min * height, y_max * height
+             person_roi = frame[int(top):int(bottom), int(left):int(right)]
+             results = pose.process(cv2.cvtColor(person_roi, cv2.COLOR_BGR2RGB))
+             if results.pose_landmarks:
+                 person_roi = draw_landmarks(person_roi, results.pose_landmarks)
+             frame[int(top):int(bottom), int(left):int(right)] = person_roi
+             if draw_box:
+                 draw_bounding_box(frame, boxes[i], width, height)
+     return frame
+
+ def main():
+     st.markdown(
+         """
+         <style>
+         .title {
+             font-size: 36px;
+             color: #000000;
+             padding-bottom: 40px;
+             border-bottom: 4px solid #000000;
+         }
+         .intro {
+             font-size: 18px;
+             margin-top: 20px;
+             margin-bottom: 20px;
+         }
+         .upload-section {
+             background-color: #f0f0f0;
+             padding: 20px;
+             border-radius: 10px;
+             margin-bottom: 20px;
+         }
+         .button-primary {
+             background-color: #008CBA;
+             color: white;
+             font-weight: bold;
+             padding: 10px 20px;
+             border-radius: 5px;
+             transition: background-color 0.3s ease;
+             text-align: center;
+             display: inline-block;
+             cursor: pointer;
+         }
+         .button-primary:hover {
+             background-color: #005f7f;
+         }
+         </style>
+         """,
+         unsafe_allow_html=True
+     )
+
+     st.markdown("<p class='title'>Multi-Person Pose Estimation</p>", unsafe_allow_html=True)
+     st.markdown("<p class='intro'>Choose an operation type:</p>", unsafe_allow_html=True)
+
+     operation_type = st.radio("Choose operation type", ("Input", "Demo"))
+
+     if operation_type == "Input":
+         input_type = st.radio("Choose input type", ("Image", "Video"))
+
+         if input_type == "Image":
+             uploaded_file = st.file_uploader(
+                 "Upload an image file (.jpg, .jpeg, .png)",
+                 type=["jpg", "jpeg", "png"]
+             )
+         else:
+             uploaded_file = st.file_uploader(
+                 "Upload a video file (.mp4, .mov, .avi, .mkv)",
+                 type=["mp4", "mov", "avi", "mkv"]
+             )
+
+         draw_box = st.checkbox("Draw bounding box", value=False)
+
+         pose = mp_pose.Pose()
+
+         if uploaded_file is not None:
+             with tempfile.NamedTemporaryFile(delete=False) as temp_file:
+                 temp_file.write(uploaded_file.read())
+                 file_path = temp_file.name
+
+             if input_type == "Video":
+                 cam = cv2.VideoCapture(file_path)
+                 st_frame = st.empty()
+
+                 while cam.isOpened():
+                     success, frame = cam.read()
+                     if not success:
+                         break
+
+                     frame = process_frame(frame, pose, draw_box)
+
+                     st_frame.image(frame, channels='BGR', use_column_width=True)
+
+                     # Ensure proper synchronization and frame display
+                     st_frame.empty()
+
+                 st.text("Completed")
+                 cam.release()
+
+             elif input_type == "Image":
+                 image = cv2.imread(file_path)
+                 processed_image = process_frame(image, pose, draw_box)
+
+                 st.image(processed_image, channels='BGR', use_column_width=True)
+
+             gc.collect()
+
+     elif operation_type == "Demo":
+         st.empty()
+         st.markdown("<p class='intro'>Demo video will be shown below:</p>", unsafe_allow_html=True)
+
+         demo_video_path = "Videos/video.mp4"
+         cam = cv2.VideoCapture(demo_video_path)
+         st_frame = st.empty()
+         pose = mp_pose.Pose()
+
+         while cam.isOpened():
+             success, frame = cam.read()
+             if not success:
+                 break
+
+             frame = process_frame(frame, pose, draw_box=False)
+
+             st_frame.image(frame, channels='BGR', use_column_width=True)
+             st_frame.empty()
+
+         st.text("Completed")
+         cam.release()
+         gc.collect()
+
+ if __name__ == "__main__":
+     main()