Spaces:

iDrops
/

Exercise_Tracking_Demo

Sleeping

App Files Files Community

iDrops commited on Jun 7, 2024

Commit

5577555

verified ·

1 Parent(s): 36a36a7

Update utils.py

Browse files

Files changed (1) hide show

utils.py +112 -20

utils.py CHANGED Viewed

@@ -2,6 +2,7 @@ import cv2
 import mediapipe as mp
 import numpy as np
 correct = cv2.imread('right.png')
 correct = cv2.cvtColor(correct, cv2.COLOR_BGR2RGB)
 incorrect = cv2.imread('wrong.png')
@@ -9,19 +10,30 @@ incorrect = cv2.cvtColor(incorrect, cv2.COLOR_BGR2RGB)
 def draw_rounded_rect(img, rect_start, rect_end, corner_width, box_color):
     x1, y1 = rect_start
     x2, y2 = rect_end
     w = corner_width
-    # draw filled rectangles
     cv2.rectangle(img, (x1 + w, y1), (x2 - w, y1 + w), box_color, -1)
     cv2.rectangle(img, (x1 + w, y2 - w), (x2 - w, y2), box_color, -1)
     cv2.rectangle(img, (x1, y1 + w), (x1 + w, y2 - w), box_color, -1)
     cv2.rectangle(img, (x2 - w, y1 + w), (x2, y2 - w), box_color, -1)
     cv2.rectangle(img, (x1 + w, y1 + w), (x2 - w, y2 - w), box_color, -1)
-    # draw filled ellipses
     cv2.ellipse(img, (x1 + w, y1 + w), (w, w),
                 angle = 0, startAngle = -90, endAngle = -180, color = box_color, thickness = -1)
@@ -36,12 +48,21 @@ def draw_rounded_rect(img, rect_start, rect_end, corner_width, box_color):
     return img
 def draw_dotted_line(frame, lm_coord, start, end, line_color):
     pix_step = 0
     for i in range(start, end+1, 8):
         cv2.circle(frame, (lm_coord[0], i+pix_step), 2, line_color, -1, lineType=cv2.LINE_AA)
@@ -61,33 +82,62 @@ def draw_text(
     overlay_image = False,
     overlay_type = None
 ):
     offset = box_offset
     x, y = pos
     text_size, _ = cv2.getTextSize(msg, font, font_scale, font_thickness)
     text_w, text_h = text_size
     rec_start = tuple(p - o for p, o in zip(pos, offset))
     rec_end = tuple(m + n - o for m, n, o in zip((x + text_w, y + text_h), offset, (25, 0)))
     resize_height = 0
     if overlay_image:
         resize_height = rec_end[1] - rec_start[1]
-        # print("Height: ", resize_height)
-        # print("Width: ", rec_end[0] - rec_start[0])
         img = draw_rounded_rect(img, rec_start, (rec_end[0]+resize_height, rec_end[1]), width, text_color_bg)
         if overlay_type == "correct":
             overlay_res = cv2.resize(correct, (resize_height, resize_height), interpolation = cv2.INTER_AREA)
         elif overlay_type == "incorrect":
             overlay_res = cv2.resize(incorrect, (resize_height, resize_height), interpolation = cv2.INTER_AREA)
         img[rec_start[1]:rec_start[1]+resize_height, rec_start[0]+width:rec_start[0]+width+resize_height] = overlay_res
     else:
         img = draw_rounded_rect(img, rec_start, rec_end, width, text_color_bg)
     cv2.putText(
         img,
         msg,
@@ -99,39 +149,69 @@ def draw_text(
         cv2.LINE_AA,
     )
     return text_size
 def find_angle(p1, p2, ref_pt = np.array([0,0])):
     p1_ref = p1 - ref_pt
     p2_ref = p2 - ref_pt
     cos_theta = (np.dot(p1_ref,p2_ref)) / (1.0 * np.linalg.norm(p1_ref) * np.linalg.norm(p2_ref))
     theta = np.arccos(np.clip(cos_theta, -1.0, 1.0))
-    degree = int(180 / np.pi) * theta
     return int(degree)
-def get_landmark_array(pose_landmark, key, frame_width, frame_height):
     denorm_x = int(pose_landmark[key].x * frame_width)
     denorm_y = int(pose_landmark[key].y * frame_height)
     return np.array([denorm_x, denorm_y])
-def get_landmark_features(kp_results, dict_features, feature, frame_width, frame_height):
     if feature == 'nose':
         return get_landmark_array(kp_results, dict_features[feature], frame_width, frame_height)
@@ -149,8 +229,20 @@ def get_landmark_features(kp_results, dict_features, feature, frame_width, frame
     else:
        raise ValueError("feature needs to be either 'nose', 'left' or 'right")
 def get_mediapipe_pose(
                         static_image_mode = False,
                         model_complexity = 1,
                         smooth_landmarks = True,

 import mediapipe as mp
 import numpy as np
+# Load the correct and incorrect posture images as BGR colors
 correct = cv2.imread('right.png')
 correct = cv2.cvtColor(correct, cv2.COLOR_BGR2RGB)
 incorrect = cv2.imread('wrong.png')
 def draw_rounded_rect(img, rect_start, rect_end, corner_width, box_color):
+  """
+  This function draws a rectangle with rounded corners on an image.
+  Args:
+      img: The image to draw on.
+      rect_start: The top-left corner of the rectangle as a tuple (x1, y1).
+      rect_end: The bottom-right corner of the rectangle as a tuple (x2, y2).
+      corner_width: The width of the rounded corners.
+      box_color: The color of the rectangle in BGR format.
+  """
     x1, y1 = rect_start
     x2, y2 = rect_end
     w = corner_width
+    # Draw filled rectangles for each side of the box
     cv2.rectangle(img, (x1 + w, y1), (x2 - w, y1 + w), box_color, -1)
     cv2.rectangle(img, (x1 + w, y2 - w), (x2 - w, y2), box_color, -1)
     cv2.rectangle(img, (x1, y1 + w), (x1 + w, y2 - w), box_color, -1)
     cv2.rectangle(img, (x2 - w, y1 + w), (x2, y2 - w), box_color, -1)
     cv2.rectangle(img, (x1 + w, y1 + w), (x2 - w, y2 - w), box_color, -1)
+    # Draw filled ellipses for the corners
     cv2.ellipse(img, (x1 + w, y1 + w), (w, w),
                 angle = 0, startAngle = -90, endAngle = -180, color = box_color, thickness = -1)
     return img
 def draw_dotted_line(frame, lm_coord, start, end, line_color):
+  """
+  This function draws a dotted line on a frame based on landmark coordinates.
+  Args:
+      frame: The image to draw on.
+      lm_coord: The landmark coordinates as a NumPy array.
+      start: The index of the starting landmark in the lm_coord array.
+      end: The index of the ending landmark in the lm_coord array.
+      line_color: The color of the line in BGR format.
+  """
     pix_step = 0
+    # Draw circles at every 8th element between the start and end landmarks
     for i in range(start, end+1, 8):
         cv2.circle(frame, (lm_coord[0], i+pix_step), 2, line_color, -1, lineType=cv2.LINE_AA)
     overlay_image = False,
     overlay_type = None
 ):
+      """
+  This function draws text with a customizable background box on an image.
+  Args:
+      img: The image to draw on.
+      msg: The message to display as a string.
+      width: The thickness of the background box border (default: 7).
+      font: The font style for the text (default: cv2.FONT_HERSHEY_SIMPLEX).
+      pos: The top-left corner coordinates of the text box (default: (0, 0)).
+      font_scale: The scaling factor for the font size (default: 1).
+      font_thickness: The thickness of the text (default: 2).
+      text_color: The color of the text in BGR format (default: green - (0, 255, 0)).
+      text_color_bg: The color of the background box in BGR format (default: black - (0, 0, 0)).
+      box_offset: The offset for the background box relative to the text (default: (20, 10)).
+      overlay_image: Flag to display an overlay image inside the box (default: False).
+      overlay_type: Type of overlay image ("correct" or "incorrect") - used when overlay_image is True.
+  Returns:
+      The size of the drawn text (width, height) as a NumPy array.
+  """
     offset = box_offset
     x, y = pos
+    # Get the size of the text with the specified font and scale
     text_size, _ = cv2.getTextSize(msg, font, font_scale, font_thickness)
     text_w, text_h = text_size
+    # Calculate the top-left and bottom-right corners of the text box with padding
     rec_start = tuple(p - o for p, o in zip(pos, offset))
     rec_end = tuple(m + n - o for m, n, o in zip((x + text_w, y + text_h), offset, (25, 0)))
     resize_height = 0
+    # Handle overlay image logic
     if overlay_image:
         resize_height = rec_end[1] - rec_start[1]
+        # Draw a rounded rectangle box with the background color
         img = draw_rounded_rect(img, rec_start, (rec_end[0]+resize_height, rec_end[1]), width, text_color_bg)
+        # Resize the overlay image based on the box height
         if overlay_type == "correct":
             overlay_res = cv2.resize(correct, (resize_height, resize_height), interpolation = cv2.INTER_AREA)
         elif overlay_type == "incorrect":
             overlay_res = cv2.resize(incorrect, (resize_height, resize_height), interpolation = cv2.INTER_AREA)
+        # Overlay the resized image onto the background box
         img[rec_start[1]:rec_start[1]+resize_height, rec_start[0]+width:rec_start[0]+width+resize_height] = overlay_res
     else:
         img = draw_rounded_rect(img, rec_start, rec_end, width, text_color_bg)
+    # Draw the text onto the image with specified parameters
     cv2.putText(
         img,
         msg,
         cv2.LINE_AA,
     )
     return text_size
 def find_angle(p1, p2, ref_pt = np.array([0,0])):
+  """
+  This function calculates the angle between two points relative to a reference point.
+  Args:
+      p1: The first point coordinates as a NumPy array (x, y).
+      p2: The second point coordinates as a NumPy array (x, y).
+      ref_pt: The reference point coordinates as a NumPy array (default: [0, 0]).
+  Returns:
+      The angle between the two points in degrees (int).
+  """
+    # Subtract the reference point from both points for normalization
     p1_ref = p1 - ref_pt
     p2_ref = p2 - ref_pt
+    # Calculate the cosine of the angle using the dot product
     cos_theta = (np.dot(p1_ref,p2_ref)) / (1.0 * np.linalg.norm(p1_ref) * np.linalg.norm(p2_ref))
+    # Clip the cosine value to avoid potential errors
     theta = np.arccos(np.clip(cos_theta, -1.0, 1.0))
+    # Convert the angle from radians to degrees and cast to integer
+    degree = int(180 / np.pi) * theta
     return int(degree)
+def get_landmark_array(pose_landmark, key, frame_width, frame_height):
+  """
+  This function extracts the normalized image coordinates for a landmark.
+  Args:
+      pose_landmark: A MediaPipe pose landmark object.
+      key: The key name of the landmark to extract (e.g., 'nose', 'shoulder.x').
+      frame_width: The width of the image frame.
+      frame_height: The height of the image frame.
+  Returns:
+      A NumPy array containing the normalized x and y coordinates of the landmark.
+  """
     denorm_x = int(pose_landmark[key].x * frame_width)
     denorm_y = int(pose_landmark[key].y * frame_height)
     return np.array([denorm_x, denorm_y])
+def get_landmark_features(kp_results, dict_features, feature, frame_width, frame_height):
+  """
+  This function extracts landmark coordinates for various body parts based on a feature name.
+  Args:
+      kp_results: The MediaPipe pose landmark results object.
+      dict_features: A dictionary containing landmark key names for different body parts.
+      feature: The name of the body part feature to extract (e.g., 'nose', 'left', 'right').
+      frame_width: The width of the image frame.
+      frame_height: The height of the image frame.
+  Returns:
+      A list containing the landmark coordinates (as NumPy arrays) or raises an error if the feature is invalid.
+  """
     if feature == 'nose':
         return get_landmark_array(kp_results, dict_features[feature], frame_width, frame_height)
     else:
        raise ValueError("feature needs to be either 'nose', 'left' or 'right")
 def get_mediapipe_pose(
+''''
+  This function creates a MediaPipe Pose object for human pose estimation.
+  Args:
+      static_image_mode: Flag for processing a single static image (default: False).
+      model_complexity: Level of complexity for the pose model (default: 1).
+      smooth_landmarks: Enable smoothing of detected landmarks (default: True).
+      min_detection_confidence: Minimum confidence threshold for person detection (default: 0.5).
+      min_tracking_confidence: Minimum confidence threshold for pose tracking (default: 0.5).
+  Returns:
+      A MediaPipe Pose object.
+''''
                         static_image_mode = False,
                         model_complexity = 1,
                         smooth_landmarks = True,