Spaces:

Natwar
/

Sign_Language_Detection

Sleeping

App Files Files Community

Natwar committed on Apr 15, 2025

Commit

5069bfa

verified ·

1 Parent(s): 8bd1b32

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -30

app.py CHANGED Viewed

@@ -1,7 +1,34 @@
-# Install required dependencies
-!pip install -q mediapipe tensorflow opencv-python-headless gradio Pillow numpy
 import os
 import numpy as np
 import tensorflow as tf
 import cv2
@@ -18,7 +45,7 @@ class handTracker():
         self.modelComplexity = modelComplexity
         self.detectionConfidence = detectionConfidence
         self.trackConfidence = trackConfidence
         self.mpHands = mp.solutions.hands
         self.hands = self.mpHands.Hands(
             static_image_mode=self.mode,
@@ -26,51 +53,51 @@ class handTracker():
             model_complexity=self.modelComplexity,
             min_detection_confidence=self.detectionConfidence,
             min_tracking_confidence=self.trackConfidence)
         self.mpDraw = mp.solutions.drawing_utils
         self.mpDrawStyles = mp.solutions.drawing_styles
     # Run hand detection on `frame` and draw every detected hand's landmarks.
     #   frame: image in OpenCV BGR channel order (it is converted with
     #          cv2.COLOR_BGR2RGB before being handed to the detector).
     # Returns the same `frame` object that was passed in.
     # Side effect: stores the detector output in self.results, which
     # findLandmarks reads afterwards.
     def findAndDrawHands(self, frame):
         RGBimage = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
         self.results = self.hands.process(RGBimage)
         # multi_hand_landmarks is falsy when nothing was detected; drawing is
         # skipped in that case and the frame is returned as received.
         if self.results.multi_hand_landmarks:
             for handLms in self.results.multi_hand_landmarks:
                 # NOTE(review): draw_landmarks presumably draws onto the image
                 # in place (its return value is not used) - confirm against
                 # the MediaPipe drawing_utils documentation.
                 self.mpDraw.draw_landmarks(
-                    frame,
                     handLms,
                     self.mpHands.HAND_CONNECTIONS,
                     self.mpDrawStyles.get_default_hand_landmarks_style(),
                     self.mpDrawStyles.get_default_hand_connections_style())
         return frame
     def findLandmarks(self, frame, handNo=0):
         landmarkList = []
         x_list = []
         y_list = []
         bbox = []
         if self.results.multi_hand_landmarks:
             if handNo < len(self.results.multi_hand_landmarks):
                 myHand = self.results.multi_hand_landmarks[handNo]
                 for id, lm in enumerate(myHand.landmark):
                     h, w, c = frame.shape
                     cx, cy = int(lm.x * w), int(lm.y * h)
                     x_list.append(cx)
                     y_list.append(cy)
                     landmarkList.append([id, cx, cy])
                 if x_list and y_list:
                     xmin, xmax = min(x_list), max(x_list)
                     ymin, ymax = min(y_list), max(y_list)
                     padding = 20
                     xmin = max(0, xmin - padding)
                     ymin = max(0, ymin - padding)
                     boxW = min(w - xmin, xmax - xmin + 2*padding)
                     boxH = min(h - ymin, ymax - ymin + 2*padding)
                     if boxW > boxH:
                         diff = boxW - boxH
                         ymin = max(0, ymin - diff//2)
@@ -79,7 +106,7 @@ class handTracker():
                         diff = boxH - boxW
                         xmin = max(0, xmin - diff//2)
                         boxW = min(w - xmin, boxH)
                     bbox = [xmin, ymin, boxW, boxH]
         return landmarkList, bbox
@@ -97,10 +124,10 @@ def load_model_with_compatibility(model_path):
                     if 'groups' in kwargs:
                         del kwargs['groups']
                     super(CustomDepthwiseConv2D, self).__init__(**kwargs)
             custom_objects = {'DepthwiseConv2D': CustomDepthwiseConv2D}
             model = tf.keras.models.load_model(
-                model_path,
                 custom_objects=custom_objects,
                 compile=False
             )
@@ -114,7 +141,7 @@ def create_simple_asl_model():
     labels = ['A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',
              'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S',
              'T', 'U', 'V', 'W', 'X', 'Y']
     print("Creating a new compatible model...")
     model = tf.keras.Sequential([
         tf.keras.layers.Conv2D(32, (3, 3), activation='relu', input_shape=(224, 224, 3)),
@@ -128,7 +155,7 @@ def create_simple_asl_model():
         tf.keras.layers.Dense(len(labels), activation='softmax')
     ])
     model.compile(optimizer='adam',
-                  loss='sparse_categorical_crossentropy',
                   metrics=['accuracy'])
     return model
@@ -145,7 +172,7 @@ def preprocess_hand_roi(hand_roi, target_shape):
             hand_roi_rgb = cv2.cvtColor(hand_roi, cv2.COLOR_GRAY2RGB)
         else:
             hand_roi_rgb = hand_roi.copy()
         resized = cv2.resize(hand_roi_rgb, (target_shape[0], target_shape[1]))
         normalized = resized.astype('float32') / 255.0
     else:
@@ -153,12 +180,12 @@ def preprocess_hand_roi(hand_roi, target_shape):
             hand_roi_gray = cv2.cvtColor(hand_roi, cv2.COLOR_BGR2GRAY)
         else:
             hand_roi_gray = hand_roi
         resized = cv2.resize(hand_roi_gray, (target_shape[0], target_shape[1]))
         normalized = resized.astype('float32') / 255.0
         if len(normalized.shape) == 2:
             normalized = normalized[..., np.newaxis]
     return np.expand_dims(normalized, axis=0), resized
 def process_image(input_image):
@@ -166,16 +193,16 @@ def process_image(input_image):
     tracker = handTracker(detectionConfidence=0.7)
     frame_with_hands = tracker.findAndDrawHands(frame.copy())
     landmarks, bbox = tracker.findLandmarks(frame)
     if not bbox:
         return "No hand detected", None
     x, y, w, h = bbox
     hand_roi = frame[y:y+h, x:x+w]
     cv2.rectangle(frame_with_hands, (x, y), (x+w, y+h), (0, 255, 0), 2)
     model_input, _ = preprocess_hand_roi(hand_roi, model_input_shape)
     try:
         prediction = model.predict(model_input, verbose=0)[0]
         predicted_class = np.argmax(prediction)
@@ -183,11 +210,11 @@ def process_image(input_image):
         letter = labels[predicted_class] if predicted_class < len(labels) else "Unknown"
     except:
         return "Prediction error", None
     result_text = f"Prediction: {letter} (Confidence: {confidence:.2f})"
-    cv2.putText(frame_with_hands, result_text, (10, 30),
                 cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2)
     output_image = cv2.cvtColor(frame_with_hands, cv2.COLOR_BGR2RGB)
     return result_text, Image.fromarray(output_image)
@@ -204,4 +231,4 @@ interface = gr.Interface(
 )
 if __name__ == "__main__":
-    interface.launch(share=True)

 import os
+import subprocess
+import sys
+import pkg_resources
+import warnings
+warnings.filterwarnings("ignore")
+# Install a single package with pip, run as a subprocess of the current
+# interpreter (sys.executable -m pip install --no-cache-dir <spec>).
+#   package: name handed to pip.
+#   version: optional version; when truthy the spec becomes
+#            "package==version", otherwise the bare package name is used.
+# Raises subprocess.CalledProcessError when pip exits with a non-zero status:
+# the failure is printed first and then re-raised.
+def install_package(package, version=None):
+    package_spec = f"{package}=={version}" if version else package
+    print(f"Installing {package_spec}...")
+    try:
+        subprocess.check_call([sys.executable, "-m", "pip", "install", "--no-cache-dir", package_spec])
+    except subprocess.CalledProcessError as e:
+        print(f"Failed to install {package_spec}: {e}")
+        # Re-raise so the caller sees the failed install instead of continuing.
+        raise
+# Required packages
+required_packages = {
+    "mediapipe": None,
+    "tensorflow": None,
+    "opencv-python-headless": None,
+    "gradio": None,
+    "Pillow": None,
+    "numpy": None
+}
+installed_packages = {pkg.key for pkg in pkg_resources.working_set}
+for package, version in required_packages.items():
+    if package not in installed_packages:
+        install_package(package, version)
 import numpy as np
 import tensorflow as tf
 import cv2
         self.modelComplexity = modelComplexity
         self.detectionConfidence = detectionConfidence
         self.trackConfidence = trackConfidence
         self.mpHands = mp.solutions.hands
         self.hands = self.mpHands.Hands(
             static_image_mode=self.mode,
             model_complexity=self.modelComplexity,
             min_detection_confidence=self.detectionConfidence,
             min_tracking_confidence=self.trackConfidence)
         self.mpDraw = mp.solutions.drawing_utils
         self.mpDrawStyles = mp.solutions.drawing_styles
     # Run hand detection on `frame` and draw every detected hand's landmarks.
     #   frame: image in OpenCV BGR channel order (it is converted with
     #          cv2.COLOR_BGR2RGB before being handed to the detector).
     # Returns the same `frame` object that was passed in.
     # Side effect: stores the detector output in self.results, which
     # findLandmarks reads afterwards.
     def findAndDrawHands(self, frame):
         RGBimage = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
         self.results = self.hands.process(RGBimage)
         # multi_hand_landmarks is falsy when nothing was detected; drawing is
         # skipped in that case and the frame is returned as received.
         if self.results.multi_hand_landmarks:
             for handLms in self.results.multi_hand_landmarks:
                 # NOTE(review): draw_landmarks presumably draws onto the image
                 # in place (its return value is not used) - confirm against
                 # the MediaPipe drawing_utils documentation.
                 self.mpDraw.draw_landmarks(
+                    frame,
                     handLms,
                     self.mpHands.HAND_CONNECTIONS,
                     self.mpDrawStyles.get_default_hand_landmarks_style(),
                     self.mpDrawStyles.get_default_hand_connections_style())
         return frame
     def findLandmarks(self, frame, handNo=0):
         landmarkList = []
         x_list = []
         y_list = []
         bbox = []
         if self.results.multi_hand_landmarks:
             if handNo < len(self.results.multi_hand_landmarks):
                 myHand = self.results.multi_hand_landmarks[handNo]
                 for id, lm in enumerate(myHand.landmark):
                     h, w, c = frame.shape
                     cx, cy = int(lm.x * w), int(lm.y * h)
                     x_list.append(cx)
                     y_list.append(cy)
                     landmarkList.append([id, cx, cy])
                 if x_list and y_list:
                     xmin, xmax = min(x_list), max(x_list)
                     ymin, ymax = min(y_list), max(y_list)
                     padding = 20
                     xmin = max(0, xmin - padding)
                     ymin = max(0, ymin - padding)
                     boxW = min(w - xmin, xmax - xmin + 2*padding)
                     boxH = min(h - ymin, ymax - ymin + 2*padding)
                     if boxW > boxH:
                         diff = boxW - boxH
                         ymin = max(0, ymin - diff//2)
                         diff = boxH - boxW
                         xmin = max(0, xmin - diff//2)
                         boxW = min(w - xmin, boxH)
                     bbox = [xmin, ymin, boxW, boxH]
         return landmarkList, bbox
                     if 'groups' in kwargs:
                         del kwargs['groups']
                     super(CustomDepthwiseConv2D, self).__init__(**kwargs)
             custom_objects = {'DepthwiseConv2D': CustomDepthwiseConv2D}
             model = tf.keras.models.load_model(
+                model_path,
                 custom_objects=custom_objects,
                 compile=False
             )
     labels = ['A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',
              'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S',
              'T', 'U', 'V', 'W', 'X', 'Y']
     print("Creating a new compatible model...")
     model = tf.keras.Sequential([
         tf.keras.layers.Conv2D(32, (3, 3), activation='relu', input_shape=(224, 224, 3)),
         tf.keras.layers.Dense(len(labels), activation='softmax')
     ])
     model.compile(optimizer='adam',
+                  loss='sparse_categorical_crossentropy',
                   metrics=['accuracy'])
     return model
             hand_roi_rgb = cv2.cvtColor(hand_roi, cv2.COLOR_GRAY2RGB)
         else:
             hand_roi_rgb = hand_roi.copy()
         resized = cv2.resize(hand_roi_rgb, (target_shape[0], target_shape[1]))
         normalized = resized.astype('float32') / 255.0
     else:
             hand_roi_gray = cv2.cvtColor(hand_roi, cv2.COLOR_BGR2GRAY)
         else:
             hand_roi_gray = hand_roi
         resized = cv2.resize(hand_roi_gray, (target_shape[0], target_shape[1]))
         normalized = resized.astype('float32') / 255.0
         if len(normalized.shape) == 2:
             normalized = normalized[..., np.newaxis]
     return np.expand_dims(normalized, axis=0), resized
 def process_image(input_image):
     tracker = handTracker(detectionConfidence=0.7)
     frame_with_hands = tracker.findAndDrawHands(frame.copy())
     landmarks, bbox = tracker.findLandmarks(frame)
     if not bbox:
         return "No hand detected", None
     x, y, w, h = bbox
     hand_roi = frame[y:y+h, x:x+w]
     cv2.rectangle(frame_with_hands, (x, y), (x+w, y+h), (0, 255, 0), 2)
     model_input, _ = preprocess_hand_roi(hand_roi, model_input_shape)
     try:
         prediction = model.predict(model_input, verbose=0)[0]
         predicted_class = np.argmax(prediction)
         letter = labels[predicted_class] if predicted_class < len(labels) else "Unknown"
     except:
         return "Prediction error", None
     result_text = f"Prediction: {letter} (Confidence: {confidence:.2f})"
+    cv2.putText(frame_with_hands, result_text, (10, 30),
                 cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2)
     output_image = cv2.cvtColor(frame_with_hands, cv2.COLOR_BGR2RGB)
     return result_text, Image.fromarray(output_image)
 )
 if __name__ == "__main__":
+    interface.launch(share=True)