AkashKhatri
/

sign-language-interpretor

Model card Files Files and versions

xet

Community

AkashKhatri committed on Dec 7, 2023

Commit

ba534be

1 Parent(s): b82b792

upload

Browse files

Files changed (2) hide show

sign_asl_cnn_30_epochs.h5 +3 -0
streamlit_app.py +152 -0

sign_asl_cnn_30_epochs.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1bb7dbc904898a1b2e60dc5d60fc045bb5dea4fd422fb292b3de22f83e49a2d9
+size 495899136

streamlit_app.py ADDED Viewed

	@@ -0,0 +1,152 @@

+import streamlit as st
+import numpy as np
+from keras.models import load_model
+import cv2
+from io import BytesIO
+import mediapipe as mp
+# Load the model
+model = load_model('sign_asl_cnn_30_epochs.h5')
+class_labels = {i: str(i) if i < 10 else chr(65 + i - 10) for i in range(36)}
+# Function to preprocess the image
+def preprocess_image(image):
+    image = cv2.resize(image, (200, 200))
+    image = image / 255.0
+    image = image.reshape(1, 200, 200, 3)
+    return image
+# Function to predict the sign language letter
+def predict_letter(image):
+    processed_image = preprocess_image(image)
+    predictions = model.predict(processed_image)
+    predicted_class = np.argmax(predictions, axis=1)[0]
+    sign_letter = class_labels[predicted_class]
+    return sign_letter
+# Function to detect hands in the image
+def detect_hands(image):
+    mp_hands = mp.solutions.hands
+    hands = mp_hands.Hands()
+    margin = 15
+    # Convert the image to RGB
+    image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    # Process the image and get the hand landmarks
+    results = hands.process(image_rgb)
+    if results.multi_hand_landmarks:
+        for landmarks in results.multi_hand_landmarks:
+            # Get bounding box coordinates of the hand
+            landmarks_xy = [(int(landmark.x * image.shape[1]), int(landmark.y * image.shape[0]))
+                            for landmark in landmarks.landmark]
+            # Define the bounding box for the hand
+            x_min = max(0, min(landmarks_xy, key=lambda x: x[0])[0] - margin)
+            y_min = max(0, min(landmarks_xy, key=lambda x: x[1])[1] - margin)
+            x_max = min(image.shape[1], max(landmarks_xy, key=lambda x: x[0])[0] + margin)
+            y_max = min(image.shape[0], max(landmarks_xy, key=lambda x: x[1])[1] + margin)
+            # Extract the hand region
+            roi = image[y_min:y_max, x_min:x_max]
+            # Check if the ROI is empty
+            if roi.size == 0:
+                continue
+            # Resize the ROI to match your model's input shape
+            roi = cv2.resize(roi, (200, 200), interpolation=cv2.INTER_AREA)
+            hsv = cv2.cvtColor(roi, cv2.COLOR_BGR2RGB)
+            lower_yellow = np.array([93, 72, 51])
+            upper_yellow = np.array([224, 194, 183])
+            mask = cv2.inRange(hsv, lower_yellow, upper_yellow)
+            roi = cv2.bitwise_and(roi, roi, mask=mask)
+            roi = roi.reshape(1, 200, 200, 3)  # Ensure it matches your model's input shape
+            # Make predictions using your classifier
+            predictions = model.predict(roi)
+            predicted_class = int(np.argmax(predictions, axis=1)[0])
+            result = class_labels[predicted_class]
+            # Draw result on the image
+            cv2.putText(image, str(result), (x_min, y_min - 10),
+                        cv2.FONT_HERSHEY_COMPLEX, 1, (0, 255, 0), 2)
+            # Draw bounding box on the image
+            cv2.rectangle(image, (x_min, y_min), (x_max, y_max), (255, 0, 0), 2)
+    return image
+# Streamlit app
+st.title('Sign Language Recognition')
+# Sidebar with radio button for Upload/Webcam
+selected_option = st.sidebar.radio("Select Option", ["Upload", "Webcam"], index=0)
+if selected_option == "Upload":
+    uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "png"])
+    if uploaded_file is not None:
+        if st.button('Predict'):
+            contents = uploaded_file.read()
+            nparr = np.frombuffer(contents, np.uint8)
+            image = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
+            # Make the prediction
+            predicted_letter = predict_letter(image)
+            # Display the predicted letter
+            st.write('Predicted Letter:', predicted_letter)
+elif selected_option == "Webcam":
+    # Placeholder for webcam frame
+    webcam_frame = st.empty()
+    # Placeholder for predicted letter in webcam mode
+    predicted_letter_webcam = st.empty()
+    # Placeholder for webcam capture status
+    webcam_capture_status = st.empty()
+    # Placeholder for webcam stop button
+    webcam_stop_button = st.empty()
+    # Placeholder for webcam status
+    webcam_status = st.empty()
+    # Placeholder for webcam button
+    webcam_button = st.button("Start Webcam")
+    if webcam_button:
+        webcam_status.text("Webcam is on.")
+        webcam_stop_button = st.button("Stop Webcam")
+        # OpenCV video capture
+        cap = cv2.VideoCapture(0)
+        while True:
+            # Read the frame from the webcam
+            ret, frame = cap.read()
+            # Display the frame in Streamlit
+            webcam_frame.image(frame, channels="BGR")
+            # Detect hands in the current frame
+            frame = detect_hands(frame)
+            # Convert the frame to JPEG format
+            _, jpeg = cv2.imencode(".jpg", frame)
+            # Display the predicted letter
+            predicted_letter = predict_letter(frame)
+            predicted_letter_webcam.text(f"Predicted Letter: {predicted_letter}")
+            # Check if the "Stop Webcam" button is clicked
+            if webcam_stop_button:
+                webcam_status.text("Webcam is off.")
+                break
+        # Release the webcam when done
+        cap.release()