Spaces:

Zeqhx
/

MSL-Project

Sleeping

Zeqh Claude Sonnet 4.5 committed on Dec 31, 2025

Commit

e06c4c9

1 Parent(s): ebdf66c

Update to more accurate model with scaler normalization

- Updated to new trained model (more accurate)
- Added scaler.bin for feature normalization
- Updated to 10 gesture classes (removed 'hi')
- Increased sequence length from 10 to 30 frames
- Raised confidence threshold from 0.5 to 0.7
- Added joblib dependency for scaler loading

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

Files changed (5)

Dockerfile +1 -0
app.py +18 -3
requirements.txt +2 -1
scaler.bin +3 -0
trained_model.pth +2 -2

Dockerfile CHANGED Viewed

@@ -21,6 +21,7 @@ COPY app.py .
 COPY model.py .
 COPY preprocessing.py .
 COPY trained_model.pth .
 # Expose port 7860 (Hugging Face Spaces default)
 EXPOSE 7860

 COPY model.py .
 COPY preprocessing.py .
 COPY trained_model.pth .
+COPY scaler.bin .
 # Expose port 7860 (Hugging Face Spaces default)
 EXPOSE 7860

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ FastAPI application for Sign Language Recognition API
 import os
 import torch
 import numpy as np
 from fastapi import FastAPI, HTTPException
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
@@ -33,7 +34,7 @@ app.add_middleware(
 # Gesture classes
 GESTURES = [
     'minum', 'berjalan', 'berlari', 'bola', 'dari',
-    'hi', 'jangan', 'mohon', 'pen', 'teh tarik', 'tolong'
 ]
 # Configuration
@@ -41,7 +42,7 @@ INPUT_SIZE = 258
 HIDDEN_SIZE = 64
 NUM_CLASSES = len(GESTURES)
 SEQUENCE_LENGTH = 30
-CONFIDENCE_THRESHOLD = 0.5
 # Device configuration
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -50,6 +51,7 @@ print(f"Using device: {device}")
 # Load model
 model = CustomLSTM(INPUT_SIZE, HIDDEN_SIZE, NUM_CLASSES).to(device)
 model_path = "trained_model.pth"
 try:
     model.load_state_dict(torch.load(model_path, map_location=device))
@@ -59,6 +61,14 @@ except Exception as e:
     print(f"Error loading model: {e}")
     raise
 # Initialize MediaPipe
 mp_holistic = mp.solutions.holistic
 holistic = mp_holistic.Holistic(
@@ -161,8 +171,13 @@ async def predict(request: FrameRequest):
         # Make prediction
         sequence = sequences[request.session_id][-SEQUENCE_LENGTH:]
         input_tensor = torch.tensor(
-            np.expand_dims(sequence, axis=0),
             dtype=torch.float32
         ).to(device)

 import os
 import torch
 import numpy as np
+import joblib
 from fastapi import FastAPI, HTTPException
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 # Gesture classes
 GESTURES = [
     'minum', 'berjalan', 'berlari', 'bola', 'dari',
+    'jangan', 'mohon', 'pen', 'teh tarik', 'tolong'
 ]
 # Configuration
 HIDDEN_SIZE = 64
 NUM_CLASSES = len(GESTURES)
 SEQUENCE_LENGTH = 30
+CONFIDENCE_THRESHOLD = 0.7
 # Device configuration
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load model
 model = CustomLSTM(INPUT_SIZE, HIDDEN_SIZE, NUM_CLASSES).to(device)
 model_path = "trained_model.pth"
+scaler_path = "scaler.bin"
 try:
     model.load_state_dict(torch.load(model_path, map_location=device))
     print(f"Error loading model: {e}")
     raise
+# Load scaler
+try:
+    scaler = joblib.load(scaler_path)
+    print(f"Scaler loaded successfully from {scaler_path}")
+except Exception as e:
+    print(f"Error loading scaler: {e}")
+    raise
 # Initialize MediaPipe
 mp_holistic = mp.solutions.holistic
 holistic = mp_holistic.Holistic(
         # Make prediction
         sequence = sequences[request.session_id][-SEQUENCE_LENGTH:]
+        sequence_array = np.array(sequence)
+        # Apply scaler transformation
+        sequence_scaled = scaler.transform(sequence_array)
         input_tensor = torch.tensor(
+            np.expand_dims(sequence_scaled, axis=0),
             dtype=torch.float32
         ).to(device)

requirements.txt CHANGED Viewed

@@ -8,6 +8,7 @@ pydantic==2.5.0
 torch==2.1.0
 torchvision==0.16.0
 numpy==1.26.4
 # Computer Vision & MediaPipe
 opencv-python-headless==4.10.0.84
@@ -17,4 +18,4 @@ mediapipe==0.10.21
 Pillow==10.1.0
 # CORS support
-# FastAPI includes CORS middleware via Starlette; no extra package needed.

 torch==2.1.0
 torchvision==0.16.0
 numpy==1.26.4
+joblib==1.3.2
 # Computer Vision & MediaPipe
 opencv-python-headless==4.10.0.84
 Pillow==10.1.0
 # CORS support
+python-cors==1.0.0

scaler.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7c9eeb95ab696a19b0a68a4c04f8b892f95dc527a3ac2284ea6fd2530f9c29c
+size 6807

trained_model.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7d97b7dcaea6c08b904d37264641b699af89b8e4347042668b9805371dd06a5
-size 489131

 version https://git-lfs.github.com/spec/v1
+oid sha256:91c78878580fd5637c8e3d9314ccdd97a150074234453d9f0d10e54d7651ac62
+size 487643