Olof Astrand commited on
Commit
47bec77
·
1 Parent(s): a29612e

Added web inference option

Browse files
web/Dockerfile ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
FROM python:3.11-slim

WORKDIR /app

# Runtime libraries needed by opencv-python (libgl*, libsm/libx*) and
# TensorFlow/OpenMP (libgomp1). The original list installed libglib2.0-0
# twice; deduplicated here. --no-install-recommends keeps the image small,
# and the apt cache is removed in the same layer so it never bloats the image.
RUN apt-get update && apt-get install -y --no-install-recommends \
    libglib2.0-0 \
    libsm6 \
    libxext6 \
    libxrender-dev \
    libgomp1 \
    libgl1-mesa-glx \
    && rm -rf /var/lib/apt/lists/*

# Copy requirements first so the pip layer is cached across code-only changes.
COPY requirements.txt .

# Install Python dependencies
RUN pip install --no-cache-dir -r requirements.txt

# Copy application files (server code + trained model weights)
COPY gaze_server.py .
COPY best_gaze_model.h5 .

# Expose port
EXPOSE 5000

# Run the server
CMD ["python", "gaze_server.py", "--host", "0.0.0.0", "--port", "5000"]
web/gaze_server.py ADDED
@@ -0,0 +1,293 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from flask import Flask, request, jsonify
2
+ from flask_cors import CORS
3
+ import cv2
4
+ import numpy as np
5
+ import tensorflow as tf
6
+ import base64
7
+ import time
8
+ from io import BytesIO
9
+ from PIL import Image
10
+ import logging
11
+
12
app = Flask(__name__)
CORS(app)  # Enable CORS so the browser UI (opened from file:// or another origin) can call this API

# Configure logging: INFO level, module-scoped logger per stdlib convention.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
18
+
19
+ class GazeInferenceServer:
20
+ def __init__(self, model_path):
21
+ """Initialize the gaze inference server."""
22
+ self.model_path = model_path
23
+ self.model = None
24
+ self.face_cascade = None
25
+ self.eye_cascade = None
26
+
27
+ # Model parameters
28
+ self.face_size = (224, 224)
29
+ self.eye_size = (80, 60)
30
+
31
+ # Load model and cascades
32
+ self._load_model()
33
+ self._load_cascades()
34
+
35
+ logger.info("Gaze inference server initialized")
36
+
37
+ def _load_model(self):
38
+ """Load the TensorFlow model."""
39
+ try:
40
+ # Define custom objects
41
+ custom_objects = {
42
+ 'euclidean_distance_metric': self._euclidean_distance_metric,
43
+ 'mse': tf.keras.losses.MeanSquaredError(),
44
+ }
45
+
46
+ # Try to load model
47
+ try:
48
+ self.model = tf.keras.models.load_model(
49
+ self.model_path,
50
+ custom_objects=custom_objects
51
+ )
52
+ except:
53
+ # Alternative loading method
54
+ self.model = tf.keras.models.load_model(
55
+ self.model_path,
56
+ compile=False
57
+ )
58
+ self.model.compile(
59
+ optimizer=tf.keras.optimizers.Adam(learning_rate=0.001),
60
+ loss='mse',
61
+ metrics=['mae', self._euclidean_distance_metric]
62
+ )
63
+
64
+ logger.info(f"Model loaded successfully from {self.model_path}")
65
+
66
+ except Exception as e:
67
+ logger.error(f"Failed to load model: {e}")
68
+ raise
69
+
70
+ @staticmethod
71
+ def _euclidean_distance_metric(y_true, y_pred):
72
+ """Custom metric for model."""
73
+ return tf.sqrt(tf.reduce_sum(tf.square(y_true - y_pred), axis=-1))
74
+
75
+ def _load_cascades(self):
76
+ """Load Haar cascades for face and eye detection."""
77
+ self.face_cascade = cv2.CascadeClassifier(
78
+ cv2.data.haarcascades + 'haarcascade_frontalface_default.xml'
79
+ )
80
+ self.eye_cascade = cv2.CascadeClassifier(
81
+ cv2.data.haarcascades + 'haarcascade_eye.xml'
82
+ )
83
+ logger.info("Haar cascades loaded")
84
+
85
+ def extract_eye_regions(self, face_image):
86
+ """Extract left and right eye regions from face image."""
87
+ gray = cv2.cvtColor(face_image, cv2.COLOR_BGR2GRAY)
88
+ eyes = self.eye_cascade.detectMultiScale(gray, 1.1, 4)
89
+
90
+ if len(eyes) >= 2:
91
+ # Sort by x-coordinate
92
+ eyes = sorted(eyes, key=lambda e: e[0])
93
+
94
+ # Extract eyes
95
+ lx, ly, lw, lh = eyes[0]
96
+ left_eye = face_image[ly:ly+lh, lx:lx+lw]
97
+ left_eye = cv2.resize(left_eye, self.eye_size)
98
+
99
+ rx, ry, rw, rh = eyes[1]
100
+ right_eye = face_image[ry:ry+rh, rx:rx+rw]
101
+ right_eye = cv2.resize(right_eye, self.eye_size)
102
+
103
+ return left_eye, right_eye, True
104
+ else:
105
+ # Fallback to approximate eye regions
106
+ h, w = face_image.shape[:2]
107
+ left_region = face_image[h//4:h//2, w//4:w//2]
108
+ right_region = face_image[h//4:h//2, w//2:3*w//4]
109
+
110
+ left_eye = cv2.resize(left_region, self.eye_size)
111
+ right_eye = cv2.resize(right_region, self.eye_size)
112
+
113
+ return left_eye, right_eye, False
114
+
115
+ def preprocess_inputs(self, face, left_eye, right_eye):
116
+ """Preprocess images for model input."""
117
+ # Normalize to [0, 1]
118
+ face = face.astype(np.float32) / 255.0
119
+ left_eye = left_eye.astype(np.float32) / 255.0
120
+ right_eye = right_eye.astype(np.float32) / 255.0
121
+
122
+ # Add batch dimension
123
+ face = np.expand_dims(face, axis=0)
124
+ left_eye = np.expand_dims(left_eye, axis=0)
125
+ right_eye = np.expand_dims(right_eye, axis=0)
126
+
127
+ return [face, left_eye, right_eye]
128
+
129
+ def predict_gaze(self, image_data, screen_width, screen_height):
130
+ """Predict gaze position from image."""
131
+ start_time = time.time()
132
+
133
+ try:
134
+ # Decode base64 image
135
+ image_bytes = base64.b64decode(image_data)
136
+ image = Image.open(BytesIO(image_bytes))
137
+ image_np = np.array(image)
138
+
139
+ # Convert RGB to BGR for OpenCV
140
+ if len(image_np.shape) == 3 and image_np.shape[2] == 3:
141
+ image_np = cv2.cvtColor(image_np, cv2.COLOR_RGB2BGR)
142
+
143
+ # Resize face image
144
+ face_resized = cv2.resize(image_np, self.face_size)
145
+
146
+ # Extract eye regions
147
+ left_eye, right_eye, eyes_found = self.extract_eye_regions(face_resized)
148
+
149
+ # Preprocess for model
150
+ inputs = self.preprocess_inputs(face_resized, left_eye, right_eye)
151
+
152
+ # Predict gaze
153
+ gaze_pred = self.model.predict(inputs, verbose=0)[0]
154
+
155
+ print(f"Raw gaze prediction: {gaze_pred}") # Debugging output
156
+
157
+ # Convert to screen coordinates
158
+ gaze_x = float(gaze_pred[0] * screen_width)
159
+ gaze_y = float(gaze_pred[1] * screen_height)
160
+
161
+ # Ensure within bounds
162
+ gaze_x = max(0, min(gaze_x, screen_width))
163
+ gaze_y = max(0, min(gaze_y, screen_height))
164
+
165
+ print(f"Predicted gaze position: ({gaze_x}, {gaze_y})") # Debugging output
166
+
167
+ inference_time = (time.time() - start_time) * 1000 # Convert to ms
168
+
169
+ return {
170
+ 'success': True,
171
+ 'gaze_position': {
172
+ 'x': gaze_x,
173
+ 'y': gaze_y
174
+ },
175
+ 'eyes_found': eyes_found,
176
+ 'inference_time': inference_time
177
+ }
178
+
179
+ except Exception as e:
180
+ logger.error(f"Prediction error: {e}")
181
+ return {
182
+ 'success': False,
183
+ 'error': str(e)
184
+ }
185
+
186
# Global server instance; stays None until create_app() loads the model.
server = None
188
+
189
@app.route('/health', methods=['GET'])
def health_check():
    """Liveness probe: reports service status and whether the model is loaded."""
    model_ready = server is not None and server.model is not None
    return jsonify({'status': 'healthy', 'model_loaded': model_ready})
196
+
197
@app.route('/predict', methods=['POST'])
def predict():
    """Predict a gaze position from a posted face image.

    Expects JSON: {"image": <base64>, "screen_width": int, "screen_height": int}
    (screen dimensions default to 1920x1080). Returns the dict produced by
    GazeInferenceServer.predict_gaze, or an error payload with an
    appropriate HTTP status (400 bad request, 503 not ready, 500 internal).
    """
    try:
        # Guard against requests arriving before create_app() has run;
        # previously this crashed with AttributeError -> opaque 500.
        if server is None:
            return jsonify({
                'success': False,
                'error': 'Inference server not initialized'
            }), 503

        # silent=True: malformed JSON yields None (handled below as a 400)
        # instead of Flask raising before our validation runs.
        data = request.get_json(silent=True)

        if not data or 'image' not in data:
            return jsonify({
                'success': False,
                'error': 'No image data provided'
            }), 400

        # Get parameters (screen size defaults match a 1080p display).
        image_data = data['image']
        screen_width = data.get('screen_width', 1920)
        screen_height = data.get('screen_height', 1080)

        # Predict gaze
        result = server.predict_gaze(image_data, screen_width, screen_height)

        return jsonify(result)

    except Exception as e:
        logger.error(f"Prediction endpoint error: {e}")
        return jsonify({
            'success': False,
            'error': str(e)
        }), 500
225
+
226
@app.route('/calibrate', methods=['POST'])
def calibrate():
    """Calibration endpoint (placeholder for future implementation)."""
    payload = {
        'success': True,
        'message': 'Calibration not yet implemented',
    }
    return jsonify(payload)
233
+
234
def create_app(model_path='best_gaze_model.h5'):
    """Create and configure the Flask app.

    Loads the gaze model into the module-level `server` singleton so the
    route handlers can reach it, then returns the (already-created) app.
    """
    global server
    server = GazeInferenceServer(model_path)
    return app
242
+
243
if __name__ == '__main__':
    import argparse
    import os

    # NOTE(review): TF_CPP_MIN_LOG_LEVEL only suppresses TensorFlow's C++
    # logging when set BEFORE tensorflow is imported; tensorflow is imported
    # at module top, so setting it here (moved as early as possible) is
    # largely ineffective — prefer exporting it in the environment
    # (e.g. the Dockerfile).
    os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'

    # Parse command-line arguments.
    parser = argparse.ArgumentParser(description='Gaze Inference Server')
    parser.add_argument(
        '--model',
        type=str,
        default='best_gaze_model.h5',
        help='Path to the trained model'
    )
    parser.add_argument(
        '--port',
        type=int,
        default=5000,
        help='Port to run the server on'
    )
    parser.add_argument(
        '--host',
        type=str,
        default='0.0.0.0',
        help='Host to run the server on'
    )
    args = parser.parse_args()

    # Fail fast with a clear message if the model file is missing.
    if not os.path.exists(args.model):
        print(f"Error: Model file '{args.model}' not found!")
        # raise SystemExit instead of the interactive-only `exit()` builtin.
        raise SystemExit(1)

    # Create app (loads the model; may take a while).
    app = create_app(args.model)

    # Startup banner.
    banner = '=' * 50
    print(f"\n{banner}")
    print("Starting Gaze Inference Server")
    print(f"Model: {args.model}")
    print(f"Server: http://{args.host}:{args.port}")
    print(f"{banner}\n")

    # threaded=True lets Flask's dev server overlap /predict requests.
    app.run(
        host=args.host,
        port=args.port,
        debug=False,
        threaded=True
    )
web/gaze_tracking.html ADDED
@@ -0,0 +1,666 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!DOCTYPE html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="UTF-8">
5
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
+ <title>Gaze Tracking Interface</title>
7
+ <style>
8
+ body {
9
+ margin: 0;
10
+ padding: 0;
11
+ font-family: Arial, sans-serif;
12
+ background-color: #1a1a1a;
13
+ color: white;
14
+ overflow: hidden;
15
+ }
16
+
17
+ #container {
18
+ display: flex;
19
+ height: 100vh;
20
+ }
21
+
22
+ #video-container {
23
+ position: relative;
24
+ width: 320px;
25
+ background-color: #2a2a2a;
26
+ padding: 20px;
27
+ }
28
+
29
+ #video {
30
+ width: 100%;
31
+ height: 240px;
32
+ background-color: #000;
33
+ border: 2px solid #444;
34
+ border-radius: 8px;
35
+ }
36
+
37
+ #canvas {
38
+ display: none;
39
+ }
40
+
41
+ #gaze-screen {
42
+ flex: 1;
43
+ position: relative;
44
+ background-color: #000;
45
+ cursor: none;
46
+ }
47
+
48
+ #gaze-cursor {
49
+ position: absolute;
50
+ width: 40px;
51
+ height: 40px;
52
+ pointer-events: none;
53
+ transition: transform 0.1s ease-out;
54
+ transform: translate(-50%, -50%);
55
+ }
56
+
57
+ .crosshair {
58
+ position: absolute;
59
+ background-color: #00ff00;
60
+ }
61
+
62
+ .crosshair-h {
63
+ width: 40px;
64
+ height: 3px;
65
+ top: 50%;
66
+ left: 0;
67
+ transform: translateY(-50%);
68
+ }
69
+
70
+ .crosshair-v {
71
+ width: 3px;
72
+ height: 40px;
73
+ left: 50%;
74
+ top: 0;
75
+ transform: translateX(-50%);
76
+ }
77
+
78
+ .center-dot {
79
+ position: absolute;
80
+ width: 10px;
81
+ height: 10px;
82
+ background-color: #ff0000;
83
+ border: 2px solid #fff;
84
+ border-radius: 50%;
85
+ top: 50%;
86
+ left: 50%;
87
+ transform: translate(-50%, -50%);
88
+ }
89
+
90
+ #trail {
91
+ position: absolute;
92
+ top: 0;
93
+ left: 0;
94
+ width: 100%;
95
+ height: 100%;
96
+ pointer-events: none;
97
+ }
98
+
99
+ .controls {
100
+ margin-top: 20px;
101
+ }
102
+
103
+ button {
104
+ background-color: #4CAF50;
105
+ border: none;
106
+ color: white;
107
+ padding: 10px 20px;
108
+ margin: 5px;
109
+ cursor: pointer;
110
+ border-radius: 4px;
111
+ font-size: 14px;
112
+ transition: background-color 0.3s;
113
+ }
114
+
115
+ button:hover {
116
+ background-color: #45a049;
117
+ }
118
+
119
+ button:disabled {
120
+ background-color: #666;
121
+ cursor: not-allowed;
122
+ }
123
+
124
+ #status {
125
+ margin-top: 20px;
126
+ padding: 10px;
127
+ background-color: #333;
128
+ border-radius: 4px;
129
+ font-size: 14px;
130
+ }
131
+
132
+ .status-connected {
133
+ color: #4CAF50;
134
+ }
135
+
136
+ .status-disconnected {
137
+ color: #f44336;
138
+ }
139
+
140
+ .info {
141
+ margin-top: 20px;
142
+ font-size: 12px;
143
+ color: #888;
144
+ }
145
+
146
+ #fps {
147
+ position: absolute;
148
+ top: 10px;
149
+ left: 10px;
150
+ background-color: rgba(0, 0, 0, 0.7);
151
+ padding: 5px 10px;
152
+ border-radius: 4px;
153
+ font-size: 14px;
154
+ }
155
+
156
+ #coordinates {
157
+ position: absolute;
158
+ top: 40px;
159
+ left: 10px;
160
+ background-color: rgba(0, 0, 0, 0.7);
161
+ padding: 5px 10px;
162
+ border-radius: 4px;
163
+ font-size: 14px;
164
+ }
165
+
166
+ .face-box {
167
+ position: absolute;
168
+ border: 2px solid #00ff00;
169
+ pointer-events: none;
170
+ }
171
+
172
+ .eye-box {
173
+ position: absolute;
174
+ border: 2px solid #ffff00;
175
+ pointer-events: none;
176
+ }
177
+
178
+ #smoothing-slider {
179
+ width: 100%;
180
+ margin-top: 10px;
181
+ }
182
+
183
+ .slider-container {
184
+ margin-top: 20px;
185
+ }
186
+
187
+ .slider-label {
188
+ font-size: 12px;
189
+ color: #888;
190
+ margin-bottom: 5px;
191
+ }
192
+ </style>
193
+ </head>
194
+ <body>
195
+ <div id="container">
196
+ <div id="video-container">
197
+ <video id="video" autoplay></video>
198
+ <canvas id="canvas"></canvas>
199
+
200
+ <div class="controls">
201
+ <button id="startBtn">Start Tracking</button>
202
+ <button id="stopBtn" disabled>Stop Tracking</button>
203
+ <button id="calibrateBtn">Calibrate</button>
204
+ </div>
205
+
206
+ <div id="status" class="status-disconnected">
207
+ Status: Not connected
208
+ </div>
209
+
210
+ <div class="slider-container">
211
+ <div class="slider-label">Smoothing: <span id="smoothing-value">5</span></div>
212
+ <input type="range" id="smoothing-slider" min="1" max="20" value="5">
213
+ </div>
214
+
215
+ <div class="info">
216
+ <p>Face Detection: <span id="face-status">Not detected</span></p>
217
+ <p>Model Inference: <span id="inference-time">0</span> ms</p>
218
+ <p>Server: <span id="server-url">http://localhost:5000</span></p>
219
+ </div>
220
+ </div>
221
+
222
+ <div id="gaze-screen">
223
+ <canvas id="trail"></canvas>
224
+ <div id="gaze-cursor">
225
+ <div class="crosshair crosshair-h"></div>
226
+ <div class="crosshair crosshair-v"></div>
227
+ <div class="center-dot"></div>
228
+ </div>
229
+ <div id="fps">FPS: 0</div>
230
+ <div id="coordinates">X: 0, Y: 0</div>
231
+ </div>
232
+ </div>
233
+
234
+ <script src="https://cdn.jsdelivr.net/npm/@tensorflow/tfjs"></script>
235
+ <script src="https://cdn.jsdelivr.net/npm/@tensorflow-models/blazeface"></script>
236
+ <script>
237
class GazeTracker {
    /**
     * Browser-side controller: captures webcam frames, detects the face
     * locally with BlazeFace, posts the face crop to the Flask server for
     * gaze inference, and renders the smoothed gaze as a crosshair + trail.
     */
    constructor() {
        this.video = document.getElementById('video');
        this.canvas = document.getElementById('canvas');
        this.ctx = this.canvas.getContext('2d');
        this.trailCanvas = document.getElementById('trail');
        this.trailCtx = this.trailCanvas.getContext('2d');

        this.gazeCursor = document.getElementById('gaze-cursor');
        this.startBtn = document.getElementById('startBtn');
        this.stopBtn = document.getElementById('stopBtn');
        this.calibrateBtn = document.getElementById('calibrateBtn');
        this.smoothingSlider = document.getElementById('smoothing-slider');

        this.isTracking = false;
        this.faceModel = null;
        this.serverUrl = 'http://localhost:5000';

        // Gaze position and moving-average smoothing state.
        this.currentGaze = { x: window.innerWidth / 2, y: window.innerHeight / 2 };
        this.gazeHistory = [];
        this.smoothingWindow = 5;

        // Kalman filter created lazily so #gaze-screen has its final size.
        this.kalmanFilter = null;

        // Trail rendering state.
        this.trailPoints = [];
        this.maxTrailLength = 30;

        // FPS bookkeeping.
        this.lastTime = performance.now();
        this.frameCount = 0;
        this.fps = 0;

        this.setupEventListeners();
        this.resizeTrailCanvas();
        window.addEventListener('resize', () => this.resizeTrailCanvas());

        // Initialize Kalman filter after a short delay to ensure layout settled.
        setTimeout(() => {
            this.kalmanFilter = this.initKalmanFilter();
        }, 100);
    }

    /** Build a fresh per-axis 1-D Kalman filter, centred on the gaze screen. */
    initKalmanFilter() {
        const gazeScreen = document.getElementById('gaze-screen');
        const initialX = gazeScreen ? gazeScreen.offsetWidth / 2 : window.innerWidth / 2;
        const initialY = gazeScreen ? gazeScreen.offsetHeight / 2 : window.innerHeight / 2;

        return {
            x: { estimate: initialX, uncertainty: 1000 },
            y: { estimate: initialY, uncertainty: 1000 },
            processNoise: 1,
            measurementNoise: 25
        };
    }

    /**
     * One predict/update step of the per-axis scalar Kalman filter.
     * Returns the updated estimate for the given axis ('x' or 'y').
     */
    kalmanUpdate(axis, measurement) {
        const filter = this.kalmanFilter[axis];

        // Reject invalid measurements, keeping the last estimate.
        if (isNaN(measurement) || !isFinite(measurement)) {
            console.warn(`Invalid measurement for ${axis}: ${measurement}`);
            return filter.estimate;
        }

        // BUG FIX: processNoise/measurementNoise live on this.kalmanFilter,
        // not on the per-axis entry. The original read filter.processNoise
        // (undefined), so uncertainty became NaN every update and the filter
        // silently degenerated into a pass-through via the NaN reset below.
        filter.uncertainty += this.kalmanFilter.processNoise;

        // Update step.
        const gain = filter.uncertainty / (filter.uncertainty + this.kalmanFilter.measurementNoise);
        filter.estimate = filter.estimate + gain * (measurement - filter.estimate);
        filter.uncertainty = (1 - gain) * filter.uncertainty;

        // Defensive NaN reset (kept as a safety net).
        if (isNaN(filter.estimate) || !isFinite(filter.estimate)) {
            console.warn(`Kalman filter produced NaN for ${axis}, resetting...`);
            filter.estimate = measurement;
            filter.uncertainty = 1000;
        }

        return filter.estimate;
    }

    /** Match the trail canvas pixel size to the gaze screen element. */
    resizeTrailCanvas() {
        const gazeScreen = document.getElementById('gaze-screen');
        this.trailCanvas.width = gazeScreen.offsetWidth;
        this.trailCanvas.height = gazeScreen.offsetHeight;
    }

    /** Wire up buttons, debug hotkeys ('t' test jump, 'k' Kalman toggle), slider. */
    setupEventListeners() {
        this.startBtn.addEventListener('click', () => this.start());
        this.stopBtn.addEventListener('click', () => this.stop());
        this.calibrateBtn.addEventListener('click', () => this.calibrate());

        document.addEventListener('keypress', (e) => {
            if (e.key === 't' || e.key === 'T') {
                // 't': jump the cursor to a random point to test rendering.
                console.log('Testing cursor movement...');
                const testX = Math.random() * window.innerWidth;
                const testY = Math.random() * window.innerHeight;
                this.updateGazePosition({ x: testX, y: testY });
            } else if (e.key === 'k' || e.key === 'K') {
                // 'k': toggle Kalman filtering on/off for comparison.
                if (this.kalmanFilter) {
                    this.kalmanFilter = null;
                    console.log('Kalman filter disabled');
                    alert('Kalman filter disabled - using simple averaging only');
                } else {
                    this.kalmanFilter = this.initKalmanFilter();
                    console.log('Kalman filter enabled');
                    alert('Kalman filter enabled');
                }
            }
        });

        this.smoothingSlider.addEventListener('input', (e) => {
            this.smoothingWindow = parseInt(e.target.value);
            document.getElementById('smoothing-value').textContent = this.smoothingWindow;
            this.gazeHistory = [];  // reset so stale samples don't lag the new window
        });
    }

    /** Acquire the camera, load BlazeFace, verify the server, start the loop. */
    async start() {
        try {
            const stream = await navigator.mediaDevices.getUserMedia({
                video: { width: 640, height: 480 }
            });
            this.video.srcObject = stream;

            // Wait for metadata unless it already arrived (readyState >= HAVE_METADATA);
            // the original always awaited and could hang if the event had fired
            // before the handler was attached.
            if (this.video.readyState < 1) {
                await new Promise(resolve => {
                    this.video.onloadedmetadata = resolve;
                });
            }

            // Size the capture canvas to the actual video resolution.
            this.canvas.width = this.video.videoWidth;
            this.canvas.height = this.video.videoHeight;

            // Load the face detection model once and reuse it across restarts.
            if (!this.faceModel) {
                this.updateStatus('Loading face detection model...', false);
                this.faceModel = await blazeface.load();
            }

            // Check server connection before declaring tracking active.
            await this.checkServerConnection();

            this.isTracking = true;
            this.startBtn.disabled = true;
            this.stopBtn.disabled = false;

            this.updateStatus('Tracking active', true);
            this.trackGaze();

        } catch (error) {
            console.error('Error starting tracking:', error);
            this.updateStatus('Error: ' + error.message, false);
        }
    }

    /** Stop the loop and release the camera. */
    stop() {
        this.isTracking = false;

        if (this.video.srcObject) {
            this.video.srcObject.getTracks().forEach(track => track.stop());
            // Detach the dead stream so the element doesn't keep referencing it.
            this.video.srcObject = null;
        }

        this.startBtn.disabled = false;
        this.stopBtn.disabled = true;
        this.updateStatus('Tracking stopped', false);
    }

    /** Ping /health; throws a user-friendly error if the server is unreachable. */
    async checkServerConnection() {
        try {
            const response = await fetch(`${this.serverUrl}/health`);
            if (!response.ok) throw new Error('Server not responding');
            return true;
        } catch (error) {
            throw new Error('Cannot connect to inference server. Make sure the Python server is running.');
        }
    }

    /** Main loop: detect face, crop, send to server, update cursor; reschedules itself. */
    async trackGaze() {
        if (!this.isTracking) return;

        const startTime = performance.now();

        // Capture the current video frame onto the hidden canvas.
        this.ctx.drawImage(this.video, 0, 0);

        // Detect faces (second arg false = don't flip horizontally).
        const predictions = await this.faceModel.estimateFaces(
            this.canvas,
            false
        );

        if (predictions.length > 0) {
            const face = predictions[0];

            document.getElementById('face-status').textContent = 'Detected';

            // Face bounding box from BlazeFace.
            const [x1, y1] = face.topLeft;
            const [x2, y2] = face.bottomRight;
            const width = x2 - x1;
            const height = y2 - y1;

            // Pad the crop by 20% of the larger side, clamped to the frame.
            const padding = Math.max(width, height) * 0.2;
            const faceX = Math.max(0, x1 - padding);
            const faceY = Math.max(0, y1 - padding);
            const faceWidth = Math.min(this.canvas.width - faceX, width + 2 * padding);
            const faceHeight = Math.min(this.canvas.height - faceY, height + 2 * padding);

            const faceImageData = this.ctx.getImageData(faceX, faceY, faceWidth, faceHeight);

            // Server does the actual gaze inference on the face crop.
            const gazePosition = await this.sendToServer(faceImageData, {
                x: faceX,
                y: faceY,
                width: faceWidth,
                height: faceHeight
            });

            if (gazePosition) {
                this.updateGazePosition(gazePosition);
            }

        } else {
            document.getElementById('face-status').textContent = 'Not detected';
        }

        this.updatePerformanceMetrics(startTime);

        // Continue tracking on the next animation frame.
        requestAnimationFrame(() => this.trackGaze());
    }

    /**
     * POST the face crop (as base64 JPEG) + screen size to /predict.
     * Returns {x, y} on success, or null on any failure.
     */
    async sendToServer(imageData, faceRect) {
        try {
            // Convert ImageData to base64 via an off-screen canvas.
            const tempCanvas = document.createElement('canvas');
            tempCanvas.width = imageData.width;
            tempCanvas.height = imageData.height;
            const tempCtx = tempCanvas.getContext('2d');
            tempCtx.putImageData(imageData, 0, 0);

            // Strip the "data:image/jpeg;base64," prefix; server expects raw base64.
            const base64Image = tempCanvas.toDataURL('image/jpeg', 0.8).split(',')[1];

            // Use the gaze screen element's size, not the whole window.
            const gazeScreen = document.getElementById('gaze-screen');
            const screenWidth = gazeScreen.offsetWidth;
            const screenHeight = gazeScreen.offsetHeight;

            console.log('Sending screen dimensions:', { screenWidth, screenHeight });

            const response = await fetch(`${this.serverUrl}/predict`, {
                method: 'POST',
                headers: {
                    'Content-Type': 'application/json',
                },
                body: JSON.stringify({
                    image: base64Image,
                    face_rect: faceRect,
                    screen_width: screenWidth,
                    screen_height: screenHeight
                })
            });

            if (!response.ok) throw new Error('Server error');

            const data = await response.json();

            console.log('Received gaze position:', data.gaze_position);

            document.getElementById('inference-time').textContent =
                data.inference_time ? data.inference_time.toFixed(1) : '0';

            return data.gaze_position;

        } catch (error) {
            console.error('Error sending to server:', error);
            return null;
        }
    }

    /** Smooth (moving average + optional Kalman), clamp, and render a new gaze sample. */
    updateGazePosition(position) {
        if (!position || isNaN(position.x) || isNaN(position.y)) {
            console.error('Invalid position received:', position);
            return;
        }

        // Maintain a sliding window of recent samples.
        this.gazeHistory.push(position);
        if (this.gazeHistory.length > this.smoothingWindow) {
            this.gazeHistory.shift();
        }

        let smoothedX, smoothedY;

        if (this.gazeHistory.length > 0) {
            // Moving average over the window.
            const avgX = this.gazeHistory.reduce((sum, p) => sum + p.x, 0) / this.gazeHistory.length;
            const avgY = this.gazeHistory.reduce((sum, p) => sum + p.y, 0) / this.gazeHistory.length;

            // Kalman filter on top of the average, when enabled.
            if (this.kalmanFilter) {
                smoothedX = this.kalmanUpdate('x', avgX);
                smoothedY = this.kalmanUpdate('y', avgY);

                // Fallback if Kalman still produces NaN.
                if (isNaN(smoothedX) || isNaN(smoothedY)) {
                    console.warn('Kalman filter failed, using average');
                    smoothedX = avgX;
                    smoothedY = avgY;
                }
            } else {
                smoothedX = avgX;
                smoothedY = avgY;
            }
        } else {
            smoothedX = position.x;
            smoothedY = position.y;
        }

        // Clamp to the gaze screen bounds.
        const gazeScreen = document.getElementById('gaze-screen');
        smoothedX = Math.max(0, Math.min(smoothedX, gazeScreen.offsetWidth));
        smoothedY = Math.max(0, Math.min(smoothedY, gazeScreen.offsetHeight));

        console.log('Updating gaze position:', {
            raw: position,
            smoothed: { x: smoothedX, y: smoothedY },
            screenBounds: {
                width: gazeScreen.offsetWidth,
                height: gazeScreen.offsetHeight
            }
        });

        // Move the crosshair cursor.
        this.currentGaze = { x: smoothedX, y: smoothedY };
        this.gazeCursor.style.left = `${smoothedX}px`;
        this.gazeCursor.style.top = `${smoothedY}px`;

        document.getElementById('coordinates').textContent =
            `X: ${Math.round(smoothedX)}, Y: ${Math.round(smoothedY)}`;

        this.updateTrail(smoothedX, smoothedY);
    }

    /** Append a trail point and redraw the fading green trail. */
    updateTrail(x, y) {
        this.trailPoints.push({ x, y, time: Date.now() });

        if (this.trailPoints.length > this.maxTrailLength) {
            this.trailPoints.shift();
        }

        this.trailCtx.clearRect(0, 0, this.trailCanvas.width, this.trailCanvas.height);

        // Each segment is stroked as its own path so it can carry its own
        // alpha (fading toward the tail). The original also opened an outer
        // path with a moveTo that was never stroked — removed as dead code.
        if (this.trailPoints.length > 1) {
            for (let i = 1; i < this.trailPoints.length; i++) {
                const point = this.trailPoints[i];
                const prevPoint = this.trailPoints[i - 1];

                const alpha = i / this.trailPoints.length;
                this.trailCtx.strokeStyle = `rgba(0, 255, 0, ${alpha * 0.5})`;
                this.trailCtx.lineWidth = 2;

                this.trailCtx.beginPath();
                this.trailCtx.moveTo(prevPoint.x, prevPoint.y);
                this.trailCtx.lineTo(point.x, point.y);
                this.trailCtx.stroke();
            }
        }
    }

    /** Refresh the FPS counter once per second. (Unused frameTime local removed.) */
    updatePerformanceMetrics(startTime) {
        const endTime = performance.now();

        this.frameCount++;
        if (endTime - this.lastTime >= 1000) {
            this.fps = this.frameCount;
            this.frameCount = 0;
            this.lastTime = endTime;

            document.getElementById('fps').textContent = `FPS: ${this.fps}`;
        }
    }

    /** Update the status line text and connected/disconnected styling. */
    updateStatus(message, isConnected) {
        const statusEl = document.getElementById('status');
        statusEl.textContent = `Status: ${message}`;
        statusEl.className = isConnected ? 'status-connected' : 'status-disconnected';
    }

    /** Calibration placeholder — mirrors the server's /calibrate stub. */
    async calibrate() {
        alert('Calibration feature coming soon!');
    }
}
658
+
659
// Construct the tracker once the DOM is ready; kept in a global for console debugging.
let tracker;
window.addEventListener('DOMContentLoaded', function () {
    tracker = new GazeTracker();
});
664
+ </script>
665
+ </body>
666
+ </html>
web/readme.md ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Gaze Tracking Web Interface
2
+
3
+ This system provides a web-based interface for real-time gaze tracking using your trained TensorFlow model. It uses the browser's webcam for face detection and communicates with a Python Flask server for gaze inference.
4
+
5
+ ## Components
6
+
7
+ 1. **HTML Interface** (`gaze_tracking.html`): Web-based UI with webcam capture and gaze visualization
8
+ 2. **Flask Server** (`gaze_server.py`): Python backend that runs your TensorFlow model
9
+ 3. **Face Detection**: Uses TensorFlow.js BlazeFace in the browser + OpenCV Haar cascades on the server
10
+
11
+ ## Features
12
+
13
+ - Real-time face detection in the browser
14
+ - Smooth gaze tracking with Kalman filtering
15
+ - Visual gaze trail
16
+ - FPS and performance monitoring
17
+ - Adjustable smoothing parameters
18
+ - Full-screen gaze visualization
19
+
20
+ ## Setup Instructions
21
+
22
+ ### 1. Install Python Dependencies
23
+
24
+ ```bash
25
+ pip install -r requirements.txt
26
+ ```
27
+
28
+ ### 2. Start the Flask Server
29
+
30
+ ```bash
31
+ python gaze_server.py --model best_gaze_model.h5 --port 5000
32
+ ```
33
+
34
+ Options:
35
+ - `--model`: Path to your trained model (default: `best_gaze_model.h5`)
36
+ - `--port`: Server port (default: 5000)
37
+ - `--host`: Server host (default: 0.0.0.0)
38
+
39
+ ### 3. Open the HTML Interface
40
+
41
+ 1. Open `gaze_tracking.html` in a modern web browser (Chrome/Firefox/Edge)
42
+ 2. Allow camera access when prompted
43
+ 3. Click "Start Tracking" to begin
44
+
45
+ ## How It Works
46
+
47
+ 1. **Face Detection**: The browser uses BlazeFace (TensorFlow.js) to detect faces in real-time
48
+ 2. **Face Extraction**: When a face is detected, the face region is extracted and sent to the server
49
+ 3. **Eye Detection**: The server uses OpenCV to detect eye regions within the face
50
+ 4. **Model Inference**: Your trained model processes the face and eye images to predict gaze coordinates
51
+ 5. **Smoothing**: The browser applies moving average and Kalman filtering for smooth cursor movement
52
+ 6. **Visualization**: The gaze position is displayed as a crosshair with a trail effect
53
+
54
+ ## Architecture
55
+
56
+ ```
57
+ Browser (Client) Python Server
58
+ ┌─────────────────┐ ┌──────────────────┐
59
+ │ │ │ │
60
+ │ Webcam Feed │ │ TensorFlow │
61
+ │ ↓ │ │ Gaze Model │
62
+ │ Face Detection │ HTTP POST │ ↑ │
63
+ │ (BlazeFace) │ →→→→→→→→→→→→ │ Face & Eyes │
64
+ │ ↓ │ (Base64 img) │ Processing │
65
+ │ Send Face ROI │ │ ↓ │
66
+ │ ↓ │ ←←←←←←←←←←←← │ Gaze Position │
67
+ │ Smoothing & │ (JSON resp) │ Prediction │
68
+ │ Visualization │ │ │
69
+ │ │ │ │
70
+ └─────────────────┘ └──────────────────┘
71
+ ```
72
+
73
+ ## Controls
74
+
75
+ - **Start/Stop Tracking**: Control gaze tracking
76
+ - **Smoothing Slider**: Adjust smoothing window (1-20 frames)
77
+ - **Calibrate**: (Coming soon) Calibration for improved accuracy
78
+
79
+ ## Performance Tips
80
+
81
+ 1. **Lighting**: Ensure good, even lighting on your face
82
+ 2. **Position**: Sit at a comfortable distance from the camera
83
+ 3. **Stability**: Keep your head relatively stable for best results
84
+ 4. **Browser**: Use Chrome or Firefox for best performance
85
+
86
+ ## Troubleshooting
87
+
88
+ ### Server Won't Start
89
+ - Check if the model file exists at the specified path
90
+ - Ensure all Python dependencies are installed
91
+ - Check if port 5000 is available
92
+
93
+ ### No Face Detection
94
+ - Ensure adequate lighting
95
+ - Check camera permissions in browser
96
+ - Try adjusting your distance from the camera
97
+
98
+ ### Poor Tracking Accuracy
99
+ - The model may need calibration for your specific setup
100
+ - Try adjusting the smoothing parameter
101
+ - Ensure eyes are clearly visible to the camera
102
+
103
+ ## API Endpoints
104
+
105
+ - `GET /health`: Health check
106
+ - `POST /predict`: Gaze prediction endpoint
107
+ - Request: `{ image: base64, screen_width: int, screen_height: int }`
108
+ - Response: `{ gaze_position: {x, y}, inference_time: float }`
109
+
110
+ ## Future Enhancements
111
+
112
+ - User-specific calibration system
113
+ - Multi-face tracking support
114
+ - Gaze heatmap visualization
115
+ - Recording and playback features
116
+ - WebSocket support for lower latency
117
+
118
+ ## Security Notes
119
+
120
+ - The server runs locally by default
121
+ - For remote access, consider adding authentication
122
+ - Use HTTPS in production environments
web/requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ # Minimal requirements, compatible with Python 3.11+ (the Dockerfile uses python:3.11-slim; also works on 3.12)
2
+ flask>=3.0.0
3
+ flask-cors>=4.0.0
4
+ tensorflow>=2.15.0
5
+ opencv-python>=4.9.0.80
6
+ numpy>=1.26.2
7
+ pillow>=10.1.0