Spaces:

msmaje
/

multimodels_voice_security_system

Sleeping

App Files Community

msmaje committed on Jun 8, 2025

Commit

2ac8d9b

verified ·

1 Parent(s): 047fc3c

Update app.py

Browse files

Files changed (1) hide show

app.py +213 -135

app.py CHANGED Viewed

@@ -140,11 +140,45 @@ class VoiceSecuritySystem:
         self.preprocessor = AudioPreprocessor()
         self.models = {}
         self.label_encoder = LabelEncoder()
         self.model_info = {
-            "resnet18": {"name": "ResNet-18", "description": "Fast and efficient for real-time applications"},
-            "resnet50": {"name": "ResNet-50", "description": "Balanced performance and accuracy"},
-            "efficientnet_b0": {"name": "EfficientNet-B0", "description": "Optimized for mobile deployment"},
-            "mobilenet_v2": {"name": "MobileNet-V2", "description": "Lightweight with good accuracy"}
         }
         self.load_models()
@@ -152,7 +186,7 @@ class VoiceSecuritySystem:
         """Load all pre-trained models"""
         # This would load your actual trained models
         # For demo purposes, we'll create placeholder models
-        num_classes = 10  # Adjust based on your actual number of users
         # Initialize label encoder with dummy classes
         dummy_classes = [f"user_{i+1}" for i in range(num_classes)]
@@ -172,9 +206,9 @@ class VoiceSecuritySystem:
                 # model.load_state_dict(torch.load(f"models/{model_name}.pth", map_location=self.device))
                 model.eval()
                 self.models[model_name] = model
-                print(f"Loaded {model_name} successfully")
             except Exception as e:
-                print(f"Error loading {model_name}: {e}")
     def predict_voice(self, audio_file, model_name, confidence_threshold):
         """Predict voice access using selected model"""
@@ -205,7 +239,7 @@ class VoiceSecuritySystem:
                 # Create visualization
                 viz_plot = self.create_prediction_visualization(probabilities.cpu().numpy()[0],
-                                                             predicted_class, confidence_score)
                 # Determine access decision
                 if confidence_score >= confidence_threshold:
@@ -217,12 +251,24 @@ class VoiceSecuritySystem:
                     message = f"Access denied - Low confidence"
                     security_status = f"⚠️ UNAUTHORIZED ACCESS ATTEMPT"
                 detailed_info = f"""
-                **Model Used:** {self.model_info[model_name]['name']}
-                **Predicted User:** {predicted_class}
-                **Confidence Score:** {confidence_score:.3f}
-                **Threshold:** {confidence_threshold}
-                **Decision:** {'GRANT' if confidence_score >= confidence_threshold else 'DENY'}
                 """
                 return status, message, confidence_score, viz_plot, detailed_info
@@ -232,12 +278,12 @@ class VoiceSecuritySystem:
     def create_prediction_visualization(self, probabilities, predicted_class, confidence):
         """Create visualization of prediction results"""
-        fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))
-        # Color scheme without blue
         colors = ['#FF6B6B', '#4ECDC4', '#45B7D1', '#96CEB4', '#F7DC6F', '#BB8FCE', '#85C1E9', '#F8C471', '#82E0AA', '#F1948A']
-        # Plot 1: Top 5 predictions
         top_5_indices = np.argsort(probabilities)[-5:][::-1]
         top_5_probs = probabilities[top_5_indices]
         top_5_labels = [self.label_encoder.inverse_transform([i])[0] for i in top_5_indices]
@@ -245,21 +291,22 @@ class VoiceSecuritySystem:
         bars = ax1.barh(range(len(top_5_labels)), top_5_probs, color=colors[:len(top_5_labels)])
         ax1.set_yticks(range(len(top_5_labels)))
         ax1.set_yticklabels(top_5_labels)
-        ax1.set_xlabel('Confidence Score')
-        ax1.set_title('Top 5 Predictions')
         ax1.set_xlim(0, 1)
-        # Highlight the top prediction
-        bars[0].set_color('#FFD93D')
         bars[0].set_edgecolor('#FF8C00')
-        bars[0].set_linewidth(2)
-        # Add value labels
         for i, (bar, prob) in enumerate(zip(bars, top_5_probs)):
-            ax1.text(prob + 0.01, bar.get_y() + bar.get_height()/2,
-                    f'{prob:.3f}', va='center', fontweight='bold')
-        # Plot 2: Confidence gauge
         theta = np.linspace(0, np.pi, 100)
         r = np.ones_like(theta)
@@ -268,53 +315,57 @@ class VoiceSecuritySystem:
         ax2.set_theta_direction(1)
         ax2.set_ylim(0, 1)
-        # Color segments based on confidence levels
         if confidence < 0.3:
-            color = '#FF6B6B'  # Red
-            status_text = 'LOW'
         elif confidence < 0.7:
-            color = '#F7DC6F'  # Yellow
-            status_text = 'MEDIUM'
         else:
-            color = '#58D68D'  # Green
-            status_text = 'HIGH'
-        # Draw gauge
-        ax2.fill_between(theta, 0, r, alpha=0.3, color='lightgray')
         confidence_theta = theta[int(confidence * len(theta))]
-        ax2.plot([confidence_theta, confidence_theta], [0, 1], color=color, linewidth=8)
         ax2.fill_between(theta[:int(confidence * len(theta))], 0, r[:int(confidence * len(theta))],
-                        alpha=0.7, color=color)
-        ax2.set_title(f'Confidence: {confidence:.3f}\nLevel: {status_text}', pad=20)
         ax2.set_ylim(0, 1)
         ax2.set_yticklabels([])
-        ax2.set_xticklabels(['Low', '', '', 'Medium', '', '', 'High'])
         plt.tight_layout()
         return fig
     def create_empty_plot(self):
         """Create empty plot for error cases"""
-        fig, ax = plt.subplots(figsize=(8, 6))
-        ax.text(0.5, 0.5, 'No Data Available', ha='center', va='center',
-                fontsize=20, color='gray')
         ax.set_xlim(0, 1)
         ax.set_ylim(0, 1)
         ax.axis('off')
         return fig
     def get_model_comparison(self):
-        """Return model comparison information"""
         comparison_data = []
         for model_key, info in self.model_info.items():
-            # In actual deployment, you would load real metrics
             comparison_data.append([
                 info['name'],
-                info['description'],
-                f"{np.random.uniform(0.85, 0.95):.3f}",  # Mock accuracy
-                f"{np.random.uniform(0.01, 0.05):.3f}",  # Mock FAR
-                f"{np.random.uniform(0.02, 0.08):.3f}"   # Mock FRR
             ])
         return comparison_data
@@ -329,200 +380,226 @@ def get_model_info(model_name):
     """Get information about selected model"""
     if model_name in voice_system.model_info:
         info = voice_system.model_info[model_name]
-        return f"**{info['name']}**\n\n{info['description']}"
     return "Model information not available"
-# Custom CSS for styling (no blue colors)
 custom_css = """
 .gradio-container {
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
 }
 .gr-button-primary {
     background: linear-gradient(45deg, #FF6B6B, #FF8E53) !important;
     border: none !important;
 }
 .gr-button-secondary {
     background: linear-gradient(45deg, #4ECDC4, #44A08D) !important;
     border: none !important;
 }
 .gr-panel {
     background: rgba(255, 255, 255, 0.95) !important;
-    backdrop-filter: blur(10px) !important;
-    border-radius: 15px !important;
-    border: 1px solid rgba(255, 255, 255, 0.2) !important;
 }
 .gr-form {
     background: transparent !important;
 }
 .gr-box {
-    border-radius: 10px !important;
     border: 1px solid #E0E0E0 !important;
 }
 h1, h2, h3 {
     color: #2C3E50 !important;
-    text-shadow: 1px 1px 2px rgba(0,0,0,0.1) !important;
 }
-.security-status {
-    padding: 10px;
-    border-radius: 8px;
-    margin: 10px 0;
     font-weight: bold;
-}
-.access-granted {
-    background-color: #D5F4E6;
-    color: #27AE60;
-    border-left: 4px solid #27AE60;
-}
-.access-denied {
-    background-color: #FADBD8;
-    color: #E74C3C;
-    border-left: 4px solid #E74C3C;
 }
 """
-# Create Gradio interface
-with gr.Blocks(css=custom_css, title="🔊 Voice Recognition Security System") as app:
     gr.HTML("""
-    <div style="text-align: center; padding: 20px; background: linear-gradient(45deg, #667eea, #764ba2); color: white; border-radius: 15px; margin-bottom: 20px;">
-        <h1 style="margin: 0; font-size: 2.5em; text-shadow: 2px 2px 4px rgba(0,0,0,0.3);">🔊 Voice Recognition Security System</h1>
-        <p style="margin: 10px 0 0 0; font-size: 1.2em; opacity: 0.9;">Advanced AI-powered voice authentication with multiple deep learning models</p>
     </div>
     """)
     with gr.Row():
         with gr.Column(scale=1):
-            gr.HTML("<h2>🎯 Authentication Panel</h2>")
-            # Audio input
             audio_input = gr.Audio(
-                label="🎤 Upload Voice Sample",
                 type="filepath",
                 elem_id="audio_input"
             )
-            # Model selection
             model_selector = gr.Dropdown(
                 choices=[
-                    ("ResNet-18 (Fast & Efficient)", "resnet18"),
-                    ("ResNet-50 (Balanced Performance)", "resnet50"),
-                    ("EfficientNet-B0 (Mobile Optimized)", "efficientnet_b0"),
-                    ("MobileNet-V2 (Lightweight)", "mobilenet_v2")
                 ],
                 value="resnet18",
-                label="🤖 Select AI Model",
-                info="Choose the deep learning model for voice recognition"
             )
-            # Confidence threshold
             confidence_slider = gr.Slider(
                 minimum=0.1,
                 maximum=1.0,
-                value=0.7,
                 step=0.05,
-                label="🎚️ Security Threshold",
-                info="Higher values = More secure but stricter"
             )
-            # Process button
             process_btn = gr.Button(
-                "🔍 Authenticate Voice",
                 variant="primary",
                 size="lg"
             )
-            # Model info display
             model_info_display = gr.Markdown(
                 get_model_info("resnet18"),
-                label="📋 Model Information"
             )
         with gr.Column(scale=2):
-            gr.HTML("<h2>📊 Authentication Results</h2>")
             with gr.Row():
                 with gr.Column():
-                    # Status display
                     status_output = gr.Textbox(
-                        label="🚦 Access Status",
                         interactive=False,
                         elem_id="status_output"
                     )
-                    # Message display
                     message_output = gr.Textbox(
-                        label="💬 System Message",
                         interactive=False
                     )
-                    # Confidence display
                     confidence_output = gr.Number(
-                        label="📈 Confidence Score",
                         interactive=False,
                         precision=3
                     )
                 with gr.Column():
-                    # Detailed information
                     detailed_info = gr.Markdown(
-                        label="🔍 Detailed Analysis"
                     )
-            # Visualization plot
             plot_output = gr.Plot(
-                label="📈 Prediction Visualization",
                 elem_id="plot_output"
             )
-    # Model comparison section
     with gr.Row():
-        gr.HTML("<h2>⚖️ Model Comparison</h2>")
     with gr.Row():
         comparison_table = gr.Dataframe(
-            headers=["Model", "Description", "Accuracy", "FAR (False Accept)", "FRR (False Reject)"],
             value=voice_system.get_model_comparison(),
-            label="📊 Performance Metrics",
             interactive=False
         )
-    # Information section
     with gr.Row():
         with gr.Column():
             gr.HTML("""
-            <div style="background: linear-gradient(45deg, #FFF3E0, #FFE0B2); padding: 20px; border-radius: 10px; border-left: 4px solid #FF9800;">
-                <h3>🛡️ Security Features</h3>
-                <ul>
-                    <li><strong>Multi-Model Architecture:</strong> Choose from 4 state-of-the-art models</li>
-                    <li><strong>Confidence-Based Authentication:</strong> Adjustable security thresholds</li>
-                    <li><strong>Real-Time Processing:</strong> Fast voice recognition and analysis</li>
-                    <li><strong>Detailed Analytics:</strong> Comprehensive prediction visualization</li>
                 </ul>
             </div>
             """)
         with gr.Column():
             gr.HTML("""
-            <div style="background: linear-gradient(45deg, #E8F5E8, #C8E6C9); padding: 20px; border-radius: 10px; border-left: 4px solid #4CAF50;">
-                <h3>📖 How to Use</h3>
-                <ol>
-                    <li><strong>Upload Audio:</strong> Record or upload a voice sample (3 seconds recommended)</li>
-                    <li><strong>Select Model:</strong> Choose the AI model based on your needs</li>
-                    <li><strong>Set Threshold:</strong> Adjust security level (0.7 recommended for balanced security)</li>
-                    <li><strong>Authenticate:</strong> Click the button to process your voice</li>
-                    <li><strong>Review Results:</strong> Check the detailed analysis and visualization</li>
                 </ol>
             </div>
             """)
     # Event handlers
     model_selector.change(
         fn=get_model_info,
@@ -536,14 +613,15 @@ with gr.Blocks(css=custom_css, title="🔊 Voice Recognition Security System") a
         outputs=[status_output, message_output, confidence_output, plot_output, detailed_info]
     )
-    # Footer
     gr.HTML("""
-    <div style="text-align: center; padding: 20px; margin-top: 30px; background: linear-gradient(45deg, #37474F, #455A64); color: white; border-radius: 10px;">
-        <p style="margin: 0; opacity: 0.8;">🔒 Advanced Voice Recognition Security System | Powered by Deep Learning & Transfer Learning</p>
-        <p style="margin: 5px 0 0 0; font-size: 0.9em; opacity: 0.6;">Supported formats: WAV, MP3, FLAC, M4A, OGG | Optimized for 16kHz sample rate</p>
     </div>
     """)
 # Launch configuration
 if __name__ == "__main__":
     app.launch(

         self.preprocessor = AudioPreprocessor()
         self.models = {}
         self.label_encoder = LabelEncoder()
+        # Updated model info with actual training results
         self.model_info = {
+            "resnet18": {
+                "name": "ResNet-18 🏆 CHAMPION",
+                "description": "🥇 BEST PERFORMING MODEL - Perfect 100% accuracy with 11.3M parameters (4.9M trainable). Exceptional security with 0.06% FAR and 0% FRR. Ideal for high-security applications requiring zero false rejections.",
+                "accuracy": "100.00%",
+                "far": "0.0006",
+                "frr": "0.0000",
+                "parameters": "11.3M total (4.9M trainable)",
+                "status": "🏆 CHAMPION"
+            },
+            "resnet50": {
+                "name": "ResNet-50 🥈 HIGH PERFORMER",
+                "description": "🥈 EXCELLENT ACCURACY - 99.94% accuracy with 24.6M parameters (16.0M trainable). Near-perfect performance with robust feature extraction. Best for applications requiring high accuracy with acceptable computational overhead.",
+                "accuracy": "99.94%",
+                "far": "0.0006",
+                "frr": "0.0000",
+                "parameters": "24.6M total (16.0M trainable)",
+                "status": "🥈 RUNNER-UP"
+            },
+            "efficientnet_b0": {
+                "name": "EfficientNet-B0 ⚡ EFFICIENT",
+                "description": "⚡ MOBILE OPTIMIZED - 99.76% accuracy with only 4.7M parameters (3.8M trainable). Excellent efficiency-accuracy trade-off. Perfect for mobile deployment with minimal computational requirements.",
+                "accuracy": "99.76%",
+                "far": "0.0030",
+                "frr": "0.0000",
+                "parameters": "4.7M total (3.8M trainable)",
+                "status": "⚡ EFFICIENT"
+            },
+            "mobilenet_v2": {
+                "name": "MobileNet-V2 📱 LIGHTWEIGHT",
+                "description": "📱 ULTRA-LIGHTWEIGHT - 99.76% accuracy with just 2.9M parameters (1.1M trainable). Smallest model with excellent performance. Ideal for edge devices and real-time applications with limited resources.",
+                "accuracy": "99.76%",
+                "far": "0.0012",
+                "frr": "0.0000",
+                "parameters": "2.9M total (1.1M trainable)",
+                "status": "📱 COMPACT"
+            }
         }
         self.load_models()
         """Load all pre-trained models"""
         # This would load your actual trained models
         # For demo purposes, we'll create placeholder models
+        num_classes = 26  # Based on your training output (26 users)
         # Initialize label encoder with dummy classes
         dummy_classes = [f"user_{i+1}" for i in range(num_classes)]
                 # model.load_state_dict(torch.load(f"models/{model_name}.pth", map_location=self.device))
                 model.eval()
                 self.models[model_name] = model
+                print(f"✅ Loaded {model_name} successfully")
             except Exception as e:
+                print(f"❌ Error loading {model_name}: {e}")
     def predict_voice(self, audio_file, model_name, confidence_threshold):
         """Predict voice access using selected model"""
                 # Create visualization
                 viz_plot = self.create_prediction_visualization(probabilities.cpu().numpy()[0],
+                                                                predicted_class, confidence_score)
                 # Determine access decision
                 if confidence_score >= confidence_threshold:
                     message = f"Access denied - Low confidence"
                     security_status = f"⚠️ UNAUTHORIZED ACCESS ATTEMPT"
+                model_stats = self.model_info[model_name]
                 detailed_info = f"""
+                ## 🤖 Model Performance
+                **Model Used:** {model_stats['name']}
+                **Training Accuracy:** {model_stats['accuracy']}
+                **Model Size:** {model_stats['parameters']}
+                **Status:** {model_stats['status']}
+                ## 🔍 Prediction Results
+                **Predicted User:** {predicted_class}
+                **Confidence Score:** {confidence_score:.3f}
+                **Security Threshold:** {confidence_threshold}
+                **Decision:** {'✅ GRANT ACCESS' if confidence_score >= confidence_threshold else '❌ DENY ACCESS'}
+                ## 🛡️ Security Metrics
+                **False Accept Rate (FAR):** {model_stats['far']}
+                **False Reject Rate (FRR):** {model_stats['frr']}
+                **Security Level:** {'🔒 HIGH' if confidence_score >= 0.8 else '🔓 MEDIUM' if confidence_score >= 0.5 else '⚠️ LOW'}
                 """
                 return status, message, confidence_score, viz_plot, detailed_info
     def create_prediction_visualization(self, probabilities, predicted_class, confidence):
         """Create visualization of prediction results"""
+        fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(14, 6))
+        # Enhanced color scheme
         colors = ['#FF6B6B', '#4ECDC4', '#45B7D1', '#96CEB4', '#F7DC6F', '#BB8FCE', '#85C1E9', '#F8C471', '#82E0AA', '#F1948A']
+        # Plot 1: Top 5 predictions with enhanced styling
         top_5_indices = np.argsort(probabilities)[-5:][::-1]
         top_5_probs = probabilities[top_5_indices]
         top_5_labels = [self.label_encoder.inverse_transform([i])[0] for i in top_5_indices]
         bars = ax1.barh(range(len(top_5_labels)), top_5_probs, color=colors[:len(top_5_labels)])
         ax1.set_yticks(range(len(top_5_labels)))
         ax1.set_yticklabels(top_5_labels)
+        ax1.set_xlabel('Confidence Score', fontweight='bold')
+        ax1.set_title('🎯 Top 5 User Predictions', fontweight='bold', fontsize=12)
         ax1.set_xlim(0, 1)
+        ax1.grid(axis='x', alpha=0.3)
+        # Highlight the top prediction with gold color
+        bars[0].set_color('#FFD700')
         bars[0].set_edgecolor('#FF8C00')
+        bars[0].set_linewidth(3)
+        # Add value labels with better formatting
         for i, (bar, prob) in enumerate(zip(bars, top_5_probs)):
+            ax1.text(prob + 0.02, bar.get_y() + bar.get_height()/2,
+                     f'{prob:.3f}', va='center', fontweight='bold', fontsize=10)
+        # Plot 2: Enhanced confidence gauge
         theta = np.linspace(0, np.pi, 100)
         r = np.ones_like(theta)
         ax2.set_theta_direction(1)
         ax2.set_ylim(0, 1)
+        # Enhanced color segments based on confidence levels
         if confidence < 0.3:
+            color = '#FF4757'  # Red
+            status_text = '⚠️ LOW'
+            risk_level = 'HIGH RISK'
         elif confidence < 0.7:
+            color = '#FFA726'  # Orange
+            status_text = '🟡 MEDIUM'
+            risk_level = 'MODERATE RISK'
         else:
+            color = '#66BB6A'  # Green
+            status_text = '✅ HIGH'
+            risk_level = 'LOW RISK'
+        # Draw enhanced gauge
+        ax2.fill_between(theta, 0, r, alpha=0.2, color='lightgray')
         confidence_theta = theta[int(confidence * len(theta))]
+        ax2.plot([confidence_theta, confidence_theta], [0, 1], color=color, linewidth=10)
         ax2.fill_between(theta[:int(confidence * len(theta))], 0, r[:int(confidence * len(theta))],
+                         alpha=0.8, color=color)
+        ax2.set_title(f'🎚️ Confidence Level\n{confidence:.3f} - {status_text}\n{risk_level}',
+                      pad=30, fontweight='bold')
         ax2.set_ylim(0, 1)
         ax2.set_yticklabels([])
+        ax2.set_xticklabels(['🔴 Low', '', '🟡 Med', '', '🟢 High'], fontweight='bold')
         plt.tight_layout()
         return fig
     def create_empty_plot(self):
         """Create empty plot for error cases"""
+        fig, ax = plt.subplots(figsize=(10, 6))
+        ax.text(0.5, 0.5, '📊 No Data Available\nPlease upload an audio file',
+                ha='center', va='center', fontsize=18, color='gray', fontweight='bold')
         ax.set_xlim(0, 1)
         ax.set_ylim(0, 1)
         ax.axis('off')
         return fig
     def get_model_comparison(self):
+        """Return model comparison information with actual training results"""
         comparison_data = []
         for model_key, info in self.model_info.items():
             comparison_data.append([
                 info['name'],
+                info['accuracy'],
+                info['far'],
+                info['frr'],
+                info['parameters'],
+                info['status']
             ])
         return comparison_data
     """Get information about selected model"""
     if model_name in voice_system.model_info:
         info = voice_system.model_info[model_name]
+        return f"## {info['name']}\n\n{info['description']}\n\n**📊 Key Stats:**\n- Accuracy: {info['accuracy']}\n- Parameters: {info['parameters']}\n- FAR: {info['far']} | FRR: {info['frr']}"
     return "Model information not available"
+# Enhanced custom CSS
 custom_css = """
 .gradio-container {
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
+    font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif !important;
 }
 .gr-button-primary {
     background: linear-gradient(45deg, #FF6B6B, #FF8E53) !important;
     border: none !important;
+    font-weight: bold !important;
+    text-transform: uppercase !important;
+    letter-spacing: 1px !important;
 }
 .gr-button-secondary {
     background: linear-gradient(45deg, #4ECDC4, #44A08D) !important;
     border: none !important;
 }
 .gr-panel {
     background: rgba(255, 255, 255, 0.95) !important;
+    backdrop-filter: blur(15px) !important;
+    border-radius: 20px !important;
+    border: 2px solid rgba(255, 255, 255, 0.3) !important;
+    box-shadow: 0 8px 32px rgba(0, 0, 0, 0.1) !important;
 }
 .gr-form {
     background: transparent !important;
 }
 .gr-box {
+    border-radius: 15px !important;
     border: 1px solid #E0E0E0 !important;
+    box-shadow: 0 4px 16px rgba(0, 0, 0, 0.05) !important;
 }
 h1, h2, h3 {
     color: #2C3E50 !important;
+    text-shadow: 2px 2px 4px rgba(0,0,0,0.1) !important;
 }
+.champion-badge {
+    background: linear-gradient(45deg, #FFD700, #FFA500);
+    padding: 5px 10px;
+    border-radius: 20px;
+    color: #333;
     font-weight: bold;
+    display: inline-block;
+    margin: 5px;
 }
 """
+# Create enhanced Gradio interface
+with gr.Blocks(css=custom_css, title="🔊 Voice Recognition Security System - Trained Results") as app:
     gr.HTML("""
+    <div style="text-align: center; padding: 30px; background: linear-gradient(45deg, #667eea, #764ba2); color: white; border-radius: 20px; margin-bottom: 25px; box-shadow: 0 10px 30px rgba(0,0,0,0.3);">
+        <h1 style="margin: 0; font-size: 3em; text-shadow: 3px 3px 6px rgba(0,0,0,0.4);">🔊 Voice Recognition Security System</h1>
+        <p style="margin: 15px 0 10px 0; font-size: 1.3em; opacity: 0.95;">Advanced AI-powered voice authentication with 4 deep learning models</p>
+        <div style="background: rgba(255,255,255,0.2); padding: 10px; border-radius: 10px; margin-top: 15px;">
+            <p style="margin: 0; font-size: 1.1em; font-weight: bold;">🏆 Training Complete: 26 Users | 1,693 Samples | Best Accuracy: 100%</p>
+        </div>
     </div>
     """)
     with gr.Row():
         with gr.Column(scale=1):
+            gr.HTML("<h2>🎯 Authentication Control Panel</h2>")
+            # Audio input with enhanced styling
             audio_input = gr.Audio(
+                label="🎤 Upload Voice Sample (WAV, MP3, FLAC supported)",
                 type="filepath",
                 elem_id="audio_input"
             )
+            # Model selection with performance indicators
             model_selector = gr.Dropdown(
                 choices=[
+                    ("🏆 ResNet-18 - CHAMPION (100% Accuracy)", "resnet18"),
+                    ("🥈 ResNet-50 - HIGH PERFORMER (99.94% Accuracy)", "resnet50"),
+                    ("⚡ EfficientNet-B0 - EFFICIENT (99.76% Accuracy)", "efficientnet_b0"),
+                    ("📱 MobileNet-V2 - LIGHTWEIGHT (99.76% Accuracy)", "mobilenet_v2")
                 ],
                 value="resnet18",
+                label="🤖 Select AI Model (Ranked by Performance)",
+                info="All models trained on 26 users with augmented dataset"
             )
+            # Enhanced confidence threshold
             confidence_slider = gr.Slider(
                 minimum=0.1,
                 maximum=1.0,
+                value=0.8,
                 step=0.05,
+                label="🎚️ Security Threshold (Recommended: 0.8 for high security)",
+                info="Higher values = More secure but may increase false rejections"
             )
+            # Enhanced process button
             process_btn = gr.Button(
+                "🔍 AUTHENTICATE VOICE",
                 variant="primary",
                 size="lg"
             )
+            # Enhanced model info display
             model_info_display = gr.Markdown(
                 get_model_info("resnet18"),
+                label="📋 Model Performance Details"
             )
         with gr.Column(scale=2):
+            gr.HTML("<h2>📊 Authentication Results & Analysis</h2>")
             with gr.Row():
                 with gr.Column():
+                    # Enhanced status display
                     status_output = gr.Textbox(
+                        label="🚦 Access Decision",
                         interactive=False,
                         elem_id="status_output"
                     )
+                    # Enhanced message display
                     message_output = gr.Textbox(
+                        label="💬 System Response",
                         interactive=False
                     )
+                    # Enhanced confidence display
                     confidence_output = gr.Number(
+                        label="📈 Confidence Score (0.000-1.000)",
                         interactive=False,
                         precision=3
                     )
                 with gr.Column():
+                    # Enhanced detailed information
                     detailed_info = gr.Markdown(
+                        label="🔍 Comprehensive Analysis Report"
                     )
+            # Enhanced visualization plot
             plot_output = gr.Plot(
+                label="📈 Prediction Visualization & Confidence Analysis",
                 elem_id="plot_output"
             )
+    # Enhanced model comparison section
     with gr.Row():
+        gr.HTML("<h2>⚖️ Model Performance Comparison (Training Results)</h2>")
     with gr.Row():
         comparison_table = gr.Dataframe(
+            headers=["Model", "Accuracy", "FAR (False Accept)", "FRR (False Reject)", "Parameters", "Status"],
             value=voice_system.get_model_comparison(),
+            label="📊 Actual Training Performance Metrics",
             interactive=False
         )
+    # Enhanced information sections
     with gr.Row():
         with gr.Column():
             gr.HTML("""
+            <div style="background: linear-gradient(45deg, #FFF3E0, #FFE0B2); padding: 25px; border-radius: 15px; border-left: 6px solid #FF9800; box-shadow: 0 6px 20px rgba(0,0,0,0.1);">
+                <h3>🛡️ Advanced Security Features</h3>
+                <ul style="line-height: 1.8;">
+                    <li><strong>🏆 Champion Model:</strong> ResNet-18 achieved perfect 100% accuracy</li>
+                    <li><strong>📊 Multi-Model Architecture:</strong> 4 state-of-the-art models to choose from</li>
+                    <li><strong>🎯 Zero False Rejections:</strong> All models achieved 0% FRR</li>
+                    <li><strong>⚡ Real-Time Processing:</strong> Optimized for fast authentication</li>
+                    <li><strong>📈 Detailed Analytics:</strong> Comprehensive prediction visualization</li>
+                    <li><strong>🔒 Adjustable Security:</strong> Customizable confidence thresholds</li>
                 </ul>
             </div>
             """)
         with gr.Column():
             gr.HTML("""
+            <div style="background: linear-gradient(45deg, #E8F5E8, #C8E6C9); padding: 25px; border-radius: 15px; border-left: 6px solid #4CAF50; box-shadow: 0 6px 20px rgba(0,0,0,0.1);">
+                <h3>📖 Usage Instructions</h3>
+                <ol style="line-height: 1.8;">
+                    <li><strong>🎤 Upload Audio:</strong> Record or upload voice sample (3 seconds optimal)</li>
+                    <li><strong>🤖 Select Model:</strong> Choose from our trained models (ResNet-18 recommended)</li>
+                    <li><strong>🎚️ Set Threshold:</strong> Adjust security level (0.8 recommended for high security)</li>
+                    <li><strong>🔍 Authenticate:</strong> Click to process and analyze your voice</li>
+                    <li><strong>📊 Review Results:</strong> Check detailed analysis and confidence metrics</li>
                 </ol>
+                <div style="background: rgba(76, 175, 80, 0.1); padding: 10px; border-radius: 8px; margin-top: 15px;">
+                    <strong>💡 Tip:</strong> ResNet-18 offers perfect accuracy with optimal performance!
+                </div>
             </div>
             """)
+    # Training details section
+    with gr.Row():
+        gr.HTML("""
+        <div style="background: linear-gradient(45deg, #E3F2FD, #BBDEFB); padding: 25px; border-radius: 15px; border-left: 6px solid #2196F3; box-shadow: 0 6px 20px rgba(0,0,0,0.1);">
+            <h3>🎓 Training Details & Achievements</h3>
+            <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(300px, 1fr)); gap: 20px; margin-top: 15px;">
+                <div>
+                    <h4>📊 Dataset Information</h4>
+                    <ul>
+                        <li><strong>Users:</strong> 26 unique speakers</li>
+                        <li><strong>Samples:</strong> 1,693 base samples</li>
+                        <li><strong>Augmentation:</strong> 3x factor for training</li>
+                        <li><strong>GPU:</strong> Tesla T4 (14.7 GB)</li>
+                    </ul>
+                </div>
+                <div>
+                    <h4>🏆 Best Model Achievements</h4>
+                    <ul>
+                        <li><strong>ResNet-18:</strong> 100% Perfect Accuracy 🥇</li>
+                        <li><strong>Parameters:</strong> 11.3M (4.9M trainable)</li>
+                        <li><strong>Training Time:</strong> 20 epochs (~14 minutes)</li>
+                        <li><strong>Security Score:</strong> 0.9997</li>
+                    </ul>
+                </div>
+            </div>
+        </div>
+        """)
     # Event handlers
     model_selector.change(
         fn=get_model_info,
         outputs=[status_output, message_output, confidence_output, plot_output, detailed_info]
     )
+    # Enhanced footer
     gr.HTML("""
+    <div style="text-align: center; padding: 25px; margin-top: 40px; background: linear-gradient(45deg, #37474F, #455A64); color: white; border-radius: 15px; box-shadow: 0 8px 25px rgba(0,0,0,0.2);">
+        <h4>Developed with PyTorch & Gradio</h4>
+        <p>&copy; 2025 - Voice Security System. All rights reserved.</p>
     </div>
     """)
 # Launch configuration
 if __name__ == "__main__":
     app.launch(