Spaces:

UAJK-Practice
/

Voice_Detection

Sleeping

App Files Files Community

AbdulWahab14 committed 29 days ago

Commit

117e85b

verified ·

1 Parent(s): e6c5942

Update app.py

Browse files

Files changed (1) hide show

app.py +507 -176

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# app.py — DeepFake Audio Detector (Hemgg/Deepfake-audio-detection + DSP Ensemble)
 import os
 import subprocess
 import tempfile
@@ -16,7 +16,7 @@ import gradio as gr
 from transformers import AutoFeatureExtractor, AutoModelForAudioClassification
 # ==========================================
-# 1. MODEL LOADING (once at startup)
 # ==========================================
 MODEL_NAME = "Hemgg/Deepfake-audio-detection"
 print("[+] Loading AI forensic model...")
@@ -33,12 +33,9 @@ print(f"[+] Model loaded on {device}")
 # 2. AUDIO / VIDEO PREPROCESSING
 # ==========================================
 def convert_to_audio(file_path):
-    """Convert video to 16kHz mono WAV or pass audio through."""
     ext = os.path.splitext(file_path)[1].lower().lstrip('.')
     if ext in ["wav", "mp3", "flac", "m4a", "ogg", "aac", "wma"]:
         return file_path
     if ext in ["mp4", "mkv", "avi", "mov", "webm", "flv"]:
         print("[+] Video detected → extracting audio via ffmpeg...")
         out = tempfile.mktemp(suffix=".wav")
@@ -50,7 +47,6 @@ def convert_to_audio(file_path):
         ]
         subprocess.run(cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, check=True)
         return out
     raise ValueError(f"Unsupported file format: {ext}")
 def load_audio(path):
@@ -59,25 +55,15 @@ def load_audio(path):
     return audio
 # ==========================================
-# 3. MODEL INFERENCE
 # ==========================================
 def predict(audio):
-    inputs = extractor(
-        audio,
-        sampling_rate=16000,
-        return_tensors="pt",
-        padding=True
-    ).to(device)
     with torch.no_grad():
         logits = model(**inputs).logits
         probs = torch.softmax(logits, dim=-1)[0]
-    return float(probs[0]), float(probs[1])  # (human_prob, ai_prob)
-# ==========================================
-# 4. DSP FEATURE ANALYSIS
-# ==========================================
 def audio_features(audio):
     mfcc = librosa.feature.mfcc(y=audio, sr=16000)
     return {
@@ -85,261 +71,606 @@ def audio_features(audio):
         "energy": float(np.mean(audio ** 2))
     }
-# ==========================================
-# 5. ENSEMBLE SCORING ENGINE
-# ==========================================
 def analyze(file_path):
     audio_path = convert_to_audio(file_path)
     audio = load_audio(audio_path)
     human_p, ai_p = predict(audio)
     feats = audio_features(audio)
-    # Ensemble: 60% neural + 40% DSP anomaly signal
     anomaly = (feats["mfcc"] / 500.0) + (feats["energy"] * 2.0)
     ai_score = np.clip((ai_p * 0.6 + anomaly * 0.4), 0.0, 1.0)
     if ai_score < 0.35:
-        verdict = "🧑 HUMAN VOICE"
         level = "LOW RISK"
     elif ai_score < 0.65:
-        verdict = "⚠️ UNCERTAIN / MIXED SIGNAL"
         level = "MEDIUM RISK"
     else:
-        verdict = "🤖 AI / SYNTHETIC VOICE"
         level = "HIGH RISK"
     confidence = int(ai_score * 100)
-    return verdict, level, confidence, ai_score, feats, audio_path
 # ==========================================
-# 6. VISUALIZATION
 # ==========================================
 def generate_audio_plots(audio_path):
     y, sr = librosa.load(audio_path, sr=16000, duration=10)
-    fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(10, 6))
-    fig.patch.set_facecolor('#0d0d0d')
-    # Waveform
-    ax1.set_facecolor('#1a1a2e')
-    librosa.display.waveshow(y, sr=sr, ax=ax1, color='#00d4ff')
-    ax1.set_title('Audio Waveform', color='white', fontsize=12)
-    ax1.tick_params(colors='white')
-    # Mel Spectrogram
-    ax2.set_facecolor('#1a1a2e')
     mel = librosa.feature.melspectrogram(y=y, sr=sr, n_mels=128)
     mel_db = librosa.power_to_db(mel, ref=np.max)
-    img = librosa.display.specshow(
-        mel_db, sr=sr, ax=ax2,
-        x_axis='time', y_axis='mel', cmap='magma'
-    )
     cbar = plt.colorbar(img, ax=ax2, format='%+2.0f dB')
-    cbar.ax.yaxis.set_tick_params(color='white')
-    plt.setp(plt.getp(cbar.ax.axes, 'yticklabels'), color='white')
-    ax2.set_title('Mel Spectrogram', color='white', fontsize=12)
-    ax2.tick_params(colors='white')
-    ax2.yaxis.label.set_color('white')
-    ax2.xaxis.label.set_color('white')
     plt.tight_layout()
     plot_path = '/tmp/audio_analysis.png'
-    plt.savefig(plot_path, facecolor='#0d0d0d', bbox_inches='tight', dpi=150)
     plt.close()
     return plot_path
 # ==========================================
-# 7. GRADIO HANDLERS
 # ==========================================
 def detect_audio(audio_file):
     if audio_file is None:
-        return None, "❌ No audio file provided", "N/A"
     try:
-        verdict, level, confidence, ai_score, feats, audio_path = analyze(audio_file)
         plot_path = generate_audio_plots(audio_path)
         percentage = ai_score * 100
-        status = "⚠️ HIGH RISK" if percentage > 65 else "🟡 SUSPICIOUS" if percentage > 35 else "🟢 LIKELY REAL"
-        result_text = f"""
-## 🔊 Audio Analysis Result
-| Metric | Value |
-|--------|-------|
-| **AI Probability** | {percentage:.1f}% |
-| **Verdict** | {verdict} |
-| **Risk Level** | {level} |
-| **Confidence** | {confidence}% |
-| **Status** | {status} |
-### DSP Features
-- **MFCC Variance**: {feats['mfcc']:.4f}
-- **Signal Energy**: {feats['energy']:.6f}
-### Interpretation
-- **0-35%**: 🟢 Very likely genuine / human-created
-- **35-65%**: 🟡 Uncertain / mixed signal, needs review
-- **65-100%**: 🔴 Almost certainly AI-generated / synthetic
-"""
-        return plot_path, result_text, f"{percentage:.1f}%"
     except Exception as e:
-        return None, f"❌ Error analyzing audio: {str(e)}", "N/A"
 def detect_video(video_file):
     if video_file is None:
-        return None, "❌ No video file provided", "N/A"
     try:
-        # Extract audio track from video and run the same forensic model
-        verdict, level, confidence, ai_score, feats, audio_path = analyze(video_file)
         plot_path = generate_audio_plots(audio_path)
         percentage = ai_score * 100
-        status = "⚠️ HIGH RISK" if percentage > 65 else "🟡 SUSPICIOUS" if percentage > 35 else "🟢 LIKELY REAL"
-        result_text = f"""
-## 🎬 Video Analysis Result (Audio Track)
-| Metric | Value |
-|--------|-------|
-| **AI Probability** | {percentage:.1f}% |
-| **Verdict** | {verdict} |
-| **Risk Level** | {level} |
-| **Confidence** | {confidence}% |
-| **Status** | {status} |
-### Analysis Note
-This check was performed on the **audio track** extracted from the uploaded video.
-Deepfake videos frequently contain synthetic audio — this model detects those artifacts.
-### DSP Features
-- **MFCC Variance**: {feats['mfcc']:.4f}
-- **Signal Energy**: {feats['energy']:.6f}
-### Interpretation
-- **0-35%**: 🟢 Very likely genuine / human-created
-- **35-65%**: 🟡 Uncertain / mixed signal, needs review
-- **65-100%**: 🔴 Almost certainly AI-generated / synthetic
-"""
-        return plot_path, result_text, f"{percentage:.1f}%"
     except Exception as e:
-        return None, f"❌ Error analyzing video: {str(e)}", "N/A"
 # ==========================================
-# 8. GRADIO UI
 # ==========================================
 def build_ui():
     with gr.Blocks(
-        title="🔍 DeepFake AI Detector",
         theme=gr.themes.Base(
-            primary_hue="blue",
             neutral_hue="slate",
         ),
-        css="""
-        .gradio-container { max-width: 1100px; margin: auto; }
-        .result-box { border-radius: 12px; padding: 16px; }
-        h1 { text-align: center; }
-        .score-display { font-size: 48px; font-weight: bold; text-align: center; }
-        """
     ) as demo:
         gr.HTML("""
-        <div style="text-align:center; padding: 20px 0;">
-            <h1 style="font-size: 2.5em; font-weight: 800;">🔍 DeepFake AI Detector</h1>
-            <p style="font-size: 1.1em; color: #888;">
-                Upload audio or video to detect AI generation.<br>
-                Powered by <code>Hemgg/Deepfake-audio-detection</code> with DSP ensemble scoring.
             </p>
         </div>
         """)
         with gr.Tabs():
-            # ── Audio Tab ──────────────────────────────────────────────────────
-            with gr.TabItem("🔊 Audio Detection"):
-                gr.Markdown("### Upload an audio file to check if it's AI-generated")
                 with gr.Row():
-                    with gr.Column(scale=1):
                         audio_input = gr.Audio(
-                            label="Upload Audio (MP3, WAV, M4A, OGG)",
-                            type="filepath"
                         )
                         audio_btn = gr.Button("🔍 Analyze Audio", variant="primary", size="lg")
                     with gr.Column(scale=2):
-                        audio_score = gr.Textbox(
-                            label="🎯 AI Score",
-                            interactive=False,
-                            placeholder="Result will appear here..."
                         )
-                        audio_plot = gr.Image(label="📊 Audio Analysis")
-                        audio_result = gr.Markdown(label="📋 Detailed Report")
                 audio_btn.click(
                     fn=detect_audio,
                     inputs=[audio_input],
-                    outputs=[audio_plot, audio_result, audio_score]
                 )
-            # ── Video Tab ──────────────────────────────────────────────────────
-            with gr.TabItem("🎬 Video Detection"):
-                gr.Markdown("### Upload a video file to analyze its audio track for deepfake artifacts")
                 with gr.Row():
-                    with gr.Column(scale=1):
                         video_input = gr.Video(
-                            label="Upload Video (MP4, AVI, MOV, WEBM)",
                         )
                         video_btn = gr.Button("🔍 Analyze Video", variant="primary", size="lg")
                     with gr.Column(scale=2):
-                        video_score = gr.Textbox(
-                            label="🎯 AI Score",
-                            interactive=False,
-                            placeholder="Result will appear here..."
                         )
-                        video_plot = gr.Image(label="📊 Audio Analysis")
-                        video_result = gr.Markdown(label="📋 Detailed Report")
                 video_btn.click(
                     fn=detect_video,
                     inputs=[video_input],
-                    outputs=[video_plot, video_result, video_score]
                 )
-            # ── About Tab ─────────────────────────────────────────────────────
-            with gr.TabItem("ℹ️ How It Works"):
-                gr.Markdown("""
-## 🧠 Detection Methodology
-### Model
-- **Base**: `Hemgg/Deepfake-audio-detection` (Transformer-based audio classifier)
-- **Device**: CUDA if available, otherwise CPU
-- **Ensemble**: Neural output + DSP anomaly signal
-### Audio Features (DSP Layer)
-| Feature | What it detects |
-|---------|----------------|
-| MFCC Variance | Unnatural vocal tract patterns |
-| Signal Energy | Abnormal amplitude distribution |
-| Neural Probability | Direct transformer classification |
-### Score Interpretation
-- **0-35%**: 🟢 Very likely genuine
-- **35-65%**: 🟡 Uncertain / mixed signal
-- **65-100%**: 🔴 Almost certainly AI-generated
-### ⚠️ Limitations
-- No detector is 100% accurate
-- Newer AI models may evade detection
-- Low quality media reduces accuracy
-- Always combine with human judgment
                 """)
     return demo
@@ -348,5 +679,5 @@ if __name__ == "__main__":
     demo.launch(
         server_name="0.0.0.0",
         server_port=7860,
-        share=False  # Hugging Face Spaces handles the public URL
     )

+# app.py — DeepFake AI Forensics (Premium UI + Animated Waves + Confidence Circle)
 import os
 import subprocess
 import tempfile
 from transformers import AutoFeatureExtractor, AutoModelForAudioClassification
 # ==========================================
+# 1. MODEL LOADING
 # ==========================================
 MODEL_NAME = "Hemgg/Deepfake-audio-detection"
 print("[+] Loading AI forensic model...")
 # 2. AUDIO / VIDEO PREPROCESSING
 # ==========================================
 def convert_to_audio(file_path):
     ext = os.path.splitext(file_path)[1].lower().lstrip('.')
     if ext in ["wav", "mp3", "flac", "m4a", "ogg", "aac", "wma"]:
         return file_path
     if ext in ["mp4", "mkv", "avi", "mov", "webm", "flv"]:
         print("[+] Video detected → extracting audio via ffmpeg...")
         out = tempfile.mktemp(suffix=".wav")
         ]
         subprocess.run(cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, check=True)
         return out
     raise ValueError(f"Unsupported file format: {ext}")
 def load_audio(path):
     return audio
 # ==========================================
+# 3. INFERENCE & DSP
 # ==========================================
 def predict(audio):
+    """Run the classifier on a waveform and return its first two class probabilities.
+
+    The feature extractor is told the audio is sampled at 16 kHz, and the
+    resulting tensors are moved to ``device`` before inference.
+
+    Returns:
+        ``(probs[0], probs[1])`` as Python floats. ``analyze`` unpacks these
+        as ``(human_p, ai_p)``.
+        NOTE(review): that label order is assumed here, not read from
+        ``model.config.id2label`` — confirm it for this checkpoint.
+    """
+    inputs = extractor(audio, sampling_rate=16000, return_tensors="pt", padding=True).to(device)
     with torch.no_grad():
         logits = model(**inputs).logits
+        # Softmax over the last axis, then take the first row of the result.
         probs = torch.softmax(logits, dim=-1)[0]
+    return float(probs[0]), float(probs[1])
 def audio_features(audio):
     mfcc = librosa.feature.mfcc(y=audio, sr=16000)
     return {
         "energy": float(np.mean(audio ** 2))
     }
 def analyze(file_path):
+    """Score a media file and map the score to a verdict plus display styling.
+
+    Returns:
+        A 9-tuple ``(verdict, level, confidence, ai_score, feats, audio_path,
+        color, icon, glow)``. ``audio_path`` is whatever ``convert_to_audio``
+        returned; ``color``, ``icon`` and ``glow`` are presentation values
+        chosen per risk tier.
+    """
     audio_path = convert_to_audio(file_path)
     audio = load_audio(audio_path)
+    # human_p is unpacked but not used below; only ai_p feeds the score.
     human_p, ai_p = predict(audio)
     feats = audio_features(audio)
+    # Blend: 60% model probability + 40% feature-based "anomaly" term,
+    # clipped to [0, 1].
     anomaly = (feats["mfcc"] / 500.0) + (feats["energy"] * 2.0)
     ai_score = np.clip((ai_p * 0.6 + anomaly * 0.4), 0.0, 1.0)
+    # Tiers: < 0.35 low risk, < 0.65 medium risk, otherwise high risk.
     if ai_score < 0.35:
+        verdict = "HUMAN VOICE"
         level = "LOW RISK"
+        color = "#00ff88"
+        icon = "🧑"
+        glow = "rgba(0,255,136,0.25)"
     elif ai_score < 0.65:
+        verdict = "UNCERTAIN / MIXED"
         level = "MEDIUM RISK"
+        color = "#ffcc00"
+        icon = "⚠️"
+        glow = "rgba(255,204,0,0.25)"
     else:
+        verdict = "AI / SYNTHETIC VOICE"
         level = "HIGH RISK"
+        color = "#ff4444"
+        icon = "🤖"
+        glow = "rgba(255,68,68,0.25)"
+    # Whole-number percentage of the blended score (truncated, not rounded).
     confidence = int(ai_score * 100)
+    return verdict, level, confidence, ai_score, feats, audio_path, color, icon, glow
 # ==========================================
+# 4. VISUALIZATION
 # ==========================================
 def generate_audio_plots(audio_path):
+    """Render a waveform and a mel spectrogram for the first 10 s of audio.
+
+    Args:
+        audio_path: Path to an audio file readable by ``librosa.load``.
+
+    Returns:
+        Path to a newly created PNG file containing both plots. A fresh
+        file is created on every call; the caller owns it afterwards.
+    """
     y, sr = librosa.load(audio_path, sr=16000, duration=10)
+    fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(12, 7))
+    fig.patch.set_facecolor('#08080f')
+    ax1.set_facecolor('#0f0f1a')
+    librosa.display.waveshow(y, sr=sr, ax=ax1, color='#00d4ff', alpha=0.85)
+    ax1.set_title('Waveform Analysis', color='#c0c0e0', fontsize=13, fontweight='bold', pad=12)
+    ax1.tick_params(colors='#555588')
+    for spine in ax1.spines.values():
+        spine.set_color('#222244')
+    ax2.set_facecolor('#0f0f1a')
     mel = librosa.feature.melspectrogram(y=y, sr=sr, n_mels=128)
     mel_db = librosa.power_to_db(mel, ref=np.max)
+    img = librosa.display.specshow(mel_db, sr=sr, ax=ax2, x_axis='time', y_axis='mel', cmap='magma')
     cbar = plt.colorbar(img, ax=ax2, format='%+2.0f dB')
+    cbar.ax.yaxis.set_tick_params(color='#555588')
+    plt.setp(plt.getp(cbar.ax.axes, 'yticklabels'), color='#555588')
+    ax2.set_title('Mel Spectrogram', color='#c0c0e0', fontsize=13, fontweight='bold', pad=12)
+    ax2.tick_params(colors='#555588')
+    ax2.yaxis.label.set_color('#555588')
+    ax2.xaxis.label.set_color('#555588')
+    for spine in ax2.spines.values():
+        spine.set_color('#222244')
     plt.tight_layout()
+    # Write to a unique file: a single fixed path would be overwritten when
+    # two analyses run at the same time, showing one user another's plot.
+    with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
+        plot_path = tmp.name
+    fig.savefig(plot_path, facecolor='#08080f', bbox_inches='tight', dpi=150)
+    # Close this specific figure rather than whichever one is "current".
+    plt.close(fig)
     return plot_path
 # ==========================================
+# 5. HTML BUILDERS
+# ==========================================
+def confidence_circle(percentage, color):
+    """Return HTML for an SVG ring that shows ``percentage`` as a progress arc.
+
+    Args:
+        percentage: Value to display. Clamped to the 0-100 range so the arc
+            can never be drawn past a full ring or with a negative length.
+        color: CSS colour for the arc and the label. A two-digit alpha
+            suffix ("40") is appended to it for the glow, so a six-digit
+            hex colour such as "#00ff88" is expected.
+
+    Returns:
+        The markup as a string.
+    """
+    import math  # kept local so the function is self-contained
+
+    radius = 50
+    percentage = max(0, min(100, percentage))
+    circumference = 2 * math.pi * radius
+    # stroke-dashoffset is the hidden part of the stroke:
+    # 0 draws the full ring, `circumference` draws nothing.
+    offset = circumference * (1 - percentage / 100)
+    return f"""
+    <div style="display: flex; flex-direction: column; align-items: center; justify-content: center; margin: 10px 0;">
+        <div style="position: relative; width: 140px; height: 140px; filter: drop-shadow(0 0 12px {color}40);">
+            <svg width="140" height="140" viewBox="0 0 120 120" style="transform: rotate(-90deg);">
+                <circle cx="60" cy="60" r="{radius}" stroke="#1a1a2e" stroke-width="10" fill="none"/>
+                <circle cx="60" cy="60" r="{radius}" stroke="{color}" stroke-width="10" fill="none"
+                    stroke-linecap="round"
+                    stroke-dasharray="{circumference:.3f}"
+                    stroke-dashoffset="{offset:.3f}"
+                    style="transition: stroke-dashoffset 1.2s ease-out;"/>
+            </svg>
+            <div style="position: absolute; top: 50%; left: 50%; transform: translate(-50%, -50%); text-align: center;">
+                <div style="font-size: 2em; font-weight: 800; color: {color}; line-height: 1;">{percentage}%</div>
+                <div style="font-size: 0.65em; color: #555588; text-transform: uppercase; letter-spacing: 1px;">Confidence</div>
+            </div>
+        </div>
+    </div>
+    """
+# Animated equalizer markup returned by the handlers when no file has been
+# uploaded. Each entry is (resting height, animation period, animation delay);
+# the `eq-bounce` keyframes it relies on are defined in CUSTOM_CSS.
+_EQ_BARS = (
+    ("40%", "0.8s", "0s"),
+    ("70%", "0.9s", "0.1s"),
+    ("50%", "0.7s", "0.2s"),
+    ("80%", "1.0s", "0.15s"),
+    ("60%", "0.85s", "0.05s"),
+    ("90%", "0.75s", "0.25s"),
+    ("45%", "0.95s", "0.3s"),
+    ("65%", "0.8s", "0.12s"),
+)
+_EQ_BAR_TEMPLATE = (
+    '    <div class="eq-bar" style="width: 6px; height: {height}; '
+    'background: linear-gradient(to top, #4f46e5, #00d4ff); border-radius: 3px; '
+    'animation: eq-bounce {period} infinite ease-in-out {delay};"></div>\n'
+)
+EQUALIZER_HTML = (
+    '\n<div style="display: flex; align-items: flex-end; justify-content: center; '
+    'height: 50px; gap: 5px; margin: 16px 0;">\n'
+    + "".join(
+        _EQ_BAR_TEMPLATE.format(height=height, period=period, delay=delay)
+        for height, period, delay in _EQ_BARS
+    )
+    + "</div>\n"
+)
+# ==========================================
+# 6. GRADIO HANDLERS
 # ==========================================
 def detect_audio(audio_file):
     if audio_file is None:
+        return (
+            None,
+            '<div style="text-align:center;color:#ff4444;padding:30px;">❌ No audio file provided</div>',
+            "Waiting...",
+            "#666666",
+            EQUALIZER_HTML + '<div style="text-align:center;color:#444466;font-size:0.9em;">Upload audio to begin forensic analysis</div>'
+        )
     try:
+        verdict, level, confidence, ai_score, feats, audio_path, color, icon, glow = analyze(audio_file)
         plot_path = generate_audio_plots(audio_path)
         percentage = ai_score * 100
+        status_emoji = "🟢" if percentage < 35 else "🟡" if percentage < 65 else "🔴"
+        status_text = "LIKELY REAL" if percentage < 35 else "SUSPICIOUS" if percentage < 65 else "HIGH RISK"
+        circle = confidence_circle(confidence, color)
+        result_html = f"""
+        <div style="background: linear-gradient(145deg, #0c0c14 0%, #141424 100%);
+                    border: 1px solid {color}30; border-radius: 20px; padding: 28px;
+                    box-shadow: 0 0 40px {glow}, inset 0 1px 0 rgba(255,255,255,0.03);">
+            <div style="display: flex; align-items: center; gap: 20px; margin-bottom: 24px; flex-wrap: wrap;">
+                <div style="font-size: 3em; line-height: 1;">{icon}</div>
+                <div style="flex: 1; min-width: 200px;">
+                    <div style="font-size: 0.8em; color: #555588; text-transform: uppercase; letter-spacing: 2px; margin-bottom: 4px;">Final Verdict</div>
+                    <div style="font-size: 1.5em; font-weight: 800; color: {color}; letter-spacing: -0.5px;">{verdict}</div>
+                </div>
+                <div style="min-width: 140px;">
+                    {circle}
+                </div>
+            </div>
+            <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(140px, 1fr)); gap: 12px; margin-bottom: 24px;">
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid {color};">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">AI Probability</div>
+                    <div style="font-size: 1.5em; font-weight: 700; color: {color};">{percentage:.1f}%</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid {color};">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Risk Level</div>
+                    <div style="font-size: 1.2em; font-weight: 700; color: {color};">{level}</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid #00d4ff;">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Confidence</div>
+                    <div style="font-size: 1.2em; font-weight: 700; color: #00d4ff;">{confidence}%</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid #ffcc00;">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Status</div>
+                    <div style="font-size: 1em; font-weight: 600; color: #ffcc00;">{status_emoji} {status_text}</div>
+                </div>
+            </div>
+            <div style="background: #08080f; border-radius: 12px; padding: 18px; margin-bottom: 20px;">
+                <div style="font-size: 0.75em; color: #444466; text-transform: uppercase; letter-spacing: 1.5px; margin-bottom: 12px;">🔬 DSP Forensic Signatures</div>
+                <div style="display: flex; justify-content: space-around; font-family: 'SF Mono', monospace; font-size: 0.9em; flex-wrap: wrap; gap: 12px;">
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">MFCC Variance</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{feats['mfcc']:.4f}</div>
+                    </div>
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">Signal Energy</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{feats['energy']:.6f}</div>
+                    </div>
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">Neural Score</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{ai_score:.4f}</div>
+                    </div>
+                </div>
+            </div>
+            <div style="font-size: 0.8em; color: #3a3a55; border-top: 1px solid #1a1a2e; padding-top: 14px; line-height: 1.6;">
+                <strong style="color: #555588;">Interpretation Guide:</strong><br>
+                <span style="color: #00ff88;">● 0–35%</span> Very likely genuine human voice &nbsp;|&nbsp;
+                <span style="color: #ffcc00;">● 35–65%</span> Mixed signal, manual review advised &nbsp;|&nbsp;
+                <span style="color: #ff4444;">● 65–100%</span> Strong synthetic / AI indicators detected
+            </div>
+        </div>
+        """
+        return plot_path, result_html, f"{percentage:.1f}%", color, ""
     except Exception as e:
+        return None, f"<div style='color:#ff4444;padding:30px;'>❌ Analysis Error: {str(e)}</div>", "Error", "#ff4444", ""
 def detect_video(video_file):
     if video_file is None:
+        return (
+            None,
+            '<div style="text-align:center;color:#ff4444;padding:30px;">❌ No video file provided</div>',
+            "Waiting...",
+            "#666666",
+            EQUALIZER_HTML + '<div style="text-align:center;color:#444466;font-size:0.9em;">Upload video to extract & analyze audio track</div>'
+        )
     try:
+        verdict, level, confidence, ai_score, feats, audio_path, color, icon, glow = analyze(video_file)
         plot_path = generate_audio_plots(audio_path)
         percentage = ai_score * 100
+        status_emoji = "🟢" if percentage < 35 else "🟡" if percentage < 65 else "🔴"
+        status_text = "LIKELY REAL" if percentage < 35 else "SUSPICIOUS" if percentage < 65 else "HIGH RISK"
+        circle = confidence_circle(confidence, color)
+        result_html = f"""
+        <div style="background: linear-gradient(145deg, #0c0c14 0%, #141424 100%);
+                    border: 1px solid {color}30; border-radius: 20px; padding: 28px;
+                    box-shadow: 0 0 40px {glow}, inset 0 1px 0 rgba(255,255,255,0.03);">
+            <div style="display: flex; align-items: center; gap: 20px; margin-bottom: 24px; flex-wrap: wrap;">
+                <div style="font-size: 3em; line-height: 1;">{icon}</div>
+                <div style="flex: 1; min-width: 200px;">
+                    <div style="font-size: 0.8em; color: #555588; text-transform: uppercase; letter-spacing: 2px; margin-bottom: 4px;">Audio Track Verdict</div>
+                    <div style="font-size: 1.5em; font-weight: 800; color: {color}; letter-spacing: -0.5px;">{verdict}</div>
+                </div>
+                <div style="min-width: 140px;">
+                    {circle}
+                </div>
+            </div>
+            <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(140px, 1fr)); gap: 12px; margin-bottom: 24px;">
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid {color};">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">AI Probability</div>
+                    <div style="font-size: 1.5em; font-weight: 700; color: {color};">{percentage:.1f}%</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid {color};">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Risk Level</div>
+                    <div style="font-size: 1.2em; font-weight: 700; color: {color};">{level}</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid #00d4ff;">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Confidence</div>
+                    <div style="font-size: 1.2em; font-weight: 700; color: #00d4ff;">{confidence}%</div>
+                </div>
+                <div style="background: #08080f; border-radius: 12px; padding: 16px; border-left: 3px solid #ffcc00;">
+                    <div style="font-size: 0.7em; color: #444466; text-transform: uppercase; letter-spacing: 1px; margin-bottom: 6px;">Status</div>
+                    <div style="font-size: 1em; font-weight: 600; color: #ffcc00;">{status_emoji} {status_text}</div>
+                </div>
+            </div>
+            <div style="background: #08080f; border-radius: 12px; padding: 18px; margin-bottom: 20px;">
+                <div style="font-size: 0.75em; color: #444466; text-transform: uppercase; letter-spacing: 1.5px; margin-bottom: 12px;">🔬 DSP Forensic Signatures (Audio Track)</div>
+                <div style="display: flex; justify-content: space-around; font-family: 'SF Mono', monospace; font-size: 0.9em; flex-wrap: wrap; gap: 12px;">
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">MFCC Variance</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{feats['mfcc']:.4f}</div>
+                    </div>
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">Signal Energy</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{feats['energy']:.6f}</div>
+                    </div>
+                    <div style="text-align: center;">
+                        <div style="color: #555588; font-size: 0.8em;">Neural Score</div>
+                        <div style="color: #e0e0ff; font-weight: 600;">{ai_score:.4f}</div>
+                    </div>
+                </div>
+            </div>
+            <div style="font-size: 0.8em; color: #3a3a55; border-top: 1px solid #1a1a2e; padding-top: 14px; line-height: 1.6;">
+                <strong style="color: #555588;">Analysis Note:</strong> Deepfake videos frequently contain synthetic audio tracks.
+                This scan was performed on the extracted audio waveform. Always verify visual cues separately for complete assessment.
+            </div>
+        </div>
+        """
+        return plot_path, result_html, f"{percentage:.1f}%", color, ""
     except Exception as e:
+        return None, f"<div style='color:#ff4444;padding:30px;'>❌ Analysis Error: {str(e)}</div>", "Error", "#ff4444", ""
 # ==========================================
+# 7. GRADIO UI
 # ==========================================
+# Stylesheet passed to gr.Blocks(css=...) in build_ui. Besides theming the
+# tabs, upload areas, primary buttons and scrollbars, it defines the
+# `eq-bounce` keyframes that the bars in EQUALIZER_HTML animate with.
+CUSTOM_CSS = """
+@import url('https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700;800&display=swap');
+.gradio-container {
+    max-width: 1250px !important;
+    margin: auto !important;
+    font-family: 'Inter', sans-serif !important;
+    background: #050508 !important;
+}
+body { background: #050508 !important; }
+/* Tabs */
+.tab-nav {
+    background: #0f0f1a !important;
+    border-radius: 14px !important;
+    padding: 6px !important;
+    border: 1px solid #1e1e32 !important;
+    margin-bottom: 24px !important;
+    gap: 6px !important;
+}
+.tab-nav button {
+    color: #555588 !important;
+    font-weight: 600 !important;
+    border-radius: 10px !important;
+    padding: 10px 28px !important;
+    border: none !important;
+    background: transparent !important;
+    transition: all 0.3s ease !important;
+}
+.tab-nav button:hover { color: #8888bb !important; }
+.tab-nav button.selected {
+    background: linear-gradient(135deg, #4f46e5 0%, #7c3aed 100%) !important;
+    color: #ffffff !important;
+    box-shadow: 0 4px 20px rgba(124, 58, 237, 0.35) !important;
+}
+/* Inputs & Upload */
+.upload-container {
+    background: #0a0a12 !important;
+    border: 2px dashed #252540 !important;
+    border-radius: 16px !important;
+    transition: all 0.3s ease !important;
+}
+.upload-container:hover {
+    border-color: #4f46e5 !important;
+    background: #0f0f1a !important;
+    box-shadow: 0 0 30px rgba(79, 70, 229, 0.1) !important;
+}
+/* Buttons */
+button.primary {
+    background: linear-gradient(135deg, #4f46e5 0%, #7c3aed 100%) !important;
+    border: none !important;
+    border-radius: 12px !important;
+    font-weight: 700 !important;
+    letter-spacing: 0.5px !important;
+    padding: 14px 32px !important;
+    box-shadow: 0 4px 24px rgba(124, 58, 237, 0.3) !important;
+    transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1) !important;
+}
+button.primary:hover {
+    transform: translateY(-2px) !important;
+    box-shadow: 0 8px 32px rgba(124, 58, 237, 0.45) !important;
+}
+/* Equalizer Animation */
+@keyframes eq-bounce {
+    0%, 100% { transform: scaleY(0.25); opacity: 0.5; }
+    50% { transform: scaleY(1); opacity: 1; }
+}
+/* Scrollbar */
+::-webkit-scrollbar { width: 8px; }
+::-webkit-scrollbar-track { background: #08080f; }
+::-webkit-scrollbar-thumb { background: #252540; border-radius: 4px; }
+::-webkit-scrollbar-thumb:hover { background: #4f46e5; }
+/* Format badges helper */
+.format-badge {
+    display: inline-block;
+    background: #12121a;
+    border: 1px solid #252540;
+    color: #6666aa;
+    padding: 4px 12px;
+    border-radius: 20px;
+    font-size: 0.75em;
+    font-weight: 600;
+    letter-spacing: 0.5px;
+}
+"""
 def build_ui():
     with gr.Blocks(
+        title="DeepFake AI Forensics",
         theme=gr.themes.Base(
+            primary_hue="violet",
             neutral_hue="slate",
+            font=["Inter", "system-ui", "sans-serif"],
         ),
+        css=CUSTOM_CSS,
     ) as demo:
+        # Header
         gr.HTML("""
+        <div style="text-align: center; padding: 40px 20px 10px 20px;">
+            <div style="display: inline-block; position: relative;">
+                <div style="position: absolute; top: -30px; left: 50%; transform: translateX(-50%); width: 280px; height: 280px;
+                            background: radial-gradient(circle, rgba(124,58,237,0.12) 0%, transparent 70%); border-radius: 50%; pointer-events: none;"></div>
+                <h1 style="font-size: 2.8em; font-weight: 800; margin: 0;
+                           background: linear-gradient(135deg, #c4b5fd 0%, #60a5fa 40%, #00d4ff 100%);
+                           -webkit-background-clip: text; -webkit-text-fill-color: transparent; background-clip: text;
+                           letter-spacing: -1.5px; position: relative;">
+                    🔍 DeepFake AI Forensics
+                </h1>
+            </div>
+            <p style="font-size: 1.05em; color: #444466; margin-top: 14px; max-width: 560px; margin-left: auto; margin-right: auto; line-height: 1.6;">
+                Neural + DSP ensemble detection for synthetic voice identification.
             </p>
         </div>
         """)
         with gr.Tabs():
+            # ═══════════════════════════════════════════
+            # AUDIO TAB
+            # ═══════════════════════════════════════════
+            with gr.TabItem("🔊 Audio Detection", id=0):
                 with gr.Row():
+                    # LEFT: Upload & Controls
+                    with gr.Column(scale=1, min_width=340):
+                        gr.Markdown("### Upload Audio File", elem_classes="section-title")
+                        # Format badges
+                        gr.HTML("""
+                        <div style="margin-bottom: 12px; display: flex; flex-wrap: wrap; gap: 6px;">
+                            <span class="format-badge">MP3</span>
+                            <span class="format-badge">WAV</span>
+                            <span class="format-badge">M4A</span>
+                            <span class="format-badge">FLAC</span>
+                            <span class="format-badge">OGG</span>
+                        </div>
+                        <div style="font-size: 0.8em; color: #444466; margin-bottom: 16px; display: flex; align-items: center; gap: 6px;">
+                            <span style="font-size: 1.2em;">📎</span>
+                            <span>Maximum file size: <strong style="color: #6666aa;">50 MB</strong></span>
+                        </div>
+                        """)
                         audio_input = gr.Audio(
+                            label="",
+                            type="filepath",
+                            elem_classes="upload-container"
                         )
+                        # Animated equalizer (shows when audio present, decorative)
+                        audio_waves = gr.HTML(value=EQUALIZER_HTML + '<div style="text-align:center;color:#333355;font-size:0.85em;">Audio waveform ready for analysis</div>')
                         audio_btn = gr.Button("🔍 Analyze Audio", variant="primary", size="lg")
+                        # Big score display
+                        audio_score_text = gr.Textbox(
+                            label="",
+                            value="--%",
+                            interactive=False,
+                            elem_classes="score-display"
+                        )
+                    # RIGHT: Results
                     with gr.Column(scale=2):
+                        gr.Markdown("### Forensic Analysis Report", elem_classes="section-title")
+                        audio_plot = gr.Image(
+                            label="",
+                            show_label=False,
+                            elem_classes="result-image"
+                        )
+                        audio_result = gr.HTML(
+                            value="""
+                            <div style="background: #0a0a12; border: 2px dashed #1e1e32; border-radius: 20px; padding: 50px 30px; text-align: center; margin-top: 8px;">
+                                <div style="font-size: 3em; margin-bottom: 16px;">📊</div>
+                                <div style="color: #333355; font-size: 1.1em; font-weight: 600;">Results will appear here</div>
+                                <div style="color: #222244; font-size: 0.9em; margin-top: 8px;">Upload an audio file and click analyze to begin</div>
+                            </div>
+                            """
                         )
                 audio_btn.click(
                     fn=detect_audio,
                     inputs=[audio_input],
+                    outputs=[audio_plot, audio_result, audio_score_text, audio_score_text, audio_waves]
                 )
+            # ═══════════════════════════════════════════
+            # VIDEO TAB
+            # ═══════════════════════════════════════════
+            with gr.TabItem("🎬 Video Detection", id=1):
                 with gr.Row():
+                    with gr.Column(scale=1, min_width=340):
+                        gr.Markdown("### Upload Video File", elem_classes="section-title")
+                        gr.HTML("""
+                        <div style="margin-bottom: 12px; display: flex; flex-wrap: wrap; gap: 6px;">
+                            <span class="format-badge">MP4</span>
+                            <span class="format-badge">MOV</span>
+                            <span class="format-badge">AVI</span>
+                            <span class="format-badge">MKV</span>
+                            <span class="format-badge">WEBM</span>
+                        </div>
+                        <div style="font-size: 0.8em; color: #444466; margin-bottom: 16px; display: flex; align-items: center; gap: 6px;">
+                            <span style="font-size: 1.2em;">📎</span>
+                            <span>Maximum file size: <strong style="color: #6666aa;">100 MB</strong></span>
+                        </div>
+                        """)
                         video_input = gr.Video(
+                            label="",
+                            elem_classes="upload-container"
                         )
+                        video_waves = gr.HTML(value=EQUALIZER_HTML + '<div style="text-align:center;color:#333355;font-size:0.85em;">Video loaded — audio track ready for extraction</div>')
                         video_btn = gr.Button("🔍 Analyze Video", variant="primary", size="lg")
+                        video_score_text = gr.Textbox(
+                            label="",
+                            value="--%",
+                            interactive=False
+                        )
                     with gr.Column(scale=2):
+                        gr.Markdown("### Forensic Analysis Report", elem_classes="section-title")
+                        video_plot = gr.Image(
+                            label="",
+                            show_label=False
+                        )
+                        video_result = gr.HTML(
+                            value="""
+                            <div style="background: #0a0a12; border: 2px dashed #1e1e32; border-radius: 20px; padding: 50px 30px; text-align: center; margin-top: 8px;">
+                                <div style="font-size: 3em; margin-bottom: 16px;">🎬</div>
+                                <div style="color: #333355; font-size: 1.1em; font-weight: 600;">Results will appear here</div>
+                                <div style="color: #222244; font-size: 0.9em; margin-top: 8px;">Upload a video to extract & analyze its audio track</div>
+                            </div>
+                            """
                         )
                 video_btn.click(
                     fn=detect_video,
                     inputs=[video_input],
+                    outputs=[video_plot, video_result, video_score_text, video_score_text, video_waves]
                 )
+            # ═══════════════════════════════════════════
+            # ABOUT TAB
+            # ═══════════════════════════════════════════
+            with gr.TabItem("ℹ️ How It Works", id=2):
+                gr.HTML("""
+                <div style="max-width: 900px; margin: auto; padding: 20px 0 40px 0;">
+                    <h2 style="color: #c0c0e0; font-size: 1.7em; margin-bottom: 28px; text-align: center; font-weight: 700;">🧠 Detection Pipeline</h2>
+                    <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(260px, 1fr)); gap: 18px; margin-bottom: 36px;">
+                        <div style="background: linear-gradient(145deg, #0c0c14 0%, #141424 100%); border: 1px solid #1e1e32; border-radius: 16px; padding: 24px;">
+                            <div style="font-size: 2em; margin-bottom: 10px;">🧠</div>
+                            <h3 style="color: #a78bfa; margin: 0 0 6px 0; font-size: 1.1em;">Transformer Classifier</h3>
+                            <p style="color: #444466; font-size: 0.9em; line-height: 1.5; margin: 0;">
+                                <code style="background: #0a0a12; padding: 2px 6px; border-radius: 4px; color: #8888bb;">Hemgg/Deepfake-audio-detection</code>
+                                base model running on GPU/CPU with HuggingFace Transformers.
+                            </p>
+                        </div>
+                        <div style="background: linear-gradient(145deg, #0c0c14 0%, #141424 100%); border: 1px solid #1e1e32; border-radius: 16px; padding: 24px;">
+                            <div style="font-size: 2em; margin-bottom: 10px;">📊</div>
+                            <h3 style="color: #60a5fa; margin: 0 0 6px 0; font-size: 1.1em;">DSP Ensemble</h3>
+                            <p style="color: #444466; font-size: 0.9em; line-height: 1.5; margin: 0;">
+                                MFCC variance + signal energy anomaly detection fused with neural output (60/40 weighting).
+                            </p>
+                        </div>
+                        <div style="background: linear-gradient(145deg, #0c0c14 0%, #141424 100%); border: 1px solid #1e1e32; border-radius: 16px; padding: 24px;">
+                            <div style="font-size: 2em; margin-bottom: 10px;">🎬</div>
+                            <h3 style="color: #00d4ff; margin: 0 0 6px 0; font-size: 1.1em;">Video Extraction</h3>
+                            <p style="color: #444466; font-size: 0.9em; line-height: 1.5; margin: 0;">
+                                FFmpeg extracts mono 16kHz audio from any video format before forensic scanning.
+                            </p>
+                        </div>
+                    </div>
+                    <h3 style="color: #c0c0e0; margin-bottom: 16px; font-size: 1.2em;">📈 Score Interpretation</h3>
+                    <div style="background: #08080f; border-radius: 14px; padding: 20px; border: 1px solid #1a1a2e; margin-bottom: 28px;">
+                        <div style="display: flex; align-items: center; margin-bottom: 10px; padding: 10px 14px; background: #0c0c14; border-radius: 10px; border-left: 4px solid #00ff88;">
+                            <span style="color: #00ff88; font-weight: 700; min-width: 70px; font-size: 0.95em;">0–35%</span>
+                            <span style="color: #444466; margin-left: 12px; font-size: 0.9em;">🟢 Very likely genuine / human-created</span>
+                        </div>
+                        <div style="display: flex; align-items: center; margin-bottom: 10px; padding: 10px 14px; background: #0c0c14; border-radius: 10px; border-left: 4px solid #ffcc00;">
+                            <span style="color: #ffcc00; font-weight: 700; min-width: 70px; font-size: 0.95em;">35–65%</span>
+                            <span style="color: #444466; margin-left: 12px; font-size: 0.9em;">🟡 Uncertain / mixed signal — manual review recommended</span>
+                        </div>
+                        <div style="display: flex; align-items: center; padding: 10px 14px; background: #0c0c14; border-radius: 10px; border-left: 4px solid #ff4444;">
+                            <span style="color: #ff4444; font-weight: 700; min-width: 70px; font-size: 0.95em;">65–100%</span>
+                            <span style="color: #444466; margin-left: 12px; font-size: 0.9em;">🔴 Strong AI-generated / synthetic voice indicators</span>
+                        </div>
+                    </div>
+                    <div style="background: #140a0a; border: 1px solid #331a1a; border-radius: 14px; padding: 20px; color: #884444; font-size: 0.88em; line-height: 1.6;">
+                        <strong style="color: #cc5555;">⚠️ Important Limitations</strong><br><br>
+                        No automated detector is 100% accurate. Adversarial AI models may evade detection.
+                        Compressed or noisy audio reduces reliability. Always use human expert judgment for critical decisions.
+                    </div>
+                </div>
                 """)
+        # Footer
+        gr.HTML("""
+        <div style="text-align: center; padding: 30px 20px; color: #2a2a44; font-size: 0.82em; border-top: 1px solid #12121a; margin-top: 10px;">
+            Neural Audio Forensics • Powered by HuggingFace Transformers & DSP Signal Processing
+        </div>
+        """)
     return demo
     demo.launch(
         server_name="0.0.0.0",
         server_port=7860,
+        share=False
     )