Spaces:

farwew
/

David

Runtime error

App Files Community

farwew committed on Jul 31, 2025

Commit

e231c61

verified ·

1 Parent(s): aa11893

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -14

app.py CHANGED Viewed

@@ -1,19 +1,20 @@
-import gradio as gr
 import torch
 import torch.nn as nn
 import numpy as np
 from torchvision import transforms as T
 from torchvision.transforms.v2 import ToDtype
 from decord import VideoReader, cpu
-from trainers import vificlip
-from utils.config import get_config
-from utils.logger import create_logger
 # -------------------------
-# Setup Device & Seed
 # -------------------------
-device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-torch.manual_seed(42)
 # -------------------------
 # Transform
@@ -34,16 +35,22 @@ class ClassificationHead(nn.Module):
     def __init__(self, input_dim=512, num_classes=1):
         super().__init__()
         self.dense = nn.Linear(input_dim, num_classes)
     def forward(self, x):
         return self.dense(x)
 # -------------------------
-# Load ViFi-CLIP + Classifier
 # -------------------------
 cfgpth = 'configs/zero_shot/train/k400/16_16_vifi_clip.yaml'
-model_path = 'vifi_clip_30_epochs_k400_full_finetuned.pth'
 classifier_path = 'best_detector_model.pt'
 class parse_option:
     def __init__(self):
         self.config = cfgpth
@@ -69,7 +76,7 @@ classifier.to(device)
 classifier.eval()
 # -------------------------
-# Inference Function (with threshold)
 # -------------------------
 def predict_video(video_path, threshold=0.5):
     preprocess = _transform(224)
@@ -104,15 +111,15 @@ def predict_video(video_path, threshold=0.5):
         return f"❌ Error: {str(e)}"
 # -------------------------
-# Gradio UI (with slider)
 # -------------------------
 gr.Interface(
     fn=predict_video,
     inputs=[
-        gr.Video(type="filepath", label="Upload Video"),
         gr.Slider(0.0, 1.0, value=0.5, step=0.01, label="Threshold (Real ≥ Threshold)")
     ],
     outputs="text",
-    title="Fake Video Detection with Threshold Control",
-    description="Upload a video to classify it as Real or Fake. Adjust the threshold to tune sensitivity."
 ).launch()

+import os
 import torch
 import torch.nn as nn
 import numpy as np
 from torchvision import transforms as T
 from torchvision.transforms.v2 import ToDtype
 from decord import VideoReader, cpu
+import gradio as gr
 # -------------------------
+# Step 0: Download model from Google Drive if not exists
 # -------------------------
+model_path = 'vifi_clip_30_epochs_k400_full_finetuned.pth'
+if not os.path.exists(model_path):
+    print(f"🔽 Downloading model to {model_path}...")
+    os.system("pip install -q gdown")
+    os.system("gdown --id 1Nx30Kbu5xnv6dPwz4I3Ivy380LCdp1Md -O vifi_clip_30_epochs_k400_full_finetuned.pth")
 # -------------------------
 # Transform
     def __init__(self, input_dim=512, num_classes=1):
         super().__init__()
         self.dense = nn.Linear(input_dim, num_classes)
     def forward(self, x):
         return self.dense(x)
 # -------------------------
+# Load ViFi-CLIP Model
 # -------------------------
+from trainers import vificlip
+from utils.config import get_config
+from utils.logger import create_logger
 cfgpth = 'configs/zero_shot/train/k400/16_16_vifi_clip.yaml'
 classifier_path = 'best_detector_model.pt'
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 class parse_option:
     def __init__(self):
         self.config = cfgpth
 classifier.eval()
 # -------------------------
+# Inference Function
 # -------------------------
 def predict_video(video_path, threshold=0.5):
     preprocess = _transform(224)
         return f"❌ Error: {str(e)}"
 # -------------------------
+# Gradio UI
 # -------------------------
 gr.Interface(
     fn=predict_video,
     inputs=[
+        gr.Video(type="filepath", label="Upload Video (.mp4)"),
         gr.Slider(0.0, 1.0, value=0.5, step=0.01, label="Threshold (Real ≥ Threshold)")
     ],
     outputs="text",
+    title="🧠 Deepfake Detection with ViFi-CLIP",
+    description="Upload a video to classify it as Real or Fake. Threshold slider lets you adjust sensitivity."
 ).launch()