Spaces:
Sleeping
Sleeping
Upload 4 files
Browse files- Dockerfile +16 -0
- README.md +29 -0
- app.py +89 -0
- requirements.txt +8 -0
Dockerfile
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Slim Python base keeps the image small; 3.11 matches the pinned dependencies.
FROM python:3.11-slim

WORKDIR /app

# libsndfile1 is required by the soundfile package; ffmpeg lets librosa
# decode compressed containers (mp3, m4a, ...). Clean apt lists to keep
# the layer small.
RUN apt-get update && apt-get install -y \
    libsndfile1 ffmpeg \
    && rm -rf /var/lib/apt/lists/*

# Install Python deps in their own layer so app-code changes don't re-run pip.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

COPY app.py .

# Hugging Face Spaces (sdk: docker) expects the app to listen on 7860.
EXPOSE 7860

CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
|
README.md
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
title: Deepfake Audio Detection API
|
| 3 |
+
emoji: 🎙️
|
| 4 |
+
colorFrom: purple
|
| 5 |
+
colorTo: blue
|
| 6 |
+
sdk: docker
|
| 7 |
+
app_port: 7860
|
| 8 |
+
pinned: false
|
| 9 |
+
---
|
| 10 |
+
|
| 11 |
+
# Deepfake Audio Detection API
|
| 12 |
+
|
| 13 |
+
REST API for detecting AI-generated / deepfake audio using Wav2Vec2 (98.82% accuracy).
|
| 14 |
+
|
| 15 |
+
## Endpoints
|
| 16 |
+
|
| 17 |
+
**GET /health**
|
| 18 |
+
```json
|
| 19 |
+
{"status": "ok"}
|
| 20 |
+
```
|
| 21 |
+
|
| 22 |
+
**POST /detect** — send audio file as multipart form
|
| 23 |
+
```bash
|
| 24 |
+
curl -X POST https://rgriya-deepfake-audio-api.hf.space/detect \
|
| 25 |
+
-F "file=@your_audio.wav"
|
| 26 |
+
```
|
| 27 |
+
```json
|
| 28 |
+
{"label": "fake", "fake": 0.97, "real": 0.03}
|
| 29 |
+
```
|
app.py
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""
|
| 2 |
+
Pure FastAPI — no Gradio dependency at all.
|
| 3 |
+
HuggingFace Spaces serves FastAPI apps directly.
|
| 4 |
+
|
| 5 |
+
GET /health → {"status":"ok"}
|
| 6 |
+
POST /detect → multipart file=<audio> → {"label":"fake","fake":0.97,"real":0.03}
|
| 7 |
+
"""
|
| 8 |
+
import io
|
| 9 |
+
import numpy as np
|
| 10 |
+
import soundfile as sf
|
| 11 |
+
from fastapi import FastAPI, File, UploadFile, HTTPException
|
| 12 |
+
from fastapi.responses import HTMLResponse
|
| 13 |
+
from transformers import pipeline
|
| 14 |
+
import torch
|
| 15 |
+
|
| 16 |
+
MODEL = "mo-thecreator/Deepfake-audio-detection"
|
| 17 |
+
print(f"Loading {MODEL} ...")
|
| 18 |
+
classifier = pipeline(
|
| 19 |
+
"audio-classification",
|
| 20 |
+
model=MODEL,
|
| 21 |
+
device=0 if torch.cuda.is_available() else -1,
|
| 22 |
+
)
|
| 23 |
+
print("Model ready.")
|
| 24 |
+
|
| 25 |
+
app = FastAPI(title="Deepfake Audio Detection")
|
| 26 |
+
|
| 27 |
+
|
| 28 |
+
def classify(raw_bytes: bytes) -> dict:
    """Decode raw audio bytes, normalize to 16 kHz mono 16-bit WAV, classify.

    Args:
        raw_bytes: contents of the uploaded file, in any format soundfile
            (or, as a fallback, librosa/ffmpeg) can decode.

    Returns:
        dict with "label" set to the highest-scoring class plus one
        float score per class, e.g. {"label": "fake", "fake": 0.97, "real": 0.03}.

    Raises:
        ValueError: if the payload decodes to zero audio samples.
    """
    buf = io.BytesIO(raw_bytes)
    try:
        data, sr = sf.read(buf, dtype="float32", always_2d=False)
    except Exception:
        # soundfile cannot parse some containers (e.g. mp3); fall back to
        # librosa, which decodes via audioread/ffmpeg and resamples for us.
        import librosa
        buf.seek(0)
        data, sr = librosa.load(buf, sr=16000, mono=True)
        sr = 16000

    if data.ndim > 1:
        # soundfile returns (frames, channels); average down to mono.
        data = data.mean(axis=1)
    if data.size == 0:
        # Guard: np.abs(data).max() on an empty array raises a cryptic
        # "zero-size array" ValueError; fail with a clear message instead.
        raise ValueError("Uploaded file contains no audio samples")
    peak = np.abs(data).max()
    if peak > 1.0:
        # Only scale down out-of-range audio; never amplify quiet signals.
        data /= peak
    if sr != 16000:
        import librosa
        data = librosa.resample(data, orig_sr=sr, target_sr=16000)

    # Re-encode as canonical 16 kHz / 16-bit PCM WAV bytes for the pipeline.
    out = io.BytesIO()
    sf.write(out, data, 16000, format="WAV", subtype="PCM_16")
    out.seek(0)

    results = classifier(out.read())
    print(f"Results: {results}")
    scores = {r["label"]: float(r["score"]) for r in results}
    return {"label": max(scores, key=scores.get), **scores}
|
| 55 |
+
|
| 56 |
+
|
| 57 |
+
@app.get("/", response_class=HTMLResponse)
|
| 58 |
+
def root():
|
| 59 |
+
return """
|
| 60 |
+
<html><body style="font-family:sans-serif;max-width:600px;margin:40px auto;padding:20px">
|
| 61 |
+
<h2>🎙️ Deepfake Audio Detection API</h2>
|
| 62 |
+
<p>Model: <code>mo-thecreator/Deepfake-audio-detection</code> (Wav2Vec2, 98.82% accuracy)</p>
|
| 63 |
+
<h3>Endpoints</h3>
|
| 64 |
+
<code>GET /health</code> — health check<br><br>
|
| 65 |
+
<code>POST /detect</code> — multipart <code>file=<audio></code><br>
|
| 66 |
+
<pre>{"label": "fake", "fake": 0.97, "real": 0.03}</pre>
|
| 67 |
+
<h3>Test</h3>
|
| 68 |
+
<form action="/detect" method="post" enctype="multipart/form-data">
|
| 69 |
+
<input type="file" name="file" accept="audio/*">
|
| 70 |
+
<button type="submit">Detect</button>
|
| 71 |
+
</form>
|
| 72 |
+
</body></html>
|
| 73 |
+
"""
|
| 74 |
+
|
| 75 |
+
|
| 76 |
+
@app.get("/health")
|
| 77 |
+
def health():
|
| 78 |
+
return {"status": "ok", "model": MODEL}
|
| 79 |
+
|
| 80 |
+
|
| 81 |
+
@app.post("/detect")
|
| 82 |
+
async def detect(file: UploadFile = File(...)):
|
| 83 |
+
try:
|
| 84 |
+
raw = await file.read()
|
| 85 |
+
print(f"/detect: {len(raw)} bytes filename={file.filename}")
|
| 86 |
+
return classify(raw)
|
| 87 |
+
except Exception as e:
|
| 88 |
+
import traceback; traceback.print_exc()
|
| 89 |
+
raise HTTPException(status_code=500, detail=str(e))
|
requirements.txt
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
fastapi>=0.110.0
|
| 2 |
+
uvicorn>=0.29.0
|
| 3 |
+
transformers>=4.39.0
|
| 4 |
+
torch>=2.0.0
|
| 5 |
+
torchaudio>=2.0.0
|
| 6 |
+
librosa>=0.10.0
|
| 7 |
+
soundfile>=0.12.0
|
| 8 |
+
python-multipart>=0.0.9
|