Spaces:

Offex
/

Transcripttiktok

Running

App Files Files Community

Offex committed 4 days ago

Commit

0a869f5

verified ·

1 Parent(s): 666ec0a

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -57

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ import shutil
 import requests
 from faster_whisper import WhisperModel
-# 1. Model Setup
 model = None
 def load_model():
@@ -16,85 +16,87 @@ def load_model():
         print("✅ Model Loaded!")
     return model
-# 2. Helper: TikTok Short URL to Long URL Resolver
 def get_actual_url(short_url):
     # Resolve short_url to its final URL by issuing a HEAD request that follows redirects.
     try:
-        # A User-Agent header is required so that TikTok allows the redirect
         headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'}
         response = requests.head(short_url, allow_redirects=True, headers=headers)
-        print(f"🔗 Converted {short_url} to {response.url}")
         return response.url
     except:
         # Best effort: on any exception, hand back the URL exactly as it was given.
         return short_url
-# 3. Audio Download Function
-def get_audio(url):
     # Download the audio for `url` with yt-dlp and convert it to MP3.
     # Returns the path "tiktok_audio.mp3" on success, or a "❌ Download Error: ..." string on failure.
-    try:
-        # First resolve the URL (Short -> Long)
-        actual_url = get_actual_url(url)
-        output = "tiktok_audio"
-        if os.path.exists(f"{output}.mp3"): os.remove(f"{output}.mp3")
-        ffmpeg_path = shutil.which("ffmpeg") or "/usr/bin/ffmpeg"
-        ydl_opts = {
-            'format': 'bestaudio/best',
-            'outtmpl': output,
-            'ffmpeg_location': ffmpeg_path,
-            'postprocessors': [{
-                'key': 'FFmpegExtractAudio',
-                'preferredcodec': 'mp3',
-                'preferredquality': '192',
-            }],
-            'quiet': False,
-            'no_warnings': True,
-            'nocheckcertificate': True, # To ignore SSL errors
-            'ignoreerrors': False,
-            # TikTok Special Options
-            'extractor_args': {'tiktok': {'app_version': ['30.0.0']}},
-            'http_headers': {
-                'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
-                'Referer': 'https://www.tiktok.com/'
-            }
         }
         with yt_dlp.YoutubeDL(ydl_opts) as ydl:
             ydl.download([actual_url])
-        return f"{output}.mp3"
     except Exception as e:
-        return f"❌ Download Error: {str(e)}"
-# 4. Transcription Function
-def transcribe(url):
     # Download the audio for `url` and return its transcript as a single string.
     # Every failure path returns a human-readable message string instead of raising.
-    if not url: return "⚠️ URL missing!"
-    print(f"Processing: {url}")
-    audio = get_audio(url)
     # get_audio returns either a path ending in ".mp3" or an error message, so the suffix tells them apart.
-    if not audio.endswith(".mp3"):
-        return audio # Return error message
     try:
         current_model = load_model()
-        # Beam size 1 is faster for CPU
-        segments, _ = current_model.transcribe(audio, beam_size=1)
         # Join the text of every segment with single spaces.
         text = " ".join([s.text for s in segments])
-        return text
     except Exception as e:
-        return f"Transcription Error: {str(e)}"
-# 5. UI
 # Gradio UI: a URL textbox and a button share one row, with a 10-line result textbox below.
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🚀 TikTok Transcriber (Fixed)")
-    gr.Markdown("Agar 'Status Code 0' error aaye, to TikTok ne server IP block kiya hai. Dobara try karein.")
     with gr.Row():
-        link = gr.Textbox(label="TikTok URL", placeholder="Paste https://vt.tiktok.com/... link")
-        btn = gr.Button("Transcribe", variant="primary")
-    out = gr.Textbox(label="Result", lines=10)
     # Clicking the button passes the textbox value to transcribe and writes its return value to `out`.
-    btn.click(fn=transcribe, inputs=link, outputs=out)
 demo.launch()

 import requests
 from faster_whisper import WhisperModel
+# --- 1. Model Setup ---
 model = None
 def load_model():
         print("✅ Model Loaded!")
     return model
+# --- 2. URL Resolver (Short -> Long) ---
 def get_actual_url(short_url):
     # Resolve short_url to its final URL by issuing a HEAD request that follows redirects.
     try:
         # The request is sent with a desktop-browser User-Agent header.
         headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'}
         response = requests.head(short_url, allow_redirects=True, headers=headers)
         return response.url
     except:
         # Best effort: on any exception, hand back the URL exactly as it was given.
         return short_url
+# --- 3. Process Video (Download & Transcribe) ---
+def process_video(url):
     # Download the video behind `url` with yt-dlp, then transcribe it.
     # Returns a 2-tuple (video_path_or_None, text): the path is None when the URL is missing or
     # the download fails; `text` is the transcript, or an error message on any failure path.
+    if not url:
+        return None, "⚠️ URL missing!"
+    print(f"Processing: {url}")
+    # 1. Resolve URL
+    actual_url = get_actual_url(url)
+    # 2. Download Video (MP4)
+    output_file = "tiktok_video.mp4"
+    # Clean up the old file
+    if os.path.exists(output_file): os.remove(output_file)
+    ffmpeg_path = shutil.which("ffmpeg") or "/usr/bin/ffmpeg"
     # NOTE(review): 'outtmpl' uses %(ext)s while the existence check below looks for
     # "tiktok_video.mp4"; if the '/best' fallback yields another extension the check would
     # presumably report a failed download even though a file was written - confirm.
+    ydl_opts = {
+        'format': 'best[ext=mp4]/best',  # <-- Now we are downloading the video
+        'outtmpl': "tiktok_video.%(ext)s",
+        'ffmpeg_location': ffmpeg_path,
+        'quiet': False,
+        'no_warnings': True,
+        'nocheckcertificate': True,
+        'http_headers': {
+            'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
+            'Referer': 'https://www.tiktok.com/'
         }
+    }
+    try:
         with yt_dlp.YoutubeDL(ydl_opts) as ydl:
             ydl.download([actual_url])
     except Exception as e:
+        return None, f"❌ Download Error: {str(e)}"
+    if not os.path.exists(output_file):
+        return None, "❌ Video download failed."
+    # 3. Transcribe (Audio from Video)
     try:
         current_model = load_model()
+        # Whisper will read the audio directly from the video file
+        segments, _ = current_model.transcribe(output_file, beam_size=1)
         text = " ".join([s.text for s in segments])
+        # Return Video Path AND Transcript Text
+        return output_file, text
     except Exception as e:
         # The video path is still returned here, alongside the error text.
+        return output_file, f"Transcription Error: {str(e)}"
+# --- 4. UI Design ---
 # Gradio UI: URL input and button on the first row; video player and transcript side by side below.
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🎵 TikTok Downloader & Transcriber")
+    gr.Markdown("Link paste karo -> Video download karo -> Text copy karo (Ek sath!)")
     with gr.Row():
+        link_input = gr.Textbox(label="TikTok URL", placeholder="Paste link here...", scale=4)
+        btn = gr.Button("🚀 Process", variant="primary", scale=1)
+    with gr.Row():
+        # Left Side: Video Player
+        with gr.Column():
+            video_out = gr.Video(label="Download Video", format="mp4")
+        # Right Side: Code Box for Easy Copy
+        with gr.Column():
+            # 'gr.Code' is used so that a 1-click copy button is available
+            transcript_out = gr.Code(label="Transcript (Click Copy Icon 📋)", language=None, lines=10)
+    # Button Action
     # process_video's two return values map, in order, onto video_out and transcript_out.
+    btn.click(fn=process_video, inputs=link_input, outputs=[video_out, transcript_out])
 demo.launch()