Spaces:

Ricky01anjay
/

dubbingAI

Paused

App Files Community

Ricky01anjay committed on Mar 5

Commit

715617d

verified ·

1 Parent(s): d0df8c3

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -29

app.py CHANGED Viewed

@@ -9,9 +9,10 @@ import subprocess
 from flask import Flask, request, jsonify, render_template_string, send_from_directory
 import whisper
 import edge_tts
-# Nonaktifkan logging Flask default jika ingin benar-benar bersih
 import logging
 log = logging.getLogger('werkzeug')
 log.setLevel(logging.ERROR)
@@ -27,7 +28,7 @@ VOICE_MAP = {
     'ja-JP': 'ja-JP-KeitaNeural'
 }
-# Load Whisper tanpa log
 whisper_model = whisper.load_model("base")
 def get_audio_duration(file_path):
@@ -71,16 +72,15 @@ async def generate_tts(text, voice, path):
 def process_dubbing(task_id, video_path, target_voice, custom_prompt):
     try:
-        tasks[task_id]['status'] = 'Processing Audio...'
         orig_audio = os.path.join(app.config['UPLOAD_FOLDER'], f"{task_id}_orig.wav")
-        # Extract audio (Silent)
         subprocess.run(['ffmpeg', '-loglevel', 'quiet', '-y', '-i', video_path, '-vn', '-acodec', 'pcm_s16le', '-ar', '44100', orig_audio], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
-        # Transcribe (Silent)
         result = whisper_model.transcribe(orig_audio, verbose=False)
         segments = result['segments']
-        # Translate
         translated_segments = translate_segments_llm(segments, custom_prompt)
         processed_audio_files = []
@@ -96,17 +96,19 @@ def process_dubbing(task_id, video_path, target_voice, custom_prompt):
             asyncio.run(generate_tts(text, VOICE_MAP.get(target_voice, 'id-ID-ArdiNeural'), raw_tts))
             tts_dur = get_audio_duration(raw_tts)
-            speed = min(max(tts_dur / duration_orig, 0.5), 2.0) if duration_orig > 0 else 1.0
-            # Sync (Silent)
             subprocess.run(['ffmpeg', '-loglevel', 'quiet', '-y', '-i', raw_tts, '-filter:a', f'atempo={speed}', '-ar', '44100', sync_tts], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
             processed_audio_files.append({'path': sync_tts, 'start': start_t})
-        tasks[task_id]['status'] = 'Final Rendering...'
-        # Filter: Hapus vokal (bandreject), Volume 50%, Mix Dubbing
-        filter_complex = "[0:a]bandreject=f=1200:width_type=h:w=1000,volume=0.5[bg];"
         inputs_cmd = ['ffmpeg', '-loglevel', 'quiet', '-y', '-i', video_path]
         amix_inputs = "[bg]"
@@ -117,10 +119,16 @@ def process_dubbing(task_id, video_path, target_voice, custom_prompt):
             filter_complex += f"[{idx}:a]adelay={start_ms}|{start_ms}[dub{idx}];"
             amix_inputs += f"[dub{idx}]"
         filter_complex += f"{amix_inputs}amix=inputs={len(processed_audio_files)+1}:duration=first:dropout_transition=0[outa]"
         output_video = os.path.join(app.config['UPLOAD_FOLDER'], f"{task_id}_output.mp4")
-        final_cmd = inputs_cmd + ['-filter_complex', filter_complex, '-map', '0:v', '-map', '[outa]', '-c:v', 'libx264', '-preset', 'ultrafast', '-c:a', 'aac', output_video]
         subprocess.run(final_cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
@@ -137,7 +145,7 @@ def process_dubbing(task_id, video_path, target_voice, custom_prompt):
         tasks[task_id]['status'] = 'Error'
         tasks[task_id]['error_message'] = str(e)
-# --- WEB UI ---
 @app.route('/')
 def index():
@@ -165,28 +173,31 @@ HTML_TEMPLATE = """
 <!DOCTYPE html>
 <html>
 <head>
-    <title>AI Dubbing Silent Mode</title>
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
-    <style>body{background:#000;color:#fff;display:flex;align-items:center;justify-content:center;height:100vh;}.card{background:#111;border:1px solid #333;width:400px;padding:20px;border-radius:15px;}</style>
 </head>
 <body>
-    <div class="card text-center">
-        <h4>🎙️ AI Dubbing Sync</h4>
-        <p class="text-secondary small">Vocal removed, Background 50%</p>
         <form id="u">
-            <input type="file" id="v" class="form-control mb-2 bg-dark text-white" required>
-            <select id="s" class="form-select mb-2 bg-dark text-white">
-                <option value="id-ID">Indonesia</option>
-                <option value="en-US">English</option>
-                <option value="ja-JP">Japanese</option>
             </select>
-            <textarea id="p" class="form-control mb-3 bg-dark text-white" placeholder="Custom prompt..."></textarea>
             <button type="submit" id="b" class="btn btn-primary w-100">Mulai Proses</button>
         </form>
-        <div id="l" class="mt-3 d-none"><div class="spinner-border spinner-border-sm text-primary"></div> <span id="st">...</span></div>
-        <div id="r" class="mt-3 d-none">
-            <video id="vd" controls class="w-100 rounded mb-2"></video>
-            <a id="dl" href="#" class="btn btn-success btn-sm w-100" download>Download Result</a>
         </div>
     </div>
     <script>

 from flask import Flask, request, jsonify, render_template_string, send_from_directory
 import whisper
 import edge_tts
 import logging
+# Matikan log Flask & Werkzeug
+os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
 log = logging.getLogger('werkzeug')
 log.setLevel(logging.ERROR)
     'ja-JP': 'ja-JP-KeitaNeural'
 }
+# Load Whisper (Model Base sangat ringan untuk RAM 16GB)
 whisper_model = whisper.load_model("base")
 def get_audio_duration(file_path):
 def process_dubbing(task_id, video_path, target_voice, custom_prompt):
     try:
+        tasks[task_id]['status'] = 'Mengekstrak Suara...'
         orig_audio = os.path.join(app.config['UPLOAD_FOLDER'], f"{task_id}_orig.wav")
         subprocess.run(['ffmpeg', '-loglevel', 'quiet', '-y', '-i', video_path, '-vn', '-acodec', 'pcm_s16le', '-ar', '44100', orig_audio], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
+        # Transkripsi Whisper (Silent)
         result = whisper_model.transcribe(orig_audio, verbose=False)
         segments = result['segments']
+        # Translasi AI
         translated_segments = translate_segments_llm(segments, custom_prompt)
         processed_audio_files = []
             asyncio.run(generate_tts(text, VOICE_MAP.get(target_voice, 'id-ID-ArdiNeural'), raw_tts))
+            # Sync Speed
             tts_dur = get_audio_duration(raw_tts)
+            speed = min(max(tts_dur / duration_orig, 0.6), 1.9) if duration_orig > 0 else 1.0
             subprocess.run(['ffmpeg', '-loglevel', 'quiet', '-y', '-i', raw_tts, '-filter:a', f'atempo={speed}', '-ar', '44100', sync_tts], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
             processed_audio_files.append({'path': sync_tts, 'start': start_t})
+        tasks[task_id]['status'] = 'Menghapus Vokal & Rendering...'
+        # LOGIKA HAPUS VOKAL (Stereotools Center Removal) + Volume BG 100% (1.0)
+        # Filter stereotools mengekstrak side channel (instrumen) dan membuang center channel (vokal).
+        filter_complex = "[0:a]stereotools=mlev=0.0:slev=1.0:phasel=1:phaser=1[bg];"
         inputs_cmd = ['ffmpeg', '-loglevel', 'quiet', '-y', '-i', video_path]
         amix_inputs = "[bg]"
             filter_complex += f"[{idx}:a]adelay={start_ms}|{start_ms}[dub{idx}];"
             amix_inputs += f"[dub{idx}]"
+        # Mixing: BG tetap volume 1.0 (aslinya), Dubbing volume 1.0
         filter_complex += f"{amix_inputs}amix=inputs={len(processed_audio_files)+1}:duration=first:dropout_transition=0[outa]"
         output_video = os.path.join(app.config['UPLOAD_FOLDER'], f"{task_id}_output.mp4")
+        final_cmd = inputs_cmd + [
+            '-filter_complex', filter_complex,
+            '-map', '0:v', '-map', '[outa]',
+            '-c:v', 'libx264', '-preset', 'ultrafast', '-crf', '23', '-c:a', 'aac', '-b:a', '192k',
+            output_video
+        ]
         subprocess.run(final_cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
         tasks[task_id]['status'] = 'Error'
         tasks[task_id]['error_message'] = str(e)
+# --- UI DASAR ---
 @app.route('/')
 def index():
 <!DOCTYPE html>
 <html>
 <head>
+    <title>AI Dubbing No Vocal</title>
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
+    <style>body{background:#000;color:#fff;display:flex;align-items:center;justify-content:center;height:100vh;}.card{background:#111;border:1px solid #333;width:420px;padding:25px;border-radius:20px;}</style>
 </head>
 <body>
+    <div class="card shadow-lg">
+        <h4 class="text-center mb-3">🎙️ Dubbing Sync Pro</h4>
+        <p class="text-center text-secondary small mb-4">Background Asli 100% | Vokal Dihapus</p>
         <form id="u">
+            <input type="file" id="v" class="form-control mb-2 bg-dark text-white border-secondary" required>
+            <select id="s" class="form-select mb-2 bg-dark text-white border-secondary">
+                <option value="id-ID">Indonesia 🇮🇩</option>
+                <option value="en-US">English 🇺🇸</option>
+                <option value="ja-JP">Japanese 🇯🇵</option>
             </select>
+            <textarea id="p" class="form-control mb-3 bg-dark text-white border-secondary" placeholder="Prompt (Opsional)..."></textarea>
             <button type="submit" id="b" class="btn btn-primary w-100">Mulai Proses</button>
         </form>
+        <div id="l" class="mt-4 d-none text-center">
+            <div class="spinner-border text-primary spinner-border-sm"></div>
+            <span id="st" class="ms-2 small">Menyiapkan...</span>
+        </div>
+        <div id="r" class="mt-4 d-none text-center">
+            <video id="vd" controls class="w-100 rounded border border-secondary mb-3"></video>
+            <a id="dl" href="#" class="btn btn-success w-100 btn-sm" download>Download Hasil</a>
         </div>
     </div>
     <script>