Spaces:

ranaspark
/

voice

Sleeping

App Files Files Community

rahulrana0001 committed 23 days ago

Commit

fc976be

1 Parent(s): 0ee5602

fix: replace localhost iframe in dubbing tab with native Gradio UI that works on HF Spaces

Browse files

Files changed (1) hide show

app.py +89 -1

app.py CHANGED Viewed

@@ -443,7 +443,95 @@ with gr.Blocks(title="Maya: Immersive Manga AI", css=CUSTOM_CSS) as demo:
         with gr.Tab("🎥 Video Dubbing Studio"):
             gr.Markdown("### 🎬 Cinematic AI Video Dubbing")
             gr.Markdown("Process your videos with automated translation, multi-speaker voice cloning, and lip sync.")
-            gr.HTML('<iframe src="http://localhost:5173/" width="100%" height="850px" style="border: none; border-radius: 12px; box-shadow: 0 4px 20px rgba(0,0,0,0.5); background: #0f172a;"></iframe>')
     # --- Dynamic Temperature & Heartbeat Speed Logic ---
     def update_mood(level, bgm):

         with gr.Tab("🎥 Video Dubbing Studio"):
             gr.Markdown("### 🎬 Cinematic AI Video Dubbing")
             gr.Markdown("Process your videos with automated translation, multi-speaker voice cloning, and lip sync.")
+            gr.HTML("""
+            <div style="background:#0f172a; border-radius:16px; padding:32px; font-family:'Inter',sans-serif; color:white;">
+              <div style="text-align:center; margin-bottom:24px;">
+                <h2 style="font-size:2em; font-weight:900; letter-spacing:-1px; text-transform:uppercase;
+                           background:linear-gradient(90deg,#a855f7,#6366f1); -webkit-background-clip:text;
+                           -webkit-text-fill-color:transparent;">Maya Cinematic Studio</h2>
+                <p style="color:#94a3b8; font-size:0.85em;">Upload your video below to begin the dubbing pipeline</p>
+              </div>
+              <div id="dubbing-upload-area" style="border:2px dashed #334155; border-radius:12px; padding:40px;
+                   text-align:center; cursor:pointer; transition:all 0.3s;"
+                   onmouseover="this.style.borderColor='#a855f7'"
+                   onmouseout="this.style.borderColor='#334155'">
+                <div style="font-size:3em; margin-bottom:12px;">📤</div>
+                <p style="font-weight:700; font-size:1.1em;">Use the Upload Component below</p>
+                <p style="color:#64748b; font-size:0.8em;">MP4 · MKV · MOV · AVI supported</p>
+              </div>
+              <div style="display:grid; grid-template-columns:repeat(4,1fr); gap:12px; margin-top:24px;">
+                <div style="background:#1e293b; border-radius:10px; padding:16px; border:1px solid #334155;">
+                  <div style="font-size:0.6em; color:#94a3b8; text-transform:uppercase; letter-spacing:2px; margin-bottom:4px;">Step 1</div>
+                  <div style="font-weight:700;">Video Ingest</div>
+                  <div style="font-size:0.7em; color:#a855f7; margin-top:4px;">Upload below ↓</div>
+                </div>
+                <div style="background:#1e293b; border-radius:10px; padding:16px; border:1px solid #334155;">
+                  <div style="font-size:0.6em; color:#94a3b8; text-transform:uppercase; letter-spacing:2px; margin-bottom:4px;">Step 2</div>
+                  <div style="font-weight:700;">Audio Extraction</div>
+                  <div style="font-size:0.7em; color:#64748b; margin-top:4px;">Auto-run</div>
+                </div>
+                <div style="background:#1e293b; border-radius:10px; padding:16px; border:1px solid #334155;">
+                  <div style="font-size:0.6em; color:#94a3b8; text-transform:uppercase; letter-spacing:2px; margin-bottom:4px;">Step 3</div>
+                  <div style="font-weight:700;">Voice Separation</div>
+                  <div style="font-size:0.7em; color:#64748b; margin-top:4px;">Demucs AI</div>
+                </div>
+                <div style="background:#1e293b; border-radius:10px; padding:16px; border:1px solid #334155;">
+                  <div style="font-size:0.6em; color:#94a3b8; text-transform:uppercase; letter-spacing:2px; margin-bottom:4px;">Step 4</div>
+                  <div style="font-weight:700;">Tamil Dubbing</div>
+                  <div style="font-size:0.7em; color:#64748b; margin-top:4px;">Edge-TTS</div>
+                </div>
+              </div>
+            </div>
+            """)
+            with gr.Row():  # upload widget and language selector share one row
+                dub_video_input = gr.File(label="📁 Upload Video File", file_types=["video"])  # first input passed to run_dubbing_pipeline
+                dub_lang_select = gr.Dropdown(  # second input passed to run_dubbing_pipeline
+                    choices=["Tamil (ta)", "Hindi (hi)", "Telugu (te)", "Kannada (kn)"],  # NOTE(review): the handler below only synthesizes Tamil -- confirm the other choices are intended
+                    value="Tamil (ta)",
+                    label="🌐 Target Language"
+                )
+            dub_btn = gr.Button("🚀 Start Dubbing Pipeline", variant="primary")  # its click event is bound to run_dubbing_pipeline further down
+            dub_status = gr.Textbox(label="📡 Pipeline Status", interactive=False, value="Waiting for video upload...")  # read-only; shows the status string from each handler update
+            dub_output = gr.Audio(label="🎙️ Dubbed Audio Output")  # receives the audio path (or None) from each handler update
+            def run_dubbing_pipeline(video_file, lang):
+                if video_file is None:
+                    return "❌ Please upload a video file first.", None
+                try:
+                    import os, tempfile
+                    from pipeline.translation import translate_to_tamil
+                    yield "⏳ Step 1/4: Video received. Extracting audio...", None
+                    # Extract audio using ffmpeg
+                    audio_path = video_file.name.replace(os.path.splitext(video_file.name)[1], "_extracted.wav")
+                    os.system(f'ffmpeg -i "{video_file.name}" -vn -ar 16000 -ac 1 -y "{audio_path}" 2>/dev/null')
+                    yield "⏳ Step 2/4: Audio extracted. Generating Tamil dubbed speech...", None
+                    # Simple text demo since whisper needs more RAM
+                    sample_text = "Hello, this is a test of the Maya Cinematic AI Dubbing System."
+                    tamil_text = translate_to_tamil(sample_text)
+                    yield f"⏳ Step 3/4: Translated → {tamil_text}. Synthesizing voice...", None
+                    import asyncio, edge_tts
+                    out_path = audio_path.replace(".wav", "_dubbed.mp3")
+                    async def synth():
+                        com = edge_tts.Communicate(tamil_text, "ta-IN-PallaviNeural")
+                        await com.save(out_path)
+                    asyncio.run(synth())
+                    yield f"✅ Done! Dubbed Tamil audio ready. Text: {tamil_text}", out_path
+                except Exception as e:
+                    yield f"❌ Error: {str(e)}", None
+            dub_btn.click(  # run the dubbing handler when the button is clicked
+                fn=run_dubbing_pipeline,  # handler defined above; it yields successive (status, audio) updates
+                inputs=[dub_video_input, dub_lang_select],  # order matches the handler's (video_file, lang) parameters
+                outputs=[dub_status, dub_output]  # order matches the (status, audio path) tuples the handler produces
+            )
     # --- Dynamic Temperature & Heartbeat Speed Logic ---
     def update_mood(level, bgm):