Spaces:

scratchyourbrain123
/

MuseTalk

Running

App Files Files Community

scratchyourbrain123 committed on Oct 22, 2025

Commit

fea5695

verified ·

1 Parent(s): dc5a491

Create initial Gradio app for MuseTalk

Browse files

Initial setup of MuseTalk Space with Gradio interface for audio-driven lip sync

Files changed (1) hide show

app.py +80 -0

app.py ADDED Viewed

	@@ -0,0 +1,80 @@

+import gradio as gr
+import os
+import subprocess
+import sys
+# MuseTalk Gradio Interface
+def setup_musetalk():
+    """Clone and setup MuseTalk repository"""
+    if not os.path.exists('MuseTalk'):
+        subprocess.run(['git', 'clone', 'https://github.com/TMElyralab/MuseTalk.git'], check=True)
+    os.chdir('MuseTalk')
+    subprocess.run([sys.executable, '-m', 'pip', 'install', '-r', 'requirements.txt'], check=True)
+def inference(video_file, audio_file, bbox_shift=0):
+    """Run MuseTalk inference"""
+    try:
+        # Run inference script
+        cmd = [
+            sys.executable,
+            'scripts/inference/gradio_demo.py',
+            '--video', video_file.name,
+            '--audio', audio_file.name,
+            '--bbox_shift', str(bbox_shift)
+        ]
+        result = subprocess.run(cmd, capture_output=True, text=True)
+        # Return the generated video
+        output_path = 'results/output.mp4'
+        if os.path.exists(output_path):
+            return output_path
+        else:
+            return None
+    except Exception as e:
+        return f"Error: {str(e)}"
+# Create Gradio interface
+with gr.Blocks(title="MuseTalk - Real-time Audio-Driven Lip Sync") as demo:
+    gr.Markdown("""
+    # MuseTalk: Real-Time High-Quality Lip Synchronization
+    Upload a video and audio file to generate lip-synced output.
+    **Note:** First run will download required model weights (~2GB).
+    """)
+    with gr.Row():
+        with gr.Column():
+            video_input = gr.Video(label="Input Video")
+            audio_input = gr.Audio(label="Input Audio", type="filepath")
+            bbox_shift = gr.Slider(minimum=-10, maximum=10, value=0, step=1,
+                                   label="BBox Shift",
+                                   info="Adjust face bounding box position")
+            submit_btn = gr.Button("Generate", variant="primary")
+        with gr.Column():
+            video_output = gr.Video(label="Output Video")
+    submit_btn.click(
+        fn=inference,
+        inputs=[video_input, audio_input, bbox_shift],
+        outputs=video_output
+    )
+    gr.Markdown("""
+    ## About MuseTalk
+    MuseTalk generates lip-synchronized videos from input video and audio files.
+    - [GitHub Repository](https://github.com/TMElyralab/MuseTalk)
+    - [Model Weights](https://huggingface.co/TMElyralab/MuseTalk)
+    """)
+if __name__ == "__main__":
+    # Setup MuseTalk on first run
+    try:
+        setup_musetalk()
+    except Exception as e:
+        print(f"Setup warning: {e}")
+    demo.launch()