broadfield-dev committed on
Commit
1cb26d6
·
verified ·
1 Parent(s): 4324db0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +68 -17
app.py CHANGED
@@ -3,6 +3,11 @@ import subprocess
3
  import sys
4
  from pathlib import Path
5
 
 
 
 
 
 
6
  # --- 1. Clone the VibeVoice Repository ---
7
  repo_dir = "VibeVoice"
8
  if not os.path.exists(repo_dir):
@@ -21,10 +26,11 @@ if not os.path.exists(repo_dir):
21
  else:
22
  print("Repository already exists. Skipping clone.")
23
 
24
- # --- 2. Install the Package ---
25
  os.chdir(repo_dir)
26
  print(f"Changed directory to: {os.getcwd()}")
27
 
 
28
  print("Installing the VibeVoice package...")
29
  try:
30
  subprocess.run(
@@ -38,38 +44,83 @@ except subprocess.CalledProcessError as e:
38
  print(f"Error installing package: {e.stderr}")
39
  sys.exit(1)
40
 
41
- # --- 3. Modify the demo script for CPU execution (Robust Method) ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  demo_script_path = Path("demo/gradio_demo.py")
43
- print(f"Modifying {demo_script_path} for CPU execution...")
44
 
45
  try:
46
- # Read the entire file content
47
  file_content = demo_script_path.read_text()
 
 
 
48
 
49
- # Define the original GPU-specific model loading block
50
- original_block = """ self.model = VibeVoiceForConditionalGenerationInference.from_pretrained(
51
  self.model_path,
52
  torch_dtype=torch.bfloat16,
53
  device_map='cuda',
54
  attn_implementation="flash_attention_2",
55
  )"""
56
 
57
- # Define the new CPU-compatible block
58
- replacement_block = """ self.model = VibeVoiceForConditionalGenerationInference.from_pretrained(
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
  self.model_path,
60
  torch_dtype=torch.float32, # Use float32 for CPU
61
  device_map="cpu",
62
  )"""
63
 
64
- # Replace the entire block
65
- if original_block in file_content:
66
- modified_content = file_content.replace(original_block, replacement_block)
67
-
68
- # Write the modified content back to the file
69
- demo_script_path.write_text(modified_content)
70
- print("Script modified successfully.")
71
- else:
72
- print("Warning: GPU-specific model loading block not found. The script might have been updated. Proceeding without modification.")
73
 
74
  except Exception as e:
75
  print(f"An error occurred while modifying the script: {e}")
 
3
  import sys
4
  from pathlib import Path
5
 
6
+ # --- 0. Hardcoded Toggle for Execution Environment ---
7
+ # Set this to True to use Hugging Face ZeroGPU
8
+ # Set this to False to use a pure CPU environment
9
+ USE_ZEROGPU = True
10
+
11
  # --- 1. Clone the VibeVoice Repository ---
12
  repo_dir = "VibeVoice"
13
  if not os.path.exists(repo_dir):
 
26
  else:
27
  print("Repository already exists. Skipping clone.")
28
 
29
+ # --- 2. Install Dependencies ---
30
  os.chdir(repo_dir)
31
  print(f"Changed directory to: {os.getcwd()}")
32
 
33
+ # Install the main package
34
  print("Installing the VibeVoice package...")
35
  try:
36
  subprocess.run(
 
44
  print(f"Error installing package: {e.stderr}")
45
  sys.exit(1)
46
 
47
+ # Install 'spaces' if using ZeroGPU
48
+ if USE_ZEROGPU:
49
+ print("Installing the 'spaces' library for ZeroGPU...")
50
+ try:
51
+ subprocess.run(
52
+ [sys.executable, "-m", "pip", "install", "huggingface-hub", "gradio", "spaces"],
53
+ check=True,
54
+ capture_output=True,
55
+ text=True
56
+ )
57
+ print("'spaces' library installed successfully.")
58
+ except subprocess.CalledProcessError as e:
59
+ print(f"Error installing 'spaces' library: {e.stderr}")
60
+ sys.exit(1)
61
+
62
+
63
+ # --- 3. Modify the demo script based on the toggle ---
64
  demo_script_path = Path("demo/gradio_demo.py")
65
+ print(f"Reading {demo_script_path}...")
66
 
67
  try:
 
68
  file_content = demo_script_path.read_text()
69
+
70
+ if USE_ZEROGPU:
71
+ print("Optimizing for ZeroGPU execution...")
72
 
73
+ # Ensure the original GPU block is present
74
+ original_block = """ self.model = VibeVoiceForConditionalGenerationInference.from_pretrained(
75
  self.model_path,
76
  torch_dtype=torch.bfloat16,
77
  device_map='cuda',
78
  attn_implementation="flash_attention_2",
79
  )"""
80
 
81
+ if original_block in file_content:
82
+ # Add 'import spaces' at the beginning of the file
83
+ modified_content = "import spaces\n" + file_content
84
+
85
+ # Decorate the model loading and generation functions with @spaces.GPU
86
+ # This is a robust way to ensure both setup and inference get GPU access
87
+ modified_content = modified_content.replace(
88
+ "class VibeVoiceGradioInterface:",
89
+ "@spaces.GPU\nclass VibeVoiceGradioInterface:"
90
+ )
91
+ print("Script modified for ZeroGPU successfully.")
92
+
93
+ # Write the modified content back to the file
94
+ demo_script_path.write_text(modified_content)
95
+ else:
96
+ print("Warning: Original GPU-specific model loading block not found. The script might have been updated. Proceeding with potential ZeroGPU compatibility.")
97
+
98
+ else:
99
+ print("Modifying for CPU execution...")
100
+ # Define the original GPU-specific model loading block
101
+ original_block = """ self.model = VibeVoiceForConditionalGenerationInference.from_pretrained(
102
+ self.model_path,
103
+ torch_dtype=torch.bfloat16,
104
+ device_map='cuda',
105
+ attn_implementation="flash_attention_2",
106
+ )"""
107
+
108
+ # Define the new CPU-compatible block
109
+ replacement_block = """ self.model = VibeVoiceForConditionalGenerationInference.from_pretrained(
110
  self.model_path,
111
  torch_dtype=torch.float32, # Use float32 for CPU
112
  device_map="cpu",
113
  )"""
114
 
115
+ # Replace the entire block
116
+ if original_block in file_content:
117
+ modified_content = file_content.replace(original_block, replacement_block)
118
+
119
+ # Write the modified content back to the file
120
+ demo_script_path.write_text(modified_content)
121
+ print("Script modified for CPU successfully.")
122
+ else:
123
+ print("Warning: GPU-specific model loading block not found. The script might have been updated. Proceeding without modification.")
124
 
125
  except Exception as e:
126
  print(f"An error occurred while modifying the script: {e}")