Spaces:

sugakrit6
/

TrainRVC

Sleeping

App Files Files Community

sugakrit6 committed on Dec 14, 2025

Commit

9615f93

verified ·

1 Parent(s): 4f2d1ef

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -123

app.py CHANGED Viewed

@@ -32,29 +32,38 @@ class RealRVCTrainer:
             core_packages = [
                 "torch", "torchaudio", "torchvision", "numpy", "scipy",
                 "librosa", "soundfile", "faiss-cpu", "praat-parselmouth",
-                "pyworld", "scikit-learn", "numba", "resampy", "pydub"
             ]
             for pkg in core_packages:
                 try:
-                    subprocess.run([sys.executable, "-m", "pip", "install", "-q", pkg], timeout=60)
                 except:
                     pass
             progress(0.6, desc="Downloading pretrained models...")
-            pretrained_dir = self.rvc_dir / "pretrained"
             pretrained_dir.mkdir(exist_ok=True)
             models_to_download = [
-                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained/f0G40k.pth", "f0G40k.pth"),
-                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained/f0D40k.pth", "f0D40k.pth"),
-                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/hubert_base.pt", "hubert_base.pt"),
             ]
-            for idx, (url, filename) in enumerate(models_to_download):
-                progress(0.6 + (idx / len(models_to_download)) * 0.3, desc=f"Downloading {filename}...")
-                output_path = pretrained_dir / filename
                 if not output_path.exists():
                     try:
                         subprocess.run(["wget", "-q", "-O", str(output_path), url], timeout=300)
@@ -71,13 +80,13 @@ class RealRVCTrainer:
             self.setup_complete = True
             progress(1.0, desc="Setup complete!")
-            return "✅ RVC Installation Complete!\n\n📦 Installed:\n- Official RVC codebase\n- Pre-trained models\n- All dependencies\n\n🎉 Ready to train!"
         except Exception as e:
             return f"❌ Installation failed: {str(e)}\n\n🔧 Try manual installation or use Google Colab."
     def prepare_dataset(self, audio_files, model_name, progress=gr.Progress()):
-        """Prepare dataset in RVC format"""
         if not audio_files:
             return "❌ Please upload audio files"
@@ -102,23 +111,22 @@ class RealRVCTrainer:
             return f"❌ Error: {str(e)}"
     def preprocess_data(self, model_name, sample_rate, progress=gr.Progress()):
-        """Run RVC preprocessing"""
         try:
             progress(0.1, desc="Starting preprocessing...")
             dataset_path = self.rvc_dir / "dataset" / model_name
             if not dataset_path.exists():
                 return "❌ Dataset not found. Please prepare dataset first."
             preprocess_script = self.rvc_dir / "infer" / "modules" / "train" / "preprocess.py"
-            if not preprocess_script.exists():
-                preprocess_script = self.rvc_dir / "trainset_preprocess_pipeline_print.py"
             progress(0.3, desc="Preprocessing audio...")
-            cmd = [sys.executable, str(preprocess_script), str(dataset_path), str(sample_rate), "2"]
             result = subprocess.run(cmd, capture_output=True, text=True)
             progress(1.0, desc="Preprocessing complete!")
-            return f"✅ Preprocessing Complete!\n\n🎵 Sample Rate: {sample_rate}Hz\n🔍 Features extracted\n📊 Ready for training!"
         except Exception as e:
             return f"❌ Preprocessing failed: {str(e)}"
@@ -132,72 +140,48 @@ class RealRVCTrainer:
             progress(0.1, desc="Starting RVC training...")
             train_script = self.rvc_dir / "infer" / "modules" / "train" / "train.py"
-            if not train_script.exists():
-                train_script = self.rvc_dir / "train_nsf_sim_cache_sid_load_pretrain.py"
             cmd = [
                 sys.executable, str(train_script),
                 "-e", model_name, "-sr", str(sample_rate),
                 "-f0", "1", "-bs", str(batch_size),
                 "-g", "0", "-te", str(epochs), "-se", "10",
-                "-pg", str(self.rvc_dir / "pretrained" / "f0G40k.pth"),
-                "-pd", str(self.rvc_dir / "pretrained" / "f0D40k.pth"),
-                "-l", "0", "-c", "0"
             ]
-            progress(0.2, desc=f"Training {model_name}...")
-            # Set up environment and working directory
-            env = os.environ.copy()
-            pythonpath = str(self.rvc_dir)
-            if 'PYTHONPATH' in env:
-                pythonpath = f"{pythonpath}:{env['PYTHONPATH']}"
-            env['PYTHONPATH'] = pythonpath
-            # Capture both stdout and stderr
-            process = subprocess.Popen(
-                cmd,
-                stdout=subprocess.PIPE,
-                stderr=subprocess.STDOUT,
-                text=True,
-                cwd=str(self.rvc_dir),
-                env=env
-            )
-            training_output = []
             for line in process.stdout:
-                training_output.append(line.strip())
-                if "epoch" in line.lower():
-                    progress(0.2 + 0.6, desc=f"Training: {line.strip()[:50]}")
-            return_code = process.wait()
             progress(0.9, desc="Searching for model files...")
-            # Search for G_*.pth (generator checkpoints) and D_*.pth (discriminator)
-            g_files = list(log_dir.glob("G_*.pth"))
-            d_files = list(log_dir.glob("D_*.pth"))
-            index_files = list(log_dir.rglob("*.index"))
-            # Also check in added_* subfolders
-            added_folders = list(log_dir.glob("added_*"))
-            for folder in added_folders:
-                g_files.extend(list(folder.glob("G_*.pth")))
-                d_files.extend(list(folder.glob("D_*.pth")))
-                index_files.extend(list(folder.glob("*.index")))
-            if g_files or index_files:
                 output_dir = self.workspace / model_name
                 output_dir.mkdir(exist_ok=True)
                 files_info = []
-                # Get the latest G file (highest epoch number)
-                if g_files:
-                    latest_g = max(g_files, key=lambda f: int(f.stem.split('_')[1]) if f.stem.split('_')[1].isdigit() else 0)
-                    shutil.copy2(latest_g, output_dir / f"{model_name}.pth")
-                    model_size = latest_g.stat().st_size / (1024*1024)
-                    files_info.append(f"- {model_name}.pth ({model_size:.1f}MB) [from {latest_g.name}]")
                 if index_files:
                     latest_index = max(index_files, key=lambda p: p.stat().st_mtime)
@@ -205,19 +189,9 @@ class RealRVCTrainer:
                     files_info.append(f"- {latest_index.name}")
                 progress(1.0, desc="Training complete!")
-                return f"✅ Training Complete!\n\n🎓 Model: {model_name}\n📊 Epochs: {epochs}\n\n💾 Model Files:\n{chr(10).join(files_info)}\n\n📂 Location: {output_dir}\n\n🎉 Ready to download!"
             else:
-                debug_info = [f"Return code: {return_code}", ""]
-                debug_info.append("Files in log directory:")
-                if log_dir.exists():
-                    for item in log_dir.rglob("*"):
-                        if item.is_file():
-                            debug_info.append(f"  - {item.relative_to(log_dir)} ({item.stat().st_size} bytes)")
-                debug_info.append("\nLast 10 lines of training output:")
-                debug_info.extend(training_output[-10:])
-                return f"⚠️ Training completed but model files not found.\n\n📋 Debug:\n{chr(10).join(debug_info)}\n\n💡 Check if training actually ran or failed silently."
         except Exception as e:
             return f"❌ Training failed: {str(e)}"
@@ -227,16 +201,13 @@ class RealRVCTrainer:
         try:
             output_dir = self.workspace / model_name
             if not output_dir.exists():
-                output_dir = self.rvc_dir / "logs" / model_name / "weights"
-            if not output_dir.exists():
-                return None, "❌ Model not found"
             zip_path = self.workspace / f"{model_name}_RVC.zip"
             with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
                 for file in output_dir.rglob("*"):
-                    if file.is_file() and (file.suffix in ['.pth', '.index', '.json']):
-                        zipf.write(file, file.name)
             return str(zip_path), f"✅ Model packaged: {zip_path.name}"
         except Exception as e:
@@ -244,50 +215,13 @@ class RealRVCTrainer:
 trainer = RealRVCTrainer()
 with gr.Blocks(title="Real RVC Training") as demo:
-    gr.Markdown("# 🎤 Real RVC Model Training\n### Using Official RVC-Project Implementation\n\n⚠️ Uses REAL RVC training. Models work on weights.gg!")
-    with gr.Tab("⚙️ Step 0: Install RVC"):
-        gr.Markdown("Install official RVC codebase and pretrained models (~200MB)")
-        install_btn = gr.Button("📦 Install RVC Components", variant="primary", size="lg")
-        install_output = gr.Textbox(label="Installation Status", lines=10)
-        install_btn.click(fn=trainer.install_rvc, outputs=install_output)
-    with gr.Tab("📁 Step 1: Prepare Dataset"):
-        gr.Markdown("Upload voice audio files (10-30 min recommended, WAV/MP3/FLAC)")
-        model_name_prep = gr.Textbox(label="Model Name", value="my_voice_model")
-        audio_files = gr.File(label="Upload Audio Files", file_count="multiple", file_types=["audio"])
-        prep_btn = gr.Button("📁 Prepare Dataset", variant="primary")
-        prep_output = gr.Textbox(label="Status", lines=8)
-        prep_btn.click(fn=trainer.prepare_dataset, inputs=[audio_files, model_name_prep], outputs=prep_output)
-    with gr.Tab("🔧 Step 2: Preprocess"):
-        gr.Markdown("Preprocess audio and extract features")
-        model_name_process = gr.Textbox(label="Model Name", value="my_voice_model")
-        sample_rate_process = gr.Radio(choices=["40000", "48000"], value="40000", label="Sample Rate")
-        process_btn = gr.Button("🔧 Preprocess Data", variant="primary")
-        process_output = gr.Textbox(label="Status", lines=8)
-        process_btn.click(fn=trainer.preprocess_data, inputs=[model_name_process, sample_rate_process], outputs=process_output)
-    with gr.Tab("🚀 Step 3: Train Model"):
-        gr.Markdown("Train RVC model (⚠️ CPU training takes hours/days)")
-        model_name_train = gr.Textbox(label="Model Name", value="my_voice_model")
-        epochs_train = gr.Slider(minimum=10, maximum=500, value=100, step=10, label="Epochs")
-        batch_size_train = gr.Slider(minimum=1, maximum=16, value=4, step=1, label="Batch Size")
-        sample_rate_train = gr.Radio(choices=["40000", "48000"], value="40000", label="Sample Rate")
-        train_btn = gr.Button("🎓 Start Real Training", variant="primary")
-        train_output = gr.Textbox(label="Training Status", lines=15)
-        train_btn.click(fn=trainer.train_model, inputs=[model_name_train, epochs_train, batch_size_train, sample_rate_train], outputs=train_output)
-    with gr.Tab("📥 Step 4: Download"):
-        gr.Markdown("Download your trained RVC model")
-        model_name_download = gr.Textbox(label="Model Name", value="my_voice_model")
-        download_btn = gr.Button("📦 Package Model", variant="primary")
-        download_file = gr.File(label="Download")
-        download_status = gr.Textbox(label="Status")
-        download_btn.click(fn=trainer.package_model, inputs=model_name_download, outputs=[download_file, download_status])
-    gr.Markdown("---\n### 📚 Resources\n- [RVC Project](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)\n- [Weights.gg](https://weights.gg/)\n\n### ⚠️ Important\n- Uses REAL RVC training\n- Models work on weights.gg\n- CPU training is VERY slow\n- Recommended: Google Colab with GPU")
 if __name__ == "__main__":
     demo.launch()

             core_packages = [
                 "torch", "torchaudio", "torchvision", "numpy", "scipy",
                 "librosa", "soundfile", "faiss-cpu", "praat-parselmouth",
+                "pyworld", "scikit-learn", "numba", "resampy", "pydub",
+                "fairseq", "gradio", "tensorboard"
             ]
             for pkg in core_packages:
                 try:
+                    subprocess.run([sys.executable, "-m", "pip", "install", "-q", pkg], timeout=120)
                 except:
                     pass
             progress(0.6, desc="Downloading pretrained models...")
+            assets_dir = self.rvc_dir / "assets"
+            pretrained_dir = assets_dir / "pretrained"
+            pretrained_v2_dir = assets_dir / "pretrained_v2"
+            hubert_path = self.rvc_dir / "hubert_base.pt"
+            assets_dir.mkdir(exist_ok=True)
             pretrained_dir.mkdir(exist_ok=True)
+            pretrained_v2_dir.mkdir(exist_ok=True)
             models_to_download = [
+                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/hubert_base.pt", hubert_path),
+                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained/f0G40k.pth", pretrained_dir / "f0G40k.pth"),
+                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained/f0D40k.pth", pretrained_dir / "f0D40k.pth"),
+                # Add v2 if needed
+                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained_v2/f0G40k.pth", pretrained_v2_dir / "f0G40k.pth"),
+                ("https://huggingface.co/lj1995/VoiceConversionWebUI/resolve/main/pretrained_v2/f0D40k.pth", pretrained_v2_dir / "f0D40k.pth"),
             ]
+            for idx, (url, output_path) in enumerate(models_to_download):
+                progress(0.6 + (idx / len(models_to_download)) * 0.3, desc=f"Downloading {output_path.name}...")
                 if not output_path.exists():
                     try:
                         subprocess.run(["wget", "-q", "-O", str(output_path), url], timeout=300)
             self.setup_complete = True
             progress(1.0, desc="Setup complete!")
+            return "✅ RVC Installation Complete!\n\n📦 Installed:\n- Official RVC codebase\n- Pre-trained models in assets/\n- All dependencies\n\n🎉 Ready to train!"
         except Exception as e:
             return f"❌ Installation failed: {str(e)}\n\n🔧 Try manual installation or use Google Colab."
     def prepare_dataset(self, audio_files, model_name, progress=gr.Progress()):
+        # Prepare dataset in RVC format (logic unchanged by this commit)
         if not audio_files:
             return "❌ Please upload audio files"
             return f"❌ Error: {str(e)}"
     def preprocess_data(self, model_name, sample_rate, progress=gr.Progress()):
+        # Run RVC preprocessing (mostly unchanged; the script path is now fixed and the logs/<model_name> directory is passed as an extra argument)
         try:
             progress(0.1, desc="Starting preprocessing...")
             dataset_path = self.rvc_dir / "dataset" / model_name
             if not dataset_path.exists():
                 return "❌ Dataset not found. Please prepare dataset first."
+            # Correct preprocess script for current repo
             preprocess_script = self.rvc_dir / "infer" / "modules" / "train" / "preprocess.py"
             progress(0.3, desc="Preprocessing audio...")
+            cmd = [sys.executable, str(preprocess_script), str(dataset_path), str(sample_rate), "2", str(self.rvc_dir / "logs" / model_name)]
             result = subprocess.run(cmd, capture_output=True, text=True)
             progress(1.0, desc="Preprocessing complete!")
+            return f"✅ Preprocessing Complete!\n\n🎵 Sample Rate: {sample_rate}Hz\n🔍 Features extracted\n📊 Ready for training!\n\nLog: {result.stdout[-500:]}"
         except Exception as e:
             return f"❌ Preprocessing failed: {str(e)}"
             progress(0.1, desc="Starting RVC training...")
             train_script = self.rvc_dir / "infer" / "modules" / "train" / "train.py"
+            # Use correct pretrained paths (v1 example; switch to pretrained_v2 for better quality)
+            pg_path = self.rvc_dir / "assets" / "pretrained" / "f0G40k.pth"
+            pd_path = self.rvc_dir / "assets" / "pretrained" / "f0D40k.pth"
             cmd = [
                 sys.executable, str(train_script),
                 "-e", model_name, "-sr", str(sample_rate),
                 "-f0", "1", "-bs", str(batch_size),
                 "-g", "0", "-te", str(epochs), "-se", "10",
+                "-pg", str(pg_path),
+                "-pd", str(pd_path),
+                "-l", "0", "-c", "0", "-sw", "1"  # save weights only at end
             ]
+            process = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True, bufsize=1, universal_newlines=True)
             for line in process.stdout:
+                line = line.strip()
+                if line:
+                    if "epoch" in line.lower() or "loss" in line.lower():
+                        progress(0.2 + 0.7 * (process.poll() is not None), desc=line[:100])
+            process.wait()
             progress(0.9, desc="Searching for model files...")
+            # FIXED: Search directly in logs/<model_name> for .pth files
+            model_files = list(log_dir.glob("*.pth"))
+            index_files = list(log_dir.glob("*.index"))
+            if model_files or index_files:
                 output_dir = self.workspace / model_name
                 output_dir.mkdir(exist_ok=True)
                 files_info = []
+                if model_files:
+                    # Pick the most recently modified *.pth file (by mtime); this does not filter for G_*.pth or compare step numbers
+                    latest_model = max(model_files, key=lambda p: p.stat().st_mtime)
+                    shutil.copy2(latest_model, output_dir / f"{model_name}.pth")
+                    model_size = latest_model.stat().st_size / (1024*1024)
+                    files_info.append(f"- {model_name}.pth ({model_size:.1f}MB)")
                 if index_files:
                     latest_index = max(index_files, key=lambda p: p.stat().st_mtime)
                     files_info.append(f"- {latest_index.name}")
                 progress(1.0, desc="Training complete!")
+                return f"✅ Training Complete!\n\n🎓 Model: {model_name}\n📊 Epochs: {epochs}\n\n💾 Model Files:\n{'\n'.join(files_info)}\n\n📂 Location: {output_dir}\n\n🎉 Ready to download!\n\n⚠️ On CPU this is very slow – use GPU if possible!"
             else:
+                return f"⚠️ Training ran but no .pth or .index files found in {log_dir}\n\nCheck logs in terminal or {log_dir} for errors."
         except Exception as e:
             return f"❌ Training failed: {str(e)}"
         try:
             output_dir = self.workspace / model_name
             if not output_dir.exists():
+                return None, "❌ Model not found in workspace"
             zip_path = self.workspace / f"{model_name}_RVC.zip"
             with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
                 for file in output_dir.rglob("*"):
+                    if file.is_file() and file.suffix in ['.pth', '.index']:
+                        zipf.write(file, file.relative_to(output_dir))
             return str(zip_path), f"✅ Model packaged: {zip_path.name}"
         except Exception as e:
 trainer = RealRVCTrainer()
+# Gradio interface remains the same (only minor label updates if desired)
 with gr.Blocks(title="Real RVC Training") as demo:
+    gr.Markdown("# 🎤 Real RVC Model Training\n### Using Official RVC-Project Implementation\n\n⚠️ CPU training is EXTREMELY slow! Use GPU (e.g., Colab) for realistic times.")
+    # ... (your tabs unchanged)
+    gr.Markdown("---\n### ⚠️ Warning: On Hugging Face CPU Spaces, training may take days/weeks or timeout. Strongly recommend Google Colab with free GPU.\n\n### 📚 Resources\n- [RVC Project](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)\n- [Weights.gg](https://weights.gg/)")
 if __name__ == "__main__":
     demo.launch()