Spaces:

sg123321
/

xtts

Sleeping

App Files Files Community

sg123321 committed 17 days ago

Commit

1dd5ac4

verified ·

1 Parent(s): c0b8023

Update app.py

Browse files

Files changed (1) hide show

app.py +136 -59

app.py CHANGED Viewed

@@ -1,87 +1,164 @@
 import uuid
 import gradio as gr
 import torch
 import spaces
 from TTS.api import TTS
 from supabase import create_client, Client
-# 👇 यहाँ हमने आपकी नई अलग फाइल को इंपोर्ट किया
-import config
-# 1. Setup Supabase (Using config file)
 supabase = None
 if config.IS_CONNECTED:
     try:
         supabase: Client = create_client(config.SUPABASE_URL, config.SUPABASE_KEY)
-        print("✅ Supabase Client Connected!")
     except Exception as e:
-        print(f"❌ Connection Error: {e}")
-# 2. Terms & Model Setup
-import os
 os.environ["COQUI_TOS_AGREED"] = "1"
 device = "cuda" if torch.cuda.is_available() else "cpu"
-print(f"⚙️ Device: {device}")
-print("⏳ Loading XTTS Model...")
 tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
-# 3. Main Logic
 @spaces.GPU(duration=120)
-def clone_voice(text, language, speaker_audio):
-    if not text or not speaker_audio:
-        return None, "Error: Text or Audio missing"
-    filename = f"generated_{uuid.uuid4()}.wav"
-    output_path = "output.wav"
-    # A. Generate Audio
-    print("🎙️ Generating...")
     tts.tts_to_file(
         text=text,
         file_path=output_path,
-        speaker_wav=speaker_audio,
         language=language
     )
-    # B. Upload using Config vars
-    storage_url = "Not Saved"
-    if supabase:
-        try:
-            with open(output_path, 'rb') as f:
-                supabase.storage.from_("voice-bucket").upload(filename, f)
-            # URL बनाना
-            storage_url = f"{config.SUPABASE_URL}/storage/v1/object/public/voice-bucket/{filename}"
-            print(f"✅ Uploaded: {storage_url}")
-            # Database Entry
-            data = {
-                "name": f"Clone_{language}",
-                "file_path": storage_url,
-                "ref_text": text
-            }
-            supabase.table("clones").insert(data).execute()
-        except Exception as e:
-            print(f"❌ Error: {e}")
-            storage_url = f"Error: {e}"
-    return output_path, storage_url
-# 4. Interface
-with gr.Interface(
-    fn=clone_voice,
-    inputs=[
-        gr.Textbox(label="Text", value="Config file test successful!", lines=2),
-        gr.Dropdown(label="Language", choices=["hi", "en"], value="hi"),
-        gr.Audio(label="Audio", type="filepath")
-    ],
-    outputs=[
-        gr.Audio(label="Result"),
-        gr.Textbox(label="Cloud Link")
-    ],
-    title="🚀 Shubham's Clean Code XTTS",
-    description="Running with separate config file."
-) as iface:
-    iface.launch(server_name="0.0.0.0", server_port=7860)

+import os
 import uuid
 import gradio as gr
 import torch
 import spaces
 from TTS.api import TTS
 from supabase import create_client, Client
+import config # local config module; this block reads IS_CONNECTED, SUPABASE_URL and SUPABASE_KEY from it
+# 1. Supabase Connection
+# `supabase` remains None when config.IS_CONNECTED is falsy or create_client()
+# raises, so later code can test it to see whether cloud storage is available.
 supabase = None
 if config.IS_CONNECTED:
     try:
         supabase: Client = create_client(config.SUPABASE_URL, config.SUPABASE_KEY)
+        print("✅ Supabase Connected!")
     except Exception as e:
+        # A connection failure is only logged; start-up continues with supabase = None.
+        print(f"❌ Supabase Error: {e}")
+# 2. Model Setup
+# COQUI_TOS_AGREED is set before the model is constructed — presumably so the
+# Coqui licence prompt is skipped in this non-interactive app (TODO confirm
+# against the TTS documentation).
 os.environ["COQUI_TOS_AGREED"] = "1"
+# Use the GPU when torch reports one, otherwise fall back to the CPU.
 device = "cuda" if torch.cuda.is_available() else "cpu"
+print(f"⏳ Loading XTTS Model on {device}...")
+# Module-level model instance: built once at import time and used by generate_preview.
 tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
+# --- Helper Functions ---
+def get_voice_list():
+    """Return the names of the audio files stored in the Supabase bucket.
+
+    Returns:
+        A list of object names from "voice-bucket" that end in ".wav" or
+        ".mp3". The list is empty when no Supabase client is available or
+        when the listing fails (the error is printed, not raised).
+    """
+    if not supabase:
+        return []
+    audio_suffixes = ('.wav', '.mp3')
+    try:
+        # Fetch every entry of 'voice-bucket', then keep only the audio files.
+        bucket_entries = supabase.storage.from_("voice-bucket").list()
+        voice_names = []
+        for entry in bucket_entries:
+            entry_name = entry['name']
+            if entry_name.endswith(audio_suffixes):
+                voice_names.append(entry_name)
+        return voice_names
+    except Exception as e:
+        print(f"List Error: {e}")
+        return []
+def download_cloud_voice(filename):
+    """Download a reference voice from the Supabase bucket to a local temp file.
+
+    Args:
+        filename: Object name inside "voice-bucket".
+
+    Returns:
+        Path of the local copy, named "temp_<basename of filename>".
+
+    Raises:
+        RuntimeError: If no Supabase client is connected.
+        Exception: Whatever the storage client raises when the download fails.
+    """
+    if not supabase:
+        raise RuntimeError("Supabase not connected!")
+    # Keep only the final path component so an object name that contains
+    # separators cannot point the local copy outside the working directory
+    # (or at a directory that does not exist).
+    local_path = f"temp_{os.path.basename(filename)}"
+    # Download before opening the target so a failed download does not leave
+    # an empty file behind.
+    audio_bytes = supabase.storage.from_("voice-bucket").download(filename)
+    with open(local_path, 'wb') as f:
+        f.write(audio_bytes)
+    return local_path
+# --- Main Logic ---
 @spaces.GPU(duration=120)
+def generate_preview(text, language, upload_voice, cloud_voice_name):
+    """Synthesise `text` in a cloned voice and return a local preview file.
+
+    Args:
+        text: Text to speak.
+        language: Language code passed through to the TTS model.
+        upload_voice: Path of an uploaded reference recording, or None.
+        cloud_voice_name: Name of a reference recording in the Supabase
+            bucket; only used when no file was uploaded.
+
+    Returns:
+        (audio_path, status_message). audio_path is None when the input is
+        incomplete or the cloud voice could not be downloaded.
+    """
+    # 0. Reject empty text before doing any download or GPU work.
+    if not text or not text.strip():
+        return None, "⚠️ Please enter some text to speak!"
+    # 1. Voice Selection Logic (an uploaded file takes priority)
+    speaker_wav = None
+    if upload_voice is not None:
+        print("🎙️ Using Uploaded Voice")
+        speaker_wav = upload_voice
+    elif cloud_voice_name:
+        print(f"☁️ Using Cloud Voice: {cloud_voice_name}")
+        try:
+            speaker_wav = download_cloud_voice(cloud_voice_name)
+        except Exception as e:
+            return None, f"Error downloading voice: {e}"
+    else:
+        return None, "⚠️ Please upload a voice OR select one from Cloud!"
+    # 2. Preview Logic (Delete Previous / Overwrite)
+    # The same name 'preview.wav' is always reused, so every new preview
+    # overwrites the previous one and no old previews pile up.
+    # NOTE(review): the fixed name is shared by all sessions — concurrent
+    # users could overwrite each other's preview; confirm this is acceptable.
+    output_path = "preview.wav"
+    print("🔄 Generating Preview...")
     tts.tts_to_file(
         text=text,
         file_path=output_path,
+        speaker_wav=speaker_wav,
         language=language
     )
+    return output_path, "✅ Preview Ready! Save karne ke liye neeche button dabayein."
+def save_to_cloud(preview_path, text, language):
+    """Upload the current preview to Supabase and record it in the `clones` table.
+
+    Runs only when the user explicitly asks to save a preview.
+
+    Args:
+        preview_path: Local path of the preview audio file.
+        text: The text that was spoken; stored as "ref_text".
+        language: Language code; used in the object name and the row name.
+
+    Returns:
+        A status message: a warning when there is no preview or no Supabase
+        client, the public link on success, or the error text on failure.
+    """
+    if not preview_path or not os.path.exists(preview_path):
+        return "⚠️ No preview found! Pehle 'Generate Preview' karein."
+    if not supabase:
+        return "❌ Supabase not connected!"
+    # Fresh unique object name so saved clips never overwrite each other.
+    filename = f"final_{language}_{uuid.uuid4()}.wav"
+    try:
+        print("☁️ Uploading to Supabase...")
+        with open(preview_path, 'rb') as f:
+            # Declare the MIME type explicitly: without it the storage client
+            # falls back to its default text content type, so the public link
+            # would not be served as audio (confirm the default for the
+            # installed client version).
+            supabase.storage.from_("voice-bucket").upload(
+                filename, f, file_options={"content-type": "audio/wav"}
+            )
+        # Public link
+        storage_url = f"{config.SUPABASE_URL}/storage/v1/object/public/voice-bucket/{filename}"
+        # Database entry
+        data = {
+            "name": f"Clone_{language}",
+            "file_path": storage_url,
+            "ref_text": text
+        }
+        supabase.table("clones").insert(data).execute()
+        return f"🎉 Saved Successfully! Link: {storage_url}"
+    except Exception as e:
+        return f"❌ Save Error: {e}"
+# --- UI Layout (Blocks) ---
+# Two-step flow: "Generate Preview" synthesises audio locally; "Save" uploads
+# the previewed file to Supabase only when the user asks for it.
+with gr.Blocks(title="Shubham's Ultimate Voice Cloner") as app:
+    gr.Markdown("## 🚀 XTTS Voice Cloning (With Preview & Cloud Select)")
+    with gr.Row():
+        # Text Input Area
+        with gr.Column():
+            txt_input = gr.Textbox(label="Text to Speak", lines=3, value="Namaste, main ab preview lekar cloud par save ho sakta hoon.")
+            lang_dropdown = gr.Dropdown(label="Language", choices=["hi", "en", "es", "fr"], value="hi")
+        # Voice Selection Area
+        with gr.Column():
+            gr.Markdown("### 🎤 Select Voice Source")
+            # Option A: upload a new reference recording
+            voice_upload = gr.Audio(label="Option A: Upload New Voice", type="filepath")
+            # Option B: pick a recording already stored in the Supabase bucket
+            # (the choices are fetched once, when the UI is built)
+            voice_dropdown = gr.Dropdown(label="Option B: Choose from Supabase", choices=get_voice_list(), interactive=True)
+            refresh_btn = gr.Button("🔄 Refresh Cloud List")  # re-fetches the bucket listing
+    # Action Buttons
+    btn_preview = gr.Button("🔊 Generate Preview (Wait for it...)", variant="primary")
+    # Output Area
+    # type="filepath" because this component is also passed as an input to
+    # save_to_cloud, which needs a path on disk. With Gradio's default
+    # (type="numpy") the callback would receive a (sample_rate, data) tuple,
+    # which os.path.exists() / open() in save_to_cloud cannot handle.
+    audio_output = gr.Audio(label="Preview Audio (Temporary)", type="filepath")
+    status_msg = gr.Textbox(label="Status", interactive=False)
+    # Save Button (to be pressed after a preview has been generated)
+    btn_save = gr.Button("☁️ Save this to Supabase", variant="secondary")
+    # --- Click Events ---
+    # 1. Refresh Button Logic
+    def refresh_list():
+        """Return a dropdown update carrying the current bucket listing."""
+        return gr.Dropdown(choices=get_voice_list())
+    refresh_btn.click(refresh_list, outputs=voice_dropdown)
+    # 2. Preview Generation
+    btn_preview.click(
+        fn=generate_preview,
+        inputs=[txt_input, lang_dropdown, voice_upload, voice_dropdown],
+        outputs=[audio_output, status_msg]
+    )
+    # 3. Save to Cloud
+    btn_save.click(
+        fn=save_to_cloud,
+        inputs=[audio_output, txt_input, lang_dropdown],
+        outputs=status_msg
+    )
+if __name__ == "__main__":
+    app.launch(server_name="0.0.0.0", server_port=7860)