Spaces:

Agents-MCP-Hackathon
/

pdf_explainer

Paused

App Files Files Community

spagestic committed on Jun 6, 2025

Commit

c8f218f

1 Parent(s): fa5acc0

chatterbox imported

Browse files

Files changed (6) hide show

.env.example +6 -0
ui/chatterbox/check_api_health.py +13 -0
ui/chatterbox/custom_css.py +9 -0
ui/chatterbox/generate_sample_text.py +10 -0
ui/chatterbox/generate_tts_audio.py +62 -0
ui/chatterbox/update_char_count.py +3 -0

.env.example CHANGED Viewed

@@ -3,3 +3,9 @@
 # Mistral AI API Key - Get yours from https://console.mistral.ai/
 MISTRAL_API_KEY=your_mistral_api_key_here

 # Mistral AI API Key - Get yours from https://console.mistral.ai/
 MISTRAL_API_KEY=your_mistral_api_key_here
+HEALTH_ENDPOINT=https://your-modal-endpoint/chatterbox-health
+GENERATE_AUDIO_ENDPOINT=https://your-modal-endpoint/chatterbox-generate-audio
+GENERATE_JSON_ENDPOINT=https://your-modal-endpoint/chatterbox-generate-json
+GENERATE_WITH_FILE_ENDPOINT=https://your-modal-endpoint/chatterbox-generate-with-file
+GENERATE_ENDPOINT=https://your-modal-endpoint/chatterbox-generate

ui/chatterbox/check_api_health.py ADDED Viewed

	@@ -0,0 +1,13 @@

+def check_api_health():
+    import requests
+    import os
+    HEALTH_ENDPOINT = os.getenv("HEALTH_ENDPOINT", "YOUR-MODAL-ENDPOINT-URL/health")
+    try:
+        response = requests.get(HEALTH_ENDPOINT, timeout=10)
+        if response.status_code == 200:
+            data = response.json()
+            return f"✅ API Status: {data.get('status', 'Unknown')} | Model Loaded: {data.get('model_loaded', False)}"
+        else:
+            return f"⚠️ API returned status code: {response.status_code}"
+    except Exception as e:
+        return f"❌ API Health Check Failed: {str(e)}"

ui/chatterbox/custom_css.py ADDED Viewed

	@@ -0,0 +1,9 @@

+# CSS overrides kept as a plain string: caps `.gradio-container` at 1200px wide
+# and gives `.status-box` elements padding and rounded corners.
+# NOTE(review): presumably handed to Gradio as custom CSS — confirm at the call site.
+custom_css = """
+.gradio-container {
+    max-width: 1200px !important;
+}
+.status-box {
+    padding: 10px;
+    border-radius: 5px;
+}
+"""

ui/chatterbox/generate_sample_text.py ADDED Viewed

	@@ -0,0 +1,10 @@

+def generate_sample_text():
+    import random
+    samples = [
+        "Hello! This is a test of the Chatterbox TTS system running on Modal.",
+        "The quick brown fox jumps over the lazy dog.",
+        "Welcome to the future of text-to-speech technology.",
+        "Now let's make my mum's favourite. So three mars bars into the pan. Then we add the tuna and just stir for a bit, just let the chocolate and fish infuse.",
+        "This is an example of voice cloning using artificial intelligence.",
+    ]
+    return random.choice(samples)

ui/chatterbox/generate_tts_audio.py ADDED Viewed

	@@ -0,0 +1,62 @@

+def generate_tts_audio(text_input: str, audio_prompt_input, progress=None):
+    import os
+    import requests
+    import tempfile
+    import soundfile as sf
+    import numpy as np
+    import gradio as gr
+    GENERATE_AUDIO_ENDPOINT = os.getenv("GENERATE_AUDIO_ENDPOINT", "YOUR-MODAL-ENDPOINT-URL/generate_audio")
+    GENERATE_WITH_FILE_ENDPOINT = os.getenv("GENERATE_WITH_FILE_ENDPOINT", "YOUR-MODAL-ENDPOINT-URL/generate_with_file")
+    if not text_input or len(text_input.strip()) == 0:
+        raise gr.Error("Please enter some text to synthesize.")
+    if len(text_input) > 1000:
+        raise gr.Error("Text is too long. Maximum 1000 characters allowed.")
+    if progress: progress(0.1, desc="Preparing request...")
+    try:
+        if audio_prompt_input is None:
+            if progress: progress(0.3, desc="Sending request to API...")
+            payload = {"text": text_input}
+            response = requests.post(
+                GENERATE_AUDIO_ENDPOINT,
+                json=payload,
+                headers={"Content-Type": "application/json"},
+                timeout=60
+            )
+            if response.status_code != 200:
+                raise gr.Error(f"API Error: {response.status_code} - {response.text}")
+            if progress: progress(0.8, desc="Processing audio response...")
+            with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_file:
+                temp_file.write(response.content)
+                temp_path = temp_file.name
+            audio_data, sample_rate = sf.read(temp_path)
+            os.unlink(temp_path)
+            if progress: progress(1.0, desc="Complete!")
+            return (sample_rate, audio_data)
+        else:
+            if progress: progress(0.3, desc="Preparing voice prompt...")
+            files = {'text': (None, text_input)}
+            with open(audio_prompt_input, 'rb') as f:
+                audio_content = f.read()
+            files['voice_prompt'] = ('voice_prompt.wav', audio_content, 'audio/wav')
+            if progress: progress(0.5, desc="Sending request with voice cloning...")
+            response = requests.post(
+                GENERATE_WITH_FILE_ENDPOINT,
+                files=files,
+                timeout=120
+            )
+            if response.status_code != 200:
+                raise gr.Error(f"API Error: {response.status_code} - {response.text}")
+            if progress: progress(0.8, desc="Processing cloned voice response...")
+            with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_file:
+                temp_file.write(response.content)
+                temp_path = temp_file.name
+            audio_data, sample_rate = sf.read(temp_path)
+            os.unlink(temp_path)
+            if progress: progress(1.0, desc="Voice cloning complete!")
+            return (sample_rate, audio_data)
+    except requests.exceptions.Timeout:
+        raise gr.Error("Request timed out. The API might be under heavy load. Please try again.")
+    except requests.exceptions.ConnectionError:
+        raise gr.Error("Unable to connect to the API. Please check if the endpoint URL is correct.")
+    except Exception as e:
+        raise gr.Error(f"Error generating audio: {str(e)}")

ui/chatterbox/update_char_count.py ADDED Viewed

	@@ -0,0 +1,3 @@

+def update_char_count(text):
+    count = len(text) if text else 0
+    return f"{count}/1000"