Spaces:

hivecorp
/

manager1

Sleeping

App Files Files Community

hivecorp committed on Feb 13, 2025

Commit

996d0ad

verified ·

1 Parent(s): dd6cda6

Create app.py

Browse files

Files changed (1) hide show

app.py +83 -0

app.py ADDED Viewed

	@@ -0,0 +1,83 @@

+import os
+import requests
+import uvicorn
+from fastapi import FastAPI
+from pydub import AudioSegment
+from uuid import uuid4
+# FastAPI application instance; the @app.post/@app.get decorators further
+# down in this file register their handlers on it.
+app = FastAPI()
+# URL of the Hugging Face TTS endpoint that call_tts_api() POSTs each text
+# chunk to.
+TTS_API_URL = "https://hivecorp-s8test.hf.space/tts"
+MAX_LENGTH = 250  # Max characters per chunk (default max_length of split_text)
+def split_text(text, max_length=MAX_LENGTH):
+    """Splits text into smaller chunks at sentence boundaries."""
+    chunks = []
+    current_chunk = ""
+    sentences = text.split(". ")
+    for sentence in sentences:
+        if len(current_chunk + sentence) > max_length:
+            chunks.append(current_chunk.strip())
+            current_chunk = ""
+        current_chunk += sentence + ". "
+    if current_chunk:
+        chunks.append(current_chunk.strip())
+    return chunks
+def call_tts_api(text, voice):
+    """Calls the TTS API with the text & voice and returns the generated MP3 file."""
+    response = requests.post(TTS_API_URL, json={"text": text, "voice": voice})
+    if response.status_code == 200:
+        filename = f"audio_{uuid4().hex}.mp3"
+        with open(filename, "wb") as f:
+            f.write(response.content)
+        return filename
+    return None
+def merge_audio(files):
+    """Merges multiple MP3 files into one using pydub."""
+    final_audio = AudioSegment.empty()
+    for file in files:
+        audio = AudioSegment.from_file(file, format="mp3")
+        final_audio += audio
+    final_filename = "final_audio.mp3"
+    final_audio.export(final_filename, format="mp3")
+    # Cleanup temp files
+    for file in files:
+        os.remove(file)
+    return final_filename
+@app.post("/generate-audio")
+async def generate_audio(text: str, voice: str):
+    """Processes text, splits it, calls TTS API, and merges MP3s."""
+    text_chunks = split_text(text)
+    audio_files = [call_tts_api(chunk, voice) for chunk in text_chunks]
+    if None in audio_files:
+        return {"error": "TTS API failed for some parts"}
+    merged_file = merge_audio(audio_files)
+    return {"audio_url": f"/download/{merged_file}"}
+@app.get("/download/{filename}")
+async def download_file(filename: str):
+    """Endpoint to download the merged MP3 file."""
+    return {"file": filename}
+# Ensure the app starts when running in Hugging Face Spaces: when this file
+# is executed as a script, serve the app with uvicorn on all network
+# interfaces, port 7860.
+if __name__ == "__main__":
+    uvicorn.run(app, host="0.0.0.0", port=7860)