Spaces:

ttsEmo
/

TTS_API

Sleeping

App Files Files Community

MariaKaiser committed on Mar 21

Commit

6e485a0

verified ·

1 Parent(s): c1730b4

Update app.py

Browse files

Files changed (1) hide show

app.py +101 -26

app.py CHANGED Viewed

@@ -278,6 +278,8 @@ async def concat_story_audio(story: StoryCreationDTO, base_output: str, final_pa
 app = FastAPI(title="EGTTS Arabic TTS API")
 #___________________Test end point to test supabase fetch
 from fastapi import Query
@@ -345,7 +347,7 @@ emotion_map = {
     "NARRATION": "narration"
 }
-def generate_tagged_text(text: str, emotion_enum: str, intensity_enum: int) -> str:
     """
     Convert enums to <emo_x> <int_y> format and concatenate with text
     """
@@ -355,37 +357,110 @@ def generate_tagged_text(text: str, emotion_enum: str, intensity_enum: int) -> s
 #-----------------------------------------------------------
-@app.post("/tts/")
-async def process_story(story: StoryCreationDTO):
-  # Optional: print info for debugging
-    print(story.storyId)
-    for cast in story.cast:
-        print(cast.name, cast.voiceReference)
-    for chapter in story.chapters:
-        for scene in chapter.scenes:
-            for sentence in scene.sentences:
-                print(sentence.speaker, sentence.sentence)
-    # 1️⃣ Generate all sentence audios and folder structure
-    await generate_story_audios(story, base_output=OUTPUT_DIR)
-     # 2️⃣ Concatenate all into final story audio
-    final_story_path = os.path.join(OUTPUT_DIR, story.storyId, f"{story.storyId}_full.wav")
-    final_generated_story_path = await concat_story_audio(story, base_output=OUTPUT_DIR, final_path=final_story_path)
-    # Convert to base64 and get duration
-    audio_b64, duration = audio_to_base64(final_generated_story_path)
-    response = TTSResponse(
-        file_name= os.path.basename(final_generated_story_path),
-        duration=duration,
-        audio_base64=audio_b64
-    )
-    return response
-#----------------------------Test------------------------------------
 @app.post("/tts_test/")
 async def tts_endpoint(

 app = FastAPI(title="EGTTS Arabic TTS API")
+tasks = {}
 #___________________Test end point to test supabase fetch
 from fastapi import Query
     "NARRATION": "narration"
 }
+def generate_tagged_text(text: str, emotion_enum: str, intensity_enum: str) -> str:
     """
     Convert enums to <emo_x> <int_y> format and concatenate with text
     """
 #-----------------------------------------------------------
+#-----------------Post End Point_____________________________
+# @app.post("/tts/")
+# async def process_story(story: StoryCreationDTO):
+#   # Optional: print info for debugging
+#     print(story.storyId)
+#     for cast in story.cast:
+#         print(cast.name, cast.voiceReference)
+#     for chapter in story.chapters:
+#         for scene in chapter.scenes:
+#             for sentence in scene.sentences:
+#                 print(sentence.speaker, sentence.sentence)
+#     # 1️⃣ Generate all sentence audios and folder structure
+#     await generate_story_audios(story, base_output=OUTPUT_DIR)
+#      # 2️⃣ Concatenate all into final story audio
+#     final_story_path = os.path.join(OUTPUT_DIR, story.storyId, f"{story.storyId}_full.wav")
+#     final_generated_story_path = await concat_story_audio(story, base_output=OUTPUT_DIR, final_path=final_story_path)
+#     # Convert to base64 and get duration
+#     audio_b64, duration = audio_to_base64(final_generated_story_path)
+#     response = TTSResponse(
+#         file_name= os.path.basename(final_generated_story_path),
+#         duration=duration,
+#         audio_base64=audio_b64
+#     )
+#     return response
+async def run_tts_pipeline(task_id: str, story: StoryCreationDTO):
+    """
+    Run the whole TTS pipeline for one story and record the outcome in ``tasks``.
+
+    Steps: call ``generate_story_audios`` for the story, concatenate the
+    result into ``<OUTPUT_DIR>/<storyId>/<storyId>_full.wav`` via
+    ``concat_story_audio``, then base64-encode the file at the path that
+    call returns.
+
+    On success ``tasks[task_id]`` becomes
+    ``{"status": "completed", "result": {file_name, duration, audio_base64}}``.
+    On any exception it becomes ``{"status": "failed", "error": <message>}``.
+    This coroutine never raises: it is scheduled through
+    ``background_tasks.add_task``, so the ``tasks`` entry is the only
+    channel through which the outcome is reported.
+    """
+    import logging  # local import: the file's top-level import block is not visible here
+
+    try:
+        await generate_story_audios(story, base_output=OUTPUT_DIR)
+        final_story_path = os.path.join(
+            OUTPUT_DIR,
+            story.storyId,
+            f"{story.storyId}_full.wav"
+        )
+        final_generated_story_path = await concat_story_audio(
+            story,
+            base_output=OUTPUT_DIR,
+            final_path=final_story_path
+        )
+        audio_b64, duration = audio_to_base64(final_generated_story_path)
+        tasks[task_id] = {
+            "status": "completed",
+            "result": {
+                "file_name": os.path.basename(final_generated_story_path),
+                "duration": duration,
+                "audio_base64": audio_b64
+            }
+        }
+    except Exception as e:
+        # Deliberately broad: this is the task boundary. Keep the traceback in
+        # the server log, because the stored message alone is not enough to debug.
+        logging.getLogger(__name__).exception(
+            "TTS pipeline failed for task %s", task_id
+        )
+        tasks[task_id] = {
+            "status": "failed",
+            # Some exceptions stringify to "", so fall back to the class name
+            # to keep the reported error from being empty.
+            "error": str(e) or type(e).__name__
+        }
+from fastapi import BackgroundTasks
+import uuid
+@app.post("/tts/")
+async def process_story(story: StoryCreationDTO, background_tasks: BackgroundTasks):
+    """
+    Queue TTS generation for a story and return a task id immediately.
+
+    A fresh UUID4 string is registered in ``tasks`` with status
+    "processing", ``run_tts_pipeline`` is handed to ``background_tasks``
+    with that id and the story, and the id is returned as
+    ``{"task_id": <id>}``.
+    """
+    new_task_id = str(uuid.uuid4())
+    # Register the entry before scheduling the pipeline, so the id is
+    # already present in ``tasks`` when it is returned to the caller.
+    tasks[new_task_id] = {"status": "processing", "result": None}
+    background_tasks.add_task(run_tts_pipeline, new_task_id, story)
+    return {"task_id": new_task_id}
+#-----------------------Results Get End Point ______________________________________
+@app.get("/results/{task_id}")
+async def get_results(task_id: str):
+    """
+    Report the current state of the task stored under ``task_id`` in ``tasks``.
+
+    Returns one of:
+      * ``{"status": "not_found"}``  - no entry for this id
+      * ``{"status": "processing"}`` - entry exists, status is "processing"
+      * ``{"status": "failed", "error": ...}`` - entry status is "failed"
+      * the stored ``"result"`` value - any other status
+    """
+    try:
+        entry = tasks[task_id]
+    except KeyError:
+        return {"status": "not_found"}
+
+    state = entry["status"]
+    if state == "failed":
+        return {"status": "failed", "error": entry["error"]}
+    if state == "processing":
+        return {"status": "processing"}
+    # Any remaining status: hand back the stored result as-is.
+    return entry["result"]
+#----------------------------Test End Point to test tts inference------------------------------------
 @app.post("/tts_test/")
 async def tts_endpoint(