AI_Avatar_Chat

Paused

bravedims committed on Aug 7, 2025

Commit

dd21570

1 Parent(s): f63a9e3

Fix ElevenLabs API issues and improve error handling

- Remove hardcoded API key and add proper validation
- Improve voice ID handling and logging
- Add detailed error messages and traceback logging
- Add API key validation before making TTS calls
- This should fix the 'Voice ID: (empty)' and 'Error generating speech:' issues

Files changed (1) hide show

app.py +15 -3

app.py CHANGED Viewed

@@ -57,7 +57,9 @@ class GenerateResponse(BaseModel):
 class ElevenLabsClient:
     def __init__(self, api_key: str = None):
-        self.api_key = api_key or os.getenv("ELEVENLABS_API_KEY", "sk_c7a0b115cd48fc026226158c5ac87755b063c802ad892de6")
         self.base_url = "https://api.elevenlabs.io/v1"
     async def text_to_speech(self, text: str, voice_id: str = "21m00Tcm4TlvDq8ikWAM") -> str:
@@ -103,7 +105,10 @@ class ElevenLabsClient:
             logger.error(f"Network error calling ElevenLabs: {e}")
             raise HTTPException(status_code=400, detail=f"Network error calling ElevenLabs: {e}")
         except Exception as e:
-            logger.error(f"Error generating speech: {e}")
             raise HTTPException(status_code=500, detail=f"Error generating speech: {e}")
 class OmniAvatarAPI:
@@ -195,10 +200,16 @@ class OmniAvatarAPI:
             if request.text_to_speech:
                 # Generate speech from text using ElevenLabs
                 logger.info(f"Generating speech from text: {request.text_to_speech[:50]}...")
                 audio_path = await self.elevenlabs_client.text_to_speech(
                     request.text_to_speech,
-                    request.voice_id or "21m00Tcm4TlvDq8ikWAM"
                 )
                 audio_generated = True
@@ -480,3 +491,4 @@ app = gr.mount_gradio_app(app, iface, path="/gradio")
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)

 class ElevenLabsClient:
     def __init__(self, api_key: str = None):
+        self.api_key = api_key or os.getenv("ELEVENLABS_API_KEY")
+        if not self.api_key:
+            logger.warning("No ElevenLabs API key found. Text-to-speech will not work.")
         self.base_url = "https://api.elevenlabs.io/v1"
     async def text_to_speech(self, text: str, voice_id: str = "21m00Tcm4TlvDq8ikWAM") -> str:
             logger.error(f"Network error calling ElevenLabs: {e}")
             raise HTTPException(status_code=400, detail=f"Network error calling ElevenLabs: {e}")
         except Exception as e:
+            logger.error(f"Error generating speech: {str(e)}")
+            logger.error(f"Exception type: {type(e).__name__}")
+            import traceback
+            logger.error(f"Traceback: {traceback.format_exc()}")
             raise HTTPException(status_code=500, detail=f"Error generating speech: {e}")
 class OmniAvatarAPI:
             if request.text_to_speech:
                 # Generate speech from text using ElevenLabs
+                voice_id = request.voice_id or "21m00Tcm4TlvDq8ikWAM"
                 logger.info(f"Generating speech from text: {request.text_to_speech[:50]}...")
+                logger.info(f"Using voice ID: {voice_id}")
+                if not self.elevenlabs_client.api_key:
+                    raise HTTPException(status_code=503, detail="ElevenLabs API key not configured")
                 audio_path = await self.elevenlabs_client.text_to_speech(
                     request.text_to_speech,
+                    voice_id
                 )
                 audio_generated = True
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)