shanusherly committed on
Commit
db74b09
Β·
verified Β·
1 Parent(s): c29b700

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +164 -271
app.py CHANGED
@@ -1,271 +1,164 @@
1
- import os
2
- import re
3
- import requests
4
- import json
5
- import gradio as gr
6
-
7
- # Google Gemini imports
8
- import google.generativeai as genai
9
- from langchain_google_genai import ChatGoogleGenerativeAI
10
- from langchain_core.prompts import PromptTemplate
11
-
12
-
13
- # legacy chains + memory now live in langchain_classic
14
- from langchain_classic.chains import LLMChain
15
- from langchain_classic.memory import ConversationBufferMemory
16
-
17
-
18
- # ElevenLabs imports
19
- from elevenlabs.client import ElevenLabs
20
- from elevenlabs import save
21
-
22
- # Google Gemini API Key
23
- GEMINI_API_KEY = "YOUR_GEMINI_API_KEY"
24
-
25
- # ElevenLabs API Key
26
- ELEVENLABS_API_KEY = "YOUR_ELEVENLABS_API_KEY"
27
-
28
- # ElevenLabs Voice ID (Rachel voice by default)
29
- ELEVENLABS_VOICE_ID = "21m00Tcm4TlvDq8ikWAM"
30
-
31
- # Configure Gemini
32
- genai.configure(api_key=GEMINI_API_KEY)
33
-
34
- # Initialize ElevenLabs client
35
- elevenlabs_client = ElevenLabs(api_key=ELEVENLABS_API_KEY)
36
-
37
- print("βœ… API keys configured successfully!")
38
-
39
- template = """You are a helpful assistant to answer user queries.
40
- {chat_history}
41
- User: {user_message}
42
- Chatbot:"""
43
-
44
- prompt = PromptTemplate(
45
- input_variables=["chat_history", "user_message"],
46
- template=template
47
- )
48
-
49
- memory = ConversationBufferMemory(memory_key="chat_history")
50
-
51
- print("βœ… Prompt template created!")
52
-
53
- # Initialize Gemini model using direct Google GenerativeAI (NOT LangChain wrapper)
54
- import google.generativeai as genai
55
-
56
- # Configure the Gemini model directly
57
- gemini_model = genai.GenerativeModel('gemini-2.5-flash')
58
-
59
- # Create a custom LLM wrapper for LangChain compatibility
60
- class GeminiLLM:
61
- def __init__(self, model):
62
- self.model = model
63
- self.memory_history = []
64
-
65
- def predict(self, user_message):
66
- # Build conversation context
67
- full_prompt = f"You are a helpful assistant to answer user queries.\n"
68
- for msg in self.memory_history:
69
- full_prompt += f"{msg}\n"
70
- full_prompt += f"User: {user_message}\nChatbot:"
71
-
72
- # Generate response
73
- response = self.model.generate_content(full_prompt)
74
- answer = response.text
75
-
76
- # Update memory
77
- self.memory_history.append(f"User: {user_message}")
78
- self.memory_history.append(f"Chatbot: {answer}")
79
-
80
- # Keep only last 10 exchanges to avoid token limits
81
- if len(self.memory_history) > 20:
82
- self.memory_history = self.memory_history[-20:]
83
-
84
- return answer
85
-
86
- # Initialize the custom LLM
87
- llm_chain = GeminiLLM(gemini_model)
88
-
89
- print("βœ… Gemini LLM initialized with direct SDK!")
90
-
91
- def generate_audio_elevenlabs(text):
92
- """
93
- Generate audio using ElevenLabs API
94
- Returns audio file path or error message
95
- """
96
- try:
97
- # Generate audio
98
- audio = elevenlabs_client.generate(
99
- text=text,
100
- voice=ELEVENLABS_VOICE_ID,
101
- model="eleven_monolingual_v1" # or "eleven_multilingual_v2"
102
- )
103
-
104
- # Save audio to file
105
- output_path = f"/content/output_audio_{hash(text) % 10000}.mp3"
106
- save(audio, output_path)
107
-
108
- return {
109
- "type": "SUCCESS",
110
- "response": output_path,
111
- "message": "Audio generated successfully"
112
- }
113
- except Exception as e:
114
- return {
115
- "type": "ERROR",
116
- "response": str(e),
117
- "message": f"Audio generation failed: {str(e)}"
118
- }
119
-
120
- def generate_audio_elevenlabs_http(text):
121
- """
122
- Alternative method using direct HTTP API calls
123
- More reliable for some use cases
124
- """
125
- url = f"https://api.elevenlabs.io/v1/text-to-speech/{ELEVENLABS_VOICE_ID}"
126
-
127
- headers = {
128
- "Accept": "audio/mpeg",
129
- "Content-Type": "application/json",
130
- "xi-api-key": ELEVENLABS_API_KEY
131
- }
132
-
133
- data = {
134
- "text": text,
135
- "model_id": "eleven_monolingual_v1",
136
- "voice_settings": {
137
- "stability": 0.5,
138
- "similarity_boost": 0.5,
139
- "style": 0.5,
140
- "use_speaker_boost": True
141
- }
142
- }
143
-
144
- try:
145
- response = requests.post(url, json=data, headers=headers)
146
- response.raise_for_status()
147
-
148
- # Save audio file
149
- output_path = f"/content/output_audio_{hash(text) % 10000}.mp3"
150
- with open(output_path, 'wb') as f:
151
- f.write(response.content)
152
-
153
- return {
154
- "type": "SUCCESS",
155
- "response": output_path,
156
- "message": "Audio generated successfully"
157
- }
158
- except requests.exceptions.RequestException as e:
159
- return {
160
- "type": "ERROR",
161
- "response": str(e),
162
- "message": f"Audio generation failed: {str(e)}"
163
- }
164
-
165
- print("βœ… ElevenLabs audio functions defined!")
166
-
167
- def get_audio_reply_for_question(text):
168
- """
169
- Generate audio for the chatbot response
170
- """
171
- generated_audio_event = generate_audio_elevenlabs(text)
172
-
173
- final_response = {
174
- "audio_path": '',
175
- "message": ''
176
- }
177
-
178
- if generated_audio_event["type"] == "SUCCESS":
179
- audio_path = generated_audio_event["response"]
180
- final_response['audio_path'] = audio_path
181
- final_response['message'] = "Audio generated successfully"
182
- else:
183
- final_response['message'] = generated_audio_event['message']
184
-
185
- return final_response
186
-
187
- print("βœ… Audio reply function defined!")
188
-
189
- def get_text_response(user_message):
190
- """
191
- Get text response from Gemini
192
- """
193
- try:
194
- response = llm_chain.predict(user_message=user_message)
195
- return response
196
- except Exception as e:
197
- error_msg = f"Error in Gemini response: {str(e)}"
198
- print(error_msg)
199
- return f"Sorry, I encountered an error: {str(e)}"
200
-
201
- print("βœ… Text response function defined!")
202
-
203
- def get_text_response_and_audio_response(user_message):
204
- """
205
- Get both text response from Gemini and audio from ElevenLabs
206
- """
207
- # Get text response from Gemini
208
- text_response = get_text_response(user_message)
209
-
210
- # Generate audio for the response
211
- audio_reply = get_audio_reply_for_question(text_response)
212
-
213
- final_response = {
214
- 'text': text_response,
215
- 'audio_path': audio_reply.get('audio_path', ''),
216
- 'message': audio_reply.get('message', '')
217
- }
218
-
219
- return final_response
220
-
221
- print("βœ… Combined response function defined!")
222
-
223
- def chat_bot_response(message, history):
224
- """
225
- Main chatbot function for Gradio interface
226
- Returns tuple of (text_response, audio_file_path)
227
- """
228
- try:
229
- # Get text and audio response
230
- response = get_text_response_and_audio_response(message)
231
-
232
- text_response = response['text']
233
- audio_path = response['audio_path']
234
-
235
- if audio_path and os.path.exists(audio_path):
236
- # Return both text and audio
237
- return text_response
238
- else:
239
- # Return only text if audio fails
240
- return text_response
241
-
242
- except Exception as e:
243
- error_msg = f"Error: {str(e)}"
244
- print(error_msg)
245
- return error_msg
246
-
247
- print("βœ… Chatbot response handler defined!")
248
-
249
- demo = gr.ChatInterface(
250
- fn=chat_bot_response,
251
- title="πŸ€– Gemini + ElevenLabs Chatbot",
252
- description="Chat with Google Gemini AI with voice responses from ElevenLabs",
253
- examples=[
254
- "How are you doing?",
255
- "What are your interests?",
256
- "Tell me a short story",
257
- "What's the weather like today?",
258
- "Explain quantum computing in simple terms"
259
- ],
260
- theme=gr.themes.Soft()
261
- )
262
-
263
- print("βœ… Gradio interface created!")
264
-
265
- if __name__ == "__main__":
266
- # Launch with public link
267
- demo.launch(
268
- share=True, # Creates public link
269
- debug=True # Shows errors and logs
270
- )
271
-
 
import os
import re
import requests
import json
import gradio as gr

# Google Gemini imports
import google.generativeai as genai

# LangChain imports
from langchain_core.prompts import PromptTemplate
from langchain_classic.chains import LLMChain
from langchain_classic.memory import ConversationBufferMemory

# -----------------------------
# READ API KEYS FROM ENVIRONMENT
# -----------------------------
# Keys come from the environment so secrets are never committed to source.
GEMINI_API_KEY = os.environ.get("GEMINI_API_KEY")
ELEVENLABS_API_KEY = os.environ.get("ELEVENLABS_API_KEY")

# ElevenLabs Voice ID (Rachel voice by default)
ELEVENLABS_VOICE_ID = "21m00Tcm4TlvDq8ikWAM"

# Warn early instead of failing with an opaque error on the first request.
if not GEMINI_API_KEY:
    print("WARNING: GEMINI_API_KEY is not set; Gemini requests will fail.")
if not ELEVENLABS_API_KEY:
    print("WARNING: ELEVENLABS_API_KEY is not set; audio generation will fail.")

# Configure Gemini
genai.configure(api_key=GEMINI_API_KEY)

print("βœ… API keys loaded safely from environment!")
# -----------------------------
# PROMPT + MEMORY
# -----------------------------
# LangChain prompt/memory objects, kept for compatibility with code that
# expects them at module level (the GeminiLLM wrapper keeps its own history).
template = (
    "You are a helpful assistant to answer user queries.\n"
    "{chat_history}\n"
    "User: {user_message}\n"
    "Chatbot:"
)

prompt = PromptTemplate(
    template=template,
    input_variables=["chat_history", "user_message"],
)

memory = ConversationBufferMemory(memory_key="chat_history")

print("βœ… Prompt template created!")
# -----------------------------
# CUSTOM GEMINI WRAPPER
# -----------------------------
# Model name factored into a constant so it is easy to swap out.
GEMINI_MODEL_NAME = 'gemini-2.5-flash'
gemini_model = genai.GenerativeModel(GEMINI_MODEL_NAME)
class GeminiLLM:
    """Minimal Gemini chat wrapper with its own rolling conversation memory.

    Exposes `predict(user_message=...)` so it can stand in where a
    LangChain LLMChain-style `.predict()` call is expected.
    """

    # Cap on stored "User:"/"Chatbot:" lines (10 exchanges) to bound prompt size.
    MAX_HISTORY = 20

    def __init__(self, model):
        # `model` is expected to provide generate_content(prompt) -> obj with .text
        self.model = model
        # Alternating "User: ..." / "Chatbot: ..." lines, oldest first.
        self.memory_history = []

    def predict(self, user_message):
        """Generate a reply to `user_message` and record the exchange.

        Returns the model's text reply. Any exception from the underlying
        model propagates to the caller (callers wrap this in try/except).
        """
        # Build the prompt in one join instead of repeated string +=.
        lines = ["You are a helpful assistant."]
        lines.extend(self.memory_history)
        lines.append(f"User: {user_message}\nChatbot:")
        full_prompt = "\n".join(lines)

        response = self.model.generate_content(full_prompt)
        answer = response.text

        # Record the exchange, then trim to the most recent MAX_HISTORY lines.
        self.memory_history.append(f"User: {user_message}")
        self.memory_history.append(f"Chatbot: {answer}")
        if len(self.memory_history) > self.MAX_HISTORY:
            self.memory_history = self.memory_history[-self.MAX_HISTORY:]

        return answer

# Shared wrapper instance; module-level so the Gradio handler reuses it
# (and its conversation memory) across requests.
llm_chain = GeminiLLM(gemini_model)

# Fixed: the original print contained garbled replacement characters; use the
# same check-mark prefix as every other status print in this file.
print("βœ… Gemini wrapper initialized!")

# -----------------------------
# ELEVENLABS AUDIO FUNCTION
# -----------------------------
def generate_audio_elevenlabs(text):
    """Synthesize `text` to speech with ElevenLabs and save it as an MP3.

    Returns a dict with:
      - "type": "SUCCESS" or "ERROR"
      - "response": the saved file path on success, the error text on failure
    """
    import tempfile
    from elevenlabs.client import ElevenLabs
    from elevenlabs import save

    try:
        client = ElevenLabs(api_key=ELEVENLABS_API_KEY)

        audio = client.generate(
            text=text,
            voice=ELEVENLABS_VOICE_ID,
            model="eleven_monolingual_v1"
        )

        # Use the platform temp dir instead of a hard-coded /tmp so this also
        # works on Windows; the hash keeps concurrent outputs from colliding.
        output_path = os.path.join(
            tempfile.gettempdir(), f"output_{abs(hash(text)) % 100000}.mp3"
        )
        save(audio, output_path)

        return {
            "type": "SUCCESS",
            "response": output_path
        }

    except Exception as e:
        # Surface the failure as data; callers decide how to report it.
        return {
            "type": "ERROR",
            "response": str(e)
        }

print("βœ… ElevenLabs audio function ready!")

# -----------------------------
# TEXT RESPONSE
# -----------------------------
def get_text_response(user_message):
    """Ask Gemini for a reply; on any failure, return the error as text."""
    try:
        reply = llm_chain.predict(user_message=user_message)
    except Exception as e:
        return f"Error: {str(e)}"
    return reply

# -----------------------------
# COMBINED RESPONSE
# -----------------------------
def get_text_response_and_audio_response(user_message):
    """Produce the Gemini text reply plus the ElevenLabs audio file path.

    "audio_path" is the error text when generation failed (its "type" key
    is not inspected here; the handler below only uses the text).
    """
    reply = get_text_response(user_message)
    audio = generate_audio_elevenlabs(reply)

    result = {
        "text": reply,
        "audio_path": audio.get("response", ""),
    }
    return result

# -----------------------------
# MAIN CHATBOT RESPONSE HANDLER
# -----------------------------
def chat_bot_response(message, history):
    """Gradio entry point: return the text reply for `message`.

    `history` is supplied by gr.ChatInterface and is unused here because
    conversation state lives inside the GeminiLLM wrapper.
    """
    try:
        reply = get_text_response_and_audio_response(message)["text"]
    except Exception as e:
        return f"Error: {str(e)}"
    return reply

print("βœ… Chatbot handler ready!")

# -----------------------------
# UI
# -----------------------------
_EXAMPLE_PROMPTS = [
    "How are you doing?",
    "What are your interests?",
    "Tell me a short story",
    "What's the weather like today?",
    "Explain quantum computing in simple terms",
]

# Chat UI wired to the text handler above.
demo = gr.ChatInterface(
    fn=chat_bot_response,
    title="πŸ€– Gemini + ElevenLabs Chatbot",
    description="Chat with Google Gemini AI with voice responses from ElevenLabs",
    examples=_EXAMPLE_PROMPTS,
    theme=gr.themes.Soft(),
)

print("βœ… Gradio interface created!")
162
+
163
+ if __name__ == "__main__":
164
+ demo.launch(debug=True, share=True)