Spaces:

PhilSpiel
/

Johnny

Sleeping

App Files Files Community

PhilSpiel committed on Nov 15, 2023

Commit

6ef2d0a

1 Parent(s): c5166bc

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -27

app.py CHANGED Viewed

@@ -10,25 +10,34 @@ client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
 # Set the ElevenLabs API key using an environment variable
 elevenlabs_api_key = os.getenv("ELEVENLABS_API_KEY")
-# Define the function that generates the speech
-def generate_speech(input_text):
-    # Build completion with OpenAI
     completion = client.chat.completions.create(
         model="gpt-3.5-turbo-1106",
-        messages=[
-            {"role": "system",
-             "content": "You are Johnny Carson, interviewing a guest (the user) on the Tonight Show in 1978. While chatting with the user, you make occasional jokes using Johnny Carson's characteristic humor. Your knowledge of the world ends in 1978."},
-            {"role": "user", "content": input_text}
-        ]
     )
     # Extract generated text (response by the assistant) from OpenAI's API response
-    message_content = completion.choices[0].message.content.strip()  # Remove whitespace from the ends
-    # Prepare the text for TTS conversion (you may want to process the text further)
-    text_to_speech = message_content
-    # ElevenLabs TTS API settings and request
     url = "https://api.elevenlabs.io/v1/text-to-speech/eIH76iW9yjOWnOKIkd6y/stream"
     headers = {
         "Accept": "audio/mpeg",
@@ -36,18 +45,18 @@ def generate_speech(input_text):
         "xi-api-key": elevenlabs_api_key
     }
     data = {
-  "text": text_to_speech,
-  "model_id": "eleven_multilingual_v2",
-  "voice_settings": {
-    "stability": 1.0,
-    "similarity_boost": 1.0,
-    "excitement": 0.9,
-    "speed": 1.1,
-    "volume": 80,
-    "pitch": 2.0,
-    "breathiness": 0.8,
-    "voice_id": "eIH76iW9yjOWnOKIkd6y"
-  	  }
     }
     response = requests.post(url, json=data, headers=headers)
@@ -59,11 +68,14 @@ def generate_speech(input_text):
         print("Error with ElevenLabs API:", response.status_code, response.text)
         raise Exception(f"Failed to generate speech, status code: {response.status_code}, response: {response.text}")
-# Define the Gradio interface
 iface = gr.Interface(
     fn=generate_speech,
-    inputs=gr.Textbox(),
-    outputs=gr.Audio(autoplay=True),  # Setting autoplay to True
     live=False
 )

 # Set the ElevenLabs API key using an environment variable
 elevenlabs_api_key = os.getenv("ELEVENLABS_API_KEY")
+# Initialize the conversation history, seeded with the system prompt, to maintain context across calls
+history_openai_format = [
+    {"role": "system",
+     "content": "You are Johnny Carson, interviewing a guest (the user) on the Tonight Show in 1978. While chatting with the user, you make occasional jokes using Johnny Carson's characteristic humor. Your knowledge of the world ends in 1978."}
+]
+# Define the function that takes a name and text input to generate the speech
+def generate_speech(name, input_text):
+    # Include the user's name in the dialogue if provided
+    personalized_greeting = f"Welcome to the Tonight Show, {name}. " if name else ""
+    # Append user message to history with personalized greeting
+    history_openai_format.append({"role": "user", "content": personalized_greeting + input_text})
+    # Build completion with OpenAI using the accumulated history
     completion = client.chat.completions.create(
         model="gpt-3.5-turbo-1106",
+        messages=history_openai_format
     )
     # Extract generated text (response by the assistant) from OpenAI's API response
+    message_content = completion.choices[0].message.content.strip()
+    # Append assistant's message to history
+    history_openai_format.append({"role": "assistant", "content": message_content})
+    # Use the assistant's reply, unmodified, as the text sent to the ElevenLabs TTS API
+    text_to_speech = message_content
     url = "https://api.elevenlabs.io/v1/text-to-speech/eIH76iW9yjOWnOKIkd6y/stream"
     headers = {
         "Accept": "audio/mpeg",
         "xi-api-key": elevenlabs_api_key
     }
     data = {
+        "text": text_to_speech,
+        "model_id": "eleven_multilingual_v2",
+        "voice_settings": {
+            "stability": 1.0,
+            "similarity_boost": 1.0,
+            "excitement": 0.9,
+            "speed": 1.1,
+            "volume": 80,
+            "pitch": 2.0,
+            "breathiness": 0.8,
+            "voice_id": "eIH76iW9yjOWnOKIkd6y"
+    	}
     }
     response = requests.post(url, json=data, headers=headers)
         print("Error with ElevenLabs API:", response.status_code, response.text)
         raise Exception(f"Failed to generate speech, status code: {response.status_code}, response: {response.text}")
+# Define the Gradio interface with inputs for name and user text
 iface = gr.Interface(
     fn=generate_speech,
+    inputs=[
+        gr.Textbox(label="Your Name (optional):", placeholder="Enter your name"),
+        gr.Textbox(label="Your question or comment:")
+    ],
+    outputs=gr.Audio(autoplay=True),
     live=False
 )