Spaces:

PhilSpiel
/

Johnny

Sleeping

App Files Community

PhilSpiel committed on Nov 15, 2023

Commit

698100a

1 Parent(s): 0b627aa

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -16

app.py CHANGED Viewed

@@ -19,24 +19,25 @@ history_openai_format = [
 def generate_speech(name, input_text):
     global history_openai_format  # Use the global history variable to maintain state
-    # Include the user's name in the dialogue if provided
-    personalized_greeting = f"Welcome to the Tonight Show, {name}. " if name else ""
-    # Append user message to history with personalized greeting
-    current_exchange = [{"role": "user", "content": personalized_greeting + input_text}]
-    # Build completion with OpenAI using the current exchange and the accumulated history
     completion = client.chat.completions.create(
         model="gpt-3.5-turbo-1106",
-        messages=history_openai_format + current_exchange
     )
     # Extract generated text (response by the assistant) from completion
-    message_content = completion.choices[0].message.content.strip()
-    # Update the conversation history with the current exchange
-    # This ensures the full history is preserved for the next call but only the latest messages are sent to TTS
-    history_openai_format.extend(current_exchange + [{"role": "assistant", "content": message_content}])
     # Use ElevenLabs TTS API settings and request for the latest assistant response
     url = "https://api.elevenlabs.io/v1/text-to-speech/eIH76iW9yjOWnOKIkd6y/stream"
@@ -46,7 +47,7 @@ def generate_speech(name, input_text):
         "xi-api-key": elevenlabs_api_key
     }
     data = {
-        "text": message_content,
         "model_id": "eleven_multilingual_v2",
         "voice_settings": {
             "stability": 1.0,
@@ -63,7 +64,7 @@ def generate_speech(name, input_text):
     # Send the request to ElevenLabs API
     response = requests.post(url, json=data, headers=headers)
-    # Return the response content if successful, otherwise, print error details
     if response.status_code == 200:
         # Return only the audio of the latest assistant message
         return response.content
@@ -83,7 +84,4 @@ iface = gr.Interface(
 )
 # Launch the interface
-iface.launch(show_api=False)
-# Clear the conversation history when the interface is closed or interrupted
-history_openai_format.clear()  # This line will reset the history when the script is stopped

 def generate_speech(name, input_text):
     global history_openai_format  # Use the global history variable to maintain state
+    # Append user message to history
+    if name:
+        input_text = f"Welcome to the Tonight Show, {name}. " + input_text
+    # Add user's input to the history
+    history_openai_format.append({"role": "user", "content": input_text})
+    # Build completion with OpenAI using the accumulated history
     completion = client.chat.completions.create(
         model="gpt-3.5-turbo-1106",
+        messages=history_openai_format
     )
     # Extract generated text (response by the assistant) from completion
+    message_parts = completion.choices[0].message.content.split("\n")
+    assistant_message = message_parts[-1].strip()  # Get the last line which is the assistant's response
+    # Append assistant's message to history
+    history_openai_format.append({"role": "assistant", "content": assistant_message})
     # Use ElevenLabs TTS API settings and request for the latest assistant response
     url = "https://api.elevenlabs.io/v1/text-to-speech/eIH76iW9yjOWnOKIkd6y/stream"
         "xi-api-key": elevenlabs_api_key
     }
     data = {
+        "text": assistant_message,
         "model_id": "eleven_multilingual_v2",
         "voice_settings": {
             "stability": 1.0,
     # Send the request to ElevenLabs API
     response = requests.post(url, json=data, headers=headers)
+    # Return the response content if successful, otherwise print error details
     if response.status_code == 200:
         # Return only the audio of the latest assistant message
         return response.content
 )
 # Launch the interface
+iface.launch(show_api=False)