JohnnyTTS

Sleeping

App Files Files Community

PhilSpiel committed on Nov 15, 2023

Commit

3d43559

1 Parent(s): f986fb8

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -26

app.py CHANGED Viewed

@@ -1,46 +1,45 @@
-import gradio as gr
-import os
-import requests
-import re
-from openai import OpenAI
 # Initialize OpenAI API client with API key
 client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
 # Define the function that generates the speech
 def generate_speech(input_text):
-    # Build completion with OpenAI
     completion = client.chat.completions.create(
-        model="gpt-3.5-turbo-1106",
-        messages=[
-            {"role": "system",
-             "content": "You are Johnny Carson, interviewing a guest (the user) on the Tonight Show in 1978. While chatting with the user, you make occasional jokes using Johnny Carson's characteristic humor. Your knowledge of the world ends in 1978."},
-            {"role": "user", "content": input_text}
         ]
     )
     # Extract generated text (response by the assistant) from OpenAI's API response
     message_content = completion.choices[0].message.content.strip()  # Remove whitespace from the ends
-    # Prepare the text for TTS conversion (you may want to process the text further)
-    #text_to_speech = message_content
     response = client.audio.speech.create(
-        model="tts-1",
-        voice="alloy",
-        input=str(message_content)
-        )
     return response.content
-# Define the Gradio interface
 iface = gr.Interface(
-    fn=generate_speech,
-    inputs=gr.Textbox(),
-    outputs=gr.Audio(autoplay=True),  # Setting autoplay to True
-    live=False
 )
 # Launch the interface
-iface.launch(show_api=False)

+# Import necessary libraries
+import gradio as gr  # Gradio for creating simple UI for functions
+import os  # For accessing environment variables
+from openai import OpenAI  # OpenAI API client
 # Initialize OpenAI API client with API key
 client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
 # Define the function that generates the speech
 def generate_speech(input_text):
+    # Build conversation completion with the OpenAI chat model
     completion = client.chat.completions.create(
+        model="gpt-3.5-turbo-1106",  # Specify the model to use
+        messages=[  # This is the conversation history with user input appended
+            {
+                "role": "system",  # System message with instructions for the AI
+                "content": (os.getenv("PROMPT"))
+            },
+            {"role": "user", "content": input_text}  # The user's input message
         ]
     )
     # Extract generated text (response by the assistant) from OpenAI's API response
     message_content = completion.choices[0].message.content.strip()  # Remove whitespace from the ends
+    # Use OpenAI's text-to-speech API to convert the text response to audio
     response = client.audio.speech.create(
+        model="tts-1",  # Specify the TTS model to use
+        voice="alloy",  # Specify the voice model to use
+        input=str(message_content)  # The text we want to convert to speech
+    )
+    # Return the binary audio data received from OpenAI
     return response.content
+# Define the Gradio interface with our function
 iface = gr.Interface(
+    fn=generate_speech,  # Function to invoke
+    inputs=gr.Textbox(),  # Input element in the UI: a textbox for user text
+    outputs=gr.Audio(autoplay=True),  # Output element in the UI: an audio player
+    live=False  # Whether or not to automatically call the function on input change
 )
 # Launch the interface
+iface.launch(show_api=False)  # Start the Gradio UI; hide the API schema part of the interface