Spaces:

Sayiqa
/

voice_app

Sleeping

App Files Community

Sayiqa committed on Dec 18, 2024

Commit

9db2c3c

verified ·

1 Parent(s): 16ab1f7

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -17

app.py CHANGED Viewed

@@ -240,8 +240,8 @@ text_to_image.enable_attention_slicing()
 text_to_image.safety_checker = None
 text_to_image.scheduler = DPMSolverMultistepScheduler.from_config(text_to_image.scheduler.config)
-# Load conversational model using text-generation task
-chat_pipeline = pipeline("text-generation", model="microsoft/DialoGPT-medium")
 # Preprocess audio file into NumPy array
 def preprocess_audio(audio_path):
@@ -274,14 +274,14 @@ def generate_image_from_text(text):
     except Exception as e:
         return f"Error in image generation: {str(e)}"
-# ChatGPT-like conversational response
-def chat_with_gpt(prompt):
     try:
-        # Generate conversational response
-        response = chat_pipeline(prompt, max_length=100, num_return_sequences=1)
-        return response[0]["generated_text"]
     except Exception as e:
-        return f"Error in chat response: {str(e)}"
 # Combined processing function
 def process_audio_and_generate_results(audio_path):
@@ -335,22 +335,23 @@ voice_to_image_and_chat_iface = gr.Interface(
     description="Upload an audio file to transcribe speech to text and generate an image based on the transcription.",
 )
-# Gradio interface for ChatGPT-like functionality
-chat_iface = gr.Interface(
-    fn=chat_with_gpt,
-    inputs=gr.Textbox(label="Enter your prompt for ChatGPT"),
-    outputs=gr.Textbox(label="ChatGPT Response"),
-    title="ChatGPT",
-    description="Chat with GPT-like conversational AI.",
 )
 # Combined Gradio app
 iface = gr.TabbedInterface(
-    interface_list=[speech_to_text_iface, voice_to_image_and_chat_iface, chat_iface],
-    tab_names=["Speech-to-Text", "Voice-to-Image", "ChatGPT"]
 )
 # Launch Gradio interface
 iface.launch(debug=True, share=True)

 text_to_image.safety_checker = None
 text_to_image.scheduler = DPMSolverMultistepScheduler.from_config(text_to_image.scheduler.config)
+# Load question-answering model
+qa_pipeline = pipeline("question-answering", model="distilbert-base-uncased-distilled-squad")
 # Preprocess audio file into NumPy array
 def preprocess_audio(audio_path):
     except Exception as e:
         return f"Error in image generation: {str(e)}"
+# Question answering function
+def answer_question(question):
     try:
+        context = """Imran Khan is a Pakistani politician, former cricketer, and philanthropist. He is the 22nd Prime Minister of Pakistan, serving from 2018 to 2022. Khan is the founder of the political party Pakistan Tehreek-e-Insaf (PTI). He was one of the most successful cricketers of his time and led Pakistan to victory in the 1992 Cricket World Cup."""
+        answer = qa_pipeline(question=question, context=context)
+        return answer['answer']
     except Exception as e:
+        return f"Error in answering question: {str(e)}"
 # Combined processing function
 def process_audio_and_generate_results(audio_path):
     description="Upload an audio file to transcribe speech to text and generate an image based on the transcription.",
 )
+# Gradio interface for Question Answering
+qa_iface = gr.Interface(
+    fn=answer_question,
+    inputs=gr.Textbox(label="Ask a question"),
+    outputs=gr.Textbox(label="Answer"),
+    title="Question Answering",
+    description="Ask a factual question, and get an answer.",
 )
 # Combined Gradio app
 iface = gr.TabbedInterface(
+    interface_list=[speech_to_text_iface, voice_to_image_and_chat_iface, qa_iface],
+    tab_names=["Speech-to-Text", "Voice-to-Image", "Question Answering"]
 )
 # Launch Gradio interface
 iface.launch(debug=True, share=True)