Spaces:

andgrt
/

doc-qa-demo-gradio

Runtime error

andgrt committed on Nov 3, 2024

Commit

09be984

1 Parent(s): 2891eba

fixes

Files changed (1) hide show

app.py CHANGED Viewed

@@ -88,9 +88,9 @@ def text_to_speech(text):
     return text, (16000, audio.squeeze())
-def transcribe(image, audio):
     if not image or not audio:
-        return
     sr, y = audio
@@ -102,11 +102,18 @@ def transcribe(image, audio):
     transcription_text = transcriber({"sampling_rate": sr, "raw": y})["text"]
-    return generate_answer(image, transcription_text)
 qa_interface = gr.Interface(
-    fn=generate_answer,
     inputs=[
         gr.Image(type="pil"),
         gr.Textbox(label="Вопрос (на русском)", placeholder="Ваш вопрос"),
@@ -120,7 +127,7 @@ qa_interface = gr.Interface(
 )
 speech_interface = gr.Interface(
-    fn=transcribe,
     inputs=[
         gr.Image(type="pil"),
         gr.Audio(sources="microphone", label="Голосовой ввод"),

     return text, (16000, audio.squeeze())
+def transcribe_pipeline(image, audio):
     if not image or not audio:
+        return None, None
     sr, y = audio
     transcription_text = transcriber({"sampling_rate": sr, "raw": y})["text"]
+    return text_to_speech(generate_answer(image, transcription_text))
+def text_pipeline(image, question):
+    if not image or not question:
+        return None, None
+    return text_to_speech(generate_answer(image, question))
 qa_interface = gr.Interface(
+    fn=text_pipeline,
     inputs=[
         gr.Image(type="pil"),
         gr.Textbox(label="Вопрос (на русском)", placeholder="Ваш вопрос"),
 )
 speech_interface = gr.Interface(
+    fn=transcribe_pipeline,
     inputs=[
         gr.Image(type="pil"),
         gr.Audio(sources="microphone", label="Голосовой ввод"),