gopalagra committed on
Commit
61d0d7a
·
verified ·
1 Parent(s): 402146f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -347,6 +347,9 @@ def vqa_answer(image, question):
347
  return answer, None
348
 
349
 
 
 
 
350
  # ----------------------
351
  # Gradio UI
352
  # ----------------------
@@ -359,7 +362,7 @@ with gr.Blocks(title="BLIP Vision App") as demo:
359
  lang_in = gr.Dropdown(["Hindi", "French", "Spanish"], label="Translate To", value="Hindi")
360
  eng_out = gr.Textbox(label="English Caption")
361
  trans_out = gr.Textbox(label="Translated Caption")
362
- audio_out = gr.Audio(label="Audio Output", type="filepath")
363
  btn1 = gr.Button("Generate Caption, Translate & Speak")
364
  btn1.click(generate_caption_translate_speak, inputs=[img_in, lang_in], outputs=[eng_out, trans_out, audio_out])
365
 
@@ -368,7 +371,7 @@ with gr.Blocks(title="BLIP Vision App") as demo:
368
  img_vqa = gr.Image(type="pil", label="Upload Image")
369
  q_in = gr.Textbox(label="Ask a Question about the Image")
370
  ans_out = gr.Textbox(label="Answer")
371
- beep_out = gr.Audio(label="Alert Sound", type="filepath")
372
  btn2 = gr.Button("Ask")
373
  btn2.click(vqa_answer, inputs=[img_vqa, q_in], outputs=[ans_out, beep_out])
374
 
 
347
  return answer, None
348
 
349
 
350
+ # ----------------------
351
+ # Gradio UI
352
+ # ----------------------
353
  # ----------------------
354
  # Gradio UI
355
  # ----------------------
 
362
  lang_in = gr.Dropdown(["Hindi", "French", "Spanish"], label="Translate To", value="Hindi")
363
  eng_out = gr.Textbox(label="English Caption")
364
  trans_out = gr.Textbox(label="Translated Caption")
365
+ audio_out = gr.Audio(label="Audio Output", type="filepath", autoplay=True) # 👈 added autoplay
366
  btn1 = gr.Button("Generate Caption, Translate & Speak")
367
  btn1.click(generate_caption_translate_speak, inputs=[img_in, lang_in], outputs=[eng_out, trans_out, audio_out])
368
 
 
371
  img_vqa = gr.Image(type="pil", label="Upload Image")
372
  q_in = gr.Textbox(label="Ask a Question about the Image")
373
  ans_out = gr.Textbox(label="Answer")
374
+ beep_out = gr.Audio(label="Alert Sound", type="filepath", autoplay=True) # 👈 added autoplay
375
  btn2 = gr.Button("Ask")
376
  btn2.click(vqa_answer, inputs=[img_vqa, q_in], outputs=[ans_out, beep_out])
377