Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -3,17 +3,17 @@ from transformers import AutoProcessor, BlipForConditionalGeneration, AutoTokeni
|
|
| 3 |
import librosa
|
| 4 |
import numpy as np
|
| 5 |
import torch
|
| 6 |
-
import image_text_model
|
| 7 |
-
import audio_model
|
| 8 |
import open_clip
|
| 9 |
|
| 10 |
#CONSTANTS
|
| 11 |
|
| 12 |
def generate_captions_speech(image):
|
| 13 |
|
| 14 |
-
caption_blip_large = generate_caption(blip_processor_large, blip_model_large, image)
|
| 15 |
print('generate_captions>>>'+caption_blip_large)
|
| 16 |
-
return caption_blip_large,text_to_speech(caption_blip_large,"Surprise Me!")
|
| 17 |
|
| 18 |
|
| 19 |
# Define la interfaz de usuario utilizando Gradio entradas y salidas
|
|
|
|
| 3 |
import librosa
|
| 4 |
import numpy as np
|
| 5 |
import torch
|
| 6 |
+
import image_text_model as itm
|
| 7 |
+
import audio_model as am
|
| 8 |
import open_clip
|
| 9 |
|
| 10 |
#CONSTANTS
|
| 11 |
|
| 12 |
def generate_captions_speech(image):
    """Caption ``image`` with the large BLIP model and voice the caption.

    The caption comes from ``itm.generate_caption`` called with the
    module-level ``blip_processor_large`` and ``blip_model_large``; it is
    echoed to stdout for debugging before being handed to
    ``am.text_to_speech``.

    Args:
        image: The input image, forwarded unchanged to
            ``itm.generate_caption``.

    Returns:
        A ``(caption, speech)`` tuple: the generated caption and whatever
        ``am.text_to_speech`` returns for it.
    """
    caption = itm.generate_caption(blip_processor_large, blip_model_large, image)
    print('generate_captions>>>'+caption)
    # NOTE(review): "Surprise Me!" is presumably a voice/speaker preset
    # understood by audio_model.text_to_speech -- confirm against that module.
    speech = am.text_to_speech(caption, "Surprise Me!")
    return caption, speech
|
| 17 |
|
| 18 |
|
| 19 |
# Define la interfaz de usuario utilizando Gradio entradas y salidas
|