Spaces:

SandraCLV
/

injectModel1intoModel2

Sleeping

SandraCLV committed on Oct 29, 2023

Commit

ab46ebc

1 Parent(s): d6da658

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,13 +6,6 @@ import torch
 # el resultado del primero modelo(texto generado) en la entrada del 2º modelo
 # texto to audio
-def transform(example_batch):
-    # Take a list of PIL images and turn them to pixel values
-    inputs = feature_extractor([x.convert("RGB") for x in example_batch['image']], return_tensors='pt')
-    # Don't forget to include the labels!
-    inputs['labels'] = example_batch['labels']
-    return inputs
 # Cargar el modelo que convierte imagen a texto
 image_to_text_model = pipeline("image-classification")
@@ -23,7 +16,7 @@ text_to_audio_model = pipeline("text-to-speech")
 # Función para la interfaz de Gradio
 def image_to_audio(input_image):
     # Convertir la imagen a texto
-    text_output = transform(image_to_text_model(input_image)[0]['label'])
     # Generar audio a partir del texto
     audio_output = text_to_audio_model(text_output)[0]['audio']
@@ -34,7 +27,7 @@ def image_to_audio(input_image):
 # Interfaz Gradio
 iface = gr.Interface(
     fn=image_to_audio,
-    inputs=gr.Image(),
     outputs="audio",
     live=True,
     interpretation="default",

 # el resultado del primero modelo(texto generado) en la entrada del 2º modelo
 # texto to audio
 # Cargar el modelo que convierte imagen a texto
 image_to_text_model = pipeline("image-classification")
 # Función para la interfaz de Gradio
 def image_to_audio(input_image):
     # Convertir la imagen a texto
+    text_output = image_to_text_model(input_image)[0]['label']
     # Generar audio a partir del texto
     audio_output = text_to_audio_model(text_output)[0]['audio']
 # Interfaz Gradio
 iface = gr.Interface(
     fn=image_to_audio,
+    inputs= gr.Image(type="pil"),
     outputs="audio",
     live=True,
     interpretation="default",