Update app.py
Browse files
app.py
CHANGED
|
@@ -8,11 +8,13 @@ import torch
|
|
| 8 |
pipe1 = pipeline("automatic-speech-recognition", model="openai/whisper-base")
|
| 9 |
pipe2 = pipeline("summarization", model="facebook/bart-large-cnn")
|
| 10 |
pipe3 = DiffusionPipeline.from_pretrained("stable-diffusion-v1-5/stable-diffusion-v1-5")
|
|
|
|
| 11 |
|
| 12 |
def audio_to_image(audio):
|
| 13 |
-
transcription = pipe1(audio)
|
|
|
|
| 14 |
|
| 15 |
-
summary = pipe2(
|
| 16 |
summary_text = summary[0]['summary_text']
|
| 17 |
|
| 18 |
prompt = summary_text
|
|
|
|
| 8 |
pipe1 = pipeline("automatic-speech-recognition", model="openai/whisper-base")
|
| 9 |
pipe2 = pipeline("summarization", model="facebook/bart-large-cnn")
|
| 10 |
pipe3 = DiffusionPipeline.from_pretrained("stable-diffusion-v1-5/stable-diffusion-v1-5")
|
| 11 |
+
pipe3.to("cuda" if torch.cuda.is_available() else "cpu")
|
| 12 |
|
| 13 |
def audio_to_image(audio):
|
| 14 |
+
transcription = pipe1(audio)
|
| 15 |
+
transcription_text = transcription['text']
|
| 16 |
|
| 17 |
+
summary = pipe2(transcription_text, max_length=50, min_length=10, do_sample=False)
|
| 18 |
summary_text = summary[0]['summary_text']
|
| 19 |
|
| 20 |
prompt = summary_text
|