RP-Azul commited on
Commit
092f19b
·
verified ·
1 Parent(s): db6a6ed

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -4
app.py CHANGED
@@ -7,21 +7,23 @@ from transformers import pipeline
7
  import gradio as gr
8
 
9
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
 
 
10
  # code from the Model card
11
  processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
12
  model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
13
  vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 
 
14
 
15
-
16
- speech = pipeline("text-to-speech", model="microsoft/speecht5_tts")
17
  def summarize_text_and_speak(prompt):
18
  summary = summarizer(prompt, max_length=150, min_length=30, do_sample=False)
19
  summary_text = summary[0]['summary_text']
20
  #inputs = processor(text="Hello, my dog is cute.", return_tensors="pt")
21
  inputs = processor(text=summary_text, return_tensors="pt")
22
  #speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
23
- speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
24
- return summary_text, audio["audio"]
25
 
26
  interface = gr.Interface(
27
  fn=summarize_text_and_speak,
 
7
  import gradio as gr
8
 
9
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
10
+ speech = pipeline("text-to-speech", model="microsoft/speecht5_tts")
11
+
12
  # code from the Model card
13
  processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
14
  model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
15
  vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
16
+ speaker_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
17
+ speaker_embeddings = torch.tensor(speaker_dataset[0]["xvector"]).unsqueeze(0)
18
 
 
 
19
  def summarize_text_and_speak(prompt):
20
  summary = summarizer(prompt, max_length=150, min_length=30, do_sample=False)
21
  summary_text = summary[0]['summary_text']
22
  #inputs = processor(text="Hello, my dog is cute.", return_tensors="pt")
23
  inputs = processor(text=summary_text, return_tensors="pt")
24
  #speech = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
25
+ speech_audio = model.generate_speech(inputs["input_ids"], speaker_embeddings, vocoder=vocoder)
26
+ return summary_text, speech_audio
27
 
28
  interface = gr.Interface(
29
  fn=summarize_text_and_speak,