nambn0321 committed on
Commit
08d90fe
·
verified ·
1 Parent(s): 5df6d6b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -12
app.py CHANGED
@@ -21,21 +21,35 @@ vocoder = vocoder.to(device)
21
  speaker_embedding = torch.zeros(1, 512).to(device)
22
 
23
  def tts_generate(text):
24
- # Preprocess input
25
- inputs = processor(text=text, return_tensors="pt").to(device)
 
 
 
 
26
 
27
- # Generate mel spectrogram
28
- with torch.no_grad():
29
- mel = model.generate_speech(inputs["input_ids"], speaker_embedding)
 
 
30
 
31
- # Convert mel spectrogram to waveform
32
- waveform = vocoder(mel)
33
- waveform = waveform.cpu()
 
 
34
 
35
- # Save waveform to file
36
- torchaudio.save("output.wav", waveform, sample_rate=16000)
 
 
37
 
38
- return "output.wav"
 
 
 
 
39
 
40
  # Gradio interface
41
  demo = gr.Interface(
@@ -47,4 +61,5 @@ demo = gr.Interface(
47
  )
48
 
49
  if __name__ == "__main__":
50
- demo.launch()
 
 
21
  speaker_embedding = torch.zeros(1, 512).to(device)
22
 
23
  def tts_generate(text):
24
+ print(f"📝 Input text: {text}")
25
+ try:
26
+ # Preprocess input
27
+ print("🔄 Processing input...")
28
+ inputs = processor(text=text, return_tensors="pt").to(device)
29
+ print("✅ Text processed.")
30
 
31
+ # Generate mel spectrogram
32
+ print("🎀 Generating speech...")
33
+ with torch.no_grad():
34
+ mel = model.generate_speech(inputs["input_ids"], speaker_embedding)
35
+ print("✅ Mel spectrogram generated.")
36
 
37
+ # Convert mel spectrogram to waveform
38
+ print("🎚️ Vocoding waveform...")
39
+ waveform = vocoder(mel)
40
+ waveform = waveform.cpu()
41
+ print("✅ Waveform generated.")
42
 
43
+ # Save waveform
44
+ output_path = "output.wav"
45
+ torchaudio.save(output_path, waveform, sample_rate=16000)
46
+ print(f"💾 Audio saved to {output_path}")
47
 
48
+ return output_path
49
+
50
+ except Exception as e:
51
+ print("❌ Error during TTS generation:", e)
52
+ return "Error during speech synthesis."
53
 
54
  # Gradio interface
55
  demo = gr.Interface(
 
61
  )
62
 
63
  if __name__ == "__main__":
64
+ print("🚀 Launching Gradio demo...")
65
+ demo.launch()