Spaces:

nambn0321
/

TTS_run

Runtime error

nambn0321 committed on Aug 3, 2025

Commit

9a99cf5

verified ·

1 Parent(s): 9b0cc34

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,33 +5,33 @@ import torchaudio
 from transformers import SpeechT5Processor, SpeechT5ForTextToSpeech
 from transformers.models.speecht5 import SpeechT5HifiGan
-# processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
-# model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
-# vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
-# device = "cuda" if torch.cuda.is_available() else "cpu"
-# model = model.to(device)
-# vocoder = vocoder.to(device)
-# speaker_embedding = torch.zeros(1, 512).to(device)
-# Load model and processor
-processor = SpeechT5Processor.from_pretrained("nambn0321/TTS_with_T5")
-model = SpeechT5ForTextToSpeech.from_pretrained(
-    "nambn0321/TTS_with_T5",
-    use_safetensors=True,
-    trust_remote_code=True
-)
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
-# Move to CUDA if available
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model = model.to(device)
 vocoder = vocoder.to(device)
-# Dummy speaker embedding (or load your real one here)
 speaker_embedding = torch.zeros(1, 512).to(device)
 def tts_generate(text):
     print(f"📝 Input text: {text}")
     try:

 from transformers import SpeechT5Processor, SpeechT5ForTextToSpeech
 from transformers.models.speecht5 import SpeechT5HifiGan
+processor = SpeechT5Processor.from_pretrained("microsoft/speecht5_tts")
+model = SpeechT5ForTextToSpeech.from_pretrained("microsoft/speecht5_tts")
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model = model.to(device)
 vocoder = vocoder.to(device)
 speaker_embedding = torch.zeros(1, 512).to(device)
+# Load model and processor
+# processor = SpeechT5Processor.from_pretrained("nambn0321/TTS_with_T5")
+# model = SpeechT5ForTextToSpeech.from_pretrained(
+#     "nambn0321/TTS_with_T5",
+#     use_safetensors=True,
+#     trust_remote_code=True
+# )
+# vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
+# # Move to CUDA if available
+# device = "cuda" if torch.cuda.is_available() else "cpu"
+# model = model.to(device)
+# vocoder = vocoder.to(device)
+# # Dummy speaker embedding (or load your real one here)
+# speaker_embedding = torch.zeros(1, 512).to(device)
 def tts_generate(text):
     print(f"📝 Input text: {text}")
     try: