Spaces:

Rajhuggingface4253
/

neu

Paused

Rajhuggingface4253 committed on Oct 18

Commit

7d77f94

verified ·

1 Parent(s): 74ce059

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -145,12 +145,11 @@ class NeuTTSWrapper:
         """Blocking synthesis for standard endpoint."""
-        # 2. Encode reference
-        ref_s = self.tts_model.encode_reference(reference_audio)
         # 3. Infer full text
         with torch.no_grad():
-            audio = self.tts_model.infer(text, ref_s, speed=1.0)
         return audio.cpu().numpy()
     def stream_speech_blocking(self, text: str, ref_audio_path: str, speed: float, audio_format: str) -> Generator[bytes, None, None]:
@@ -173,7 +172,7 @@ class NeuTTSWrapper:
             # Infer sentence
             with torch.no_grad():
-                audio_chunk = self.tts_model.infer(sentence, ref_s, speed=speed)
             # Convert and yield
             yield self._convert_to_streamable_format(audio_chunk.cpu().numpy(), audio_format)

         """Blocking synthesis for standard endpoint."""
+        ref_s = self.tts_model.encode_reference(ref_audio_path)
         # 3. Infer full text
         with torch.no_grad():
+            audio = self.tts_model.infer(text, ref_s)
         return audio.cpu().numpy()
     def stream_speech_blocking(self, text: str, ref_audio_path: str, speed: float, audio_format: str) -> Generator[bytes, None, None]:
             # Infer sentence
             with torch.no_grad():
+                audio_chunk = self.tts_model.infer(sentence, ref_s)
             # Convert and yield
             yield self._convert_to_streamable_format(audio_chunk.cpu().numpy(), audio_format)