Spaces:

yasserrmd
/

NotebookLlama

Sleeping

App Files Community

yasserrmd committed on Oct 30, 2024

Commit

8797420

verified ·

1 Parent(s): fce33e5

Update generate_audio.py

Browse files

Files changed (1) hide show

generate_audio.py +8 -7

generate_audio.py CHANGED Viewed

@@ -1,6 +1,6 @@
 # generate_audio.py
-import spaces
 import pickle
 import torch
 import numpy as np
@@ -18,7 +18,7 @@ class TTSGenerator:
     """
     A class to generate podcast-style audio from a transcript using ParlerTTS and Bark models.
     """
-    @spaces.GPU
     def __init__(self, transcript_file_path,output_audio_path):
         """
         Initialize the TTS generator with the path to the rewritten transcript file.
@@ -48,7 +48,7 @@ class TTSGenerator:
         # self.bark_sampling_rate = 24000
         # self.voice_preset = "v2/en_speaker_6"
-    @spaces.GPU
     def load_transcript(self):
         """
         Loads the rewritten transcript from the specified file.
@@ -59,7 +59,7 @@ class TTSGenerator:
         with open(self.transcript_file_path, 'rb') as f:
             return ast.literal_eval(pickle.load(f))
-    @spaces.GPU(duration=30)
     def generate_speaker1_audio(self, text):
         """
         Generate audio for Speaker 1 using ParlerTTS.
@@ -92,7 +92,7 @@ class TTSGenerator:
         audio_arr = generation.cpu().numpy().squeeze()
         return audio_arr, self.parler_model.config.sampling_rate
-    @spaces.GPU(duration=30)
     def generate_speaker2_audio(self, text):
         """
         Generate audio for Speaker 2 using Bark.
@@ -130,8 +130,9 @@ class TTSGenerator:
         # audio_arr = speech_output[0].cpu().numpy()
         return audio_arr, self.parler_model.config.sampling_rate
     @staticmethod
-    @spaces.GPU
     def numpy_to_audio_segment(audio_arr, sampling_rate):
         """
         Convert numpy array to AudioSegment.
@@ -149,7 +150,7 @@ class TTSGenerator:
         byte_io.seek(0)
         return AudioSegment.from_wav(byte_io)
-    @spaces.GPU(duration=300)
     def generate_audio(self):
         """
         Converts the transcript into audio and saves it to a file.

 # generate_audio.py
+#import spaces
 import pickle
 import torch
 import numpy as np
     """
     A class to generate podcast-style audio from a transcript using ParlerTTS and Bark models.
     """
+    #@spaces.GPU
     def __init__(self, transcript_file_path,output_audio_path):
         """
         Initialize the TTS generator with the path to the rewritten transcript file.
         # self.bark_sampling_rate = 24000
         # self.voice_preset = "v2/en_speaker_6"
+    #@spaces.GPU
     def load_transcript(self):
         """
         Loads the rewritten transcript from the specified file.
         with open(self.transcript_file_path, 'rb') as f:
             return ast.literal_eval(pickle.load(f))
+    #@spaces.GPU(duration=30)
     def generate_speaker1_audio(self, text):
         """
         Generate audio for Speaker 1 using ParlerTTS.
         audio_arr = generation.cpu().numpy().squeeze()
         return audio_arr, self.parler_model.config.sampling_rate
+    #@spaces.GPU(duration=30)
     def generate_speaker2_audio(self, text):
         """
         Generate audio for Speaker 2 using Bark.
         # audio_arr = speech_output[0].cpu().numpy()
         return audio_arr, self.parler_model.config.sampling_rate
+    #@spaces.GPU
     @staticmethod
     def numpy_to_audio_segment(audio_arr, sampling_rate):
         """
         Convert numpy array to AudioSegment.
         byte_io.seek(0)
         return AudioSegment.from_wav(byte_io)
+    #@spaces.GPU(duration=300)
     def generate_audio(self):
         """
         Converts the transcript into audio and saves it to a file.