Spaces:

backtracking
/

tiny-tts-demo

Running

App Files Community

backtracking committed on Feb 25

Commit

23f9c22

verified ·

1 Parent(s): 753aa08

Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

tiny_tts/__init__.py +1 -1
tiny_tts/__pycache__/__init__.cpython-310.pyc +0 -0
tiny_tts/__pycache__/infer.cpython-310.pyc +0 -0
tiny_tts/infer.py +13 -2
tiny_tts/utils/config.py +1 -1

tiny_tts/__init__.py CHANGED Viewed

@@ -38,7 +38,7 @@ class TinyTTS:
         self.model = load_engine(checkpoint_path, self.device)
-    def speak(self, text, output_path="output.wav", speaker="LJ"):
         """Synthesize text to speech and save to output_path."""
         print(f"Synthesizing: {text}")

         self.model = load_engine(checkpoint_path, self.device)
+    def speak(self, text, output_path="output.wav", speaker="female"):
         """Synthesize text to speech and save to output_path."""
         print(f"Synthesizing: {text}")

tiny_tts/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (3.03 kB). View file

tiny_tts/__pycache__/infer.cpython-310.pyc ADDED Viewed

Binary file (5.61 kB). View file

tiny_tts/infer.py CHANGED Viewed

@@ -123,13 +123,25 @@ def get_latest_checkpoint(checkpoint_dir):
 def main():
     parser = argparse.ArgumentParser(description="TinyTTS — English Text-to-Speech Inference")
     parser.add_argument("--text", "-t", type=str, default="The weather is nice today, and I feel very relaxed.", help="Text to synthesize")
-    parser.add_argument("--checkpoint", "-c", type=str, required=True, help="Path to checkpoint (G_*.pth) or directory containing checkpoints")
     parser.add_argument("--output", "-o", type=str, default="english_test.wav", help="Output audio file path")
     parser.add_argument("--speaker", "-s", type=str, default="female", help="Speaker ID")
     parser.add_argument("--device", type=str, default="cuda", help="Device to use (cuda or cpu)")
     args = parser.parse_args()
     if not os.path.exists(args.checkpoint):
         print(f"Error: Checkpoint or directory not found at {args.checkpoint}")
         sys.exit(1)
@@ -167,6 +179,5 @@ def main():
         final_output = os.path.join(out_dir, f"{name}_step{step_str}_spk{args.speaker}{ext}")
         synthesize(args.text, final_output, model, speaker=args.speaker, device=args.device)
 if __name__ == "__main__":
     main()

 def main():
     parser = argparse.ArgumentParser(description="TinyTTS — English Text-to-Speech Inference")
     parser.add_argument("--text", "-t", type=str, default="The weather is nice today, and I feel very relaxed.", help="Text to synthesize")
+    parser.add_argument("--checkpoint", "-c", type=str, default=None, help="Path to checkpoint. Auto-downloads if not provided.")
     parser.add_argument("--output", "-o", type=str, default="english_test.wav", help="Output audio file path")
     parser.add_argument("--speaker", "-s", type=str, default="female", help="Speaker ID")
     parser.add_argument("--device", type=str, default="cuda", help="Device to use (cuda or cpu)")
     args = parser.parse_args()
+    if args.checkpoint is None:
+        try:
+            from huggingface_hub import hf_hub_download
+            print("Downloading/Loading checkpoint from Hugging Face Hub (backtracking/tiny-tts)...")
+            args.checkpoint = hf_hub_download(repo_id="backtracking/tiny-tts", filename="G.pth")
+        except ImportError:
+            print("Error: huggingface_hub is required for auto-download. Run: pip install huggingface_hub")
+            sys.exit(1)
+        except Exception as e:
+            print(f"Error downloading checkpoint: {e}")
+            sys.exit(1)
     if not os.path.exists(args.checkpoint):
         print(f"Error: Checkpoint or directory not found at {args.checkpoint}")
         sys.exit(1)
         final_output = os.path.join(out_dir, f"{name}_step{step_str}_spk{args.speaker}{ext}")
         synthesize(args.text, final_output, model, speaker=args.speaker, device=args.device)
 if __name__ == "__main__":
     main()

tiny_tts/utils/config.py CHANGED Viewed

@@ -8,7 +8,7 @@ SPEC_CHANNELS = FILTER_LENGTH // 2 + 1  # 1025
 # Speakers
 N_SPEAKERS = 1
-SPK2ID = {"LJ": 0}
 # Model
 MODEL_PARAMS = dict(

 # Speakers
 N_SPEAKERS = 1
+SPK2ID = {"female": 0}
 # Model
 MODEL_PARAMS = dict(