Persian-TTS

Build error

App Files Community

Kamtera committed on Jan 19, 2023

Commit

34fce4e

1 Parent(s): 3d3ba6d

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -15

app.py CHANGED Viewed

@@ -6,25 +6,47 @@ import gradio as gr
 from TTS.utils.manage import ModelManager
 from TTS.utils.synthesizer import Synthesizer
 MAX_TXT_LEN = 800
 model_path = os.getcwd() + "/best_model.pth"
 config_path = os.getcwd() + "/config.json"
-synthesizer = Synthesizer(
-        model_path, config_path
-)
-def tts(text: str):
     if len(text) > MAX_TXT_LEN:
         text = text[:MAX_TXT_LEN]
         print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
     print(text)
     # synthesize
     if synthesizer is None:
         raise NameError("model not found")
     wavs = synthesizer.tts(text)
@@ -37,20 +59,28 @@ def tts(text: str):
 description="""
 This is a demo of persian text to speech model.
-Model can be found here: https://huggingface.co/Kamtera/persian-tts-female-glow_tts
-Model trained on this dataset : https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-famale
 """
 article= ""
 examples=[
-    ["شیش سیخ جیگر سیخی شیش هزار"],
-    ["سه شیشه شیر ، سه سیر سرشیر"],
-    ["دزدی دزدید ز بز دزدی بزی ، عجب دزدی که دزدید ز بز دزدی بزی"],
-    ["مثنوی یکی از قالب های شعری است ک هر بیت قافیه ی جداگانه دارد"],
-    ["در گلو ماند خس او سالها، چیست آن خس مهر جاه و مالها"],
 ]
 iface = gr.Interface(
     fn=tts,
@@ -58,11 +88,16 @@ iface = gr.Interface(
         gr.Textbox(
             label="Text",
             value="زندگی فقط یک بار است؛ از آن به خوبی استفاده کن",
-        )
     ],
     outputs=gr.Audio(label="Output",type='filepath'),
     examples=examples,
-    title="🗣️Persian ttt - glow_tts 🗣️",
     description=description,
     article=article,
     live=False

 from TTS.utils.manage import ModelManager
 from TTS.utils.synthesizer import Synthesizer
+MODEL_NAMES=[
+    "vits-male",
+    "vits-female",
+    "glowtts-male",
+    "glowtts-female"
+]
 MAX_TXT_LEN = 800
 model_path = os.getcwd() + "/best_model.pth"
 config_path = os.getcwd() + "/config.json"
+from TTS.utils.download import download_url
+modelInfo=[
+    ["vits-male","best_model_65633.pth","config-0.json","https://huggingface.co/Kamtera/persian-tts-male-vits/resolve/main/"],
+    ["vits-female","checkpoint_48000.pth","config-2.json","https://huggingface.co/Kamtera/persian-tts-female-vits/resolve/main/"],
+    ["glowtts-male","best_model_77797.pth","config-1.json","https://huggingface.co/Kamtera/persian-tts-male-glow_tts/resolve/main/"],
+    ["glowtts-female","best_model.pth","config.json","https://huggingface.co/Kamtera/persian-tts-female-glow_tts/resolve/main/"]
+]
+for d in modelInfo:
+    directory=d[0]
+    if not os.path.exists(directory):
+        os.makedirs(directory)
+    download_url(
+        d[3]+d[1],directory,"best_model.pth"
+    )
+    download_url(
+        d[3]+d[2],directory,"config.json"
+    )
+def tts(text: str,model_name: str):
     if len(text) > MAX_TXT_LEN:
         text = text[:MAX_TXT_LEN]
         print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
     print(text)
     # synthesize
+    synthesizer = Synthesizer(
+        model_name+"/best_model.pth", model_name+"/config.json"
+    )
     if synthesizer is None:
         raise NameError("model not found")
     wavs = synthesizer.tts(text)
 description="""
 This is a demo of persian text to speech model.
+Models can be found here:
+https://huggingface.co/Kamtera/persian-tts-female-vits
+https://huggingface.co/Kamtera/persian-tts-male-vits
+https://huggingface.co/Kamtera/persian-tts-male-glow_tts
+https://huggingface.co/Kamtera/persian-tts-female-glow_tts
+Models trained on these datasets :
+https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset
+https://www.kaggle.com/datasets/magnoliasis/persian-tts-dataset-famale
 """
 article= ""
 examples=[
+    ["و خداوند شما را با ارسال روح در جسم زندگانی و حیات بخشید","vits-male"],
+    ["تاجر تو چه تجارت می کنی ، تو را چه که چه تجارت می کنم؟","vits-female"],
+    ["شیش سیخ جیگر سیخی شیش هزار","vits-female"],
+    ["سه شیشه شیر ، سه سیر سرشیر","vits-female"],
+    ["دزدی دزدید ز بز دزدی بزی ، عجب دزدی که دزدید ز بز دزدی بزی","vits-female"],
+    ["مثنوی یکی از قالب های شعری است ک هر بیت قافیه ی جداگانه دارد","vits-female"],
+    ["در گلو ماند خس او سالها، چیست آن خس مهر جاه و مالها","vits-female"],
 ]
 iface = gr.Interface(
     fn=tts,
         gr.Textbox(
             label="Text",
             value="زندگی فقط یک بار است؛ از آن به خوبی استفاده کن",
+        ),
+        gr.Radio(
+            label="Pick a TTS Model ",
+            choices=MODEL_NAMES,
+            value="vits-female",
+        ),
     ],
     outputs=gr.Audio(label="Output",type='filepath'),
     examples=examples,
+    title="🗣️ Persian tts 🗣️",
     description=description,
     article=article,
     live=False