Text_to_speech_tts

Sleeping

App Files Community

Jekyll2000 committed on Mar 18, 2024

Commit

9e74171

verified ·

1 Parent(s): 60e27ae

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -38

app.py CHANGED Viewed

@@ -1,3 +1,24 @@
 import logging
 import os
 import time
@@ -8,13 +29,14 @@ import soundfile as sf
 from model import get_pretrained_model, language_to_models
-title = "Text-to-speech (TTS)-by-Haseeb Ahmed"
 description = """
 This space shows how to convert text to speech with Next-gen Kaldi.
 It is running on CPU within a docker container provided by Hugging Face.
 """
 # css style is copied from
@@ -26,10 +48,10 @@ css = """
 .result_item_error {background-color:#ff7070;color:white;align-self:start}
 """
-#examples = [
-#    ["Min-nan (闽南话)", "csukuangfj/vits-mms-nan", "ài piaǸ chiah ē iaN̂", 0, 1.0],
-#   ["Thai", "csukuangfj/vits-mms-tha", "ฉันรักคุณ", 0, 1.0],
-#]
 def update_model_dropdown(language: str):
@@ -128,22 +150,22 @@ with demo:
                 placeholder="Please input your text here",
             )
-           # input_sid = gr.Textbox(
-            #    label="Speaker ID",
-             #   info="Speaker ID",
-              #  lines=1,
-               # max_lines=1,
-               # value="0",
-               # placeholder="Speaker ID. Valid only for mult-speaker model",
-            #)
-           # input_speed = gr.Slider(
-            #    minimum=0.1,
-             #   maximum=10,
-              #  value=1,
-               # step=0.1,
-                #label="Speed (larger->faster; smaller->slower)",
-            #)
             input_button = gr.Button("Submit")
@@ -151,21 +173,21 @@ with demo:
             output_info = gr.HTML(label="Info")
-            #gr.Examples(
-               # examples=examples,
-               # fn=process,
-               # inputs=[
-                #    language_radio,
-                #    model_dropdown,
-                #    input_text,
-                #    input_sid,
-             #       input_speed,
-              #  ],
-              #  outputs=[
-               #     output_audio,
-               #     output_info,
-              #  ],
-          #  )
         input_button.click(
             process,
@@ -173,8 +195,8 @@ with demo:
                 language_radio,
                 model_dropdown,
                 input_text,
-                #input_sid,
-                #input_speed,
             ],
             outputs=[
                 output_audio,

+#!/usr/bin/env python3
+#
+# Copyright      2022-2023  Xiaomi Corp.        (authors: Fangjun Kuang)
+#
+# See LICENSE for clarification regarding multiple authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# References:
+# https://gradio.app/docs/#dropdown
 import logging
 import os
 import time
 from model import get_pretrained_model, language_to_models
+title = "# Text-to-speech (TTS): Haseeb Ahmed"
 description = """
 This space shows how to convert text to speech with Next-gen Kaldi.
 It is running on CPU within a docker container provided by Hugging Face.
 """
 # css style is copied from
 .result_item_error {background-color:#ff7070;color:white;align-self:start}
 """
+examples = [
+    ["Min-nan (闽南话)", "csukuangfj/vits-mms-nan", "ài piaǸ chiah ē iaN̂", 0, 1.0],
+    ["Thai", "csukuangfj/vits-mms-tha", "ฉันรักคุณ", 0, 1.0],
+]
 def update_model_dropdown(language: str):
                 placeholder="Please input your text here",
             )
+            input_sid = gr.Textbox(
+                label="Speaker ID",
+                info="Speaker ID",
+                lines=1,
+                max_lines=1,
+                value="0",
+                placeholder="Speaker ID. Valid only for mult-speaker model",
+            )
+            input_speed = gr.Slider(
+                minimum=0.1,
+                maximum=10,
+                value=1,
+                step=0.1,
+                label="Speed (larger->faster; smaller->slower)",
+            )
             input_button = gr.Button("Submit")
             output_info = gr.HTML(label="Info")
+            gr.Examples(
+                examples=examples,
+                fn=process,
+                inputs=[
+                    language_radio,
+                    model_dropdown,
+                    input_text,
+                    input_sid,
+                    input_speed,
+                ],
+                outputs=[
+                    output_audio,
+                    output_info,
+                ],
+            )
         input_button.click(
             process,
                 language_radio,
                 model_dropdown,
                 input_text,
+                input_sid,
+                input_speed,
             ],
             outputs=[
                 output_audio,