clone

Build error

App Files Files Community

nikkmitra committed on Oct 8, 2024

Commit

57c110b

verified ·

1 Parent(s): 336f9db

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -16

app.py CHANGED Viewed

@@ -56,33 +56,67 @@ def check_voice_files():
     else:
         return "**All voice files are present.** 🎉"
 @spaces.GPU(duration=120)
 def tts_generate(text, voice, language):
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
         temp_audio_path = temp_audio.name
-    voice_file = hf_hub_download(repo_id="nikkmitra/clone", filename=celebrity_voices[voice], repo_type="space", token=hf_token)
-    tts.tts_to_file(
-        text=text,
-        speaker_wav=voice_file,
-        language=language,
-        file_path=temp_audio_path
-    )
     return temp_audio_path
 @spaces.GPU(enable_queue=True)
 def clone_voice(text, audio_file, language):
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
         temp_audio_path = temp_audio.name
-    tts.tts_to_file(
-        text=text,
-        speaker_wav=audio_file,
-        language=language,
-        file_path=temp_audio_path
-    )
     return temp_audio_path
@@ -113,7 +147,7 @@ with gr.Blocks() as demo:
             with gr.Row():
                 clone_text = gr.Textbox(label="Text to speak")
                 clone_audio = gr.Audio(label="Voice reference audio file", type="filepath")
-                clone_language = gr.Dropdown(["en", "es", "fr", "de", "it", "ar"], label="Language", value="en")
             clone_generate_btn = gr.Button("Generate")
             clone_output = gr.Audio(label="Generated Audio")
@@ -129,4 +163,4 @@ demo.launch()
 # Clean up temporary files (this will run after the Gradio server is closed)
 for file in os.listdir():
     if file.endswith('.wav') and file.startswith('tmp'):
-        os.remove(file)

     else:
         return "**All voice files are present.** 🎉"
+# Split text into newline-separated chunks of at most `max_tokens` words.
+def split_text_into_chunks(text, max_tokens=100):
+    """
+    Re-flow `text` into chunks of at most `max_tokens` words each.
+
+    A "token" here is a whitespace-separated word as produced by
+    `str.split()`, not a model-tokenizer token. Words inside a chunk are
+    re-joined with single spaces, so the original spacing and line breaks
+    of the input are not preserved.
+
+    Args:
+        text: The input string.
+        max_tokens: Maximum number of words per chunk. It is used as the
+            step of `range()`, so a value of 0 raises ValueError.
+
+    Returns:
+        One string with the chunks joined by newline characters. There is
+        no trailing newline, and empty or whitespace-only input yields "".
+    """
+    words = text.split()
+    chunks = []
+    # Walk the word list one chunk-sized slice at a time.
+    for i in range(0, len(words), max_tokens):
+        chunk = ' '.join(words[i:i + max_tokens])
+        chunks.append(chunk)
+    return '\n'.join(chunks)
 @spaces.GPU(duration=120)
 def tts_generate(text, voice, language):
+    """
+    Synthesize `text` with a preset voice and return the output audio path.
+
+    Args:
+        text: Text to speak.
+        voice: Key into `celebrity_voices`; the mapped value is the filename
+            of the reference recording fetched from the "nikkmitra/clone"
+            space.
+        language: Language code passed through to `tts.tts_to_file`.
+
+    Returns:
+        The path of the temporary .wav file on success. If the voice lookup,
+        the download, or the synthesis raises, an error-message string is
+        returned instead.
+    """
+    # NOTE(review): the error paths return a message rather than a file
+    # path — confirm the component wired to this function can show a plain
+    # string. The temporary file is also left on disk in that case.
+    # Check for Hindi language and split text if necessary
+    if language == "hi":
+        text = split_text_into_chunks(text, max_tokens=100)
+    # delete=False keeps the file after the `with` block closes it; only its
+    # name is needed here, and it is reused as the output path below.
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
         temp_audio_path = temp_audio.name
+    try:
+        # The `celebrity_voices[voice]` lookup sits inside this try, so an
+        # unknown voice is reported as a download error as well.
+        voice_file = hf_hub_download(repo_id="nikkmitra/clone", filename=celebrity_voices[voice], repo_type="space", token=hf_token)
+    except Exception as e:
+        return f"Error downloading voice file: {e}"
+    try:
+        tts.tts_to_file(
+            text=text,
+            speaker_wav=voice_file,
+            language=language,
+            file_path=temp_audio_path
+        )
+    except AssertionError as ae:
+        # Assertion failures get their own, shorter message format.
+        return f"Error: {ae}"
+    except Exception as e:
+        return f"An unexpected error occurred: {e}"
     return temp_audio_path
 @spaces.GPU(enable_queue=True)
 def clone_voice(text, audio_file, language):
+    """
+    Synthesize `text` in the voice of a caller-supplied reference recording.
+
+    Args:
+        text: Text to speak.
+        audio_file: Reference audio, passed to `tts.tts_to_file` as
+            `speaker_wav`.
+        language: Language code passed through to `tts.tts_to_file`.
+
+    Returns:
+        The path of the temporary .wav file on success. If the synthesis
+        raises, an error-message string is returned instead.
+    """
+    # NOTE(review): the error paths return a message rather than a file
+    # path — confirm the component wired to this function can show a plain
+    # string. The temporary file is also left on disk in that case.
+    # Check for Hindi language and split text if necessary
+    if language == "hi":
+        text = split_text_into_chunks(text, max_tokens=100)
+    # delete=False keeps the file after the `with` block closes it; only its
+    # name is needed here, and it is reused as the output path below.
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
         temp_audio_path = temp_audio.name
+    try:
+        tts.tts_to_file(
+            text=text,
+            speaker_wav=audio_file,
+            language=language,
+            file_path=temp_audio_path
+        )
+    except AssertionError as ae:
+        # Assertion failures get their own, shorter message format.
+        return f"Error: {ae}"
+    except Exception as e:
+        return f"An unexpected error occurred: {e}"
     return temp_audio_path
             with gr.Row():
                 clone_text = gr.Textbox(label="Text to speak")
                 clone_audio = gr.Audio(label="Voice reference audio file", type="filepath")
+                clone_language = gr.Dropdown(["en", "es", "fr", "de", "it", "ar", "hi"], label="Language", value="en")
             clone_generate_btn = gr.Button("Generate")
             clone_output = gr.Audio(label="Generated Audio")
 # Clean up temporary files (this will run after the Gradio server is closed)
 # Removes every entry in the current working directory whose name starts
 # with 'tmp' and ends with '.wav'.
 # NOTE(review): os.listdir() with no argument lists the current working
 # directory only. The NamedTemporaryFile calls in this file pass no `dir=`,
 # so the generated files presumably live in tempfile's default directory —
 # confirm this loop actually finds them.
 for file in os.listdir():
     if file.endswith('.wav') and file.startswith('tmp'):
+        os.remove(file)