Spaces:

Oriserve
/

OriTTS

Running

App Files Files Community

ajajali09 committed on May 13, 2025

Commit

0faef2a

1 Parent(s): cd4dc72

Added error logs and changed some emojis

Browse files

Files changed (1) hide show

app.py +34 -19

app.py CHANGED Viewed

@@ -74,7 +74,7 @@ def get_random_sentence(language):
 def toggle_generate_button_state(choice, text_input, recording_data=None):
-    if choice == "Predefined Voice":
         return (
             gr.update(interactive=True),
             gr.update(
@@ -85,7 +85,7 @@ def toggle_generate_button_state(choice, text_input, recording_data=None):
             gr.update(visible=False, value=None),
         )
-    elif choice == "Record/Upload Voice":
         if recording_data is None:
             return (
                 gr.update(interactive=False),
@@ -382,6 +382,17 @@ def handle_input_pronunc_pair(key,value,pronunc_dict):
         gr.Error("Tried to set key value pair in pronunciation dict with empty value please check input")
 def process_voice_clone(filepath, user_id):
     try:
         url = parameters.voice_clone_URL
         payload = {"user_id": user_id}
@@ -396,14 +407,14 @@ def process_voice_clone(filepath, user_id):
             response = response.json()
             response = response["voice_id"]
             return response
         else:
             response = response.json()
-            gr.Error(response["message"])
-            return ["Jyoti"]
     except Exception as e:
         print(f"An Error occurred: {e}")
-        gr.Error("Falid to clone your voice and reverting to default voice")
-        return ["Jyoti"]
 def tts_inference(
     session_id: str,
@@ -428,10 +439,14 @@ def tts_inference(
         clone_voice_name = process_voice_clone(recording_data, user_id)
         if clone_voice_name is not None:
             voice_name = str(clone_voice_name)
     else:
         voice_name = [agents[agent]]
-    print("Parameters Recieved:\n")
     print("speechReqId", session_id)
     print("text", [text])
     print("language", [language_codes[language]])
@@ -443,7 +458,7 @@ def tts_inference(
     print("speech_rate", speech_rate)
     print("loudness", loudness)
     print("refine_grneration", refine_generation)
-    print("\n")
     try:
         if not text or text.strip() == "":
@@ -549,7 +564,7 @@ def tts_inference(
                         code=response.status_code,
                         session_id=session_id,
                         language=language,
-                        input_method="Select Voice" if agent else "Record/Upload Voice",
                         agent_used=voice_name,
                         voice_path=saved_path,
                         text_input=text,
@@ -620,10 +635,10 @@ def tts_tab():
             🌐 **Select Language**
             * Choose from our listed languages
-            🎭 **Choose Voice**
             * Select from the curated collection of high-quality voices
             * Each voice is optimized for natural speech patterns
-            * You can give your on voice by clicking on Record/Upload Voice
             ✍️ **Enter Your Text**
             * Type or paste your text in the input box
@@ -644,7 +659,7 @@ def tts_tab():
             * Your feedback helps improve our system
             💾 **Access Your Audio**
-            * Download generated audio for offline use
             """)
                 # Language and Voice Selection
@@ -678,16 +693,16 @@ def tts_tab():
                         )
                     input_toggle = gr.Radio(
-                        choices=["Predefined Voice", "Record/Upload Voice"],
-                        value="Predefined Voice",
-                        label="🎭 Choose Input Method",
                         interactive=True,
                         visible=True,
                     )
                     with gr.Row():
                         agent_dropdown = gr.Dropdown(
-                            label="🎭 Select Voice",
                             choices=list(agents.keys()),
                             value=list(agents.keys())[0],
                             interactive=True,
@@ -852,13 +867,13 @@ def tts_tab():
                     gr.HTML("""
                         <div class="voice-param-heading">💡 Pro Tips</div>
                         <ul style="margin-top: 5px; padding-left: 15px; font-size: 1em;">
-                            <li>For minimal hallucination use default low values</li>
                             <li>Start with defaults and adjust gradually</li>
                             <li>Test different combinations for specific use cases</li>
                             <li>Higher values may increase processing time</li>
                             <li>Monitor quality vs performance trade-offs</li>
-                            <li>Add your pronunciation of any words if doesn't sound well</li>
-                            <li>If you don't like the pronunce of any word then add your on word with key and value pair</li>
                             <li><b style = "color:red">Note:-</b>Pronunciation pairs are <i style="color:red">case sensitive</i></li>
                         </ul>
                     """)

 def toggle_generate_button_state(choice, text_input, recording_data=None):
+    if choice == "Ori voices":
         return (
             gr.update(interactive=True),
             gr.update(
             gr.update(visible=False, value=None),
         )
+    elif choice == "Voice clone":
         if recording_data is None:
             return (
                 gr.update(interactive=False),
         gr.Error("Tried to set key value pair in pronunciation dict with empty value please check input")
 def process_voice_clone(filepath, user_id):
+    """
+    Make the clone of given audio
+    Parameters:
+    -filepath(str): The given audio path
+    -user_id(str): User id
+    Returns:
+    -voice name(str):The voice name of the cloned voice
+    """
     try:
         url = parameters.voice_clone_URL
         payload = {"user_id": user_id}
             response = response.json()
             response = response["voice_id"]
             return response
+        elif response.status_code==422:
+            print(response.text)
         else:
             response = response.json()
+            return None
     except Exception as e:
         print(f"An Error occurred: {e}")
+        return None
 def tts_inference(
     session_id: str,
         clone_voice_name = process_voice_clone(recording_data, user_id)
         if clone_voice_name is not None:
             voice_name = str(clone_voice_name)
+            print(f"The voice name, get from voice clone API:::--{voice_name}")
+        else:
+            gr.Error("Sorry, we are facing some issues with cloning this voice.\nPlease reload the app and try again.")
+            print("Did not get any voice name from voice clone api:------")
     else:
         voice_name = [agents[agent]]
+    print("\nParameters Recieved:\n")
     print("speechReqId", session_id)
     print("text", [text])
     print("language", [language_codes[language]])
     print("speech_rate", speech_rate)
     print("loudness", loudness)
     print("refine_grneration", refine_generation)
+    print("\n\n")
     try:
         if not text or text.strip() == "":
                         code=response.status_code,
                         session_id=session_id,
                         language=language,
+                        input_method="Select Voice" if agent else "Voice clone",
                         agent_used=voice_name,
                         voice_path=saved_path,
                         text_input=text,
             🌐 **Select Language**
             * Choose from our listed languages
+            🎤 **Choose Voice**
             * Select from the curated collection of high-quality voices
             * Each voice is optimized for natural speech patterns
+            * You can give your own voice by clicking on Voice clone
             ✍️ **Enter Your Text**
             * Type or paste your text in the input box
             * Your feedback helps improve our system
             💾 **Access Your Audio**
+            * Download the generated audio for offline use
             """)
                 # Language and Voice Selection
                         )
                     input_toggle = gr.Radio(
+                        choices=["Ori voices", "Voice clone"],
+                        value="Ori voices",
+                        label="🎤 Choose Input Method",
                         interactive=True,
                         visible=True,
                     )
                     with gr.Row():
                         agent_dropdown = gr.Dropdown(
+                            label="🗣️ Select Voice",
                             choices=list(agents.keys()),
                             value=list(agents.keys())[0],
                             interactive=True,
                     gr.HTML("""
                         <div class="voice-param-heading">💡 Pro Tips</div>
                         <ul style="margin-top: 5px; padding-left: 15px; font-size: 1em;">
+                            <li>For minimal hallucination, use default low values</li>
                             <li>Start with defaults and adjust gradually</li>
                             <li>Test different combinations for specific use cases</li>
                             <li>Higher values may increase processing time</li>
                             <li>Monitor quality vs performance trade-offs</li>
+                            <li>Add your pronunciation of any word that doesn't sound well</li>
+                            <li>If you don't like the pronunciation of any word, then add your word with the key and value pair</li>
                             <li><b style = "color:red">Note:-</b>Pronunciation pairs are <i style="color:red">case sensitive</i></li>
                         </ul>
                     """)