Spaces:

Oriserve
/

OriTTS

Running

App Files Files Community

ajajali09 committed on Dec 2, 2025

Commit

1558975

1 Parent(s): 5cb697f

fix in a bug

Browse files

Files changed (3) hide show

S3_bucket.py +0 -1
app.py +2 -21
utils.py +9 -52

S3_bucket.py CHANGED Viewed

@@ -183,5 +183,4 @@ class AWS:
         self.s3_client.upload_fileobj(
             obj, self.bucket_name, s3_key, ExtraArgs={"ContentType": "audio/wav"}
         )
-        print("raw wav file uploaded to s3!")
         return None

         self.s3_client.upload_fileobj(
             obj, self.bucket_name, s3_key, ExtraArgs={"ContentType": "audio/wav"}
         )
         return None

app.py CHANGED Viewed

@@ -74,7 +74,7 @@ if st.session_state.page == "Home":
         st.title("Home")
         st.markdown("---")
         st.header("Models......")
-        model = st.radio("Select Model", ["V1", "V2"])
         if model == "V1":
             st.header("Languages.....")
             language = st.selectbox("Select Language", list(utils.V1_LANGUAGES.keys()))
@@ -85,9 +85,6 @@ if st.session_state.page == "Home":
                 reference_audio = None
             else:
                 st.info("Give a reference audio (min 5 seconds)")
-                # audio_file = st.file_uploader("Reference Audio", type=['wav', 'mp3', 'flac'])
-                # reference_audio = audio_file
-                # default_speaker = None
                 audio_source = st.radio(
                     "Reference audio source",
                     ["Upload file", "Record audio"],
@@ -118,9 +115,6 @@ if st.session_state.page == "Home":
                 reference_audio = None
             else:
                 st.info("Give a reference audio (min 5 seconds)")
-                # audio_file = st.file_uploader("Reference Audio", type=['wav', 'mp3', 'flac'])
-                # reference_audio = audio_file
-                # default_speaker = None
                 audio_source = st.radio(
                     "Reference audio source",
                     ["Upload file", "Record audio"],
@@ -223,13 +217,9 @@ if st.session_state.page == "Home":
     if generate_btn:
         session_id = utils.generate_session_id()
-        print(f"\n\nGenerate btn is pressed.....\nThis is the session ID : -{session_id}")
         # Validate pronunciation input
-        # if pr_key.strip() and pr_value.strip():
         pronunciation_dict_str = st.session_state.pronunc_dict
-        # else:
-        #     pronunciation_dict_str = {}
         input_text = st.session_state.input_text
         if not input_text.strip():
@@ -284,7 +274,6 @@ if st.session_state.page == "Home":
                                 else:
                                     result = utils.v2_clone_voice(tmp_file.name, user_id, token)
                                 voice_id = result['voice_id']
-                                print(f"Voice Clone succesfully from mode {model} id is {voice_id}")
                                 reference_audio.seek(0)
                                 classes.upload_voice_clone_audio(reference_audio, voice_id)
                                 voice_path = cache_key
@@ -312,14 +301,6 @@ if st.session_state.page == "Home":
                             )
                         )
                     loop.close()
-                # st.success(status_msg)
-                # st.audio(audio, sample_rate=sr)
-                # st.session_state.show_feedback = True
-                # st.session_state.last_session_id = session_id
-                # st.success(status_msg)
                 # Store audio + session info in state, mark as available
                 st.session_state.last_msg = status_msg
                 st.session_state.last_audio = audio
@@ -327,7 +308,7 @@ if st.session_state.page == "Home":
                 st.session_state.last_session_id = session_id
                 st.session_state.has_audio = True
                 st.session_state.show_feedback = True
             except Exception as e:
                 st.error(f"Error: {str(e)}")
                 st.session_state.show_feedback = False

         st.title("Home")
         st.markdown("---")
         st.header("Models......")
+        model = st.radio("Select Model", ["V2", "V1"])
         if model == "V1":
             st.header("Languages.....")
             language = st.selectbox("Select Language", list(utils.V1_LANGUAGES.keys()))
                 reference_audio = None
             else:
                 st.info("Give a reference audio (min 5 seconds)")
                 audio_source = st.radio(
                     "Reference audio source",
                     ["Upload file", "Record audio"],
                 reference_audio = None
             else:
                 st.info("Give a reference audio (min 5 seconds)")
                 audio_source = st.radio(
                     "Reference audio source",
                     ["Upload file", "Record audio"],
     if generate_btn:
         session_id = utils.generate_session_id()
         # Validate pronunciation input
         pronunciation_dict_str = st.session_state.pronunc_dict
         input_text = st.session_state.input_text
         if not input_text.strip():
                                 else:
                                     result = utils.v2_clone_voice(tmp_file.name, user_id, token)
                                 voice_id = result['voice_id']
                                 reference_audio.seek(0)
                                 classes.upload_voice_clone_audio(reference_audio, voice_id)
                                 voice_path = cache_key
                             )
                         )
                     loop.close()
                 # Store audio + session info in state, mark as available
                 st.session_state.last_msg = status_msg
                 st.session_state.last_audio = audio
                 st.session_state.last_session_id = session_id
                 st.session_state.has_audio = True
                 st.session_state.show_feedback = True
+                print("Generation completed......")
             except Exception as e:
                 st.error(f"Error: {str(e)}")
                 st.session_state.show_feedback = False

utils.py CHANGED Viewed

@@ -46,16 +46,13 @@ def generate_session_id():
 def unpack_pkl_data(s3_key=parameters.pkl_data_key):
     exists = aws.check_if_exists(object_key=s3_key)
     if not exists:
-        print("Pickle file does not exist!!!")
         return None
     try:
         with aws.fs.open(f"s3://{aws.bucket_name}/{s3_key}", "rb") as f:
             file_bytes = f.read()
             loaded_data = pickle.loads(file_bytes)
-            print("Load pickle data completed.")
             return loaded_data
     except Exception as e:
-        print(f"Unable to load pickle file from S3 due to this: {e}")
         return None
 st.session_state.loaded_data = unpack_pkl_data()
@@ -69,7 +66,6 @@ if st.session_state.loaded_data:
     V1_SPEAKERS = st.session_state.loaded_data['V1_SPEAKERS']
     V2_SPEAKERS = st.session_state.loaded_data['V2_SPEAKERS']
 else:
-    print("Failed to load pickle data. Exiting script.")
     st.stop()
@@ -83,7 +79,6 @@ def save_generated_audio(audio_data, session_id):
         aws.s3_upload_wav(obj=audio_file, s3_key=s3_key)
         return s3_key
     except Exception as e:
-        print(f"Error saving generated audio: {e}")
         return None
 def audio_header_creater(audio, channels=1, sample_rate=8000, bits_per_sample=16):
@@ -123,6 +118,7 @@ def ensure_csv_exists(sep="|"):
             "speech_rate",
             "loudness",
             "refine_generation",
             "rating",
             "feedback",
         ]
@@ -154,6 +150,7 @@ def ensure_error_logs_csv_exists(sep="|"):
             "speech_rate",
             "loudness",
             "refine_generation",
         ]
         df = pd.DataFrame(columns=columns)
@@ -174,6 +171,7 @@ def log_initial_submission(
     user_id,
     voice_path,
     text_input,
     expressiveness=1.0,
     stability=100,
     clarity=1.0,
@@ -194,6 +192,7 @@ def log_initial_submission(
                 {
                     "timestamp": [timestamp],
                     "session_id": [session_id],
                     "language": [language],
                     "input_method": [input_method],
                     "agent_used": [agent_used if agent_used else "None"],
@@ -229,7 +228,6 @@ def log_initial_submission(
             return "Audio generated and saved!"
         except Exception as e:
-            print(f"Error saving submission: {e}")
             return f"Error: Could not save data - {str(e)}"
     else:
         try:
@@ -252,6 +250,7 @@ def log_initial_submission(
                     "speech_rate": [speech_rate],
                     "loudness": [loudness],
                     "refine_generation": [refine_generation],
                 }
             )
@@ -286,7 +285,6 @@ def update_rating(session_id, rating_index, feedback_msg: str):
         s3_csv_file = ensure_csv_exists(sep="|")
         if not aws.check_if_exists(object_key=s3_csv_file):
-            print(f"CSV file doesn't exist or is empty: {s3_csv_file}")
             return "Error: No data found"
         with aws.fs.open(f"s3://{aws.bucket_name}/{s3_csv_file}", "r") as f:
@@ -314,12 +312,10 @@ def update_rating(session_id, rating_index, feedback_msg: str):
                 st.success(f"Your rating of {star_dict[rating]} submitted successfully!!\nThank you for the feedback!!")
             )
         else:
-            print(f"Session {session_id} not found in the CSV file")
             return (
                 f"Could not find Session {session_id} in tracks\nMake sure to press Generate button Once!!!"
             ), None
     except Exception as e:
-        print(f"Error updating rating: {e}")
         return f"Error: Could not update rating - {str(e)}", None
@@ -424,7 +420,6 @@ async def v1_generate_speech_async(
     else:
         send_voice_id = voice_id
-    print(f"\nPayload for Generation:-\nRequest goes to:- {request_to}\nText:- {text}\nVoide Id : {send_voice_id}\nextra_body :{extra_body}\nextra_headers : {extra_headers}\n")
     # Use AsyncOpenAI streaming response (matches your original code)
     try:
         async with v1_client.audio.speech.with_streaming_response.create(
@@ -450,6 +445,7 @@ async def v1_generate_speech_async(
             user_id=user_id,
             voice_path=saved_path,
             text_input=text,
             expressiveness=expressive,
             stability=stability,
             clarity=clarity,
@@ -458,26 +454,7 @@ async def v1_generate_speech_async(
         )
         return sr, aud
     except Exception as e:
-        print(f"API request failed with status {response.status_code}")
-        print(f"Error:- {e}")
-        log_initial_submission(
-            code=response.status_code,
-            session_id=session_id,
-            language=language_code,
-            input_method=voice_mode,
-            agent_used=voice_id,
-            user_id=user_id,
-            voice_path=None,
-            text_input=text,
-            expressiveness=expressive,
-            stability=stability,
-            clarity=clarity,
-            speech_rate=speech_rate,
-            loudness=volume_level,
-            refine_generation=False,
-            err_code=response.status_code,
-            err_msg=e,
-        )
 async def v2_generate_speech_async(
         session_id: str,
@@ -515,7 +492,6 @@ async def v2_generate_speech_async(
     else:
         send_voice_id = voice_id
-    print(f"\nPayload for Generation:-\nRequest goes to:- {request_to}\nText:- {text}\nVoide Id : {send_voice_id}\nextra_body :{extra_body}\n")
     # Use AsyncOpenAI streaming response (matches your original code)
     try:
         async with v2_client.audio.speech.with_streaming_response.create(
@@ -540,32 +516,13 @@ async def v2_generate_speech_async(
             user_id=user_id,
             voice_path=saved_path,
             text_input=text,
             expressiveness=expressive,
             stability=stability,
             clarity=clarity,
             speech_rate=speech_rate,
             loudness=volume_level
         )
-        status_code = response.status_code
         return sr, aud
     except Exception as e:
-        print(f"API request failed with status {status_code}")
-        print(f"Error:- {e}")
-        log_initial_submission(
-            code=status_code,
-            session_id=session_id,
-            language=language_code,
-            input_method=voice_mode,
-            agent_used=voice_id,
-            user_id=user_id,
-            voice_path=None,
-            text_input=text,
-            expressiveness=expressive,
-            stability=stability,
-            clarity=clarity,
-            speech_rate=speech_rate,
-            loudness=volume_level,
-            refine_generation=False,
-            err_code=response.status_code,
-            err_msg=e,
-        )

 def unpack_pkl_data(s3_key=parameters.pkl_data_key):
     """Load and unpickle the object stored at *s3_key* in the app's S3 bucket.
 
     Args:
         s3_key: Object key inside ``aws.bucket_name``.
 
     Returns:
         The unpickled object, or ``None`` when the object does not exist or
         cannot be read/unpickled. Failures are logged instead of being
         silently discarded so a missing or corrupt file can be diagnosed.
     """
     import logging
     logger = logging.getLogger(__name__)
     if not aws.check_if_exists(object_key=s3_key):
         logger.warning("Pickle file not found in S3: %s", s3_key)
         return None
     try:
         with aws.fs.open(f"s3://{aws.bucket_name}/{s3_key}", "rb") as f:
             file_bytes = f.read()
         # NOTE(security): pickle.loads can execute arbitrary code; this is
         # only safe as long as the bucket contents are fully trusted.
         return pickle.loads(file_bytes)
     except Exception:
         # Best-effort load: keep returning None, but record the traceback.
         logger.exception("Unable to load pickle file from S3: %s", s3_key)
         return None
 st.session_state.loaded_data = unpack_pkl_data()
     V1_SPEAKERS = st.session_state.loaded_data['V1_SPEAKERS']
     V2_SPEAKERS = st.session_state.loaded_data['V2_SPEAKERS']
 else:
     st.stop()
         aws.s3_upload_wav(obj=audio_file, s3_key=s3_key)
         return s3_key
     except Exception as e:
         return None
 def audio_header_creater(audio, channels=1, sample_rate=8000, bits_per_sample=16):
             "speech_rate",
             "loudness",
             "refine_generation",
+            "model_name"
             "rating",
             "feedback",
         ]
             "speech_rate",
             "loudness",
             "refine_generation",
+            "model_name"
         ]
         df = pd.DataFrame(columns=columns)
     user_id,
     voice_path,
     text_input,
+    model_name,
     expressiveness=1.0,
     stability=100,
     clarity=1.0,
                 {
                     "timestamp": [timestamp],
                     "session_id": [session_id],
+                    "model_name":[model_name],
                     "language": [language],
                     "input_method": [input_method],
                     "agent_used": [agent_used if agent_used else "None"],
             return "Audio generated and saved!"
         except Exception as e:
             return f"Error: Could not save data - {str(e)}"
     else:
         try:
                     "speech_rate": [speech_rate],
                     "loudness": [loudness],
                     "refine_generation": [refine_generation],
+                    "model_name": [model_name]
                 }
             )
         s3_csv_file = ensure_csv_exists(sep="|")
         if not aws.check_if_exists(object_key=s3_csv_file):
             return "Error: No data found"
         with aws.fs.open(f"s3://{aws.bucket_name}/{s3_csv_file}", "r") as f:
                 st.success(f"Your rating of {star_dict[rating]} submitted successfully!!\nThank you for the feedback!!")
             )
         else:
             return (
                 f"Could not find Session {session_id} in tracks\nMake sure to press Generate button Once!!!"
             ), None
     except Exception as e:
         return f"Error: Could not update rating - {str(e)}", None
     else:
         send_voice_id = voice_id
     # Use AsyncOpenAI streaming response (matches your original code)
     try:
         async with v1_client.audio.speech.with_streaming_response.create(
             user_id=user_id,
             voice_path=saved_path,
             text_input=text,
+            model_name=request_to,
             expressiveness=expressive,
             stability=stability,
             clarity=clarity,
         )
         return sr, aud
     except Exception as e:
+        st.Error("There is some in Audios Generation. Pleace try later.")
 async def v2_generate_speech_async(
         session_id: str,
     else:
         send_voice_id = voice_id
     # Use AsyncOpenAI streaming response (matches your original code)
     try:
         async with v2_client.audio.speech.with_streaming_response.create(
             user_id=user_id,
             voice_path=saved_path,
             text_input=text,
+            model_name=request_to,
             expressiveness=expressive,
             stability=stability,
             clarity=clarity,
             speech_rate=speech_rate,
             loudness=volume_level
         )
         return sr, aud
     except Exception as e:
+        st.Error("There is some in Audios Generation. Pleace try later.")