Spaces:

meraj12
/

cloningapp

Sleeping

App Files Community

meraj12 committed on Apr 9, 2025

Commit

5e80325

verified ·

1 Parent(s): e1681aa

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -5

app.py CHANGED Viewed

@@ -22,18 +22,30 @@ if "clone_path" not in st.session_state:
     st.session_state.clone_path = None
 if "voice_gender" not in st.session_state:
     st.session_state.voice_gender = "Male"  # Default to Male
 # Sidebar for voice cloning setup
 st.sidebar.header("🧬 Setup Your Clone Voice")
 voice_option = st.sidebar.radio("Choose how to provide clone voice", ["Upload Voice"])
 st.session_state.voice_gender = st.sidebar.selectbox("Select Voice Gender", ["Male", "Female"])
 if voice_option == "Upload Voice":
     uploaded = st.sidebar.file_uploader("Upload a voice sample", type=["wav", "mp3", "m4a", "flac", "ogg"])
     if uploaded:
         path = save_uploaded_audio(uploaded, "reference_voice.wav")
         st.session_state.clone_path = path
-        st.success("✅ Voice uploaded and saved as your clone voice.")
 # --- Conversation section ---
 st.subheader("🗣️ Ask with voice or type text below")
@@ -55,9 +67,10 @@ with tab1:
         # Step 2: Get LLM response
         st.info("Thinking...")
         response = groq_client.chat.completions.create(
             model="llama3-8b-8192",
-            messages=[{"role": "user", "content": user_text}]
         )
         reply = response.choices[0].message.content
         st.success(f"🤖 AI says: {reply}")
@@ -65,7 +78,7 @@ with tab1:
         # Step 3: Voice reply
         if st.session_state.clone_path:
             st.info("Cloning voice reply...")
-            voice_preset = get_voice_preset(st.session_state.voice_gender)
             voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path, voice_preset)
             st.audio(voice_output_path)
         else:
@@ -80,9 +93,10 @@ with tab2:
         else:
             # Step 1: Get LLM response
             st.info("Thinking...")
             response = groq_client.chat.completions.create(
                 model="llama3-8b-8192",
-                messages=[{"role": "user", "content": user_input}]
             )
             reply = response.choices[0].message.content
             st.success(f"🤖 AI says: {reply}")
@@ -90,7 +104,7 @@ with tab2:
             # Step 2: Voice reply
             if st.session_state.clone_path:
                 st.info("Cloning voice reply...")
-                voice_preset = get_voice_preset(st.session_state.voice_gender)
                 voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path, voice_preset)
                 st.audio(voice_output_path)
             else:

     st.session_state.clone_path = None
 if "voice_gender" not in st.session_state:
     st.session_state.voice_gender = "Male"  # Default to Male
+if "voice_name" not in st.session_state:
+    st.session_state.voice_name = "MyVoice"
+if "emotion" not in st.session_state:
+    st.session_state.emotion = "Neutral"
+if "language" not in st.session_state:
+    st.session_state.language = "English"
+if "ai_persona" not in st.session_state:
+    st.session_state.ai_persona = "Assistant"
 # Sidebar for voice cloning setup
 st.sidebar.header("🧬 Setup Your Clone Voice")
 voice_option = st.sidebar.radio("Choose how to provide clone voice", ["Upload Voice"])
 st.session_state.voice_gender = st.sidebar.selectbox("Select Voice Gender", ["Male", "Female"])
+st.session_state.voice_name = st.sidebar.text_input("Name your voice", value=st.session_state.voice_name)
+st.session_state.emotion = st.sidebar.selectbox("Select Emotion", ["Neutral", "Happy", "Sad", "Angry", "Excited", "Calm"])
+st.session_state.language = st.sidebar.selectbox("Select Language", ["English", "Urdu", "Hindi", "Arabic", "Spanish"])
+st.session_state.ai_persona = st.sidebar.selectbox("Select AI Personality", ["Assistant", "Urdu Teacher", "Wise Mentor", "Chill Friend", "Formal Assistant"])
 if voice_option == "Upload Voice":
     uploaded = st.sidebar.file_uploader("Upload a voice sample", type=["wav", "mp3", "m4a", "flac", "ogg"])
     if uploaded:
         path = save_uploaded_audio(uploaded, "reference_voice.wav")
         st.session_state.clone_path = path
+        st.success(f"✅ Voice '{st.session_state.voice_name}' uploaded and saved as your clone voice.")
 # --- Conversation section ---
 st.subheader("🗣️ Ask with voice or type text below")
         # Step 2: Get LLM response
         st.info("Thinking...")
+        persona_prompt = f"You are a {st.session_state.ai_persona}. Respond in {st.session_state.language} with a {st.session_state.emotion} tone."
         response = groq_client.chat.completions.create(
             model="llama3-8b-8192",
+            messages=[{"role": "system", "content": persona_prompt}, {"role": "user", "content": user_text}]
         )
         reply = response.choices[0].message.content
         st.success(f"🤖 AI says: {reply}")
         # Step 3: Voice reply
         if st.session_state.clone_path:
             st.info("Cloning voice reply...")
+            voice_preset = get_voice_preset(st.session_state.voice_gender, st.session_state.emotion)
             voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path, voice_preset)
             st.audio(voice_output_path)
         else:
         else:
             # Step 1: Get LLM response
             st.info("Thinking...")
+            persona_prompt = f"You are a {st.session_state.ai_persona}. Respond in {st.session_state.language} with a {st.session_state.emotion} tone."
             response = groq_client.chat.completions.create(
                 model="llama3-8b-8192",
+                messages=[{"role": "system", "content": persona_prompt}, {"role": "user", "content": user_input}]
             )
             reply = response.choices[0].message.content
             st.success(f"🤖 AI says: {reply}")
             # Step 2: Voice reply
             if st.session_state.clone_path:
                 st.info("Cloning voice reply...")
+                voice_preset = get_voice_preset(st.session_state.voice_gender, st.session_state.emotion)
                 voice_output_path = clone_and_generate_text(reply, st.session_state.clone_path, voice_preset)
                 st.audio(voice_output_path)
             else: