Spaces:

Aranwer
/

Kasoti

Sleeping

App Files Files Community

Aranwer committed on May 2, 2025

Commit

a374aef

verified ·

1 Parent(s): f7a3e32

Update app.py

Browse files

Files changed (1) hide show

app.py +127 -85

app.py CHANGED Viewed

@@ -1,41 +1,46 @@
-import streamlit as st
 import speech_recognition as sr
 import tempfile
 import scipy.io.wavfile
 import os
-import requests
 import numpy as np
-# API Keys
-os.environ["MISTRAL_API_KEY"] = "your-mistral-key"
-os.environ["GROQ_API_KEY"] = "your-groq-key"
-# Game State
-if "state" not in st.session_state:
-    st.session_state.state = {
-        "active": False,
-        "questions_asked": 0,
-        "answers": [],
-        "current_question": None,
-        "consult_mode": False
-    }
-# Functions
-def transcribe_audio(uploaded_file, language):
-    if uploaded_file is None:
         return ""
     try:
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
-            tmp_file.write(uploaded_file.read())
             tmp_file_path = tmp_file.name
         recognizer = sr.Recognizer()
         with sr.AudioFile(tmp_file_path) as source:
-            audio = recognizer.record(source)
-            lang_code = "en-US" if language == "English" else "ur-PK"
-            return recognizer.recognize_google(audio, language=lang_code).lower()
     except Exception as e:
-        return f"Transcription error: {e}"
 def query_llm(api, messages, model=None):
     headers = {
@@ -46,90 +51,127 @@ def query_llm(api, messages, model=None):
         "messages": messages,
         "model": model or ("llama3-70b-8192" if api == "GROQ" else "mistral-medium")
     }
-    url = "https://api.groq.com/openai/v1/chat/completions" if api == "GROQ" else "https://api.mistral.ai/v1/chat/completions"
-    response = requests.post(url, headers=headers, json=payload)
-    if response.ok:
-        return response.json()["choices"][0]["message"]["content"]
-    return "API Error"
-def normalize_answer(ans):
-    ans = ans.strip().lower()
-    return "yes" if ans in ["yes", "y", "ہاں", "haan"] else "no" if ans in ["no", "n", "نہیں", "nahi"] else None
 def generate_question(answers):
-    prompt = "You are playing Kasoti. Ask the next best yes/no question.\n\n"
     for i, (q, a) in enumerate(answers, 1):
         prompt += f"{i}. Q: {q}\n   A: {a}\n"
-    return query_llm("GROQ", [{"role": "user", "content": prompt}])
 def make_guess(answers):
-    prompt = "Based on this history, make a best guess:\n\n"
     for i, (q, a) in enumerate(answers, 1):
         prompt += f"{i}. Q: {q}\n   A: {a}\n"
-    return query_llm("GROQ", [{"role": "user", "content": prompt}])
 def get_hint(question, answers):
-    prompt = f"The player is unsure about: {question}\n\nHistory:\n"
     for q, a in answers:
         prompt += f"- Q: {q}\n  A: {a}\n"
-    return query_llm("MISTRAL", [{"role": "user", "content": prompt}])
-# Streamlit UI
-st.set_page_config(page_title="🎮 Kasoti 20Q", layout="centered")
-st.title("🎮 Kasoti - 20 Questions Game")
-st.info("Think of a famous person, place, or object. Answer with **yes/no** or **ہاں/نہیں** only.")
-if st.button("🔄 Start Game"):
-    st.session_state.state.update({
         "active": True,
         "questions_asked": 1,
         "answers": [],
         "current_question": "Is it a living thing?",
         "consult_mode": False
     })
-if st.session_state.state["active"]:
-    st.success(f"🤔 Question {st.session_state.state['questions_asked']}: {st.session_state.state['current_question']}")
-    with st.form(key="answer_form"):
-        audio_file = st.file_uploader("🎙️ Upload your answer (WAV only)", type=["wav"])
-        language = st.selectbox("🗣️ Language", ["English", "Urdu"])
-        manual_input = st.text_input("💬 Or type your answer:")
-        submit = st.form_submit_button("➡️ Submit")
-    if submit:
-        answer = manual_input or transcribe_audio(audio_file, language)
-        normalized = normalize_answer(answer)
-        if not normalized:
-            st.warning("⚠️ Please reply with 'yes' or 'no' (or 'ہاں/نہیں').")
         else:
-            question = st.session_state.state["current_question"]
-            st.session_state.state["answers"].append((question, normalized))
-            if "is this correct?" in question.lower():
-                if normalized == "yes":
-                    st.balloons()
-                    st.success("🎉 I guessed it right!")
-                    st.session_state.state["active"] = False
-                else:
-                    next_q = generate_question(st.session_state.state["answers"])
-                    st.session_state.state["current_question"] = next_q
-                    st.session_state.state["questions_asked"] += 1
-            elif st.session_state.state["questions_asked"] >= 20:
-                st.session_state.state["active"] = False
-                guess = make_guess(st.session_state.state["answers"])
-                st.error(f"❌ Game over! Final guess: {guess}")
-            elif st.session_state.state["questions_asked"] % 5 == 0:
-                guess = make_guess(st.session_state.state["answers"])
-                st.session_state.state["current_question"] = guess + " Is this correct?"
-                st.session_state.state["questions_asked"] += 1
-            else:
-                next_q = generate_question(st.session_state.state["answers"])
-                st.session_state.state["current_question"] = next_q
-                st.session_state.state["questions_asked"] += 1
-if st.session_state.state["active"]:
-    if st.toggle("💡 Enable Consult Mode"):
-        hint = get_hint(st.session_state.state["current_question"], st.session_state.state["answers"])
-        st.info(f"💭 Hint: {hint}")

+# app.py
+import gradio as gr
+import requests
 import speech_recognition as sr
 import tempfile
 import scipy.io.wavfile
 import os
 import numpy as np
+# Set your API keys as HF secrets or environment variables
+os.environ["MISTRAL_API_KEY"] = os.getenv("MISTRAL_API_KEY", "your-mistral-key")
+os.environ["GROQ_API_KEY"] = os.getenv("GROQ_API_KEY", "your-groq-key")
+game_state = {
+    "active": False,
+    "questions_asked": 0,
+    "answers": [],
+    "current_question": None,
+    "consult_mode": False
+}
+def transcribe_audio(audio, language):
+    if audio is None:
         return ""
     try:
+        sr_rate, audio_data = audio
+        if isinstance(audio_data, tuple):
+            audio_data = np.array(audio_data)
+        with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp_file:
+            scipy.io.wavfile.write(tmp_file.name, sr_rate, audio_data)
             tmp_file_path = tmp_file.name
         recognizer = sr.Recognizer()
         with sr.AudioFile(tmp_file_path) as source:
+            audio_content = recognizer.record(source)
+            language_code = "en-US" if language == "English" else "ur-PK"
+            text = recognizer.recognize_google(audio_content, language=language_code)
+            return text.lower()
     except Exception as e:
+        print(f"Transcription error: {e}")
+        return ""
 def query_llm(api, messages, model=None):
     headers = {
         "messages": messages,
         "model": model or ("llama3-70b-8192" if api == "GROQ" else "mistral-medium")
     }
+    endpoint = {
+        "MISTRAL": "https://api.mistral.ai/v1/chat/completions",
+        "GROQ": "https://api.groq.com/openai/v1/chat/completions"
+    }[api]
+    response = requests.post(endpoint, headers=headers, json=payload)
+    if response.status_code == 200:
+        return response.json()["choices"][0]["message"]["content"]
+    else:
+        print(f"Error from {api} API: {response.text}")
+        return None
 def generate_question(answers):
+    prompt = "You are playing a game called Kasoti (20 Questions)...\n"
     for i, (q, a) in enumerate(answers, 1):
         prompt += f"{i}. Q: {q}\n   A: {a}\n"
+    prompt += "\nAsk ONLY the next best yes/no question."
+    response = query_llm("GROQ", [{"role": "user", "content": prompt}])
+    return response.strip() if response else "Is it something you can hold?"
 def make_guess(answers):
+    prompt = "Based on the following yes/no history, make a best guess.\n\nHistory:\n"
     for i, (q, a) in enumerate(answers, 1):
         prompt += f"{i}. Q: {q}\n   A: {a}\n"
+    response = query_llm("GROQ", [{"role": "user", "content": prompt}])
+    return response.strip() if response else "I need more information."
 def get_hint(question, answers):
+    prompt = f"The player is unsure about answering: '{question}'\n\nHistory:\n"
     for q, a in answers:
         prompt += f"- Q: {q}\n  A: {a}\n"
+    prompt += "\nSuggest a helpful hint to clarify."
+    return query_llm("MISTRAL", [{"role": "user", "content": prompt}]) or "Consider the common meaning."
+def normalize_answer(ans):
+    ans = ans.strip().lower()
+    return "yes" if ans in ["yes", "y", "ہاں", "haan"] else "no" if ans in ["no", "n", "نہیں", "nahi"] else None
+def start_game():
+    game_state.update({
         "active": True,
         "questions_asked": 1,
         "answers": [],
         "current_question": "Is it a living thing?",
         "consult_mode": False
     })
+    intro = "🎯 **Kasoti Started!**\nThink of something... I'll guess in 20 questions.\n\n➡️ First Question: **Is it a living thing?**"
+    return intro, gr.update(interactive=True), gr.update(interactive=True), "🔕 Consult Mode: OFF", gr.update(visible=False)
+def process_answer(answer_text):
+    if not game_state["active"]:
+        return "⚠️ Start the game first.", "", "", gr.update(visible=False)
+    normalized = normalize_answer(answer_text)
+    if normalized is None:
+        return "❌ Please reply with 'yes' or 'no' (or 'ہاں/نہیں').", "", answer_text, gr.update(visible=game_state["consult_mode"])
+    if "is this correct?" in (game_state["current_question"] or "").lower():
+        if normalized == "yes":
+            game_state["active"] = False
+            return "🎉 YAY! I guessed it!", "", answer_text, gr.update(visible=False)
         else:
+            next_q = generate_question(game_state["answers"])
+            game_state["current_question"] = next_q
+            game_state["questions_asked"] += 1
+            return next_q, "", answer_text, gr.update(visible=game_state["consult_mode"])
+    game_state["answers"].append((game_state["current_question"], normalized))
+    if game_state["questions_asked"] >= 20:
+        game_state["active"] = False
+        guess = make_guess(game_state["answers"])
+        return f"🕹️ Game over! My final guess: **{guess}**", "", answer_text, gr.update(visible=False)
+    if game_state["questions_asked"] % 5 == 0:
+        guess = make_guess(game_state["answers"])
+        if guess.startswith("I think it's"):
+            game_state["current_question"] = guess + " Is this correct? (yes/no)"
+            return game_state["current_question"], "", answer_text, gr.update(visible=game_state["consult_mode"])
+    next_q = generate_question(game_state["answers"])
+    game_state["current_question"] = next_q
+    game_state["questions_asked"] += 1
+    return next_q, "", answer_text, gr.update(visible=game_state["consult_mode"])
+def toggle_consult_mode():
+    game_state["consult_mode"] = not game_state["consult_mode"]
+    return ("🔔 Consult Mode: ON" if game_state["consult_mode"] else "🔕 Consult Mode: OFF",
+            gr.update(visible=game_state["consult_mode"]))
+def get_consult_hint():
+    if not game_state["active"] or not game_state["consult_mode"]:
+        return "ℹ️ Consult mode is not active or game not started."
+    return get_hint(game_state["current_question"], game_state["answers"])
+# Colorful and polished UI
+with gr.Blocks(css=".gr-button {background-color: #4CAF50; color: white} .gr-box {background: #f7f7ff; border: 1px solid #ccc; padding: 10px; border-radius: 10px;}") as demo:
+    gr.Markdown("## 🧠 Kasoti: 20 Questions AI Game")
+    gr.Markdown("Think of a person, place, or thing. I'll try to guess it in 20 questions or less! Just answer 'yes' or 'no'.")
+    with gr.Row():
+        start_btn = gr.Button("🚀 Start Game")
+        consult_btn = gr.Button("💬 Toggle Consult Mode")
+        consult_status = gr.Textbox(label="Consult Mode", interactive=False)
+    with gr.Row():
+        with gr.Column():
+            language = gr.Dropdown(["English", "Urdu"], label="Audio Language", value="English")
+            audio_input = gr.Audio(label="🎤 Answer via Microphone", type="numpy", sources=["microphone"])
+            transcribe_btn = gr.Button("📝 Transcribe Audio")
+            transcribed_text = gr.Textbox(label="✍️ Answer Text", interactive=True)
+            submit_btn = gr.Button("✅ Submit Answer")
+        with gr.Column():
+            game_output = gr.Textbox(label="🎲 Game Progress", interactive=False)
+            consult_output = gr.Textbox(label="💡 Consult Hint", visible=False)
+    start_btn.click(start_game, outputs=[game_output, transcribed_text, submit_btn, consult_status, consult_output])
+    consult_btn.click(toggle_consult_mode, outputs=[consult_status, consult_output])
+    consult_btn.click(get_consult_hint, outputs=[consult_output])
+    transcribe_btn.click(transcribe_audio, inputs=[audio_input, language], outputs=[transcribed_text])
+    submit_btn.click(process_answer, inputs=[transcribed_text], outputs=[game_output, transcribed_text, transcribed_text, consult_output])
+demo.launch()