Spaces:

KB-Infinity-Tech
/

AIMSRICDAy3AIMathTutorforEarlyLearners

Sleeping

App Files Community

KB-Infinity-Tech committed on Apr 24

Commit

01176da

verified ·

1 Parent(s): aa13ec6

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +38 -37

src/streamlit_app.py CHANGED Viewed

@@ -4,7 +4,8 @@ import torch
 from langdetect import detect
 from PIL import Image
 import numpy as np
-import pyttsx3
 # ----------------------------
 # Load Model
@@ -24,13 +25,14 @@ def load_model():
 tokenizer, model = load_model()
 # ----------------------------
-# TTS (Offline)
 # ----------------------------
-engine = pyttsx3.init()
-def speak(text):
-    engine.say(text)
-    engine.runAndWait()
 # ----------------------------
 # Language Detection
@@ -46,7 +48,7 @@ def detect_lang(text):
 # ----------------------------
 def build_prompt(user_input, lang):
     if lang == "fr":
-        system = "Tu es un tuteur de mathématiques pour enfants. Réponds simplement avec des exemples."
     elif lang == "sw":
         system = "Wewe ni mwalimu wa hesabu kwa watoto. Eleza kwa urahisi."
     else:
@@ -68,7 +70,7 @@ def generate(prompt):
     return tokenizer.decode(output[0], skip_special_tokens=True)
 # ----------------------------
-# Visual Counting (Lightweight)
 # ----------------------------
 def count_objects(image):
     img = np.array(image.convert("L"))
@@ -77,21 +79,22 @@ def count_objects(image):
     return max(1, count)
 # ----------------------------
-# UI DASHBOARD
 # ----------------------------
 st.set_page_config(layout="wide")
-st.title("🧠📊 AI Math Tutor Dashboard")
 col1, col2 = st.columns(2)
 # ----------------------------
-# LEFT PANEL — INTERACTION
 # ----------------------------
 with col1:
     st.header("👧 Student Interaction")
     mode = st.radio("Choose Mode", ["Text", "Image (Count)", "Voice (Simulated)"])
     if mode == "Text":
         user_input = st.text_input("Ask a math question:")
@@ -99,17 +102,17 @@ with col1:
             lang = detect_lang(user_input)
             prompt = build_prompt(user_input, lang)
-            response = generate(prompt)
             st.write("### 📘 Answer")
             st.write(response)
             if st.button("🔊 Speak Answer"):
-                speak(response)
-    # ----------------------------
-    # IMAGE MODE (Visual Learning)
-    # ----------------------------
     elif mode == "Image (Count)":
         uploaded = st.file_uploader("Upload image with objects", type=["png", "jpg"])
@@ -119,52 +122,50 @@ with col1:
             count = count_objects(image)
-            st.write(f"### 🧮 I see about: {count} objects")
-            explanation = f"There are about {count} objects. Let's count together!"
-            st.write(explanation)
             if st.button("🔊 Speak"):
-                speak(explanation)
-    # ----------------------------
-    # VOICE MODE (SIMULATED)
-    # ----------------------------
     elif mode == "Voice (Simulated)":
-        st.write("🎤 Voice input simulation (type what child says)")
         voice_input = st.text_input("Child says:")
         if voice_input:
             lang = detect_lang(voice_input)
             prompt = build_prompt(voice_input, lang)
             response = generate(prompt)
             st.write("### 🎧 Tutor Response")
             st.write(response)
             if st.button("🔊 Speak Response"):
-                speak(response)
 # ----------------------------
-# RIGHT PANEL — PROGRESS
 # ----------------------------
 with col2:
-    st.header("📈 Learning Progress")
-    # Fake metrics (replace with SQLite later)
     st.metric("Questions Answered", 12)
     st.metric("Accuracy", "75%")
     st.metric("Level", "Beginner → Improving")
-    st.subheader("📊 Skill Breakdown")
     st.progress(0.7)
-    st.subheader("🌍 Language Detected")
-    st.write("Auto-detected per input")
-    st.subheader("⚡ System Info")
-    st.write("CPU Mode ✔")
-    st.write("Offline-ready ✔")
-    st.write("Multilingual ✔")

 from langdetect import detect
 from PIL import Image
 import numpy as np
+from gtts import gTTS
+import tempfile
 # ----------------------------
 # Load Model
 tokenizer, model = load_model()
 # ----------------------------
+# Text-to-Speech (HF SAFE)
 # ----------------------------
+def speak(text, lang="en"):
+    tts = gTTS(text=text, lang=lang)
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as fp:
+        tts.save(fp.name)
+        return fp.name
 # ----------------------------
 # Language Detection
 # ----------------------------
 def build_prompt(user_input, lang):
     if lang == "fr":
+        system = "Tu es un tuteur de mathématiques pour enfants. Explique simplement avec des exemples."
     elif lang == "sw":
         system = "Wewe ni mwalimu wa hesabu kwa watoto. Eleza kwa urahisi."
     else:
     return tokenizer.decode(output[0], skip_special_tokens=True)
 # ----------------------------
+# Visual Counting
 # ----------------------------
 def count_objects(image):
     img = np.array(image.convert("L"))
     return max(1, count)
 # ----------------------------
+# UI CONFIG
 # ----------------------------
 st.set_page_config(layout="wide")
+st.title("🧠📊 AI Math Tutor (Multimodal)")
 col1, col2 = st.columns(2)
 # ----------------------------
+# LEFT PANEL — STUDENT
 # ----------------------------
 with col1:
     st.header("👧 Student Interaction")
     mode = st.radio("Choose Mode", ["Text", "Image (Count)", "Voice (Simulated)"])
+    # ---------------- TEXT MODE ----------------
     if mode == "Text":
         user_input = st.text_input("Ask a math question:")
             lang = detect_lang(user_input)
             prompt = build_prompt(user_input, lang)
+            with st.spinner("Thinking..."):
+                response = generate(prompt)
             st.write("### 📘 Answer")
             st.write(response)
             if st.button("🔊 Speak Answer"):
+                audio_file = speak(response, lang)
+                st.audio(audio_file)
+    # ---------------- IMAGE MODE ----------------
     elif mode == "Image (Count)":
         uploaded = st.file_uploader("Upload image with objects", type=["png", "jpg"])
             count = count_objects(image)
+            explanation = f"I see about {count} objects. Let's count together!"
+            st.write(f"### 🧮 {explanation}")
             if st.button("🔊 Speak"):
+                audio_file = speak(explanation)
+                st.audio(audio_file)
+    # ---------------- VOICE MODE ----------------
     elif mode == "Voice (Simulated)":
+        st.write("🎤 Simulate child's speech (type it)")
         voice_input = st.text_input("Child says:")
         if voice_input:
             lang = detect_lang(voice_input)
             prompt = build_prompt(voice_input, lang)
             response = generate(prompt)
             st.write("### 🎧 Tutor Response")
             st.write(response)
             if st.button("🔊 Speak Response"):
+                audio_file = speak(response, lang)
+                st.audio(audio_file)
 # ----------------------------
+# RIGHT PANEL — DASHBOARD
 # ----------------------------
 with col2:
+    st.header("📈 Learning Dashboard")
+    # Demo metrics (replace with SQLite later)
     st.metric("Questions Answered", 12)
     st.metric("Accuracy", "75%")
     st.metric("Level", "Beginner → Improving")
+    st.subheader("📊 Skill Progress")
     st.progress(0.7)
+    st.subheader("🌍 Language Handling")
+    st.write("Auto-detect + multilingual response")
+    st.subheader("⚡ System Status")
+    st.success("CPU Mode")
+    st.success("Multimodal Enabled")
+    st.success("Deployable on Hugging Face")