Spaces:

SG2407
/

Aarogyan_Project

Paused

App Files Files Community

Sahil committed on Mar 29

Commit

75efae8

1 Parent(s): 49e98e5

Multilingual support added (Marathi, Hindi, English)

Browse files

Files changed (10) hide show

app/__pycache__/__init__.cpython-313.pyc +0 -0
app/__pycache__/config.cpython-313.pyc +0 -0
app/routers/assistant.py +2 -0
app/routers/buddy.py +7 -2
app/services/__pycache__/__init__.cpython-313.pyc +0 -0
app/services/__pycache__/ai.cpython-313.pyc +0 -0
app/services/__pycache__/rag_pipeline.cpython-313.pyc +0 -0
app/services/__pycache__/tts.cpython-313.pyc +0 -0
app/services/ai.py +21 -7
app/services/tts.py +4 -4

app/__pycache__/__init__.cpython-313.pyc CHANGED Viewed

Binary files a/app/__pycache__/__init__.cpython-313.pyc and b/app/__pycache__/__init__.cpython-313.pyc differ

app/__pycache__/config.cpython-313.pyc CHANGED Viewed

Binary files a/app/__pycache__/config.cpython-313.pyc and b/app/__pycache__/config.cpython-313.pyc differ

app/routers/assistant.py CHANGED Viewed

@@ -17,6 +17,7 @@ class MessageIn(BaseModel):
 class ChatRequest(BaseModel):
     conversation_id: Optional[str] = None
     message: str
 class ConversationCreate(BaseModel):
@@ -137,6 +138,7 @@ async def chat(
         user_message=body.message,
         history=history,
         profile_context=profile_context,
     )
     ai_reply = ai_result["reply"]
     ai_sources = ai_result.get("sources", [])

 class ChatRequest(BaseModel):
     conversation_id: Optional[str] = None
     message: str
+    preferred_language: str = "English"
 class ConversationCreate(BaseModel):
         user_message=body.message,
         history=history,
         profile_context=profile_context,
+        preferred_lang=body.preferred_language,
     )
     ai_reply = ai_result["reply"]
     ai_sources = ai_result.get("sources", [])

app/routers/buddy.py CHANGED Viewed

@@ -15,6 +15,10 @@ router = APIRouter(prefix="/buddy", tags=["emotional-buddy"])
 class BuddyTextRequest(BaseModel):
     text: str
     history: Optional[List[dict]] = None
 @router.post("/chat")
@@ -30,14 +34,15 @@ async def text_chat(
         raise HTTPException(status_code=422, detail="Text must not be empty")
     history = body.history or []
     # AI response
-    ai_text, mood_score, emotion = await emotional_buddy_respond(body.text, history)
     # TTS — non-critical: failure returns empty audio, client can still show text
     audio_response = b""
     try:
-        audio_response = await text_to_speech_bytes(ai_text)
     except Exception as tts_err:
         import logging
         logging.getLogger(__name__).warning("TTS failed: %s", tts_err)

 class BuddyTextRequest(BaseModel):
     text: str
     history: Optional[List[dict]] = None
+    preferred_language: str = "English"
+_LANG_CODE: dict[str, str] = {"English": "en", "Hindi": "hi", "Marathi": "mr"}
 @router.post("/chat")
         raise HTTPException(status_code=422, detail="Text must not be empty")
     history = body.history or []
+    lang_code = _LANG_CODE.get(body.preferred_language, "en")
     # AI response
+    ai_text, mood_score, emotion = await emotional_buddy_respond(body.text, history, body.preferred_language)
     # TTS — non-critical: failure returns empty audio, client can still show text
     audio_response = b""
     try:
+        audio_response = await text_to_speech_bytes(ai_text, lang_code)
     except Exception as tts_err:
         import logging
         logging.getLogger(__name__).warning("TTS failed: %s", tts_err)

app/services/__pycache__/__init__.cpython-313.pyc CHANGED Viewed

Binary files a/app/services/__pycache__/__init__.cpython-313.pyc and b/app/services/__pycache__/__init__.cpython-313.pyc differ

app/services/__pycache__/ai.cpython-313.pyc CHANGED Viewed

Binary files a/app/services/__pycache__/ai.cpython-313.pyc and b/app/services/__pycache__/ai.cpython-313.pyc differ

app/services/__pycache__/rag_pipeline.cpython-313.pyc CHANGED Viewed

Binary files a/app/services/__pycache__/rag_pipeline.cpython-313.pyc and b/app/services/__pycache__/rag_pipeline.cpython-313.pyc differ

app/services/__pycache__/tts.cpython-313.pyc CHANGED Viewed

Binary files a/app/services/__pycache__/tts.cpython-313.pyc and b/app/services/__pycache__/tts.cpython-313.pyc differ

app/services/ai.py CHANGED Viewed

@@ -79,7 +79,10 @@ entertainment, general trivia, etc. — respond ONLY with:
 • Do NOT use markdown headers (##), bold (**), or bullet-heavy formatting — write in clean prose
 • End complex answers with a gentle reminder to consult a qualified healthcare provider
-User medical profile context will be provided when available — use it to personalise responses."""
 _RAG_MEDICAL_SYSTEM = """\
 You are Aarogyan's Medical Health Assistant — a supportive, evidence-based AI health companion.
@@ -108,6 +111,9 @@ Use ONLY the provided context to answer. If the context is insufficient, say so
 • Write in clean prose — no markdown headers, no bold, no repeated ideas across paragraphs
 • End with a brief recommendation to consult a healthcare provider if the topic warrants it
 --- Retrieved Medical Context ---
 {context}
 --- End of Context ---
@@ -174,7 +180,10 @@ IMPORTANT: Always respond in JSON format:
   "response": "your empathetic, warm reply here",
   "mood_score": <integer 1-10>,
   "emotion": "<one of: happy, sad, angry, fearful, disgusted, surprised, neutral>"
-}"""
 async def _call_groq(messages: list[dict], system: str, temperature: float = 0.7) -> str:
@@ -222,6 +231,7 @@ async def _chat_with_rag(
     history: list[dict],
     profile_context: str,
     is_complex: bool = False,
 ) -> dict:
     """RAG-augmented chat: retrieve context then synthesise with Groq.
@@ -240,7 +250,7 @@ async def _chat_with_rag(
     if not context_str:
         logger.warning("RAG returned no context — falling back to plain LLM")
-        return await _chat_plain(user_message, history, profile_context)
     profile_section = ""
     if profile_context:
@@ -250,6 +260,7 @@ async def _chat_with_rag(
         context=context_str,
         profile_section=profile_section,
     )
     messages = [*history, {"role": "user", "content": user_message}]
     reply = await _call_groq(messages, system, temperature=0.2)
@@ -261,6 +272,7 @@ async def _chat_plain(
     user_message: str,
     history: list[dict],
     profile_context: str,
 ) -> dict:
     """Plain LLM chat without RAG (fallback when Qdrant returns nothing).
     Returns {"reply": str, "sources": []}
@@ -268,6 +280,7 @@ async def _chat_plain(
     system = MEDICAL_ASSISTANT_SYSTEM
     if profile_context:
         system += f"\n\n--- User Health Profile ---\n{profile_context}"
     messages = [*history, {"role": "user", "content": user_message}]
     reply = await _call_groq(messages, system)
     return {"reply": reply.strip(), "sources": []}
@@ -277,10 +290,11 @@ async def chat_with_ai(
     user_message: str,
     history: list[dict],
     profile_context: str,
 ) -> dict:
     """Returns {"reply": str, "sources": list[str]}."""
     is_complex = await _route_query(user_message)
-    return await _chat_with_rag(user_message, history, profile_context, is_complex=is_complex)
 async def summarise_document(ocr_text: str) -> dict:
@@ -308,11 +322,11 @@ async def summarise_document(ocr_text: str) -> dict:
 import re as _re
-async def emotional_buddy_respond(user_text: str, history: list[dict] | None = None) -> tuple[str, int, str]:
     """Returns (buddy_reply_text, mood_score, emotion)."""
-    messages = list(history or [])
     messages.append({"role": "user", "content": user_text})
-    raw = await _call_groq(messages, EMOTIONAL_BUDDY_SYSTEM)
     reply = raw
     mood_score = 5

 • Do NOT use markdown headers (##), bold (**), or bullet-heavy formatting — write in clean prose
 • End complex answers with a gentle reminder to consult a qualified healthcare provider
+User medical profile context will be provided when available — use it to personalise responses.
+━━━ LANGUAGE ━━━
+Detect the language of the user's message (English, Hindi, or Marathi) and respond in that exact same language. Use the user's preferred language as the fallback when the language is ambiguous."""
 _RAG_MEDICAL_SYSTEM = """\
 You are Aarogyan's Medical Health Assistant — a supportive, evidence-based AI health companion.
 • Write in clean prose — no markdown headers, no bold, no repeated ideas across paragraphs
 • End with a brief recommendation to consult a healthcare provider if the topic warrants it
+━━━ LANGUAGE ━━━
+Detect the language of the user's message (English, Hindi, or Marathi) and respond in that exact same language. Use the user's preferred language as the fallback when the language is ambiguous.
 --- Retrieved Medical Context ---
 {context}
 --- End of Context ---
   "response": "your empathetic, warm reply here",
   "mood_score": <integer 1-10>,
   "emotion": "<one of: happy, sad, angry, fearful, disgusted, surprised, neutral>"
+}
+━━━ LANGUAGE ━━━
+Detect the language of the user's message (English, Hindi, or Marathi) and write the "response" value in that exact same language. If the language is ambiguous, use the user's preferred language as the fallback. Always keep the JSON keys in English."""
 async def _call_groq(messages: list[dict], system: str, temperature: float = 0.7) -> str:
     history: list[dict],
     profile_context: str,
     is_complex: bool = False,
+    preferred_lang: str = "English",
 ) -> dict:
     """RAG-augmented chat: retrieve context then synthesise with Groq.
     if not context_str:
         logger.warning("RAG returned no context — falling back to plain LLM")
+        return await _chat_plain(user_message, history, profile_context, preferred_lang=preferred_lang)
     profile_section = ""
     if profile_context:
         context=context_str,
         profile_section=profile_section,
     )
+    system += f"\n\nThe user's preferred language is {preferred_lang}."
     messages = [*history, {"role": "user", "content": user_message}]
     reply = await _call_groq(messages, system, temperature=0.2)
     user_message: str,
     history: list[dict],
     profile_context: str,
+    preferred_lang: str = "English",
 ) -> dict:
     """Plain LLM chat without RAG (fallback when Qdrant returns nothing).
     Returns {"reply": str, "sources": []}
     system = MEDICAL_ASSISTANT_SYSTEM
     if profile_context:
         system += f"\n\n--- User Health Profile ---\n{profile_context}"
+    system += f"\n\nThe user's preferred language is {preferred_lang}."
     messages = [*history, {"role": "user", "content": user_message}]
     reply = await _call_groq(messages, system)
     return {"reply": reply.strip(), "sources": []}
     user_message: str,
     history: list[dict],
     profile_context: str,
+    preferred_lang: str = "English",
 ) -> dict:
     """Returns {"reply": str, "sources": list[str]}."""
     is_complex = await _route_query(user_message)
+    return await _chat_with_rag(user_message, history, profile_context, is_complex=is_complex, preferred_lang=preferred_lang)
 async def summarise_document(ocr_text: str) -> dict:
 import re as _re
+async def emotional_buddy_respond(user_text: str, history: list[dict] | None = None, preferred_lang: str = "English") -> tuple[str, int, str]:
     """Returns (buddy_reply_text, mood_score, emotion)."""
+    system = EMOTIONAL_BUDDY_SYSTEM + f"\n\nThe user's preferred language is {preferred_lang}."
     messages.append({"role": "user", "content": user_text})
+    raw = await _call_groq(messages, system, temperature=0.75)
     reply = raw
     mood_score = 5

app/services/tts.py CHANGED Viewed

@@ -30,12 +30,12 @@ def _split_text(text: str, limit: int = _MAX_CHARS) -> list[str]:
     return chunks or [text[:limit]]
-async def _fetch_chunk(client: httpx.AsyncClient, chunk: str) -> bytes:
     url = "https://translate.google.com/translate_tts"
     params = {
         "ie": "UTF-8",
         "q": chunk,
-        "tl": "en",
         "client": "tw-ob",
         "total": "1",
         "idx": "0",
@@ -47,7 +47,7 @@ async def _fetch_chunk(client: httpx.AsyncClient, chunk: str) -> bytes:
     return resp.content
-async def text_to_speech_bytes(text: str) -> bytes:
     """Convert text to speech using Google Translate TTS. Returns MP3 bytes.
     Splits long text into chunks and concatenates the audio.
     Raises on failure after 20 seconds total.
@@ -55,7 +55,7 @@ async def text_to_speech_bytes(text: str) -> bytes:
     chunks = _split_text(text)
     async with httpx.AsyncClient(timeout=15) as client:
         parts = await asyncio.wait_for(
-            asyncio.gather(*[_fetch_chunk(client, c) for c in chunks]),
             timeout=20,
         )
     return b"".join(parts)

     return chunks or [text[:limit]]
+async def _fetch_chunk(client: httpx.AsyncClient, chunk: str, lang: str = "en") -> bytes:
     url = "https://translate.google.com/translate_tts"
     params = {
         "ie": "UTF-8",
         "q": chunk,
+        "tl": lang,
         "client": "tw-ob",
         "total": "1",
         "idx": "0",
     return resp.content
+async def text_to_speech_bytes(text: str, lang: str = "en") -> bytes:
     """Convert text to speech using Google Translate TTS. Returns MP3 bytes.
     Splits long text into chunks and concatenates the audio.
     Raises on failure after 20 seconds total.
     chunks = _split_text(text)
     async with httpx.AsyncClient(timeout=15) as client:
         parts = await asyncio.wait_for(
+            asyncio.gather(*[_fetch_chunk(client, c, lang) for c in chunks]),
             timeout=20,
         )
     return b"".join(parts)