arshenoy committed on
Commit
f618d4b
·
verified ·
1 Parent(s): 956cf6f

Implementation of 3 rollbacks to somAI

Browse files
Files changed (1) hide show
  1. services/geminiService.ts +103 -81
services/geminiService.ts CHANGED
@@ -20,9 +20,14 @@ const getApiKey = () => {
20
  const API_KEY = getApiKey();
21
  const ai = new GoogleGenAI({ apiKey: API_KEY });
22
 
23
- // CHANGED: Switched to Flash-Lite for 1,000 Requests/Day (vs 250 for standard Flash)
24
- const MODEL_FAST = 'gemini-2.5-flash-lite';
 
 
 
 
25
  const MODEL_TTS = 'gemini-2.5-flash-preview-tts';
 
26
  const FALLBACK_API_BASE = 'https://arshenoy-somai-backend.hf.space';
27
 
28
  // Cleaning for final blocks
@@ -147,25 +152,21 @@ const parseRiskResponse = (text: string, calculatedScore: number): RiskAnalysisR
147
  }
148
  };
149
 
150
- // --- UPDATED: NAME EXTRACTION & TTS ---
151
-
152
  export const extractClinicalData = async (imageBase64: string): Promise<ExtractionResult> => {
153
  const base64Data = imageBase64.includes('base64,') ? imageBase64.split('base64,')[1] : imageBase64;
154
- // Improved Prompt for Name Extraction
155
  const prompt = `Analyze this medical document.
156
  CRITICAL: Look for the Patient's Name at the top, headers, or labeled 'Patient', 'Name', 'Mr/Mrs'.
157
  Extract JSON: { name, age, condition, history, allergies, systolicBp, glucose, heartRate, weight, temperature, spo2, clinicalNote }.
158
  If name is missing, use "Guest". Return JSON only.`;
159
 
160
- try {
161
- if (!API_KEY) throw new Error("API Key missing");
162
-
163
  const response = await ai.models.generateContent({
164
- model: MODEL_FAST,
165
  contents: [{ role: 'user', parts: [{ text: prompt }, { inlineData: { mimeType: 'image/jpeg', data: base64Data } }] }],
166
  config: { responseMimeType: "application/json", maxOutputTokens: 2000 }
167
  });
168
-
169
  const text = response.text || "{}";
170
  const data = JSON.parse(text);
171
  return {
@@ -173,13 +174,29 @@ export const extractClinicalData = async (imageBase64: string): Promise<Extracti
173
  vitals: { systolicBp: data.systolicBp, glucose: data.glucose, heartRate: data.heartRate, weight: data.weight, temperature: data.temperature, spo2: data.spo2, clinicalNote: data.clinicalNote },
174
  confidence: 0.9
175
  };
 
176
 
 
 
 
 
177
  } catch (e: any) {
 
 
 
 
 
 
 
 
 
 
 
178
  try {
 
179
  const compressedBase64 = await compressImage(imageBase64);
180
  const cleanBase64 = compressedBase64.includes('base64,') ? compressedBase64.split('base64,')[1] : compressedBase64;
181
  const resText = await callFallbackAPI('/vision', { image: cleanBase64, prompt: "Extract patient name and vitals from this document in JSON format." });
182
-
183
  return {
184
  profile: {},
185
  vitals: { clinicalNote: `[Auto-Scanned]: ${resText}` },
@@ -200,14 +217,9 @@ export const generateSpeech = async (text: string): Promise<string | null> => {
200
  contents: [{ parts: [{ text }] }],
201
  config: {
202
  responseModalities: ['AUDIO'],
203
- speechConfig: {
204
- voiceConfig: {
205
- prebuiltVoiceConfig: { voiceName: 'Fenrir' }, // Fenrir = Cool Male Voice
206
- },
207
- },
208
  },
209
  });
210
- // Return Base64 Audio Data
211
  return response.candidates?.[0]?.content?.parts?.[0]?.inlineData?.data || null;
212
  } catch (e) {
213
  console.warn("TTS Failed", e);
@@ -229,6 +241,7 @@ export const transcribeAudio = async (audioBlob: Blob): Promise<string> => {
229
  });
230
  };
231
 
 
232
  export const analyzeRisk = async (profile: PatientProfile, vitals: ClinicalVitals, calculatedScore: number): Promise<RiskAnalysisResult> => {
233
  const prompt = `
234
  Act as a Senior Clinical Risk Assessor.
@@ -241,32 +254,44 @@ export const analyzeRisk = async (profile: PatientProfile, vitals: ClinicalVital
241
  Return JSON.
242
  `;
243
 
244
- try {
245
- if (!API_KEY) throw new Error("API Key missing");
246
  const response = await ai.models.generateContent({
247
- model: MODEL_FAST,
248
- contents: prompt,
249
- config: {
250
- responseMimeType: "application/json",
251
- maxOutputTokens: 4000,
252
- responseSchema: {
253
- type: Type.OBJECT,
254
- properties: {
255
- summary: { type: Type.STRING },
256
- actionItems: { type: Type.ARRAY, items: { type: Type.STRING } },
257
- primaryConditionCode: { type: Type.OBJECT, properties: { code: {type: Type.STRING}, description: {type: Type.STRING} } },
258
- historyCodes: { type: Type.ARRAY, items: { type: Type.OBJECT, properties: { code: {type: Type.STRING}, description: {type: Type.STRING} } } },
259
- insuranceNote: { type: Type.STRING }
260
- },
261
- required: ["summary", "actionItems", "primaryConditionCode", "historyCodes", "insuranceNote"]
 
262
  }
263
- }
264
  });
265
- return {
266
- ...parseRiskResponse(response.text || "{}", calculatedScore),
267
- source: 'Gemini 2.5 Flash-Lite'
268
- };
 
 
 
269
  } catch (err: any) {
 
 
 
 
 
 
 
 
 
270
  try {
271
  const payload = { ...profile, ...vitals, riskScore: calculatedScore, prompt };
272
  const fallback = await callFallbackAPI('/analyze', payload);
@@ -282,43 +307,42 @@ export const analyzeRisk = async (profile: PatientProfile, vitals: ClinicalVital
282
 
283
  export const generateHealthInsights = async (profile: PatientProfile, vitals: ClinicalVitals): Promise<HealthInsights> => {
284
  const prompt = `Based on Patient: ${profile.name}, ${profile.age}y, ${profile.condition}. Vitals: BP ${vitals.systolicBp}, SpO2 ${vitals.spo2}%. Generate JSON: { weeklySummary, progress, tips: [] }.`;
285
- try {
286
- if (!API_KEY) throw new Error("No Key");
287
  const response = await ai.models.generateContent({
288
- model: MODEL_FAST,
289
  contents: prompt,
290
  config: { responseMimeType: "application/json", maxOutputTokens: 2000 }
291
  });
292
  return JSON.parse(response.text || "{}");
293
- } catch {
 
 
 
 
 
 
 
 
294
  return { weeklySummary: "Keep tracking your vitals.", progress: "Data accumulated.", tips: ["Maintain a balanced diet.", "Stay hydrated."] };
295
  }
296
  };
297
 
298
  export const generateSessionName = async (userText: string, aiText: string): Promise<string> => {
299
- const prompt = `Generate a very short, specific title (max 4 words) for a medical chat session based on this context.
300
- User: ${userText}
301
- AI: ${aiText}
302
- Title:`;
303
-
304
  try {
305
  if (!API_KEY) return "New Consultation";
306
- const response = await ai.models.generateContent({
307
- model: MODEL_FAST,
308
- contents: prompt,
309
- config: { maxOutputTokens: 20 }
310
- });
311
  return cleanText(response.text || "New Consultation").replace(/^["']|["']$/g, '');
312
  } catch (e) {
313
  try {
314
  const fallbackRes = await callFallbackAPI('/generate', { prompt: prompt });
315
  return cleanText(fallbackRes).replace(/^["']|["']$/g, '');
316
- } catch {
317
- return "New Consultation";
318
- }
319
  }
320
  };
321
 
 
322
  export const generateChatResponse = async (
323
  history: ChatMessage[],
324
  currentMessage: string,
@@ -340,50 +364,48 @@ export const generateChatResponse = async (
340
  const contents = history.map(msg => ({ role: msg.role === 'user' ? 'user' : 'model', parts: [{ text: msg.text }, ...(msg.image ? [{ inlineData: { mimeType: 'image/jpeg', data: msg.image.split('base64,')[1] } }] : [])] }));
341
  contents.push({ role: 'user', parts: [{ text: context + "\nUser: " + currentMessage }, ...(image ? [{ inlineData: { mimeType: 'image/jpeg', data: image.split('base64,')[1] } }] : [])] });
342
 
343
- try {
344
- if (!API_KEY) throw new Error("No Key");
345
-
346
- // 1. Try Gemini
347
- onSource('Gemini 2.5 Flash-Lite');
348
  const response = await ai.models.generateContent({
349
- model: MODEL_FAST,
350
- contents: contents,
351
- config: {
352
- maxOutputTokens: 4000,
353
- temperature: 0.7
354
- }
355
  });
356
-
357
  return cleanText(response.text || "I didn't catch that.");
 
358
 
359
- } catch (e) {
 
 
 
 
 
 
 
 
 
 
 
 
 
360
  try {
361
- // 2. Fallback
362
  onSource('Phi-3 Mini (Fallback)');
363
  const fallbackPrompt = `${context}\n\nChat History:\n${history.slice(-3).map(m => m.text).join('\n')}\nUser: ${currentMessage}`;
364
  const responseText = await callFallbackAPI('/generate', { prompt: fallbackPrompt });
365
  return cleanText(responseText);
366
-
367
  } catch {
368
  return "I'm having trouble connecting. Please check your internet.";
369
  }
370
  }
371
  };
372
 
373
- // --- UPDATED: CONTEXT-AWARE QUICK REPLIES ---
374
  export const generateQuickReplies = async (history: ChatMessage[]) => {
375
  if (!API_KEY || history.length === 0) return [];
376
-
377
- // Use last 3 messages for context
378
  const recentContext = history.slice(-3).map(m => `${m.role}: ${m.text}`).join('\n');
379
  const prompt = `Based on this conversation:\n${recentContext}\n\nSuggest 3 short, relevant follow-up questions the USER might want to ask next. Return ONLY a JSON array of strings.`;
380
-
381
  try {
382
- const res = await ai.models.generateContent({
383
- model: MODEL_FAST,
384
- contents: prompt,
385
- config: { responseMimeType: "application/json" }
386
- });
387
  return JSON.parse(res.text || "[]");
388
  } catch { return []; }
389
  };
@@ -391,7 +413,7 @@ export const generateQuickReplies = async (history: ChatMessage[]) => {
391
  export const summarizeConversation = async (history: ChatMessage[]) => {
392
  if (!API_KEY) return "Summary unavailable.";
393
  try {
394
- const res = await ai.models.generateContent({ model: MODEL_FAST, contents: `Summarize clinical conversation:\n${history.map(m=>m.text).join('\n')}` });
395
  return cleanText(res.text || "");
396
  } catch { return "Could not summarize."; }
397
  };
 
20
  const API_KEY = getApiKey();
21
  const ai = new GoogleGenAI({ apiKey: API_KEY });
22
 
23
+ // --- TIERED MODEL STRATEGY ---
24
+ // Tier 1: 1,000 RPD (Primary)
25
+ const MODEL_TIER_1 = 'gemini-2.5-flash-lite';
26
+ // Tier 2: 250 RPD (Backup High-Speed)
27
+ const MODEL_TIER_2 = 'gemini-2.5-flash';
28
+ // TTS Model
29
  const MODEL_TTS = 'gemini-2.5-flash-preview-tts';
30
+
31
  const FALLBACK_API_BASE = 'https://arshenoy-somai-backend.hf.space';
32
 
33
  // Cleaning for final blocks
 
152
  }
153
  };
154
 
155
+ // --- UPDATED: VISION EXTRACTION (TIER 1 -> TIER 2 -> FALLBACK) ---
 
156
  export const extractClinicalData = async (imageBase64: string): Promise<ExtractionResult> => {
157
  const base64Data = imageBase64.includes('base64,') ? imageBase64.split('base64,')[1] : imageBase64;
 
158
  const prompt = `Analyze this medical document.
159
  CRITICAL: Look for the Patient's Name at the top, headers, or labeled 'Patient', 'Name', 'Mr/Mrs'.
160
  Extract JSON: { name, age, condition, history, allergies, systolicBp, glucose, heartRate, weight, temperature, spo2, clinicalNote }.
161
  If name is missing, use "Guest". Return JSON only.`;
162
 
163
+ // Helper to call Gemini Vision
164
+ const callGeminiVision = async (modelName: string) => {
 
165
  const response = await ai.models.generateContent({
166
+ model: modelName,
167
  contents: [{ role: 'user', parts: [{ text: prompt }, { inlineData: { mimeType: 'image/jpeg', data: base64Data } }] }],
168
  config: { responseMimeType: "application/json", maxOutputTokens: 2000 }
169
  });
 
170
  const text = response.text || "{}";
171
  const data = JSON.parse(text);
172
  return {
 
174
  vitals: { systolicBp: data.systolicBp, glucose: data.glucose, heartRate: data.heartRate, weight: data.weight, temperature: data.temperature, spo2: data.spo2, clinicalNote: data.clinicalNote },
175
  confidence: 0.9
176
  };
177
+ };
178
 
179
+ try {
180
+ if (!API_KEY) throw new Error("API Key missing");
181
+ // 1. Try Tier 1 (Flash Lite)
182
+ return await callGeminiVision(MODEL_TIER_1);
183
  } catch (e: any) {
184
+ // 2. If Quota Error (429), Try Tier 2 (Flash)
185
+ if (e.toString().includes('429') || e.toString().includes('Quota')) {
186
+ try {
187
+ console.warn("Tier 1 Vision Quota Exceeded. Switching to Tier 2 (Flash)...");
188
+ return await callGeminiVision(MODEL_TIER_2);
189
+ } catch (e2) {
190
+ // Tier 2 Failed, proceed to fallback
191
+ }
192
+ }
193
+
194
+ // 3. Fallback (Moondream)
195
  try {
196
+ console.warn("Gemini Vision Failed. Attempting Fallback...");
197
  const compressedBase64 = await compressImage(imageBase64);
198
  const cleanBase64 = compressedBase64.includes('base64,') ? compressedBase64.split('base64,')[1] : compressedBase64;
199
  const resText = await callFallbackAPI('/vision', { image: cleanBase64, prompt: "Extract patient name and vitals from this document in JSON format." });
 
200
  return {
201
  profile: {},
202
  vitals: { clinicalNote: `[Auto-Scanned]: ${resText}` },
 
217
  contents: [{ parts: [{ text }] }],
218
  config: {
219
  responseModalities: ['AUDIO'],
220
+ speechConfig: { voiceConfig: { prebuiltVoiceConfig: { voiceName: 'Fenrir' } } },
 
 
 
 
221
  },
222
  });
 
223
  return response.candidates?.[0]?.content?.parts?.[0]?.inlineData?.data || null;
224
  } catch (e) {
225
  console.warn("TTS Failed", e);
 
241
  });
242
  };
243
 
244
+ // --- UPDATED: RISK ANALYSIS (TIER 1 -> TIER 2 -> FALLBACK) ---
245
  export const analyzeRisk = async (profile: PatientProfile, vitals: ClinicalVitals, calculatedScore: number): Promise<RiskAnalysisResult> => {
246
  const prompt = `
247
  Act as a Senior Clinical Risk Assessor.
 
254
  Return JSON.
255
  `;
256
 
257
+ // Helper for Gemini Call
258
+ const callGeminiRisk = async (modelName: string) => {
259
  const response = await ai.models.generateContent({
260
+ model: modelName,
261
+ contents: prompt,
262
+ config: {
263
+ responseMimeType: "application/json",
264
+ maxOutputTokens: 4000,
265
+ responseSchema: {
266
+ type: Type.OBJECT,
267
+ properties: {
268
+ summary: { type: Type.STRING },
269
+ actionItems: { type: Type.ARRAY, items: { type: Type.STRING } },
270
+ primaryConditionCode: { type: Type.OBJECT, properties: { code: {type: Type.STRING}, description: {type: Type.STRING} } },
271
+ historyCodes: { type: Type.ARRAY, items: { type: Type.OBJECT, properties: { code: {type: Type.STRING}, description: {type: Type.STRING} } } },
272
+ insuranceNote: { type: Type.STRING }
273
+ },
274
+ required: ["summary", "actionItems", "primaryConditionCode", "historyCodes", "insuranceNote"]
275
+ }
276
  }
 
277
  });
278
+ return { ...parseRiskResponse(response.text || "{}", calculatedScore), source: modelName === MODEL_TIER_1 ? 'Gemini 2.5 Flash-Lite' : 'Gemini 2.5 Flash' };
279
+ };
280
+
281
+ try {
282
+ if (!API_KEY) throw new Error("API Key missing");
283
+ // 1. Try Tier 1
284
+ return await callGeminiRisk(MODEL_TIER_1);
285
  } catch (err: any) {
286
+ // 2. If Quota Error, Try Tier 2
287
+ if (err.toString().includes('429') || err.toString().includes('Quota')) {
288
+ try {
289
+ console.warn("Tier 1 Risk Quota Exceeded. Switching to Tier 2...");
290
+ return await callGeminiRisk(MODEL_TIER_2);
291
+ } catch (e2) {}
292
+ }
293
+
294
+ // 3. Fallback
295
  try {
296
  const payload = { ...profile, ...vitals, riskScore: calculatedScore, prompt };
297
  const fallback = await callFallbackAPI('/analyze', payload);
 
307
 
308
  export const generateHealthInsights = async (profile: PatientProfile, vitals: ClinicalVitals): Promise<HealthInsights> => {
309
  const prompt = `Based on Patient: ${profile.name}, ${profile.age}y, ${profile.condition}. Vitals: BP ${vitals.systolicBp}, SpO2 ${vitals.spo2}%. Generate JSON: { weeklySummary, progress, tips: [] }.`;
310
+
311
+ const callGeminiInsights = async (model: string) => {
312
  const response = await ai.models.generateContent({
313
+ model: model,
314
  contents: prompt,
315
  config: { responseMimeType: "application/json", maxOutputTokens: 2000 }
316
  });
317
  return JSON.parse(response.text || "{}");
318
+ }
319
+
320
+ try {
321
+ if (!API_KEY) throw new Error("No Key");
322
+ return await callGeminiInsights(MODEL_TIER_1);
323
+ } catch (err: any) {
324
+ if (err.toString().includes('429')) {
325
+ try { return await callGeminiInsights(MODEL_TIER_2); } catch (e) {}
326
+ }
327
  return { weeklySummary: "Keep tracking your vitals.", progress: "Data accumulated.", tips: ["Maintain a balanced diet.", "Stay hydrated."] };
328
  }
329
  };
330
 
331
  export const generateSessionName = async (userText: string, aiText: string): Promise<string> => {
332
+ const prompt = `Generate a very short, specific title (max 4 words) for a medical chat session based on this context. User: ${userText}. AI: ${aiText}. Title:`;
 
 
 
 
333
  try {
334
  if (!API_KEY) return "New Consultation";
335
+ const response = await ai.models.generateContent({ model: MODEL_TIER_1, contents: prompt, config: { maxOutputTokens: 20 } });
 
 
 
 
336
  return cleanText(response.text || "New Consultation").replace(/^["']|["']$/g, '');
337
  } catch (e) {
338
  try {
339
  const fallbackRes = await callFallbackAPI('/generate', { prompt: prompt });
340
  return cleanText(fallbackRes).replace(/^["']|["']$/g, '');
341
+ } catch { return "New Consultation"; }
 
 
342
  }
343
  };
344
 
345
+ // --- UPDATED: CHAT (TIER 1 -> TIER 2 -> FALLBACK) ---
346
  export const generateChatResponse = async (
347
  history: ChatMessage[],
348
  currentMessage: string,
 
364
  const contents = history.map(msg => ({ role: msg.role === 'user' ? 'user' : 'model', parts: [{ text: msg.text }, ...(msg.image ? [{ inlineData: { mimeType: 'image/jpeg', data: msg.image.split('base64,')[1] } }] : [])] }));
365
  contents.push({ role: 'user', parts: [{ text: context + "\nUser: " + currentMessage }, ...(image ? [{ inlineData: { mimeType: 'image/jpeg', data: image.split('base64,')[1] } }] : [])] });
366
 
367
+ // Helper for Chat
368
+ const callGeminiChat = async (modelName: string) => {
369
+ onSource(modelName === MODEL_TIER_1 ? 'Gemini 2.5 Flash-Lite' : 'Gemini 2.5 Flash');
 
 
370
  const response = await ai.models.generateContent({
371
+ model: modelName,
372
+ contents: contents,
373
+ config: { maxOutputTokens: 4000, temperature: 0.7 }
 
 
 
374
  });
 
375
  return cleanText(response.text || "I didn't catch that.");
376
+ };
377
 
378
+ try {
379
+ if (!API_KEY) throw new Error("No Key");
380
+ // 1. Try Tier 1
381
+ return await callGeminiChat(MODEL_TIER_1);
382
+ } catch (e: any) {
383
+ // 2. If Quota Error, Try Tier 2
384
+ if (e.toString().includes('429') || e.toString().includes('Quota')) {
385
+ try {
386
+ console.warn("Tier 1 Chat Quota Exceeded. Switching to Tier 2...");
387
+ return await callGeminiChat(MODEL_TIER_2);
388
+ } catch (e2) {}
389
+ }
390
+
391
+ // 3. Fallback
392
  try {
 
393
  onSource('Phi-3 Mini (Fallback)');
394
  const fallbackPrompt = `${context}\n\nChat History:\n${history.slice(-3).map(m => m.text).join('\n')}\nUser: ${currentMessage}`;
395
  const responseText = await callFallbackAPI('/generate', { prompt: fallbackPrompt });
396
  return cleanText(responseText);
 
397
  } catch {
398
  return "I'm having trouble connecting. Please check your internet.";
399
  }
400
  }
401
  };
402
 
 
403
  export const generateQuickReplies = async (history: ChatMessage[]) => {
404
  if (!API_KEY || history.length === 0) return [];
 
 
405
  const recentContext = history.slice(-3).map(m => `${m.role}: ${m.text}`).join('\n');
406
  const prompt = `Based on this conversation:\n${recentContext}\n\nSuggest 3 short, relevant follow-up questions the USER might want to ask next. Return ONLY a JSON array of strings.`;
 
407
  try {
408
+ const res = await ai.models.generateContent({ model: MODEL_TIER_1, contents: prompt, config: { responseMimeType: "application/json" } });
 
 
 
 
409
  return JSON.parse(res.text || "[]");
410
  } catch { return []; }
411
  };
 
413
  export const summarizeConversation = async (history: ChatMessage[]) => {
414
  if (!API_KEY) return "Summary unavailable.";
415
  try {
416
+ const res = await ai.models.generateContent({ model: MODEL_TIER_1, contents: `Summarize clinical conversation:\n${history.map(m=>m.text).join('\n')}` });
417
  return cleanText(res.text || "");
418
  } catch { return "Could not summarize."; }
419
  };