Spaces:

Wills17
/

Fridge2Dish

Running

App Files Community

Wills17 committed on Nov 25, 2025

Commit

344d8c3

verified ·

1 Parent(s): 4ea7b45

Update FastAPI_app.py

Browse files

Files changed (1) hide show

FastAPI_app.py +41 -50

FastAPI_app.py CHANGED Viewed

@@ -6,6 +6,7 @@ import io
 import time
 import traceback
 import threading
 import uvicorn
 import numpy as np
@@ -22,9 +23,6 @@ import tensorflow as tf
 import google.generativeai as genai
 from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 # CONFIGURATION
 # Ingredient model (load once)
@@ -47,12 +45,10 @@ else:
         'pineapple', 'pomegranate', 'potato', 'raddish', 'soy beans', 'spinach', 'sweetcorn',
         'sweetpotato', 'tomato', 'turnip', 'watermelon'
     ]
-# Get HF token
-hf_token = os.getenv("HF_TOKEN")
-if not hf_token:
-    raise ValueError("Token not found in environment variable 'HF_TOKEN'.")
 # Thread-safe lazy loading
@@ -60,48 +56,43 @@ _lock = threading.Lock()
 _tokenizer = None
 _model = None
-def load_gemma2_2b():
     global _tokenizer, _model
     if _model is not None:
         return _tokenizer, _model
     with _lock:
         if _model is not None:
             return _tokenizer, _model
-        print("\n🔵 [Fallback] Loading Gemma-2-2B-it 4-bit")
-        quantization_config = BitsAndBytesConfig(
-            load_in_4bit=True,
-            bnb_4bit_compute_dtype=torch.float16,
-            bnb_4bit_quant_type="nf4"
-        )
-        _tokenizer = AutoTokenizer.from_pretrained("google/gemma-2-2b-it", token=hf_token)
-        _model = AutoModelForCausalLM.from_pretrained(
-            "google/gemma-2-2b-it",
-            device_map="auto",
-            quantization_config=quantization_config,
-            torch_dtype=torch.float16,
-            trust_remote_code=True
-        )
-        print("\n🟢 [Fallback] Gemma-2-2B ready!")
-        return _tokenizer, _model
-def generate_recipe_gemma(ingredient_names):
-    tokenizer, model = load_gemma2_2b()
-    prompt = f"""<start_of_turn>user
-        You are an AI chef. Create a short recipe using only: {', '.join(ingredient_names)}.
-        Include:
-        - Recipe name
-        - One-sentence description
-        - Ingredients list with quantities
-        - 6-10 concise steps
-        - Optional tips
-        RETURN RESULT IN MARKDOWN FORMAT ONLY.<end_of_turn>
-        <start_of_turn>model
-        """
     inputs = tokenizer(prompt, return_tensors="pt")
     outputs = model.generate(
         inputs.input_ids,
@@ -112,7 +103,7 @@ def generate_recipe_gemma(ingredient_names):
     )
     recipe_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
     # Strip the prompt part
-    return recipe_text.split("<start_of_turn>model")[-1].strip()
 # Infer uploaded image function
@@ -196,25 +187,25 @@ async def upload_image(file: UploadFile = File(...), user_api_key: str = Form(al
                 RETURN RESULT IN MARKDOWN FORMAT ONLY.
                 """
-                print("Trying Gemini...")
                 response = model.generate_content(prompt)
                 recipe_text = response.text.strip()
-                print("Gemini succeeded.")
             except Exception as e_gemini:
                 print("Gemini failed:", e_gemini)
                 try:
-                    recipe_text = generate_recipe_gemma(ingredient_names)
                 except Exception as e_local1:
-                    print("Gemma local failed:", e_local1)
                     raise e_local1
         else:
             try:
-                print("\n🟡 No API key → Using Gemma fallback.")
-                recipe_text = generate_recipe_gemma(ingredient_names)
             except Exception as e_local2:
-                print("Gemma local failed:", e_local2)
                 raise e_local2
         return {"ingredients": ingredients, "recipe": recipe_text}

 import time
 import traceback
 import threading
+import signal
 import uvicorn
 import numpy as np
 import google.generativeai as genai
 from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 # CONFIGURATION
 # Ingredient model (load once)
         'pineapple', 'pomegranate', 'potato', 'raddish', 'soy beans', 'spinach', 'sweetcorn',
         'sweetpotato', 'tomato', 'turnip', 'watermelon'
     ]
+# Phi-3.5-mini-instruct local model loading
+def timeout_handler(signum, frame):
+    raise TimeoutError("Model load timed out after 300s")
 # Thread-safe lazy loading
 _tokenizer = None
 _model = None
+def load_phi_3_5_mini_instruct():
     global _tokenizer, _model
     if _model is not None:
         return _tokenizer, _model
     with _lock:
         if _model is not None:
             return _tokenizer, _model
+        signal.signal(signal.SIGALRM, timeout_handler)
+        signal.alarm(300)  # 5 min timeout
+        try:
+            print("\n🔵 [Fallback] Loading Phi-3.5-mini-instruct")
+            quantization_config = BitsAndBytesConfig(
+                load_in_4bit=True,
+                bnb_4bit_compute_dtype=torch.float16,
+                bnb_4bit_quant_type="nf4"
+            )
+            _tokenizer = AutoTokenizer.from_pretrained("microsoft/Phi-3.5-mini-instruct", trust_remote_code=True)
+            _model = AutoModelForCausalLM.from_pretrained(
+                "microsoft/Phi-3.5-mini-instruct",
+                device_map="auto",
+                quantization_config=quantization_config,
+                torch_dtype=torch.float16,
+                trust_remote_code=True
+            )
+            print("\n🟢 [Fallback] Phi-3.5 ready!")
+            return _tokenizer, _model
+        except TimeoutError:
+            print("\n🔴 [Fallback] Phi-3.5 load timed out.")
+            signal.alarm(0)
+            raise RuntimeError("\n🔴 Model load failed.")
+def generate_recipe_phi(ingredient_names):
+    tokenizer, model = load_phi_3_5_mini_instruct()  # Now loads Phi-3
+    prompt = f"<|user|>\nYou are an AI chef. Create a short recipe using only: {', '.join(ingredient_names)}.\nInclude:\n- Recipe name\n- One-sentence description\n- Ingredients list with quantities\n- 6-10 concise steps\n- Optional tips\nRETURN RESULT IN MARKDOWN FORMAT ONLY.<|end|>\n<|assistant|>\n"""
     inputs = tokenizer(prompt, return_tensors="pt")
     outputs = model.generate(
         inputs.input_ids,
     )
     recipe_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
     # Strip the prompt part
+    return recipe_text.split("<|assistant|>")[-1].strip()
 # Infer uploaded image function
                 RETURN RESULT IN MARKDOWN FORMAT ONLY.
                 """
+                print("\n🟡 Trying Gemini...")
                 response = model.generate_content(prompt)
                 recipe_text = response.text.strip()
+                print("\n🟢 Gemini succeeded.")
             except Exception as e_gemini:
                 print("Gemini failed:", e_gemini)
                 try:
+                    recipe_text = generate_recipe_phi(ingredient_names)
                 except Exception as e_local1:
+                    print("\n🔴 Phi local failed:", e_local1)
                     raise e_local1
         else:
             try:
+                print("\n🟡 No API key → Using Phi-3.5 fallback.")
+                recipe_text = generate_recipe_phi(ingredient_names)
             except Exception as e_local2:
+                print("\n🔴 Phi local failed:", e_local2)
                 raise e_local2
         return {"ingredients": ingredients, "recipe": recipe_text}