Spaces:

ramonsj11
/

ProyectoFinal_recetas

Sleeping

App Files Files Community

ProyectoFinal_recetas / app_optimized.py

ramonsj11

deploy: automated upload via deploy_to_hf.py

2d97a84 verified 11 days ago

raw

history blame contribute delete

45.8 kB

	"""
	app_optimized.py ― Recipe Recommender Multimodal Demo (optimised build)
	Hugging Face Space \| CPU-only \| Gradio 4.44

	Optimisation notes:
	• CNN + LLM load lazily on first use (lru_cache + threading.Lock).
	• Two-phase UX: Phase 1 (<3 s) = ingredients + recipe table;
	Phase 2 (~30 s) = LLM narration, user-triggered.
	• gr.HTML ingredient panel — real images OR coloured text badges.
	• Pipeline transparency panel — query, scores, per-stage timing.
	• gr.Examples — 5 predefined text queries for instant demos.
	"""

	# ── stdlib ────────────────────────────────────────────────────────────────────
	import base64
	import functools
	import json
	import os
	import threading
	import time
	from pathlib import Path

	# ── third-party ───────────────────────────────────────────────────────────────
	import faiss
	import gradio as gr

	# ── Patch 1: gradio_client 0.6.x — bool JSON-Schema values cause TypeError ───
	import gradio_client.utils as _gcu

	_orig_get_type = _gcu.get_type
	_orig_jstpt = _gcu._json_schema_to_python_type

	def _safe_get_type(schema):
	if not isinstance(schema, dict):
	return "Any"
	return _orig_get_type(schema)

	def _safe_jstpt(schema, defs=None):
	if not isinstance(schema, dict):
	return "Any"
	return _orig_jstpt(schema, defs)

	_gcu.get_type = _safe_get_type
	_gcu._json_schema_to_python_type = _safe_jstpt

	# ── Patch 2: Starlette >=1.0 changed TemplateResponse(name, ctx) → (req, name) ─
	import starlette.templating as _st

	_orig_TemplateResponse = _st.Jinja2Templates.TemplateResponse

	def _compat_TemplateResponse(self, args, *kwargs):
	# Old API (Starlette <1.0): TemplateResponse(name: str, context: dict, ...)
	# New API (Starlette >=1.0): TemplateResponse(request, name: str, context=...)
	if args and isinstance(args[0], str):
	name = args[0]
	context = args[1] if len(args) > 1 else kwargs.pop("context", {})
	request = context.get("request")
	return _orig_TemplateResponse(self, request, name, context=context, **kwargs)
	return _orig_TemplateResponse(self, args, *kwargs)

	_st.Jinja2Templates.TemplateResponse = _compat_TemplateResponse
	# ─────────────────────────────────────────────────────────────────────────────

	import pandas as pd
	import torch
	import torchvision.models as models
	import torchvision.transforms as T
	from huggingface_hub import hf_hub_download
	try:
	from llama_cpp import Llama
	_LLAMA_AVAILABLE = True
	except ImportError:
	Llama = None # type: ignore[assignment, misc]
	_LLAMA_AVAILABLE = False
	print("llama-cpp-python not available — LLM disabled")
	from PIL import Image
	from rapidfuzz import process as rfprocess
	from sentence_transformers import SentenceTransformer

	# ─────────────────────────────────────────────────────────────────────────────
	# CONFIG
	# ─────────────────────────────────────────────────────────────────────────────
	HF_USERNAME = os.environ.get("HF_USERNAME", "ramonsj11")
	HF_SPACE_NAME = os.environ.get("HF_SPACE_NAME", "ProyectoFinal_recetas")
	CNN_REPO = f"{HF_USERNAME}/recipe-ingredient-classifier"
	LLM_REPO = f"{HF_USERNAME}/recipe-llm-gguf"
	EMBED_MODEL = "sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2"
	_EMBED_SHORT = "multilingual-MiniLM-L12-v2 · 384-dim"

	DIETARY_CHOICES = ["any", "vegetarian", "vegan", "gluten-free", "dairy-free"]
	SPEED_CHOICES = ["any", "fast", "medium", "slow"]

	# Pastel palette for missing-ingredient badges
	_BADGE_COLORS = [
	"#FFB3B3", "#B3D9FF", "#B3FFB3", "#FFD9B3",
	"#E8B3FF", "#B3FFE8", "#FFE8B3", "#D9B3FF",
	]
	_GREY = Image.new("RGB", (200, 200), color=(210, 210, 210))

	# ─────────────────────────────────────────────────────────────────────────────
	# STARTUP ARTIFACTS — FAISS + embeddings (fast, always needed)
	# ─────────────────────────────────────────────────────────────────────────────
	print("Loading FAISS index…")
	faiss_index = faiss.read_index("recipe_faiss.index")

	print("Loading dataframe…")
	df = pd.read_parquet("df_final_embeddings.parquet").reset_index(drop=True)

	with open("ingredient_catalog.json") as _f:
	ingredient_catalog: dict[str, str] = json.load(_f)

	try:
	with open("class_labels.json") as _f:
	class_labels: dict[str, str] = json.load(_f)
	print(f" class_labels.json: {len(class_labels)} classes")
	except FileNotFoundError:
	class_labels = {}
	print(" class_labels.json not found — CNN disabled")

	NUM_CLASSES = len(class_labels)
	_catalog_keys = list(ingredient_catalog.keys())

	# Column-name compatibility — prefer Spanish column if present
	if "ingredient_text_es" in df.columns:
	INGR_COL = "ingredient_text_es"
	elif "ingredient_text" in df.columns:
	INGR_COL = "ingredient_text"
	else:
	INGR_COL = "ingredients_text_processed"
	DIETARY_COL = "dietary_profile" if "dietary_profile" in df.columns else "dietary_profile_updated"
	CUISINE_COL = "cuisine_list" if "cuisine_list" in df.columns else "cuisine"
	DISH_TYPE_COLS = [c for c in ("course_list", "course", "category", "subcategory") if c in df.columns]

	print(f" {len(df):,} recipes \| ingr_col={INGR_COL} \| dietary_col={DIETARY_COL}")

	print("Loading SentenceTransformer…")
	# Multilingual model — supports Spanish and English queries (384-dim, same as before)
	embedding_model = SentenceTransformer(EMBED_MODEL)

	print("Startup artifacts ready ✅ CNN + LLM will load on first use.")

	# ─────────────────────────────────────────────────────────────────────────────
	# OPTIMISATION 1 + 2 — lru_cache lazy loaders with thread-safe getters
	# ─────────────────────────────────────────────────────────────────────────────
	_cnn_lock = threading.Lock()
	_llm_lock = threading.Lock()

	_cnn_tf = T.Compose([
	T.Resize(256),
	T.CenterCrop(224),
	T.ToTensor(),
	T.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
	])


	@functools.lru_cache(maxsize=1)
	def _load_cnn_cached() -> torch.nn.Module:
	"""Download weights + build model exactly once; result cached in-process."""
	if NUM_CLASSES == 0:
	raise RuntimeError("class_labels.json not found — CNN unavailable")
	weights_path = hf_hub_download(repo_id=CNN_REPO, filename="efficientnet_ingredients.pth")
	mdl = models.efficientnet_b0(weights=None)
	mdl.classifier[1] = torch.nn.Linear(1280, NUM_CLASSES)
	mdl.load_state_dict(torch.load(weights_path, map_location="cpu"))
	mdl.eval()
	return mdl


	@functools.lru_cache(maxsize=1)
	def _load_llm_cached() -> "Llama":
	"""Download GGUF + initialise Llama exactly once; result cached in-process."""
	if not _LLAMA_AVAILABLE:
	raise RuntimeError("llama-cpp-python not installed — LLM unavailable")
	gguf_path = hf_hub_download(repo_id=LLM_REPO, filename="tinyllama-recipes-q4.gguf")
	return Llama(model_path=gguf_path, n_ctx=2048, n_threads=4, verbose=False)


	def get_cnn() -> torch.nn.Module:
	"""Thread-safe lazy getter — safe to call from concurrent Gradio requests."""
	with _cnn_lock:
	return _load_cnn_cached()


	def get_llm() -> Llama:
	"""Thread-safe lazy getter — safe to call from concurrent Gradio requests."""
	with _llm_lock:
	return _load_llm_cached()


	def _cnn_loaded() -> bool:
	return _load_cnn_cached.cache_info().currsize > 0


	def _llm_loaded() -> bool:
	return _load_llm_cached.cache_info().currsize > 0


	# ─────────────────────────────────────────────────────────────────────────────
	# FUNCTION 1 — ingredient classification (lazy CNN)
	# ─────────────────────────────────────────────────────────────────────────────
	def classify_ingredients(image: Image.Image) -> list[tuple[str, float]]:
	"""Return top-10 [(ingredient_name, confidence)] from a PIL image."""
	model = get_cnn()
	tensor = _cnn_tf(image.convert("RGB")).unsqueeze(0)
	with torch.no_grad():
	probs = torch.softmax(model(tensor), dim=1)[0]
	top10 = torch.topk(probs, 10)
	return [
	(class_labels.get(str(i.item()), f"class_{i.item()}"), s.item())
	for i, s in zip(top10.indices, top10.values)
	]


	# ─────────────────────────────────────────────────────────────────────────────
	# FUNCTION 5 — ingredient image lookup
	# ─────────────────────────────────────────────────────────────────────────────
	def get_ingredient_image(name: str) -> str \| None:
	"""Fuzzy-match name against catalog (threshold 72); return path or None."""
	hit = rfprocess.extractOne(name.lower(), _catalog_keys)
	if hit and hit[1] >= 72:
	return ingredient_catalog[hit[0]]
	return None


	# ─────────────────────────────────────────────────────────────────────────────
	# FUNCTION 2 — recipe retrieval (now also returns query string + scores)
	# ─────────────────────────────────────────────────────────────────────────────
	def _parse_dietary(raw) -> list[str]:
	if isinstance(raw, list):
	return [str(x).lower() for x in raw]
	try:
	return [str(x).lower() for x in json.loads(raw)]
	except Exception:
	return [str(raw).lower()]


	def _stringify(val) -> str:
	if isinstance(val, list):
	return ", ".join(str(x) for x in val)
	try:
	return ", ".join(str(x) for x in json.loads(val))
	except Exception:
	return str(val) if pd.notna(val) else ""


	def _choice_values_from_columns(frame: pd.DataFrame, columns: list[str], limit: int = 40) -> list[str]:
	values: set[str] = set()
	for col in columns:
	for raw in frame[col].dropna().head(20000):
	text = _stringify(raw) if "_list" in col else str(raw)
	for item in text.split(","):
	item = item.strip()
	if item and item.lower() not in {"nan", "none", "[]"}:
	values.add(item)
	return ["any"] + sorted(values)[:limit]


	DISH_TYPE_CHOICES = _choice_values_from_columns(df, DISH_TYPE_COLS)


	def _contains_choice(raw, choice: str) -> bool:
	if choice == "any":
	return True
	return choice.lower() in _stringify(raw).lower()


	def _text_blob(row: dict) -> str:
	parts = [
	row.get("recipe_title", ""),
	row.get(INGR_COL, ""),
	row.get("ingredients_text_processed", ""),
	row.get("directions_text", ""),
	row.get("description", ""),
	row.get("category", ""),
	row.get("subcategory", ""),
	row.get("course", ""),
	row.get("course_list", ""),
	]
	return " ".join(_stringify(p).lower() for p in parts if p is not None)


	def _ingredient_overlap(query_terms: list[str], row: dict) -> float:
	terms = [t.lower().strip() for t in query_terms if t and t.strip()]
	if not terms:
	return 0.0
	blob = _text_blob(row)
	return sum(1 for term in terms if term in blob) / len(terms)


	def _has_dish_image(row: dict) -> float:
	path = row.get("dish_image_path") or row.get("image_path") or ""
	return 1.0 if path and Path(path).exists() else 0.0


	class MLPReranker(torch.nn.Module):
	"""Small deterministic MLP over retrieval/filter features."""

	def __init__(self):
	super().__init__()
	self.net = torch.nn.Sequential(
	torch.nn.Linear(7, 8),
	torch.nn.ReLU(),
	torch.nn.Linear(8, 1),
	)
	self._init_reasonable_weights()

	def _init_reasonable_weights(self) -> None:
	with torch.no_grad():
	first: torch.nn.Linear = self.net[0] # type: ignore[assignment]
	second: torch.nn.Linear = self.net[2] # type: ignore[assignment]
	first.weight.zero_()
	first.bias.zero_()
	for i in range(7):
	first.weight[i, i] = 1.0
	first.weight[7] = torch.tensor([0.8, 1.0, 0.5, 0.35, 0.25, 0.45, 0.2])
	second.weight[:] = torch.tensor([[1.5, 1.2, 0.7, 0.5, 0.35, 0.75, 0.25, 1.0]])
	second.bias.zero_()

	@torch.no_grad()
	def score(self, features: list[list[float]]) -> list[float]:
	if not features:
	return []
	tensor = torch.tensor(features, dtype=torch.float32)
	return self.net(tensor).squeeze(-1).tolist()


	reranker = MLPReranker()


	def rerank_recipes(
	cands: pd.DataFrame,
	ingredients: list[str],
	dietary_filter: str,
	speed_filter: str,
	dish_type_filter: str,
	) -> pd.DataFrame:
	rows = cands.to_dict(orient="records")
	features: list[list[float]] = []
	for row in rows:
	features.append([
	float(row.get("_score", 0.0)),
	_ingredient_overlap(ingredients, row),
	1.0 if dietary_filter == "any" or _contains_choice(row.get(DIETARY_COL, ""), dietary_filter) else 0.0,
	1.0 if speed_filter == "any" or str(row.get("cook_speed", "")).lower() == speed_filter.lower() else 0.0,
	1.0 if dish_type_filter == "any" or any(_contains_choice(row.get(col, ""), dish_type_filter) for col in DISH_TYPE_COLS) else 0.0,
	1.0 if any(term.lower() in str(row.get("recipe_title", "")).lower() for term in ingredients) else 0.0,
	_has_dish_image(row),
	])
	ranked = cands.copy()
	ranked["_rerank_score"] = reranker.score(features)
	return ranked.sort_values("_rerank_score", ascending=False)


	def retrieve_recipes(
	ingredients: list[str],
	dietary_filter: str = "any",
	speed_filter: str = "any",
	dish_type_filter: str = "any",
	k: int = 5,
	) -> tuple[list[dict], str, list[float]]:
	"""Returns (recipe_dicts, query_text, reranker_scores)."""
	query = "ingredients: " + ", ".join(ingredients)
	emb = embedding_model.encode([query], normalize_embeddings=True).astype("float32")

	dists, idxs = faiss_index.search(emb, 50)
	cands = df.iloc[idxs[0]].copy()
	cands["_score"] = dists[0]

	if dietary_filter != "any":
	mask = cands[DIETARY_COL].apply(lambda v: dietary_filter.lower() in _parse_dietary(v))
	cands = cands[mask]

	if speed_filter != "any" and "cook_speed" in cands.columns:
	cands = cands[cands["cook_speed"].str.lower() == speed_filter.lower()]

	if dish_type_filter != "any" and DISH_TYPE_COLS:
	mask = cands.apply(
	lambda row: any(_contains_choice(row.get(col, ""), dish_type_filter) for col in DISH_TYPE_COLS),
	axis=1,
	)
	cands = cands[mask]

	ranked = rerank_recipes(cands, ingredients, dietary_filter, speed_filter, dish_type_filter)
	top = ranked.head(k)
	scores = top["_rerank_score"].tolist()
	return top.to_dict(orient="records"), query, scores


	# ─────────────────────────────────────────────────────────────────────────────
	# FUNCTION 3 — streaming LLM narration (lazy LLM)
	# ─────────────────────────────────────────────────────────────────────────────
	def _narration_prompt(row: dict) -> str:
	title = row.get("recipe_title", "Unknown recipe")
	ingr = row.get(INGR_COL) or row.get("ingredients_text_processed", "")
	# ingredient_text is space-separated in this dataset; convert for readability
	ingr = ingr.replace(" ", ", ") if " " in ingr and "," not in ingr else ingr
	dirs = row.get("directions_text", "")[:800]
	dietary = _stringify(row.get(DIETARY_COL) or row.get("dietary_profile_updated", ""))
	return (
	"<\|system\|>\n"
	"You are a helpful cooking assistant. Narrate recipes clearly and engagingly.\n</s>\n"
	"<\|user\|>\n"
	"Please narrate this recipe in a friendly way:\n"
	f"Title: {title}\nIngredients: {ingr}\nInstructions: {dirs}\nDietary: {dietary}\n</s>\n"
	"<\|assistant\|>\n"
	)


	def build_recipe_detail_md(row: dict \| None) -> str:
	if not row:
	return "Select a recipe to see ingredients and procedure."
	title = row.get("recipe_title", "Recipe")
	ingredients = row.get(INGR_COL) or row.get("ingredients_text_processed", "")
	ingredients = ingredients.replace(" ", ", ") if " " in ingredients and "," not in ingredients else ingredients
	directions = row.get("directions_text", "") or row.get("directions", "")
	cuisine = _stringify(row.get(CUISINE_COL, ""))
	dietary = _stringify(row.get(DIETARY_COL, ""))
	speed = row.get("cook_speed", "")
	meta = " · ".join(str(x) for x in [cuisine, dietary, speed] if str(x).strip())
	return (
	f"### {title}\n\n"
	f"{meta}\n\n"
	f"Ingredients\n\n{ingredients or 'Not available'}\n\n"
	f"Procedure\n\n{directions or 'Not available'}"
	)


	def generate_recipe(recipe_row: dict \| None):
	"""Generator — streams growing narration string; shows gr.Info on first LLM load."""
	if not recipe_row:
	yield "Select a recipe from the table above, then click 'Narrate'."
	return
	if not _llm_loaded():
	gr.Info("Loading language model for the first time (~25 s) — please wait…")
	model = get_llm()
	accumulated = ""
	for chunk in model(_narration_prompt(recipe_row), max_tokens=512, temperature=0.7, stream=True):
	accumulated += chunk["choices"][0]["text"]
	yield accumulated


	# ─────────────────────────────────────────────────────────────────────────────
	# FUNCTION 4 — chat about the active recipe (lazy LLM)
	# ─────────────────────────────────────────────────────────────────────────────
	def chat_about_recipe(
	message: str,
	history: list[list[str \| None]],
	recipe_state: dict \| None,
	) -> tuple[list, str]:
	if not message.strip():
	return history, ""
	if recipe_state:
	title = recipe_state.get("recipe_title", "a recipe")
	ingr = recipe_state.get(INGR_COL, "")
	sys_msg = (
	f"The user is asking about '{title}'.\nIngredients: {ingr}\n"
	"Answer only questions related to this recipe."
	)
	else:
	sys_msg = "You are a helpful cooking assistant."

	if not _llm_loaded():
	gr.Info("Loading language model for the first time (~25 s) — please wait…")
	model = get_llm()
	prompt = (
	f"<\|system\|>\n{sys_msg}\n</s>\n"
	f"<\|user\|>\n{message}\n</s>\n"
	"<\|assistant\|>\n"
	)
	reply = model(prompt, max_tokens=300, temperature=0.7, stream=False)["choices"][0]["text"].strip()
	return history + [[message, reply]], ""


	# ─────────────────────────────────────────────────────────────────────────────
	# FIX — ingredient HTML panel (image card OR coloured text badge)
	# ─────────────────────────────────────────────────────────────────────────────
	def _img_to_b64(path: str) -> str \| None:
	"""Encode a local image as a base64 data-URI for inline HTML embedding."""
	try:
	ext = Path(path).suffix.lstrip(".").lower()
	mime = "image/jpeg" if ext in ("jpg", "jpeg") else f"image/{ext}"
	with open(path, "rb") as fh:
	b64 = base64.b64encode(fh.read()).decode()
	return f"data:{mime};base64,{b64}"
	except Exception:
	return None


	def build_ingredient_html(top_ingr: list[tuple[str, float]]) -> str:
	"""
	Returns an HTML string for gr.HTML.
	- Ingredient WITH catalog image → thumbnail card (base64 inline src).
	- Ingredient WITHOUT image → coloured text badge (no grey placeholder).
	"""
	cards: list[str] = []
	for i, (name, conf) in enumerate(top_ingr):
	pct = f"{conf * 100:.1f}%"
	color = _BADGE_COLORS[i % len(_BADGE_COLORS)]
	path = get_ingredient_image(name)
	src = _img_to_b64(path) if path and Path(path).exists() else None

	if src:
	cards.append(
	f'<div style="text-align:center;margin:6px;width:110px">'
	f'<img src="{src}" style="width:100px;height:100px;'
	f'object-fit:cover;border-radius:10px;border:1px solid #ddd">'
	f'<div style="font-size:12px;margin-top:3px;color:#333">{name}</div>'
	f'<div style="font-size:11px;color:#888">{pct}</div>'
	f'</div>'
	)
	else:
	# Coloured badge — no grey rectangle
	cards.append(
	f'<div style="text-align:center;margin:6px;width:110px;'
	f'display:flex;flex-direction:column;align-items:center;justify-content:center">'
	f'<span style="background:{color};padding:6px 12px;border-radius:14px;'
	f'font-size:13px;font-weight:500;display:inline-block">🥬 {name}</span>'
	f'<div style="font-size:11px;color:#888;margin-top:4px">{pct}</div>'
	f'</div>'
	)

	return (
	'<div style="display:flex;flex-wrap:wrap;gap:4px;'
	'padding:8px;min-height:60px;align-items:flex-start">'
	+ "".join(cards)
	+ "</div>"
	)


	# ─────────────────────────────────────────────────────────────────────────────
	# DISH GALLERY
	# ─────────────────────────────────────────────────────────────────────────────
	def build_dish_gallery(recipes: list[dict]) -> list[tuple[Image.Image, str]]:
	items: list[tuple[Image.Image, str]] = []
	for row in recipes:
	path = row.get("dish_image_path") or row.get("image_path") or ""
	if path and Path(path).exists():
	try:
	img = Image.open(path).convert("RGB").resize((300, 200))
	except Exception:
	img = _GREY
	else:
	img = _GREY
	items.append((img, row.get("recipe_title", "Recipe")))
	return items


	# ─────────────────────────────────────────────────────────────────────────────
	# OPTIMISATION 3 — TWO-PHASE SEARCH HANDLER
	# Phase 1 (this function, <3 s): CNN + FAISS → panels A, B, debug
	# Phase 2 (narrate_btn click, ~30 s): LLM narration on demand
	# ─────────────────────────────────────────────────────────────────────────────
	def find_recipes(
	image: Image.Image \| None,
	text_query: str,
	dietary: str,
	speed: str,
	dish_type: str,
	progress=gr.Progress(),
	):
	"""
	Outputs (8):
	search_status, ingr_html, dish_gallery, recipe_df,
	recipe_detail, recipe_state, results_state, pipeline_debug
	"""
	t_total = time.perf_counter()

	if image is None and not (text_query or "").strip():
	raise gr.Error("Please upload a photo or type ingredient names.")

	# OPTIMISATION 5 — debug dict filled throughout this function
	debug: dict = {
	"models": {
	"cnn": f"EfficientNet-B0 ({NUM_CLASSES} classes)",
	"embed": f"{_EMBED_SHORT} (cosine)",
	"reranker": "MLP reranker over FAISS score + overlap + filters + image signal",
	"llm": "TinyLlama-1.1B-Chat Q4_K_M (lazy — loads on Narrate)",
	},
	"query": "",
	"reranker_scores": {},
	"timing_ms": {},
	}

	# ── Phase 1a: classify image or parse text ────────────────────────────────
	top_ingr: list[tuple[str, float]]

	if image is not None:
	if not _cnn_loaded():
	gr.Info("Loading ingredient classifier for the first time (~15 s)…")
	progress(0.15, desc="Running ingredient classifier…")
	t0 = time.perf_counter()
	top_ingr = classify_ingredients(image)
	debug["timing_ms"]["cnn_ms"] = round((time.perf_counter() - t0) * 1000)
	names = [n for n, _ in top_ingr[:5]]
	else:
	names = [s.strip() for s in text_query.split(",") if s.strip()]
	top_ingr = [(n, 1.0) for n in names[:10]]
	debug["timing_ms"]["cnn_ms"] = 0 # not used for text input

	if not names:
	raise gr.Error("Could not extract any ingredient names from the input.")

	# ── Phase 1b: embed + FAISS retrieval ────────────────────────────────────
	progress(0.45, desc="Searching 64k recipes…")
	t0 = time.perf_counter()
	recipes, query_text, scores = retrieve_recipes(names, dietary, speed, dish_type)
	debug["timing_ms"]["faiss_ms"] = round((time.perf_counter() - t0) * 1000)
	debug["query"] = query_text
	debug["reranker_scores"] = {
	r.get("recipe_title", f"recipe_{i}"): round(float(s), 4)
	for i, (r, s) in enumerate(zip(recipes, scores))
	}

	if not recipes:
	raise gr.Error(
	"No recipes matched those filters. "
	"Try setting Dietary and/or Cook speed to 'any'."
	)

	# ── Phase 1c: build result panels ────────────────────────────────────────
	progress(0.75, desc="Building result panels…")
	t0 = time.perf_counter()

	ingr_html_str = build_ingredient_html(top_ingr)
	dish_gal = build_dish_gallery(recipes)

	display = [
	{
	"Title": r.get("recipe_title", ""),
	"Cuisine": _stringify(r.get(CUISINE_COL, "")),
	"Type": _stringify(r.get("course_list", r.get("course", r.get("category", "")))),
	"Speed": r.get("cook_speed", ""),
	"Dietary": _stringify(r.get(DIETARY_COL, "")),
	}
	for r in recipes
	]
	recipe_df_data = pd.DataFrame(display)
	recipe_detail = build_recipe_detail_md(recipes[0])

	debug["timing_ms"]["render_ms"] = round((time.perf_counter() - t0) * 1000)
	debug["timing_ms"]["phase1_total_ms"] = round((time.perf_counter() - t_total) * 1000)

	elapsed_s = debug["timing_ms"]["phase1_total_ms"] / 1000
	faiss_s = debug["timing_ms"]["faiss_ms"] / 1000
	status = (
	f"Phase 1 complete — found {len(recipes)} recipes "
	f"(FAISS {faiss_s:.2f}s · total {elapsed_s:.2f}s) "
	f"\| Click a row or dish image to select, then press Narrate for AI narration."
	)

	progress(1.0, desc="Phase 1 done ✅")
	return (
	status,
	ingr_html_str,
	dish_gal,
	recipe_df_data,
	recipe_detail,
	recipes[0],
	recipes,
	debug,
	)


	# ─────────────────────────────────────────────────────────────────────────────
	# SELECTION HANDLERS
	# ─────────────────────────────────────────────────────────────────────────────
	def select_from_df(evt: gr.SelectData, results: list[dict]) -> tuple[dict, str, str]:
	if not results:
	return None, "", ""
	row_idx = evt.index[0] if isinstance(evt.index, (list, tuple)) else 0
	row = results[min(row_idx, len(results) - 1)]
	return row, f"Selected: {row.get('recipe_title', 'Recipe')}", build_recipe_detail_md(row)


	def select_from_gallery(evt: gr.SelectData, results: list[dict]) -> tuple[dict, str, str]:
	if not results:
	return None, "", ""
	idx = min(int(evt.index), len(results) - 1)
	row = results[idx]
	return row, f"Selected: {row.get('recipe_title', 'Recipe')}", build_recipe_detail_md(row)


	# ─────────────────────────────────────────────────────────────────────────────
	# PIPELINE DIAGRAM — Tab 2
	# ─────────────────────────────────────────────────────────────────────────────
	PIPELINE_MD = """\
	## How the pipeline works

	```
	┌──────────────────────────────────────────────────────────┐
	│ USER INPUT │
	│ Photo ──OR── Text query ──OR── Ingredient list │
	└──────────────┬───────────────────────────────────────────┘
	│
	┌────────▼──────────────────────────────────────────┐
	│ EfficientNet-B0 (lazy — loads on first photo) │
	│ image → top-10 ingredient predictions │
	│ Fruits-360 + Recipe Ingredients Dataset ~150 cls │
	└────────┬──────────────────────────────────────────┘
	│ ingredient name list
	┌────────▼──────────────────────────────────────────┐
	│ multilingual-MiniLM-L12-v2 · 384-dim │
	│ "ingredients: tomato, onion, …" → float32 vec │
	└────────┬──────────────────────────────────────────┘
	│
	┌────────▼──────────────────────────────────────────┐
	│ FAISS IndexFlatIP · 64k recipes │
	│ top-50 → filters: diet + speed + dish type │
	└────────┬──────────────────────────────────────────┘
	│
	┌────────▼──────────────────────────────────────────┐
	│ MLP reranker │
	│ FAISS score + ingredient overlap + filter match │
	└────────┬──────────────────────────────────────────┘
	│ ← PHASE 1 COMPLETE (< 3 s)
	┌────────▼──────────────────────────────────────────┐
	│ Top-5 recipe cards │
	│ (title · cuisine · dietary tags · cook speed) │
	└────────┬──────────────────────────────────────────┘
	│ user clicks "Narrate" ← PHASE 2
	┌────────▼──────────────────────────────────────────┐
	│ TinyLlama-1.1B-Chat Q4_K_M (lazy — ~25 s load)│
	│ Streams friendly narration · ~30 s on CPU │
	└────────┬──────────────────────────────────────────┘
	│ user types in chat
	┌────────▼──────────────────────────────────────────┐
	│ Chat mode: recipe injected as system context │
	└───────────────────────────────────────────────────┘
	```

	### Lazy loading strategy

	\| Component \| Loads at \| Approx. time \|
	\|---\|---\|---\|
	\| FAISS index + dataframe \| App startup \| ~2 s \|
	\| SentenceTransformer \| App startup \| ~3 s \|
	\| EfficientNet-B0 \| First photo upload \| ~10 s (once) \|
	\| TinyLlama GGUF \| First "Narrate" or Chat \| ~25 s (once) \|

	After first load each model is cached in-process for all subsequent requests.

	### Per-stage latency (free-tier CPU, post-load)

	\| Step \| Time \|
	\|---\|---\|
	\| CNN classification \| < 1 s \|
	\| MiniLM embedding \| < 0.5 s \|
	\| FAISS top-50 search + filters + MLP rerank \| < 1.5 s \|
	\| Phase 1 total \| < 3 s \|
	\| LLM narration (512 tokens) \| 25–40 s \|
	\| Chat reply (300 tokens) \| 15–25 s \|
	"""


	# ─────────────────────────────────────────────────────────────────────────────
	# UI
	# ─────────────────────────────────────────────────────────────────────────────
	with gr.Blocks(title="Recipe Recommender (optimised)", theme=gr.themes.Soft()) as demo:

	gr.Markdown("# 🍳 Recipe Recommender — Multimodal AI Demo")
	gr.Markdown(
	"FAISS index and embedding model ready ✅ "
	"\| CNN and LLM load on first use (once only, then cached)."
	)

	# Shared state
	recipe_state = gr.State(None) # currently selected recipe dict
	results_state = gr.State([]) # all retrieved recipe dicts

	with gr.Tabs():

	# ── TAB 1 — Find recipes ───────────────────────────────────────────────
	with gr.Tab("Find recipes"):
	with gr.Row(equal_height=False):

	# ── LEFT COLUMN: inputs + examples ────────────────────────────
	with gr.Column(scale=1, min_width=300):
	img_input = gr.Image(
	label="Photo of your ingredient (optional)",
	type="pil",
	height=220,
	)
	text_input = gr.Textbox(
	label="Or describe ingredients / craving",
	placeholder="tomato, onion, garlic, basil or quick vegan pasta…",
	lines=2,
	)
	dietary_dd = gr.Dropdown(
	label="Dietary preference",
	choices=DIETARY_CHOICES,
	value="any",
	)
	speed_dd = gr.Dropdown(
	label="Cook speed",
	choices=SPEED_CHOICES,
	value="any",
	)
	dish_type_dd = gr.Dropdown(
	label="Dish type",
	choices=DISH_TYPE_CHOICES,
	value="any",
	)
	find_btn = gr.Button("Find Recipes 🔍", variant="primary", size="lg")

	# OPTIMISATION 4 — pre-loaded text examples
	gr.Examples(
	examples=[
	["tomato, mozzarella, basil", "vegetarian", "any", "any"],
	["chicken, garlic, lemon", "any", "medium", "any"],
	["oats, banana, honey", "vegan", "any", "any"],
	["pasta, eggs, bacon, parmesan", "any", "medium", "any"],
	["black beans, corn, avocado", "vegan", "any", "any"],
	],
	inputs=[text_input, dietary_dd, speed_dd, dish_type_dd],
	label="Try an example",
	examples_per_page=5,
	cache_examples=False,
	)

	# ── RIGHT COLUMN: results ──────────────────────────────────────
	with gr.Column(scale=2):

	search_status = gr.Markdown(
	"Upload a photo or type ingredients, then click Find Recipes."
	)

	# Panel A — detected ingredients (HTML: thumbnail OR coloured badge)
	with gr.Accordion("Detected ingredients", open=True):
	ingr_html = gr.HTML(
	value='<p style="color:#aaa;padding:8px;font-size:13px">—</p>'
	)

	# Panel B — top recipes (Phase 1 output)
	with gr.Accordion("Top recipes", open=True):
	dish_gallery = gr.Gallery(
	label="Dish images — click to select a recipe",
	columns=5,
	height=190,
	object_fit="cover",
	show_label=True,
	allow_preview=False,
	)
	recipe_df = gr.Dataframe(
	headers=["Title", "Cuisine", "Type", "Speed", "Dietary"],
	interactive=False,
	wrap=True,
	row_count=(5, "fixed"),
	)

	# Panel C — selected recipe details + LLM narration
	with gr.Accordion(
	"Recipe procedure and ingredients",
	open=True,
	):
	recipe_detail_md = gr.Markdown(
	"Select a recipe to see ingredients and procedure."
	)
	narrate_btn = gr.Button(
	"Narrate selected recipe ▶", variant="secondary"
	)
	narration_box = gr.Textbox(
	lines=12,
	interactive=False,
	placeholder=(
	"Select a recipe in the table above, "
	"then click 'Narrate selected recipe'…"
	),
	show_copy_button=True,
	label="",
	)

	# Panel D — chat about active recipe
	with gr.Accordion(
	"Chat about this recipe [TinyLlama · ~20 s per reply]",
	open=True,
	):
	chatbot = gr.Chatbot(height=300, bubble_full_width=False)
	with gr.Row():
	chat_input = gr.Textbox(
	placeholder="Ask me anything about this recipe…",
	show_label=False,
	scale=5,
	)
	chat_btn = gr.Button("Send ↩", scale=1, variant="primary")
	clear_btn = gr.Button("Clear chat", size="sm")

	# OPTIMISATION 5 — Pipeline transparency panel
	with gr.Accordion("Pipeline transparency", open=False):
	gr.Markdown(
	"_Query embedding text, MLP reranker scores, "
	"and per-stage timing for the last request._"
	)
	pipeline_debug_json = gr.JSON(label="", value={})

	# ── TAB 2 — How it works ───────────────────────────────────────────────
	with gr.Tab("How it works"):
	gr.Markdown(PIPELINE_MD)

	# ── EVENT HANDLERS ────────────────────────────────────────────────────────

	# Phase 1 search — 7 outputs (added ingr_html, pipeline_debug)
	find_btn.click(
	fn=find_recipes,
	inputs=[img_input, text_input, dietary_dd, speed_dd, dish_type_dd],
	outputs=[
	search_status,
	ingr_html,
	dish_gallery,
	recipe_df,
	recipe_detail_md,
	recipe_state,
	results_state,
	pipeline_debug_json,
	],
	)

	# Select recipe via dataframe row click
	recipe_df.select(
	fn=select_from_df,
	inputs=[results_state],
	outputs=[recipe_state, search_status, recipe_detail_md],
	)

	# Select recipe via dish gallery click
	dish_gallery.select(
	fn=select_from_gallery,
	inputs=[results_state],
	outputs=[recipe_state, search_status, recipe_detail_md],
	)

	# Phase 2 — streaming narration (lazy LLM)
	narrate_btn.click(
	fn=generate_recipe,
	inputs=[recipe_state],
	outputs=[narration_box],
	)

	# Chat — button or Enter key
	chat_btn.click(
	fn=chat_about_recipe,
	inputs=[chat_input, chatbot, recipe_state],
	outputs=[chatbot, chat_input],
	)
	chat_input.submit(
	fn=chat_about_recipe,
	inputs=[chat_input, chatbot, recipe_state],
	outputs=[chatbot, chat_input],
	)

	clear_btn.click(fn=lambda: ([], ""), outputs=[chatbot, chat_input])

	# ─────────────────────────────────────────────────────────────────────────────
	# LAUNCH
	# ─────────────────────────────────────────────────────────────────────────────
	demo.queue(max_size=3)
	demo.launch()