Spaces:

blackWizard
/

home-kitchen-admin

Running

Nguyen Minh Nhat

After-Shift Admin Assistant

11b9749 16 days ago

9.13 kB

	"""LLM extraction: messy voice-note text -> structured order records.

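	Primary path is llama.cpp constrained by a GBNF grammar built from the JSON schema
	(see the llama_backend module), so its output is guaranteed to be valid JSON. If that
	backend is unavailable, or its reply cannot be parsed, we fall back to the unified
	Gemma 4 model (see gemma.py). Gemma's `transformers` path has no GBNF grammar, so
	instead of a hard guarantee we ask for pure JSON, parse it robustly (stripping code
	fences / surrounding prose), and retry once on failure. The editable confirm screen
	is the final safety net if a field still comes out wrong.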

	A single note may describe several customers, so the schema is a list of orders.
	"""

	from __future__ import annotations

	import json
	import re

	import gemma
	import llama_backend
	from config import GEMMA_MAX_NEW_TOKENS

	# Keys carried by every normalized order dict. The storage names are deliberately
	# generic so the DB schema stays stable; the inline notes give their food-order meaning.
	JOB_FIELDS = (
	    "customer",
	    "services",          # items ordered
	    "amount_charged",
	    "amount_paid",
	    "payment_method",
	    "next_appointment",  # pickup/delivery
	    "supplies",          # ingredients to buy
	    "notes",
	)

	# JSON schema -> GBNF grammar.
	#
	# Schema of a single order. Every field is listed under "required" so no key can go
	# missing; the prompt asks the model to use 0 for unknown numbers, "" for unknown
	# strings and [] for empty lists. payment_method is an enum so it cannot be free-typed.
	_ORDER_SCHEMA = {
	    "type": "object",
	    "properties": {
	        "customer": {"type": "string"},
	        "services": {"type": "array", "items": {"type": "string"}},
	        "amount_charged": {"type": "number"},
	        "amount_paid": {"type": "number"},
	        "payment_method": {"type": "string", "enum": ["cash", "card", "transfer", ""]},
	        "next_appointment": {"type": "string"},
	        "supplies": {"type": "array", "items": {"type": "string"}},
	        "notes": {"type": "string"},
	    },
	    "required": [*JOB_FIELDS],
	}

	# Top-level reply: an object whose only (required) key, "jobs", is a list of orders.
	EXTRACTION_SCHEMA = {
	    "type": "object",
	    "properties": {
	        "jobs": {"type": "array", "items": _ORDER_SCHEMA},
	    },
	    "required": ["jobs"],
	}

	# System prompt for the extraction chat. It maps the generic JSON keys onto their
	# food-order meaning, shows how to split a spoken price into amount_charged /
	# amount_paid, and fixes the placeholder values for unknown fields (0, "", []).
	# This text is sent to the model verbatim, so edit it with care.
	_SYSTEM = """You convert a home-based food maker's messy spoken voice note into structured ORDER records (custom cakes, party trays, festive treats, catering).

	The JSON keys are generic; fill them with food-order meaning:
	- customer = who the order is for.
	- services = the ITEMS ordered, each as a short string with quantity (e.g. "2 dozen pineapple tarts").
	- amount_charged = the TOTAL price of the order.
	- amount_paid = how much they've paid so far (a deposit, or the full amount).
	• "80, paid 20 deposit" -> amount_charged 80, amount_paid 20.
	• "45, paid already" / "paid cash 45" -> amount_charged 45, amount_paid 45.
	• "200, pay on delivery" -> amount_charged 200, amount_paid 0.
	- payment_method = exactly one of: cash, card, transfer, or "" if not said.
	- next_appointment = the PICKUP / DELIVERY time in her own words ("Saturday", "tomorrow evening").
	- supplies = INGREDIENTS she needs to buy for the order.
	- notes = short reminders that don't fit other fields.

	Rules:
	- A note may contain ONE or SEVERAL orders. Return one entry per order.
	- Unknown number -> 0. Unknown text -> "". Nothing to buy -> [].
	- Never invent data that isn't in the note.
	Return ONLY the JSON object."""

	# Few-shot examples: deposit+balance, paid-in-full, unpaid catering, multi-order.
	_FEWSHOT = [
	(
	"Mrs Tan ordered two dozen pineapple tarts and a kaya cake, eighty dollars "
	"total, she paid twenty deposit by transfer, picking up Saturday. I need "
	"more butter and pandan leaves.",
	{"jobs": [{
	"customer": "Mrs Tan",
	"services": ["2 dozen pineapple tarts", "Kaya cake"],
	"amount_charged": 80, "amount_paid": 20,
	"payment_method": "transfer", "next_appointment": "Saturday",
	"supplies": ["butter", "pandan leaves"], "notes": "",
	}]},
	),
	(
	"David wants a chocolate birthday cake for forty-five, paid cash already, "
	"collecting tomorrow evening.",
	{"jobs": [{
	"customer": "David",
	"services": ["Chocolate birthday cake"],
	"amount_charged": 45, "amount_paid": 45,
	"payment_method": "cash", "next_appointment": "tomorrow evening",
	"supplies": [], "notes": "",
	}]},
	),
	(
	"Catering for the Lim office party, fifty curry puffs and three trays of "
	"nasi lemak, two hundred dollars, they'll pay on delivery Friday. Order more "
	"chicken and curry powder.",
	{"jobs": [{
	"customer": "Lim office party",
	"services": ["50 curry puffs", "3 trays nasi lemak"],
	"amount_charged": 200, "amount_paid": 0,
	"payment_method": "", "next_appointment": "Friday",
	"supplies": ["chicken", "curry powder"], "notes": "",
	}]},
	),
	(
	"Auntie Siti picking up four dozen kueh lapis later, sixty dollars cash done. "
	"And Mr Goh ordered a durian cake for next Sunday, ninety, paid thirty deposit card.",
	{"jobs": [
	{"customer": "Auntie Siti", "services": ["4 dozen kueh lapis"],
	"amount_charged": 60, "amount_paid": 60, "payment_method": "cash",
	"next_appointment": "later today", "supplies": [], "notes": ""},
	{"customer": "Mr Goh", "services": ["Durian cake"],
	"amount_charged": 90, "amount_paid": 30, "payment_method": "card",
	"next_appointment": "next Sunday", "supplies": [], "notes": ""},
	]},
	),
	]

	def _build_messages(text: str) -> list[dict]:
	    """Assemble the chat for one extraction request.

	    Layout: the system prompt, then each few-shot example as a user turn followed
	    by an assistant turn holding the expected answer serialized as JSON, and
	    finally `text` as the last user turn.
	    """
	    conversation = [{"role": "system", "content": _SYSTEM}]
	    for note, expected in _FEWSHOT:
	        conversation.extend((
	            {"role": "user", "content": note},
	            # ensure_ascii=False keeps non-ASCII characters readable in the prompt.
	            {"role": "assistant", "content": json.dumps(expected, ensure_ascii=False)},
	        ))
	    conversation.append({"role": "user", "content": text})
	    return conversation


	def _to_float(x) -> float:
	try:
	return round(float(x), 2)
	except (TypeError, ValueError):
	return 0.0


	def _string_list(value) -> list[str]:
	    """Coerce a model-supplied list field to a list of non-empty, stripped strings."""
	    if value is None:
	        return []
	    if isinstance(value, str):
	        # A bare string is a single item; iterating it would yield characters.
	        value = [value]
	    elif not isinstance(value, (list, tuple)):
	        # Numbers, booleans, dicts, ...: not a usable list of items.
	        return []
	    # Skip JSON nulls so they do not turn into the literal text "None".
	    stripped = (str(item).strip() for item in value if item is not None)
	    return [item for item in stripped if item]


	def _normalize(job: dict) -> dict:
	    """Return a clean order dict with the eight expected keys, built from a raw model job.

	    - customer: stripped text; falls back to "Customer" when missing or blank.
	    - services / supplies: lists of non-empty stripped strings. A bare string is
	      treated as a one-item list, and any other non-list value as empty.
	    - amount_charged / amount_paid: converted with `_to_float`.
	    - payment_method: lower-cased; anything other than cash / card / transfer
	      becomes "".
	    - next_appointment / notes: stripped text, "" when missing.
	    """
	    method = str(job.get("payment_method") or "").strip().lower()
	    if method not in {"cash", "card", "transfer", ""}:
	        method = ""
	    return {
	        "customer": str(job.get("customer") or "Customer").strip() or "Customer",
	        "services": _string_list(job.get("services")),
	        "amount_charged": _to_float(job.get("amount_charged")),
	        "amount_paid": _to_float(job.get("amount_paid")),
	        "payment_method": method,
	        "next_appointment": str(job.get("next_appointment") or "").strip(),
	        "supplies": _string_list(job.get("supplies")),
	        "notes": str(job.get("notes") or "").strip(),
	    }


	def _parse_jobs(content: str) -> list[dict] \| None:
	"""Pull the jobs list out of a model reply. Tolerates ```json fences and prose
	around the object. Returns None if no valid JSON object is found."""
	if not content:
	return None
	# Strip code fences, then grab the outermost {...} block.
	cleaned = re.sub(r"^```(?:json)?\|```$", "", content.strip(), flags=re.MULTILINE).strip()
	start, end = cleaned.find("{"), cleaned.rfind("}")
	if start == -1 or end == -1 or end <= start:
	return None
	try:
	data = json.loads(cleaned[start:end + 1])
	except (json.JSONDecodeError, TypeError):
	return None
	jobs = data.get("jobs") if isinstance(data, dict) else None
	return jobs if isinstance(jobs, list) else None


	def extract(text: str) -> list[dict]:
	    """Turn a transcript into a list of normalized order dicts.

	    A missing or blank transcript yields [] without calling any model, and so
	    does a reply that contains no usable jobs, so the UI can show a friendly
	    message instead of an error.

	    Order of attempts:
	    1. llama.cpp constrained by the extraction schema (grammar-backed JSON).
	    2. Gemma via transformers, used when the llama backend is unavailable or
	       its reply has no parsable jobs list. With no grammar there, the reply is
	       parsed leniently and, if that fails, the model is asked once more for
	       JSON only.
	    """
	    transcript = (text or "").strip()
	    if not transcript:
	        return []

	    chat = _build_messages(transcript)

	    # --- Primary: llama.cpp + GBNF grammar ---
	    try:
	        reply = llama_backend.extract_json(chat, EXTRACTION_SCHEMA)
	    except llama_backend.BackendUnavailable:
	        parsed = None  # fall through to the transformers backend
	    else:
	        parsed = _parse_jobs(reply)
	    if parsed is not None:
	        return [_normalize(entry) for entry in parsed if isinstance(entry, dict)]

	    # --- Fallback: Gemma (transformers) ---
	    reply = gemma.generate_chat(chat, max_new_tokens=GEMMA_MAX_NEW_TOKENS)
	    parsed = _parse_jobs(reply)
	    if parsed is None:
	        # One corrective retry: show the model its own reply and ask for bare JSON.
	        retry_chat = [
	            *chat,
	            {"role": "assistant", "content": reply},
	            {"role": "user", "content": "Output ONLY the JSON object, no prose, no code fences."},
	        ]
	        reply = gemma.generate_chat(retry_chat, max_new_tokens=GEMMA_MAX_NEW_TOKENS)
	        parsed = _parse_jobs(reply)

	    return [_normalize(entry) for entry in (parsed or []) if isinstance(entry, dict)]