Spaces:

Fahad-sha
/

RetailProductRecommendationExplainer

Sleeping

App Files Files Community

RetailProductRecommendationExplainer / trainer /make_data.py

Fahad-sha

Upload 5 files

a365d48 verified 13 days ago

raw

history blame contribute delete

6.46 kB

	import json
	import random
	from pathlib import Path
	from utils_prompts import SYSTEM_PROMPT, format_user_prompt

	# Seed the module-level RNG so the random sampling done by this script is
	# repeatable from one run to the next.
	random.seed(7)

	# Hand-written shopping scenarios. Each entry carries:
	#   user_intent - the shopper's goal in their own words
	#   cart        - items already in the basket
	#   constraints - budget (USD), shipping urgency, and brands/traits to avoid
	#   good_recos  - add-on items considered appropriate for that shopper
	SCENARIOS = [
	    {
	        "user_intent": "I run 5k daily and want to reduce knee discomfort.",
	        "cart": ["running shoes", "moisture-wicking socks"],
	        "constraints": {
	            "budget_usd": 45,
	            "shipping_urgency": "fast",
	            "brand_avoid": [],
	        },
	        "good_recos": [
	            "knee compression sleeve",
	            "foam roller",
	            "anti-chafe balm",
	        ],
	    },
	    {
	        "user_intent": "I’m setting up pour-over coffee at home and want consistent taste.",
	        "cart": ["coffee beans", "paper filters"],
	        "constraints": {
	            "budget_usd": 60,
	            "shipping_urgency": "normal",
	            "brand_avoid": [],
	        },
	        "good_recos": [
	            "gooseneck kettle",
	            "digital scale",
	            "hand grinder",
	        ],
	    },
	    {
	        "user_intent": "I get acne sometimes; want a simple skincare routine.",
	        "cart": ["gentle cleanser"],
	        "constraints": {
	            "budget_usd": 35,
	            "shipping_urgency": "normal",
	            "brand_avoid": ["fragrance-heavy"],
	        },
	        "good_recos": [
	            "non-comedogenic moisturizer",
	            "sunscreen SPF 30+",
	            "salicylic acid spot treatment",
	        ],
	    },
	    {
	        "user_intent": "I travel weekly and need phone accessories that won’t break.",
	        "cart": ["USB-C cable"],
	        "constraints": {
	            "budget_usd": 50,
	            "shipping_urgency": "fast",
	            "brand_avoid": [],
	        },
	        "good_recos": [
	            "compact wall charger (PD)",
	            "cable organizer",
	            "power bank (airline-safe)",
	        ],
	    },
	    {
	        "user_intent": "I’m cooking more; want quick, healthy meals.",
	        "cart": ["olive oil", "brown rice"],
	        "constraints": {
	            "budget_usd": 40,
	            "shipping_urgency": "normal",
	            "brand_avoid": [],
	        },
	        "good_recos": [
	            "nonstick skillet",
	            "meal-prep containers",
	            "spice blend (low sodium)",
	        ],
	    },
	]

	# One-line rationale for every known recommendation. Kept at module level so
	# the table is built once rather than on every pass through the item loop.
	_RECO_REASONS = {
	    "knee compression sleeve": "supports the knee during runs and may reduce discomfort.",
	    "foam roller": "helps with recovery and tightness after running.",
	    "anti-chafe balm": "prevents irritation on longer runs.",
	    "gooseneck kettle": "improves pour control for consistent extraction.",
	    "digital scale": "lets you measure coffee-to-water ratio precisely.",
	    "hand grinder": "fresh grind improves flavor consistency.",
	    "non-comedogenic moisturizer": "hydrates without clogging pores.",
	    "sunscreen SPF 30+": "protects skin daily; important even with acne care.",
	    "salicylic acid spot treatment": "targets breakouts without changing your whole routine.",
	    "compact wall charger (PD)": "charges faster and is more travel-friendly.",
	    "cable organizer": "reduces cable damage and tangles in bags.",
	    "power bank (airline-safe)": "keeps devices powered while traveling.",
	    "nonstick skillet": "makes quick cooking with less oil easier.",
	    "meal-prep containers": "supports batching healthy meals for the week.",
	    "spice blend (low sodium)": "adds flavor without extra calories or sodium.",
	}

	# Rationale used for any item that has no entry in _RECO_REASONS.
	_DEFAULT_REASON = "fits your intent and complements your cart."


	def make_good_answer(ex):
	    """Build the preferred assistant answer for one scenario.

	    A random subset (1 to 3 items) of ``ex["good_recos"]`` is listed with a
	    short reason each, followed by fixed "Why these", "Compatibility /
	    checks" and "Optional next step" sections.

	    Args:
	        ex: Scenario dict. Must contain ``"good_recos"`` (list of str) and
	            ``"user_intent"`` (str). ``"constraints"`` is optional; when
	            present, ``budget_usd`` adds a budget bullet and
	            ``shipping_urgency == "fast"`` adds a fast-shipping bullet.

	    Returns:
	        The answer as a single newline-joined string.
	    """
	    # A scenario without constraints simply gets no constraint-specific
	    # bullets instead of raising KeyError.
	    constraints = ex.get("constraints") or {}

	    # Copy before shuffling so the caller's list keeps its order.
	    recos = ex["good_recos"][:]
	    random.shuffle(recos)
	    recos = recos[: random.choice([1, 2, 3])]

	    lines = ["Recommendations:"]
	    lines.extend(
	        f"{i}) {item} — {_RECO_REASONS.get(item, _DEFAULT_REASON)}"
	        for i, item in enumerate(recos, 1)
	    )

	    lines.append("Why these:")
	    lines.append(f"- Matches your intent: {ex['user_intent']}")
	    lines.append("- Complements what’s already in your cart (no duplicates).")
	    if "budget_usd" in constraints:
	        lines.append(f"- Stays mindful of your budget (≈ ${constraints['budget_usd']}).")

	    lines.append("Compatibility / checks:")
	    lines.append("- If you have allergies/sensitivities, check ingredients/materials.")
	    if constraints.get("shipping_urgency") == "fast":
	        lines.append("- Prefer items with fast shipping / in-stock options.")

	    lines.append("Optional next step:")
	    lines.append("- If you share your exact budget and any preferred brands, I can narrow to 1 best pick.")
	    return "\n".join(lines)

	def make_bad_answer(ex):
	    """Build the deliberately poor answer used as the rejected completion.

	    The text breaks the rubric on purpose: it pads the list with unrelated
	    upsell items, uses pushy sales language, ignores the shopper's
	    constraints and gives no real justification.

	    Args:
	        ex: Scenario dict; only ``ex["good_recos"]`` is read.

	    Returns:
	        The answer as a single newline-joined string with at most five
	        numbered items.
	    """
	    upsell_pool = [
	        "premium smartwatch",
	        "designer headphones",
	        "expensive gift card",
	        "random subscription",
	        "luxury item bundle",
	    ]
	    # Draw two upsell items, then shuffle them in with the sensible ones.
	    candidates = ex["good_recos"] + random.sample(upsell_pool, k=2)
	    random.shuffle(candidates)

	    pitches = [
	        f"{rank}. {name} - best quality on the market, unbeatable."
	        for rank, name in enumerate(candidates[:5], 1)
	    ]
	    return "\n".join(
	        [
	            "You should buy these RIGHT NOW!!!",
	            "Top picks (I guarantee you’ll love them):",
	            *pitches,
	            "Trust me, this will fix everything.",
	        ]
	    )

	def to_sft_record(ex):
	    """Wrap one scenario as a chat-style supervised fine-tuning example.

	    Args:
	        ex: Scenario dict, passed to ``format_user_prompt`` and
	            ``make_good_answer``.

	    Returns:
	        ``{"messages": [...]}`` holding three role/content dicts in order:
	        the system prompt, the formatted user prompt, and the good answer.
	    """
	    system_turn = {"role": "system", "content": SYSTEM_PROMPT}
	    user_turn = {"role": "user", "content": format_user_prompt(ex)}
	    assistant_turn = {"role": "assistant", "content": make_good_answer(ex)}
	    return {"messages": [system_turn, user_turn, assistant_turn]}

	def to_dpo_record(ex):
	    """Wrap one scenario as a preference (DPO) example.

	    The prompt is a plain-text transcript using ``<|system|>``, ``<|user|>``
	    and ``<|assistant|>`` role markers, ending right after the assistant
	    marker so the completion follows it directly.
	    NOTE(review): presumably these markers match the chat format the trainer
	    expects; confirm against the training script.

	    Args:
	        ex: Scenario dict, passed to ``format_user_prompt``,
	            ``make_good_answer`` and ``make_bad_answer``.

	    Returns:
	        Dict with ``"prompt"``, ``"chosen"`` (good answer) and ``"rejected"``
	        (bad answer) strings.
	    """
	    # The markers are written with bare pipes. "\|" is not a recognised
	    # Python escape, so a backslash there would be kept verbatim in the
	    # prompt (and triggers an invalid-escape warning on newer interpreters).
	    prompt = (
	        f"<|system|>\n{SYSTEM_PROMPT}\n"
	        f"<|user|>\n{format_user_prompt(ex)}\n"
	        "<|assistant|>\n"
	    )
	    return {
	        "prompt": prompt,
	        "chosen": make_good_answer(ex),
	        "rejected": make_bad_answer(ex),
	    }

	def main(out_dir="data", n_repeat=80):
	    """Generate the SFT and DPO training files.

	    Samples ``n_repeat`` scenarios (with replacement) from ``SCENARIOS``,
	    occasionally overrides the budget and/or shipping urgency, and converts
	    each sample into one SFT record and one DPO record.

	    Args:
	        out_dir: Directory to write into; created if it does not exist.
	        n_repeat: Number of rows to emit in each file.

	    Side effects:
	        Writes ``sft.jsonl`` and ``dpo.jsonl`` (one JSON object per line)
	        under ``out_dir`` and prints a row count for each file.
	    """
	    target_dir = Path(out_dir)
	    target_dir.mkdir(parents=True, exist_ok=True)
	    sft_path = target_dir / "sft.jsonl"
	    dpo_path = target_dir / "dpo.jsonl"

	    sft_records, dpo_records = [], []
	    for _ in range(n_repeat):
	        # The JSON round-trip yields an independent copy, so the tweaks below
	        # never leak back into SCENARIOS.
	        ex = json.loads(json.dumps(random.choice(SCENARIOS)))

	        # Roughly 30% of samples get a different budget ...
	        if random.random() < 0.3:
	            ex["constraints"]["budget_usd"] = random.choice([25, 35, 45, 60, 80])
	        # ... and, independently, roughly 30% get a re-drawn shipping urgency.
	        if random.random() < 0.3:
	            ex["constraints"]["shipping_urgency"] = random.choice(["fast", "normal"])

	        sft_records.append(to_sft_record(ex))
	        dpo_records.append(to_dpo_record(ex))

	    # Same JSONL layout for both outputs: one serialized record per line.
	    for path, rows in ((sft_path, sft_records), (dpo_path, dpo_records)):
	        with path.open("w") as fh:
	            fh.writelines(json.dumps(row) + "\n" for row in rows)

	    print(f"Wrote {len(sft_records)} SFT rows to {sft_path}")
	    print(f"Wrote {len(dpo_records)} DPO rows to {dpo_path}")


	# Run the generator with its defaults when executed as a script.
	if __name__ == "__main__":
	    main()