Spaces:

lspcloud
/

amazon_mturker

Sleeping

File size: 47,969 Bytes

"""
Streamlit App: AI Product Willingness User Study
=================================================
Run locally (single category):
    streamlit run src/streamlit_app.py -- --category groceries
    streamlit run src/streamlit_app.py -- --category groceries --debug

Run locally (mixed mode — movies + groceries):
    streamlit run src/streamlit_app.py -- --mode mixed
    streamlit run src/streamlit_app.py -- --mode mixed --debug

On HuggingFace Spaces, set these environment variables in Space Settings → Variables:
    HF_TOKEN           - HuggingFace token
    TINKER_API_KEY     - Tinker AI API key
    DATASET_REPO_ID    - HuggingFace dataset repo to upload results
    CATEGORY           - groceries | books | movies | health  (single-category mode)
    MODE               - mixed  (overrides CATEGORY; runs movies + groceries together)
    DEBUG_MODE         - "true" to skip validation (optional)
"""

import csv
import json
import os
import random
import re
import sys
import tempfile
import time
import uuid
from datetime import datetime
from pathlib import Path

import streamlit as st
from dotenv import load_dotenv
from filelock import FileLock
from huggingface_hub import HfApi

load_dotenv()

# ---------------------------------------------------------------------------
# CLI args
# ---------------------------------------------------------------------------
import argparse
# add_help=False: this parser does not register its own -h/--help option.
parser = argparse.ArgumentParser(add_help=False)
parser.add_argument("--category", choices=["books", "groceries", "movies", "health"], default=None)
parser.add_argument("--mode", choices=["mixed"], default=None)
parser.add_argument("--debug", action="store_true", default=False)
# parse_known_args() returns unrecognised arguments separately instead of
# failing on them; those leftovers are discarded here.
cli_args, _ = parser.parse_known_args()

# ---------------------------------------------------------------------------
# Config
# ---------------------------------------------------------------------------
# Environment variables take precedence over CLI flags for MODE and CATEGORY:
# the CLI value is used only when the env var is unset or empty.
# NOTE(review): the MODE env value is not validated here, so anything other
# than the exact string "mixed" behaves as single-category mode.
MODE = os.getenv("MODE") or cli_args.mode  # "mixed" or None
CATEGORY = os.getenv("CATEGORY") or cli_args.category or "groceries"  # used only in single-category mode
# Debug is on when DEBUG_MODE equals "true" (case-insensitive) or --debug is given.
DEBUG_MODE = os.getenv("DEBUG_MODE", "").lower() == "true" or cli_args.debug
# NOTE(review): the default repo id looks like a placeholder — confirm it is
# always overridden in deployment.
DATASET_REPO_ID = os.getenv("DATASET_REPO_ID", "your-username/product-study")
# HuggingFace uploads in this file are skipped when HF_TOKEN is unset.
HF_TOKEN = os.getenv("HF_TOKEN")

# NOTE(review): TINKER_API_KEY is not referenced by the code visible here;
# presumably the Tinker client reads it from the environment — confirm.
TINKER_API_KEY = os.getenv("TINKER_API_KEY")
MODEL_NAME = "openai/gpt-oss-20b"

# ---------------------------------------------------------------------------
# Mixed-mode constants
# ---------------------------------------------------------------------------
# In mixed mode these two categories are always used together
MIXED_CATEGORIES = ["movies", "groceries"]
# Each category contributes this many items to the shared pool of 100.
# The active subset size is also embedded in the cached file names built by
# _data_path(), so mixed and single-category runs use separate cache files.
MIXED_SUBSET_SIZE = 50   # 50 movies + 50 groceries = 100 total
SINGLE_SUBSET_SIZE = 100 # legacy single-category mode

# ---------------------------------------------------------------------------
# Prolific config
# ---------------------------------------------------------------------------
# The completion code appears both inside the URL (cc=...) and on its own;
# keep the two values in sync when the code changes.
PROLIFIC_COMPLETION_URL = "https://app.prolific.com/submissions/complete?cc=CYC7ALM1"
PROLIFIC_COMPLETION_CODE = "CYC7ALM1"

# Working directories live next to this source file and are created at import
# time if missing: data/ holds the cached datasets, counters and queues,
# annotations/ holds the saved per-worker submission JSON files.
BASE_DIR = os.path.dirname(os.path.abspath(__file__))
DATA_DIR = os.path.join(BASE_DIR, "data")
ANNOTATIONS_DIR = os.path.join(BASE_DIR, "annotations")
os.makedirs(DATA_DIR, exist_ok=True)
os.makedirs(ANNOTATIONS_DIR, exist_ok=True)

# Category key -> HuggingFace dataset repo id passed to load_dataset().
CATEGORY_TO_HF = {
    "books":     "ehejin/amazon_books",
    "groceries": "ehejin/amazon_Grocery_and_Gourmet_Food",
    "movies":    "ehejin/amazon_Movies_and_TV",
    "health":    "ehejin/amazon_Health_and_Household",
}
# Category key -> human-readable name shown in the UI.
CATEGORY_DISPLAY = {
    "books":     "Books",
    "groceries": "Grocery Products",
    "movies":    "Movies & TV",
    "health":    "Health & Household Products",
}
# Per-product familiarity label (depends on the individual product's category)
FAMILIARITY_USED_LABEL = {
    "books":     "Read it before",
    "movies":    "Watched it before",
    "groceries": "Used it before",
    "health":    "Used it before",
}

# Number of products assigned to each participant.
PRODUCTS_PER_USER = 5
# NOTE(review): MIN_TURNS / MAX_TURNS are not used in the code visible here;
# presumably they bound the chat length per product — confirm at the use site.
MIN_TURNS = 3
MAX_TURNS = 10

# Familiarity values that trigger a product swap
SWAP_FAMILIARITY = {"Purchased it before"}

# Canned demographics copied into the session state by the welcome screen when
# DEBUG_MODE is on, so the demographics form can be skipped.
DEBUG_DEMOGRAPHICS = {
    "age": "30", "gender": "Female", "geographic_region": "West",
    "education_level": "College graduate/some postgrad", "race": "White",
    "us_citizen": "Yes", "marital_status": "Single",
    "religion": "Agnostic", "religious_attendance": "Never",
    "political_affiliation": "Independent", "income": "$50,000-$75,000",
    "political_views": "Moderate", "household_size": "2",
    "employment_status": "Full-time employment",
}

# 7-point purchase-willingness scale: numeric score -> label.
WILLINGNESS_LABELS = {
    1: "Definitely would not buy",
    2: "Probably would not buy",
    3: "Slightly unlikely to buy",
    4: "Neutral",
    5: "Slightly likely to buy",
    6: "Probably would buy",
    7: "Definitely would buy",
}
# Choice strings in the form "<label> (<score>)", in ascending score order;
# parse_willingness() recovers the score from this format, and needs_swap()
# relies on the last entry being the top score.
WILLINGNESS_CHOICES = [f"{v} ({k})" for k, v in WILLINGNESS_LABELS.items()]


# ---------------------------------------------------------------------------
# Helpers: per-category file paths
# ---------------------------------------------------------------------------
def _data_path(category: str, suffix: str) -> str:
    """Build the path of a per-category file inside DATA_DIR.

    The file name is ``<category>_test<subset>_<suffix>``, where the subset
    size is MIXED_SUBSET_SIZE in mixed mode and SINGLE_SUBSET_SIZE otherwise.
    """
    if MODE == "mixed":
        pool_size = MIXED_SUBSET_SIZE
    else:
        pool_size = SINGLE_SUBSET_SIZE
    file_name = f"{category}_test{pool_size}_{suffix}"
    return os.path.join(DATA_DIR, file_name)


def local_data_path(category: str) -> str:
    """Return the path of the cached primary-pool JSON file for *category*."""
    file_suffix = "primary.json"
    return _data_path(category, file_suffix)

def overflow_path(category: str) -> str:
    """Return the path of the cached overflow-pool JSON file for *category*."""
    file_suffix = "overflow.json"
    return _data_path(category, file_suffix)

def counter_path(category: str) -> str:
    """Return the path of the assignment-counter text file for *category*."""
    file_suffix = "counter.txt"
    return _data_path(category, file_suffix)

def counter_lock_path(category: str) -> str:
    """Return the path of the lock file guarding *category*'s counter and queue."""
    file_suffix = "counter.lock"
    return _data_path(category, file_suffix)

def return_queue_path(category: str) -> str:
    """Return the path of the returned-products queue JSON file for *category*."""
    file_suffix = "return_queue.json"
    return _data_path(category, file_suffix)


# ---------------------------------------------------------------------------
# Dataset loading
# ---------------------------------------------------------------------------
@st.cache_resource
def download_and_cache_dataset(category: str, subset_size: int):
    """Fetch the test split for *category* and cache it as two JSON files.

    Does nothing when the primary cache file already exists. Otherwise every
    row of the test split becomes an item dict with a fresh UUID; the first
    *subset_size* items are written to the primary file and the remainder to
    the overflow file. Any failure is logged and re-raised.
    """
    primary_path = local_data_path(category)
    overflow_file = overflow_path(category)
    if os.path.exists(primary_path):
        print(f"[DATA] Found cached dataset for {category} at {primary_path}")
        return
    print(f"[DATA] Downloading {CATEGORY_TO_HF[category]} (test split, first {subset_size}) from HuggingFace...")
    try:
        from datasets import load_dataset
        import huggingface_hub
        if HF_TOKEN:
            huggingface_hub.login(token=HF_TOKEN)

        dataset = load_dataset(CATEGORY_TO_HF[category], split="test")

        def as_string_list(value):
            # Lists pass through, a non-empty string becomes a one-element
            # list, everything else becomes an empty list.
            if isinstance(value, list):
                return value
            if isinstance(value, str) and value:
                return [value]
            return []

        records = []
        for row in dataset:
            meta = row.get("metadata", {})
            if not isinstance(meta, dict):
                # Non-dict metadata is treated as missing, so every field
                # falls back to its default.
                meta = {}
            records.append({
                "id": str(uuid.uuid4()),
                "title": meta.get("title", ""),
                "description": as_string_list(meta.get("description", [])),
                "features": as_string_list(meta.get("features", [])),
                "price": meta.get("price", "N/A"),
                "category": category,
            })

        primary, overflow = records[:subset_size], records[subset_size:]

        for target, payload in ((primary_path, primary), (overflow_file, overflow)):
            with open(target, "w") as f:
                json.dump(payload, f, indent=2)

        print(f"[DATA] {category}: cached {len(primary)} primary + {len(overflow)} overflow items.")
    except Exception as e:
        print(f"[DATA] ERROR downloading {category}: {e}")
        raise


@st.cache_resource
def load_primary_dataset(category: str):
    """Load the cached primary item list for *category* from its JSON file."""
    primary_file = local_data_path(category)
    with open(primary_file, "r") as handle:
        primary_items = json.load(handle)
    return primary_items


@st.cache_resource
def load_overflow_dataset(category: str):
    """Load the cached overflow item list for *category*.

    Returns an empty list when the overflow file does not exist.
    """
    overflow_file = overflow_path(category)
    if os.path.exists(overflow_file):
        with open(overflow_file, "r") as handle:
            return json.load(handle)
    return []


def _ensure_datasets():
    """Make sure the dataset cache exists for every category the run needs.

    Mixed mode caches each of MIXED_CATEGORIES with MIXED_SUBSET_SIZE items;
    otherwise only CATEGORY is cached, with SINGLE_SUBSET_SIZE items.
    """
    if MODE != "mixed":
        download_and_cache_dataset(CATEGORY, SINGLE_SUBSET_SIZE)
        return
    for mixed_category in MIXED_CATEGORIES:
        download_and_cache_dataset(mixed_category, MIXED_SUBSET_SIZE)


# ---------------------------------------------------------------------------
# Per-category counter helpers
# ---------------------------------------------------------------------------
def _read_counter(category: str) -> int:
    """Return the stored assignment counter for *category*.

    A missing or blank counter file yields 0. Callers are expected to hold
    the category lock; this function does no locking itself.
    """
    counter_file = counter_path(category)
    if os.path.exists(counter_file):
        with open(counter_file, "r") as handle:
            stored = handle.read().strip()
        return int(stored or "0")
    return 0


def _write_counter(category: str, value: int):
    """Overwrite the counter file for *category* with *value* as text."""
    counter_file = counter_path(category)
    with open(counter_file, "w") as handle:
        handle.write(str(value))


def _read_return_queue(category: str) -> list:
    """Return the queue of returned products stored for *category*.

    A missing file, or a file whose contents cannot be loaded as JSON, is
    treated as an empty queue.
    """
    queue_file = return_queue_path(category)
    if os.path.exists(queue_file):
        with open(queue_file, "r") as handle:
            try:
                return json.load(handle)
            except Exception:
                # Best-effort: an unreadable queue is deliberately ignored.
                return []
    return []


def _write_return_queue(category: str, queue: list):
    """Overwrite the return-queue file for *category* with *queue* as JSON."""
    queue_file = return_queue_path(category)
    with open(queue_file, "w") as handle:
        json.dump(queue, handle)


# ---------------------------------------------------------------------------
# Product assignment
# ---------------------------------------------------------------------------
def _assign_from_category(category: str, n: int) -> list:
    """Hand out *n* products from one category's pool under its file lock.

    For each slot a product waiting in the return queue is used first
    (oldest first); otherwise the next primary item is taken and the counter
    advances. The primary index is the counter modulo the pool size, so
    assignment cycles through the pool once it has been exhausted. The
    updated queue and counter are written back before the lock is released.
    """
    pool = load_primary_dataset(category)
    pool_size = len(pool)

    with FileLock(counter_lock_path(category)):
        pending_returns = _read_return_queue(category)
        next_index = _read_counter(category)
        picked = []

        for _ in range(n):
            if not pending_returns:
                # Nothing returned: take the next primary item, wrapping around.
                picked.append(pool[next_index % pool_size])
                next_index += 1
                continue
            picked.append(pending_returns.pop(0))

        _write_return_queue(category, pending_returns)
        _write_counter(category, next_index)

    return picked


def assign_mixed_products(n: int = PRODUCTS_PER_USER) -> list:
    """
    Assign n products split across movies and groceries.
    Alternates the majority category each call so coverage stays balanced.

    With n = 5:
    Call 1: 3 movies + 2 groceries
    Call 2: 2 movies + 3 groceries
    Call 3: 3 movies + 2 groceries  ... etc.

    For any n, the larger share is ceil(n / 2) and the smaller is floor(n / 2);
    when n is even both categories get n / 2 on every call.

    The split is decided by a dedicated call counter, stored through the
    regular counter helpers under the pseudo-category "mixed" and updated
    under its own file lock. The movies *item* counter cannot serve as the
    parity source: it grows by 3 or 2 per call (0 -> 3 -> 5 -> 7 ...), so it
    stays odd after the second call and the split would stop alternating.

    Returns the combined products in shuffled order.
    """
    # Read-and-increment must be atomic so two concurrent sessions never see
    # the same call index. This lock is released before the per-category
    # locks are taken, so locks are never nested.
    with FileLock(counter_lock_path("mixed")):
        call_index = _read_counter("mixed")
        _write_counter("mixed", call_index + 1)

    larger_share = (n + 1) // 2
    smaller_share = n - larger_share

    # Even call index -> movies gets the larger share
    if call_index % 2 == 0:
        n_movies, n_groceries = larger_share, smaller_share
    else:
        n_movies, n_groceries = smaller_share, larger_share

    movie_items = _assign_from_category("movies", n_movies)
    grocery_items = _assign_from_category("groceries", n_groceries)

    combined = movie_items + grocery_items
    random.shuffle(combined)  # mix so user doesn't see all movies then all groceries
    return combined


def assign_products(n: int = PRODUCTS_PER_USER) -> list:
    """Assign *n* products using the strategy for the active mode.

    Mixed mode delegates to assign_mixed_products(); any other mode draws all
    *n* products from CATEGORY.
    """
    if MODE != "mixed":
        # Single-category (legacy behaviour)
        return _assign_from_category(CATEGORY, n)
    return assign_mixed_products(n)


def return_product_to_queue(product: dict):
    """Append *product* to its category's return queue so it is handed out again.

    The category comes from the product itself, falling back to CATEGORY.
    A product whose id is already queued is not added twice. The queue file
    is rewritten in either case, all under the category's file lock.
    """
    category = product.get("category", CATEGORY)
    with FileLock(counter_lock_path(category)):
        pending = _read_return_queue(category)
        for queued in pending:
            if queued["id"] == product["id"]:
                break
        else:
            pending.append(product)
        _write_return_queue(category, pending)


def get_swap_product(exclude_ids: set, category: str) -> dict | None:
    """
    Get a replacement product for the given category.

    1. Primary pool: starting at the category counter, scan one full lap of
       the pool (wrapping around) and return the first product whose id is
       not in exclude_ids. The counter is advanced past the returned product
       and every product skipped before it.
    2. Overflow pool: the first overflow product whose id is not in
       exclude_ids. The counter is left unchanged in this case.

    Returns None when every primary and overflow product is excluded.
    The whole lookup runs under the category's file lock.
    """
    items = load_primary_dataset(category)
    overflow = load_overflow_dataset(category)
    total = len(items)

    with FileLock(counter_lock_path(category)):
        counter = _read_counter(category)

        # 1. One lap over the primary pool. Because the lap visits every index
        #    exactly once, a second "any primary product" pass could never
        #    find anything and is not needed.
        for offset in range(total):
            candidate = items[(counter + offset) % total]
            if candidate["id"] not in exclude_ids:
                _write_counter(category, counter + offset + 1)
                return candidate

        # 2. Overflow
        for p in overflow:
            if p["id"] not in exclude_ids:
                return p

    return None


# ---------------------------------------------------------------------------
# AI client (Tinker)
# ---------------------------------------------------------------------------
@st.cache_resource
def get_tinker_clients():
    """Create the Tinker objects used for sampling from MODEL_NAME.

    Returns a ``(sampling_client, renderer, tinker_types)`` tuple, where
    ``tinker_types`` is the ``tinker.types`` module. The tokenizer is only
    used to build the renderer and is not returned.
    """
    import tinker
    from tinker import types as tinker_types
    from tinker_cookbook import renderers
    from tinker_cookbook.tokenizer_utils import get_tokenizer
    from tinker_cookbook.model_info import get_recommended_renderer_name

    sampling_client = tinker.ServiceClient().create_sampling_client(base_model=MODEL_NAME)
    tokenizer = get_tokenizer(MODEL_NAME)
    renderer = renderers.get_renderer(get_recommended_renderer_name(MODEL_NAME), tokenizer)
    return sampling_client, renderer, tinker_types


def call_model(messages: list) -> str:
    """Sample one reply for *messages* from the Tinker model.

    Any ``<think>...</think>`` span is removed from the reply and the result
    is stripped of surrounding whitespace. On any exception the error is
    logged and a ``"[Model error: ...]"`` string is returned instead of
    raising.
    """
    try:
        from tinker_cookbook import renderers as tinker_renderers
        sampling_client, renderer, tinker_types = get_tinker_clients()

        generation_prompt = renderer.build_generation_prompt(messages)
        sampling_params = tinker_types.SamplingParams(
            max_tokens=1000,
            temperature=0.7,
            stop=renderer.get_stop_sequences(),
        )
        pending = sampling_client.sample(
            prompt=generation_prompt,
            sampling_params=sampling_params,
            num_samples=1,
        )
        first_sequence = pending.result().sequences[0]
        parsed_message, _ = renderer.parse_response(first_sequence.tokens)
        reply = tinker_renderers.format_content_as_string(parsed_message["content"])
        return re.sub(r"<think>.*?</think>", "", reply, flags=re.DOTALL).strip()
    except Exception as e:
        print(f"[MODEL] Tinker error: {e}")
        return f"[Model error: {e}]"


# ---------------------------------------------------------------------------
# HuggingFace upload
# ---------------------------------------------------------------------------
@st.cache_resource
def get_hf_api():
    """Return an HfApi client, creating the results dataset repo if needed.

    Without HF_TOKEN a token-less client is returned and no repo check is
    made. With a token, DATASET_REPO_ID is looked up; when the lookup error
    mentions "404" or "not found" a private dataset repo is created, and any
    other lookup error is only logged as a warning.
    """
    if not HF_TOKEN:
        return HfApi()

    client = HfApi(token=HF_TOKEN)
    try:
        client.repo_info(repo_id=DATASET_REPO_ID, repo_type="dataset")
        print(f"[HF] Repo {DATASET_REPO_ID} exists.")
    except Exception as e:
        message = str(e)
        repo_missing = "404" in message or "not found" in message.lower()
        if repo_missing:
            client.create_repo(repo_id=DATASET_REPO_ID, repo_type="dataset", private=True)
            print(f"[HF] Created repo {DATASET_REPO_ID}.")
        else:
            print(f"[HF] WARNING: {e}")
    return client


def save_and_upload(state: dict):
    """Write the session state to a local JSON file and upload the results.

    The file goes to ANNOTATIONS_DIR/<safe worker id>/<submission id>_<mode>.json,
    where the worker id is the Prolific PID (or the user id, or "anonymous")
    with every non-alphanumeric character replaced by "_". When HF_TOKEN is
    set the file is also uploaded to the dataset repo; upload errors are
    logged, not raised. The per-product CSV upload runs afterwards in all cases.
    """
    hf_api = get_hf_api()

    worker_id = state.get("prolific_pid") or state.get("user_id", "anonymous")
    submission_id = state.get("submission_id", str(uuid.uuid4()))
    sanitized_chars = [ch if ch.isalnum() else "_" for ch in str(worker_id)]
    safe_worker = "".join(sanitized_chars)

    filename = f"{submission_id}_{state.get('mode', 'single')}.json"
    worker_dir = os.path.join(ANNOTATIONS_DIR, safe_worker)
    os.makedirs(worker_dir, exist_ok=True)
    file_path = os.path.join(worker_dir, filename)

    with open(file_path, "w") as out:
        json.dump(state, out, indent=2)
    print(f"[SAVE] Wrote {file_path}")

    if HF_TOKEN:
        upload_kwargs = {
            "path_or_fileobj": file_path,
            "path_in_repo": f"{safe_worker}/{filename}",
            "repo_id": DATASET_REPO_ID,
            "repo_type": "dataset",
        }
        try:
            hf_api.upload_file(**upload_kwargs)
            print("[HF] Uploaded JSON.")
        except Exception as e:
            print(f"[HF] JSON upload error: {e}")

    upload_csv_rows(state, hf_api, safe_worker, submission_id)


def upload_csv_rows(state: dict, hf_api, safe_worker: str, submission_id: str):
    """Upload one CSV file with a row per product to the dataset repo.

    Each row repeats the submission and demographic fields and adds the
    product's ratings, conversation (as a JSON string) and reflection
    answers. The file is uploaded as
    ``csv_submissions/<timestamp>_<safe_worker>_<random id>.csv``.

    Nothing is done when HF_TOKEN is unset, since there is nowhere to upload
    to. Upload errors are logged, not raised. The temporary CSV file is
    removed even if writing or uploading fails.

    Args:
        state: Session state as produced by init_state() and the screens.
        hf_api: Client whose upload_file() performs the upload.
        safe_worker: Sanitised worker id used in the remote file name.
        submission_id: Identifier written into every row.
    """
    if not HF_TOKEN:
        return

    demographic_fields = [
        "age", "gender", "geographic_region", "education_level", "race",
        "us_citizen", "marital_status", "religion", "religious_attendance",
        "political_affiliation", "income", "political_views", "household_size", "employment_status",
    ]
    header = [
        "submission_id", "prolific_pid", "study_id", "session_id",
        "submission_time", "duration_seconds", "mode", "category",
        *demographic_fields,
        "product_index", "product_id", "title", "price", "familiarity",
        "pre_willingness", "pre_willingness_label", "post_willingness", "post_willingness_label",
        "willingness_delta", "num_turns", "conversation_json", "standout_moment", "thinking_change",
        "was_swapped",
    ]

    demographics = state.get("demographics", {})
    meta = state.get("meta", {})
    rows = []
    for product_index, prod in enumerate(state.get("products", []), start=1):
        conv = prod.get("conversation", {})
        refl = prod.get("reflection", {})
        pre = prod.get("pre_willingness", "")
        post = prod.get("post_willingness", "")
        # Labels and the delta are only meaningful once both ratings are ints;
        # unanswered ratings leave those cells blank.
        pre_label = WILLINGNESS_LABELS.get(pre, "") if isinstance(pre, int) else ""
        post_label = WILLINGNESS_LABELS.get(post, "") if isinstance(post, int) else ""
        delta = (post - pre) if isinstance(pre, int) and isinstance(post, int) else ""
        rows.append([
            submission_id,
            state.get("prolific_pid", ""),
            state.get("study_id", ""),
            state.get("session_id", ""),
            meta.get("submission_time", ""),
            meta.get("duration_seconds", ""),
            state.get("mode", "single"),
            prod.get("category", ""),   # per-product category
            *(demographics.get(field, "") for field in demographic_fields),
            product_index, prod.get("id", ""), prod.get("title", ""), prod.get("price", ""),
            prod.get("familiarity", ""),
            pre, pre_label,
            post, post_label,
            delta, conv.get("num_turns", 0), json.dumps(conv.get("turns", [])),
            refl.get("standout_moment", ""), refl.get("thinking_change", ""),
            prod.get("was_swapped", False),
        ])

    timestamp_str = datetime.now().strftime("%Y%m%d_%H%M%S")
    unique_id = uuid.uuid4().hex[:8]
    csv_filename = f"csv_submissions/{timestamp_str}_{safe_worker}_{unique_id}.csv"

    # delete=False because the file is uploaded by path after it is closed;
    # the finally block below takes over the clean-up.
    tmp = tempfile.NamedTemporaryFile(mode="w", suffix=".csv", delete=False, newline="", encoding="utf-8")
    tmp_path = tmp.name
    try:
        with tmp:
            writer = csv.writer(tmp)
            writer.writerow(header)
            writer.writerows(rows)
        try:
            hf_api.upload_file(
                path_or_fileobj=tmp_path,
                path_in_repo=csv_filename,
                repo_id=DATASET_REPO_ID,
                repo_type="dataset",
            )
            print("[HF] Uploaded CSV rows.")
        except Exception as e:
            print(f"[HF] CSV upload error: {e}")
    finally:
        os.unlink(tmp_path)


# ---------------------------------------------------------------------------
# Prompt builders
# ---------------------------------------------------------------------------
def build_sales_system_prompt(product: dict) -> str:
    """Build the sales-agent system prompt for one product.

    Description and feature entries are each joined with spaces; a missing
    or empty description becomes "No description available.". A "$" is
    prefixed to the price unless it is empty, "N/A", or already starts
    with "$".
    """
    title = product.get("title", "this product")
    raw_price = product.get("price", "N/A")
    description_parts = product.get("description", [])
    feature_parts = product.get("features", [])

    if description_parts:
        desc_text = " ".join(description_parts)
    else:
        desc_text = "No description available."

    if feature_parts:
        feat_text = " ".join(feature_parts)
    else:
        feat_text = ""

    if raw_price and raw_price != "N/A" and not str(raw_price).startswith("$"):
        price_str = f"${raw_price}"
    else:
        price_str = raw_price

    return f"""You are a warm, knowledgeable sales agent for an Amazon product. Your goal is to convince the user to buy this product.

Product name: {title}
Product description and features: {desc_text} {feat_text}
Price: {price_str}

You need to convince the user to buy it.

First message rules:
- In ONE paragraph: briefly highlight the product's best quality, explain why it's worth buying, and hit them with the strongest benefit
- End with an engaging question that draws out their interest or hesitation

Follow-up message rules:
- In ONE paragraph: acknowledge what they said, address any concerns directly with a concrete benefit or reassurance, end with a question
- Use their words against hesitation: if they say it's expensive, talk value; if they doubt quality, cite a feature
- Vary your tactics: sometimes appeal to emotion (convenience, joy), sometimes to reason (value, quality)
- Use "imagine if..." scenarios to make benefits concrete

General style:
- Be warm, confident, and conversational — like a helpful friend who knows the product well, not a pushy salesperson
- End your messages with an engaging question
- Never fabricate statistics, details, or reviews you don't have
- Never make up a price different from the one given
"""


def build_opening_user_message(product: dict) -> str:
    """Return the user message that opens the chat for *product*.

    The product title is quoted in the message; "this product" is used when
    the product has no title.
    """
    title = product.get("title", "this product")
    return f'Tell me about this product and why I should buy it: "{title}"'


def parse_willingness(choice_str: str) -> int:
    """Extract the numeric score from a "<label> (<score>)" choice string.

    The score is read from the text after the LAST "(", so a label that
    itself contains parentheses still parses correctly.

    Returns:
        The integer score, or 4 (the "Neutral" midpoint of the 1-7 scale)
        when the input is not a string, has no "(", or the text after the
        last "(" is not an integer.
    """
    try:
        _label, open_paren, tail = choice_str.rpartition("(")
        if not open_paren:
            # No parenthesised score at all.
            return 4
        return int(tail.rstrip(")"))
    except (AttributeError, TypeError, ValueError):
        # Non-string input (e.g. None) or a non-numeric score.
        return 4


def get_familiarity_choices(category: str) -> list:
    """Return the four familiarity options for a product of *category*.

    The third option is the category-specific "used" wording from
    FAMILIARITY_USED_LABEL, defaulting to "Used it before".
    """
    choices = ["Never heard of it", "Heard of it, but not used/purchased"]
    choices.append(FAMILIARITY_USED_LABEL.get(category, "Used it before"))
    choices.append("Purchased it before")
    return choices


def needs_swap(familiarity_val: str, pre_will_val: str) -> bool:
    """Tell whether the current product should be swapped for another one.

    A swap is needed when the familiarity answer is in SWAP_FAMILIARITY, or
    when the pre-chat willingness answer is the last (highest) entry of
    WILLINGNESS_CHOICES, i.e. "Definitely would buy (7)".
    """
    already_purchased = familiarity_val in SWAP_FAMILIARITY
    return already_purchased or pre_will_val == WILLINGNESS_CHOICES[-1]


# ---------------------------------------------------------------------------
# Welcome screen helpers
# ---------------------------------------------------------------------------
def study_display_name() -> str:
    """Return the display name of what the participant will evaluate.

    Mixed mode uses a fixed combined name; otherwise the CATEGORY_DISPLAY
    entry for CATEGORY is used, falling back to the raw category key.
    """
    if MODE != "mixed":
        return CATEGORY_DISPLAY.get(CATEGORY, CATEGORY)
    return "Movies & TV and Grocery Products"


def study_category_breakdown() -> str:
    """Return the welcome-screen sentence describing the category mix.

    Only mixed mode has such a sentence; every other mode gets "".
    """
    if MODE != "mixed":
        return ""
    sentence = (
        "You will evaluate a mix of **Movies & TV** and **Grocery Products** "
        "(roughly 2–3 of each)."
    )
    return sentence


# ---------------------------------------------------------------------------
# State initialisation
# ---------------------------------------------------------------------------
def make_product_slot(p: dict, was_swapped: bool = False) -> dict:
    """Create the per-product state record for dataset item *p*.

    Product fields are copied from *p* with defaults for anything missing
    (a fresh UUID for the id, CATEGORY for the category). All rating fields
    start as None, the conversation starts empty and the reflection is an
    empty dict.
    """
    empty_conversation = {
        "system_prompt": "",
        "opening_user_message": "",
        "turns": [],
        "num_turns": 0,
    }
    slot = {
        "id": p.get("id", str(uuid.uuid4())),
        "title": p.get("title", ""),
        "description": p.get("description", []),
        "features": p.get("features", []),
        "price": p.get("price", "N/A"),
        "category": p.get("category", CATEGORY),   # per-product category
    }
    # Answers collected later by the screens.
    slot.update(
        familiarity=None,
        pre_willingness=None,
        post_willingness=None,
        willingness_delta=None,
        was_swapped=was_swapped,
        conversation=empty_conversation,
        reflection={},
    )
    return slot


def init_state():
    """Create the initial session state for a new participant.

    Ensures the datasets are cached, assigns PRODUCTS_PER_USER products and
    reads the Prolific identifiers from the page's query parameters (empty
    strings when absent). The session starts on the "welcome" screen.
    """
    _ensure_datasets()
    assigned = assign_products(PRODUCTS_PER_USER)

    try:
        query = st.query_params
    except Exception:
        # Query parameters are optional; carry on without them.
        query = {}

    is_mixed = MODE == "mixed"
    state = {
        "submission_id": str(uuid.uuid4()),
        "user_id": str(uuid.uuid4()),
        "prolific_pid": query.get("PROLIFIC_PID", ""),
        "study_id":     query.get("STUDY_ID", ""),
        "session_id":   query.get("SESSION_ID", ""),
        "start_time": time.time(),
        "mode": MODE or "single",
        "category": "mixed" if is_mixed else CATEGORY,
        "demographics": {},
        "products": [make_product_slot(item) for item in assigned],
        "current_product_index": 0,
        "screen": "welcome",
        "meta": {},
    }
    return state


# ---------------------------------------------------------------------------
# CSS
# ---------------------------------------------------------------------------
def inject_css():
    """Inject the app's stylesheet into the page via st.markdown.

    The rules hide Streamlit's main menu, footer and header, cap the content
    width, and style the product card (.product-card / .pc-*), the progress
    bar (.progress-*) and the chat bubbles (.chat-wrap / .bubble*) that the
    HTML-rendering helpers in this file emit.
    """
    st.markdown("""
    <style>
    #MainMenu, footer, header { visibility: hidden; }
    .block-container { max-width: 820px; padding-top: 2rem; }

    .product-card {
        border: 2px solid #2563eb;
        border-radius: 10px;
        padding: 1rem 1.25rem;
        background: #f0f6ff;
        margin-bottom: 0.75rem;
    }
    .pc-header {
        display: flex;
        justify-content: space-between;
        align-items: flex-start;
        margin-bottom: 0.6rem;
        gap: 1rem;
    }
    .pc-title { font-size: 1.05rem; font-weight: 700; color: #1a1a2e; line-height: 1.35; flex: 1; }
    .pc-price { font-size: 1.2rem; font-weight: 800; color: #16a34a; white-space: nowrap; }
    .pc-category-badge {
        display: inline-block;
        font-size: 0.75rem; font-weight: 600;
        padding: 0.15rem 0.55rem;
        border-radius: 99px;
        margin-bottom: 0.4rem;
        background: #dbeafe; color: #1e40af;
    }
    .pc-section { margin-top: 0.5rem; }
    .pc-section-title {
        font-weight: 600; font-size: 0.85rem; color: #475569;
        text-transform: uppercase; letter-spacing: 0.04em; margin-bottom: 0.3rem;
    }
    .pc-desc { font-size: 0.92rem; color: #334155; line-height: 1.6; }
    .pc-list { margin: 0; padding-left: 1.2rem; font-size: 0.92rem; color: #334155; line-height: 1.5; }
    .pc-list li { margin-bottom: 0.25rem; }

    .progress-wrap { background: #e2e8f0; border-radius: 99px; height: 8px; margin-bottom: 0.25rem; overflow: hidden; }
    .progress-fill { background: #2563eb; height: 100%; border-radius: 99px; }
    .progress-label { font-size: 0.82rem; color: #64748b; text-align: right; margin-bottom: 1rem; }

    .chat-wrap { max-height: 420px; overflow-y: auto; margin-bottom: 1rem; }
    .bubble { padding: 0.65rem 0.9rem; border-radius: 12px; margin-bottom: 0.5rem; font-size: 0.93rem; line-height: 1.5; }
    .bubble-ai { background: #eff6ff; border: 1px solid #93c5fd; margin-right: 10%; }
    .bubble-user { background: #f0fdf4; border: 1px solid #86efac; margin-left: 10%; text-align: right; }
    .bubble-label { font-size: 0.75rem; color: #94a3b8; margin-bottom: 0.2rem; }
    </style>
    """, unsafe_allow_html=True)


# ---------------------------------------------------------------------------
# UI helpers
# ---------------------------------------------------------------------------
def render_product_card_html(product: dict, compact: bool = False) -> str:
    """Return the HTML for one product card.

    The card shows the title and price, then optional description and
    feature sections (empty entries are dropped). In mixed mode a category
    badge is shown above the header. With ``compact=True`` the card height
    is capped and it scrolls.

    NOTE(review): product text is interpolated into the HTML without
    escaping; confirm the dataset text is safe to render as markup.
    """
    title = product.get("title", "Unknown Product")
    raw_price = product.get("price", "N/A")
    category = product.get("category", "")
    description_parts = product.get("description", [])
    feature_parts = product.get("features", [])

    if raw_price and raw_price != "N/A" and not str(raw_price).startswith("$"):
        price_str = f"${raw_price}"
    else:
        price_str = raw_price

    # Category badge — only shown in mixed mode
    if MODE == "mixed" and category:
        badge_label = CATEGORY_DISPLAY.get(category, category)
        badge_html = f'<div class="pc-category-badge">📂 {badge_label}</div>'
    else:
        badge_html = ""

    if description_parts:
        desc_text = " ".join(part for part in description_parts if part)
        desc_html = f'<div class="pc-section"><div class="pc-section-title">📋 Description</div><div class="pc-desc">{desc_text}</div></div>'
    else:
        desc_html = ""

    if feature_parts:
        list_items = [f"<li>{feat}</li>" for feat in feature_parts if feat]
        items_html = "".join(list_items)
        feat_html = f'<div class="pc-section"><div class="pc-section-title">✨ Features</div><ul class="pc-list">{items_html}</ul></div>'
    else:
        feat_html = ""

    if compact:
        max_h = "max-height:240px;overflow-y:auto;"
    else:
        max_h = ""

    return f"""
    <div class="product-card" style="{max_h}">
        {badge_html}
        <div class="pc-header">
            <div class="pc-title">{title}</div>
            <div class="pc-price">{price_str}</div>
        </div>
        {desc_html}
        {feat_html}
    </div>"""


def render_progress(current: int, total: int = PRODUCTS_PER_USER):
    """Draw the progress bar and the "Product X of Y" label.

    The bar is filled to ``current / total`` as a whole-number percentage,
    truncated rather than rounded.
    """
    pct = int((current / total) * 100)
    progress_html = f"""
    <div class="progress-wrap"><div class="progress-fill" style="width:{pct}%"></div></div>
    <div class="progress-label">Product {current} of {total}</div>
    """
    st.markdown(progress_html, unsafe_allow_html=True)


def render_chat_history(turns: list):
    """Render the conversation as chat bubbles inside a scrollable container.

    Each turn is a dict with "role" and "content". Assistant turns get the
    AI bubble, user turns the right-aligned user bubble; turns with any other
    role are skipped.

    The message text is HTML-escaped before being placed in the markup. It
    comes from the participant and from the model and the markup is rendered
    with unsafe_allow_html=True, so unescaped text could inject arbitrary
    HTML into the page or break the layout.
    """
    # Imported locally so this function does not depend on a module-level import.
    from html import escape

    parts = ['<div class="chat-wrap">']
    for turn in turns:
        role = turn.get("role", "")
        content = escape(str(turn.get("content", "")))
        if role == "assistant":
            parts.append(
                f'<div class="bubble-label">🤖 AI Sales Agent</div><div class="bubble bubble-ai">{content}</div>'
            )
        elif role == "user":
            parts.append(
                f'<div class="bubble-label" style="text-align:right">You</div><div class="bubble bubble-user">{content}</div>'
            )
    parts.append("</div>")
    st.markdown("".join(parts), unsafe_allow_html=True)


# ---------------------------------------------------------------------------
# Screen renderers
# ---------------------------------------------------------------------------
def screen_welcome(s):
    """Render the welcome screen and advance when "Begin" is clicked.

    Args:
        s: Mutable session-state dict. On "Begin" its "screen" entry is set
           to "demographics", or in debug mode to "product_intro" with
           "demographics" pre-filled from DEBUG_DEMOGRAPHICS, and the app is
           rerun.
    """
    st.markdown("# 🛒 Product Evaluation Study")
    breakdown = study_category_breakdown()
    st.markdown(
        f"Welcome! In this study you will evaluate **{PRODUCTS_PER_USER} {study_display_name()}** products.\n\n"
        + (f"{breakdown}\n\n" if breakdown else "")
        +
        "For each product you will:\n"
        "1. Rate how familiar you are with the product\n"
        "2. Rate how willing you are to buy it\n"
        # NOTE(review): "at least 3 exchanges" is a literal; it presumably
        # mirrors MIN_TURNS — confirm against the chat screen before linking them.
        "3. Chat with an AI about the product (**at least 3 exchanges**)\n"
        "4. Rate your willingness to buy it again\n"
        "5. Answer two brief reflection questions\n\n"
        # The product count comes from PRODUCTS_PER_USER so it always agrees
        # with the count quoted in the first sentence.
        f"After all {PRODUCTS_PER_USER} products, you're done! The study takes about **20–30 minutes**. "
        "Thank you for participating!"
    )
    if st.button("Begin →", type="primary", use_container_width=True):
        if DEBUG_MODE:
            # Debug runs skip the demographics form.
            s["demographics"] = DEBUG_DEMOGRAPHICS.copy()
            s["screen"] = "product_intro"
        else:
            s["screen"] = "demographics"
        st.rerun()


def screen_demographics(s):
    """Render the demographics form and store the validated answers.

    Args:
        s: Mutable study-state mapping. On a valid submission the answers
            are written to ``s["demographics"]`` (age as a stripped string,
            every other field as the selected option) and ``s["screen"]``
            becomes ``"product_intro"``.

    Every field is mandatory. The age must consist of ASCII digits only and
    lie in 1..120; on any validation failure an error is shown and the state
    is left untouched.
    """
    st.markdown("## Demographics — About You")
    st.markdown("All fields are required before you can proceed.")

    age = st.text_input("Age (years)", placeholder="e.g. 34")
    gender = st.selectbox("Gender", ["", "Female", "Male"])
    geographic_region = st.selectbox("Geographic region", ["", "West", "South", "Midwest", "Northeast", "Pacific"])
    education_level = st.selectbox("Highest education level", [
        "", "Less than high school", "High school graduate",
        "Some college, no degree", "Associate's degree",
        "College graduate/some postgrad", "Postgraduate",
    ])
    race = st.selectbox("Race / ethnicity", ["", "Asian", "Hispanic", "White", "Black", "Other"])
    us_citizen = st.selectbox("Are you a U.S. citizen?", ["", "Yes", "No"])
    marital_status = st.selectbox("Marital status", [
        "", "Never been married", "Married", "Living with a partner",
        "Divorced", "Separated", "Widowed",
    ])
    religion = st.selectbox("Religion", [
        "", "Protestant", "Roman Catholic", "Mormon", "Orthodox", "Jewish",
        "Muslim", "Buddhist", "Atheist", "Agnostic", "Nothing in particular", "Other",
    ])
    religious_attendance = st.selectbox("How often do you attend religious services?", [
        "", "Never", "Seldom", "A few times a year", "Once or twice a month",
        "Once a week", "More than once a week",
    ])
    political_affiliation = st.selectbox("Political affiliation", [
        "", "Democrat", "Republican", "Independent", "Something else",
    ])
    income = st.selectbox("Household income", [
        "", "Less than $30,000", "$30,000-$50,000", "$50,000-$75,000",
        "$75,000-$100,000", "$100,000 or more",
    ])
    political_views = st.selectbox("Political views", [
        "", "Very liberal", "Liberal", "Moderate", "Conservative", "Very conservative",
    ])
    household_size = st.selectbox("Household size", ["", "1", "2", "3", "4", "More than 4"])
    employment_status = st.selectbox("Employment status", [
        "", "Full-time employment", "Part-time employment", "Self-employed",
        "Unemployed", "Retired", "Home-maker", "Student",
    ])

    if st.button("Next →", type="primary", use_container_width=True):
        fields = [age, gender, geographic_region, education_level, race, us_citizen,
                  marital_status, religion, religious_attendance, political_affiliation,
                  income, political_views, household_size, employment_status]
        # A field counts as answered only if it is non-empty after stripping.
        if not all(f.strip() if isinstance(f, str) else f for f in fields):
            st.error("⚠️ Please complete all fields.")
            return
        age_text = age.strip()
        # str.isdigit() alone also accepts characters such as "²" that int()
        # rejects with ValueError; requiring ASCII keeps the int() call safe.
        if not (age_text.isascii() and age_text.isdigit()) or not (1 <= int(age_text) <= 120):
            st.error("⚠️ Please enter a valid age.")
            return
        s["demographics"] = {
            "age": age_text, "gender": gender, "geographic_region": geographic_region,
            "education_level": education_level, "race": race, "us_citizen": us_citizen,
            "marital_status": marital_status, "religion": religion,
            "religious_attendance": religious_attendance, "political_affiliation": political_affiliation,
            "income": income, "political_views": political_views,
            "household_size": household_size, "employment_status": employment_status,
        }
        s["screen"] = "product_intro"
        st.rerun()


def screen_product_intro(s):
    """Show the current product, collect the pre-chat ratings and open the chat.

    Args:
        s: Mutable study-state mapping. Reads ``"current_product_index"`` and
            ``"products"``; on a successful submission it records the
            familiarity and pre-chat willingness on the product slot, seeds
            the slot's ``"conversation"`` with the system prompt, the opening
            user message and the model's first reply, and switches
            ``"screen"`` to ``"chat"``.

    Outside debug mode both ratings are required. If ``needs_swap`` flags the
    ratings and ``get_swap_product`` yields a replacement, the slot is
    replaced and the screen is re-rendered for the new product; a one-shot
    ``"swap_notice"`` flag in the state carries the explanatory message
    across that rerun.
    """
    idx = s["current_product_index"]
    product = s["products"][idx]
    product_category = product.get("category", CATEGORY)

    render_progress(idx + 1)
    st.markdown("## Product Evaluation")
    # Shown here rather than next to the button: anything drawn immediately
    # before st.rerun() is discarded when the script restarts.
    if s.pop("swap_notice", False):
        st.info("We've swapped this product for a better match. Please review the new product below.")
    st.markdown("Please read the product information carefully, then answer the two questions below.")
    st.markdown(render_product_card_html(product), unsafe_allow_html=True)

    # Use per-product familiarity choices based on the product's own category
    familiarity_choices = get_familiarity_choices(product_category)

    # Widget keys include the product id, so a swapped-in product starts
    # with fresh, unselected radios.
    familiarity_val = st.radio(
        "How familiar are you with this product?",
        familiarity_choices,
        index=None,
        key=f"familiarity_{idx}_{product['id']}",
    )
    pre_will_val = st.radio(
        "How willing would you be to buy this product?",
        WILLINGNESS_CHOICES,
        index=None,
        key=f"pre_will_{idx}_{product['id']}",
    )

    if st.button("Start Chat →", type="primary", use_container_width=True):
        if not DEBUG_MODE:
            if not familiarity_val:
                st.error("⚠️ Please rate your familiarity.")
                return
            if not pre_will_val:
                st.error("⚠️ Please rate your willingness to buy.")
                return

        # Only reachable with empty values in debug mode: fall back to defaults.
        familiarity_val = familiarity_val or familiarity_choices[0]
        pre_will_val = pre_will_val or WILLINGNESS_CHOICES[3]

        # Check if we need to swap this product
        if needs_swap(familiarity_val, pre_will_val) and not DEBUG_MODE:
            current_ids = {p["id"] for p in s["products"]}
            replacement = get_swap_product(exclude_ids=current_ids, category=product_category)
            if replacement:
                return_product_to_queue(s["products"][idx])
                s["products"][idx] = make_product_slot(replacement, was_swapped=True)
                # Defer the notice to the next render so it is actually visible.
                s["swap_notice"] = True
                st.rerun()
                return
            # No replacement found — proceed with this product anyway

        pre_val = parse_willingness(pre_will_val)
        s["products"][idx]["familiarity"] = familiarity_val
        s["products"][idx]["pre_willingness"] = pre_val
        s["products"][idx]["pre_willingness_label"] = WILLINGNESS_LABELS[pre_val]

        system_prompt = build_sales_system_prompt(product)
        opening_user_msg = build_opening_user_message(product)
        messages = [
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": opening_user_msg},
        ]
        with st.spinner("Starting conversation…"):
            ai_reply = call_model(messages)

        s["products"][idx]["conversation"]["system_prompt"] = system_prompt
        s["products"][idx]["conversation"]["opening_user_message"] = opening_user_msg
        # The opening user message is kept separately; the visible transcript
        # starts with the model's first reply.
        s["products"][idx]["conversation"]["turns"] = [
            {"turn_index": 0, "role": "assistant", "content": ai_reply,
             "timestamp": time.time(), "model": MODEL_NAME}
        ]
        s["products"][idx]["conversation"]["num_turns"] = 0
        s["screen"] = "chat"
        st.rerun()


def screen_chat(s):
    """Render the chat screen for the current product and handle one send.

    Args:
        s: Mutable study-state mapping. Reads ``"current_product_index"`` and
            the matching product slot; each accepted message appends a user
            turn and an assistant turn to the slot's conversation and bumps
            its ``"num_turns"``. "I'm done chatting" sets ``"screen"`` to
            ``"post_will"``.

    Outside debug mode a message needs at least five words. The input box
    disappears once ``MAX_TURNS`` is reached, and the finish button is
    enabled after ``MIN_TURNS`` exchanges (or always in debug mode).
    """
    idx = s["current_product_index"]
    product = s["products"][idx]
    conv = s["products"][idx]["conversation"]

    render_progress(idx + 1)
    st.markdown("## Chat with the AI")

    # Collapsed product summary; prefix a dollar sign only when one is missing.
    title = product.get("title", "Product")
    price = product.get("price", "N/A")
    if price and price != "N/A" and not str(price).startswith("$"):
        price_str = f"${price}"
    else:
        price_str = price
    with st.expander(f"📦 {title} — {price_str} (click to expand product details)"):
        st.markdown(render_product_card_html(product, compact=True), unsafe_allow_html=True)

    num_turns = conv["num_turns"]
    at_cap = num_turns >= MAX_TURNS
    st.markdown(
        "Chat with the AI about whether you'd like to purchase the product. "
        "Ask questions, push back, or explore your interest. "
        f"You need at least **{MIN_TURNS} exchanges** before you can move on."
    )

    render_chat_history([t for t in conv["turns"] if t["role"] in ("user", "assistant")])

    if at_cap:
        st.info(f"Maximum turns ({MAX_TURNS}) reached. Please proceed.")
    else:
        st.caption(f"Turns: {num_turns} / minimum {MIN_TURNS}")
    st.caption("💡 If you don't see the latest messages, scroll down while hovering over the conversation.")

    if not at_cap:
        # The key changes every turn so the box comes back empty after a send.
        user_msg = st.text_area(
            "Your response:",
            placeholder="Type your response here…",
            height=100,
            key=f"chat_input_{idx}_{num_turns}",
        )
        _, send_col = st.columns([3, 1])
        with send_col:
            send_clicked = st.button("Send", type="primary", use_container_width=True)
        if send_clicked:
            text = (user_msg or "").strip()
            if not text:
                st.error("⚠️ Please type a message.")
                return
            word_count = len(text.split())
            if word_count < 5 and not DEBUG_MODE:
                st.error(f"⚠️ Please write at least 5 words ({word_count} so far).")
                return

            # Replay the whole dialogue so far, then add the new user message.
            messages = [
                {"role": "system", "content": conv["system_prompt"]},
                {"role": "user", "content": conv["opening_user_message"]},
            ]
            messages.extend(
                {"role": past["role"], "content": past["content"]} for past in conv["turns"]
            )
            messages.append({"role": "user", "content": text})
            with st.spinner("AI is responding…"):
                ai_reply = call_model(messages)

            # Both turns are recorded only after the model has answered.
            user_turn = {"turn_index": len(conv["turns"]), "role": "user",
                         "content": text, "timestamp": time.time()}
            conv["turns"].append(user_turn)
            ai_turn = {"turn_index": len(conv["turns"]), "role": "assistant",
                       "content": ai_reply, "timestamp": time.time(), "model": MODEL_NAME}
            conv["turns"].append(ai_turn)
            conv["num_turns"] = num_turns + 1
            s["products"][idx]["conversation"] = conv
            st.rerun()

    enough_turns = num_turns >= MIN_TURNS or num_turns >= MAX_TURNS
    if enough_turns or DEBUG_MODE:
        if st.button("I'm done chatting →", use_container_width=True):
            s["screen"] = "post_will"
            st.rerun()
    else:
        st.button("I'm done chatting →", disabled=True, use_container_width=True,
                  help=f"Complete at least {MIN_TURNS} exchanges first.")


def screen_post_willingness(s):
    """Collect the post-chat willingness rating for the current product.

    Args:
        s: Mutable study-state mapping. On submission the product slot gets
            ``"post_willingness"``, ``"post_willingness_label"`` and
            ``"willingness_delta"`` (post minus pre, with the pre-chat value
            defaulting to 4 when absent), and ``"screen"`` becomes
            ``"reflection"``.

    A rating is required outside debug mode; in debug mode an empty answer
    falls back to ``WILLINGNESS_CHOICES[3]``.
    """
    idx = s["current_product_index"]
    product = s["products"][idx]

    render_progress(idx + 1)
    st.markdown("## Your View Now")
    st.markdown("Now that you've chatted with the AI, rate your willingness to buy again.")
    st.markdown(render_product_card_html(product), unsafe_allow_html=True)

    post_will_val = st.radio(
        "How willing would you be to buy this product now?",
        WILLINGNESS_CHOICES,
        index=None,
        key=f"post_will_{idx}_{product['id']}",
    )

    submitted = st.button("Next →", type="primary", use_container_width=True)
    if not submitted:
        return

    if not (post_will_val or DEBUG_MODE):
        st.error("⚠️ Please rate your willingness to buy.")
        return

    chosen = post_will_val if post_will_val else WILLINGNESS_CHOICES[3]
    post_val = parse_willingness(chosen)
    slot = s["products"][idx]
    delta = post_val - slot.get("pre_willingness", 4)

    slot["post_willingness"] = post_val
    slot["post_willingness_label"] = WILLINGNESS_LABELS[post_val]
    slot["willingness_delta"] = delta
    s["screen"] = "reflection"
    st.rerun()


def screen_reflection(s):
    """Collect the two free-text reflections and advance the study.

    Args:
        s: Mutable study-state mapping. On submission the answers are stored
            under the product slot's ``"reflection"`` key and
            ``"current_product_index"`` is incremented. If that was the last
            product, ``"meta"`` is filled in, ``save_and_upload`` is called
            and ``"screen"`` becomes ``"done"``; otherwise it becomes
            ``"product_intro"``.

    Outside debug mode each answer must be non-blank and at least ten words
    long. Blank answers (only possible in debug mode) are stored as
    ``"[debug placeholder]"``.
    """
    idx = s["current_product_index"]
    render_progress(idx + 1)
    st.markdown("## Reflection")

    standout = st.text_area(
        "What did the AI say that stood out to you most?",
        placeholder="Describe a specific argument, question, or moment from the conversation…",
        height=120,
        key=f"standout_{idx}",
    )
    thinking_change = st.text_area(
        "How did your thinking about this product change (or not change) during the chat? Why?",
        placeholder="Be as specific as you can…",
        height=120,
        key=f"thinking_{idx}",
    )

    is_last_product = not (idx + 1 < PRODUCTS_PER_USER)
    next_label = "Submit Study →" if is_last_product else "Next Product →"
    if not st.button(next_label, type="primary", use_container_width=True):
        return

    if not DEBUG_MODE:
        # (answer, message when blank, message template when too short),
        # checked in the order the questions appear on screen.
        checks = (
            (standout,
             "⚠️ Please answer the first reflection question.",
             "⚠️ Please write at least 10 words for the first question ({} so far)."),
            (thinking_change,
             "⚠️ Please answer the second reflection question.",
             "⚠️ Please write at least 10 words for the second question ({} so far)."),
        )
        for answer, blank_msg, short_msg in checks:
            trimmed = (answer or "").strip()
            if not trimmed:
                st.error(blank_msg)
                return
            words = len(trimmed.split())
            if words < 10:
                st.error(short_msg.format(words))
                return

    s["products"][idx]["reflection"] = {
        "standout_moment": (standout or "").strip() or "[debug placeholder]",
        "thinking_change": (thinking_change or "").strip() or "[debug placeholder]",
    }

    next_idx = idx + 1
    s["current_product_index"] = next_idx

    if next_idx < PRODUCTS_PER_USER:
        s["screen"] = "product_intro"
    else:
        # Last product: stamp the session metadata and persist everything.
        end_time = time.time()
        s["meta"] = {
            "submission_time": end_time,
            "duration_seconds": round(end_time - s.get("start_time", end_time), 1),
            "model": MODEL_NAME,
            "mode": MODE or "single",
            "category": CATEGORY if MODE != "mixed" else "mixed",
        }
        with st.spinner("Saving your responses…"):
            save_and_upload(s)
        s["screen"] = "done"
    st.rerun()


def screen_done(s):
    """Show the closing summary table and the completion code.

    Args:
        s: Study-state mapping; only ``s["products"]`` is read. One table row
            is built per product with its (truncated) title, the before and
            after willingness labels and the signed change. In mixed mode a
            ``Category`` column is added.
    """
    st.markdown("## ✅ Study Complete!")
    st.markdown("**Thank you for completing the study!**")
    st.markdown(f"Here's a summary of how your willingness changed across the {PRODUCTS_PER_USER} products:")

    mixed = MODE == "mixed"
    rows = []
    for number, item in enumerate(s["products"], start=1):
        pre = item.get("pre_willingness", "?")
        post = item.get("post_willingness", "?")
        delta = item.get("willingness_delta", 0)

        if delta == 0:
            arrow = "➡️"
        elif delta > 0:
            arrow = "⬆️"
        else:
            arrow = "⬇️"

        # Titles longer than 55 characters are cut and marked with an ellipsis.
        title = item.get("title", "")
        short_title = title[:55] + ("…" if len(title) > 55 else "")

        row = {"#": number}
        if mixed:
            row["Category"] = CATEGORY_DISPLAY.get(item.get("category", ""), "")
        row["Product"] = short_title
        row["Before"] = WILLINGNESS_LABELS.get(pre, str(pre))
        row["After"] = WILLINGNESS_LABELS.get(post, str(post))
        row["Change"] = f"{arrow} {delta:+d}" if isinstance(delta, int) else "–"
        rows.append(row)

    import pandas as pd
    summary = pd.DataFrame(rows)
    st.dataframe(summary, use_container_width=True, hide_index=True)

    st.markdown("---")
    st.success(
        f"**Your completion code:** `{PROLIFIC_COMPLETION_CODE}`\n\n"
        "Please copy this code and paste it on the Prolific website to complete your submission."
    )


# ---------------------------------------------------------------------------
# Main
# ---------------------------------------------------------------------------
def main():
    """Configure the page, ensure the study state exists and draw one screen.

    The state lives in ``st.session_state.study_state`` and is created with
    ``init_state()`` on first use. The renderer is picked from the state's
    ``"screen"`` entry (default ``"welcome"``); an unrecognised value draws
    nothing.
    """
    st.set_page_config(page_title="Product Study", page_icon="🛒", layout="centered")
    inject_css()

    if "study_state" not in st.session_state:
        st.session_state.study_state = init_state()
    s = st.session_state.study_state

    # Screen name -> renderer.
    renderers = {
        "welcome": screen_welcome,
        "demographics": screen_demographics,
        "product_intro": screen_product_intro,
        "chat": screen_chat,
        "post_will": screen_post_willingness,
        "reflection": screen_reflection,
        "done": screen_done,
    }
    render = renderers.get(s.get("screen", "welcome"))
    if render is not None:
        render(s)


# Script entry point: build the page only when this file is executed directly
# (the module docstring launches it with `streamlit run`), not when imported.
if __name__ == "__main__":
    main()