File size: 8,761 Bytes
eedb2c4
 
647032a
eedb2c4
 
d3c9e13
647032a
 
d3c9e13
647032a
 
d3c9e13
a48e2a2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d3c9e13
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
647032a
d3c9e13
 
 
647032a
eedb2c4
 
 
 
 
 
 
 
 
 
 
 
 
d3c9e13
eedb2c4
 
 
647032a
eedb2c4
 
d3c9e13
eedb2c4
 
d3c9e13
eedb2c4
 
647032a
eedb2c4
 
 
 
 
 
d3c9e13
eedb2c4
 
 
 
 
 
 
 
 
 
647032a
eedb2c4
 
d3c9e13
 
 
eedb2c4
647032a
eedb2c4
 
d3c9e13
eedb2c4
d3c9e13
eedb2c4
647032a
eedb2c4
 
 
 
 
 
 
 
 
 
647032a
eedb2c4
 
 
 
 
 
 
 
d3c9e13
eedb2c4
 
 
 
 
 
647032a
 
 
d3c9e13
647032a
eedb2c4
 
 
 
d3c9e13
 
 
 
 
 
eedb2c4
 
 
d3c9e13
eedb2c4
 
 
d3c9e13
eedb2c4
 
 
 
 
d3c9e13
eedb2c4
d3c9e13
eedb2c4
a48e2a2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
eedb2c4
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
# app_storefront.py
import os
import sys
import gradio as gr

# Ensure "core/" is importable
sys.path.append(os.path.join(os.path.dirname(__file__), "core"))

# Import only functions; core.storefront doesn't export constants
from core.model import model_generate, MODEL_NAME
from core.memory import build_prompt_from_history
from core.storefront import load_storefront, storefront_qna, extract_products, get_rules
from core.storefront import is_storefront_query

def chat_pipeline(history, message, max_new_tokens=96, temperature=0.7, top_p=0.9):
    # 1) Try storefront facts first
    sf = storefront_qna(DATA, message)
    if sf:
        return sf

    # 2) If not a storefront query, offer guided help (no LLM)
    if not is_storefront_query(message):
        return (
            "I can help with the graduation storefront. Examples:\n"
            "- Parking rules, lots opening times\n"
            "- Attire / dress code\n"
            "- Cap & Gown details and pickup\n"
            "- Parking passes (multiple allowed)\n"
            "Ask one of those, and I’ll answer directly."
        )

    # 3) Otherwise, generate with memory and hard stops
    prompt = build_prompt_from_history(history, message, k=4)
    gen = model_generate(prompt, max_new_tokens, temperature, top_p)
    return clean_generation(gen)

def clean_generation(text: str) -> str:
    return (text or "").strip()

# ---------------- Load data + safe fallbacks ----------------
DATA = load_storefront()  # may be None if storefront_data.json missing/empty

# Fallbacks used if JSON not present
FALLBACK_PRODUCTS = [
    {"sku": "CG-SET", "name": "Cap & Gown Set", "price": 59.00,
     "notes": "Tassel included; ships until 10 days before the event"},
    {"sku": "PK-1",   "name": "Parking Pass",   "price": 10.00,
     "notes": "Multiple passes are allowed per student"}
]
FALLBACK_VENUE = [
    "Formal attire recommended (not required).",
    "No muscle shirts.",
    "No sagging pants."
]
FALLBACK_PARKING = [
    "No double parking.",
    "Vehicles parked in handicap spaces will be towed."
]

# Normalize products/rules for the tabs
if DATA:
    PRODUCTS = extract_products(DATA) or FALLBACK_PRODUCTS
    venue_rules, parking_rules = get_rules(DATA)
    VENUE_RULES = venue_rules or FALLBACK_VENUE
    PARKING_RULES = parking_rules or FALLBACK_PARKING
else:
    PRODUCTS = FALLBACK_PRODUCTS
    VENUE_RULES = FALLBACK_VENUE
    PARKING_RULES = FALLBACK_PARKING



# ---------------- UI ----------------
CSS = """
:root { --bg:#0b0d12; --panel:#0f172a; --border:#1f2940; --text:#e5e7eb; --muted:#9ca3af; }
.gradio-container { background: var(--bg) !important; color: var(--text) !important; }
.panel { border:1px solid var(--border); border-radius:16px; background:var(--panel); }
.small { font-size:12px; color: var(--muted); }
"""

with gr.Blocks(title="Storefront Chat", css=CSS) as demo:
    gr.Markdown("## Storefront Chat")

    # Single history state (kept in sync with Chatbot)
    history_state = gr.State([])

    with gr.Tabs():
        # --- TAB: Chat ---
        with gr.TabItem("Chat"):
            with gr.Group(elem_classes=["panel"]):
                chat = gr.Chatbot(height=360, bubble_full_width=False, label="Chat")

                with gr.Row():
                    msg  = gr.Textbox(placeholder="Ask about parking rules, attire, cap & gown, pickup times…", scale=5)
                    send = gr.Button("Send", scale=1)

                # Quick chips
                with gr.Row():
                    chip1 = gr.Button("Parking rules", variant="secondary")
                    chip2 = gr.Button("Multiple passes", variant="secondary")
                    chip3 = gr.Button("Attire", variant="secondary")
                    chip4 = gr.Button("When do lots open?", variant="secondary")

                # Advanced options (sliders + Health/Capabilities)
                with gr.Accordion("Advanced chat options", open=False):
                    max_new = gr.Slider(32, 512, 128, 1, label="Max new tokens")
                    temp    = gr.Slider(0.1, 1.5, 0.8, 0.05, label="Temperature")
                    topp    = gr.Slider(0.1, 1.0, 0.95, 0.05, label="Top-p")

                    with gr.Row():
                        health_btn = gr.Button("Health", variant="secondary")
                        caps_btn   = gr.Button("Capabilities", variant="secondary")
                        status_md  = gr.Markdown("Status: not checked", elem_classes=["small"])

        # --- TAB: Products ---
        with gr.TabItem("Products"):
            gr.Markdown("### Available Items")
            cols = ["sku", "name", "price", "notes"]
            data = [[p.get(c, "") for c in cols] for p in PRODUCTS]
            gr.Dataframe(headers=[c.upper() for c in cols], value=data, interactive=False, wrap=True, label="Products")

        # --- TAB: Rules ---
        with gr.TabItem("Rules"):
            gr.Markdown("### Venue rules")
            gr.Markdown("- " + "\n- ".join(VENUE_RULES))
            gr.Markdown("### Parking rules")
            gr.Markdown("- " + "\n- ".join(PARKING_RULES))

        # --- TAB: Logistics ---
        with gr.TabItem("Logistics"):
            gr.Markdown(
                "### Event Logistics\n"
                "- Shipping available until 10 days before event (typ. 3–5 business days)\n"
                "- Pickup: Student Center Bookstore during the week prior to event\n"
                "- Graduates arrive 90 minutes early; guests 60 minutes early\n"
                "- Lots A & B open 2 hours before; overflow as needed\n"
                "\n*Try asking the bot:* “What time should I arrive?” • “Where do I pick up the gown?”"
            )

    # ---------- Helpers ----------
    def _append_bot_md(history, md_text):
        history = history or []
        return history + [[None, md_text]]

    # ---------- Callbacks ----------
    def on_send(history, message, max_new_tokens, temperature, top_p):
        t = (message or "").strip()
        if not t:
            return history, history, ""  # no-op; shapes must match
        history = (history or []) + [[t, None]]
        reply = chat_pipeline(history[:-1], t, max_new_tokens, temperature, top_p)
        history[-1][1] = reply
        return history, history, ""

    def _health_cb(history):
        md = (
            f"### Status: ✅ Healthy\n"
            f"- Model: `{MODEL_NAME}`\n"
            f"- Storefront JSON: {'loaded' if bool(DATA) else 'not found'}"
        )
        new_hist = _append_bot_md(history, md)
        return new_hist, new_hist, "Status: ✅ Healthy"

    def _caps_cb(history):
        md = (
            "### Capabilities\n"
            "- Chat (LLM text-generation, memory-aware prompt)\n"
            "- Storefront Q&A (parking, attire, products, logistics)\n"
            "- Adjustable: max_new_tokens, temperature, top-p"
        )
        new_hist = _append_bot_md(history, md)
        return new_hist, new_hist

    # Wire up (state + chatbot)
    send.click(on_send, [history_state, msg, max_new, temp, topp], [history_state, chat, msg])
    msg.submit(on_send, [history_state, msg, max_new, temp, topp], [history_state, chat, msg])

    # Chips → prefill textbox
    chip1.click(lambda: "What are the parking rules?", outputs=msg)
    chip2.click(lambda: "Can I buy multiple parking passes?", outputs=msg)
    chip3.click(lambda: "Is formal attire required?", outputs=msg)
    chip4.click(lambda: "What time do the parking lots open?", outputs=msg)

    # Health / Capabilities live inside Advanced
    health_btn.click(_health_cb, inputs=[history_state], outputs=[history_state, chat, status_md])
    caps_btn.click(_caps_cb,   inputs=[history_state], outputs=[history_state, chat])

def clean_generation(text: str) -> str:
    s = (text or "").strip()

    # If the prompt contained "Assistant:", keep only what comes after the last one
    last = s.rfind("Assistant:")
    if last != -1:
        s = s[last + len("Assistant:"):].strip()

    # If it accidentally continued into a new "User:" or instructions, cut there
    cut_marks = ["\nUser:", "\nYOU ARE ANSWERING", "\nProducts:", "\nVenue rules:", "\nParking rules:"]
    cut_positions = [s.find(m) for m in cut_marks if s.find(m) != -1]
    if cut_positions:
        s = s[:min(cut_positions)].strip()

    # Collapse repeated lines like "Yes, multiple parking passes..." spam
    lines, out = s.splitlines(), []
    seen = set()
    for ln in lines:
        # dedupe only exact consecutive repeats; keep normal conversation lines
        if not out or ln != out[-1]:
            out.append(ln)
    return "\n".join(out).strip()

if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=int(os.getenv("PORT", "7860")))