Mohammed Thameem committed on
Commit
a2eaad1
·
1 Parent(s): 11a86dd

WIP before rebase

Browse files
Files changed (3) hide show
  1. .github/workflows/hf-sync.yml +19 -3
  2. app.py +264 -54
  3. tests/test_app.py +32 -0
.github/workflows/hf-sync.yml CHANGED
@@ -1,4 +1,4 @@
1
- name: Sync to Hugging Face hub
2
 
3
  on:
4
  push:
@@ -7,7 +7,7 @@ on:
7
  workflow_dispatch:
8
 
9
  jobs:
10
- sync-to-hub:
11
  runs-on: ubuntu-latest
12
  steps:
13
  - uses: actions/checkout@v3
@@ -15,7 +15,23 @@ jobs:
15
  fetch-depth: 0
16
  lfs: true
17
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  - name: Push to Hugging Face
 
19
  env:
20
  HF_TOKEN: ${{ secrets.HF_TOKEN }}
21
  run: |
@@ -24,7 +40,7 @@ jobs:
24
  git push --force https://mlops-group8:$HF_TOKEN@huggingface.co/spaces/mlops-group8/case-study-1-local HEAD:main
25
 
26
  - name: Notify Slack (on success)
27
- if: success()
28
  uses: rtCamp/action-slack-notify@v2
29
  env:
30
  SLACK_WEBHOOK: ${{ secrets.SLACK_WEBHOOK_URL }}
 
1
+ name: Test and Sync to Hugging Face hub
2
 
3
  on:
4
  push:
 
7
  workflow_dispatch:
8
 
9
  jobs:
10
+ test-and-sync:
11
  runs-on: ubuntu-latest
12
  steps:
13
  - uses: actions/checkout@v3
 
15
  fetch-depth: 0
16
  lfs: true
17
 
18
+ - name: Set up Python
19
+ uses: actions/setup-python@v4
20
+ with:
21
+ python-version: '3.10'
22
+
23
+ - name: Install dependencies
24
+ run: |
25
+ if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
26
+ pip install pytest
27
+
28
+ - name: Run tests
29
+ env:
30
+ HF_TOKEN: ${{ secrets.HF_TOKEN }}
31
+ run: PYTHONPATH=. pytest --maxfail=1 --disable-warnings -q
32
+
33
  - name: Push to Hugging Face
34
+ if: success() # only run if tests pass
35
  env:
36
  HF_TOKEN: ${{ secrets.HF_TOKEN }}
37
  run: |
 
40
  git push --force https://mlops-group8:$HF_TOKEN@huggingface.co/spaces/mlops-group8/case-study-1-local HEAD:main
41
 
42
  - name: Notify Slack (on success)
43
+ if: success()
44
  uses: rtCamp/action-slack-notify@v2
45
  env:
46
  SLACK_WEBHOOK: ${{ secrets.SLACK_WEBHOOK_URL }}
app.py CHANGED
@@ -4,87 +4,297 @@ import gradio as gr
4
  from huggingface_hub import login
5
  from transformers import AutoTokenizer, AutoModelForCausalLM
6
 
 
7
  HF_TOKEN = os.getenv("HF_TOKEN")
8
  if not HF_TOKEN:
9
  raise RuntimeError("HF_TOKEN not found. In Spaces, add it under Settings → Repository secrets.")
10
 
11
  login(token=HF_TOKEN)
12
 
13
- MODEL_ID = "meta-llama/Llama-3.2-1B"
14
  DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
15
 
16
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, token=HF_TOKEN)
 
 
 
 
 
17
  model = AutoModelForCausalLM.from_pretrained(
18
  MODEL_ID,
19
  token=HF_TOKEN,
20
- torch_dtype=torch.float32,
21
  ).to(DEVICE)
22
  model.eval()
23
 
24
- # Ensure Llama 3 chat template exists
25
  if tokenizer.chat_template is None:
26
- tokenizer.chat_template = """<|begin_of_text|>{% for message in messages %}{% if message['role'] == 'user' %}{{ '<|start_header_id|>user<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% elif message['role'] == 'system' %}{{ '<|start_header_id|>system<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% elif message['role'] == 'assistant' %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}"""
 
 
 
 
 
 
 
27
 
28
- def _get_eot_id(tok):
29
- tid = tok.convert_tokens_to_ids("<|eot_id|>")
30
- return tid if isinstance(tid, int) and tid >= 0 else (tok.eos_token_id or 0)
 
31
 
32
- EOT_ID = _get_eot_id(tokenizer)
33
- PAD_ID = tokenizer.eos_token_id if tokenizer.eos_token_id is not None else 0
 
 
 
34
 
35
- SYSTEM_PROMPT = (
36
- "You are Sustainable.ai, a friendly, encouraging assistant. "
37
- "Offer simple, practical, sustainable alternatives to everyday actions. "
38
- "Be supportive and never judgmental."
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  )
40
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  @torch.inference_mode()
42
- def chat(message, history):
43
- messages = [{"role": "system", "content": SYSTEM_PROMPT}]
44
- for u, a in history:
45
- if u:
46
- messages.append({"role": "user", "content": u})
47
- if a:
48
- messages.append({"role": "assistant", "content": a})
49
- messages.append({"role": "user", "content": message})
50
-
51
- prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
52
- inputs = tokenizer(prompt, return_tensors="pt")
53
- inputs = {k: v.to(DEVICE) for k, v in inputs.items()}
54
 
55
- outputs = model.generate(
56
- **inputs,
57
- max_new_tokens=200,
58
- do_sample=True,
59
- temperature=0.7,
60
- top_p=0.9,
61
- eos_token_id=EOT_ID,
62
- pad_token_id=PAD_ID,
63
  )
64
 
65
- new_tokens = outputs[0, inputs["input_ids"].shape[1]:]
66
- return tokenizer.decode(new_tokens, skip_special_tokens=True).strip()
67
-
68
- # Create the app with graceful fallback for older Gradio
69
- try:
70
- demo = gr.ChatInterface(
71
- fn=chat,
72
- title="Sustainable.ai 🌿",
73
- description="Tell me what you plan to do, and I’ll suggest a simpler, greener alternative.",
74
- submit_btn="Suggest",
75
- retry_btn="Regenerate", # only available on newer Gradio
76
- clear_btn="Clear", # may also be unavailable on older versions
77
- )
78
- except TypeError:
79
- # Older Gradio versions
80
- demo = gr.ChatInterface(
81
- fn=chat,
82
- title="Sustainable.ai 🌿",
83
- description="Tell me what you plan to do, and I’ll suggest a simpler, greener alternative.",
84
- # use defaults for buttons
85
  )
86
 
87
- demo = demo.queue(max_size=32, default_concurrency=2)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
 
89
  if __name__ == "__main__":
90
  demo.launch()
 
4
  from huggingface_hub import login
5
  from transformers import AutoTokenizer, AutoModelForCausalLM
6
 
7
+ # ========================== Setup ==========================
8
  HF_TOKEN = os.getenv("HF_TOKEN")
9
  if not HF_TOKEN:
10
  raise RuntimeError("HF_TOKEN not found. In Spaces, add it under Settings → Repository secrets.")
11
 
12
  login(token=HF_TOKEN)
13
 
14
+ MODEL_ID = os.getenv("MODEL_ID", "google/gemma-3-270m-it")
15
  DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
16
 
17
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, token=HF_TOKEN)
18
+
19
+ # If pad is missing, map to eos
20
+ if tokenizer.pad_token_id is None and tokenizer.eos_token_id is not None:
21
+ tokenizer.pad_token = tokenizer.eos_token
22
+
23
  model = AutoModelForCausalLM.from_pretrained(
24
  MODEL_ID,
25
  token=HF_TOKEN,
26
+ torch_dtype=(torch.bfloat16 if torch.cuda.is_available() else torch.float32),
27
  ).to(DEVICE)
28
  model.eval()
29
 
30
+ # Use model's provided chat template if present; otherwise a minimal one.
31
  if tokenizer.chat_template is None:
32
+ tokenizer.chat_template = """{% for message in messages -%}
33
+ <start_of_turn>{{ message['role'] }}
34
+ {{ message['content'] }}<end_of_turn>
35
+ {% endfor -%}{% if add_generation_prompt %}<start_of_turn>assistant
36
+ {% endif %}"""
37
+
38
+ EOS_ID = tokenizer.eos_token_id
39
+ PAD_ID = tokenizer.pad_token_id if tokenizer.pad_token_id is not None else (EOS_ID or 0)
40
 
41
+ # Detect which assistant role the template expects.
42
+ # Many Gemma-3 templates use "assistant"; some forks use "model".
43
+ TEMPLATE_STR = tokenizer.chat_template or ""
44
+ ASSISTANT_ROLE = "assistant" if "assistant" in TEMPLATE_STR else "model"
45
 
46
+ # ================== Sustainability Logic ===================
47
+ EMISSIONS_FACTORS = {
48
+ "transportation": {"car": 2.3, "bus": 0.1, "train": 0.04, "plane": 0.25}, # kg CO2 per km
49
+ "food": {"meat": 6.0, "vegetarian": 1.5, "vegan": 1.0}, # kg CO2 per meal
50
+ }
51
 
52
+ def calculate_footprint(car_km, bus_km, train_km, air_km_week, meat_meals, vegetarian_meals, vegan_meals):
53
+ transport_emissions = (
54
+ car_km * EMISSIONS_FACTORS["transportation"]["car"] +
55
+ bus_km * EMISSIONS_FACTORS["transportation"]["bus"] +
56
+ train_km * EMISSIONS_FACTORS["transportation"]["train"] +
57
+ air_km_week * EMISSIONS_FACTORS["transportation"]["plane"]
58
+ )
59
+ food_emissions = (
60
+ meat_meals * EMISSIONS_FACTORS["food"]["meat"] +
61
+ vegetarian_meals * EMISSIONS_FACTORS["food"]["vegetarian"] +
62
+ vegan_meals * EMISSIONS_FACTORS["food"]["vegan"]
63
+ )
64
+ total_emissions = transport_emissions + food_emissions
65
+ stats = {
66
+ "trees": round(total_emissions / 21), # playful rough equivalents
67
+ "flights": round(total_emissions / 500),
68
+ "driving100km": round(total_emissions / 230),
69
+ }
70
+ return total_emissions, stats
71
+
72
+ GUIDANCE = (
73
+ "You are Sustainable.ai. Give practical, encouraging sustainability alternatives only.\n"
74
+ "Constraints:\n"
75
+ "1) Reply in 3 to 6 short bullet points.\n"
76
+ "2) Include a rough CO2 saving per bullet.\n"
77
+ "3) No moralizing.\n"
78
+ "4) Offer 1 easy switch, 1 medium switch, 1 stretch goal.\n"
79
+ )
80
+
81
+ GEN_KW = dict(
82
+ max_new_tokens=256,
83
+ do_sample=False, # deterministic for stability
84
+ temperature=0.0,
85
+ repetition_penalty=1.05,
86
+ eos_token_id=EOS_ID,
87
+ pad_token_id=PAD_ID,
88
  )
89
 
90
+ # ======================= Utilities ========================
91
+ def _to_float(x, default=0.0):
92
+ try:
93
+ return float(x)
94
+ except Exception:
95
+ return float(default)
96
+
97
+ def _add(conv, role, content):
98
+ """Append a role/content pair if content is non-empty."""
99
+ if not content:
100
+ return
101
+ # Map roles to the template's expected assistant role
102
+ if role == "assistant":
103
+ role = ASSISTANT_ROLE
104
+ elif role == "system":
105
+ # Gemma templates often do not support 'system'; treat as user context
106
+ role = "user"
107
+ elif role not in ("user", "assistant", "model"):
108
+ role = "user"
109
+ conv.append({"role": role, "content": str(content)})
110
+
111
+ def _normalize_from_history(history, conv):
112
+ """
113
+ history may be:
114
+ - list[tuple(user, assistant)]
115
+ - list[dict(role, content)]
116
+ """
117
+ if not isinstance(history, list):
118
+ return
119
+ for item in history:
120
+ if isinstance(item, tuple) and len(item) == 2:
121
+ u, a = item
122
+ if u:
123
+ _add(conv, "user", u)
124
+ if a:
125
+ _add(conv, "assistant", a)
126
+ elif isinstance(item, dict):
127
+ _add(conv, item.get("role", "user"), item.get("content", ""))
128
+
129
+ def _normalize_from_messages(messages, conv):
130
+ """
131
+ messages may be:
132
+ - list[dict(role, content)]
133
+ - list[str]
134
+ - str
135
+ - None
136
+ """
137
+ if messages is None:
138
+ return
139
+ if isinstance(messages, list):
140
+ # If dicts, use them; if strings, treat each as a user turn
141
+ for m in messages:
142
+ if isinstance(m, dict):
143
+ _add(conv, m.get("role", "user"), m.get("content", ""))
144
+ elif isinstance(m, str):
145
+ _add(conv, "user", m)
146
+ elif isinstance(messages, str):
147
+ _add(conv, "user", messages)
148
+
149
+ def _merge_consecutive_same_role(conv):
150
+ """Merge consecutive same-role messages to satisfy strict alternation."""
151
+ if not conv:
152
+ return conv
153
+ merged = [conv[0]]
154
+ for msg in conv[1:]:
155
+ if msg["role"] == merged[-1]["role"]:
156
+ merged[-1]["content"] = (merged[-1]["content"].rstrip() + "\n\n" + msg["content"].lstrip())
157
+ else:
158
+ merged.append(msg)
159
+ return merged
160
+
161
+ def _ensure_last_is_user(conv):
162
+ """
163
+ For add_generation_prompt=True, the template expects the last message to be a user turn.
164
+ If the last is assistant/model, append a light user nudge.
165
+ """
166
+ if not conv:
167
+ return [{"role": "user", "content": "Please respond."}]
168
+ last_role = conv[-1]["role"]
169
+ if last_role in ("assistant", "model"):
170
+ conv.append({"role": "user", "content": "Continue."})
171
+ return conv
172
+
173
+ # ===================== Chat Function ======================
174
+ # Be tolerant to Gradio shapes: (messages, history, ...) or (message, history, ...)
175
  @torch.inference_mode()
176
+ def chat(messages=None, history=None, car_km=0, bus_km=0, train_km=0, air_km_month=0, meat_meals=0, vegetarian_meals=0, vegan_meals=0, *args):
177
+ # Convert monthly air travel to weekly to keep units consistent
178
+ air_km_week = _to_float(air_km_month) / 4.3
 
 
 
 
 
 
 
 
 
179
 
180
+ footprint, stats = calculate_footprint(
181
+ _to_float(car_km), _to_float(bus_km), _to_float(train_km), air_km_week,
182
+ _to_float(meat_meals), _to_float(vegetarian_meals), _to_float(vegan_meals)
 
 
 
 
 
183
  )
184
 
185
+ context = (
186
+ f"User’s estimated weekly footprint: {footprint:.1f} kg CO2.\n"
187
+ f"Equivalents: about {stats['trees']} trees or {stats['flights']} short flights.\n"
188
+ "Help them lower this number."
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
189
  )
190
 
191
+ # Build conversation seed with guidance folded into the FIRST user turn.
192
+ conv = []
193
+
194
+ # Prefer Gradio messages if they are structured; otherwise use history.
195
+ # We'll assemble a provisional conv, then fold guidance in.
196
+ provisional = []
197
+ _normalize_from_history(history, provisional)
198
+ _normalize_from_messages(messages, provisional)
199
+
200
+ # If first message exists and is a user turn, prepend guidance+context to that same message.
201
+ guidance_block = GUIDANCE + "\n" + context
202
+ if provisional and provisional[0]["role"] == "user":
203
+ provisional[0]["content"] = guidance_block + "\n\n" + provisional[0]["content"]
204
+ else:
205
+ # Start with a user turn containing guidance and context
206
+ provisional.insert(0, {"role": "user", "content": guidance_block})
207
+
208
+ # Merge consecutive same-role messages to satisfy alternation
209
+ conv = _merge_consecutive_same_role(provisional)
210
+
211
+ # Ensure final message is a user turn for add_generation_prompt=True
212
+ conv = _ensure_last_is_user(conv)
213
+
214
+ # Apply chat template
215
+ prompt = tokenizer.apply_chat_template(conv, tokenize=False, add_generation_prompt=True)
216
+ inputs = tokenizer(prompt, return_tensors="pt")
217
+ inputs = {k: v.to(DEVICE) for k, v in inputs.items()}
218
+
219
+ # Generate
220
+ outputs = model.generate(**inputs, **GEN_KW)
221
+ new_tokens = outputs[0, inputs["input_ids"].shape[1]:]
222
+ text = tokenizer.decode(new_tokens, skip_special_tokens=True).strip()
223
+
224
+ # Light formatting nudge toward bullets
225
+ if not any(ch in text for ch in ("β€’", "-", "*")):
226
+ lines = [l.strip() for l in text.split("\n") if l.strip()]
227
+ if lines:
228
+ text = "\n".join(f"β€’ {l}" for l in lines[:6])
229
+
230
+ return text
231
+
232
+ # ========================== UI ============================
233
+ with gr.Blocks(css="""
234
+ body {
235
+ background: linear-gradient(135deg, #e0f7fa, #f1f8e9);
236
+ font-family: 'Inter', sans-serif;
237
+ }
238
+ .section-card {
239
+ background: white;
240
+ padding: 20px;
241
+ border-radius: 15px;
242
+ box-shadow: 0px 4px 12px rgba(0,0,0,0.1);
243
+ margin-bottom: 20px;
244
+ }
245
+ .title-text {
246
+ text-align: center;
247
+ font-size: 32px;
248
+ font-weight: bold;
249
+ color: #1b5e20;
250
+ margin-bottom: 5px;
251
+ }
252
+ .subtitle-text {
253
+ text-align: center;
254
+ font-size: 16px;
255
+ color: #444;
256
+ margin-bottom: 30px;
257
+ }
258
+ footer {
259
+ text-align: center;
260
+ font-size: 12px;
261
+ color: #666;
262
+ margin-top: 20px;
263
+ }
264
+ """) as demo:
265
+ with gr.Column():
266
+ gr.HTML("<div class='title-text'>🌍 Eco Wise AI</div>")
267
+ gr.HTML("<div class='subtitle-text'>Track your weekly habits and get personalized sustainability tips 🌱</div>")
268
+
269
+ with gr.Row():
270
+ with gr.Group(elem_classes="section-card"):
271
+ gr.Markdown("### πŸš— Transportation (per week)")
272
+ car_input = gr.Number(label="🚘 Car Travel (km)", value=0)
273
+ bus_input = gr.Number(label="🚌 Bus Travel (km)", value=0)
274
+ train_input = gr.Number(label="πŸš† Train Travel (km)", value=0)
275
+ air_input = gr.Number(label="✈️ Air Travel (km/month)", value=0)
276
+
277
+ with gr.Group(elem_classes="section-card"):
278
+ gr.Markdown("### 🍽️ Food Habits (per week)")
279
+ meat_input = gr.Number(label="πŸ₯© Meat Meals", value=0)
280
+ vegetarian_input = gr.Number(label="πŸ₯— Vegetarian Meals", value=0)
281
+ vegan_input = gr.Number(label="🌱 Vegan Meals", value=0)
282
+
283
+ with gr.Group(elem_classes="section-card"):
284
+ gr.Markdown("### πŸ’¬ Chat with Sustainable.ai")
285
+ chatbot = gr.ChatInterface(
286
+ fn=chat,
287
+ type="messages", # role/content dicts when available
288
+ additional_inputs=[
289
+ car_input, bus_input, train_input, air_input,
290
+ meat_input, vegetarian_input, vegan_input
291
+ ],
292
+ )
293
+
294
+ gr.HTML("<footer>⚑ Built with Gemma 3 270M IT & Gradio β€’ Eco Wise AI Β© 2025</footer>")
295
+
296
+ # Queue with concurrency control
297
+ demo = demo.queue(max_size=32, default_concurrency_limit=2)
298
 
299
  if __name__ == "__main__":
300
  demo.launch()
tests/test_app.py ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import sys, os
2
+ sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), "..")))
3
+
4
+ import app
5
+ import types
6
+ import app
7
+
8
+
9
+ def test_respond_function_exists():
10
+ """Check that the app has a respond() function."""
11
+ assert hasattr(app, "respond")
12
+ assert callable(app.respond)
13
+
14
+
15
+ def test_respond_returns_generator():
16
+ """respond() should return a generator when called with minimal args."""
17
+ # Fake OAuthToken object for testing (since we don't want to call real HF API in CI)
18
+ class DummyToken:
19
+ token = "dummy"
20
+
21
+ gen = app.respond(
22
+ message="I'm buying a bottle of water.",
23
+ history=[],
24
+ system_message="You are Sustainable.ai.",
25
+ max_tokens=10,
26
+ temperature=0.7,
27
+ top_p=0.9,
28
+ hf_token=DummyToken(),
29
+ )
30
+
31
+ # respond() is a generator, not a plain string
32
+ assert isinstance(gen, types.GeneratorType)