qyle commited on
Commit
622d220
·
verified ·
1 Parent(s): ae8bc47

initial gitlab files

Browse files
.dockerignore ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Ignore the tests folder
2
+ tests/
3
+
4
+ # Ignore development and version control files
5
+ .git
6
+ .gitignore
7
+ .dockerignore
8
+ .vscode
9
+ .idea
10
+
11
+ # Ignore Python specific files and directories
12
+ __pycache__
13
+ *.pyc
14
+ .venv
15
+ venv
16
+ *.log
17
+ .DS_Store
.gitignore ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ .DS_Store
2
+ __pycache__/
3
+ .venv/
4
+ venv/
Dockerfile ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.11-slim
2
+
3
+ WORKDIR /app
4
+
5
+ COPY requirements.txt .
6
+ RUN pip install --no-cache-dir -r requirements.txt
7
+
8
+ COPY . .
9
+
10
+ ENV PORT=8000
11
+ CMD uvicorn main:app --host 0.0.0.0 --port $PORT
README.md CHANGED
@@ -1,10 +1,53 @@
1
- ---
2
- title: Champ Chatbot Demo
3
- emoji: 📉
4
- colorFrom: yellow
5
- colorTo: gray
6
- sdk: docker
7
- pinned: false
8
- ---
9
-
10
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # MARVIN WebUI Demo
2
+
3
+ A lightweight chat interface powered by the MARVIN model, designed for easy deployment and testing. This project can run locally with Docker Compose or be deployed to platforms like Hugging Face Spaces.
4
+
5
+ ## Features
6
+
7
+ - Simple and fast chat interface
8
+ - Python backend with async endpoints
9
+ - Frontend served through a minimal web app
10
+ - Containerized so can start everything with a single command
11
+
12
+ ## Requirements
13
+
14
+ - Docker
15
+ - Docker Compose
16
+
17
+ ## Local Development
18
+
19
+ ### Start the project
20
+
21
+ From the project root:
22
+
23
+ ```
24
+ docker compose up --build
25
+ ```
26
+
27
+ This starts:
28
+
29
+ 1. Backend service
30
+ 2. Frontend service
31
+ 3. Database service
32
+
33
+ Once everything is ready, open:
34
+
35
+ ```
36
+ http://localhost:8000
37
+ ```
38
+
39
+ ### Stopping the project
40
+
41
+ Use:
42
+
43
+ ```
44
+ docker compose down
45
+ ```
46
+
47
+ ### Rebuilding after code changes
48
+
49
+ Use:
50
+
51
+ ```
52
+ docker compose up --build
53
+ ```
conftest.py ADDED
File without changes
docker-compose.yml ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ services:
2
+ api:
3
+ build: .
4
+ container_name: chat_api
5
+ ports:
6
+ - '8000:8000'
7
+ env_file:
8
+ - .env
9
+ # depends_on:
10
+ # - dynamodb-local
11
+ volumes:
12
+ - ./:/app
13
+ command: uvicorn main:app --host 0.0.0.0 --port 8000 --reload
14
+ # dynamodb-local:
15
+ # image: amazon/dynamodb-local
16
+ # ports:
17
+ # - '9000:8000'
18
+ # command: '-jar DynamoDBLocal.jar -inMemory -sharedDb'
19
+ # volumes:
20
+ # - dynamodb_data:/data
21
+
22
+ # volumes:
23
+ # dynamodb_data:
dynamodb_helper.py ADDED
@@ -0,0 +1,139 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import time
3
+ import boto3
4
+ from boto3.dynamodb.types import TypeDeserializer, TypeSerializer
5
+ from botocore.exceptions import ClientError
6
+ from datetime import datetime, timezone
7
+ from uuid import uuid4
8
+ from decimal import Decimal
9
+
10
# Connection settings, all overridable via environment variables.
AWS_REGION = os.getenv("AWS_REGION", "us-east-1")
AWS_ACCESS_KEY = os.getenv("AWS_ACCESS_KEY", None)
AWS_SECRET_ACCESS_KEY = os.getenv("AWS_SECRET_ACCESS_KEY", None)
# Endpoint override; only used when USE_LOCAL_DDB is enabled below.
DYNAMODB_ENDPOINT = os.getenv("DYNAMODB_ENDPOINT", None)
DDB_TABLE = os.getenv("DDB_TABLE", "chatbot-conversations")
# When "true", connect to a local DynamoDB endpoint instead of AWS.
USE_LOCAL_DDB = os.getenv("USE_LOCAL_DDB", "false").lower() == "true"
16
+
17
def get_dynamodb_client():
    """Build and return a boto3 DynamoDB service resource.

    When USE_LOCAL_DDB is set, connects to the configured local endpoint
    with dummy credentials (DynamoDB Local does not validate them);
    otherwise connects to production AWS with the configured keys.
    """
    if USE_LOCAL_DDB:
        # Local testing with DynamoDB Local: boto3 still requires *some*
        # credentials, so placeholders are supplied.
        connection_kwargs = {
            "endpoint_url": DYNAMODB_ENDPOINT,
            "region_name": AWS_REGION,
            "aws_access_key_id": "fake",
            "aws_secret_access_key": "fake",
        }
    else:
        # Production AWS DynamoDB.
        connection_kwargs = {
            "region_name": AWS_REGION,
            "aws_access_key_id": AWS_ACCESS_KEY,
            "aws_secret_access_key": AWS_SECRET_ACCESS_KEY,
        }
    return boto3.resource("dynamodb", **connection_kwargs)
32
+
33
# Module-level singletons shared by all callers; `table` is populated by
# create_table_if_not_exists() further down in this module.
dynamodb = get_dynamodb_client()
table = None
35
+
36
def create_table_if_not_exists(dynamodb):
    """Return the conversations table, creating it on first use.

    :param dynamodb: boto3 DynamoDB service resource.
    :return: the Table resource, or None when listing/creation fails
             (callers treat None as "logging disabled").
    """
    global table
    client = dynamodb.meta.client

    try:
        existing_tables = client.list_tables()["TableNames"]
    except Exception as e:
        # Best effort: without ListTables access we disable logging
        # instead of crashing the app at import time.
        print("Cannot list tables:", e)
        return None

    if DDB_TABLE in existing_tables:
        print(f"Table {DDB_TABLE} already exists.")
        table = dynamodb.Table(DDB_TABLE)
        return table

    print(f"Creating DynamoDB table {DDB_TABLE}...")

    try:
        table = dynamodb.create_table(
            TableName=DDB_TABLE,
            KeySchema=[
                {"AttributeName": "PK", "KeyType": "HASH"},
                {"AttributeName": "SK", "KeyType": "RANGE"}
            ],
            AttributeDefinitions=[
                {"AttributeName": "PK", "AttributeType": "S"},
                {"AttributeName": "SK", "AttributeType": "S"},
                {"AttributeName": "GSI1_PK", "AttributeType": "S"},
                {"AttributeName": "GSI1_SK", "AttributeType": "S"}
            ],
            GlobalSecondaryIndexes=[
                {
                    "IndexName": "GSI1",
                    "KeySchema": [
                        {"AttributeName": "GSI1_PK", "KeyType": "HASH"},
                        {"AttributeName": "GSI1_SK", "KeyType": "RANGE"}
                    ],
                    "Projection": {"ProjectionType": "ALL"},
                    # BUGFIX: no ProvisionedThroughput on the GSI —
                    # specifying it together with
                    # BillingMode=PAY_PER_REQUEST is rejected by AWS
                    # with a ValidationException.
                }
            ],
            BillingMode='PAY_PER_REQUEST'
        )

        # create_table is asynchronous on the AWS side; block until ready.
        table.wait_until_exists()
        print(f"Table {DDB_TABLE} created.")
        return table

    except ClientError as e:
        print("Error creating table:", e.response["Error"]["Message"])
        return None
94
+
95
+
96
def iso_ts():
    """Return the current UTC time as a timezone-aware ISO 8601 string."""
    now_utc = datetime.now(timezone.utc)
    return now_utc.isoformat()
99
+
100
# Eagerly ensure the table exists at import time; leaves `table` as None
# (logging disabled) if DynamoDB is unreachable.
table = create_table_if_not_exists(dynamodb)
101
+
102
def convert_floats(obj):
    """Recursively replace floats with Decimal.

    DynamoDB rejects Python floats; boto3 requires Decimal for numeric
    attributes. Dicts and lists are rebuilt with converted values; every
    other type passes through unchanged.
    """
    if isinstance(obj, dict):
        return {key: convert_floats(value) for key, value in obj.items()}
    if isinstance(obj, list):
        return [convert_floats(item) for item in obj]
    if isinstance(obj, float):
        # str() round-trip keeps the human-readable value exactly.
        return Decimal(str(obj))
    return obj
111
+
112
def log_event(user_id, session_id, data):
    """Write one conversation event to the DynamoDB table.

    Silently skips (with a console note) when the table was never
    initialized, and swallows DynamoDB client errors so logging can
    never break a chat request.

    :param user_id: ID of the user
    :param session_id: ID of the session
    :param data: dictionary of conversation data to persist
    """
    global table
    if table is None:
        print("Table not initialized. Skipping log.")
        return

    event_ts = iso_ts()
    # uuid suffix keeps sort keys unique even for same-timestamp events.
    record = {
        "PK": f"SESSION#{session_id}",
        "SK": f"TS#{event_ts}#{uuid4().hex}",
        'user_id': user_id,
        "GSI1_PK": f"USER#{user_id}",
        "GSI1_SK": f"TS#{event_ts}",
        'session_id': session_id,
        'timestamp': event_ts,
        'data': convert_floats(data)
    }
    print(f"Logging conversation: {record}")
    try:
        table.put_item(Item=record)
    except ClientError as e:
        print(f"Error logging conversation: {e.response['Error']['Message']}")
main.py ADDED
@@ -0,0 +1,318 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import pickle
3
+ import faiss
4
+ import asyncio
5
+ from contextlib import asynccontextmanager
6
+
7
+ from pathlib import Path
8
+
9
+ from typing import List, Literal, Optional
10
+ from datetime import datetime, timezone
11
+
12
+ from dotenv import load_dotenv
13
+ load_dotenv()
14
+ from fastapi import FastAPI, Request
15
+ from fastapi.responses import HTMLResponse, JSONResponse
16
+ from fastapi.staticfiles import StaticFiles
17
+ from fastapi.templating import Jinja2Templates
18
+
19
+ from pydantic import BaseModel
20
+ from dynamodb_helper import log_event
21
+ from fastapi import BackgroundTasks
22
+
23
+ from huggingface_hub import InferenceClient
24
+
25
+ from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint, HuggingFaceEmbeddings
26
+ from langchain.agents import create_agent
27
+ from langchain.agents.middleware import dynamic_prompt, ModelRequest
28
+ from langchain_community.docstore.in_memory import InMemoryDocstore
29
+ from langchain_community.vectorstores import FAISS
30
+ from langchain_core.messages import HumanMessage, AIMessage, SystemMessage
31
+
32
# -------------------- Config --------------------
BASE_DIR = Path(__file__).resolve().parent

# UI model keys -> Hugging Face model ids ("champ" is handled by the
# local RAG agent instead of the inference API).
MODEL_MAP = {
    "champ": "champ-model/placeholder",
    "openai": "openai/gpt-oss-20b",
    "google": "google/gemma-2-2b-it"
}

# Either env var name is accepted for the Hugging Face API token.
HF_TOKEN = os.getenv("HF_TOKEN") or os.getenv("HF_API_TOKEN")
if HF_TOKEN is None:
    raise RuntimeError(
        "HF_TOKEN or HF_API_TOKEN is not set. "
        "Go to Space → Settings → Variables & secrets and add one."
    )

# Shared client for the hosted inference API (non-champ models).
hf_client = InferenceClient(token=HF_TOKEN)

# Max history messages to keep for context
MAX_HISTORY = 20
52
+
53
+ # -------------------- Prompts --------------------
54
+ DEFAULT_SYSTEM_PROMPT = (
55
+ "Answer clearly and concisely. You are a helpful assistant. If you do not know the answer, just say you don't know. "
56
+ )
57
+
58
+ CHAMP_SYSTEM_PROMPT = (
59
+ """
60
+ # CONTEXT #
61
+ You are *CHAMP*, a knowledgeable and compassionate pediatrician chatting online with adolescent patients, their families, or their caregivers. Children and adolescents commonly experience infectious illnesses (for example: fever, cough, vomiting, diarrhea). Timely access to credible information can support safe self-management at home and may reduce unnecessary non-emergency ED visits, helping to lower overcrowding and improve the care experience at home.
62
+
63
+ #########
64
+
65
+ # OBJECTIVE #
66
+ Your task is to answer questions about common pediatric infectious diseases asked by the adolescent patient, their family, or their caregiver. Base your answers only on the background material provided. If the relevant information is not clearly present in that material, reply with: "I don't know." Do not invent or guess information.
67
+
68
+ #########
69
+
70
+ # STYLE #
71
+ Provide concise, accurate, and actionable information to help them manage these conditions at home when it is safe to do so. Focus on clear next steps and practical advice that help them make informed decisions. Do not exceed four sentences per response.
72
+
73
+ #########
74
+
75
+ # TONE #
76
+ Maintain a positive, empathetic, and supportive tone throughout, to reduce the questioners worry and help them feel heard. Your responses should feel warm and reassuring, while still reflecting professionalism and seriousness.
77
+
78
+ # AUDIENCE #
79
+ Your audience is adolescent patients, their families, or their caregivers. They are seeking practical advice and concrete actions they can take for disease self-management. Write at approximately a sixth-grade reading level, avoiding medical jargon or explaining it briefly when needed.
80
+
81
+ #########
82
+
83
+ # RESPONSE FORMAT #
84
+ Respond in three to four sentences, as if chatting in a Facebook Messenger conversation. Do not include references, citations, or mention specific document locations in your answer.
85
+
86
+ #############
87
+
88
+ # START ANALYSIS #
89
+
90
+ Here is the user question: {last_query}
91
+
92
+ Here are the materials you must rely on for your answers: {context}
93
+
94
+ Now, step by step, you can start answering the user’s question.
95
+ """
96
+
97
+ )
98
+ ###TODO: And here is the conversation history so far : {history}
99
+
100
class ChatMessage(BaseModel):
    """One chat turn exchanged between the browser UI and the backend."""

    # Sender of the message; mirrors the OpenAI-style chat roles.
    role: Literal["user", "assistant", "system"]
    # Raw message text (rendered as markdown on the client).
    content: str
103
+
104
+
105
class ChatRequest(BaseModel):
    """Payload POSTed to /chat by the frontend (see static/app.js)."""

    user_id: str  # per-browser id generated client-side
    session_id: str  # regenerated when the conversation is cleared
    messages: List[ChatMessage]  # visible chat history
    temperature: float = 0.7  # sampling temperature forwarded to the model
    model_type: str  # key into MODEL_MAP ("champ", "openai", "google")
    # max_new_tokens: int = 256
    consent: bool = False  # whether the user accepted the consent overlay
    system_prompt: Optional[str] = None  # accepted but not read by this backend
114
+
115
+
116
+ # -------------------- Helpers --------------------
117
def convert_messages(messages: List[ChatMessage]):
    """Convert our internal message format into OpenAI-style messages.

    Prepends the default system prompt, then maps every message to a
    plain {"role": ..., "content": ...} dict.
    """
    converted = [{"role": "system", "content": DEFAULT_SYSTEM_PROMPT}]
    converted.extend({"role": msg.role, "content": msg.content} for msg in messages)
    return converted
127
+
128
+
129
def convert_messages_langchain(messages: List[ChatMessage]):
    """Convert our internal message format into LangChain message objects.

    A leading SystemMessage carries the CHAMP prompt template; only the
    last MAX_HISTORY turns of the history are kept after it.
    """
    role_to_message_cls = {
        "user": HumanMessage,
        "assistant": AIMessage,
        "system": SystemMessage,
    }
    converted = [SystemMessage(content=CHAMP_SYSTEM_PROMPT)]
    for msg in messages[-MAX_HISTORY:]:
        message_cls = role_to_message_cls.get(msg.role)
        if message_cls is not None:
            converted.append(message_cls(content=msg.content))
    return converted
144
+
145
+
146
def call_llm(req: ChatRequest) -> str:
    """Dispatch a chat request to the selected model and return its reply.

    "champ" requests go through the local RAG agent; any other model type
    is forwarded to the Hugging Face Inference API.

    :param req: validated chat request from the /chat endpoint.
    :raises RuntimeError: wraps any error raised by the inference call.
    """
    if req.model_type == "champ":
        return call_champ(req)

    # Unknown model types silently fall back to the champ placeholder id.
    MODEL_ID = MODEL_MAP.get(req.model_type, MODEL_MAP["champ"])
    msgs = convert_messages(req.messages)

    try:
        # Call HuggingFace inference API
        resp = hf_client.chat.completions.create(
            model=MODEL_ID,
            messages=msgs,
            # max_tokens=256,
            temperature=req.temperature,
        )
        # Extract chat reply
        # NOTE(review): relies on dict-style access to the message; newer
        # huggingface_hub releases return attribute-style objects
        # (resp.choices[0].message.content) — confirm against the pinned
        # version, since requirements.txt does not pin one.
        return resp.choices[0].message["content"].strip()
    except Exception as e:
        raise RuntimeError(f"Inference API error: {e}")
165
+
166
+
167
def call_champ(req: ChatRequest) -> str:
    """Answer a request via the CHAMP retrieval-augmented agent.

    Uses the module-global agent_retrievalbased built during startup
    (lifespan); a call before startup completes fails because that
    global is still None, and surfaces as the wrapped RuntimeError.

    :raises RuntimeError: wraps any error raised while invoking the agent.
    """
    msgs = convert_messages_langchain(req.messages)
    # config = {"configurable": {"thread_id": req.user_id}}
    try:
        result = agent_retrievalbased.invoke(
            {"messages": msgs},
            # config=config,
        )
        # NOTE(review): assumes .text is a property on the final LangChain
        # message — some langchain-core versions expose .text() as a method
        # or only .content; confirm against the installed version.
        return result["messages"][-1].text.strip()
    except Exception as e:
        raise RuntimeError(f"CHAMP model error: {e}")
178
+
179
+
180
+ # def log_event(user_id: str, session_id: str, data: dict):
181
+ # record = {
182
+ # "user_id": user_id,
183
+ # "session_id": session_id,
184
+ # "data": data,
185
+ # "timestamp": datetime.now(timezone.utc)
186
+ # }
187
+ # conversations_collection.insert_one(record)
188
+
189
+
190
+ # -------------------- CHAMP setup --------------------
191
+ # RAG setup
192
+
193
def build_vector_store():
    """Load pre-chunked documents and index them into an in-memory FAISS store.

    Reads rag_data/netg_baaibge_chunks_v1.pkl (pickled LangChain
    documents), embeds them with BAAI/bge-large-en-v1.5 on CPU, and
    returns the populated store. Slow: downloads the embedding model and
    embeds every chunk, which is why startup runs it in an executor.
    """
    rag_path = BASE_DIR / "rag_data" / "netg_baaibge_chunks_v1.pkl"
    # NOTE(review): pickle.load executes arbitrary code from the file —
    # acceptable only because this file ships with the repo; never point
    # it at untrusted data.
    with open(rag_path, 'rb') as f:
        loaded_documents = pickle.load(f)
    print("Chunks loaded successfully.")

    device = "cpu"  # to be updated if a GPU becomes available

    model_embedding_name = "BAAI/bge-large-en-v1.5"
    # NOTE(review): "use_auth_token" is a deprecated Hugging Face kwarg
    # (renamed "token") — confirm the pinned sentence-transformers
    # version still accepts it.
    model_embedding_kwargs = {'device': device, "use_auth_token": HF_TOKEN}
    encode_kwargs = {'normalize_embeddings': True}

    embeddings = HuggingFaceEmbeddings(
        model_name=model_embedding_name,
        model_kwargs=model_embedding_kwargs,
        encode_kwargs=encode_kwargs,
    )

    # Probe the model once so the FAISS index is sized correctly.
    embedding_dim = len(embeddings.embed_query("hello world"))
    index = faiss.IndexFlatL2(embedding_dim)

    vector_store = FAISS(
        embedding_function=embeddings,
        index=index,
        docstore=InMemoryDocstore(),
        index_to_docstore_id={},
    )
    vector_store.add_documents(documents=loaded_documents)
    return vector_store
222
+
223
def make_prompt_with_context(vector_store: FAISS):
    """Build a dynamic-prompt middleware closing over *vector_store*.

    The returned middleware retrieves the 3 most similar chunks for the
    latest message and formats them into the CHAMP system prompt.

    :param vector_store: populated FAISS store to query.
    :return: a @dynamic_prompt-wrapped callable for create_agent middleware.
    """
    @dynamic_prompt
    def prompt_with_context(request: ModelRequest) -> str:
        # The newest message in the conversation drives retrieval.
        last_query = request.state["messages"][-1].text
        retrieved_docs = vector_store.similarity_search(last_query, k = 3)

        # Concatenate chunk texts; empty string when nothing was retrieved.
        docs_content = "\n\n".join(doc.page_content for doc in retrieved_docs) if retrieved_docs else ""

        system_message = CHAMP_SYSTEM_PROMPT.format(
            last_query = last_query,
            context = docs_content
        )

        return system_message

    return prompt_with_context
239
+
240
def build_champ_agent(vector_store: FAISS):
    """Create the CHAMP agent: HF endpoint model + retrieval prompt middleware.

    :param vector_store: populated FAISS store used for context retrieval.
    :return: a LangChain agent ready for .invoke({"messages": [...]}).
    """
    hf_llm_champ = HuggingFaceEndpoint(
        repo_id = "openai/gpt-oss-20b",
        task = "text-generation",
        max_new_tokens = 1024,
        # temperature = 0.7,
    )

    model_chat = ChatHuggingFace(llm=hf_llm_champ)
    # Middleware injects retrieved context into the system prompt per turn.
    prompt_middleware = make_prompt_with_context(vector_store)
    agent = create_agent(model_chat, tools=[], middleware=[prompt_middleware]) #checkpointer = InMemorySaver()

    return agent
253
+ # -------------------- FastAPI setup --------------------
254
# Populated during application startup (see lifespan below).
vector_store: Optional[FAISS] = None
agent_retrievalbased = None  # the RAG agent used by call_champ
256
+
257
+
258
@asynccontextmanager
async def lifespan(app: FastAPI):
    """FastAPI startup/shutdown hook.

    Builds the FAISS store (slow and synchronous) in a worker thread so
    the event loop stays responsive during startup, then wires up the
    CHAMP agent. Requests arriving before this completes will find
    agent_retrievalbased still None.
    """
    global vector_store, agent_retrievalbased

    # get_running_loop() is the supported call inside a coroutine;
    # get_event_loop() is deprecated here since Python 3.10.
    loop = asyncio.get_running_loop()
    # Run the synchronous build_vector_store in the default executor thread.
    vector_store = await loop.run_in_executor(
        None, build_vector_store
    )
    agent_retrievalbased = build_champ_agent(vector_store)

    print("CHAMP RAG + agent initialized.")
    yield
271
+
272
app = FastAPI(lifespan=lifespan)

# Static assets (JS/CSS) and Jinja templates for the chat UI.
app.mount("/static", StaticFiles(directory="static"), name="static")
templates = Jinja2Templates(directory="templates")
276
+
277
+ # -------------------- Routes --------------------
278
+
279
@app.get("/", response_class=HTMLResponse)
async def home(request: Request):
    """Serve the single-page chat UI (templates/index.html)."""
    return templates.TemplateResponse("index.html", {"request": request})
282
+
283
+
284
@app.post("/chat")
async def chat_endpoint(payload: ChatRequest, background_tasks: BackgroundTasks):
    """Handle one chat turn: run the model, schedule logging, return the reply.

    Model errors are logged with the failing request's context and
    returned as a 500 JSON body instead of propagating. Logging runs as
    a background task so DynamoDB latency never delays the response.

    :param payload: validated chat request from the frontend.
    :param background_tasks: FastAPI task queue used for async logging.
    """
    print(f"Received chat request: {payload}")
    if not payload.messages:
        return JSONResponse({"error": "No messages provided"}, status_code=400)

    # Context shared by both the success and the failure log entries.
    # (messages is guaranteed non-empty by the guard above, so the old
    # `if payload.messages else {}` fallback was dead code.)
    # NOTE(review): .dict() is the Pydantic v1 API, deprecated in v2 in
    # favor of .model_dump() — requirements.txt does not pin a version.
    log_data = {
        "model_type": payload.model_type,
        "consent": payload.consent,
        "temperature": payload.temperature,
        "messages": payload.messages[-1].dict(),
    }

    try:
        reply = call_llm(payload)
    except Exception as e:
        background_tasks.add_task(
            log_event,
            user_id=payload.user_id,
            session_id=payload.session_id,
            data={"error": str(e), **log_data},
        )
        return JSONResponse({"error": str(e)}, status_code=500)

    background_tasks.add_task(
        log_event,
        user_id=payload.user_id,
        session_id=payload.session_id,
        data={**log_data, "reply": reply},
    )
    return {"reply": reply}
rag_data/netg_baaibge_chunks_v1.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fffd4dbb98d49ee9dc97d1c530c3c3278a624bf19a79854fde0b03af9977c71
3
+ size 205801
requirements.txt ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ fastapi
2
+ uvicorn[standard]
3
+
4
+ jinja2
5
+ python-multipart
6
+
7
+ requests
8
+
9
+ python-dotenv
10
+
11
+ huggingface_hub
12
+ sentence-transformers
13
+
14
+ pydantic
15
+ pymongo
16
+
17
+ faiss-cpu
18
+
19
+ langchain
20
+ langchain-core
21
+ langchain-community
22
+ langchain-huggingface
23
+
24
+ boto3
25
+ botocore
static/app.js ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
// DOM handles for the chat UI.
const chatWindow = document.getElementById('chatWindow');
const userInput = document.getElementById('userInput');
const sendBtn = document.getElementById('sendBtn');
const statusEl = document.getElementById('status');

// Controls bar widgets.
const systemPresetSelect = document.getElementById('systemPreset');
const tempSlider = document.getElementById('tempSlider');
const tempValue = document.getElementById('tempValue');
// const maxTokensSlider = document.getElementById("maxTokensSlider");
// const maxTokensValue = document.getElementById("maxTokensValue");
const clearBtn = document.getElementById('clearBtn');

// Consent overlay elements.
const consentOverlay = document.getElementById('consentOverlay');
const consentCheckbox = document.getElementById('consentCheckbox');
const consentBtn = document.getElementById('consentBtn');

// Local in-browser chat history
let messages = [];
let consentGranted = false;
let sessionId = 'session-' + crypto.randomUUID(); // Unique session ID, generated once per page load
// Block scrolling until the consent overlay is dismissed.
document.body.classList.add('no-scroll');
22
+
23
// Re-render the full conversation into the chat window. Each message
// becomes a styled bubble; markdown is parsed with marked and sanitized
// with DOMPurify before being injected as HTML.
function renderMessages() {
  chatWindow.innerHTML = '';
  messages.forEach((m) => {
    const bubble = document.createElement('div');
    bubble.classList.add(
      'msg-bubble',
      m.role === 'user' ? 'user' : 'assistant'
    );
    // convert markdown to HTML safely
    bubble.innerHTML = DOMPurify.sanitize(marked.parse(m.content));
    chatWindow.appendChild(bubble);
  });
  // Keep the newest message scrolled into view.
  chatWindow.scrollTop = chatWindow.scrollHeight;
}
37
+
38
// Sync the numeric readout next to the temperature slider.
function updateSlidersUI() {
  tempValue.textContent = tempSlider.value;
  // maxTokensValue.textContent = maxTokensSlider.value;
}
42
+
43
// Return a stable per-browser id, creating and persisting a fresh one
// in localStorage on first use.
function getMachineId() {
  const existing = localStorage.getItem('MachineId');
  if (existing) {
    return existing;
  }
  const fresh = 'dev-' + crypto.randomUUID();
  localStorage.setItem('MachineId', fresh);
  return fresh;
}
53
+
54
+ // ----- Chat -----
55
+
56
// Send the current input to the backend and append the model's reply.
// Updates the status line through the request lifecycle and renders
// both the outgoing and incoming messages.
async function sendMessage() {
  const text = userInput.value.trim();
  if (!text) return;

  // Add user message locally
  messages.push({ role: 'user', content: text });
  renderMessages();
  userInput.value = '';

  statusEl.textContent = 'Thinking...';
  statusEl.className = 'status status-info';

  const temperature = parseFloat(tempSlider.value);
  // const maxTokens = parseInt(maxTokensSlider.value, 10);
  // const systemPrompt = systemPresetSelect.value;
  const modelType = systemPresetSelect.value;

  // Shape mirrors the backend's ChatRequest model.
  const payload = {
    user_id: getMachineId(),
    session_id: sessionId,
    messages: messages.map((m) => ({ role: m.role, content: m.content })),
    temperature,
    // max_new_tokens: maxTokens,
    model_type: modelType,
    consent: consentGranted,
  };

  try {
    const res = await fetch('/chat', {
      method: 'POST',
      headers: { 'Content-Type': 'application/json' },
      body: JSON.stringify(payload),
    });

    const data = await res.json();

    if (!res.ok) {
      // Backend returned a JSON error body (400/500).
      statusEl.textContent = data.error || 'Error from server.';
      statusEl.className = 'status status-error';
      return;
    }

    const reply = data.reply || '(No reply)';
    messages.push({ role: 'assistant', content: reply });
    renderMessages();

    statusEl.textContent = 'Ready';
    statusEl.className = 'status status-ok';
  } catch (err) {
    // fetch itself failed (offline, CORS, server down).
    console.error(err);
    statusEl.textContent = 'Network error.';
    statusEl.className = 'status status-error';
  }
}
110
+
111
// Start a fresh logical session (new id used for backend logging).
function resetSession() {
  sessionId = 'session-' + crypto.randomUUID();
}
114
+
115
// Wipe the visible history, start a new session, and reset the status line.
function clearConversation() {
  resetSession();
  messages = [];
  renderMessages();
  statusEl.textContent = 'Conversation cleared. Start a new chat!';
  statusEl.className = 'status status-ok';
}
122
+
123
// ----- Event wiring -----

// Consent logic

// When the checkbox is toggled, enable or disable the button
consentCheckbox.addEventListener('change', () => {
  consentBtn.disabled = !consentCheckbox.checked;
});

// Handle the consent acceptance
consentBtn.addEventListener('click', () => {
  consentOverlay.style.display = 'none'; // Hide overlay
  document.body.classList.remove('no-scroll'); // NEW: re-enable scrolling
  consentGranted = true; // Mark consent as granted
});

sendBtn.addEventListener('click', sendMessage);

// Enter to send, Shift+Enter = newline
userInput.addEventListener('keydown', (e) => {
  if (e.key === 'Enter' && !e.shiftKey) {
    e.preventDefault();
    sendMessage();
  }
});

tempSlider.addEventListener('input', updateSlidersUI);
// maxTokensSlider.addEventListener("input", updateSlidersUI);
clearBtn.addEventListener('click', clearConversation);

// Switching models clears history so contexts never mix across models.
systemPresetSelect.addEventListener('change', () => {
  clearConversation();
  statusEl.textContent = 'Model changed. History cleared.';
  statusEl.className = 'status status-ok';
});

// initial UI state
updateSlidersUI();
statusEl.textContent = 'Ready';
statusEl.className = 'status status-ok';
static/style.css ADDED
@@ -0,0 +1,227 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ /* Dark theme page background */
2
+ body {
3
+ margin: 0;
4
+ font-family: system-ui, -apple-system, BlinkMacSystemFont, 'Segoe UI',
5
+ sans-serif;
6
+ background: #0b1020;
7
+ color: #f5f5f5;
8
+ }
9
+
10
+ /* NEW: prevent scrolling while consent overlay is active */
11
+ body.no-scroll {
12
+ overflow: hidden;
13
+ }
14
+
15
+ .chat-container {
16
+ max-width: 900px;
17
+ margin: 40px auto;
18
+ background: #141b2f;
19
+ border-radius: 16px;
20
+ box-shadow: 0 10px 30px rgba(0, 0, 0, 0.45);
21
+ display: flex;
22
+ flex-direction: column;
23
+ height: 80vh;
24
+ padding: 16px;
25
+ }
26
+
27
+ .chat-header {
28
+ padding: 8px 4px 12px;
29
+ border-bottom: 1px solid #2c3554;
30
+ }
31
+
32
+ .chat-header h1 {
33
+ margin: 0;
34
+ font-size: 1.8rem;
35
+ }
36
+
37
+ .chat-header .subtitle {
38
+ margin: 4px 0 0;
39
+ color: #c0c6e0;
40
+ font-size: 0.95rem;
41
+ }
42
+
43
+ /* Controls bar */
44
+ .controls-bar {
45
+ display: flex;
46
+ flex-wrap: wrap;
47
+ gap: 12px;
48
+ margin-top: 10px;
49
+ padding: 8px 4px;
50
+ border-bottom: 1px solid #2c3554;
51
+ }
52
+
53
+ .control-group {
54
+ display: flex;
55
+ flex-direction: column;
56
+ gap: 4px;
57
+ font-size: 0.85rem;
58
+ color: #d3dbff;
59
+ }
60
+
61
+ .control-group select,
62
+ .control-group input[type='range'] {
63
+ background: #0d1324;
64
+ border-radius: 8px;
65
+ border: 1px solid #2c3554;
66
+ color: #f5f5f5;
67
+ padding: 4px 8px;
68
+ font-size: 0.85rem;
69
+ }
70
+
71
+ .secondary-button {
72
+ align-self: flex-end;
73
+ padding: 6px 12px;
74
+ border-radius: 8px;
75
+ border: 1px solid #2c3554;
76
+ background: #1f2840;
77
+ color: #f5f5f5;
78
+ font-size: 0.85rem;
79
+ cursor: pointer;
80
+ }
81
+
82
+ .secondary-button:hover {
83
+ background: #273256;
84
+ }
85
+
86
+ /* Chat window */
87
+ .chat-window {
88
+ flex: 1;
89
+ margin-top: 10px;
90
+ padding: 10px;
91
+ overflow-y: auto;
92
+ background: #0d1324;
93
+ border-radius: 12px;
94
+ }
95
+
96
+ /* Message bubbles */
97
+ .msg-bubble {
98
+ max-width: 75%;
99
+ padding: 8px 12px;
100
+ margin-bottom: 8px;
101
+ border-radius: 12px;
102
+ font-size: 0.95rem;
103
+ line-height: 1.4;
104
+ }
105
+
106
+ .msg-bubble.user {
107
+ margin-left: auto;
108
+ background: #4c6fff;
109
+ color: #ffffff;
110
+ border-bottom-right-radius: 4px;
111
+ }
112
+
113
+ .msg-bubble.assistant {
114
+ margin-right: auto;
115
+ background: #1f2840;
116
+ color: #f5f5f5;
117
+ border-bottom-left-radius: 4px;
118
+ }
119
+
120
+ /* Input area */
121
+ .chat-input-area {
122
+ display: flex;
123
+ gap: 8px;
124
+ margin-top: 12px;
125
+ border-top: 1px solid #2c3554;
126
+ padding-top: 8px;
127
+ }
128
+
129
+ .chat-input-area textarea {
130
+ flex: 1;
131
+ border-radius: 10px;
132
+ border: 1px solid #2c3554;
133
+ background: #0d1324;
134
+ color: #f5f5f5;
135
+ padding: 8px;
136
+ resize: none;
137
+ font-size: 0.95rem;
138
+ }
139
+
140
+ .chat-input-area button {
141
+ padding: 8px 18px;
142
+ border-radius: 10px;
143
+ border: none;
144
+ background: #4c6fff;
145
+ color: white;
146
+ font-weight: 600;
147
+ cursor: pointer;
148
+ }
149
+
150
+ .chat-input-area button:hover {
151
+ background: #3453e6;
152
+ }
153
+
154
+ /* Status text */
155
+ .status {
156
+ margin-top: 6px;
157
+ font-size: 0.85rem;
158
+ }
159
+
160
+ .status-info {
161
+ color: #ffce56;
162
+ }
163
+
164
+ .status-ok {
165
+ color: #8be48b;
166
+ }
167
+
168
+ .status-error {
169
+ color: #ff8080;
170
+ }
171
+
172
+ /* RESPONSIVE DESIGN */
173
+ @media (max-width: 768px) {
174
+ .chat-container {
175
+ margin: 0;
176
+ border-radius: 0;
177
+ height: 100vh;
178
+ }
179
+
180
+ .msg-bubble {
181
+ max-width: 90%;
182
+ }
183
+
184
+ .controls-bar {
185
+ flex-direction: column;
186
+ align-items: flex-start;
187
+ }
188
+
189
+ .secondary-button {
190
+ align-self: flex-start;
191
+ }
192
+ }
193
+
194
+ /* CONSENT OVERLAY FIXED VERSION */
195
+ .consent-overlay {
196
+ position: fixed;
197
+ top: 0;
198
+ left: 0;
199
+ width: 100%;
200
+ height: 100%;
201
+
202
+ background: rgba(0, 0, 0, 0.55); /* CHANGED: darker for visibility */
203
+ backdrop-filter: blur(4px);
204
+
205
+ display: flex;
206
+ align-items: center;
207
+ justify-content: center;
208
+
209
+ z-index: 9999; /* NEW: ensure nothing covers this */
210
+ }
211
+
212
+ /* Dark theme overlay box */
213
+ .consent-box {
214
+ background: #141b2f; /* CHANGED: match theme */
215
+ color: #f5f5f5; /* NEW: readable on dark bg */
216
+ padding: 24px;
217
+ width: 420px;
218
+ border-radius: 12px;
219
+ box-shadow: 0 4px 12px rgba(0, 0, 0, 0.4);
220
+ }
221
+
222
+ .consent-check {
223
+ display: flex;
224
+ align-items: center;
225
+ margin: 16px 0;
226
+ gap: 10px;
227
+ }
templates/index.html ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
<!DOCTYPE html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <title>CHAMP Chatbot Demo</title>
    <link rel="stylesheet" href="/static/style.css" />
    <!-- Include marked.js for Markdown rendering -->
    <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
    <!-- Include DOMPurify to sanitize HTML -->
    <script src="https://cdn.jsdelivr.net/npm/dompurify@2.4.2/dist/purify.min.js"></script>
  </head>
  <body class="no-scroll">
    <div class="chat-container">
      <!-- Header -->
      <header class="chat-header">
        <h1>CHAMP Chatbot Demo: Model Comparison</h1>
        <p class="subtitle">
          Talk to and compare chatbots powered by different models. Please
          remember to avoid sharing any sensitive or private details during the
          conversation.
        </p>
      </header>

      <!-- Controls bar: model picker, temperature slider, clear button.
           Element ids here are read by /static/app.js. -->
      <div class="controls-bar">
        <div class="control-group">
          <label for="systemPreset">Model Selection</label>
          <select id="systemPreset">
            <option value="champ" selected>CHAMP</option>
            <!-- champ is our model -->
            <option value="openai">ChatGPT</option>
            <option value="google">Gemma</option>
          </select>
        </div>

        <div class="control-group">
          <label for="tempSlider">
            Temperature:
            <span id="tempValue">0.7</span>
          </label>
          <input
            type="range"
            id="tempSlider"
            min="0.1"
            max="1.2"
            step="0.1"
            value="0.7"
          />
        </div>

        <button id="clearBtn" class="secondary-button">Clear</button>
      </div>

      <!-- Consent overlay: shown until the user checks the box and clicks
           the button (wired up in app.js — presumably hidden on consent;
           verify against app.js). -->
      <div id="consentOverlay" class="consent-overlay">
        <div class="consent-box">
          <h2>Before you continue</h2>
          <p>
            By using this demo you agree that your messages will be shared with
            us for processing. Do not provide sensitive or private details.
          </p>

          <label class="consent-check">
            <input type="checkbox" id="consentCheckbox" />
            I understand and agree
          </label>

          <button id="consentBtn" class="primary-button" disabled>
            Agree and Continue
          </button>
        </div>
      </div>

      <!-- Chat window -->
      <main id="chatWindow" class="chat-window">
        <!-- Messages get rendered here by app.js -->
      </main>

      <!-- Input area -->
      <footer class="chat-input-area">
        <textarea
          id="userInput"
          rows="2"
          placeholder="Type your message and press Enter or click Send..."
        ></textarea>
        <button id="sendBtn">Send</button>
      </footer>

      <!-- Status line -->
      <div id="status" class="status"></div>
    </div>

    <script src="/static/app.js"></script>
  </body>
</html>
tests/test_dynamodb.py ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from moto import mock_aws
2
+ import boto3
3
+ import pytest
4
+ from dynamodb_helper import create_table_if_not_exists, DDB_TABLE
5
+ from botocore.exceptions import ClientError
6
+ import os
7
+
8
class TestDynamoDBHelper:
    """Unit tests for dynamodb_helper against moto's mocked DynamoDB backend."""

    @staticmethod
    def _mock_resource():
        # IMPORTANT: the boto3 resource must be created *inside* an active
        # @mock_aws context. The previous class-level attribute was built at
        # import time — before the mock starts — which moto's docs warn can
        # send requests to real AWS. A per-test resource also restores test
        # isolation (no state shared between tests via a class attribute).
        return boto3.resource("dynamodb", region_name="ca-central-1")

    @mock_aws
    def test_create_table_if_not_exists(self):
        """Table is created on first call and the call is idempotent."""
        dynamodb = self._mock_resource()
        client = dynamodb.meta.client

        # The mocked account starts with no tables.
        existing_tables = client.list_tables()["TableNames"]
        assert DDB_TABLE not in existing_tables

        # First call creates the table.
        table = create_table_if_not_exists(dynamodb)
        assert table is not None

        # Verify the table now exists.
        existing_tables = client.list_tables()["TableNames"]
        assert DDB_TABLE in existing_tables

        # Second call must not raise (e.g. ResourceInUseException).
        table = create_table_if_not_exists(dynamodb)
        assert table is not None

    @mock_aws
    def test_log_event(self):
        """log_event writes one session-keyed item with Decimal numerics."""
        from decimal import Decimal

        from dynamodb_helper import log_event

        dynamodb = self._mock_resource()
        create_table_if_not_exists(dynamodb)
        table_resource = dynamodb.Table(DDB_TABLE)

        user_id = "user123"
        session_id = "test-session-456"
        data = {"event": "test_event", "value": 26, "float_value": 3.14}

        log_event(user_id, session_id, data)

        # Exactly one item should have been written.
        response = table_resource.scan()
        assert response["Count"] == 1

        item = response["Items"][0]
        assert item["PK"] == f"SESSION#{session_id}"
        assert item["data"]["event"] == "test_event"
        # DynamoDB represents all numbers as Decimal.
        assert item["data"]["value"] == Decimal(26)
        assert item["data"]["float_value"] == Decimal("3.14")
tests/test_main.py ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from main import app
2
+ from fastapi.testclient import TestClient
3
+ from moto import mock_aws
4
+ from dynamodb_helper import create_table_if_not_exists, DDB_TABLE
5
+ from botocore.exceptions import ClientError
6
+
7
class TestMain:
    """Unit tests for the message-conversion helpers in main."""

    def test_convert_messages(self):
        """OpenAI-style conversion prepends the default system prompt."""
        from main import ChatMessage, DEFAULT_SYSTEM_PROMPT, convert_messages

        messages = [
            ChatMessage(role="user", content="Hello"),
            ChatMessage(role="assistant", content="Hi there!"),
        ]
        converted = convert_messages(messages)
        assert converted == [
            {"role": "system", "content": DEFAULT_SYSTEM_PROMPT},
            {"role": "user", "content": "Hello"},
            {"role": "assistant", "content": "Hi there!"},
        ]

    def test_convert_messages_langchain(self):
        """LangChain conversion prepends the CHAMP system prompt and maps roles."""
        from langchain_core.messages import AIMessage, HumanMessage, SystemMessage

        from main import CHAMP_SYSTEM_PROMPT, ChatMessage, convert_messages_langchain

        messages = [
            ChatMessage(role="user", content="Hello"),
            ChatMessage(role="assistant", content="Hi there!"),
        ]
        converted = convert_messages_langchain(messages)

        expected_types = [SystemMessage, HumanMessage, AIMessage]
        expected_contents = [CHAMP_SYSTEM_PROMPT, "Hello", "Hi there!"]

        # BUGFIX: zip() silently truncates to the shorter sequence, so the old
        # test passed even if the helper returned too few (or extra) messages.
        # Pin the length explicitly before element-wise checks.
        assert len(converted) == len(expected_types)

        for msg, expected_type, expected_content in zip(
            converted, expected_types, expected_contents
        ):
            assert isinstance(msg, expected_type)
            assert msg.content == expected_content