Spaces:

ENUSEC
/

Filter_Phantoms

Paused

App Files Community

lewiswatson committed on May 6, 2025

Commit

fa456e1

verified ·

1 Parent(s): 3fcf2dc

Upload app.py

Browse files

Files changed (1) hide show

app.py +23 -12

app.py CHANGED Viewed

@@ -49,17 +49,27 @@ def sanitize(text: str) -> str:
 MAX_CTX = 4096
 def chat(raw_input, history):
-    clean = sanitize(raw_input)
-    if not clean.strip() or clean == "[redacted]":
-        return "I’m not sure what you meant—could you try phrasing it differently?", history
-    # Build prompt from sanitized history + this turn
-    hist = ""
-    for prev_raw, prev_resp in history:
-        hist += f"User: {sanitize(prev_raw)}\nAssistant: {prev_resp}\n"
-    prompt = "\n".join(SYSTEM_PROMPTS) + "\n\n" + hist
-    prompt += f"User: {clean}\nAssistant:"
     # Tokenise & manually truncate to last MAX_CTX tokens
     all_ids = tokenizer.encode(prompt, add_special_tokens=False)
@@ -70,7 +80,7 @@ def chat(raw_input, history):
         "attention_mask": torch.tensor([[1] * len(all_ids)])
     }
-    # Generate
     out = model.generate(
         **inputs,
         max_new_tokens=200,
@@ -81,8 +91,9 @@ def chat(raw_input, history):
     seen = tokenizer.decode(all_ids, skip_special_tokens=True)
     resp = full[len(seen):].strip()
-    history.append((raw_input, resp))
-    return resp, history
 # ————————————————————————————————————————————————————————————————
 # Launch Gradio App

 MAX_CTX = 4096
 def chat(raw_input, history):
+    # history is a list of dicts: {"role": "user"/"assistant", "content": str}
+    # Initialise history list if None
+    history = history or []
+    # Append new raw user message
+    history.append({"role": "user", "content": raw_input})
+    # Sanitize the new user input for the model
+    clean = sanitize(raw_input)
+    if not clean.strip() or clean == "[redacted]":
+        history.append({"role": "assistant", "content": "I’m not sure what you meant—could you try phrasing it differently?"})
+        return history, history
+    # Build prompt: system prompts + conversation history
+    prompt = "\n".join(SYSTEM_PROMPTS) + "\n\n"
+    for turn in history:
+        if turn["role"] == "user":
+            prompt += f"User: {sanitize(turn['content'])}\n"
+        else:
+            prompt += f"Assistant: {turn['content']}\n"
+    prompt += "Assistant:"
     # Tokenise & manually truncate to last MAX_CTX tokens
     all_ids = tokenizer.encode(prompt, add_special_tokens=False)
         "attention_mask": torch.tensor([[1] * len(all_ids)])
     }
+    # Generate response
     out = model.generate(
         **inputs,
         max_new_tokens=200,
     seen = tokenizer.decode(all_ids, skip_special_tokens=True)
     resp = full[len(seen):].strip()
+    # Append model reply
+    history.append({"role": "assistant", "content": resp})
+    return history, history
 # ————————————————————————————————————————————————————————————————
 # Launch Gradio App