Spaces:
Running on Zero
Running on Zero
Upload src/veris_classifier/classifier.py with huggingface_hub
Browse files
src/veris_classifier/classifier.py
CHANGED
|
@@ -91,15 +91,28 @@ def load_hf_model():
|
|
| 91 |
|
| 92 |
def _generate_hf(messages: list[dict], max_new_tokens: int = 1024) -> str:
|
| 93 |
"""Generate a response using the fine-tuned HF model."""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 94 |
pipe, tokenizer = load_hf_model()
|
| 95 |
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
|
|
|
|
|
|
| 103 |
|
| 104 |
return outputs[0]["generated_text"].strip()
|
| 105 |
|
|
@@ -129,6 +142,32 @@ def _generate_openai(
|
|
| 129 |
return response.choices[0].message.content.strip()
|
| 130 |
|
| 131 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 132 |
# ββ Public API ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 133 |
|
| 134 |
|
|
@@ -155,7 +194,7 @@ def classify_incident(
|
|
| 155 |
]
|
| 156 |
|
| 157 |
if use_hf:
|
| 158 |
-
raw =
|
| 159 |
else:
|
| 160 |
if client is None:
|
| 161 |
raise ValueError("OpenAI client required when use_hf=False")
|
|
@@ -163,15 +202,7 @@ def classify_incident(
|
|
| 163 |
client, messages, model=model, temperature=0.2, json_mode=True
|
| 164 |
)
|
| 165 |
|
| 166 |
-
|
| 167 |
-
text = raw.strip()
|
| 168 |
-
if text.startswith("```"):
|
| 169 |
-
# Strip ```json ... ``` wrapper
|
| 170 |
-
lines = text.split("\n")
|
| 171 |
-
text = "\n".join(lines[1:-1]) if len(lines) > 2 else text
|
| 172 |
-
text = text.strip()
|
| 173 |
-
|
| 174 |
-
return json.loads(text)
|
| 175 |
|
| 176 |
|
| 177 |
def answer_question(
|
|
|
|
| 91 |
|
| 92 |
def _generate_hf(messages: list[dict], max_new_tokens: int = 1024) -> str:
    """Generate a response using the fine-tuned HF model."""
    # Thin convenience wrapper: defer to the options-aware variant and let it
    # apply the default sampling configuration.
    return _generate_hf_with_options(messages, max_new_tokens)
| 96 |
+
|
| 97 |
+
def _generate_hf_with_options(
    messages: list[dict],
    max_new_tokens: int = 1024,
    do_sample: bool = True,
    temperature: float = 0.2,
    top_p: float = 0.9,
) -> str:
    """Generate a response using the fine-tuned HF model with explicit sampling controls."""
    pipe, tokenizer = load_hf_model()

    # temperature/top_p are sampling knobs; forward them only when sampling
    # is actually enabled so greedy decoding gets none of them.
    sampling_opts = (
        {"temperature": temperature, "top_p": top_p} if do_sample else {}
    )

    outputs = pipe(
        messages,
        max_new_tokens=max_new_tokens,
        do_sample=do_sample,
        **sampling_opts,
    )

    return outputs[0]["generated_text"].strip()
| 118 |
|
|
|
|
| 142 |
return response.choices[0].message.content.strip()
|
| 143 |
|
| 144 |
|
| 145 |
+
def _parse_json_response(raw: str) -> dict:
|
| 146 |
+
"""Parse model output into JSON with light recovery for wrapped text."""
|
| 147 |
+
text = raw.strip()
|
| 148 |
+
try:
|
| 149 |
+
return json.loads(text)
|
| 150 |
+
except json.JSONDecodeError:
|
| 151 |
+
pass
|
| 152 |
+
|
| 153 |
+
if text.startswith("```"):
|
| 154 |
+
lines = text.split("\n")
|
| 155 |
+
text = "\n".join(lines[1:-1]) if len(lines) > 2 else text
|
| 156 |
+
text = text.strip()
|
| 157 |
+
try:
|
| 158 |
+
return json.loads(text)
|
| 159 |
+
except json.JSONDecodeError:
|
| 160 |
+
pass
|
| 161 |
+
|
| 162 |
+
# Recover when the model prepends/appends prose around a JSON object.
|
| 163 |
+
start = text.find("{")
|
| 164 |
+
end = text.rfind("}")
|
| 165 |
+
if start != -1 and end != -1 and end > start:
|
| 166 |
+
return json.loads(text[start : end + 1])
|
| 167 |
+
|
| 168 |
+
raise json.JSONDecodeError("No JSON object found in model output", text, 0)
|
| 169 |
+
|
| 170 |
+
|
| 171 |
# ββ Public API ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
|
| 172 |
|
| 173 |
|
|
|
|
| 194 |
]
|
| 195 |
|
| 196 |
if use_hf:
|
| 197 |
+
raw = _generate_hf_with_options(messages, max_new_tokens=1024, do_sample=False)
|
| 198 |
else:
|
| 199 |
if client is None:
|
| 200 |
raise ValueError("OpenAI client required when use_hf=False")
|
|
|
|
| 202 |
client, messages, model=model, temperature=0.2, json_mode=True
|
| 203 |
)
|
| 204 |
|
| 205 |
+
return _parse_json_response(raw)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 206 |
|
| 207 |
|
| 208 |
def answer_question(
|