# Ollama Modelfile for the network compliance auditor model.
#
# Each directive must sit on its own line; lines starting with "#" are comments.

# Alternative base model, currently disabled:
#FROM hf.co/ajvikram/Qwen2.5-Coder-3B-Network-Eng-GGUF
FROM hf.co/ajvikram/network-compliance-auditor-grpo

# --- 1. STOP TOKENS ---
# Generation halts as soon as any of these strings is produced: the ChatML
# end-of-turn marker, a plain "User:" turn label, and the <|fim_*|> /
# <|repo_name|> special tokens.
PARAMETER stop "<|im_end|>"
# NOTE(review): the next stop string is empty. It looks like the original value
# was lost (possibly a token written in angle brackets) -- confirm the intended
# token, or remove this line if none was meant.
PARAMETER stop ""
PARAMETER stop "User:"
PARAMETER stop "<|fim_prefix|>"
PARAMETER stop "<|fim_middle|>"
PARAMETER stop "<|fim_suffix|>"
PARAMETER stop "<|repo_name|>"

# --- 2. ANTI-LOOPING ---
# repeat_penalty penalizes tokens that already appeared recently; values above
# 1.0 make repeats less likely (they are discouraged, not forbidden). It was
# added to break a loop where the model kept emitting the same emoji token.
PARAMETER repeat_penalty 1.15
# repeat_last_n is how many of the most recent tokens are checked for repeats.
PARAMETER repeat_last_n 64

# --- 3. TEMPLATE ---
# ChatML layout: optional system turn, optional user turn, then the opening of
# the assistant turn. The line breaks after each role name and after each
# <|im_end|> are part of the prompt format.
TEMPLATE """{{ if .System }}<|im_start|>system
{{ .System }}<|im_end|>
{{ end }}{{ if .Prompt }}<|im_start|>user
{{ .Prompt }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ .Response }}"""

# --- 4. SYSTEM ---
# NOTE(review): the prompt says "within tags" without naming the tag; the tag
# name may have been stripped from this text -- confirm against the format the
# model was trained to emit.
SYSTEM """
You are an intelligent Network Compliance Auditor. You must output your internal reasoning trace within tags, followed by a final JSON object containing the verdict (PASS/FAIL), the specific control ID, and the evidence line. Dont repeat and provide only one answer."""