Spaces:

colin730
/

SummarizerApp

Sleeping

ming committed on Nov 27, 2025

Commit

bf21a65

1 Parent(s): fe47248

fix: Use Qwen chat template and harden NDJSON parsing

STEP 1: Use Qwen2.5 native chat template
- Replace manual Phi-3 format with tokenizer.apply_chat_template()
- Ensures correct special tokens for Qwen models
- Adds explicit NDJSON-only reminder in user message
- Critical fix: previous Phi-3 format was incompatible with Qwen

STEP 2: Harden NDJSON parsing
- Add heuristic check: skip lines that do not start with '{' or do not contain the substring 'op'
- Prevents parsing C++ code, prose, or random hallucinations
- Reduces log spam from invalid JSON parsing attempts
- Cleaner error messages for debugging

This should fix the model hallucination issue where Qwen2.5-1.5B
was generating C++ code instead of NDJSON patches.

Files changed (1) hide show

app/services/structured_summarizer.py +34 -9

app/services/structured_summarizer.py CHANGED Viewed

@@ -207,7 +207,7 @@ Rules:
         return False
     def _build_prompt(self, text: str, style: str) -> str:
-        """Build the complete prompt for Phi-3."""
         system_prompt = self._build_system_prompt()
         style_instruction = self._build_style_instruction(style)
@@ -217,15 +217,30 @@ Rules:
             text = text[:max_chars]
             logger.warning(f"Truncated text from {len(text)} to {max_chars} chars")
-        # Phi-3 chat template format
-        full_prompt = (
-            f"<|system|>\n{system_prompt}\n<|end|>\n"
-            f"<|user|>\n{style_instruction}\n\nArticle:\n{text}\n<|end|>\n"
-            f"<|assistant|>"
         )
-        return full_prompt
     async def summarize_structured_stream(
         self,
         text: str,
@@ -416,11 +431,21 @@ Rules:
                         if not line:
                             continue
                         # Try to parse JSON patch
                         try:
                             patch = json.loads(line)
                         except json.JSONDecodeError as e:
-                            logger.warning(f"Failed to parse NDJSON line: {line[:100]}... Error: {e}")
                             continue
                         # Apply patch to state

         return False
     def _build_prompt(self, text: str, style: str) -> str:
+        """Build the complete prompt for Qwen2.5 using its chat template."""
         system_prompt = self._build_system_prompt()
         style_instruction = self._build_style_instruction(style)
             text = text[:max_chars]
             logger.warning(f"Truncated text from {len(text)} to {max_chars} chars")
+        messages = [
+            {
+                "role": "system",
+                "content": system_prompt,
+            },
+            {
+                "role": "user",
+                "content": (
+                    f"{style_instruction}\n\n"
+                    f"Article:\n{text}\n\n"
+                    "Remember: respond ONLY with newline-delimited JSON patch objects "
+                    "as described in the system message. "
+                    "No explanations, no comments, no markdown, no code, no prose."
+                ),
+            },
+        ]
+        # Let Qwen's tokenizer construct the correct special tokens and format
+        return self.tokenizer.apply_chat_template(
+            messages,
+            tokenize=False,
+            add_generation_prompt=True,
         )
     async def summarize_structured_stream(
         self,
         text: str,
                         if not line:
                             continue
+                        # Heuristic: skip anything that clearly isn't a JSON patch object
+                        # This filters out lines like "#include <bits/stdc++.h>" or random prose.
+                        if not line.startswith("{") or "op" not in line:
+                            logger.warning(
+                                f"Skipping non-JSON-looking line: {line[:80]}..."
+                            )
+                            continue
                         # Try to parse JSON patch
                         try:
                             patch = json.loads(line)
                         except json.JSONDecodeError as e:
+                            logger.warning(
+                                f"Failed to parse NDJSON line: {line[:100]}... Error: {e}"
+                            )
                             continue
                         # Apply patch to state