Spaces:

arasuezofis
/

documentbasedresponse

Sleeping

App Files Files Community

arasuezofis committed on Oct 13, 2025

Commit

62c1db6

verified ·

1 Parent(s): 9037c59

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -13

app.py CHANGED Viewed

@@ -129,21 +129,26 @@ def parse_page_selection(value, num_pages: int) -> int:
         idx = int(m.group(1)) - 1 if m else 0
     return max(0, min(num_pages - 1, idx))
def build_messages(history: List[Tuple[str, str]], user_text: str, images: List[Image.Image]):
    """
    Assemble the chat-format message list (meant for tokenizer.apply_chat_template).

    Layout of the result:
      - one system message carrying SYSTEM_PROMPT
      - the last four (user, assistant) pairs of ``history``, expanded into
        alternating user/assistant messages
      - the current user turn, whose content is a list holding every image
        followed by the stripped ``user_text`` (text is omitted when blank)
    """
    messages = [{"role": "system", "content": SYSTEM_PROMPT}]

    # Only the most recent four exchanges are replayed.
    recent_pairs = history[-4:] if history else []
    for user_said, assistant_said in recent_pairs:
        messages.extend(
            (
                {"role": "user", "content": user_said},
                {"role": "assistant", "content": assistant_said},
            )
        )

    # Current turn: images first, then the text (if any).
    current_parts = list(images)
    question = user_text.strip()
    if question:
        current_parts.append(question)

    messages.append({"role": "user", "content": current_parts})
    return messages
@@ -230,19 +235,37 @@ def page_picker_changed(pages_dropdown, images_state):
     selected = images_state[idx]
     return selected, selected  # preview + selected state
def chat(user_text, history, images_state, selected_img):
    """
    Stream one chat turn as ``(chatbot value, history state)`` pairs.

    This function is a generator, so every UI update must be *yielded*: a
    value handed to ``return`` inside a generator is never delivered as an
    output. The early exits therefore yield once and then return.

    Args:
        user_text: Text typed by the user; blank input is a no-op.
        history: List of ``(user, assistant)`` tuples from earlier turns
            (``None`` is treated as empty).
        images_state: Sequence of page images; its first item is the
            fallback when no page is explicitly selected.
        selected_img: The explicitly selected page image, or ``None``.

    Yields:
        Two-item tuples; both items are the history extended with the
        current exchange.
    """
    if not user_text or not user_text.strip():
        # Nothing to send: leave the chat display as it is.
        yield gr.update(), history
        return

    history = history or []

    sel_img = selected_img if selected_img is not None else (images_state[0] if images_state else None)
    if sel_img is None:
        # No document available: answer with a fixed hint instead of
        # calling the model.
        hint = "Please upload a document first."
        yield history + [(user_text, hint)], history + [(user_text, hint)]
        return

    # Each chunk replaces the previous one, i.e. it is shown as the whole
    # reply so far.
    for chunk in generate_reply([sel_img], user_text, history):
        yield history + [(user_text, chunk)], history + [(user_text, chunk)]
 # -----------------------------
 # App definition

         idx = int(m.group(1)) - 1 if m else 0
     return max(0, min(num_pages - 1, idx))
def build_messages(history_msgs: list, user_text: str, images: List[Image.Image]):
    """
    Build the complete message list handed to the model.

    Layout of the result:
      - one system message carrying SYSTEM_PROMPT
      - the last eight entries of ``history_msgs``, passed through unchanged
        (they are expected to be {'role', 'content'} dicts already)
      - the current user turn, whose content is a list holding every image
        followed by the stripped ``user_text`` (text is omitted when blank)
    """
    messages = [{"role": "system", "content": SYSTEM_PROMPT}]

    # Cap the replayed context at the eight most recent messages.
    recent_msgs = history_msgs[-8:] if history_msgs else []
    messages += recent_msgs

    # Current turn: images first, then the text (if any).
    current_parts = list(images)
    question = user_text.strip()
    if question:
        current_parts.append(question)

    messages.append({"role": "user", "content": current_parts})
    return messages
     selected = images_state[idx]
     return selected, selected  # preview + selected state
def chat(user_text, history_msgs, images_state, selected_img):
    """
    Stream one chat turn as ``(chatbot value, history state)`` pairs.

    This function is a generator, so every UI update must be *yielded*: a
    value handed to ``return`` inside a generator is never delivered as an
    output. The early exits therefore yield once and then return.

    Args:
        user_text: Text typed by the user; blank input is a no-op.
        history_msgs: Earlier turns as ``{'role', 'content'}`` dicts
            (``None`` is treated as empty). The list is never mutated.
        images_state: Sequence of page images; its first item is the
            fallback when no page is explicitly selected.
        selected_img: The explicitly selected page image, or ``None``.

    Yields:
        Two-item tuples; both items are the history extended with the
        current user message and the assistant reply so far.
    """
    if not user_text or not user_text.strip():
        # Nothing to send: leave the chat display as it is.
        yield gr.update(), history_msgs
        return

    history_msgs = history_msgs or []

    def _with_reply(reply):
        # Fresh list and dicts on every call so the two outputs never
        # share mutable objects.
        return history_msgs + [
            {"role": "user", "content": user_text},
            {"role": "assistant", "content": reply},
        ]

    sel_img = selected_img if selected_img is not None else (images_state[0] if images_state else None)
    if sel_img is None:
        # No document available: reply with a fixed assistant hint instead
        # of calling the model.
        hint = "Please upload a document first."
        yield _with_reply(hint), _with_reply(hint)
        return

    # Stream the assistant reply. Each chunk replaces the previous one,
    # i.e. it is shown as the whole reply so far.
    for chunk in generate_reply([sel_img], user_text, history_msgs):
        yield _with_reply(chunk), _with_reply(chunk)
 # -----------------------------
 # App definition