Fix truncated answer response
- service/llm_service.py +1 -1
- service/rag_service.py +16 -13
service/llm_service.py

@@ -17,7 +17,7 @@ class LLMService:
 
         output = self.model.generate(
             **inputs,
-            max_new_tokens=
+            max_new_tokens=256,
             do_sample=True,
             temperature=0.7,
             top_p=0.9,
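For context, a minimal sketch of how the patched call might sit inside LLMService. This is an illustration, not the repo's actual code: the model/tokenizer wiring, the placeholder model_name, and the prompt-echo trimming are assumptions; only the generate(...) keyword arguments come from the diff above.

# Illustrative sketch only -- the class body is assumed, not taken from this
# repo; the generate() kwargs mirror the ones set in the diff above.
from transformers import AutoModelForCausalLM, AutoTokenizer

class LLMService:
    def __init__(self, model_name: str):
        # model_name is a placeholder; the repo's actual checkpoint is not shown
        self.tokenizer = AutoTokenizer.from_pretrained(model_name)
        self.model = AutoModelForCausalLM.from_pretrained(model_name)

    def generate(self, prompt: str) -> str:
        inputs = self.tokenizer(prompt, return_tensors="pt")
        output = self.model.generate(
            **inputs,
            max_new_tokens=256,  # the fix: allow up to 256 fresh tokens per answer
            do_sample=True,
            temperature=0.7,
            top_p=0.9,
        )
        # decode only the newly generated tokens, not the echoed prompt
        new_tokens = output[0][inputs["input_ids"].shape[-1]:]
        return self.tokenizer.decode(new_tokens, skip_special_tokens=True)

If answers still cut off at exactly 256 tokens, the cap (rather than the prompt) is the limiting factor; checking whether the last generated token equals tokenizer.eos_token_id is a quick way to tell a natural stop from a capped one.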
service/rag_service.py

@@ -24,23 +24,26 @@ def generate_answer(question: str, session_id: str) -> str:
     memory = get_memory(session_id)
 
     prompt = f"""
-<|system|>
-You are a helpful assistant.
-Answer ONLY using the provided context.
-
+<|system|>
+You are a helpful assistant.
+Answer ONLY using the provided context.
+Give a COMPLETE, well-formed answer.
+Do not stop mid-sentence.
+If the answer is not in the context, say "I don't know".
 
-Conversation memory:
-{memory}
+Conversation memory:
+{memory}
 
-<|user|>
-Context:
-{chr(10).join(context)}
+<|user|>
+Context:
+{chr(10).join(context)}
 
-Question:
-{question}
+Question:
+{question}
+
 
-<|assistant|>
-"""
+<|assistant|>
+"""
 
     answer = llm.generate(prompt)
 
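One possible hardening on top of this patch: the <|system|>/<|user|>/<|assistant|> markers are hand-written here, and if they do not match the model's actual chat format the model is more likely to ramble or stop oddly. A hedged alternative sketch, assuming the tokenizer ships a chat template and that llm exposes it as llm.tokenizer (an assumption about this codebase; not part of the commit):

# Sketch, not part of the commit: render the prompt with the model's own chat
# template instead of hard-coded role markers. `llm.tokenizer` is assumed.
system_text = (
    "You are a helpful assistant. Answer ONLY using the provided context. "
    "Give a COMPLETE, well-formed answer. Do not stop mid-sentence. "
    'If the answer is not in the context, say "I don\'t know".\n\n'
    f"Conversation memory:\n{memory}"
)
messages = [
    {"role": "system", "content": system_text},
    # chr(10) mirrors the original f-string; a plain "\n".join works outside one
    {"role": "user", "content": f"Context:\n{chr(10).join(context)}\n\nQuestion:\n{question}"},
]
prompt = llm.tokenizer.apply_chat_template(
    messages, tokenize=False, add_generation_prompt=True
)
answer = llm.generate(prompt)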