Spaces:

Namitg02
/

Test

Runtime error

App Files Files Community

Namitg02 committed on Jun 20, 2024

Commit

524eae4

verified ·

1 Parent(s): 0b30f86

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -3

app.py CHANGED Viewed

@@ -98,6 +98,25 @@ def format_prompt(prompt,retrieved_documents,k):
         PROMPT+= f"{retrieved_documents['0'][idx]}\n"
     return PROMPT
 # Called by the talk function to add retrieved documents to the prompt. Keeps appending the text of the retrieved documents to the prompt string.
 def talk(prompt, history):
@@ -109,8 +128,10 @@ def talk(prompt, history):
     print("check5")
     print(retrieved_documents['0'])
     print(formatted_prompt)
-    formatted_prompt = formatted_prompt[:600] # to avoid memory issue
-    print(formatted_prompt)
     messages = [{"role":"system","content":SYS_PROMPT},{"role":"user","content":formatted_prompt}]
     # binding the system context and new prompt for LLM
     # the chat template structure should be based on text generation model format
@@ -130,7 +151,7 @@ def talk(prompt, history):
     ]
 # indicates the end of a sequence
     text = ""
-    stream = model(formatted_prompt, max_tokens=1000, stop=["</s>"], stream=True)
     for output in stream:
         text += output["choices"][0]["text"]
         yield text

         PROMPT+= f"{retrieved_documents['0'][idx]}\n"
     return PROMPT
+#def add_history(formatted_prompt, history, memory_limit=3):
+    # always keep len(history) <= memory_limit
+ #   if len(history) > memory_limit:
+  #      history = history[-memory_limit:]
+   # if len(history) == 0:
+    #    return PROMPT + f"{formatted_prompt} [/INST]"
+    #formatted_message = PROMPT + f"{history[0][0]} [/INST] {history[0][1]} </s>"
+    # Handle conversation history
+#    for user_msg, model_answer in history[1:]:
+ #       formatted_message += f"<s>[INST] {user_msg} [/INST] {model_answer} </s>"
+  #  # Handle the current message
+   # formatted_message += f"<s>[INST] {formatted_prompt} [/INST]"
+    #return formatted_message
 # Called by the talk function to add retrieved documents to the prompt. Keeps appending the text of the retrieved documents to the prompt string.
 def talk(prompt, history):
     print("check5")
     print(retrieved_documents['0'])
     print(formatted_prompt)
+  #  formatted_prompt_with_history = add_history(formatted_prompt, history)
+   # formatted_prompt_with_history = formatted_prompt_with_history[:600] # to avoid memory issue
+    print(formatted_prompt_with_history)
     messages = [{"role":"system","content":SYS_PROMPT},{"role":"user","content":formatted_prompt}]
     # binding the system context and new prompt for LLM
     # the chat template structure should be based on text generation model format
     ]
 # indicates the end of a sequence
     text = ""
+    stream = model(messages, max_tokens=1000, stop=["</s>"], stream=True)
     for output in stream:
         text += output["choices"][0]["text"]
         yield text