Spaces:
Sleeping
Sleeping
Stanislav committed on
Commit ·
d9d96d2
1
Parent(s): 8ffad45
feat: stream_true and new stop_word
Browse files
rag_pipeline/llm_interface.py
CHANGED
|
@@ -9,10 +9,11 @@ class LocalLLM:
|
|
| 9 |
|
| 10 |
def __init__(self, model_path: str,
|
| 11 |
n_ctx: int = 2048,
|
| 12 |
-
stop=["</s>", "User Question:"],
|
| 13 |
max_tokens=500,
|
| 14 |
temperature: float = 0.5,
|
| 15 |
-
repetition_penalty=1.25
|
|
|
|
| 16 |
"""
|
| 17 |
Initialize the local LLM model via llama-cpp and Langchain.
|
| 18 |
|
|
@@ -27,6 +28,7 @@ class LocalLLM:
|
|
| 27 |
max_tokens=max_tokens,
|
| 28 |
temperature=temperature,
|
| 29 |
repetition_penalty=repetition_penalty,
|
|
|
|
| 30 |
verbose=False
|
| 31 |
)
|
| 32 |
|
|
|
|
| 9 |
|
| 10 |
def __init__(self, model_path: str,
|
| 11 |
n_ctx: int = 2048,
|
| 12 |
+
stop=["</s>", "User Question:", " User Response:"],
|
| 13 |
max_tokens=500,
|
| 14 |
temperature: float = 0.5,
|
| 15 |
+
repetition_penalty=1.25,
|
| 16 |
+
stream=True):
|
| 17 |
"""
|
| 18 |
Initialize the local LLM model via llama-cpp and Langchain.
|
| 19 |
|
|
|
|
| 28 |
max_tokens=max_tokens,
|
| 29 |
temperature=temperature,
|
| 30 |
repetition_penalty=repetition_penalty,
|
| 31 |
+
stream=stream,
|
| 32 |
verbose=False
|
| 33 |
)
|
| 34 |
|