Spaces:
Sleeping
Sleeping
remove callbacks
Browse files
src/llm/adapters.py  +4 −5
src/llm/adapters.py
CHANGED
|
@@ -11,8 +11,8 @@ from langchain_openai.chat_models import ChatOpenAI
|
|
| 11 |
# Legacy dependencies
|
| 12 |
from huggingface_hub import InferenceClient
|
| 13 |
from langchain_community.llms import HuggingFaceEndpoint
|
| 14 |
-
from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
|
| 15 |
from langchain_community.chat_models.huggingface import ChatHuggingFace
|
|
|
|
| 16 |
|
| 17 |
|
| 18 |
from ..config.loader import load_config
|
|
@@ -71,7 +71,7 @@ def _create_dedicated_endpoint_client():
|
|
| 71 |
max_tokens = dedicated_config.get("max_tokens", 768)
|
| 72 |
|
| 73 |
# Set up the streaming callback handler
|
| 74 |
-
callback = StreamingStdOutCallbackHandler()
|
| 75 |
|
| 76 |
# Initialize the HuggingFaceEndpoint with streaming enabled
|
| 77 |
llm_qa = HuggingFaceEndpoint(
|
|
@@ -80,11 +80,10 @@ def _create_dedicated_endpoint_client():
|
|
| 80 |
repetition_penalty=1.03,
|
| 81 |
timeout=70,
|
| 82 |
huggingfacehub_api_token=api_key,
|
| 83 |
-
streaming=True
|
| 84 |
-
callbacks=[callback]
|
| 85 |
)
|
| 86 |
|
| 87 |
-
# Create a ChatHuggingFace instance with the streaming-enabled endpoint
|
| 88 |
return ChatHuggingFace(llm=llm_qa)
|
| 89 |
|
| 90 |
|
|
|
|
| 11 |
# Legacy dependencies
|
| 12 |
from huggingface_hub import InferenceClient
|
| 13 |
from langchain_community.llms import HuggingFaceEndpoint
|
|
|
|
| 14 |
from langchain_community.chat_models.huggingface import ChatHuggingFace
|
| 15 |
+
# from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
|
| 16 |
|
| 17 |
|
| 18 |
from ..config.loader import load_config
|
|
|
|
| 71 |
max_tokens = dedicated_config.get("max_tokens", 768)
|
| 72 |
|
| 73 |
# Set up the streaming callback handler
|
| 74 |
+
# callback = StreamingStdOutCallbackHandler()
|
| 75 |
|
| 76 |
# Initialize the HuggingFaceEndpoint with streaming enabled
|
| 77 |
llm_qa = HuggingFaceEndpoint(
|
|
|
|
| 80 |
repetition_penalty=1.03,
|
| 81 |
timeout=70,
|
| 82 |
huggingfacehub_api_token=api_key,
|
| 83 |
+
streaming=True
|
| 84 |
+
# callbacks=[callback]
|
| 85 |
)
|
| 86 |
|
|
|
|
| 87 |
return ChatHuggingFace(llm=llm_qa)
|
| 88 |
|
| 89 |
|