Spaces:
Running
on
Zero
Running
on
Zero
jedick
committed on
Commit
·
158fae7
1
Parent(s):
503a0b6
Further simplify ToolCallingLLM
Browse files- app.py +2 -2
- graph.py +2 -4
- mods/tool_calling_llm.py +9 -115
app.py
CHANGED
|
@@ -401,7 +401,7 @@ with gr.Blocks(
|
|
| 401 |
info_text = f"""
|
| 402 |
**Database:** {len(sources)} emails from {start} to {end}.
|
| 403 |
**Features:** RAG, today's date, hybrid search (dense+sparse), thinking output (local),
|
| 404 |
-
multiple retrievals
|
| 405 |
**Tech:** LangChain + Hugging Face + Gradio; ChromaDB and BM25S-based retrievers.<br>
|
| 406 |
"""
|
| 407 |
return info_text
|
|
@@ -453,7 +453,7 @@ with gr.Blocks(
|
|
| 453 |
)
|
| 454 |
multi_turn_questions = [
|
| 455 |
"Lookup emails that reference bugs.r-project.org in 2025",
|
| 456 |
-
"Did those authors report bugs before 2025?",
|
| 457 |
]
|
| 458 |
gr.Examples(
|
| 459 |
examples=[[q] for q in multi_turn_questions],
|
|
|
|
| 401 |
info_text = f"""
|
| 402 |
**Database:** {len(sources)} emails from {start} to {end}.
|
| 403 |
**Features:** RAG, today's date, hybrid search (dense+sparse), thinking output (local),
|
| 404 |
+
multiple retrievals (remote), citations output (remote), chat memory.
|
| 405 |
**Tech:** LangChain + Hugging Face + Gradio; ChromaDB and BM25S-based retrievers.<br>
|
| 406 |
"""
|
| 407 |
return info_text
|
|
|
|
| 453 |
)
|
| 454 |
multi_turn_questions = [
|
| 455 |
"Lookup emails that reference bugs.r-project.org in 2025",
|
| 456 |
+
"Did those authors report bugs before 2025? /think",
|
| 457 |
]
|
| 458 |
gr.Examples(
|
| 459 |
examples=[[q] for q in multi_turn_questions],
|
graph.py
CHANGED
|
@@ -71,7 +71,7 @@ def normalize_messages(messages):
|
|
| 71 |
return messages
|
| 72 |
|
| 73 |
|
| 74 |
-
def ToolifyHF(chat_model, system_message
|
| 75 |
"""
|
| 76 |
Get a Hugging Face model ready for bind_tools().
|
| 77 |
"""
|
|
@@ -86,8 +86,6 @@ def ToolifyHF(chat_model, system_message, system_message_suffix=""):
|
|
| 86 |
chat_model = HuggingFaceWithTools(
|
| 87 |
llm=chat_model.llm,
|
| 88 |
tool_system_prompt_template=tool_system_prompt_template,
|
| 89 |
-
# Suffix is for any additional context (not templated)
|
| 90 |
-
system_message_suffix=system_message_suffix,
|
| 91 |
)
|
| 92 |
|
| 93 |
return chat_model
|
|
@@ -195,7 +193,7 @@ def BuildGraph(
|
|
| 195 |
if is_local:
|
| 196 |
# For local models (ChatHuggingFace with SmolLM, Gemma, or Qwen)
|
| 197 |
query_model = ToolifyHF(
|
| 198 |
-
chat_model, query_prompt(chat_model, think=think_query)
|
| 199 |
).bind_tools([retrieve_emails])
|
| 200 |
# Don't use answer_with_citations tool because responses with are sometimes unparseable
|
| 201 |
generate_model = chat_model
|
|
|
|
| 71 |
return messages
|
| 72 |
|
| 73 |
|
| 74 |
+
def ToolifyHF(chat_model, system_message):
|
| 75 |
"""
|
| 76 |
Get a Hugging Face model ready for bind_tools().
|
| 77 |
"""
|
|
|
|
| 86 |
chat_model = HuggingFaceWithTools(
|
| 87 |
llm=chat_model.llm,
|
| 88 |
tool_system_prompt_template=tool_system_prompt_template,
|
|
|
|
|
|
|
| 89 |
)
|
| 90 |
|
| 91 |
return chat_model
|
|
|
|
| 193 |
if is_local:
|
| 194 |
# For local models (ChatHuggingFace with SmolLM, Gemma, or Qwen)
|
| 195 |
query_model = ToolifyHF(
|
| 196 |
+
chat_model, query_prompt(chat_model, think=think_query)
|
| 197 |
).bind_tools([retrieve_emails])
|
| 198 |
# Don't use answer_with_citations tool because responses with are sometimes unparseable
|
| 199 |
generate_model = chat_model
|
mods/tool_calling_llm.py
CHANGED
|
@@ -49,51 +49,6 @@ You must always select one of the above tools and respond with only a JSON objec
|
|
| 49 |
""" # noqa: E501
|
| 50 |
|
| 51 |
|
| 52 |
-
def _is_pydantic_class(obj: Any) -> bool:
|
| 53 |
-
"""
|
| 54 |
-
Checks if the tool provided is a Pydantic class.
|
| 55 |
-
"""
|
| 56 |
-
return isinstance(obj, type) and (
|
| 57 |
-
issubclass(obj, BaseModel) or BaseModel in obj.__bases__
|
| 58 |
-
)
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
def _is_pydantic_object(obj: Any) -> bool:
|
| 62 |
-
"""
|
| 63 |
-
Checks if the tool provided is a Pydantic object.
|
| 64 |
-
"""
|
| 65 |
-
return isinstance(obj, BaseModel)
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
def RawJSONDecoder(index):
|
| 69 |
-
class _RawJSONDecoder(json.JSONDecoder):
|
| 70 |
-
end = None
|
| 71 |
-
|
| 72 |
-
def decode(self, s, *_):
|
| 73 |
-
data, self.__class__.end = self.raw_decode(s, index)
|
| 74 |
-
return data
|
| 75 |
-
|
| 76 |
-
return _RawJSONDecoder
|
| 77 |
-
|
| 78 |
-
|
| 79 |
-
def extract_json(s, index=0):
|
| 80 |
-
while (index := s.find("{", index)) != -1:
|
| 81 |
-
try:
|
| 82 |
-
yield json.loads(s, cls=(decoder := RawJSONDecoder(index)))
|
| 83 |
-
index = decoder.end
|
| 84 |
-
except json.JSONDecodeError:
|
| 85 |
-
index += 1
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
def parse_json_garbage(s: str) -> Any:
|
| 89 |
-
# Find the first occurrence of a JSON opening brace or bracket
|
| 90 |
-
candidates = list(extract_json(s))
|
| 91 |
-
if len(candidates) >= 1:
|
| 92 |
-
return candidates[0]
|
| 93 |
-
|
| 94 |
-
raise ValueError("Not a valid JSON string")
|
| 95 |
-
|
| 96 |
-
|
| 97 |
def extract_think(content):
|
| 98 |
# Added by Cursor 20250726 jmd
|
| 99 |
# Extract content within <think>...</think>
|
|
@@ -162,7 +117,7 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 162 |
|
| 163 |
Tool calling:
|
| 164 |
```
|
| 165 |
-
from
|
| 166 |
|
| 167 |
class GetWeather(BaseModel):
|
| 168 |
'''Get the current weather in a given location'''
|
|
@@ -188,78 +143,25 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 188 |
""" # noqa: E501
|
| 189 |
|
| 190 |
tool_system_prompt_template: str = DEFAULT_SYSTEM_TEMPLATE
|
| 191 |
-
# Suffix to add to the system prompt that is not templated 20250717 jmd
|
| 192 |
-
system_message_suffix: str = ""
|
| 193 |
-
|
| 194 |
-
override_bind_tools: bool = True
|
| 195 |
|
| 196 |
def __init__(self, **kwargs: Any) -> None:
|
| 197 |
-
override_bind_tools = True
|
| 198 |
-
if "override_bind_tools" in kwargs:
|
| 199 |
-
override_bind_tools = kwargs["override_bind_tools"]
|
| 200 |
-
del kwargs["override_bind_tools"]
|
| 201 |
super().__init__(**kwargs)
|
| 202 |
-
self.override_bind_tools = override_bind_tools
|
| 203 |
-
|
| 204 |
-
def bind_tools(
|
| 205 |
-
self,
|
| 206 |
-
tools: Sequence[Union[Dict[str, Any], Type[BaseModel], Callable, BaseTool]],
|
| 207 |
-
**kwargs: Any,
|
| 208 |
-
) -> Runnable[LanguageModelInput, BaseMessage]:
|
| 209 |
-
if self.override_bind_tools:
|
| 210 |
-
return self.bind(functions=tools, **kwargs)
|
| 211 |
-
else:
|
| 212 |
-
return super().bind_tools(tools, **kwargs)
|
| 213 |
|
| 214 |
def _generate_system_message_and_functions(
|
| 215 |
self,
|
| 216 |
kwargs: Dict[str, Any],
|
| 217 |
) -> Tuple[BaseMessage, List]:
|
| 218 |
-
functions = kwargs.get("tools",
|
| 219 |
-
functions = [
|
| 220 |
-
(
|
| 221 |
-
fn["function"]
|
| 222 |
-
if (
|
| 223 |
-
not _is_pydantic_class(fn)
|
| 224 |
-
and not _is_pydantic_object(fn)
|
| 225 |
-
and "name" not in fn.keys()
|
| 226 |
-
and "function" in fn.keys()
|
| 227 |
-
and "name" in fn["function"].keys()
|
| 228 |
-
)
|
| 229 |
-
else fn
|
| 230 |
-
)
|
| 231 |
-
for fn in functions
|
| 232 |
-
]
|
| 233 |
-
|
| 234 |
-
# langchain_openai/chat_models/base.py:
|
| 235 |
-
# NOTE: Using bind_tools is recommended instead, as the `functions` and
|
| 236 |
-
# `function_call` request parameters are officially marked as
|
| 237 |
-
# deprecated by OpenAI.
|
| 238 |
-
|
| 239 |
-
# if "functions" in kwargs:
|
| 240 |
-
# del kwargs["functions"]
|
| 241 |
-
# if "function_call" in kwargs:
|
| 242 |
-
# functions = [
|
| 243 |
-
# fn for fn in functions if fn["name"] == kwargs["function_call"]["name"]
|
| 244 |
-
# ]
|
| 245 |
-
# if not functions:
|
| 246 |
-
# raise ValueError(
|
| 247 |
-
# "If `function_call` is specified, you must also pass a "
|
| 248 |
-
# "matching function in `functions`."
|
| 249 |
-
# )
|
| 250 |
-
# del kwargs["function_call"]
|
| 251 |
|
|
|
|
| 252 |
functions = [convert_to_openai_tool(fn) for fn in functions]
|
|
|
|
| 253 |
system_message_prompt_template = SystemMessagePromptTemplate.from_template(
|
| 254 |
self.tool_system_prompt_template
|
| 255 |
)
|
| 256 |
system_message = system_message_prompt_template.format(
|
| 257 |
tools=json.dumps(functions, indent=2)
|
| 258 |
)
|
| 259 |
-
# Add extra context after the formatted system message 20250717 jmd
|
| 260 |
-
system_message = SystemMessage(
|
| 261 |
-
system_message.content + self.system_message_suffix
|
| 262 |
-
)
|
| 263 |
return system_message, functions
|
| 264 |
|
| 265 |
def _process_response(
|
|
@@ -275,16 +177,8 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 275 |
try:
|
| 276 |
parsed_json_result = json.loads(post_think)
|
| 277 |
except json.JSONDecodeError:
|
| 278 |
-
|
| 279 |
-
|
| 280 |
-
print(post_think)
|
| 281 |
-
parsed_json_result = parse_json_garbage(post_think)
|
| 282 |
-
except Exception:
|
| 283 |
-
# Return entire response if JSON is missing or wasn't parsed
|
| 284 |
-
return AIMessage(content=response_message.content)
|
| 285 |
-
|
| 286 |
-
print("parsed_json_result")
|
| 287 |
-
print(parsed_json_result)
|
| 288 |
|
| 289 |
# Get tool name from output
|
| 290 |
called_tool_name = (
|
|
@@ -299,7 +193,7 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 299 |
)
|
| 300 |
if called_tool is None:
|
| 301 |
# Issue a warning and return the generated content 20250727 jmd
|
| 302 |
-
warnings.warn(f"Called tool ({
|
| 303 |
return AIMessage(content=response_message.content)
|
| 304 |
|
| 305 |
# Get tool arguments from output
|
|
@@ -314,7 +208,7 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 314 |
)
|
| 315 |
|
| 316 |
# Put together response message
|
| 317 |
-
|
| 318 |
content=f"<think>\n{think_text}\n</think>",
|
| 319 |
tool_calls=[
|
| 320 |
ToolCall(
|
|
@@ -325,7 +219,7 @@ class ToolCallingLLM(BaseChatModel, ABC):
|
|
| 325 |
],
|
| 326 |
)
|
| 327 |
|
| 328 |
-
return
|
| 329 |
|
| 330 |
def _generate(
|
| 331 |
self,
|
|
|
|
| 49 |
""" # noqa: E501
|
| 50 |
|
| 51 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 52 |
def extract_think(content):
|
| 53 |
# Added by Cursor 20250726 jmd
|
| 54 |
# Extract content within <think>...</think>
|
|
|
|
| 117 |
|
| 118 |
Tool calling:
|
| 119 |
```
|
| 120 |
+
from pydantic import BaseModel, Field
|
| 121 |
|
| 122 |
class GetWeather(BaseModel):
|
| 123 |
'''Get the current weather in a given location'''
|
|
|
|
| 143 |
""" # noqa: E501
|
| 144 |
|
| 145 |
tool_system_prompt_template: str = DEFAULT_SYSTEM_TEMPLATE
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
|
| 147 |
def __init__(self, **kwargs: Any) -> None:
|
|
|
|
|
|
|
|
|
|
|
|
|
| 148 |
super().__init__(**kwargs)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 149 |
|
| 150 |
def _generate_system_message_and_functions(
|
| 151 |
self,
|
| 152 |
kwargs: Dict[str, Any],
|
| 153 |
) -> Tuple[BaseMessage, List]:
|
| 154 |
+
functions = kwargs.get("tools", [])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 155 |
|
| 156 |
+
# Convert functions to OpenAI tool schema
|
| 157 |
functions = [convert_to_openai_tool(fn) for fn in functions]
|
| 158 |
+
# Create system message with tool descriptions
|
| 159 |
system_message_prompt_template = SystemMessagePromptTemplate.from_template(
|
| 160 |
self.tool_system_prompt_template
|
| 161 |
)
|
| 162 |
system_message = system_message_prompt_template.format(
|
| 163 |
tools=json.dumps(functions, indent=2)
|
| 164 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 165 |
return system_message, functions
|
| 166 |
|
| 167 |
def _process_response(
|
|
|
|
| 177 |
try:
|
| 178 |
parsed_json_result = json.loads(post_think)
|
| 179 |
except json.JSONDecodeError:
|
| 180 |
+
# Return entire response if JSON wasn't parsed (or is missing)
|
| 181 |
+
return AIMessage(content=response_message.content)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 182 |
|
| 183 |
# Get tool name from output
|
| 184 |
called_tool_name = (
|
|
|
|
| 193 |
)
|
| 194 |
if called_tool is None:
|
| 195 |
# Issue a warning and return the generated content 20250727 jmd
|
| 196 |
+
warnings.warn(f"Called tool ({called_tool_name}) not in functions list")
|
| 197 |
return AIMessage(content=response_message.content)
|
| 198 |
|
| 199 |
# Get tool arguments from output
|
|
|
|
| 208 |
)
|
| 209 |
|
| 210 |
# Put together response message
|
| 211 |
+
response_message = AIMessage(
|
| 212 |
content=f"<think>\n{think_text}\n</think>",
|
| 213 |
tool_calls=[
|
| 214 |
ToolCall(
|
|
|
|
| 219 |
],
|
| 220 |
)
|
| 221 |
|
| 222 |
+
return response_message
|
| 223 |
|
| 224 |
def _generate(
|
| 225 |
self,
|