OpenPipe
/

Llama-3.1-70B-Instruct

+{#- Chat template with three prompt formats chosen by `template_variant`: "llama31instruct", "pipeline3", or the default "official" (any other value also takes the final else branch). #}
+{{- bos_token }}
+{%- set template_variant = template_variant | default("official") %}
+{#- Variant "llama31instruct": header/eot framing where assistant tool calls are wrapped in start_tool_call / end_tool_call markers. #}
+{%- if template_variant == "llama31instruct" %}
+  {%- if not tools is defined %}
+    {%- set tools = none %}
+  {%- endif %}
+  {#- A leading system or developer message is removed from the list; its trimmed content is rendered inside the system header below. #}
+  {%- if messages[0]['role'] in ['system', 'developer'] %}
+    {%- set system_message = messages[0]['content']|trim %}
+    {%- set messages = messages[1:] %}
+  {%- else %}
+    {%- set system_message = "" %}
+  {%- endif %}
+  {{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
+  {#- When at least one tool is supplied, the calling instructions and each tool definition (compact JSON) precede the system message. #}
+  {%- if tools is not none and tools|length > 0 %}
+    {{- "Environment: ipython\n" }}
+    {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
+    {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
+    {{- "Do not use variables.\n\n" }}
+    {%- for t in tools %}
+      {{- t | tojson }}
+      {{- "\n\n" }}
+    {%- endfor %}
+  {%- endif %}
+  {{- system_message }}
+  {{- "<|eot_id|>" }}
+  {%- for message in messages %}
+    {#- Ordinary turn: role header followed by the trimmed content. #}
+    {%- if not (message.role == 'tool' or 'tool_calls' in message) %}
+      {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] | trim + '<|eot_id|>' }}
+    {#- Assistant turn with tool calls: every call is emitted as a name/parameters JSON object between the markers, separated by ", ". #}
+    {%- elif 'tool_calls' in message %}
+      {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
+      {%- for tool_call in message.tool_calls -%}
+        {{- '<|start_tool_call|>' }}
+        {{- '{"name": "' + tool_call.function.name + '", ' }}
+        {{- '"parameters": ' }}
+        {{- tool_call.function.arguments | tojson }}
+        {{- "}" }}
+        {{- '<|end_tool_call|>' }}
+        {%- if not loop.last %}, {% endif %}
+      {%- endfor -%}
+      {{- "<|eot_id|>" }}
+    {#- Tool result: rendered under the ipython header. NOTE(review): strings also satisfy `is iterable`, so string content goes through tojson as well - confirm this is intended. #}
+    {%- elif message.role == "tool" %}
+      {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
+      {%- if message.content is mapping or message.content is iterable %}
+        {{- message.content | tojson }}
+      {%- else %}
+        {{- message.content }}
+      {%- endif %}
+      {{- "<|eot_id|>" }}
+    {%- endif %}
+  {%- endfor %}
+  {%- if add_generation_prompt %}
+    {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
+  {%- endif %}
+{#- Variant "pipeline3": the whole conversation is serialised as one JSON object between "### Instruction:" and "### Response:". add_generation_prompt is not consulted in this branch. #}
+{%- elif template_variant == "pipeline3" %}
+  {%- if not tools is defined %}
+    {%- set tools = none %}
+  {%- endif %}
+  {#- Only the function names of the supplied tools are forwarded, not their full definitions. #}
+  {%- set functions = tools | map(attribute="function") | map(attribute="name") | list if tools is not none else none %}
+  {{- "### Instruction:\n" }}
+  {%- if functions is not none %}
+    {{- {"messages": messages, "functions": functions} | tojson }}
+  {%- else %}
+    {{- {"messages": messages} | tojson }}
+  {%- endif %}
+  {{- "\n\n### Response:\n" }}
+{#- Default ("official") variant. Optional inputs read below: custom_tools, tools_in_user_message, date_string, builtin_tools. #}
+{%- else %}
+  {#- custom_tools, when defined, replaces tools; the remaining optional inputs get defaults. #}
+  {%- if custom_tools is defined %}
+    {%- set tools = custom_tools %}
+  {%- endif %}
+  {%- if not tools_in_user_message is defined %}
+    {%- set tools_in_user_message = true %}
+  {%- endif %}
+  {%- if not date_string is defined %}
+    {%- set date_string = "26 Jul 2024" %}
+  {%- endif %}
+  {%- if not tools is defined %}
+    {%- set tools = none %}
+  {%- endif %}
+  {%- if messages[0]['role'] == 'system' %}
+    {%- set system_message = messages[0]['content']|trim %}
+    {%- set messages = messages[1:] %}
+  {%- else %}
+    {%- set system_message = "" %}
+  {%- endif %}
+  {{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
+  {%- if builtin_tools is defined or tools is not none %}
+    {{- "Environment: ipython\n" }}
+  {%- endif %}
+  {#- The Tools line lists every builtin tool except code_interpreter. #}
+  {%- if builtin_tools is defined %}
+    {{- "Tools: " + builtin_tools | reject('equalto', 'code_interpreter') | join(", ") + "\n\n" }}
+  {%- endif %}
+  {{- "Cutting Knowledge Date: December 2023\n" }}
+  {{- "Today Date: " + date_string + "\n\n" }}
+  {#- Tool definitions go into the system prompt only when tools_in_user_message is false. #}
+  {%- if tools is not none and not tools_in_user_message %}
+    {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
+    {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
+    {{- "Do not use variables.\n\n" }}
+    {%- for t in tools %}
+      {{- t | tojson(indent=4) }}
+      {{- "\n\n" }}
+    {%- endfor %}
+  {%- endif %}
+  {{- system_message }}
+  {{- "<|eot_id|>" }}
+  {#- Otherwise the first remaining message is consumed and re-emitted as a user turn with the tool definitions prepended; its role is not checked here. #}
+  {%- if tools_in_user_message and not tools is none %}
+    {%- if messages | length != 0 %}
+      {%- set first_user_message = messages[0]['content']|trim %}
+      {%- set messages = messages[1:] %}
+    {%- else %}
+      {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
+    {%- endif %}
+    {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
+    {{- "Given the following functions, please respond with a JSON for a function call " }}
+    {{- "with its proper arguments that best answers the given prompt.\n\n" }}
+    {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
+    {{- "Do not use variables.\n\n" }}
+    {%- for t in tools %}
+      {{- t | tojson(indent=4) }}
+      {{- "\n\n" }}
+    {%- endfor %}
+    {{- first_user_message + "<|eot_id|>" }}
+  {%- endif %}
+  {%- for message in messages %}
+    {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
+      {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] | trim + '<|eot_id|>' }}
+    {%- elif 'tool_calls' in message %}
+      {#- This branch accepts exactly one tool call per assistant message. #}
+      {%- if not message.tool_calls|length == 1 %}
+        {{- raise_exception("This model only supports single tool-calls at once!") }}
+      {%- endif %}
+      {%- set tool_call = message.tool_calls[0].function %}
+      {#- Builtin tools are rendered as python_tag + name.call(arg="value", ...); all other tools as a name/parameters JSON object. #}
+      {%- if builtin_tools is defined and tool_call.name in builtin_tools %}
+        {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
+        {{- "<|python_tag|>" + tool_call.name + ".call(" }}
+        {%- for arg_name, arg_val in tool_call.arguments | items %}
+          {{- arg_name + '="' + arg_val + '"' }}
+          {%- if not loop.last %}
+            {{- ", " }}
+          {%- endif %}
+        {%- endfor %}
+        {{- ")" }}
+      {%- else %}
+        {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
+        {{- '{"name": "' + tool_call.name + '", ' }}
+        {{- '"parameters": ' }}
+        {{- tool_call.arguments | tojson }}
+        {{- "}" }}
+      {%- endif %}
+      {#- The turn ends with eom_id whenever builtin_tools is defined, otherwise with eot_id. #}
+      {%- if builtin_tools is defined %}
+        {{- "<|eom_id|>" }}
+      {%- else %}
+        {{- "<|eot_id|>" }}
+      {%- endif %}
+    {%- elif message.role == "tool" or message.role == "ipython" %}
+      {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
+      {%- if message.content is mapping or message.content is iterable %}
+        {{- message.content | tojson }}
+      {%- else %}
+        {{- message.content }}
+      {%- endif %}
+      {{- "<|eot_id|>" }}
+    {%- endif %}
+  {%- endfor %}
+  {%- if add_generation_prompt %}
+    {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
+  {%- endif %}
+{%- endif %}

openpipe_llama_dual.py ADDED Viewed

	@@ -0,0 +1,264 @@

+import json
+from collections.abc import Sequence
+from typing import Any, Optional
+from vllm.entrypoints.openai.chat_completion.protocol import ChatCompletionRequest
+from vllm.entrypoints.openai.engine.protocol import (
+    DeltaFunctionCall,
+    DeltaMessage,
+    DeltaToolCall,
+    ExtractedToolCallInformation,
+    FunctionCall,
+    ToolCall,
+)
+from vllm.tokenizers import TokenizerLike
+from vllm.tool_parsers.abstract_tool_parser import ToolParser, ToolParserManager
+@ToolParserManager.register_module(["openpipe_llama_dual"])
+class OpenPipeLlamaDualParser(ToolParser):
+    """Parse official JSON, llama31 tool markers, and pipeline3 function tags.
+
+    Three tool-call encodings are recognised in model output:
+
+    * a bare JSON object with ``name``/``parameters`` keys (or a nested
+      ``function`` object with ``name``/``arguments``);
+    * JSON payloads wrapped between ``LEGACY_START`` and ``LEGACY_END``;
+    * ``<function>NAME<arguments>ARGS`` sequences.
+
+    When the request carries ``chat_template_kwargs["template_variant"]``,
+    its value is compared against the ``VARIANT_*`` constants to choose which
+    encoding to look for; the markers themselves are also detected directly.
+    """
+    # Delimiters around one JSON tool call in the marker-based encoding.
+    LEGACY_START = "<|start_tool_call|>"
+    LEGACY_END = "<|end_tool_call|>"
+    # Tags introducing a function name and its arguments in the tag encoding.
+    FUNCTION_CALL_TAG = "<function>"
+    FUNCTION_ARGS_TAG = "<arguments>"
+    # Accepted values of the ``template_variant`` chat-template kwarg.
+    VARIANT_LLAMA31 = "llama31instruct"
+    VARIANT_PIPELINE3 = "pipeline3"
+    VARIANT_OFFICIAL = "official"
+    def __init__(self, tokenizer: TokenizerLike):
+        """Initialise the base parser and keep *tokenizer* on the instance."""
+        super().__init__(tokenizer)
+        self.tokenizer = tokenizer
+    def _get_template_variant(self, request: ChatCompletionRequest) -> Optional[str]:
+        kwargs = getattr(request, "chat_template_kwargs", None)
+        if kwargs is None:
+            return None
+        if isinstance(kwargs, dict):
+            value = kwargs.get("template_variant")
+            return value if isinstance(value, str) else None
+        value = getattr(kwargs, "template_variant", None)
+        return value if isinstance(value, str) else None
+    def _normalize_tool_call(self, payload: dict[str, Any]) -> Optional[dict[str, Any]]:
+        if "name" in payload and "parameters" in payload:
+            return {
+                "name": payload["name"],
+                "arguments": payload["parameters"],
+            }
+        if "function" in payload and isinstance(payload["function"], dict):
+            function = payload["function"]
+            if "name" in function and "arguments" in function:
+                return {
+                    "name": function["name"],
+                    "arguments": function["arguments"],
+                }
+        return None
+    def _extract_legacy_tool_calls(self, text: str) -> list[dict[str, Any]]:
+        tool_calls = []
+        current_index = 0
+        while True:
+            start_index = text.find(self.LEGACY_START, current_index)
+            if start_index == -1:
+                break
+            end_index = text.find(self.LEGACY_END, start_index)
+            if end_index == -1:
+                break
+            tool_call_json = text[start_index + len(self.LEGACY_START) : end_index].strip()
+            payload = json.loads(tool_call_json)
+            normalized = self._normalize_tool_call(payload)
+            if normalized:
+                tool_calls.append(normalized)
+            current_index = end_index + len(self.LEGACY_END)
+        return tool_calls
+    def _extract_function_tag_tool_calls(self, text: str) -> list[dict[str, Any]]:
+        tool_calls = []
+        current_index = 0
+        while True:
+            function_start = text.find(self.FUNCTION_CALL_TAG, current_index)
+            if function_start == -1:
+                break
+            name_start = function_start + len(self.FUNCTION_CALL_TAG)
+            args_tag_index = text.find(self.FUNCTION_ARGS_TAG, name_start)
+            if args_tag_index == -1:
+                break
+            function_name = text[name_start:args_tag_index].strip()
+            if not function_name:
+                break
+            arguments_start = args_tag_index + len(self.FUNCTION_ARGS_TAG)
+            next_function_index = text.find(self.FUNCTION_CALL_TAG, arguments_start)
+            if next_function_index == -1:
+                arguments_raw = text[arguments_start:].strip()
+                current_index = len(text)
+            else:
+                arguments_raw = text[arguments_start:next_function_index].strip()
+                current_index = next_function_index
+            if not arguments_raw:
+                arguments: Any = ""
+            else:
+                try:
+                    arguments = json.loads(arguments_raw)
+                except Exception:
+                    arguments = arguments_raw
+            tool_calls.append(
+                {
+                    "name": function_name,
+                    "arguments": arguments,
+                }
+            )
+        return tool_calls
+    def _extract_official_tool_call(self, text: str) -> Optional[dict[str, Any]]:
+        stripped = text.strip()
+        if not stripped.startswith("{") or not stripped.endswith("}"):
+            return None
+        payload = json.loads(stripped)
+        return self._normalize_tool_call(payload)
+    def _build_delta_tool_call(self, tool_call: dict[str, Any], index: int = 0) -> DeltaMessage:
+        arguments = tool_call["arguments"]
+        return DeltaMessage(
+            tool_calls=[
+                DeltaToolCall(
+                    index=index,
+                    id=f"call_{tool_call['name']}",
+                    type="function",
+                    function=DeltaFunctionCall(
+                        name=tool_call["name"],
+                        arguments=json.dumps(arguments, ensure_ascii=False)
+                        if isinstance(arguments, (dict, list))
+                        else arguments,
+                    ),
+                )
+            ]
+        )
+    def _build_tool_calls_response(
+        self,
+        tool_calls: list[dict[str, Any]],
+    ) -> ExtractedToolCallInformation:
+        return ExtractedToolCallInformation(
+            tools_called=True,
+            tool_calls=[
+                ToolCall(
+                    id=f"call_{index + 1}",
+                    type="function",
+                    function=FunctionCall(
+                        name=tool_call["name"],
+                        arguments=json.dumps(
+                            tool_call["arguments"], ensure_ascii=False
+                        )
+                        if isinstance(tool_call["arguments"], (dict, list))
+                        else tool_call["arguments"],
+                    ),
+                )
+                for index, tool_call in enumerate(tool_calls)
+            ],
+            content=None,
+        )
+    def _looks_like_partial_official_json(self, text: str) -> bool:
+        stripped = text.strip()
+        if not stripped.startswith("{"):
+            return False
+        if stripped.endswith("}"):
+            return False
+        return (
+            '"name"' in stripped
+            or '"parameters"' in stripped
+            or '"function"' in stripped
+        )
+    def extract_tool_calls_streaming(
+        self,
+        previous_text: str,
+        current_text: str,
+        delta_text: str,
+        previous_token_ids: Sequence[int],
+        current_token_ids: Sequence[int],
+        delta_token_ids: Sequence[int],
+        request: ChatCompletionRequest,
+    ) -> DeltaMessage | None:
+        variant = self._get_template_variant(request)
+        try:
+            if (
+                variant == self.VARIANT_LLAMA31
+                or self.LEGACY_START in current_text
+            ):
+                if self.LEGACY_START in current_text and self.LEGACY_END in current_text:
+                    tool_calls = self._extract_legacy_tool_calls(current_text)
+                    if tool_calls:
+                        return self._build_delta_tool_call(
+                            tool_calls[-1], index=len(tool_calls) - 1
+                        )
+                if self.LEGACY_START in current_text:
+                    return None
+                return DeltaMessage(content=delta_text)
+            if variant == self.VARIANT_PIPELINE3 or self.FUNCTION_CALL_TAG in current_text:
+                tool_calls = self._extract_function_tag_tool_calls(current_text)
+                if tool_calls:
+                    return self._build_delta_tool_call(
+                        tool_calls[-1], index=len(tool_calls) - 1
+                    )
+                return None
+            official_tool_call = self._extract_official_tool_call(current_text)
+            if official_tool_call:
+                return self._build_delta_tool_call(official_tool_call)
+            if variant == self.VARIANT_OFFICIAL and self._looks_like_partial_official_json(
+                current_text
+            ):
+                return None
+        except Exception:
+            return DeltaMessage(content=delta_text)
+        return DeltaMessage(content=delta_text)
+    def extract_tool_calls(
+        self,
+        model_output: str,
+        request: ChatCompletionRequest,
+    ) -> ExtractedToolCallInformation:
+        variant = self._get_template_variant(request)
+        try:
+            if (
+                variant == self.VARIANT_LLAMA31
+                or self.LEGACY_START in model_output
+            ):
+                tool_calls = self._extract_legacy_tool_calls(model_output)
+                if tool_calls:
+                    return self._build_tool_calls_response(tool_calls)
+            if variant == self.VARIANT_PIPELINE3 or self.FUNCTION_CALL_TAG in model_output:
+                tool_calls = self._extract_function_tag_tool_calls(model_output)
+                if tool_calls:
+                    return self._build_tool_calls_response(tool_calls)
+            official_tool_call = self._extract_official_tool_call(model_output)
+            if official_tool_call:
+                return self._build_tool_calls_response([official_tool_call])
+        except Exception:
+            pass
+        return ExtractedToolCallInformation(
+            tools_called=False,
+            tool_calls=[],
+            content=model_output,
+        )