.eval_results/claw-eval.yaml DELETED
@@ -1,20 +0,0 @@
1
- - dataset:
2
- id: claw-eval/Claw-Eval
3
- task_id: general
4
- value: 62.7
5
- date: '2026-04-23'
6
- notes: "Pass³% | N=3 | 161 tasks"
7
- source:
8
- url: https://claw-eval.github.io
9
- name: Claw-Eval Leaderboard
10
- user: tobiaslee
11
- - dataset:
12
- id: claw-eval/Claw-Eval
13
- task_id: multi_turn
14
- value: 60.5
15
- date: '2026-04-23'
16
- notes: "Pass³% | N=3 | 38 tasks"
17
- source:
18
- url: https://claw-eval.github.io
19
- name: Claw-Eval Leaderboard
20
- user: tobiaslee
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
chat_template.jinja CHANGED
@@ -94,7 +94,7 @@ For each function call, output the function name and arguments within the follow
94
  {%- endif %}
95
  {%- if m.content is string -%}
96
  {{- '<tool_response>' + m.content + '</tool_response>' -}}
97
- {%- elif m.content is iterable and m.content is not mapping and m.content and m.content.0.type == "tool_reference" -%}
98
  {{- '<tool_response><tools>\n' -}}
99
  {% for tr in m.content %}
100
  {%- for tool in tools -%}
@@ -107,8 +107,6 @@ For each function call, output the function name and arguments within the follow
107
  {%- endfor -%}
108
  {%- endfor -%}
109
  {{- '</tools></tool_response>' -}}
110
- {%- else -%}
111
- {{- '<tool_response>' + visible_text(m.content) + '</tool_response>' -}}
112
  {% endif -%}
113
  {%- elif m.role == 'system' -%}
114
  <|system|>{{ visible_text(m.content) }}
 
94
  {%- endif %}
95
  {%- if m.content is string -%}
96
  {{- '<tool_response>' + m.content + '</tool_response>' -}}
97
+ {%- else -%}
98
  {{- '<tool_response><tools>\n' -}}
99
  {% for tr in m.content %}
100
  {%- for tool in tools -%}
 
107
  {%- endfor -%}
108
  {%- endfor -%}
109
  {{- '</tools></tool_response>' -}}
 
 
110
  {% endif -%}
111
  {%- elif m.role == 'system' -%}
112
  <|system|>{{ visible_text(m.content) }}