SaylorTwift HF Staff committed on
Commit
6b7bd2f
·
verified ·
1 Parent(s): 883f633

Add multimodal Claw-Eval result

Browse files
Files changed (1) hide show
  1. .eval_results/claw_eval.yaml +12 -2
.eval_results/claw_eval.yaml CHANGED
@@ -3,7 +3,7 @@
3
  task_id: general
4
  value: 61.5
5
  date: '2026-04-23'
6
- notes: Pass³% | N=3 | 161 tasks
7
  source:
8
  url: https://claw-eval.github.io
9
  name: Claw-Eval Leaderboard
@@ -13,7 +13,17 @@
13
  task_id: multi_turn
14
  value: 65.8
15
  date: '2026-04-23'
16
- notes: Pass³% | N=3 | 38 tasks
 
 
 
 
 
 
 
 
 
 
17
  source:
18
  url: https://claw-eval.github.io
19
  name: Claw-Eval Leaderboard
 
3
  task_id: general
4
  value: 61.5
5
  date: '2026-04-23'
6
+ notes: "Pass³% | N=3 | 161 tasks"
7
  source:
8
  url: https://claw-eval.github.io
9
  name: Claw-Eval Leaderboard
 
13
  task_id: multi_turn
14
  value: 65.8
15
  date: '2026-04-23'
16
+ notes: "Pass³% | N=3 | 38 tasks"
17
+ source:
18
+ url: https://claw-eval.github.io
19
+ name: Claw-Eval Leaderboard
20
+ user: tobiaslee
21
+ - dataset:
22
+ id: claw-eval/Claw-Eval
23
+ task_id: multimodal
24
+ value: 18.8
25
+ date: '2026-04-23'
26
+ notes: "Pass³% | N=3 | 101 tasks"
27
  source:
28
  url: https://claw-eval.github.io
29
  name: Claw-Eval Leaderboard