File size: 3,057 Bytes
f3d287f
 
 
a83c01d
 
3cb4b1d
a83c01d
f3d287f
 
a83c01d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f3d287f
 
a83c01d
 
 
 
f3d287f
 
a83c01d
 
3cb4b1d
a83c01d
f3d287f
 
a83c01d
 
3cb4b1d
a83c01d
 
 
 
 
 
 
de324c6
 
 
 
 
 
 
 
a83c01d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
de324c6
a83c01d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f3d287f
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "experiments": [
    {
      "name": "Bash Only + Claude Sonnet 4.6",
      "data_file": "bash_only_+_claude_sonnet_4.6_vanilla.json",
      "tag": "vanilla",
      "model_id": "anthropic/claude-sonnet-4-6"
    },
    {
      "name": "Bash Only + Claude Sonnet 4.6",
      "data_file": "bash_only_+_claude_sonnet_4.6_benign.json",
      "tag": "benign",
      "model_id": "anthropic/claude-sonnet-4-6"
    },
    {
      "name": "Bash Only + Claude Sonnet 4.6",
      "data_file": "bash_only_+_claude_sonnet_4.6_malignant.json",
      "tag": "malignant",
      "model_id": "anthropic/claude-sonnet-4-6"
    },
    {
      "name": "Bash Only + Claude Sonnet 4.6",
      "data_file": "bash_only_+_claude_sonnet_4.6_rust-specific.json",
      "tag": "rust-specific",
      "model_id": "anthropic/claude-sonnet-4-6"
    },
    {
      "name": "Bash Only + GPT 5.4",
      "data_file": "bash_only_+_gpt_5.4_vanilla.json",
      "tag": "vanilla",
      "model_id": "openai/gpt-5.4"
    },
    {
      "name": "Bash Only + GPT 5.4",
      "data_file": "bash_only_+_gpt_5.4_benign.json",
      "tag": "benign",
      "model_id": "openai/gpt-5.4"
    },
    {
      "name": "Bash Only + GPT 5.4",
      "data_file": "bash_only_+_gpt_5.4_malignant.json",
      "tag": "malignant",
      "model_id": "openai/gpt-5.4"
    },
    {
      "name": "Bash Only + GPT 5.4",
      "data_file": "bash_only_+_gpt_5.4_rust-specific.json",
      "tag": "rust-specific",
      "model_id": "openai/gpt-5.4"
    },
    {
      "name": "Bash Only + Gemini 3.1 Pro",
      "data_file": "bash_only_+_gemini_3.1_pro_vanilla.json",
      "tag": "vanilla",
      "model_id": "google/gemini-3.1-pro-preview"
    },
    {
      "name": "Bash Only + Gemini 3.1 Pro",
      "data_file": "bash_only_+_gemini_3.1_pro_benign.json",
      "tag": "benign",
      "model_id": "google/gemini-3.1-pro-preview"
    },
    {
      "name": "Bash Only + Gemini 3.1 Pro",
      "data_file": "bash_only_+_gemini_3.1_pro_malignant.json",
      "tag": "malignant",
      "model_id": "google/gemini-3.1-pro-preview"
    },
    {
      "name": "Bash Only + Gemini 3.1 Pro",
      "data_file": "bash_only_+_gemini_3.1_pro_rust-specific.json",
      "tag": "rust-specific",
      "model_id": "google/gemini-3.1-pro-preview"
    },
    {
      "name": "Bash Only + Qwen 3.6 Plus",
      "data_file": "bash_only_+_qwen_3.6_plus_vanilla.json",
      "tag": "vanilla",
      "model_id": "openrouter/qwen/qwen3.6-plus"
    },
    {
      "name": "Bash Only + Qwen 3.6 Plus",
      "data_file": "bash_only_+_qwen_3.6_plus_benign.json",
      "tag": "benign",
      "model_id": "openrouter/qwen/qwen3.6-plus"
    },
    {
      "name": "Bash Only + Qwen 3.6 Plus",
      "data_file": "bash_only_+_qwen_3.6_plus_malignant.json",
      "tag": "malignant",
      "model_id": "openrouter/qwen/qwen3.6-plus"
    },
    {
      "name": "Bash Only + Qwen 3.6 Plus",
      "data_file": "bash_only_+_qwen_3.6_plus_rust-specific.json",
      "tag": "rust-specific",
      "model_id": "openrouter/qwen/qwen3.6-plus"
    }
  ]
}