m4vic commited on
Commit
b73efcd
·
verified ·
1 Parent(s): a9d2366

Upload results summary

Browse files
Files changed (1) hide show
  1. all_results_summary.json +218 -0
all_results_summary.json ADDED
@@ -0,0 +1,218 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "model": "logistic_regression",
4
+ "accuracy": 0.7871,
5
+ "f1_macro": 0.7306,
6
+ "f1_weighted": 0.778,
7
+ "precision_macro": 0.7901,
8
+ "recall_macro": 0.7021,
9
+ "train_time_seconds": 6.97,
10
+ "inference_ms_per_sample": 0.0381,
11
+ "per_class": {
12
+ "benign": {
13
+ "precision": 0.959,
14
+ "recall": 0.9779,
15
+ "f1": 0.9683,
16
+ "support": 813.0
17
+ },
18
+ "direct_injection": {
19
+ "precision": 0.6411,
20
+ "recall": 0.8973,
21
+ "f1": 0.7479,
22
+ "support": 876.0
23
+ },
24
+ "system_extraction": {
25
+ "precision": 0.7306,
26
+ "recall": 0.6851,
27
+ "f1": 0.7071,
28
+ "support": 289.0
29
+ },
30
+ "role_hijack": {
31
+ "precision": 0.8773,
32
+ "recall": 0.7256,
33
+ "f1": 0.7942,
34
+ "support": 266.0
35
+ },
36
+ "obfuscation": {
37
+ "precision": 0.9467,
38
+ "recall": 0.5575,
39
+ "f1": 0.7018,
40
+ "support": 287.0
41
+ },
42
+ "tool_abuse": {
43
+ "precision": 0.9858,
44
+ "recall": 0.8529,
45
+ "f1": 0.9146,
46
+ "support": 408.0
47
+ },
48
+ "indirect_injection": {
49
+ "precision": 0.3902,
50
+ "recall": 0.2184,
51
+ "f1": 0.2801,
52
+ "support": 293.0
53
+ }
54
+ }
55
+ },
56
+ {
57
+ "model": "linear_svm",
58
+ "accuracy": 0.7871,
59
+ "f1_macro": 0.7358,
60
+ "f1_weighted": 0.7826,
61
+ "precision_macro": 0.77,
62
+ "recall_macro": 0.716,
63
+ "train_time_seconds": 1.9,
64
+ "inference_ms_per_sample": 0.0356,
65
+ "per_class": {
66
+ "benign": {
67
+ "precision": 0.9697,
68
+ "recall": 0.9828,
69
+ "f1": 0.9762,
70
+ "support": 813.0
71
+ },
72
+ "direct_injection": {
73
+ "precision": 0.6721,
74
+ "recall": 0.847,
75
+ "f1": 0.7495,
76
+ "support": 876.0
77
+ },
78
+ "system_extraction": {
79
+ "precision": 0.7127,
80
+ "recall": 0.6782,
81
+ "f1": 0.695,
82
+ "support": 289.0
83
+ },
84
+ "role_hijack": {
85
+ "precision": 0.8353,
86
+ "recall": 0.8008,
87
+ "f1": 0.8177,
88
+ "support": 266.0
89
+ },
90
+ "obfuscation": {
91
+ "precision": 0.873,
92
+ "recall": 0.5749,
93
+ "f1": 0.6933,
94
+ "support": 287.0
95
+ },
96
+ "tool_abuse": {
97
+ "precision": 0.9749,
98
+ "recall": 0.8554,
99
+ "f1": 0.9112,
100
+ "support": 408.0
101
+ },
102
+ "indirect_injection": {
103
+ "precision": 0.3524,
104
+ "recall": 0.273,
105
+ "f1": 0.3077,
106
+ "support": 293.0
107
+ }
108
+ }
109
+ },
110
+ {
111
+ "model": "random_forest",
112
+ "accuracy": 0.7812,
113
+ "f1_macro": 0.7121,
114
+ "f1_weighted": 0.7641,
115
+ "precision_macro": 0.774,
116
+ "recall_macro": 0.6899,
117
+ "train_time_seconds": 35.14,
118
+ "inference_ms_per_sample": 0.0825,
119
+ "per_class": {
120
+ "benign": {
121
+ "precision": 0.9603,
122
+ "recall": 0.9815,
123
+ "f1": 0.9708,
124
+ "support": 813.0
125
+ },
126
+ "direct_injection": {
127
+ "precision": 0.6202,
128
+ "recall": 0.9041,
129
+ "f1": 0.7357,
130
+ "support": 876.0
131
+ },
132
+ "system_extraction": {
133
+ "precision": 0.7194,
134
+ "recall": 0.692,
135
+ "f1": 0.7055,
136
+ "support": 289.0
137
+ },
138
+ "role_hijack": {
139
+ "precision": 0.9108,
140
+ "recall": 0.7293,
141
+ "f1": 0.81,
142
+ "support": 266.0
143
+ },
144
+ "obfuscation": {
145
+ "precision": 0.92,
146
+ "recall": 0.561,
147
+ "f1": 0.697,
148
+ "support": 287.0
149
+ },
150
+ "tool_abuse": {
151
+ "precision": 0.9641,
152
+ "recall": 0.8554,
153
+ "f1": 0.9065,
154
+ "support": 408.0
155
+ },
156
+ "indirect_injection": {
157
+ "precision": 0.3229,
158
+ "recall": 0.1058,
159
+ "f1": 0.1594,
160
+ "support": 293.0
161
+ }
162
+ }
163
+ },
164
+ {
165
+ "model": "xgboost",
166
+ "accuracy": 0.733,
167
+ "f1_macro": 0.6767,
168
+ "f1_weighted": 0.7234,
169
+ "precision_macro": 0.7583,
170
+ "recall_macro": 0.6465,
171
+ "train_time_seconds": 522.7,
172
+ "inference_ms_per_sample": 0.083,
173
+ "per_class": {
174
+ "benign": {
175
+ "precision": 0.9611,
176
+ "recall": 0.9717,
177
+ "f1": 0.9664,
178
+ "support": 813.0
179
+ },
180
+ "direct_injection": {
181
+ "precision": 0.569,
182
+ "recall": 0.871,
183
+ "f1": 0.6883,
184
+ "support": 876.0
185
+ },
186
+ "system_extraction": {
187
+ "precision": 0.6901,
188
+ "recall": 0.6782,
189
+ "f1": 0.6841,
190
+ "support": 289.0
191
+ },
192
+ "role_hijack": {
193
+ "precision": 0.8264,
194
+ "recall": 0.7519,
195
+ "f1": 0.7874,
196
+ "support": 266.0
197
+ },
198
+ "obfuscation": {
199
+ "precision": 0.9471,
200
+ "recall": 0.561,
201
+ "f1": 0.7046,
202
+ "support": 287.0
203
+ },
204
+ "tool_abuse": {
205
+ "precision": 0.9524,
206
+ "recall": 0.4902,
207
+ "f1": 0.6472,
208
+ "support": 408.0
209
+ },
210
+ "indirect_injection": {
211
+ "precision": 0.362,
212
+ "recall": 0.2014,
213
+ "f1": 0.2588,
214
+ "support": 293.0
215
+ }
216
+ }
217
+ }
218
+ ]