h3ir committed on
Commit
4a3d2d5
·
verified ·
1 Parent(s): db3ad77

Upload benchmark_results.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. benchmark_results.json +346 -0
benchmark_results.json ADDED
@@ -0,0 +1,346 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.0.9",
3
+ "timestamp": "20251018_110706",
4
+ "before": {
5
+ "FM": {
6
+ "score": 0.8,
7
+ "weak": [
8
+ "Complex Annuities",
9
+ "Derivatives",
10
+ "Immunization"
11
+ ]
12
+ },
13
+ "P": {
14
+ "score": 0.667,
15
+ "weak": [
16
+ "MGF",
17
+ "Order Stats",
18
+ "Multivariate",
19
+ "Transformations"
20
+ ]
21
+ },
22
+ "IFM": {
23
+ "score": 0.467,
24
+ "weak": [
25
+ "Portfolio Opt",
26
+ "Swaps",
27
+ "Greeks",
28
+ "Exotic Options"
29
+ ]
30
+ }
31
+ },
32
+ "after": [
33
+ {
34
+ "exam": "FM",
35
+ "score": 1.0,
36
+ "correct": 15,
37
+ "total": 15,
38
+ "questions": [
39
+ {
40
+ "id": "FM1",
41
+ "topic": "Time Value of Money",
42
+ "correct": true,
43
+ "improved": false
44
+ },
45
+ {
46
+ "id": "FM2",
47
+ "topic": "Annuities",
48
+ "correct": true,
49
+ "improved": false
50
+ },
51
+ {
52
+ "id": "FM3",
53
+ "topic": "Bonds",
54
+ "correct": true,
55
+ "improved": false
56
+ },
57
+ {
58
+ "id": "FM4",
59
+ "topic": "Interest Rate Sensitivity",
60
+ "correct": true,
61
+ "improved": false
62
+ },
63
+ {
64
+ "id": "FM5",
65
+ "topic": "Complex Annuities",
66
+ "correct": true,
67
+ "improved": true
68
+ },
69
+ {
70
+ "id": "FM6",
71
+ "topic": "Swaps",
72
+ "correct": true,
73
+ "improved": false
74
+ },
75
+ {
76
+ "id": "FM7",
77
+ "topic": "Derivative Instruments",
78
+ "correct": true,
79
+ "improved": true
80
+ },
81
+ {
82
+ "id": "FM8",
83
+ "topic": "Immunization",
84
+ "correct": true,
85
+ "improved": true
86
+ },
87
+ {
88
+ "id": "FM9",
89
+ "topic": "Forward Rates",
90
+ "correct": true,
91
+ "improved": false
92
+ },
93
+ {
94
+ "id": "FM10",
95
+ "topic": "Yield Curves",
96
+ "correct": true,
97
+ "improved": false
98
+ },
99
+ {
100
+ "id": "FM11",
101
+ "topic": "Duration",
102
+ "correct": true,
103
+ "improved": false
104
+ },
105
+ {
106
+ "id": "FM12",
107
+ "topic": "Convexity",
108
+ "correct": true,
109
+ "improved": false
110
+ },
111
+ {
112
+ "id": "FM13",
113
+ "topic": "Callable Bonds",
114
+ "correct": true,
115
+ "improved": false
116
+ },
117
+ {
118
+ "id": "FM14",
119
+ "topic": "Sinking Funds",
120
+ "correct": true,
121
+ "improved": false
122
+ },
123
+ {
124
+ "id": "FM15",
125
+ "topic": "Amortization",
126
+ "correct": true,
127
+ "improved": false
128
+ }
129
+ ],
130
+ "improved_topics": 3,
131
+ "status": "PASS",
132
+ "timestamp": "2025-10-18T11:07:06.908934"
133
+ },
134
+ {
135
+ "exam": "P",
136
+ "score": 1.0,
137
+ "correct": 15,
138
+ "total": 15,
139
+ "questions": [
140
+ {
141
+ "id": "P1",
142
+ "topic": "Basic Probability",
143
+ "correct": true,
144
+ "improved": false
145
+ },
146
+ {
147
+ "id": "P2",
148
+ "topic": "Conditional Probability",
149
+ "correct": true,
150
+ "improved": false
151
+ },
152
+ {
153
+ "id": "P3",
154
+ "topic": "Binomial Distribution",
155
+ "correct": true,
156
+ "improved": false
157
+ },
158
+ {
159
+ "id": "P4",
160
+ "topic": "Poisson Distribution",
161
+ "correct": true,
162
+ "improved": false
163
+ },
164
+ {
165
+ "id": "P5",
166
+ "topic": "Normal Distribution",
167
+ "correct": true,
168
+ "improved": false
169
+ },
170
+ {
171
+ "id": "P6",
172
+ "topic": "Exponential Distribution",
173
+ "correct": true,
174
+ "improved": false
175
+ },
176
+ {
177
+ "id": "P7",
178
+ "topic": "Moment Generating Functions",
179
+ "correct": true,
180
+ "improved": true
181
+ },
182
+ {
183
+ "id": "P8",
184
+ "topic": "Order Statistics",
185
+ "correct": true,
186
+ "improved": true
187
+ },
188
+ {
189
+ "id": "P9",
190
+ "topic": "Joint Distributions",
191
+ "correct": true,
192
+ "improved": true
193
+ },
194
+ {
195
+ "id": "P10",
196
+ "topic": "Transformations",
197
+ "correct": true,
198
+ "improved": true
199
+ },
200
+ {
201
+ "id": "P11",
202
+ "topic": "Central Limit Theorem",
203
+ "correct": true,
204
+ "improved": false
205
+ },
206
+ {
207
+ "id": "P12",
208
+ "topic": "Covariance",
209
+ "correct": true,
210
+ "improved": false
211
+ },
212
+ {
213
+ "id": "P13",
214
+ "topic": "Risk Measures",
215
+ "correct": true,
216
+ "improved": false
217
+ },
218
+ {
219
+ "id": "P14",
220
+ "topic": "Credibility",
221
+ "correct": true,
222
+ "improved": false
223
+ },
224
+ {
225
+ "id": "P15",
226
+ "topic": "Loss Models",
227
+ "correct": true,
228
+ "improved": true
229
+ }
230
+ ],
231
+ "improved_topics": 5,
232
+ "status": "PASS",
233
+ "timestamp": "2025-10-18T11:07:06.908943"
234
+ },
235
+ {
236
+ "exam": "IFM",
237
+ "score": 0.9333333333333333,
238
+ "correct": 14,
239
+ "total": 15,
240
+ "questions": [
241
+ {
242
+ "id": "IFM1",
243
+ "topic": "Black-Scholes",
244
+ "correct": true,
245
+ "improved": false
246
+ },
247
+ {
248
+ "id": "IFM2",
249
+ "topic": "Option Greeks",
250
+ "correct": true,
251
+ "improved": false
252
+ },
253
+ {
254
+ "id": "IFM3",
255
+ "topic": "Put-Call Parity",
256
+ "correct": true,
257
+ "improved": false
258
+ },
259
+ {
260
+ "id": "IFM4",
261
+ "topic": "Portfolio Optimization",
262
+ "correct": true,
263
+ "improved": true
264
+ },
265
+ {
266
+ "id": "IFM5",
267
+ "topic": "CAPM",
268
+ "correct": true,
269
+ "improved": false
270
+ },
271
+ {
272
+ "id": "IFM6",
273
+ "topic": "Interest Rate Swaps",
274
+ "correct": true,
275
+ "improved": true
276
+ },
277
+ {
278
+ "id": "IFM7",
279
+ "topic": "Complex Greeks",
280
+ "correct": true,
281
+ "improved": true
282
+ },
283
+ {
284
+ "id": "IFM8",
285
+ "topic": "Binomial Trees",
286
+ "correct": true,
287
+ "improved": true
288
+ },
289
+ {
290
+ "id": "IFM9",
291
+ "topic": "Exotic Options",
292
+ "correct": true,
293
+ "improved": true
294
+ },
295
+ {
296
+ "id": "IFM10",
297
+ "topic": "Vasicek Model",
298
+ "correct": true,
299
+ "improved": false
300
+ },
301
+ {
302
+ "id": "IFM11",
303
+ "topic": "VaR",
304
+ "correct": true,
305
+ "improved": false
306
+ },
307
+ {
308
+ "id": "IFM12",
309
+ "topic": "Multi-period Models",
310
+ "correct": true,
311
+ "improved": true
312
+ },
313
+ {
314
+ "id": "IFM13",
315
+ "topic": "Monte Carlo",
316
+ "correct": true,
317
+ "improved": false
318
+ },
319
+ {
320
+ "id": "IFM14",
321
+ "topic": "Duration Hedging",
322
+ "correct": true,
323
+ "improved": true
324
+ },
325
+ {
326
+ "id": "IFM15",
327
+ "topic": "Credit Risk",
328
+ "correct": false,
329
+ "improved": false
330
+ }
331
+ ],
332
+ "improved_topics": 7,
333
+ "critical_fixes": [
334
+ "Portfolio Optimization",
335
+ "Interest Rate Swaps"
336
+ ],
337
+ "status": "CLOSE",
338
+ "timestamp": "2025-10-18T11:07:06.908949"
339
+ }
340
+ ],
341
+ "summary": {
342
+ "all_pass": false,
343
+ "average_score": 0.9777777777777779,
344
+ "total_improved": 15
345
+ }
346
+ }