{ "curves": { "N5_global_ridge": { "math": -0.3999999999999998, "code": 0.5000000000000002, "science": 1.1666666666666667 }, "N12_global_ridge": { "math": 0.3000000000000002, "code": -0.5000000000000042, "science": 0.5 }, "N12_topk8_global_ridge": { "math": 1.8000000000000043, "code": -0.5000000000000042, "science": 0.3333333333333333 }, "N12_topk12_global_ridge": { "math": -0.29999999999999977, "code": -0.5000000000000042, "science": 0.3333333333333333 }, "N22_global_ridge": { "math": -0.0999999999999998, "code": 0.5, "science": 0.0 }, "N22_topk8_global_ridge": { "math": 1.3000000000000023, "code": 0.0, "science": 0.0 }, "N22_topk12_global_ridge": { "math": 0.20000000000000023, "code": 0.5, "science": 0.5 } }, "details": { "N5_anchors": [ "gsm8k", "svamp", "asdiv", "mawps", "multiarith" ], "gsm_hard": { "N5_global_ridge": { "acc": 0.043333333333333335, "gap_recovered": -0.7999999999999996 }, "N12_global_ridge": { "acc": 0.05, "gap_recovered": -0.3999999999999996 }, "N12_topk8_global_ridge": { "acc": 0.05, "gap_recovered": -0.3999999999999996 }, "N12_topk12_global_ridge": { "acc": 0.04666666666666667, "gap_recovered": -0.5999999999999995 }, "N22_topk12_global_ridge": { "acc": 0.04666666666666667, "gap_recovered": -0.5999999999999995 } }, "math_algebra_medium": { "N5_global_ridge": { "acc": 0.09333333333333334, "gap_recovered": 0.0 }, "N12_global_ridge": { "acc": 0.09666666666666666, "gap_recovered": 1.0 }, "N12_topk8_global_ridge": { "acc": 0.10666666666666667, "gap_recovered": 4.000000000000008 }, "N12_topk12_global_ridge": { "acc": 0.09333333333333334, "gap_recovered": 0.0 }, "N22_topk12_global_ridge": { "acc": 0.09666666666666666, "gap_recovered": 1.0 } }, "humaneval_plus": { "N5_global_ridge": { "acc": 0.054878048780487805, "gap_recovered": 2.0000000000000004 }, "N12_global_ridge": { "acc": 0.06707317073170732, "gap_recovered": 1.0 }, "N12_topk8_global_ridge": { "acc": 0.06707317073170732, "gap_recovered": 1.0 }, "N12_topk12_global_ridge": { "acc": 0.06707317073170732, "gap_recovered": 1.0 }, "N22_topk12_global_ridge": { "acc": 0.06707317073170732, "gap_recovered": 1.0 } }, "mbpp_plus": { "N5_global_ridge": { "acc": 0.21333333333333335, "gap_recovered": -1.0 }, "N12_global_ridge": { "acc": 0.21, "gap_recovered": -2.0000000000000084 }, "N12_topk8_global_ridge": { "acc": 0.21, "gap_recovered": -2.0000000000000084 }, "N12_topk12_global_ridge": { "acc": 0.21, "gap_recovered": -2.0000000000000084 }, "N22_topk12_global_ridge": { "acc": 0.21666666666666667, "gap_recovered": 0.0 } }, "arc_challenge": { "N5_global_ridge": { "acc": 0.7290969899665551, "gap_recovered": 1.1666666666666667 }, "N12_global_ridge": { "acc": 0.7157190635451505, "gap_recovered": 0.5 }, "N12_topk8_global_ridge": { "acc": 0.7123745819397993, "gap_recovered": 0.3333333333333333 }, "N12_topk12_global_ridge": { "acc": 0.7123745819397993, "gap_recovered": 0.3333333333333333 }, "N22_topk12_global_ridge": { "acc": 0.7157190635451505, "gap_recovered": 0.5 } }, "mmlu_college_chemistry": { "N5_global_ridge": { "acc": 0.125, "gap_recovered": null }, "N12_global_ridge": { "acc": 0.375, "gap_recovered": null }, "N12_topk8_global_ridge": { "acc": 0.375, "gap_recovered": null }, "N12_topk12_global_ridge": { "acc": 0.375, "gap_recovered": null }, "N22_topk12_global_ridge": { "acc": 0.375, "gap_recovered": null } }, "N12_anchors": [ "gsm8k", "svamp", "asdiv", "mawps", "multiarith", "aqua_rat", "math_algebra_easy", "math_counting_easy", "mbpp", "humaneval", "codealpaca_mini", "mbpp_sanitized" ], "N22_anchors": [ "gsm8k", "svamp", "asdiv", "mawps", "multiarith", "aqua_rat", "math_algebra_easy", "math_counting_easy", "mbpp", "humaneval", "codealpaca_mini", "mbpp_sanitized", "conala_curated", "livecodebench_easy", "sciq", "arc_easy", "openbookqa", "medmcqa_easy", "mmlu_elementary_math", "mmlu_high_school_biology", "mmlu_high_school_physics", "pubmedqa_pqal" ] } }